2016-04-17 09:30:14 +00:00
|
|
|
/*
|
|
|
|
This file is part of Telegram Desktop,
|
2018-01-03 10:23:14 +00:00
|
|
|
the official desktop application for the Telegram messaging service.
|
2016-04-17 09:30:14 +00:00
|
|
|
|
2018-01-03 10:23:14 +00:00
|
|
|
For license and copyright information please follow this link:
|
|
|
|
https://github.com/telegramdesktop/tdesktop/blob/master/LEGAL
|
2016-04-17 09:30:14 +00:00
|
|
|
*/
|
2016-04-18 20:33:43 +00:00
|
|
|
#include "codegen/numbers/parsed_file.h"
|
2016-04-17 09:30:14 +00:00
|
|
|
|
2016-04-18 20:33:43 +00:00
|
|
|
#include <iostream>
|
2016-04-17 17:52:17 +00:00
|
|
|
#include <QtCore/QMap>
|
2016-04-18 20:33:43 +00:00
|
|
|
#include <QtCore/QDir>
|
|
|
|
#include <QtCore/QRegularExpression>
|
|
|
|
#include "codegen/common/basic_tokenized_file.h"
|
|
|
|
#include "codegen/common/logging.h"
|
2016-04-18 22:00:54 +00:00
|
|
|
#include "codegen/common/clean_file_reader.h"
|
|
|
|
#include "codegen/common/checked_utf8_string.h"
|
2016-04-17 09:30:14 +00:00
|
|
|
|
2016-04-18 20:33:43 +00:00
|
|
|
using BasicToken = codegen::common::BasicTokenizedFile::Token;
|
|
|
|
using BasicType = BasicToken::Type;
|
2016-04-17 09:30:14 +00:00
|
|
|
|
2016-04-18 20:33:43 +00:00
|
|
|
namespace codegen {
|
|
|
|
namespace numbers {
|
|
|
|
namespace {
|
2016-04-17 13:22:00 +00:00
|
|
|
|
2016-04-18 22:00:54 +00:00
|
|
|
QByteArray replaceStrings(const QString &filepath) {
|
|
|
|
common::CleanFileReader reader(filepath);
|
|
|
|
if (!reader.read()) {
|
|
|
|
return QByteArray();
|
|
|
|
}
|
|
|
|
common::CheckedUtf8String string(reader.currentPtr(), reader.charsLeft());
|
|
|
|
if (!string.isValid()) {
|
|
|
|
return QByteArray();
|
|
|
|
}
|
|
|
|
|
|
|
|
QStringList lines = string.toString().split('\n');
|
|
|
|
for (auto &line : lines) {
|
2016-04-19 10:59:59 +00:00
|
|
|
auto match = QRegularExpression("^(\\d+;[A-Z]+;)([^;]+)(;.*)?$").match(line);
|
2016-04-18 22:00:54 +00:00
|
|
|
if (match.hasMatch()) {
|
|
|
|
line = match.captured(1) + '"' + match.captured(2) + '"' + match.captured(3);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return lines.join('\n').toUtf8();
|
|
|
|
}
|
|
|
|
|
2016-04-18 20:33:43 +00:00
|
|
|
} // namespace
|
2016-04-17 09:30:14 +00:00
|
|
|
|
2016-04-18 20:33:43 +00:00
|
|
|
ParsedFile::ParsedFile(const Options &options)
|
2016-04-18 22:00:54 +00:00
|
|
|
: content_(replaceStrings(options.inputPath))
|
|
|
|
, file_(content_, options.inputPath)
|
2016-04-18 20:33:43 +00:00
|
|
|
, options_(options) {
|
|
|
|
}
|
2016-04-17 13:22:00 +00:00
|
|
|
|
2016-04-18 20:33:43 +00:00
|
|
|
bool ParsedFile::read() {
|
2016-04-18 22:00:54 +00:00
|
|
|
if (content_.isEmpty() || !file_.read()) {
|
2016-04-18 20:33:43 +00:00
|
|
|
return false;
|
2016-04-17 13:22:00 +00:00
|
|
|
}
|
2016-04-17 09:30:14 +00:00
|
|
|
|
2016-04-18 20:33:43 +00:00
|
|
|
auto filepath = QFileInfo(options_.inputPath).absoluteFilePath();
|
|
|
|
do {
|
2016-04-18 22:00:54 +00:00
|
|
|
if (auto code = file_.getToken(BasicType::Int)) {
|
|
|
|
if (!file_.getToken(BasicType::Semicolon)) {
|
|
|
|
logErrorUnexpectedToken() << "';'";
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
if (!file_.getToken(BasicType::Name)) {
|
|
|
|
logErrorUnexpectedToken() << "country code";
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
if (!file_.getToken(BasicType::Semicolon)) {
|
|
|
|
logErrorUnexpectedToken() << "';'";
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
if (!file_.getToken(BasicType::String)) {
|
|
|
|
logErrorUnexpectedToken() << "country name";
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
if (file_.getToken(BasicType::Semicolon)) {
|
|
|
|
if (auto firstPart = file_.getToken(BasicType::Int)) {
|
|
|
|
if (firstPart.original.toByteArray() != code.original.toByteArray()) {
|
|
|
|
file_.putBack();
|
|
|
|
result_.data.insert(code.original.toStringUnchecked(), Rule());
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
Rule rule;
|
|
|
|
while (auto part = file_.getToken(BasicType::Name)) {
|
|
|
|
rule.push_back(part.original.size());
|
|
|
|
}
|
|
|
|
result_.data.insert(code.original.toStringUnchecked(), rule);
|
|
|
|
if (rule.isEmpty()) {
|
|
|
|
logErrorUnexpectedToken() << "bad phone pattern";
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!file_.getToken(BasicType::Semicolon)) {
|
|
|
|
logErrorUnexpectedToken() << "';'";
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
if (!file_.getToken(BasicType::Int)) {
|
|
|
|
logErrorUnexpectedToken() << "country phone len";
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
file_.getToken(BasicType::Semicolon);
|
|
|
|
continue;
|
|
|
|
} else {
|
|
|
|
logErrorUnexpectedToken() << "country phone pattern";
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
} else if (file_.getToken(BasicType::Int)) {
|
|
|
|
file_.putBack();
|
|
|
|
result_.data.insert(code.original.toStringUnchecked(), Rule());
|
|
|
|
continue;
|
|
|
|
} else {
|
|
|
|
logErrorUnexpectedToken() << "country phone pattern";
|
|
|
|
return false;
|
|
|
|
}
|
2016-04-18 20:33:43 +00:00
|
|
|
}
|
|
|
|
if (file_.atEnd()) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
logErrorUnexpectedToken() << "numbers rule";
|
|
|
|
} while (!failed());
|
2016-04-17 13:22:00 +00:00
|
|
|
|
2016-04-18 20:33:43 +00:00
|
|
|
if (failed()) {
|
|
|
|
result_.data.clear();
|
2016-04-17 13:22:00 +00:00
|
|
|
}
|
2016-04-18 20:33:43 +00:00
|
|
|
return !failed();
|
|
|
|
}
|
2016-04-17 09:30:14 +00:00
|
|
|
|
2016-04-18 20:33:43 +00:00
|
|
|
} // namespace numbers
|
2016-04-17 09:30:14 +00:00
|
|
|
} // namespace codegen
|