123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601 |
- /*
- * JsonParser.cpp, part of VCMI engine
- *
- * Authors: listed in file AUTHORS in main folder
- *
- * License: GNU General Public License v2.0 or later
- * Full text of license available in license.txt file, in main folder
- *
- */
- #include "StdInc.h"
- #include "JsonParser.h"
- #include "../ScopeGuard.h"
- #include "../TextOperations.h"
- #include "JsonFormatException.h"
- VCMI_LIB_NAMESPACE_BEGIN
- JsonParser::JsonParser(const std::byte * inputString, size_t stringSize, const JsonParsingSettings & settings)
- : settings(settings)
- , input(reinterpret_cast<const char *>(inputString), stringSize)
- , lineCount(1)
- , currentDepth(0)
- , lineStart(0)
- , pos(0)
- {
- }
- JsonNode JsonParser::parse(const std::string & fileName)
- {
- JsonNode root;
- if(input.empty())
- {
- error("File is empty", false);
- }
- else
- {
- if(!TextOperations::isValidUnicodeString(input.data(), input.size()))
- error("Not a valid UTF-8 file", false);
- // If file starts with BOM - skip it
- uint32_t firstCharacter = TextOperations::getUnicodeCodepoint(input.data(), input.size());
- if (firstCharacter == 0xFEFF)
- pos += TextOperations::getUnicodeCharacterSize(input[0]);
- extractValue(root);
- extractWhitespace(false);
- //Warn if there are any non-whitespace symbols left
- if(pos < input.size())
- error("Not all file was parsed!", true);
- }
- if(!errors.empty())
- {
- logMod->warn("%s is not valid JSON!", fileName);
- logMod->warn(errors);
- }
- return root;
- }
- bool JsonParser::isValid()
- {
- return errors.empty();
- }
- bool JsonParser::extractSeparator()
- {
- if(!extractWhitespace())
- return false;
- if(input[pos] != ':')
- return error("Separator expected");
- pos++;
- return true;
- }
- bool JsonParser::extractValue(JsonNode & node)
- {
- if(!extractWhitespace())
- return false;
- switch(input[pos])
- {
- case '\"':
- case '\'':
- return extractString(node);
- case 'n':
- return extractNull(node);
- case 't':
- return extractTrue(node);
- case 'f':
- return extractFalse(node);
- case '{':
- return extractStruct(node);
- case '[':
- return extractArray(node);
- case '-':
- case '+':
- case '.':
- return extractFloat(node);
- default:
- {
- if(input[pos] >= '0' && input[pos] <= '9')
- return extractFloat(node);
- return error("Value expected!");
- }
- }
- }
- bool JsonParser::extractWhitespace(bool verbose)
- {
- //TODO: JSON5 - C-style multi-line comments
- //TODO: JSON5 - Additional white space characters are allowed
- while(true)
- {
- while(pos < input.size() && static_cast<ui8>(input[pos]) <= ' ')
- {
- if(input[pos] == '\n')
- {
- lineCount++;
- lineStart = pos + 1;
- }
- pos++;
- }
- if(pos >= input.size() || input[pos] != '/')
- break;
- if(settings.mode == JsonParsingSettings::JsonFormatMode::JSON)
- error("Comments are not permitted in json!", true);
- pos++;
- if(pos == input.size())
- break;
- if(input[pos] == '/')
- pos++;
- else
- error("Comments must consist of two slashes!", true);
- while(pos < input.size() && input[pos] != '\n')
- pos++;
- }
- if(pos >= input.size() && verbose)
- return error("Unexpected end of file!");
- return true;
- }
- bool JsonParser::extractEscaping(std::string & str)
- {
- // TODO: support unicode escaping:
- // \u1234
- switch(input[pos])
- {
- case '\"':
- str += '\"';
- break;
- case '\\':
- str += '\\';
- break;
- case 'b':
- str += '\b';
- break;
- case 'f':
- str += '\f';
- break;
- case 'n':
- str += '\n';
- break;
- case 'r':
- str += '\r';
- break;
- case 't':
- str += '\t';
- break;
- case '/':
- str += '/';
- break;
- default:
- return error("Unknown escape sequence!", true);
- }
- return true;
- }
- bool JsonParser::extractString(std::string & str)
- {
- //TODO: JSON5 - line breaks escaping
- if(settings.mode < JsonParsingSettings::JsonFormatMode::JSON5)
- {
- if(input[pos] != '\"')
- return error("String expected!");
- }
- else
- {
- if(input[pos] != '\"' && input[pos] != '\'')
- return error("String expected!");
- }
- char lineTerminator = input[pos];
- pos++;
- size_t first = pos;
- while(pos != input.size())
- {
- if(input[pos] == lineTerminator) // Correct end of string
- {
- str.append(&input[first], pos - first);
- pos++;
- return true;
- }
- if(input[pos] == '\\') // Escaping
- {
- str.append(&input[first], pos - first);
- pos++;
- if(pos == input.size())
- break;
- extractEscaping(str);
- first = pos + 1;
- }
- if(input[pos] == '\n') // end-of-line
- {
- str.append(&input[first], pos - first);
- return error("Closing quote not found!", true);
- }
- if(static_cast<unsigned char>(input[pos]) < ' ') // control character
- {
- str.append(&input[first], pos - first);
- first = pos + 1;
- error("Illegal character in the string!", true);
- }
- pos++;
- }
- return error("Unterminated string!");
- }
- bool JsonParser::extractString(JsonNode & node)
- {
- std::string str;
- if(!extractString(str))
- return false;
- node.setType(JsonNode::JsonType::DATA_STRING);
- node.String() = str;
- return true;
- }
- bool JsonParser::extractLiteral(std::string & literal)
- {
- while(pos < input.size())
- {
- bool isUpperCase = input[pos] >= 'A' && input[pos] <= 'Z';
- bool isLowerCase = input[pos] >= 'a' && input[pos] <= 'z';
- bool isNumber = input[pos] >= '0' && input[pos] <= '9';
- if(!isUpperCase && !isLowerCase && !isNumber)
- break;
- literal += input[pos];
- pos++;
- }
- return true;
- }
- bool JsonParser::extractAndCompareLiteral(const std::string & expectedLiteral)
- {
- std::string literal;
- if(!extractLiteral(literal))
- return false;
- if(literal != expectedLiteral)
- {
- return error("Expected " + expectedLiteral + ", but unknown literal found", true);
- return false;
- }
- return true;
- }
- bool JsonParser::extractNull(JsonNode & node)
- {
- if(!extractAndCompareLiteral("null"))
- return false;
- node.clear();
- return true;
- }
- bool JsonParser::extractTrue(JsonNode & node)
- {
- if(!extractAndCompareLiteral("true"))
- return false;
- node.Bool() = true;
- return true;
- }
- bool JsonParser::extractFalse(JsonNode & node)
- {
- if(!extractAndCompareLiteral("false"))
- return false;
- node.Bool() = false;
- return true;
- }
- bool JsonParser::extractStruct(JsonNode & node)
- {
- node.setType(JsonNode::JsonType::DATA_STRUCT);
- if(currentDepth > settings.maxDepth)
- error("Maximum allowed depth of json structure has been reached", true);
- pos++;
- currentDepth++;
- auto guard = vstd::makeScopeGuard([this]()
- {
- currentDepth--;
- });
- if(!extractWhitespace())
- return false;
- //Empty struct found
- if(input[pos] == '}')
- {
- pos++;
- return true;
- }
- while(true)
- {
- if(!extractWhitespace())
- return false;
- bool overrideFlag = false;
- std::string key;
- if(settings.mode < JsonParsingSettings::JsonFormatMode::JSON5)
- {
- if(!extractString(key))
- return false;
- }
- else
- {
- if(input[pos] == '\'' || input[pos] == '\"')
- {
- if(!extractString(key))
- return false;
- }
- else
- {
- if(!extractLiteral(key))
- return false;
- }
- }
- if(key.find('#') != std::string::npos)
- {
- // split key string into actual key and meta-flags
- std::vector<std::string> keyAndFlags;
- boost::split(keyAndFlags, key, boost::is_any_of("#"));
- key = keyAndFlags[0];
- for(int i = 1; i < keyAndFlags.size(); i++)
- {
- if(keyAndFlags[i] == "override")
- overrideFlag = true;
- else
- error("Encountered unknown flag #" + keyAndFlags[i], true);
- }
- }
- if(node.Struct().find(key) != node.Struct().end())
- error("Duplicate element encountered!", true);
- if(!extractSeparator())
- return false;
- if(!extractElement(node.Struct()[key], '}'))
- return false;
- node.Struct()[key].setOverrideFlag(overrideFlag);
- if(input[pos] == '}')
- {
- pos++;
- return true;
- }
- }
- }
- bool JsonParser::extractArray(JsonNode & node)
- {
- if(currentDepth > settings.maxDepth)
- error("Macimum allowed depth of json structure has been reached", true);
- currentDepth++;
- auto guard = vstd::makeScopeGuard([this]()
- {
- currentDepth--;
- });
- pos++;
- node.setType(JsonNode::JsonType::DATA_VECTOR);
- if(!extractWhitespace())
- return false;
- //Empty array found
- if(input[pos] == ']')
- {
- pos++;
- return true;
- }
- while(true)
- {
- //NOTE: currently 50% of time is this vector resizing.
- //May be useful to use list during parsing and then swap() all items to vector
- node.Vector().resize(node.Vector().size() + 1);
- if(!extractElement(node.Vector().back(), ']'))
- return false;
- if(input[pos] == ']')
- {
- pos++;
- return true;
- }
- }
- }
- bool JsonParser::extractElement(JsonNode & node, char terminator)
- {
- if(!extractValue(node))
- return false;
- if(!extractWhitespace())
- return false;
- bool comma = (input[pos] == ',');
- if(comma)
- {
- pos++;
- if(!extractWhitespace())
- return false;
- }
- if(input[pos] == terminator)
- {
- if(comma && settings.mode < JsonParsingSettings::JsonFormatMode::JSON5)
- error("Extra comma found!", true);
- return true;
- }
- if(!comma)
- error("Comma expected!", true);
- return true;
- }
- bool JsonParser::extractFloat(JsonNode & node)
- {
- //TODO: JSON5 - hexacedimal support
- //TODO: JSON5 - Numbers may be IEEE 754 positive infinity, negative infinity, and NaN (why?)
- assert(input[pos] == '-' || (input[pos] >= '0' && input[pos] <= '9'));
- bool negative = false;
- double result = 0;
- si64 integerPart = 0;
- bool isFloat = false;
- if(input[pos] == '+')
- {
- if(settings.mode < JsonParsingSettings::JsonFormatMode::JSON5)
- error("Positive numbers should not have plus sign!", true);
- pos++;
- }
- else if(input[pos] == '-')
- {
- pos++;
- negative = true;
- }
- if(input[pos] < '0' || input[pos] > '9')
- {
- if(input[pos] != '.' && settings.mode < JsonParsingSettings::JsonFormatMode::JSON5)
- return error("Number expected!");
- }
- //Extract integer part
- while(input[pos] >= '0' && input[pos] <= '9')
- {
- integerPart = integerPart * 10 + (input[pos] - '0');
- pos++;
- }
- result = static_cast<double>(integerPart);
- if(input[pos] == '.')
- {
- //extract fractional part
- isFloat = true;
- pos++;
- double fractMult = 0.1;
- if(settings.mode < JsonParsingSettings::JsonFormatMode::JSON5 && (input[pos] < '0' || input[pos] > '9'))
- return error("Decimal part expected!");
- while(input[pos] >= '0' && input[pos] <= '9')
- {
- result = result + fractMult * (input[pos] - '0');
- fractMult /= 10;
- pos++;
- }
- }
- if(input[pos] == 'e')
- {
- //extract exponential part
- pos++;
- isFloat = true;
- bool powerNegative = false;
- double power = 0;
- if(input[pos] == '-')
- {
- pos++;
- powerNegative = true;
- }
- else if(input[pos] == '+')
- {
- pos++;
- }
- if(input[pos] < '0' || input[pos] > '9')
- return error("Exponential part expected!");
- while(input[pos] >= '0' && input[pos] <= '9')
- {
- power = power * 10 + (input[pos] - '0');
- pos++;
- }
- if(powerNegative)
- power = -power;
- result *= std::pow(10, power);
- }
- if(isFloat)
- {
- if(negative)
- result = -result;
- node.setType(JsonNode::JsonType::DATA_FLOAT);
- node.Float() = result;
- }
- else
- {
- if(negative)
- integerPart = -integerPart;
- node.setType(JsonNode::JsonType::DATA_INTEGER);
- node.Integer() = integerPart;
- }
- return true;
- }
- bool JsonParser::error(const std::string & message, bool warning)
- {
- if(settings.strict)
- throw JsonFormatException(message);
- std::ostringstream stream;
- std::string type(warning ? " warning: " : " error: ");
- if(!errors.empty())
- {
- // only add the line breaks between error messages so we don't have a trailing line break
- stream << "\n";
- }
- stream << "At line " << lineCount << ", position " << pos - lineStart << type << message;
- errors += stream.str();
- return warning;
- }
- VCMI_LIB_NAMESPACE_END
|