/* * Copyright (c) 2010-2012 OTClient * * Permission is hereby granted, free of charge, to any person obtaining a copy * of this software and associated documentation files (the "Software"), to deal * in the Software without restriction, including without limitation the rights * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell * copies of the Software, and to permit persons to whom the Software is * furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included in * all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN * THE SOFTWARE. */ #include "otmlparser.h" #include "otmldocument.h" #include "otmlexception.h" #include OTMLParser::OTMLParser(OTMLDocumentPtr doc, std::istream& in) : currentDepth(0), currentLine(0), doc(doc), currentParent(doc), previousNode(0), in(in) { } void OTMLParser::parse() { if(!in.good()) throw OTMLException(doc, "cannot read from input stream"); while(!in.eof()) parseLine(getNextLine()); } std::string OTMLParser::getNextLine() { currentLine++; std::string line; std::getline(in, line); return line; } int OTMLParser::getLineDepth(const std::string& line, bool multilining) { // count number of spaces at the line beginning std::size_t spaces = 0; while(line[spaces] == ' ') spaces++; // pre calculate depth int depth = spaces / 2; if(!multilining || depth <= currentDepth) { // check the next character is a tab if(line[spaces] == '\t') throw OTMLException(doc, "indentation with tabs are not allowed", currentLine); // must indent every 2 spaces if(spaces % 2 != 0) throw OTMLException(doc, "must indent every 2 spaces", currentLine); } return depth; } void OTMLParser::parseLine(std::string line) { int depth = getLineDepth(line); if(depth == -1) return; // remove line sides spaces boost::trim(line); // skip empty lines if(line.empty()) return; // skip comments if(boost::starts_with(line, "//")) return; // a depth above, change current parent to the previous added node if(depth == currentDepth+1) { currentParent = previousNode; // a depth below, change parent to previous parent } else if(depth < currentDepth) { for(int i=0;iparent(); // if it isn't the current depth, it's a syntax error } else if(depth != currentDepth) throw OTMLException(doc, "invalid indentation depth, are you indenting correctly?", currentLine); // sets current depth currentDepth = depth; // alright, new depth is set, the line is not empty and it isn't a comment // then it must be a node, so we parse it parseNode(line); } void OTMLParser::parseNode(const std::string& data) { std::string tag; std::string value; std::size_t dotsPos = data.find_first_of(':'); int nodeLine = currentLine; // node that has no tag and may have a value if(!data.empty() && data[0] == '-') { value = data.substr(1); boost::trim(value); // node that has tag and possible a value } else if(dotsPos != std::string::npos) { tag = data.substr(0, dotsPos); if(data.size() > dotsPos+1) value = data.substr(dotsPos+1); // node that has only a tag } else { tag = data; } boost::trim(tag); boost::trim(value); // process multitine values if(value == "|" || value == "|-" || value == "|+") { // reads next lines until we can a value below the same depth std::string multiLineData; do { size_t lastPos = in.tellg(); std::string line = getNextLine(); int depth = getLineDepth(line, true); // depth above current depth, add the text to the multiline if(depth > currentDepth) { multiLineData += line.substr((currentDepth+1)*2); // it has contents below the current depth } else { // if not empty, its a node boost::trim(line); if(!line.empty()) { // rewind and break in.seekg(lastPos, std::ios::beg); currentLine--; break; } } multiLineData += "\n"; } while(!in.eof()); /* determine how to treat new lines at the end * | strip all new lines at the end and add just a new one * |- strip all new lines at the end * |+ keep all the new lines at the end (the new lines until next node) */ if(value == "|" || value == "|-") { // remove all new lines at the end int lastPos = multiLineData.length(); while(multiLineData[--lastPos] == '\n') multiLineData.erase(lastPos, 1); if(value == "|") multiLineData.append("\n"); } // else it's |+ value = multiLineData; } // create the node OTMLNodePtr node = OTMLNode::create(tag); node->setUnique(dotsPos != std::string::npos); node->setTag(tag); node->setSource(doc->source() + ":" + stdext::unsafe_cast(nodeLine)); // ~ is considered the null value if(value == "~") node->setNull(true); else { if(boost::starts_with(value, "[") && boost::ends_with(value, "]")) { std::string tmp = value.substr(1, value.length()-2); boost::tokenizer> tokens(tmp); for(std::string v : tokens) node->writeIn(stdext::trim(v)); } else node->setValue(value); } currentParent->addChild(node); previousNode = node; }