Some more code reformatting

[libs/datafile.git] / source / textparser.cpp
diff --git a/source/textparser.cpp b/source/textparser.cpp

index 78d2f1df6334b32dbf67a7871975deda4dafb0a4..8bcde35802108ba2f16c32584e6ace17b1e33ee9 100644 (file)
--- a/source/textparser.cpp
+++ b/source/textparser.cpp
@@ -1,7 +1,7 @@
  /* $Id$
  
  This file is part of libmspdatafile
-Copyright © 2007  Mikko Rasa, Mikkosoft Productions
+Copyright © 2007-2008, 2010  Mikko Rasa, Mikkosoft Productions
  Distributed under the LGPL
  */
  
@@ -28,74 +28,73 @@ Statement TextParser::parse()
  Statement TextParser::parse_statement(const Token *t)
  {
         Statement result;
-       bool      sub=false;
-       bool      finish=false;
+       bool      sub = false;
+       bool      finish = false;
  
         while(in)
         {
                 Token token;
                 if(t)
                 {
-                       token=*t;
-                       t=0;
+                       token = *t;
+                       t = 0;
                 }
                 else
-                       token=parse_token();
+                       token = parse_token();
  
                 if(result.keyword.empty())
                 {
                         if(token.str.empty())
                                 break;
                         else if(token.type!=Token::IDENTIFIER)
-                               throw ParseError(format("%s: Syntax error at token '%s' (expected an identifier)", get_location(), token.str), src, in.get_line_number());
-                       result.keyword=token.str;
-                       result.valid=true;
-                       result.source=src;
-                       result.line=in.get_line_number();
+                               throw_at(ParseError(format("Syntax error at token '%s' (expected an identifier)", token.str)), get_location());
+                       result.keyword = token.str;
+                       result.valid = true;
+                       result.source = src;
+                       result.line = in.get_line_number();
                 }
                 else if(sub)
                 {
                         if(token.str=="}")
                         {
-                               sub=false;
-                               finish=true;
+                               sub = false;
+                               finish = true;
                         }
                         else
                         {
-                               Statement ss=parse_statement(&token);
+                               Statement ss = parse_statement(&token);
                                 result.sub.push_back(ss);
                         }
                 }
                 else if(finish)
                 {
                         if(token.str!=";")
-                               throw ParseError(format("%s: Syntax error at token '%s' (Expected a ';')", get_location(), token.str), src, in.get_line_number());
+                               throw_at(ParseError(format("Syntax error at token '%s' (Expected a ';')", token.str)), get_location());
                         break;
                 }
                 else if(token.str=="{")
-                       sub=true;
+                       sub = true;
                 else if(token.str==";")
                         break;
                 else if(token.type==Token::INTEGER)
-                       result.args.push_back(Value(INTEGER, token.str));
+                       result.append(lexical_cast<IntType::Store>(token.str));
                 else if(token.type==Token::FLOAT)
-                       result.args.push_back(Value(FLOAT, token.str));
+                       result.append(lexical_cast<FloatType::Store>(token.str));
                 else if(token.type==Token::STRING)
-                       result.args.push_back(Value(STRING, token.str));
+                       result.append(token.str);
                 else if(token.type==Token::IDENTIFIER)
                 {
                         if(token.str=="true")
-                               result.args.push_back(Value(BOOLEAN, "1"));
+                               result.append(true);
                         else if(token.str=="false")
-                               result.args.push_back(Value(BOOLEAN, "0"));
+                               result.append(false);
                         else
-                               result.args.push_back(Value(ENUM, token.str));
-                       //result.args.push_back(resolve_identifiertoken.str);
+                               result.append(Symbol(token.str));
                 }
                 else if(token.str=="")
-                       throw ParseError(src+": Unexcepted end of input", src, in.get_line_number());
+                       throw_at(ParseError("Unexcepted end of input"), get_location());
                 else
-                       throw ParseError(get_location()+": Syntax error", src, in.get_line_number());
+                       throw_at(ParseError("Syntax error"), get_location());
         }
  
         return result;
@@ -103,31 +102,33 @@ Statement TextParser::parse_statement(const Token *t)
  
  Token TextParser::parse_token()
  {
-       int c=0;
-       unsigned comment=0;
+       int c = 0;
+       int comment = 0;
  
         // Skip over comments and whitespace
-       while(in)
+       while(in && comment>=0)
         {
-               c=in.get();
-               int next=in.peek();
+               c = in.get();
+               int next = in.peek();
  
                 if(c=='/' && next=='/')
-                       comment=1;
+                       comment = 1;
                 else if(c=='/' && next=='*')
-                       comment=2;
+                       comment = 2;
                 else if(c=='\n' && comment==1)
-                       comment=0;
+                       comment = 0;
                 else if(c=='*' && next=='/' && comment==2)
-                       comment=3;
+                       comment = 3;
                 else if(comment==3)   // Skip the second character of block comment end
-                       comment=0;
+                       comment = 0;
                 else if(!isspace(c) && !comment)
-                       break;
+                       comment = -1;
         }
  
-       if(comment)  // Didn't hit any non-whitespace
-               throw ParseError(src+": Unfinished comment at end of input", src, in.get_line_number());
+       if(comment>0)  // EOF while in comment
+               throw_at(ParseError("Unfinished comment at end of input"), get_location());
+       else if(comment==0)  // Didn't hit any non-whitespace
+               return Token(Token::SPECIAL, "");
  
         enum ParseState
         {
@@ -163,131 +164,132 @@ Token TextParser::parse_token()
                 Token::IDENTIFIER
         };
  
-       ParseState state=INIT;
+       ParseState state = INIT;
         string     buf;
-       bool       escape=false;
+       bool       escape = false;
  
-       while(in)
+       while(in || state==INIT)
         {
                 if(state!=INIT)
-                       c=in.get();
-               int next=in.peek();
+                       c = in.get();
+               int next = in.peek();
  
-               buf+=c;
+               buf += c;
  
                 switch(state)
                 {
                 case INIT:
                         if(c=='0')
-                               state=ZERO;
+                               state = ZERO;
                         else if(c=='-' || c=='+')
-                               state=SIGN;
+                               state = SIGN;
                         else if(c=='.')
-                               state=FLOAT;
+                               state = FLOAT;
                         else if(c=='"')
-                               state=STRING;
+                               state = STRING;
                         else if(c=='{' || c=='}' || c==';')
                                 return Token(Token::SPECIAL, string(1, c));
                         else if(isdigit(c))
-                               state=DECIMAL;
+                               state = DECIMAL;
                         else if(isalpha(c) || c=='_')
-                               state=IDENTIFIER;
+                               state = IDENTIFIER;
                         else
-                               parse_error(c, state);
+                               parse_error(c, "0-9A-Za-z_.\"{};+-");
                         break;
  
                 case SIGN:
                         if(c=='0')
-                               state=ZERO;
+                               state = ZERO;
                         else if(isdigit(c))
-                               state=DECIMAL;
+                               state = DECIMAL;
                         else if(c=='.')
-                               state=FLOAT;
+                               state = FLOAT;
                         else
-                               parse_error(c, state);
+                               parse_error(c, "0-9.");
                         break;
  
                 case ZERO:
                         if(c=='x')
-                               state=HEXADECIMAL;
+                               state = HEXADECIMAL;
                         else if(isdigit(c))
-                               state=OCTAL;
+                               state = OCTAL;
                         else if(c=='.')
-                               state=FLOAT;
+                               state = FLOAT;
                         else
-                               parse_error(c, state);
+                               parse_error(c, "0-9A-Fa-f.");
                         break;
  
                 case DECIMAL:
                         if(c=='.')
-                               state=FLOAT;
+                               state = FLOAT;
                         else if(!isdigit(c))
-                               parse_error(c, state);
+                               parse_error(c, "0-9.");
                         break;
  
                 case HEXADECIMAL:
                         if(!isxdigit(c))
-                               parse_error(c, state);
+                               parse_error(c, "0-9A-Fa-f");
                         break;
  
                 case OCTAL:
                         if(!isodigit(c))
-                               parse_error(c, state);
+                               parse_error(c, "0-7");
                         break;
  
                 case FLOAT:
                         if(c=='e' || c=='E')
-                               state=FLOATEXPINIT;
+                               state = FLOATEXPINIT;
                         else if(!isdigit(c))
-                               parse_error(c, state);
+                               parse_error(c, "0-9Ee");
                         break;
  
                 case FLOATEXPINIT:
                         if(c=='+' || c=='-')
-                               state=FLOATEXPSIGN;
+                               state = FLOATEXPSIGN;
                         else if(isdigit(c))
-                               state=FLOATEXP;
+                               state = FLOATEXP;
                         else
-                               parse_error(c, state);
+                               parse_error(c, "0-9+-");
                         break;
  
                 case FLOATEXPSIGN:
                         if(isdigit(c))
-                               state=FLOATEXP;
+                               state = FLOATEXP;
                         else
-                               parse_error(c, state);
+                               parse_error(c, "0-9");
                         break;
  
                 case FLOATEXP:
                         if(!isdigit(c))
-                               parse_error(c, state);
+                               parse_error(c, "0-9");
                         break;
  
                 case STRING:
                         if(c=='\\')
-                               escape=!escape;
+                               escape = !escape;
                         else if(c=='"' && !escape)
                         {
                                 try
                                 {
                                         return Token(Token::STRING, c_unescape(buf.substr(1, buf.size()-2)));
                                 }
-                               catch(const Exception &e)
+                               catch(Exception &e)
                                 {
-                                       throw ParseError(format("%s: %s", get_location(), e.what()), src, in.get_line_number());
+                                       e.at(get_location());
+                                       throw;
                                 }
                         }
                         else
-                               escape=false;
+                               escape = false;
                         break;
  
                 case IDENTIFIER:
                         if(!isalpha(c) && !isdigit(c) && c!='_')
-                               parse_error(c, state);
+                               parse_error(c, "0-9A-Za-z_");
                         break;
  
                 default:
-                       throw Exception(get_location()+": Internal error (bad state)");
+                       throw_at(InvalidState("Internal error (bad state)"), get_location());
                 }
  
                 if(is_delimiter(next) && state>=ACCEPT)
@@ -314,9 +316,9 @@ string TextParser::get_location()
         return ss.str();
  }
  
-void TextParser::parse_error(int c, int state)
+void TextParser::parse_error(int c, const char *e)
  {
-       throw ParseError(format("%s: Parse error at '%c' (state %d)", get_location(), static_cast<char>(c), state), src, in.get_line_number());
+       throw_at(ParseError(format("Parse error at '%c', expected one of \"%s\"", static_cast<char>(c), e)), get_location());
  }
  
  } // namespace DataFile