| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
70370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761
2771278127912801281128212831284 |
- //
- // XQueryTokenizer.cs
- //
- // Author:
- // Atsushi Enomoto <[email protected]>
- //
- // Copyright (C) 2004 Novell, Inc (http://www.novell.com)
- //
- // Permission is hereby granted, free of charge, to any person obtaining
- // a copy of this software and associated documentation files (the
- // "Software"), to deal in the Software without restriction, including
- // without limitation the rights to use, copy, modify, merge, publish,
- // distribute, sublicense, and/or sell copies of the Software, and to
- // permit persons to whom the Software is furnished to do so, subject to
- // the following conditions:
- //
- // The above copyright notice and this permission notice shall be
- // included in all copies or substantial portions of the Software.
- //
- // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- // EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
- // MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
- // NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
- // LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
- // OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
- // WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
- //
- #if NET_2_0
- using System;
- using System.Collections;
- using System.Collections.Generic;
- using System.IO;
- using System.Security.Policy;
- using System.Xml;
- using System.Xml.Query;
- using System.Xml.Schema;
- using System.Xml.XPath;
- using Mono.Xml.XQuery;
- using Mono.Xml.XPath2;
- namespace Mono.Xml.XQuery.Parser
- {
- // FIXME: make internal in the future
- public class XQueryTokenizer
- : Mono.Xml.XQuery.Parser.yyParser.yyInput, IXmlLineInfo
- {
// ---- input source ----
// Query text being tokenized.
TextReader source;
// One-character lookahead cache filled by PeekChar; -1 means nothing is cached.
int peekChar = -1;

// ---- position, reported through IXmlLineInfo ----
int line = 1;
int column = 0;
// Set when '\n' has been read so that the next ReadChar starts a new line.
bool nextIncrementLine;

// ---- namespace resolution ----
XmlNamespaceManager nsResolver;
string defaultFunctionNamespace = XQueryFunction.Namespace;

// ---- current and queued token ----
int currentToken;
object tokenValue;
// Prefix candidate recorded while a name is being read (see ReadOneToken).
string prefixName;
// Token queued for the next advance () call; -1 when nothing is queued.
int lookAheadToken = -1;
object lookAheadTokenValue;

// ---- lexical state ----
WhitespaceHandling ws = WhitespaceHandling.Arbitrary;
ParseState state = ParseState.Default;
Stack stateStack;

// ---- scratch buffer that accumulates the text of the token being read ----
char [] buffer = new char [30];
int bufferIndex;
// Creates a tokenizer that reads query text from the given reader and
// registers the namespace prefixes that are available without declaration.
//
// Throws ArgumentNullException when reader is null, instead of failing
// later with a NullReferenceException on the first character read.
public XQueryTokenizer (TextReader reader)
{
	if (reader == null)
		throw new ArgumentNullException ("reader");

	source = reader;
	stateStack = new Stack ();

	nsResolver = new XmlNamespaceManager (new NameTable ());
	nsResolver.AddNamespace ("xs", XmlSchema.Namespace);
	nsResolver.AddNamespace ("xdt", XmlSchema.XdtNamespace);
	// FIXME: Are they really predefined?
	nsResolver.AddNamespace ("xsi", XmlSchema.InstanceNamespace);
	nsResolver.AddNamespace ("fn", "http://www.w3.org/2003/11/xpath-functions");
	nsResolver.AddNamespace ("local", "http://www.w3.org/2003/11/xquery-local-functions");
}
// Namespace manager used to resolve QName prefixes found in the query.
internal IXmlNamespaceResolver NSResolver
{
	get {
		return nsResolver;
	}
}
// Default function namespace; initially XQueryFunction.Namespace.
internal string DefaultFunctionNamespace
{
	get {
		return defaultFunctionNamespace;
	}
	set {
		defaultFunctionNamespace = value;
	}
}
// Binds a prefix to a namespace URI in this tokenizer's namespace manager.
public void AddNamespace (string prefix, string ns)
{
	XmlNamespaceManager manager = nsResolver;
	manager.AddNamespace (prefix, ns);
}
// Moves to the next token. Returns false once the end of the input has
// been reached (the current token is negative) and keeps returning false.
public bool advance ()
{
	if (currentToken < 0)
		return false;

	if (lookAheadToken < 0) {
		// nothing queued: read a fresh token from the input
		currentToken = ParseToken ();
		return currentToken >= 0;
	}

	// deliver the token that an earlier call queued
	currentToken = lookAheadToken;
	tokenValue = lookAheadTokenValue;
	lookAheadToken = -1;
	return currentToken >= 0;
}
// Token code of the current token (negative at end of input).
public int token ()
{
	int current = currentToken;
	return current;
}
// Value attached to the current token; what it holds depends on the token.
public object value ()
{
	object current = tokenValue;
	return current;
}
// IXmlLineInfo: line information is always tracked by this tokenizer.
public bool HasLineInfo ()
{
	const bool available = true;
	return available;
}
// IXmlLineInfo: current line, starting at 1.
public int LineNumber
{
	get {
		return line;
	}
}
// IXmlLineInfo: number of characters read so far on the current line.
public int LinePosition
{
	get {
		return column;
	}
}
// Whitespace handling mode. It is stored here, but the active code in
// ParseToken does not consult it (the code that did is disabled).
internal WhitespaceHandling Space
{
	get {
		return ws;
	}
	set {
		ws = value;
	}
}
// Current lexical state; it selects which sub-tokenizer ParseToken uses.
internal ParseState State
{
	get {
		return state;
	}
	set {
		state = value;
	}
}
// Saves a state on the state stack so that a later PopState () switches
// to it. The current state itself is not changed here.
internal void PushState (ParseState newState)
{
	object boxed = newState;
	stateStack.Push (boxed);
}
// Makes the most recently pushed state the current one.
// Throws a compile error when no state has been pushed.
internal void PopState ()
{
	bool empty = stateStack.Count == 0;
	if (empty)
		throw Error ("Internal state transition error. State stack is empty.");

	object top = stateStack.Pop ();
	state = (ParseState) top;
}
// Builds (does not throw) a compile error carrying this tokenizer as its
// line-info source, so callers write "throw Error (...)".
private XmlQueryCompileException Error (string message)
{
	XmlQueryCompileException error =
		new XmlQueryCompileException (message, this, null, null);
	return error;
}
// Reads the next token according to the current lexical state.
// Returns a Token constant, or -1 when the input is exhausted.
//
// Literal-content states (PI content, XML comment, element content and
// attribute values) are dispatched BEFORE the numeric-literal check:
// a digit there is ordinary content, not a DECIMAL_LITERAL.
private int ParseToken ()
{
	bufferIndex = 0;

	bool attributeContent =
		state == ParseState.QuotAttributeContent ||
		state == ParseState.AposAttributeContent;

	// StartTag deals with whitespace itself (see ParseStartTag), and
	// whitespace inside an attribute value belongs to the value.
	// Note: the Space (WhitespaceHandling) setting is not consulted here.
	if (state != ParseState.StartTag && !attributeContent)
		SkipWhitespaces ();

	int c = PeekChar ();
	if (c < 0)
		return -1;

	switch (state) {
	case ParseState.XmlPIContent:
		return ParseXmlPIContent ();
	case ParseState.XmlComment:
		return ParseXmlCommentContent ();
	case ParseState.ElementContent:
		return ParseElementContent ();
	case ParseState.QuotAttributeContent:
		return ParseAttributeContent ('"');
	case ParseState.AposAttributeContent:
		return ParseAttributeContent ('\'');
	}

	// FIXME: consider DOUBLE_LITERAL
	if (Char.IsNumber ((char) c)) {
		tokenValue = ReadDecimal (false);
		return Token.DECIMAL_LITERAL;
	}

	switch (state) {
	case ParseState.OccurenceIndicator:
		return ParseOccurenceIndicator ();
	case ParseState.StartTag:
		return ParseStartTag ();
	default:
		return ParseDefault ();
	}
}
// Consumes the remainder of an XQuery comment whose opening "(:" has
// already been read, up to and including the matching ":)".
// Nested "(: ... :)" pairs are balanced, as XQuery comments may nest.
//
// The comment text is left in tokenValue. The returned token code is kept
// as Token.XML_PI_TO_END for compatibility; the caller in ParseDefault
// discards it and simply tokenizes again.
// Throws a compile error when the input ends inside the comment.
private int ParseXQueryComment ()
{
	int depth = 1;
	while (true) {
		int c = ReadChar ();
		if (c < 0)
			throw Error ("Unexpected end of query text inside XQuery comment");

		if (c == ':' && PeekChar () == ')') {
			ReadChar ();
			depth--;
			if (depth == 0) {
				tokenValue = CreateValueString ();
				return Token.XML_PI_TO_END;
			}
			// end of a nested comment: part of the outer comment's text
			AddValueChar (':');
			AddValueChar (')');
		}
		else if (c == '(' && PeekChar () == ':') {
			ReadChar ();
			depth++;
			AddValueChar ('(');
			AddValueChar (':');
		}
		else
			AddValueChar ((char) c);
	}
}
// Collects processing-instruction content up to the closing "?>", which
// is consumed. The content becomes tokenValue.
// Throws a compile error when the input ends first.
private int ParseXmlPIContent ()
{
	for (;;) {
		int ch = ReadChar ();
		if (ch < 0)
			throw Error ("Unexpected end of query text inside XML processing instruction content");

		bool closing = ch == '?' && PeekChar () == '>';
		if (!closing) {
			// a '?' that is not followed by '>' is plain content
			AddValueChar ((char) ch);
			continue;
		}

		ReadChar ();
		tokenValue = CreateValueString ();
		return Token.XML_PI_TO_END;
	}
}
// Collects XML comment content up to the terminating "-->".
// On return the two dashes have been consumed but the '>' is still
// unread (unchanged from the previous behaviour); the content becomes
// tokenValue. Throws a compile error when the input ends first.
private int ParseXmlCommentContent ()
{
	while (true) {
		int c = ReadChar ();
		if (c < 0)
			throw Error ("Unexpected end of query text inside XML comment content");

		if (c != '-' || PeekChar () != '-') {
			AddValueChar ((char) c);
			continue;
		}
		ReadChar (); // second '-'

		// In a longer run of dashes ("--->") only the last two can belong
		// to the terminator; the earlier ones are content.
		while (PeekChar () == '-') {
			ReadChar ();
			AddValueChar ('-');
		}

		if (PeekChar () == '>') {
			tokenValue = CreateValueString ();
			return Token.XML_COMMENT_TO_END;
		}
		AddValueChar ('-');
		AddValueChar ('-');
	}
}
// Collects CDATA section content up to the terminating "]]>".
// On return the two brackets have been consumed but the '>' is still
// unread (same convention as ParseXmlCommentContent); the content becomes
// tokenValue. Throws a compile error when the input ends first.
private int ParseXmlCDataContent ()
{
	while (true) {
		int c = ReadChar ();
		if (c < 0)
			throw Error ("Unexpected end of query text inside XML CDATA section content");

		// c has already been consumed; only peek at what follows it
		if (c != ']' || PeekChar () != ']') {
			AddValueChar ((char) c);
			continue;
		}
		ReadChar (); // second ']'

		// In a longer run of brackets ("]]]>") only the last two can
		// belong to the terminator; the earlier ones are content.
		while (PeekChar () == ']') {
			ReadChar ();
			AddValueChar (']');
		}

		if (PeekChar () == '>') {
			tokenValue = CreateValueString ();
			return Token.XML_CDATA_TO_END;
		}
		AddValueChar (']');
		AddValueChar (']');
	}
}
// Tokenizes direct element content.
//
// - '<' at the start is handed to ParseDefault (end tags, comments, PIs,
//   CDATA starts, nested start tags).
// - "{{" and "}}" are the escaped forms of '{' and '}'.
// - A single '{' opens an enclosed expression: it is returned as
//   Token.OPEN_CURLY, after any text collected so far has been returned
//   as ELEM_CONTENT_LITERAL (the brace is then queued as look-ahead).
// - '&' starts a predefined entity reference.
//
// Throws a compile error when the input ends inside the content.
private int ParseElementContent ()
{
	tokenValue = null;
	if (PeekChar () == '<')
		return ParseDefault ();

	while (true) {
		int c = PeekChar ();
		if (c < 0)
			throw Error ("Unexpected end of query text inside element content");

		switch ((char) c) {
		case '&':
			ReadChar ();
			ReadPredefinedEntity ();
			continue;
		case '<':
			tokenValue = CreateValueString ();
			return Token.ELEM_CONTENT_LITERAL;
		case '{':
			ReadChar ();
			if (PeekChar () == '{') {
				ReadChar ();
				AddValueChar ('{');
				continue;
			}
			if (bufferIndex == 0)
				return Token.OPEN_CURLY;
			// emit the text first; the brace follows on the next advance ()
			lookAheadToken = Token.OPEN_CURLY;
			tokenValue = CreateValueString ();
			return Token.ELEM_CONTENT_LITERAL;
		case '}':
			ReadChar ();
			// "}}" collapses to one '}'; a lone '}' is kept as content
			if (PeekChar () == '}')
				ReadChar ();
			AddValueChar ('}');
			continue;
		default:
			AddValueChar ((char) c);
			ReadChar ();
			continue;
		}
	}
}
// Reads a predefined entity reference whose '&' has already been consumed
// ("lt;", "gt;", "amp;", "quot;" or "apos;") and appends the character it
// stands for to the value buffer.
//
// ReadOneToken reuses the same buffer for the entity name, so the text
// collected before the reference is saved first and restored afterwards.
// Throws a compile error for a missing ';' or an unknown entity name.
private void ReadPredefinedEntity ()
{
	string pending = CreateValueString ();

	string token = ReadOneToken ();
	Expect (";");

	char replacement;
	switch (token) {
	case "lt":
		replacement = '<';
		break;
	case "gt":
		replacement = '>';
		break;
	case "amp":
		replacement = '&';
		break;
	case "quot":
		replacement = '"';
		break;
	case "apos":
		replacement = '\'';
		break;
	default:
		throw Error (String.Format ("Unexpected general entity name: {0} .", token));
	}

	// drop the entity name from the buffer and put the earlier text back
	bufferIndex = 0;
	foreach (char ch in pending)
		AddValueChar (ch);
	AddValueChar (replacement);
}
// FIXME: not used as yet
//
// Collects extension/pragma content up to the terminating "::)".
// On return the two colons have been consumed but the ')' is still
// unread; the content becomes tokenValue.
// Throws a compile error when the input ends first.
private int ParseExtContent ()
{
	while (true) {
		// every character must be consumed, otherwise the loop never advances
		int c = ReadChar ();
		if (c < 0)
			throw Error ("Unexpected end of query text inside external content");

		if (c != ':' || PeekChar () != ':') {
			AddValueChar ((char) c);
			continue;
		}
		ReadChar (); // second ':'

		// In a longer run of colons (":::)") only the last two can belong
		// to the terminator; the earlier ones are content.
		while (PeekChar () == ':') {
			ReadChar ();
			AddValueChar (':');
		}

		if (PeekChar () == ')') {
			tokenValue = CreateValueString ();
			return Token.EXT_CONTENT;
		}
		AddValueChar (':');
		AddValueChar (':');
	}
}
// Switches to the Operator state, then reads an occurrence indicator
// ('?', '*' or '+') if one is next; anything else is tokenized as an
// operator.
private int ParseOccurenceIndicator ()
{
	state = ParseState.Operator;

	int indicator;
	switch (PeekChar ()) {
	case '?':
		indicator = Token.QUESTION;
		break;
	case '*':
		indicator = Token.ASTERISK;
		break;
	case '+':
		indicator = Token.PLUS;
		break;
	default:
		return ParseOperator ();
	}

	ReadChar (); // consume the indicator character
	return indicator;
}
// Tokenizes inside a start tag. Quotes, '>' and "/>" are recognised only
// when they are the very next character; otherwise whitespace is skipped
// and the rest is tokenized by ParseDefault.
private int ParseStartTag ()
{
	int next = PeekChar ();

	if (next == '\'') {
		ReadChar ();
		return Token.APOS;
	}
	if (next == '"') {
		ReadChar ();
		return Token.QUOT;
	}
	if (next == '>') {
		ReadChar ();
		return Token.GREATER;
	}
	if (next == '/') {
		ReadChar ();
		Expect (">");
		return Token.EMPTY_TAG_CLOSE;
	}

	// FIXME: there seems a bug in the spec that StartTag state must
	// accept QName without heading space for start tag name, so the
	// "whitespace is required" check is intentionally not enforced here.
	SkipWhitespaces ();
	return ParseDefault (); // only QName is allowed here.
}
// Tokenizes attribute value content delimited by closeChar.
//
// A doubled delimiter or a doubled '{' is an escape and yields one
// literal character. A single delimiter ends the value (QUOT or APOS) and
// a single '{' opens an enclosed expression (OPEN_CURLY). When text was
// collected before such a terminator, the text is returned first as
// ATT_VALUE_LITERAL and the terminator is queued as the look-ahead token.
// Throws a compile error when the input ends inside the value.
private int ParseAttributeContent (char closeChar)
{
	while (true) {
		int next = PeekChar ();
		if (next < 0)
			throw Error ("Unexpected end of attribute value content.");

		bool isQuote = next == closeChar;
		if (!isQuote && next != '{') {
			// ordinary character
			AddValueChar ((char) ReadChar ());
			continue;
		}

		ReadChar ();
		if (PeekChar () == next) {
			// doubled: escaped literal
			ReadChar ();
			AddValueChar ((char) next);
			continue;
		}

		int terminator;
		if (isQuote)
			terminator = closeChar == '"' ? Token.QUOT : Token.APOS;
		else
			terminator = Token.OPEN_CURLY;

		if (bufferIndex == 0)
			return terminator;

		lookAheadToken = terminator;
		tokenValue = CreateValueString ();
		return Token.ATT_VALUE_LITERAL;
	}
}
// Operator-state tokenizing.
// TODO: implement; for now everything is delegated to ParseDefault.
private int ParseOperator ()
{
	int result = ParseDefault ();
	return result;
}
// General-purpose tokenizer: punctuation and operators first, then names.
//
// A name is classified in this order:
//   1. keywords that exist only in the current state (TryGetContextualKeyword),
//   2. keywords reserved in the Operator / Default states
//      (IsKeywordInState + TryGetKeywordToken),
//   3. NCNAME for the states that only accept unqualified names,
//   4. otherwise QNAME / WILD_LOCALNAME, with the prefix resolved through
//      the namespace manager.
// Throws a compile error for an unmapped prefix or a malformed "<!" sequence.
private int ParseDefault ()
{
	int c = ReadChar ();
	switch (c) {
	case '.':
		if (PeekChar () == '.') {
			ReadChar ();
			return Token.DOT2;
		}
		if (Char.IsNumber ((char) PeekChar ())) {
			// ".5" style literal: a number, not the context-item dot
			tokenValue = ReadDecimal (true);
			return Token.DECIMAL_LITERAL;
		}
		return Token.DOT;
	case ',':
		return Token.COMMA;
	case ';':
		return Token.SEMICOLON;
	case '(':
		if (PeekChar () == ':') {
			ReadChar ();
			if (PeekChar () == ':') {
				ReadChar ();
				return Token.PRAGMA_OPEN;
			}
			ParseXQueryComment ();
			return ParseToken (); // start again
		}
		return Token.OPEN_PAREN;
	case ')':
		return Token.CLOSE_PAREN;
	case ':':
		switch (PeekChar ()) {
		case ':':
			ReadChar ();
			if (PeekChar () == ')') {
				ReadChar ();
				return Token.PRAGMA_CLOSE;
			}
			return Token.COLON2;
		case ')':
			ReadChar ();
			return Token.CLOSE_PAREN_COLON;
		case '=':
			ReadChar ();
			return Token.COLON_EQUAL;
		}
		return Token.COLON;
	case '[':
		return Token.OPEN_BRACKET;
	case ']':
		return Token.CLOSE_BRACKET;
	case '{':
		return Token.OPEN_CURLY;
	case '}':
		return Token.CLOSE_CURLY;
	case '$':
		return Token.DOLLAR;
	case '\'':
		tokenValue = ReadQuoted ('\'');
		return Token.STRING_LITERAL;
	case '"':
		tokenValue = ReadQuoted ('"');
		return Token.STRING_LITERAL;
	case '=':
		return Token.EQUAL;
	case '<':
		// only happens when state is ElementContent
		// (otherwise it might be "/foo</bar")
		if (state == ParseState.ElementContent) {
			switch ((char) PeekChar ()) {
			case '/':
				ReadChar ();
				return Token.END_TAG_START;
			case '!':
				ReadChar ();
				switch (PeekChar ()) {
				case '-':
					ReadChar ();
					if (ReadChar () != '-')
						throw Error ("Invalid sequence of characters '<!-'.");
					return Token.XML_COMMENT_START;
				case '[':
					ReadChar ();
					Expect ("CDATA[");
					return Token.XML_CDATA_START;
				}
				throw Error ("Invalid sequence of characters '<!'.");
			case '?':
				ReadChar ();
				return Token.XML_PI_START;
			default:
				return Token.LESSER;
			}
		}
		switch (PeekChar ()) {
		case '<':
			ReadChar ();
			return Token.LESSER2;
		case '=':
			ReadChar ();
			return Token.LESSER_EQUAL;
		}
		return Token.LESSER;
	case '>':
		switch (PeekChar ()) {
		case '>':
			ReadChar ();
			return Token.GREATER2;
		case '=':
			ReadChar ();
			return Token.GREATER_EQUAL;
		}
		return Token.GREATER;
	case '|':
		return Token.BAR;
	case '*':
		if (PeekChar () == ':') {
			ReadChar ();
			// FIXME: more check
			tokenValue = new XmlQualifiedName (ReadOneToken (), "*");
			return Token.WILD_PREFIX;
		}
		return Token.ASTERISK;
	case '+':
		return Token.PLUS;
	case '-':
		return Token.MINUS;
	case '/':
		// only happens when state is StartTag
		// (otherwise it might be "/>$extvar")
		if (state == ParseState.StartTag && PeekChar () == '>') {
			ReadChar ();
			return Token.EMPTY_TAG_CLOSE;
		}
		if (PeekChar () == '/') {
			ReadChar ();
			return Token.SLASH2;
		}
		return Token.SLASH;
	case '?':
		return Token.QUESTION;
	case '@':
		return Token.AT;
	}

	// Not punctuation: push the character back and read a name.
	peekChar = c;
	prefixName = null;
	string name = ReadOneToken ();
	tokenValue = name;

	int keyword;
	if (TryGetContextualKeyword (name, out keyword))
		return keyword;
	if (IsKeywordInState (name) && TryGetKeywordToken (name, out keyword))
		return keyword;

	switch (state) {
	case ParseState.NamespaceDecl:
	case ParseState.NamespaceKeyword:
	case ParseState.XmlSpaceDecl:
	case ParseState.KindTestForPI:
	case ParseState.XmlPI:
		return Token.NCNAME;
	}

	if (PeekChar () == ':') {
		ReadChar ();
		prefixName = name;
		switch (PeekChar ()) {
		case '*':
			ReadChar ();
			name = "*";
			break;
		case '=': // ex. let foo:= ...
			ReadChar ();
			// the colon belonged to ":=", so there is no prefix after all
			prefixName = null;
			tokenValue = new XmlQualifiedName (name, nsResolver.DefaultNamespace);
			lookAheadToken = Token.COLON_EQUAL;
			return Token.QNAME;
		default:
			name = ReadOneToken ();
			break;
		}
		string ns = nsResolver.LookupNamespace (prefixName);
		if (ns == null)
			throw Error (String.Format ("Prefix '{0}' is not mapped to any namespace URI.", prefixName));
		tokenValue = new XmlQualifiedName (name, ns);
		prefixName = null;
		return name == "*" ? Token.WILD_LOCALNAME : Token.QNAME;
	}

	tokenValue = new XmlQualifiedName (name);
	return Token.QNAME;
}

// Keywords that are recognised only in one specific lexical state.
// Returns true and sets token when name is such a keyword for the
// current state.
private bool TryGetContextualKeyword (string name, out int token)
{
	token = -1;
	switch (state) {
	case ParseState.XmlSpaceDecl:
		switch (name) {
		case "preserve": token = Token.PRESERVE; return true;
		case "strip": token = Token.STRIP; return true;
		}
		break;
	case ParseState.CloseKindTest:
		if (name == "nillable") {
			token = Token.NILLABLE;
			return true;
		}
		break;
	case ParseState.ExtKey:
		switch (name) {
		case "pragma": token = Token.PRAGMA; return true;
		case "extension": token = Token.EXTENSION; return true;
		}
		break;
	case ParseState.KindTest:
		switch (name) {
		case "context": token = Token.CONTEXT; return true;
		case "element": token = Token.ELEMENT; return true;
		case "global": token = Token.GLOBAL; return true;
		case "type": token = Token.TYPE; return true;
		}
		break;
	case ParseState.ItemType:
		switch (name) {
		case "attribute": token = Token.ATTRIBUTE; return true;
		case "comment": token = Token.COMMENT; return true;
		case "document-node": token = Token.DOCUMENT_NODE; return true;
		case "element": token = Token.ELEMENT; return true;
		case "empty": token = Token.EMPTY; return true;
		case "item": token = Token.ITEM; return true;
		case "node": token = Token.NODE; return true;
		case "processing-instruction": token = Token.PROCESSING_INSTRUCTION; return true;
		case "text": token = Token.TEXT; return true;
		}
		break;
	case ParseState.NamespaceKeyword:
		switch (name) {
		case "declare": token = Token.DECLARE; return true;
		case "default": token = Token.DEFAULT; return true;
		case "element": token = Token.ELEMENT; return true;
		case "function": token = Token.FUNCTION; return true;
		case "namespace": token = Token.NAMESPACE; return true;
		}
		break;
	}
	return false;
}

// Tells whether name is treated as a keyword (rather than a QName) in the
// current state. Only the Operator / OccurenceIndicator and Default states
// reserve keywords this way.
private bool IsKeywordInState (string name)
{
	switch (state) {
	case ParseState.OccurenceIndicator:
	case ParseState.Operator:
		switch (name) {
		case "and": case "as": case "ascending": case "at":
		case "base-uri": case "by":
		case "case": case "cast": case "castable": case "collation":
		case "declare": case "default": case "descending": case "div":
		case "element": case "else": case "empty": case "eq":
		case "every": case "except": case "external":
		case "for": case "function":
		case "ge": case "global": case "greatest": case "gt":
		case "idiv": case "import": case "in": case "instance":
		case "intersect": case "is":
		case "lax": case "le": case "least": case "let": case "lt":
		case "mod": case "module":
		case "namespace": case "ne":
		case "of": case "or": case "order": case "ordered": case "ordering":
		case "return":
		case "satisfies": case "schema": case "skip": case "some":
		case "stable": case "strict":
		case "then": case "to": case "treat": case "typeswitch":
		case "union": case "unordered":
		case "variable":
		case "where":
		case "xmlspace":
			return true;
		}
		return false;
	case ParseState.Default:
		switch (name) {
		case "ancestor": case "ancestor-or-self": case "as": case "attribute":
		case "base-uri":
		case "child": case "collation": case "comment": case "construction":
		case "declare": case "default": case "descendant":
		case "descendant-or-self": case "document": case "document-node":
		case "element": case "every":
		case "following": case "following-sibling": case "for": case "function":
		case "global":
		case "if": case "import":
		case "lax": case "let":
		case "module":
		case "namespace": case "node":
		case "ordered":
		case "parent": case "preceding": case "preceding-sibling":
		case "processing-instruction":
		case "schema": case "self": case "some": case "strict": case "strip":
		case "text": case "typeswitch":
		case "unordered":
		case "validate": case "validation": case "version":
		case "xmlspace": case "xquery":
			return true;
		}
		return false;
	}
	return false;
}

// Maps a keyword spelling to its token code. Returns false (token = -1)
// when name is not a known keyword.
// NOTE(review): the keyword "at" and the '@' character both produce
// Token.AT - confirm this is intended by the grammar.
private bool TryGetKeywordToken (string name, out int token)
{
	token = -1;
	switch (name) {
	case "xquery": token = Token.XQUERY; return true;
	case "version": token = Token.VERSION; return true;
	case "pragma": token = Token.PRAGMA; return true;
	case "extension": token = Token.EXTENSION; return true;
	case "module": token = Token.MODULE; return true;
	case "namespace": token = Token.NAMESPACE; return true;
	case "declare": token = Token.DECLARE; return true;
	case "xmlspace": token = Token.XMLSPACE; return true;
	case "preserve": token = Token.PRESERVE; return true;
	case "strip": token = Token.STRIP; return true;
	case "default": token = Token.DEFAULT; return true;
	case "construction": token = Token.CONSTRUCTION; return true;
	case "ordering": token = Token.ORDERING; return true;
	case "ordered": token = Token.ORDERED; return true;
	case "unordered": token = Token.UNORDERED; return true;
	case "document-node": token = Token.DOCUMENT_NODE; return true;
	case "document": token = Token.DOCUMENT; return true;
	case "element": token = Token.ELEMENT; return true;
	case "attribute": token = Token.ATTRIBUTE; return true;
	case "processing-instruction": token = Token.PROCESSING_INSTRUCTION; return true;
	case "comment": token = Token.COMMENT; return true;
	case "text": token = Token.TEXT; return true;
	case "node": token = Token.NODE; return true;
	case "function": token = Token.FUNCTION; return true;
	case "collation": token = Token.COLLATION; return true;
	case "base-uri": token = Token.BASEURI; return true;
	case "import": token = Token.IMPORT; return true;
	case "schema": token = Token.SCHEMA; return true;
	case "at": token = Token.AT; return true;
	case "variable": token = Token.VARIABLE; return true;
	case "as": token = Token.AS; return true;
	case "external": token = Token.EXTERNAL; return true;
	case "validation": token = Token.VALIDATION; return true;
	case "lax": token = Token.LAX; return true;
	case "strict": token = Token.STRICT; return true;
	case "skip": token = Token.SKIP; return true;
	case "return": token = Token.RETURN; return true;
	case "for": token = Token.FOR; return true;
	case "let": token = Token.LET; return true;
	case "in": token = Token.IN; return true;
	case "where": token = Token.WHERE; return true;
	case "order": token = Token.ORDER; return true;
	case "by": token = Token.BY; return true;
	case "stable": token = Token.STABLE; return true;
	case "ascending": token = Token.ASCENDING; return true;
	case "descending": token = Token.DESCENDING; return true;
	case "empty": token = Token.EMPTY; return true;
	case "greatest": token = Token.GREATEST; return true;
	case "least": token = Token.LEAST; return true;
	case "some": token = Token.SOME; return true;
	case "every": token = Token.EVERY; return true;
	case "satisfies": token = Token.SATISFIES; return true;
	case "is": token = Token.IS; return true;
	case "to": token = Token.TO; return true;
	case "eq": token = Token.EQ; return true;
	case "ne": token = Token.NE; return true;
	case "lt": token = Token.LT; return true;
	case "le": token = Token.LE; return true;
	case "gt": token = Token.GT; return true;
	case "ge": token = Token.GE; return true;
	case "and": token = Token.AND; return true;
	case "or": token = Token.OR; return true;
	case "instance": token = Token.INSTANCE; return true;
	case "of": token = Token.OF; return true;
	case "if": token = Token.IF; return true;
	case "then": token = Token.THEN; return true;
	case "else": token = Token.ELSE; return true;
	case "typeswitch": token = Token.TYPESWITCH; return true;
	case "case": token = Token.CASE; return true;
	case "treat": token = Token.TREAT; return true;
	case "castable": token = Token.CASTABLE; return true;
	case "cast": token = Token.CAST; return true;
	case "div": token = Token.DIV; return true;
	case "idiv": token = Token.IDIV; return true;
	case "mod": token = Token.MOD; return true;
	case "union": token = Token.UNION; return true;
	case "intersect": token = Token.INTERSECT; return true;
	case "except": token = Token.EXCEPT; return true;
	case "validate": token = Token.VALIDATE; return true;
	case "context": token = Token.CONTEXT; return true;
	case "nillable": token = Token.NILLABLE; return true;
	case "item": token = Token.ITEM; return true;
	case "global": token = Token.GLOBAL; return true;
	case "type": token = Token.TYPE; return true;
	case "child": token = Token.CHILD; return true;
	case "descendant": token = Token.DESCENDANT; return true;
	case "self": token = Token.SELF; return true;
	case "descendant-or-self": token = Token.DESCENDANT_OR_SELF; return true;
	case "following-sibling": token = Token.FOLLOWING_SIBLING; return true;
	case "following": token = Token.FOLLOWING; return true;
	case "parent": token = Token.PARENT; return true;
	case "ancestor": token = Token.ANCESTOR; return true;
	case "preceding": token = Token.PRECEDING; return true;
	case "preceding-sibling": token = Token.PRECEDING_SIBLING; return true;
	case "ancestor-or-self": token = Token.ANCESTOR_OR_SELF; return true;
	}
	return false;
}
// Returns the next character without consuming it (-1 at end of input).
// The character is cached in peekChar until ReadChar takes it.
private int PeekChar ()
{
	if (peekChar != -1)
		return peekChar;

	peekChar = source.Read ();
	return peekChar;
}
// Consumes and returns the next character (-1 at end of input) and keeps
// the line / column counters up to date. The line counter advances on the
// read that follows a '\n', so the newline itself still counts as part of
// the line it ends.
private int ReadChar ()
{
	int ch = peekChar;
	if (ch == -1)
		ch = source.Read ();
	else
		peekChar = -1; // the cached character is now consumed

	if (nextIncrementLine) {
		line++;
		column = 0;
		nextIncrementLine = false;
	}
	column++;

	if (ch == '\n')
		nextIncrementLine = true;

	return ch;
}
// Consumes consecutive space, tab, CR and LF characters.
private void SkipWhitespaces ()
{
	int next = PeekChar ();
	while (next == ' ' || next == '\t' || next == '\r' || next == '\n') {
		ReadChar ();
		next = PeekChar ();
	}
}
// Appends a character to the token text buffer, doubling the buffer's
// capacity when it is full.
private void AddValueChar (char c)
{
	if (bufferIndex == buffer.Length)
		Array.Resize (ref buffer, bufferIndex * 2);

	buffer [bufferIndex] = c;
	bufferIndex++;
}
// Returns the text accumulated in the buffer so far. The buffer itself is
// left untouched; callers reset bufferIndex when they start a new token.
private string CreateValueString ()
{
	string text = new string (buffer, 0, bufferIndex);
	return text;
}
// Consumes the given text from the input, character by character.
// Throws a compile error at the first character that does not match.
private void Expect (string expected)
{
	foreach (char wanted in expected) {
		if (ReadChar () != wanted)
			throw Error (String.Format ("Expected token '{0}' did not appear.", expected));
	}
}
// Reads the body of a string literal whose opening quote has already been
// consumed, up to and including the closing quote, and returns the text.
//
// - A doubled quote character ("" or '') is the escaped form of one quote.
// - The other kind of quote is ordinary content ("it's" keeps its ').
// - Reaching the end of the input before the closing quote is a compile
//   error rather than a silent end (or an endless loop).
// TODO: entity and character references are not expanded here.
private string ReadQuoted (char quoteChar)
{
	bufferIndex = 0;
	while (true) {
		int c = ReadChar ();
		if (c < 0)
			throw Error ("Unexpected end of query text inside string literal.");

		if (c == quoteChar) {
			if (PeekChar () != quoteChar)
				break; // closing quote
			ReadChar (); // escaped quote: keep a single one
		}
		AddValueChar ((char) c);
	}
	return CreateValueString ();
}
// Reads a decimal literal made of ASCII digits and '.' characters.
//
// floatingPoint: true when the caller has already consumed a leading '.',
// which is then put back in front of the digits that are read here.
//
// The text is parsed with the invariant culture so that '.' is always the
// decimal separator, whatever the current thread culture is. Text that is
// not a valid decimal (empty, several dots, out of range) is reported as
// a compile error.
// FIXME: more complex (exponents / double literals are not handled)
private decimal ReadDecimal (bool floatingPoint)
{
	bufferIndex = 0;
	if (floatingPoint)
		AddValueChar ('.');

	while (true) {
		int c = PeekChar ();
		bool digit = c >= '0' && c <= '9';
		if (!digit && c != '.')
			break;
		ReadChar ();
		AddValueChar ((char) c);
	}

	string s = CreateValueString ();
	decimal result;
	bool ok = decimal.TryParse (
		s,
		System.Globalization.NumberStyles.AllowDecimalPoint,
		System.Globalization.CultureInfo.InvariantCulture,
		out result);
	if (!ok)
		throw Error (String.Format ("Invalid numeric literal '{0}'.", s));
	return result;
}
// Reads one name-like token into the buffer and returns it. Reading stops
// at the end of input, at whitespace, or at the first character that
// cannot continue a name (see IsTokenContinuable); that character is left
// unread.
//
// When the stopping character is ':' the text read so far is remembered
// as prefixName. A second colon while a prefix is already pending is a
// compile error, raised through Error () so that it carries line
// information like every other tokenizer error.
private string ReadOneToken ()
{
	bufferIndex = 0;
	while (true) {
		int c = PeekChar ();
		if (c < 0 || c == ' ' || c == '\t' || c == '\r' || c == '\n')
			break;

		if (!IsTokenContinuable (c)) {
			if (c == ':') {
				if (prefixName != null)
					throw Error ("Invalid colon was found.");
				prefixName = CreateValueString ();
			}
			break;
		}

		ReadChar ();
		AddValueChar ((char) c);
	}
	return CreateValueString ();
}
// True when c may appear inside a name token: '-', '_', '.', or anything
// XmlChar.IsNCNameChar accepts.
private bool IsTokenContinuable (int c)
{
	if (c == '-' || c == '_' || c == '.')
		return true;

	return XmlChar.IsNCNameChar (c);
}
- }
// Whitespace policy selectable through XQueryTokenizer.Space.
// The only code in the tokenizer that interpreted these values is
// currently commented out, so the descriptions below reflect that
// disabled code.
public enum WhitespaceHandling
{
	// Whitespace is skipped before a token.
	Arbitrary,

	// Whitespace is required before a token.
	Explicit,

	// Not referenced by the tokenizer.
	// NOTE(review): presumably "whitespace is content" - confirm.
	Significant
}
// Lexical states of XQueryTokenizer. The current state decides which
// sub-tokenizer ParseToken uses and which names count as keywords in
// ParseDefault. Members without a comment are not special-cased by the
// tokenizer code itself.
public enum ParseState
{
	// Initial state; expression keywords are recognised.
	Default,

	// Operator keywords are recognised.
	Operator,

	// Names are returned as NCNAME.
	NamespaceDecl,

	// Namespace declaration keywords are recognised; other names are NCNAME.
	NamespaceKeyword,

	// "preserve" / "strip" are recognised; other names are NCNAME.
	XmlSpaceDecl,

	// Item type keywords (element, attribute, item, ...) are recognised.
	ItemType,

	// "context", "element", "global" and "type" are recognised.
	KindTest,

	// Names are returned as NCNAME.
	KindTestForPI,

	// "nillable" is recognised.
	CloseKindTest,

	// '?', '*' and '+' are read as occurrence indicators, then the state
	// becomes Operator.
	OccurenceIndicator,

	SchemaContextStep,

	VarName,

	// Inside a start tag: quotes, '>' and "/>" are tokenized individually.
	StartTag,

	// Direct element content.
	ElementContent,

	EndTag,

	// XML comment content, read up to "-->".
	XmlComment,

	ExprComment,

	// "pragma" / "extension" are recognised.
	ExtKey,

	// Names are returned as NCNAME.
	XmlPI,

	// Processing instruction content, read up to "?>".
	XmlPIContent,

	CDataSection,

	// Attribute value delimited by double quotes.
	QuotAttributeContent,

	// Attribute value delimited by single quotes.
	AposAttributeContent,
}
- }
- #endif
|