| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
70370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761
27712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761
77717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762
27722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447244824492450245124522453245424552456245724582459246024612462246324642465246624672468246924702471247224732474247524762477247824792480248124822483248424852486248724882489249024912492249324942495249624972498249925002501250225032504250525062507250825092510251125122513251425152516251725182519252025212522252325242525252625272528252925302531253225332534253525362537253825392540254125422543254425452546254725482549255025512552255325542555255625572558255925602561256225632564256525662567256825692570257125722573257425752576257725782579258025812582258325842585258625872588258925902591259225932594259525962597259825992600260126022603260426052606260726082609261026112612261326142615261626172618261926202621262226232624262526262627262826292630263126322633263426352636263726382639264026412642264326442645264626472648264926502651265226532654265526562657265826592660266126622663266426652666266726682669267026712672267326742675267626772678267926802681268226832684268526862687268826892690269126922693269426952696269726982699270027012702270327042705270627072708270927102711271227132714271527162717271827192720272127222723272427252726272727282729273027312732 |
- //
- // System.Xml.XmlTextReader
- //
- // Author:
- // Jason Diamond ([email protected])
- // Adam Treat ([email protected])
- // Atsushi Enomoto ([email protected])
- //
- // (C) 2001, 2002 Jason Diamond http://injektilo.org/
- //
- // FIXME:
- //
- // I haven't checked whether the DTD parser runs correctly.
- //
- // More strict well-formedness checking should be done.
- //
- // NameTables aren't being used completely yet.
- //
- // Some thought needs to be given to performance. There are too many
- // strings being allocated.
- //
- using System;
- using System.Collections;
- using System.IO;
- using System.Text;
- using Mono.Xml;
- using Mono.Xml.Native;
- namespace System.Xml
- {
- public class XmlTextReader : XmlReader, IXmlLineInfo
- {
- WhitespaceHandling whitespaceHandling = WhitespaceHandling.All;
- #region Constructors
// Parameterless constructor for derived classes. It attaches no input and
// does not run any of the initialization the other constructors perform.
protected XmlTextReader ()
{
}
// Reads XML from a stream; the stream is wrapped in an XmlStreamReader
// and handed to the TextReader overload.
public XmlTextReader (Stream input)
	: this (new XmlStreamReader (input))
{
}
// Reads XML from the given URL using a freshly created NameTable.
public XmlTextReader (string url)
	: this (url, new NameTable ())
{
}
// Reads XML from a TextReader using a freshly created NameTable.
public XmlTextReader (TextReader input)
	: this (input, new NameTable ())
{
}
// Constructor for derived classes that takes a name table.
// NOTE(review): 'nt' is not forwarded, and the chained call passes a null
// TextReader with XmlNodeType.None, which InitializeContext rejects with an
// XmlException - confirm whether this constructor is usable as written.
protected XmlTextReader (XmlNameTable nt)
	: this (String.Empty, null, XmlNodeType.None, null)
{
}
// Reads XML from a stream (wrapped in an XmlStreamReader), forwarding the
// name table to the TextReader overload.
public XmlTextReader (Stream input, XmlNameTable nt)
	: this (new XmlStreamReader (input), nt)
{
}
// Reads XML from a stream (wrapped in an XmlStreamReader); 'url' is
// forwarded to the (url, TextReader) overload.
public XmlTextReader (string url, Stream input)
	: this (url, new XmlStreamReader (input))
{
}
// Reads XML from a TextReader with the given URL and a freshly created
// NameTable.
public XmlTextReader (string url, TextReader input)
	: this (url, input, new NameTable ())
{
}
// Opens the resource named by 'url' through an XmlStreamReader and reads
// XML from it, forwarding the name table.
[MonoTODO("Non-filename-url must be supported. Waiting for WebClient")]
public XmlTextReader (string url, XmlNameTable nt)
	: this (url, new XmlStreamReader (url), nt)
{
}
// Reads XML from a TextReader with an empty URL, forwarding the name table.
public XmlTextReader (TextReader input, XmlNameTable nt)
	: this (String.Empty, input, nt)
{
}
// Reads an XML fragment of the given node type from a stream.
// 'context' may be null; in that case the base URI is empty, exactly as in
// the string-fragment overload (previously a null context caused a
// NullReferenceException here).
public XmlTextReader (Stream xmlFragment, XmlNodeType fragType, XmlParserContext context)
	: this (context != null ? context.BaseURI : String.Empty,
		new XmlStreamReader (xmlFragment),
		fragType,
		context)
{
}
// Reads XML from a stream (wrapped in an XmlStreamReader), forwarding the
// URL and name table to the (url, TextReader, nt) overload.
public XmlTextReader (string url, Stream input, XmlNameTable nt)
	: this (url, new XmlStreamReader (input), nt)
{
}
// Reads a whole XML document from a TextReader.
// The supplied name table is now carried into the parser context so that
// NameTable returns it; previously 'nt' was ignored and a new NameTable was
// always created. A null 'nt' keeps the old behavior (null context, so
// InitializeContext builds a default one).
public XmlTextReader (string url, TextReader input, XmlNameTable nt)
	: this (url,
		input,
		XmlNodeType.Document,
		nt == null ? null : new XmlParserContext (nt,
			new XmlNamespaceManager (nt),
			String.Empty,
			XmlSpace.None))
{
}
// Reads an XML fragment of the given node type from a string. The base URI
// comes from 'context' when one is supplied, otherwise it is empty.
[MonoTODO("TODO as same as private XmlTextReader(TextReader, XmlNodeType, XmlParserContext)")]
public XmlTextReader (string xmlFragment, XmlNodeType fragType, XmlParserContext context)
	: this (context != null ? context.BaseURI : String.Empty, new StringReader (xmlFragment), fragType, context)
{
}
- // TODO still remains as described at head of this file,
- // but it might not be TODO of the constructors...
// Common constructor that the public overloads chain to; all set-up is
// delegated to InitializeContext.
XmlTextReader (string url, TextReader fragment, XmlNodeType fragType, XmlParserContext context)
{
	this.InitializeContext (url, context, fragment, fragType);
}
- #endregion
- #region Properties
// Number of entries in the attribute table of the current node.
public override int AttributeCount {
	get {
		return attributes.Count;
	}
}
// Base URI taken from the parser context.
public override string BaseURI {
	get {
		return parserContext.BaseURI;
	}
}
// Depth recorded for the current node (elementDepth is captured by
// SetProperties from the running depth counter).
public override int Depth {
	get { return elementDepth; }
}
// Encoding taken from the parser context.
public Encoding Encoding {
	get {
		return parserContext.Encoding;
	}
}
// True once the reader has reached the end of input or has been closed.
public override bool EOF {
	get {
		if (readState == ReadState.EndOfFile)
			return true;
		return readState == ReadState.Closed;
	}
}
// True when the stored value of the current node is not the empty string.
public override bool HasValue {
	get {
		return !(value == String.Empty);
	}
}
// Always false: XmlTextReader does not expand default attributes.
public override bool IsDefault {
	get { return false; }
}
// Empty-element flag recorded for the current node.
public override bool IsEmptyElement {
	get {
		return isEmptyElement;
	}
}
// Indexer shorthand for GetAttribute (int).
public override string this [int i] {
	get {
		return GetAttribute (i);
	}
}
// Indexer shorthand for GetAttribute (string).
public override string this [string name] {
	get {
		return GetAttribute (name);
	}
}
// Indexer shorthand for GetAttribute (string, string).
public override string this [string localName, string namespaceName] {
	get {
		return GetAttribute (localName, namespaceName);
	}
}
// Line number reported by the current parser input.
public int LineNumber {
	get {
		return currentInput.LineNumber;
	}
}
// Line position reported by the current parser input.
public int LinePosition {
	get {
		return currentInput.LinePosition;
	}
}
// Local part of the current node's name, as computed by SetProperties.
public override string LocalName {
	get {
		return localName;
	}
}
// Name of the current node as passed to SetProperties.
public override string Name {
	get {
		return name;
	}
}
// Whether names are split into prefix and local name (see SetProperties).
// The setter throws InvalidOperationException unless the reader is still in
// its initial state.
public bool Namespaces {
	get {
		return namespaces;
	}
	set {
		bool notStarted = readState == ReadState.Initial;
		if (!notStarted)
			throw new InvalidOperationException ("Namespaces have to be set before reading.");
		namespaces = value;
	}
}
// Namespace URI of the current node, as computed by SetProperties.
public override string NamespaceURI {
	get {
		return namespaceURI;
	}
}
// Name table held by the parser context.
public override XmlNameTable NameTable {
	get {
		return parserContext.NameTable;
	}
}
// Type of the current node.
public override XmlNodeType NodeType {
	get {
		return nodeType;
	}
}
// Not implemented yet: both accessors throw NotImplementedException.
[MonoTODO]
public bool Normalization {
	get {
		throw new NotImplementedException ();
	}
	set {
		throw new NotImplementedException ();
	}
}
// Prefix part of the current node's name, as computed by SetProperties.
public override string Prefix {
	get {
		return prefix;
	}
}
// Quotation character of the current attribute. For attribute nodes the
// stored value string still carries its quotes, so the first character is
// the quote; every other node type reports a double quote.
public override char QuoteChar {
	get {
		return NodeType == XmlNodeType.Attribute ? value [0] : '"';
	}
}
// Current state of the reader.
public override ReadState ReadState {
	get {
		return readState;
	}
}
// Text value of the current node. Attribute values are passed through
// UnescapeAttributeValue first; all other nodes return the stored string.
public override string Value {
	get {
		return NodeType == XmlNodeType.Attribute
			? UnescapeAttributeValue (value)
			: value;
	}
}
// Controls whether ReadContent reports or skips whitespace.
public WhitespaceHandling WhitespaceHandling {
	get {
		return whitespaceHandling;
	}
	set {
		whitespaceHandling = value;
	}
}
// xml:lang value tracked by the parser context.
public override string XmlLang {
	get {
		return parserContext.XmlLang;
	}
}
// Write-only: replaces the resolver stored by this reader.
public XmlResolver XmlResolver {
	set {
		resolver = value;
	}
}
// xml:space value tracked by the parser context.
public override XmlSpace XmlSpace {
	get {
		return parserContext.XmlSpace;
	}
}
- #endregion
- #region Methods
// Marks the reader as closed, then closes every input still on the parser
// input stack followed by the current input.
public override void Close ()
{
	readState = ReadState.Closed;

	object [] stackedInputs = parserInputStack.ToArray ();
	for (int n = 0; n < stackedInputs.Length; n++) {
		XmlParserInput stacked = (XmlParserInput) stackedInputs [n];
		stacked.Close ();
	}

	currentInput.Close ();
}
// Returns the unescaped value of the attribute at zero-based index 'i'.
// Throws ArgumentOutOfRangeException when 'i' is negative or not smaller
// than the number of attributes.
public override string GetAttribute (int i)
{
	// Valid indexes are 0 .. Count - 1. The former test (i > Count) let
	// i == Count through and did not reject negative values.
	if (i < 0 || i >= attributes.Count)
		throw new ArgumentOutOfRangeException ("i", "i must be non-negative and smaller than AttributeCount.");

	return UnescapeAttributeValue (attributes [orderedAttributes [i]] as string);
}
- // MS.NET 1.0 documentation says that this method returns String.Empty for
- // not-exist attribute, but in fact it returns null.
- // That description is corrected in MS.NET 1.1 documentation.
// Looks the attribute up by its qualified name in the attribute table and
// passes the stored string (null when absent) to UnescapeAttributeValue.
public override string GetAttribute (string name)
{
	string rawValue = attributes [name] as string;
	return UnescapeAttributeValue (rawValue);
}
// Returns the index (in document order) of the attribute with the given
// local name and namespace URI, or -1 when there is none.
//
// Three kinds of attribute names are handled:
//  - prefixed names: the prefix is resolved with LookupNamespace and
//    compared with 'namespaceURI';
//  - the bare "xmlns" declaration, which lives in the xmlns namespace;
//  - other unprefixed names, which belong to no namespace and therefore
//    match only a null or empty 'namespaceURI'. (Previously these could
//    never be found.)
private int GetIndexOfQualifiedAttribute (string localName, string namespaceURI)
{
	bool noNamespace = namespaceURI == null || namespaceURI == String.Empty;

	for (int i = 0; i < orderedAttributes.Count; i++) {
		string thisName = (string) orderedAttributes [i];
		int indexOfColon = thisName.IndexOf (':');

		if (indexOfColon != -1) {
			string thisLocalName = thisName.Substring (indexOfColon + 1);
			if (localName == thisLocalName) {
				string thisPrefix = thisName.Substring (0, indexOfColon);
				string thisNamespaceURI = LookupNamespace (thisPrefix);
				if (namespaceURI == thisNamespaceURI)
					return i;
			}
		} else if (thisName == "xmlns") {
			if (localName == "xmlns" && namespaceURI == "http://www.w3.org/2000/xmlns/")
				return i;
		} else if (noNamespace && localName == thisName) {
			return i;
		}
	}
	return -1;
}
// Returns the unescaped value of the attribute identified by local name and
// namespace URI, or null when the current node has no such attribute.
// (This used to return String.Empty for a missing attribute, which made a
// missing attribute indistinguishable from an empty one and disagreed with
// the by-name overload.)
public override string GetAttribute (string localName, string namespaceURI)
{
	int idx = this.GetIndexOfQualifiedAttribute (localName, namespaceURI);
	if (idx < 0)
		return null;
	return UnescapeAttributeValue (attributes [orderedAttributes [idx]] as string);
}
// Not implemented yet: always throws NotImplementedException.
[MonoTODO]
public TextReader GetRemainder ()
{
	throw new NotImplementedException ();
}
// Explicit IXmlLineInfo implementation; this reader always reports that
// line information is available.
bool IXmlLineInfo.HasLineInfo ()
{
	return true;
}
// Resolves a prefix through the namespace manager of the parser context.
public override string LookupNamespace (string prefix)
{
	XmlNamespaceManager nsManager = parserContext.NamespaceManager;
	return nsManager.LookupNamespace (prefix);
}
// Moves the reader to the attribute at zero-based index 'i'.
// Throws ArgumentOutOfRangeException when 'i' is negative or not smaller
// than the number of attributes.
public override void MoveToAttribute (int i)
{
	MoveToElement ();

	// Valid indexes are 0 .. Count - 1; the former test (Count < i) accepted
	// i == Count and failed later, after reader state had been modified.
	if (attributes == null || i < 0 || i >= orderedAttributes.Count)
		throw new ArgumentOutOfRangeException ("i", "attribute index out of range.");

	// Remember the element's properties so MoveToElement can restore them.
	if (orderedAttributesEnumerator == null) {
		SaveProperties ();
	}

	// Position the enumerator on the i-th entry so that a following
	// MoveToNextAttribute continues from this attribute.
	orderedAttributesEnumerator = orderedAttributes.GetEnumerator ();
	for (int n = 0; n <= i; n++)
		orderedAttributesEnumerator.MoveNext ();

	string name = orderedAttributes [i] as string;
	string value = attributes [name] as string;
	SetProperties (
		XmlNodeType.Attribute, // nodeType
		name, // name
		false, // isEmptyElement
		value, // value
		false // clearAttributes
	);
	// Restart ReadAttributeValue iteration for the new attribute.
	attributeValuePos = 0;
}
// Moves the reader to the attribute with the given qualified name.
// Returns true on success. When no such attribute exists the method returns
// false and leaves the reader position untouched.
//
// The lookup is done before any state is changed. Previously a failed
// search had already moved the reader back to the element and left an
// exhausted enumerator behind, so a following MoveToNextAttribute found
// nothing.
public override bool MoveToAttribute (string name)
{
	if (attributes == null)
		return false;

	// ArrayList.IndexOf compares with Equals, i.e. by string value.
	int idx = orderedAttributes.IndexOf (name);
	if (idx < 0)
		return false;

	// The index overload saves the element properties, positions the
	// enumerator and resets the attribute-value iteration state.
	MoveToAttribute (idx);
	return true;
}
// Moves the reader to the attribute identified by local name and namespace
// URI. Returns true on success. When no such attribute exists the method
// returns false and leaves the reader position untouched (previously the
// reader had already been moved back to the element before the lookup).
public override bool MoveToAttribute (string localName, string namespaceName)
{
	if (attributes == null)
		return false;

	int idx = GetIndexOfQualifiedAttribute (localName, namespaceName);
	if (idx < 0)
		return false;

	// The index overload moves back to the element itself before it
	// positions the reader on the attribute.
	MoveToAttribute (idx);
	return true;
}
// Leaves attribute iteration. Returns false when no attribute enumerator
// is active; otherwise drops the enumerator, restores the saved node
// properties if any were saved, and returns true.
public override bool MoveToElement ()
{
	if (orderedAttributesEnumerator == null)
		return false;

	orderedAttributesEnumerator = null;
	if (isPropertySaved)
		RestoreProperties ();
	return true;
}
// Resets attribute iteration via MoveToElement, then advances to the first
// attribute. Returns the result of MoveToNextAttribute.
public override bool MoveToFirstAttribute ()
{
	MoveToElement ();
	bool moved = MoveToNextAttribute ();
	return moved;
}
// Advances to the next attribute in document order. Starts a new iteration
// (saving the current node's properties) when none is active. Returns false
// when there is no attribute table or the enumerator is exhausted.
public override bool MoveToNextAttribute ()
{
	if (attributes == null)
		return false;

	if (orderedAttributesEnumerator == null) {
		SaveProperties ();
		orderedAttributesEnumerator = orderedAttributes.GetEnumerator ();
	}

	if (!orderedAttributesEnumerator.MoveNext ())
		return false;

	string attrName = orderedAttributesEnumerator.Current as string;
	string attrValue = attributes [attrName] as string;
	SetProperties (XmlNodeType.Attribute, attrName, false, attrValue, false);
	// Restart ReadAttributeValue iteration for the new attribute.
	attributeValuePos = 0;
	return true;
}
// Reads the next node. Returns the result of ReadContent.
public override bool Read ()
{
	isPropertySaved = false;
	readState = ReadState.Interactive;

	// The depth increase requested by the previous start tag is applied
	// here, so the start tag itself is still reported at the outer depth.
	// (It was moved from end of ReadStartTag ().)
	if (depthUp) {
		++depth;
		depthUp = false;
	}

	return ReadContent ();
}
// Splits the current attribute value into Text and EntityReference nodes,
// one per call. Returns false once the whole value has been consumed.
//
// 'attributeString' holds the real string value (without the quotation
// characters). 'attributeValuePos' is the current position within it:
//   -1 if ReadAttributeValue() has already finished,
//    0 if ReadAttributeValue() is ready to start reading,
//   >0 if ReadAttributeValue() has already returned one or more nodes.
//
// Changes from the previous version:
//  - an entity reference without a terminating ';' raises a reader error
//    instead of failing inside Substring with a negative length;
//  - the shared 'returnEntityReference' field is no longer left set (it is
//    also consulted by ReadContent, where a stale 'true' would produce a
//    bogus entity reference node); a local flag is used instead;
//  - an entity reference that ends the value no longer yields an extra
//    empty text node on the following call;
//  - the meaningless loop counter is gone.
public override bool ReadAttributeValue ()
{
	if (attributeValuePos < 0)
		return false;

	// If not started, then initialize attributeString by stripping the
	// quotation characters from the stored attribute value.
	if (attributeValuePos == 0)
		attributeString = value.Substring (1, value.Length - 2);

	returnEntityReference = false;
	bool isEntityReference = false;
	value = String.Empty;

	while (true) {
		int refPosition = attributeString.IndexOf ('&', attributeValuePos);

		if (refPosition < 0) {
			// Reached the end of the value string.
			value += attributeString.Substring (attributeValuePos);
			attributeValuePos = -1;
			break;
		}

		if (refPosition != attributeValuePos) {
			// Plain text up to the next '&'.
			value += attributeString.Substring (attributeValuePos,
				refPosition - attributeValuePos);
			attributeValuePos = refPosition;
			continue;
		}

		string parsed = ReadAttributeValueReference ();
		if (parsed != null) {
			value += parsed;
			continue;
		}

		// An entity reference starts at this point; reset the position
		// to the '&'.
		attributeValuePos = refPosition;
		if (value.Length <= 0) {
			int endNamePos = attributeString.IndexOf (';', attributeValuePos);
			if (endNamePos < 0)
				throw ReaderError ("Entity reference in attribute value is not terminated by ';'.");
			value = attributeString.Substring (attributeValuePos + 1, endNamePos - attributeValuePos - 1);
			attributeValuePos = endNamePos + 1;
			// Nothing left after the reference: finish on the next call.
			if (attributeValuePos >= attributeString.Length)
				attributeValuePos = -1;
			isEntityReference = true;
		}
		// Otherwise the text collected so far is returned now and the
		// reference is reported by the next call.
		break;
	}

	if (isEntityReference)
		SetProperties (XmlNodeType.EntityReference,
			value,
			false,
			String.Empty,
			false);
	else
		SetProperties (XmlNodeType.Text,
			"#text",
			false,
			value,
			false);

	return true;
}
// Not implemented yet: always throws NotImplementedException.
[MonoTODO]
public int ReadBase64 (byte [] buffer, int offset, int length)
{
	throw new NotImplementedException ();
}
// Not implemented yet: always throws NotImplementedException.
[MonoTODO]
public int ReadBinHex (byte [] buffer, int offset, int length)
{
	throw new NotImplementedException ();
}
// Not implemented yet: always throws NotImplementedException.
[MonoTODO]
public int ReadChars (char [] buffer, int offset, int length)
{
	throw new NotImplementedException ();
}
// Returns the markup of the current node's content.
//  - Not in Interactive state, or no current node: returns String.Empty
//    without moving.
//  - Attribute: returns the stored value without its quotation characters.
//  - Element: collects the markup of every node up to the matching end tag
//    and leaves the reader on the node after that end tag. An empty element
//    has no content; the reader now moves past it as well (previously it
//    stayed on the empty element).
//  - Any other node: advances one node and returns String.Empty.
// Throws XmlException when the input ends before the end tag is found.
public override string ReadInnerXml ()
{
	if (readState != ReadState.Interactive)
		return String.Empty;

	switch (NodeType) {
	case XmlNodeType.Attribute:
		return value.Substring (1, value.Length - 2);
	case XmlNodeType.Element:
		if (IsEmptyElement) {
			Read ();
			return String.Empty;
		}

		int startDepth = depth;

		// The builder is reused between calls.
		if (innerXmlBuilder == null)
			innerXmlBuilder = new StringBuilder ();
		innerXmlBuilder.Length = 0;

		while (true) {
			Read ();
			if (NodeType == XmlNodeType.None)
				throw new XmlException ("unexpected end of xml.");
			if (NodeType == XmlNodeType.EndElement && depth == startDepth) {
				// Matching end tag: step past it and stop.
				Read ();
				break;
			}
			innerXmlBuilder.Append (currentTag);
		}

		string xml = innerXmlBuilder.ToString ();
		innerXmlBuilder.Length = 0;
		return xml;
	case XmlNodeType.None:
		// MS document is incorrect. Seems not to progress.
		return String.Empty;
	default:
		Read ();
		return String.Empty;
	}
}
// Returns the markup of the current node including the node itself.
//  - Not in Interactive state, or no current node: returns String.Empty
//    without moving.
//  - Attribute: returns name=quote value quote.
//  - Element: returns start tag, inner markup and end tag, leaving the
//    reader after the end tag. For an empty element the tag itself is
//    returned and the reader now moves past it (previously it stayed on
//    the empty element).
//  - Any other node: advances one node and returns String.Empty.
public override string ReadOuterXml ()
{
	if (readState != ReadState.Interactive)
		return String.Empty;

	switch (NodeType) {
	case XmlNodeType.Attribute:
		// strictly incompatible with MS... (it holds spaces attribute between name, value and "=" char (very trivial).
		return String.Format ("{0}={1}{2}{1}", Name, QuoteChar, ReadInnerXml ());
	case XmlNodeType.Element:
		// Capture everything that describes the start tag first: the
		// markup buffer is reset by the next Read ().
		bool isEmpty = IsEmptyElement;
		string startTag = currentTag.ToString ();
		string name = Name;

		if (isEmpty) {
			Read ();
			return startTag;
		}
		return String.Format ("{0}{1}</{2}>", startTag, ReadInnerXml (), name);
	case XmlNodeType.None:
		// MS document is incorrect. Seems not to progress.
		return String.Empty;
	default:
		Read ();
		return String.Empty;
	}
}
// Delegates to ReadStringInternal.
public override string ReadString ()
{
	string text = ReadStringInternal ();
	return text;
}
// Not implemented yet: always throws NotImplementedException.
[MonoTODO]
public void ResetState ()
{
	throw new NotImplementedException ();
}
// XmlTextReaders don't resolve entities, so this always throws
// InvalidOperationException.
public override void ResolveEntity ()
{
	throw new InvalidOperationException ("XmlTextReader cannot resolve external entities.");
}
- #endregion
- #region Internals
- // Parsed DTD Objects
- internal DTDObjectModel currentSubset;
- #endregion
- #region Privates
- private XmlParserContext parserContext;
- private XmlParserInput currentInput;
- private Stack parserInputStack = new Stack ();
- private ReadState readState;
- private int depth;
- private int elementDepth;
- private bool depthUp;
- private bool popScope;
- private Stack elementStack;
- private bool haveEnteredDocument;
- private bool allowMultipleRoot = false;
- private XmlNodeType nodeType;
- private string name;
- private string prefix;
- private string localName;
- private string namespaceURI;
- private bool isEmptyElement;
- private string value;
- private bool isPropertySaved;
- private XmlNodeType saveNodeType;
- private string saveName;
- private string savePrefix;
- private string saveLocalName;
- private string saveNamespaceURI;
- private bool saveIsEmptyElement;
- private Hashtable attributes;
- private ArrayList orderedAttributes;
- private IEnumerator orderedAttributesEnumerator;
- private bool returnEntityReference;
- private string entityReferenceName;
- private char [] nameBuffer;
- private int nameLength;
- private int nameCapacity;
- private const int initialNameCapacity = 256;
- private char [] valueBuffer;
- private int valueLength;
- private int valueCapacity;
- private const int initialValueCapacity = 8192;
- // A buffer for ReadContent for ReadOuterXml
// Markup buffer exposed by the current parser input.
private StringBuilder currentTag {
	get { return currentInput.CurrentMarkup; }
}
- private string attributeString = String.Empty;
- private int attributeValuePos;
- // This should be only referenced(used) by ReadInnerXml(). Kind of flyweight pattern.
- private StringBuilder innerXmlBuilder;
- // Parameter entity placeholder
- private Hashtable parameterEntities = new Hashtable ();
- int dtdIncludeSect;
- private XmlResolver resolver = new XmlUrlResolver ();
- private bool namespaces = true;
// Builds (but does not throw) an XmlException carrying the current line
// number and line position.
private XmlException ReaderError (string message)
{
	XmlException error = new XmlException (message, LineNumber, LinePosition);
	return error;
}
// Puts all per-document parser state into its initial condition and
// allocates fresh attribute tables and name/value buffers.
private void Init ()
{
	readState = ReadState.Initial;

	depth = 0;
	depthUp = false;

	popScope = false;
	elementStack = new Stack ();

	haveEnteredDocument = false;

	nodeType = XmlNodeType.None;
	name = String.Empty;
	prefix = String.Empty;
	localName = string.Empty;
	// Was left unset, so NamespaceURI returned null before the first read
	// while the other name properties returned the empty string.
	namespaceURI = String.Empty;
	isEmptyElement = false;
	value = String.Empty;

	attributes = new Hashtable ();
	orderedAttributes = new ArrayList ();
	orderedAttributesEnumerator = null;

	returnEntityReference = false;
	entityReferenceName = String.Empty;

	nameBuffer = new char [initialNameCapacity];
	nameLength = 0;
	nameCapacity = initialNameCapacity;

	valueBuffer = new char [initialValueCapacity];
	valueLength = 0;
	valueCapacity = initialValueCapacity;
}
// Shared set-up used by the constructors.
//  url      - when non-empty, resolved against the current directory (as a
//             file URI) and stored as the base URI of the parser context.
//  context  - parser context to use; a default one with a new NameTable is
//             created when this is null.
//  fragment - text source the parser input is created from.
//  fragType - Document, Element (multiple roots allowed) or Attribute;
//             anything else raises XmlException.
private void InitializeContext (string url, XmlParserContext context, TextReader fragment, XmlNodeType fragType)
{
	parserContext = context;
	if (context == null) {
		XmlNameTable nt = new NameTable ();
		parserContext = new XmlParserContext (nt,
			new XmlNamespaceManager (nt),
			String.Empty,
			XmlSpace.None);
	}

	if (url != null && url != String.Empty) {
		string path = Path.GetFullPath (".");
		UriBuilder ub = new UriBuilder (path);
		ub.Scheme = "file";
		parserContext.BaseURI = new Uri (ub.Uri, url).ToString ();
	}

	Init ();

	switch (fragType) {
	case XmlNodeType.Attribute:
		// The stored attribute value carries its quotation characters, so
		// the fragment is wrapped in apostrophes; apostrophes inside the
		// text must be escaped or they would end the value early.
		// (The replacement string had degenerated into a plain apostrophe,
		// which made the Replace call a no-op.)
		value = String.Format ("{0}{1}{0}", "'", fragment.ReadToEnd ().Replace ("'", "&apos;"));
		break;
	case XmlNodeType.Element:
		allowMultipleRoot = true;
		break;
	case XmlNodeType.Document:
		break;
	default:
		throw new XmlException (String.Format ("NodeType {0} is not allowed to create XmlTextReader.", fragType));
	}

	this.currentInput = new XmlParserInput (fragment, url);
}
- // Use this method rather than setting the properties
- // directly so that all the necessary properties can
- // be changed in harmony with each other. Maybe the
- // fields should be in a separate class to help enforce
- // this.
// Updates every node-describing field in one step: node type, name, empty
// flag, value and recorded depth, then the derived prefix, local name and
// namespace URI. The attribute tables are cleared first when
// 'clearAttributes' is set.
private void SetProperties (
	XmlNodeType nodeType,
	string name,
	bool isEmptyElement,
	string value,
	bool clearAttributes)
{
	this.nodeType = nodeType;
	this.name = name;
	this.isEmptyElement = isEmptyElement;
	this.value = value;
	this.elementDepth = depth;

	if (clearAttributes)
		ClearAttributes ();

	// Names are split at the first colon only when namespace support is on.
	int colonAt = namespaces ? name.IndexOf (':') : -1;
	if (colonAt == -1) {
		prefix = String.Empty;
		localName = name;
	} else {
		prefix = name.Substring (0, colonAt);
		localName = name.Substring (colonAt + 1);
	}

	if (nodeType == XmlNodeType.Attribute) {
		// Unprefixed attributes are in no namespace, except the bare
		// "xmlns" declaration.
		if (prefix == string.Empty)
			namespaceURI = string.Empty;
		else
			namespaceURI = LookupNamespace (prefix);
		if (localName == "xmlns" && prefix == "")
			namespaceURI = "http://www.w3.org/2000/xmlns/";
	} else if (nodeType == XmlNodeType.Element || nodeType == XmlNodeType.EndElement) {
		namespaceURI = LookupNamespace (prefix);
	} else {
		namespaceURI = "";
	}
}
// Snapshots the node-describing fields so RestoreProperties can bring them
// back. Does nothing when a snapshot already exists. The value is not
// saved; RestoreProperties resets it to String.Empty.
private void SaveProperties ()
{
	if (!isPropertySaved) {
		saveNodeType = nodeType;
		saveName = name;
		savePrefix = prefix;
		saveLocalName = localName;
		saveNamespaceURI = namespaceURI;
		saveIsEmptyElement = isEmptyElement;
		isPropertySaved = true;
	}
}
// Brings back the fields captured by SaveProperties, resets the value to
// String.Empty and marks the snapshot as consumed.
private void RestoreProperties ()
{
	nodeType = saveNodeType;
	isEmptyElement = saveIsEmptyElement;

	name = saveName;
	prefix = savePrefix;
	localName = saveLocalName;
	namespaceURI = saveNamespaceURI;

	value = String.Empty;
	isPropertySaved = false;
}
// Registers an attribute in the name-to-value table and appends its name to
// the document-order list.
private void AddAttribute (string name, string value)
{
	this.attributes.Add (name, value);
	this.orderedAttributes.Add (name);
}
// Empties both attribute collections (skipped when there are no attributes)
// and drops any active attribute enumerator.
private void ClearAttributes ()
{
	bool hasAttributes = attributes.Count > 0;
	if (hasAttributes) {
		attributes.Clear ();
		orderedAttributes.Clear ();
	}

	orderedAttributesEnumerator = null;
}
// Forwards to PeekChar on the current parser input.
private int PeekChar ()
{
	int next = currentInput.PeekChar ();
	return next;
}
// Forwards to ReadChar on the current parser input.
private int ReadChar ()
{
	int ch = currentInput.ReadChar ();
	return ch;
}
- // This should really keep track of some state so
- // that it's not possible to have more than one document
- // element or text outside of the document element.
// Reads one node of content, dispatching on the next input character.
// Returns false once the reader has reached the EndOfFile state.
// Throws XmlException when the input ends while elements are still open.
private bool ReadContent ()
{
	// Start collecting markup for the new node.
	currentTag.Length = 0;

	// A pending namespace scope pop requested by the previous node.
	if (popScope) {
		parserContext.NamespaceManager.PopScope ();
		popScope = false;
	}

	if (returnEntityReference) {
		SetEntityReferenceProperties ();
		return this.ReadState != ReadState.EndOfFile;
	}

	switch (PeekChar ()) {
	case '<':
		ReadChar ();
		ReadTag ();
		break;
	case '\r':
	case '\n':
	case '\t':
	case ' ':
		// Whitespace is either reported as a node or skipped, depending
		// on the WhitespaceHandling setting.
		if (whitespaceHandling != WhitespaceHandling.All &&
			whitespaceHandling != WhitespaceHandling.Significant) {
			SkipWhitespace ();
			return ReadContent ();
		}
		return ReadWhitespace ();
	case -1:
		if (depth > 0)
			throw new XmlException ("unexpected end of file. Current depth is " + depth);
		readState = ReadState.EndOfFile;
		SetProperties (XmlNodeType.None, String.Empty, false, String.Empty, true);
		break;
	default:
		ReadText (true);
		break;
	}

	return this.ReadState != ReadState.EndOfFile;
}
- // Reports the pending entity reference as the current node, then clears
- // the pending flag and name.
- private void SetEntityReferenceProperties ()
- {
-     string referenceName = entityReferenceName;
-     // Arguments: nodeType, name, isEmptyElement, value, clearAttributes.
-     SetProperties (XmlNodeType.EntityReference, referenceName, false, String.Empty, true);
-     returnEntityReference = false;
-     entityReferenceName = String.Empty;
- }
- // The leading '<' has already been consumed.
- // Dispatches on the following character: '/' end tag, '?' processing
- // instruction, '!' declaration, anything else a start tag.
- private void ReadTag ()
- {
-     int marker = PeekChar ();
-     if (marker == '/') {
-         ReadChar ();
-         ReadEndTag ();
-     } else if (marker == '?') {
-         ReadChar ();
-         ReadProcessingInstruction ();
-     } else if (marker == '!') {
-         ReadChar ();
-         ReadDeclaration ();
-     } else {
-         // The name character is left in place for ReadStartTag.
-         ReadStartTag ();
-     }
- }
- // The leading '<' has already been consumed.
- // Reads the element name and attributes, handles "/>" versus ">", and
- // reports the Element node. For a non-empty element the name is pushed
- // on the element stack and xml:base / xml:lang / xml:space are applied
- // to the parser context.
- private void ReadStartTag ()
- {
-     parserContext.NamespaceManager.PushScope ();
-     string elementName = ReadName ();
-     bool rootAlreadyClosed =
-         haveEnteredDocument && elementStack.Count == 0 && !allowMultipleRoot;
-     if (rootAlreadyClosed)
-         throw ReaderError("document has terminated, cannot open new element");
-     haveEnteredDocument = true;
-     ClearAttributes ();
-     SkipWhitespace ();
-     if (XmlConstructs.IsNameStart (PeekChar ()))
-         ReadAttributes (false);
-     bool selfClosing = PeekChar () == '/';
-     if (selfClosing) {
-         ReadChar ();
-         // The namespace scope pushed above is popped on the next read.
-         popScope = true;
-     } else {
-         depthUp = true;
-         elementStack.Push (elementName);
-         string baseUri = GetAttribute ("xml:base");
-         if (baseUri != null)
-             parserContext.BaseURI = baseUri;
-         string xmlLang = GetAttribute ("xml:lang");
-         if (xmlLang != null)
-             parserContext.XmlLang = xmlLang;
-         string xmlSpaceAttr = GetAttribute ("xml:space");
-         if (xmlSpaceAttr != null) {
-             switch (xmlSpaceAttr) {
-             case "preserve":
-                 parserContext.XmlSpace = XmlSpace.Preserve;
-                 break;
-             case "default":
-                 parserContext.XmlSpace = XmlSpace.Default;
-                 break;
-             default:
-                 throw this.ReaderError (String.Format ("Invalid xml:space value: {0}", xmlSpaceAttr));
-             }
-         }
-         parserContext.PushScope ();
-     }
-     Expect ('>');
-     // Attributes are kept (clearAttributes = false) for the Element node.
-     SetProperties (XmlNodeType.Element, elementName, selfClosing, String.Empty, false);
- }
- // The reader is positioned on the first character
- // of the element's name.
- // Checks the name against the innermost open element, consumes up to
- // '>', decrements the depth and reports the EndElement node.
- private void ReadEndTag ()
- {
-     string closingName = ReadName ();
-     if (elementStack.Count == 0)
-         throw ReaderError("closing element without matching opening element");
-     string openName = (string)elementStack.Pop();
-     if (!String.Equals (openName, closingName))
-         throw ReaderError(String.Format ("unmatched closing element: expected {0} but found {1}", openName, closingName));
-     parserContext.PopScope ();
-     SkipWhitespace ();
-     Expect ('>');
-     depth--;
-     SetProperties (XmlNodeType.EndElement, closingName, false, String.Empty, true);
-     // The namespace scope is popped on the next read.
-     popScope = true;
- }
- // Appends one character to the name buffer, growing it first if full.
- private void AppendNameChar (int ch)
- {
-     CheckNameCapacity ();
-     nameBuffer [nameLength] = (char)ch;
-     nameLength++;
- }
- // Doubles the name buffer when it is exactly full, keeping its content.
- private void CheckNameCapacity ()
- {
-     if (nameLength != nameCapacity)
-         return;
-     nameCapacity = nameCapacity * 2;
-     char [] grown = new char [nameCapacity];
-     Array.Copy (nameBuffer, grown, nameLength);
-     nameBuffer = grown;
- }
- // Adds the buffered name characters to the parser context's name table
- // and returns the resulting string.
- private string CreateNameString ()
- {
-     string tableEntry = parserContext.NameTable.Add (nameBuffer, 0, nameLength);
-     return tableEntry;
- }
- // Appends one character to the value buffer, growing it first if full.
- private void AppendValueChar (int ch)
- {
-     CheckValueCapacity ();
-     valueBuffer [valueLength] = (char)ch;
-     valueLength++;
- }
- // Doubles the value buffer when it is exactly full, keeping its content.
- private void CheckValueCapacity ()
- {
-     if (valueLength != valueCapacity)
-         return;
-     valueCapacity = valueCapacity * 2;
-     char [] grown = new char [valueCapacity];
-     Array.Copy (valueBuffer, grown, valueLength);
-     valueBuffer = grown;
- }
- // Builds a string from the first valueLength characters of the value buffer.
- private string CreateValueString ()
- {
-     string text = new String (valueBuffer, 0, valueLength);
-     return text;
- }
- // The reader is positioned on the first character
- // of the text.
- // Accumulates text up to the next '<', end of input, or an entity
- // reference that has to be reported as its own node. When cleanValue is
- // false the text is appended to what the value buffer already holds.
- private void ReadText (bool cleanValue)
- {
-     if (cleanValue)
-         valueLength = 0;
-     for (int ch = PeekChar (); ch != '<' && ch != -1; ch = PeekChar ()) {
-         if (ch != '&') {
-             AppendValueChar (ReadChar ());
-             continue;
-         }
-         ReadChar ();
-         // true: the reference must be returned as an EntityReference node.
-         if (ReadReference (false))
-             break;
-     }
-     bool referenceOnly = returnEntityReference && valueLength == 0;
-     if (!referenceOnly)
-         SetProperties (XmlNodeType.Text, String.Empty, false, CreateValueString (), true);
-     else
-         SetEntityReferenceProperties ();
- }
- // The leading '&' has already been consumed.
- // Handles either a character reference ("#...") or a named entity
- // reference. The result is the returnEntityReference flag: true means
- // the reference was neither a character reference nor a predefined
- // entity, so the caller should stop and let the next Read report an
- // EntityReference node.
- private bool ReadReference (bool ignoreEntityReferences)
- {
-     bool isCharacterReference = PeekChar () == '#';
-     if (!isCharacterReference) {
-         ReadEntityReference (ignoreEntityReferences);
-     } else {
-         ReadChar ();
-         ReadCharacterReference ();
-     }
-     return returnEntityReference;
- }
- // The leading "&#" has already been consumed.
- // Parses a decimal ("&#NNN;") or hexadecimal ("&#xHHH;") character
- // reference and appends the referenced character to the value buffer.
- // Code points above U+FFFF are appended as a UTF-16 surrogate pair.
- // Throws a reader error on an invalid digit, on a value beyond U+10FFFF,
- // or (via Expect) when the terminating ';' is missing.
- private void ReadCharacterReference ()
- {
-     int value = 0;
-     if (PeekChar () == 'x') {
-         ReadChar ();
-         while (PeekChar () != ';' && PeekChar () != -1) {
-             int ch = ReadChar ();
-             if (ch >= '0' && ch <= '9')
-                 value = (value << 4) + ch - '0';
-             else if (ch >= 'A' && ch <= 'F')
-                 value = (value << 4) + ch - 'A' + 10;
-             else if (ch >= 'a' && ch <= 'f')
-                 value = (value << 4) + ch - 'a' + 10;
-             else
-                 throw ReaderError (
-                     String.Format (
-                         "invalid hexadecimal digit: {0} (#x{1:X})",
-                         (char)ch,
-                         ch));
-             // Checked per digit so that the accumulator can never overflow.
-             if (value > 0x10FFFF)
-                 throw ReaderError ("character reference is out of the Unicode range");
-         }
-     } else {
-         while (PeekChar () != ';' && PeekChar () != -1) {
-             int ch = ReadChar ();
-             if (ch >= '0' && ch <= '9')
-                 value = value * 10 + ch - '0';
-             else
-                 throw ReaderError (
-                     String.Format (
-                         "invalid decimal digit: {0} (#x{1:X})",
-                         (char)ch,
-                         ch));
-             if (value > 0x10FFFF)
-                 throw ReaderError ("character reference is out of the Unicode range");
-         }
-     }
-     // Reject an unterminated reference instead of silently reading past EOF.
-     Expect (';');
-     if (value > 0xFFFF) {
-         // A single char cannot hold a supplementary code point.
-         int offset = value - 0x10000;
-         AppendValueChar (0xD800 + (offset >> 10));
-         AppendValueChar (0xDC00 + (offset & 0x3FF));
-     } else {
-         AppendValueChar (value);
-     }
- }
- // The leading '&' has already been consumed.
- // Reads the entity name up to ';'. The five predefined entities are
- // appended to the value buffer as their character. Any other name is
- // either copied back literally as "&name;" (ignoreEntityReferences) or
- // recorded as a pending entity reference.
- private void ReadEntityReference (bool ignoreEntityReferences)
- {
-     nameLength = 0;
-     for (int ch = PeekChar (); ch != ';' && ch != -1; ch = PeekChar ())
-         AppendNameChar (ReadChar ());
-     Expect (';');
-     string entityName = CreateNameString ();
-     if (entityName == "lt") {
-         AppendValueChar ('<');
-     } else if (entityName == "gt") {
-         AppendValueChar ('>');
-     } else if (entityName == "amp") {
-         AppendValueChar ('&');
-     } else if (entityName == "apos") {
-         AppendValueChar ('\'');
-     } else if (entityName == "quot") {
-         AppendValueChar ('"');
-     } else if (!ignoreEntityReferences) {
-         returnEntityReference = true;
-         entityReferenceName = entityName;
-     } else {
-         AppendValueChar ('&');
-         for (int i = 0; i < entityName.Length; i++)
-             AppendValueChar (entityName [i]);
-         AppendValueChar (';');
-     }
- }
- // The reader is positioned on the first character of
- // the attribute name.
- // Reads name="value" pairs until '/', '>' or end of input (or '?' when
- // allowPIEnd is set). xmlns / xmlns:prefix attributes are also registered
- // with the namespace manager.
- private void ReadAttributes (bool allowPIEnd)
- {
-     // Set once an attribute was not followed by whitespace; a further
-     // attribute is then an error.
-     bool requireWhitespace = false;
-     while (true) {
-         bool skipped = SkipWhitespace ();
-         if (requireWhitespace && !skipped)
-             throw new XmlException ("Unexpected token. Name is required here.");
-         string attrName = ReadName ();
-         SkipWhitespace ();
-         Expect ('=');
-         SkipWhitespace ();
-         string attrValue = ReadAttribute ();
-         if (attrName == "xmlns")
-             parserContext.NamespaceManager.AddNamespace (String.Empty, UnescapeAttributeValue (attrValue));
-         else if (attrName.StartsWith ("xmlns:"))
-             parserContext.NamespaceManager.AddNamespace (attrName.Substring (6), UnescapeAttributeValue (attrValue));
-         AddAttribute (attrName, attrValue);
-         if (!XmlConstructs.IsSpace (PeekChar ()))
-             requireWhitespace = true;
-         else
-             SkipWhitespace ();
-         int next = PeekChar ();
-         if (allowPIEnd && next == '?')
-             break;
-         if (next == '/' || next == '>' || next == -1)
-             break;
-     }
- }
- // The reader is positioned on the quote character.
- // Returns the attribute value *including* its surrounding quote
- // characters, so that get_QuoteChar() can report the right one.
- private string ReadAttribute ()
- {
-     valueLength = 0;
-     int quoteChar = ReadChar ();
-     bool isQuote = quoteChar == '\'' || quoteChar == '\"';
-     if (!isQuote)
-         throw ReaderError ("an attribute value was not quoted");
-     AppendValueChar (quoteChar);
-     while (PeekChar () != quoteChar) {
-         int ch = ReadChar ();
-         if (ch == '<')
-             throw ReaderError ("attribute values cannot contain '<'");
-         if (ch == -1)
-             throw ReaderError ("unexpected end of file in an attribute value");
-         AppendValueChar (ch);
-     }
-     ReadChar (); // closing quoteChar
-     AppendValueChar (quoteChar);
-     return CreateValueString ();
- }
- // The reader is positioned on the first character
- // of the target.
- //
- // A target of "xml" is handed to ReadXmlDeclaration; anything else is
- // read up to "?>" (or end of input) and reported as a
- // ProcessingInstruction node.
- private void ReadProcessingInstruction ()
- {
-     string target = ReadName ();
-     if (target == "xml") {
-         ReadXmlDeclaration ();
-         return;
-     }
-     SkipWhitespace ();
-     valueLength = 0;
-     for (;;) {
-         if (PeekChar () == -1)
-             break;
-         int current = ReadChar ();
-         bool atTerminator = current == '?' && PeekChar () == '>';
-         if (atTerminator) {
-             ReadChar ();
-             break;
-         }
-         AppendValueChar ((char)current);
-     }
-     SetProperties (XmlNodeType.ProcessingInstruction, target, false, CreateValueString (), true);
- }
- // The reader is positioned after "<?xml "
- // Reads the pseudo-attributes, expects "?>" and reports an
- // XmlDeclaration node whose value is the current markup with its first
- // six characters removed.
- private void ReadXmlDeclaration ()
- {
-     ClearAttributes ();
-     ReadAttributes (true); // They must have "version."
-     Expect ("?>");
-     string declarationText = currentInput.CurrentMarkup.ToString (6, currentInput.CurrentMarkup.Length - 6);
-     // The attributes just read are kept (clearAttributes = false).
-     SetProperties (XmlNodeType.XmlDeclaration, "xml", false, declarationText, false);
- }
- // The reader is positioned on the first character after
- // the leading '<!'.
- // Dispatches to the comment ("--"), CDATA ("[CDATA[") or DOCTYPE reader.
- // Any other character is a syntax error; previously it was silently
- // ignored, which left the properties of the previous node in place.
- private void ReadDeclaration ()
- {
-     int ch = PeekChar ();
-     switch (ch)
-     {
-     case '-':
-         Expect ("--");
-         ReadComment ();
-         break;
-     case '[':
-         ReadChar ();
-         Expect ("CDATA[");
-         ReadCDATA ();
-         break;
-     case 'D':
-         Expect ("DOCTYPE");
-         ReadDoctypeDecl ();
-         break;
-     default:
-         throw ReaderError ("Syntax Error after '<!' characters.");
-     }
- }
- // The reader is positioned on the first character after
- // the leading '<!--'.
- // Collects the comment text up to "-->" (or end of input) and reports a
- // Comment node. A "--" not followed by '>' is an error.
- private void ReadComment ()
- {
-     valueLength = 0;
-     while (PeekChar () != -1) {
-         int current = ReadChar ();
-         if (current != '-' || PeekChar () != '-') {
-             AppendValueChar ((char)current);
-             continue;
-         }
-         ReadChar (); // second '-'
-         if (PeekChar () == '>') {
-             ReadChar ();
-             break;
-         }
-         throw ReaderError ("comments cannot contain '--'");
-     }
-     SetProperties (XmlNodeType.Comment, String.Empty, false, CreateValueString (), true);
- }
- // The reader is positioned on the first character after
- // the leading '<![CDATA['.
- //
- // Collects characters into the value buffer until the closing "]]>"
- // (or until end of input) and reports them as a CDATA node.
- private void ReadCDATA ()
- {
- valueLength = 0;
- // True when 'ch' already holds a ']' that was consumed while probing
- // for "]]>"; the next pass then re-tests it instead of reading anew.
- bool skip = false;
- int ch = 0;
- while (PeekChar () != -1) {
- if (!skip)
- ch = ReadChar ();
- skip = false;
- if (ch == ']' && PeekChar () == ']') {
- ch = ReadChar (); // ']'
- if (PeekChar () == '>') {
- ReadChar (); // '>'
- break;
- } else {
- // Not the terminator: the first ']' is appended below and the
- // second one (now in 'ch') is examined again on the next pass.
- skip = true;
- // AppendValueChar (']');
- // AppendValueChar (']');
- // ch = ReadChar ();
- }
- }
- AppendValueChar ((char)ch);
- }
- SetProperties (
- XmlNodeType.CDATA, // nodeType
- String.Empty, // name
- false, // isEmptyElement
- CreateValueString (), // value
- true // clearAttributes
- );
- }
- // The reader is positioned on the first character after
- // the leading '<!DOCTYPE'.
- //
- // Reads the doctype name, the optional external ID and the optional
- // internal subset, then compiles the internal subset and (when a system
- // id and a resolver are available) the external subset into
- // currentSubset. Finally reports a DocumentType node whose value is the
- // internal subset text.
- // Throws a reader error when an INCLUDE section of the internal subset
- // is left open.
- private void ReadDoctypeDecl ()
- {
-     string doctypeName = null;
-     string publicId = String.Empty;
-     string systemId = String.Empty;
-     int intSubsetStartLine = 0;
-     int intSubsetStartColumn = 0;
-     SkipWhitespace ();
-     doctypeName = ReadName ();
-     SkipWhitespace ();
-     switch(PeekChar ())
-     {
-     case 'S':
-         systemId = ReadSystemLiteral (true);
-         break;
-     case 'P':
-         publicId = ReadPubidLiteral ();
-         SkipWhitespace ();
-         systemId = ReadSystemLiteral (false);
-         break;
-     }
-     SkipWhitespace ();
-     if(PeekChar () == '[')
-     {
-         // read markupdecl etc. or end of decl
-         ReadChar ();
-         intSubsetStartLine = this.LineNumber;
-         intSubsetStartColumn = this.LinePosition;
-         int startPos = currentTag.Length;
-         ReadInternalSubset ();
-         // Length - 1 leaves out the closing ']' consumed by the call above.
-         int endPos = currentTag.Length - 1;
-         parserContext.InternalSubset = currentTag.ToString (startPos, endPos - startPos);
-     }
-     // end of DOCTYPE decl.
-     SkipWhitespace ();
-     Expect ('>');
-     // now compile DTD
-     currentSubset = new DTDObjectModel (); // merges both internal and external subsets in the meantime,
-     int originalParserDepth = parserInputStack.Count;
-     if (intSubsetStartLine > 0) {
-         // Re-parse the captured internal subset text from a string reader.
-         XmlParserInput original = currentInput;
-         currentInput = new XmlParserInput (new StringReader (parserContext.InternalSubset), BaseURI, intSubsetStartLine, intSubsetStartColumn);
-         do {
-             CompileDTDSubset ();
-             if (PeekChar () == -1 && parserInputStack.Count > 0)
-                 popParserInput ();
-         } while (nodeType != XmlNodeType.None || parserInputStack.Count > originalParserDepth);
-         // ReaderError only builds the exception; it has to be thrown.
-         if (dtdIncludeSect != 0)
-             throw this.ReaderError ("INCLUDE section is not ended correctly.");
-         currentInput = original;
-     }
-     if (systemId != String.Empty && resolver != null) {
-         pushParserInput (systemId);
-         do {
-             this.CompileDTDSubset ();
-             if (PeekChar () == -1 && parserInputStack.Count > 1)
-                 popParserInput ();
-         } while (nodeType != XmlNodeType.None || parserInputStack.Count > originalParserDepth + 1);
-         popParserInput ();
-     }
-     // set properties for <!DOCTYPE> node
-     SetProperties (
-         XmlNodeType.DocumentType, // nodeType
-         doctypeName, // name
-         false, // isEmptyElement
-         parserContext.InternalSubset, // value
-         true // clearAttributes
-     );
- }
- // Resolves url against BaseURI and makes the resolved document the
- // current input. The previous input is saved on parserInputStack and a
- // new parser-context scope is opened with the resolved location as its
- // BaseURI; popParserInput undoes both.
- // Throws a reader error when the resolved location equals the BaseURI of
- // an input already on the stack (nested inclusion).
- private void pushParserInput (string url)
- {
-     Uri baseUri = null;
-     try {
-         baseUri = new Uri (BaseURI);
-     } catch (UriFormatException) {
-         // BaseURI is not a valid URI: url is resolved with a null base.
-     }
-     Uri absUri = resolver.ResolveUri (baseUri, url);
-     string absPath = absUri.ToString ();
-     foreach (XmlParserInput i in parserInputStack.ToArray ()) {
-         // ReaderError only builds the exception; it has to be thrown.
-         if (i.BaseURI == absPath)
-             throw this.ReaderError ("Nested inclusion is not allowed: " + url);
-     }
-     parserInputStack.Push (currentInput);
-     currentInput = new XmlParserInput (new XmlStreamReader (absUri.ToString (), false), absPath);
-     parserContext.PushScope ();
-     parserContext.BaseURI = absPath;
- }
- // Makes the most recently saved input current again and closes the
- // matching parser-context scope.
- private void popParserInput ()
- {
-     object previous = parserInputStack.Pop ();
-     currentInput = previous as XmlParserInput;
-     parserContext.PopScope ();
- }
- // States tracked on the state stack while the internal subset is
- // scanned by ReadInternalSubset. Numbering starts at 1.
- private enum DtdInputState
- {
-     Free = 1,               // outside of any declaration
-     ElementDecl = 2,        // inside <!ELEMENT ...>
-     AttlistDecl = 3,        // inside <!ATTLIST ...>
-     EntityDecl = 4,         // inside <!ENTITY ...>
-     NotationDecl = 5,       // inside <!NOTATION ...>
-     PI = 6,                 // inside <? ... ?>
-     Comment = 7,            // inside <!-- ... -->
-     InsideSingleQuoted = 8, // inside a '...' literal
-     InsideDoubleQuoted = 9, // inside a "..." literal
- }
- // Typed wrapper around a Stack of DtdInputState values. A new instance
- // starts with DtdInputState.Free already pushed.
- private class DtdInputStateStack
- {
-     Stack states = new Stack ();
-     public DtdInputStateStack ()
-     {
-         this.Push (DtdInputState.Free);
-     }
-     // Returns the top state without removing it.
-     public DtdInputState Peek ()
-     {
-         object top = states.Peek ();
-         return (DtdInputState) top;
-     }
-     // Removes and returns the top state.
-     public DtdInputState Pop ()
-     {
-         object top = states.Pop ();
-         return (DtdInputState) top;
-     }
-     // Makes val the new top state.
-     public void Push (DtdInputState val)
-     {
-         states.Push (val);
-     }
- }
- // State stack consulted and updated by ReadInternalSubset.
- DtdInputStateStack stateStack = new DtdInputStateStack ();
- // The current state, i.e. the top of stateStack.
- DtdInputState State {
-     get {
-         DtdInputState current = stateStack.Peek ();
-         return current;
-     }
- }
- // Simply read but not generate any result.
- //
- // Consumes the internal subset character by character until the ']'
- // that is seen while the state is Free. Declarations, PIs, comments and
- // quoted literals are only tracked on stateStack so that ']', '<' and
- // '>' inside them are not misread; nothing is stored here.
- // Throws a reader error on end of input or on an unexpected token.
- private void ReadInternalSubset ()
- {
- bool continueParse = true;
- while (continueParse) {
- switch (ReadChar ()) {
- case ']':
- switch (State) {
- case DtdInputState.Free:
- // Top-level ']' terminates the internal subset.
- continueParse = false;
- break;
- case DtdInputState.InsideDoubleQuoted:
- continue;
- case DtdInputState.InsideSingleQuoted:
- continue;
- default:
- // NOTE(review): the message mentions end of file although a ']'
- // was read in a state that does not allow it.
- throw ReaderError ("unexpected end of file at DTD.");
- }
- break;
- case -1:
- throw ReaderError ("unexpected end of file at DTD.");
- case '<':
- if (State == DtdInputState.InsideDoubleQuoted ||
- State == DtdInputState.InsideSingleQuoted)
- continue; // well-formed
- // Identify the markup kind and push the matching state.
- switch (ReadChar ()) {
- case '?':
- stateStack.Push (DtdInputState.PI);
- break;
- case '!':
- switch (ReadChar ()) {
- case 'E':
- switch (ReadChar ()) {
- case 'L':
- Expect ("EMENT");
- stateStack.Push (DtdInputState.ElementDecl);
- break;
- case 'N':
- Expect ("TITY");
- stateStack.Push (DtdInputState.EntityDecl);
- break;
- default:
- throw ReaderError ("unexpected token '<!E'.");
- }
- break;
- case 'A':
- Expect ("TTLIST");
- stateStack.Push (DtdInputState.AttlistDecl);
- break;
- case 'N':
- Expect ("OTATION");
- stateStack.Push (DtdInputState.NotationDecl);
- break;
- case '-':
- Expect ("-");
- stateStack.Push (DtdInputState.Comment);
- break;
- }
- break;
- default:
- // NOTE(review): the message names '>' although the offending
- // character is whatever followed '<'.
- throw ReaderError ("unexpected '>'.");
- }
- break;
- case '\'':
- // A quote closes the literal of its own kind; otherwise it opens
- // one unless another literal or a comment is in progress.
- if (State == DtdInputState.InsideSingleQuoted)
- stateStack.Pop ();
- else if (State != DtdInputState.InsideDoubleQuoted && State != DtdInputState.Comment)
- stateStack.Push (DtdInputState.InsideSingleQuoted);
- break;
- case '"':
- if (State == DtdInputState.InsideDoubleQuoted)
- stateStack.Pop ();
- else if (State != DtdInputState.InsideSingleQuoted && State != DtdInputState.Comment)
- stateStack.Push (DtdInputState.InsideDoubleQuoted);
- break;
- case '>':
- switch (State) {
- case DtdInputState.ElementDecl:
- goto case DtdInputState.NotationDecl;
- case DtdInputState.AttlistDecl:
- goto case DtdInputState.NotationDecl;
- case DtdInputState.EntityDecl:
- goto case DtdInputState.NotationDecl;
- case DtdInputState.NotationDecl:
- // End of the current markup declaration.
- stateStack.Pop ();
- break;
- case DtdInputState.InsideDoubleQuoted:
- continue;
- case DtdInputState.InsideSingleQuoted:
- continue; // well-formed
- case DtdInputState.Comment:
- continue;
- default:
- throw ReaderError ("unexpected token '>'");
- }
- break;
- case '?':
- // "?>" ends a processing instruction.
- if (State == DtdInputState.PI) {
- if (ReadChar () == '>')
- stateStack.Pop ();
- }
- break;
- case '-':
- // "--" inside a comment must be followed by '>' and ends it.
- if (State == DtdInputState.Comment) {
- if (PeekChar () == '-') {
- ReadChar ();
- Expect ('>');
- stateStack.Pop ();
- }
- }
- break;
- case '%':
- if (State != DtdInputState.Free && State != DtdInputState.EntityDecl && State != DtdInputState.Comment && State != DtdInputState.InsideDoubleQuoted && State != DtdInputState.InsideSingleQuoted)
- throw ReaderError ("Parameter Entity Reference cannot appear as a part of markupdecl (see XML spec 2.8).");
- break;
- }
- }
- }
- // Reads one of the following from the DTD input:
- // elementdecl, AttlistDecl, EntityDecl, NotationDecl,
- // PI, Comment, Parameter Entity reference, or the "]]>" that ends an
- // INCLUDE section.
- //
- // Nothing is returned; at end of input nodeType is set to
- // XmlNodeType.None, which the callers use as their stop signal.
- private void CompileDTDSubset()
- {
-     SkipWhitespace ();
-     int next = PeekChar ();
-     if (next == -1) {
-         nodeType = XmlNodeType.None;
-         return;
-     }
-     if (next == '%') {
-         TryExpandPERef ();
-         return;
-     }
-     if (next == '<') {
-         ReadChar ();
-         int marker = ReadChar ();
-         if (marker == '?') {
-             // Only read, no store.
-             ReadProcessingInstruction ();
-         } else if (marker == '!') {
-             CompileDeclaration ();
-         } else {
-             throw ReaderError ("Syntax Error after '<' character.");
-         }
-         return;
-     }
-     if (next == ']') {
-         // End of inclusion
-         Expect ("]]>");
-         dtdIncludeSect--;
-         SkipWhitespace ();
-         return;
-     }
-     throw ReaderError (String.Format ("Syntax Error inside doctypedecl markup : {0}({1})", PeekChar (), (char) PeekChar ()));
- }
- // The leading '<!' has already been consumed.
- // Reads one markup declaration (comment, ENTITY, ELEMENT, ATTLIST,
- // NOTATION or the start of a conditional section) and records the
- // result in currentSubset / parameterEntities.
- // Throws a reader error when the characters after '<!' match none of
- // these.
- private void CompileDeclaration ()
- {
-     nodeType = XmlNodeType.DocumentType; // Hack!!
-     switch(ReadChar ())
-     {
-     case '-':
-         Expect ('-');
-         // Only read, no store.
-         ReadComment ();
-         break;
-     case 'E':
-         switch(ReadChar ())
-         {
-         case 'N':
-             Expect ("TITY");
-             SkipWhitespace ();
-         LOOPBACK:
-             if (PeekChar () == '%') {
-                 ReadChar ();
-                 if (!XmlConstructs.IsSpace (PeekChar ())) {
-                     // '%' directly followed by a name is a PE reference:
-                     // expand it and look at the declaration again.
-                     ExpandPERef ();
-                     goto LOOPBACK;
-                 } else {
-                     // "% name" declares a parameter entity.
-                     SkipWhitespace ();
-                     TryExpandPERef ();
-                     if (XmlConstructs.IsName (PeekChar ()))
-                         ReadParameterEntityDecl ();
-                     else
-                         throw ReaderError ("expected name character");
-                 }
-                 break;
-             }
-             DTDEntityDeclaration ent = ReadEntityDecl ();
-             // The first declaration of an entity wins.
-             if (currentSubset.EntityDecls [ent.Name] == null)
-                 currentSubset.EntityDecls.Add (ent.Name, ent);
-             break;
-         case 'L':
-             Expect ("EMENT");
-             DTDElementDeclaration el = ReadElementDecl ();
-             currentSubset.ElementDecls.Add (el.Name, el);
-             break;
-         default:
-             throw ReaderError ("Syntax Error after '<!E' (ELEMENT or ENTITY must be found)");
-         }
-         break;
-     case 'A':
-         Expect ("TTLIST");
-         DTDAttListDeclaration atl = ReadAttListDecl ();
-         // ReadAttListDecl hands back the already registered declaration
-         // when one exists, so only a new one has to be added. (The test
-         // used to be inverted, which never stored new declarations.)
-         if (!currentSubset.AttListDecls.ContainsKey (atl.Name))
-             currentSubset.AttListDecls.Add (atl.Name, atl);
-         break;
-     case 'N':
-         Expect ("OTATION");
-         DTDNotationDeclaration not = ReadNotationDecl ();
-         currentSubset.NotationDecls.Add (not.Name, not);
-         break;
-     case '[':
-         // conditional sections
-         SkipWhitespace ();
-         TryExpandPERef ();
-         SkipWhitespace ();
-         Expect ('I');
-         switch (ReadChar ()) {
-         case 'N':
-             Expect ("CLUDE");
-             SkipWhitespace ();
-             Expect ('[');
-             dtdIncludeSect++;
-             break;
-         case 'G':
-             Expect ("NORE");
-             ReadIgnoreSect ();
-             break;
-         }
-         break;
-     default:
-         throw ReaderError ("Syntax Error after '<!' characters.");
-     }
- }
- // The reader is positioned after "<![IGNORE".
- // Skips an IGNORE conditional section, including nested "<![ ... ]]>"
- // sections, up to and including the matching "]]>".
- // Throws a reader error when the input ends first.
- //
- // Delimiters are detected by peeking, so a '<' or ']' that does not
- // complete a delimiter is never swallowed together with the character
- // that follows it (e.g. "]]]>" and "<<![" are recognised).
- private void ReadIgnoreSect ()
- {
-     SkipWhitespace ();
-     Expect ('[');
-     int dtdIgnoreSect = 1;
-     while (dtdIgnoreSect > 0) {
-         switch (ReadChar ()) {
-         case -1:
-             throw ReaderError ("Unexpected IGNORE section end.");
-         case '<':
-             if (PeekChar () == '!') {
-                 ReadChar ();
-                 if (PeekChar () == '[') {
-                     ReadChar ();
-                     dtdIgnoreSect++;
-                 }
-             }
-             break;
-         case ']':
-             if (PeekChar () == ']') {
-                 ReadChar ();
-                 // In a run of ']' only the last two can belong to "]]>".
-                 while (PeekChar () == ']')
-                     ReadChar ();
-                 if (PeekChar () == '>') {
-                     ReadChar ();
-                     dtdIgnoreSect--;
-                 }
-             }
-             break;
-         }
-     }
- }
- // The reader is positioned on the head of the name.
- // Reads "name contentspec >" of an ELEMENT declaration, expanding a
- // parameter entity reference in front of either part.
- private DTDElementDeclaration ReadElementDecl ()
- {
-     DTDElementDeclaration element = new DTDElementDeclaration ();
-     // Element name.
-     SkipWhitespace ();
-     TryExpandPERef ();
-     element.Name = ReadName ();
-     // Content specification.
-     SkipWhitespace ();
-     TryExpandPERef ();
-     ReadContentSpec (element);
-     // Closing '>'.
-     SkipWhitespace ();
-     Expect ('>');
-     return element;
- }
- // Reads the contentspec of an element declaration into decl:
- // "EMPTY", "ANY", mixed content ("(#PCDATA | name ...)") or
- // 'children' (BNF). Any other leading character leaves decl untouched.
- private void ReadContentSpec (DTDElementDeclaration decl)
- {
- switch(PeekChar ())
- {
- case 'E':
- decl.IsEmpty = true;
- Expect ("EMPTY");
- break;
- case 'A':
- decl.IsAny = true;
- Expect ("ANY");
- break;
- case '(':
- DTDContentModel model = decl.ContentModel;
- ReadChar ();
- SkipWhitespace ();
- TryExpandPERef ();
- if(PeekChar () == '#') {
- // Mixed Contents
- decl.IsMixedContent = true;
- Expect ("#PCDATA");
- SkipWhitespace ();
- TryExpandPERef ();
- SkipWhitespace ();
- // Each further alternative is "| name".
- while(PeekChar () != ')') {
- Expect('|');
- SkipWhitespace ();
- TryExpandPERef ();
- SkipWhitespace ();
- model.ChildModels.Add (ReadName ());
- SkipWhitespace ();
- TryExpandPERef ();
- }
- Expect (')');
- // The trailing '*' is consumed but not recorded on the model.
- if(PeekChar () == '*')
- ReadChar (); // ZeroOrMore
- } else {
- // Non-Mixed Contents
- model.ChildModels.Add (ReadCP ());
- SkipWhitespace ();
- do { // copied from ReadCP() ...;-)
- TryExpandPERef ();
- SkipWhitespace ();
- if(PeekChar ()=='|') {
- // CPType=Or
- model.OrderType = DTDContentOrderType.Or;
- ReadChar ();
- SkipWhitespace ();
- model.ChildModels.Add (ReadCP ());
- SkipWhitespace ();
- }
- else if(PeekChar () == ',')
- {
- // CPType=Seq
- model.OrderType = DTDContentOrderType.Seq;
- ReadChar ();
- SkipWhitespace ();
- model.ChildModels.Add (ReadCP ());
- SkipWhitespace ();
- }
- else
- break;
- }
- while(true);
- Expect (')');
- // Occurrence indicator: '?' zero or one, '*' zero or more,
- // '+' one or more.
- switch(PeekChar ())
- {
- case '?':
- model.MinOccurs = 0;
- ReadChar ();
- break;
- case '*':
- model.MinOccurs = 0;
- model.MaxOccurs = decimal.MaxValue;
- ReadChar ();
- break;
- case '+':
- model.MaxOccurs = decimal.MaxValue;
- ReadChar ();
- break;
- }
- SkipWhitespace ();
- }
- SkipWhitespace ();
- break;
- }
- }
- // Read 'cp' (BNF) of contentdecl (BNF)
- //
- // A cp is either a parenthesised choice/sequence of cps (read
- // recursively) or a single element name, optionally followed by an
- // occurrence indicator ('?', '*' or '+'). Returns the content model
- // built for it.
- private DTDContentModel ReadCP ()
- {
- DTDContentModel model = new DTDContentModel ();
- TryExpandPERef ();
- if(PeekChar () == '(') {
- ReadChar ();
- SkipWhitespace ();
- model.ChildModels.Add (ReadCP ());
- SkipWhitespace ();
- // Further members are separated by '|' (choice) or ',' (sequence).
- do {
- TryExpandPERef ();
- SkipWhitespace ();
- if(PeekChar ()=='|') {
- // CPType=Or
- model.OrderType = DTDContentOrderType.Or;
- ReadChar ();
- SkipWhitespace ();
- model.ChildModels.Add (ReadCP ());
- SkipWhitespace ();
- }
- else if(PeekChar () == ',') {
- // CPType=Seq
- model.OrderType = DTDContentOrderType.Seq;
- ReadChar ();
- SkipWhitespace ();
- model.ChildModels.Add (ReadCP ());
- SkipWhitespace ();
- }
- else
- break;
- }
- while(true);
- SkipWhitespace ();
- Expect (')');
- }
- else {
- TryExpandPERef ();
- model.ElementName = ReadName ();
- }
- // Occurrence indicator: '?' zero or one, '*' zero or more,
- // '+' one or more.
- switch(PeekChar ()) {
- case '?':
- model.MinOccurs = 0;
- ReadChar ();
- break;
- case '*':
- model.MinOccurs = 0;
- model.MaxOccurs = decimal.MaxValue;
- ReadChar ();
- break;
- case '+':
- model.MaxOccurs = decimal.MaxValue;
- ReadChar ();
- break;
- }
- return model;
- }
- // The reader is positioned on the first name char.
- //
- // Reads a parameter entity declaration: either an external ID
- // (SYSTEM / PUBLIC) or a quoted literal value. The declaration is added
- // to parameterEntities unless that name is already present.
- private void ReadParameterEntityDecl ()
- {
- DTDParameterEntityDeclaration decl =
- new DTDParameterEntityDeclaration();
- decl.BaseURI = BaseURI;
- decl.Name = ReadName ();
- SkipWhitespace ();
- if (PeekChar () == 'S' || PeekChar () == 'P') {
- // throw new NotImplementedException ("External parameter entity reference is not implemented yet.");
- // read publicId/systemId
- ReadExternalID ();
- // The ids are picked up from the "PUBLIC" / "SYSTEM" entries of
- // the attributes table after ReadExternalID has run.
- decl.PublicId = attributes ["PUBLIC"] as string;
- decl.SystemId = attributes ["SYSTEM"] as string;
- SkipWhitespace ();
- }
- else {
- TryExpandPERef ();
- int quoteChar = ReadChar ();
- // The value is taken from currentTag starting at this offset.
- int start = currentTag.Length;
- while (true) {
- SkipWhitespace ();
- int c = PeekChar ();
- if ((int) c == -1)
- throw new XmlException ("unexpected end of stream in entity value definition.");
- switch (c) {
- case '"':
- ReadChar ();
- if (quoteChar == '"') goto SKIP;
- break;
- case '\'':
- ReadChar ();
- if (quoteChar == '\'') goto SKIP;
- break;
- case '%':
- // A nested PE reference is replaced inside currentTag.
- ImportAsPERef ();
- break;
- default:
- ReadChar ();
- break;
- }
- }
- SKIP:
- // The "- 1" leaves the closing quote out of the value.
- decl.Value = currentTag.ToString (start, currentTag.Length - start - 1);
- }
- SkipWhitespace ();
- Expect ('>');
- // The first declaration of a parameter entity wins.
- if (parameterEntities [decl.Name] == null) {
- parameterEntities.Add (decl.Name, decl);
- }
- }
- // reader is positioned on '%'
- // Reads a parameter entity reference ("%name;") and replaces its text
- // in currentTag with the dereferenced replacement text: the declared
- // value, or for an external entity the full content of the resource its
- // system id points to.
- // Throws a reader error when the parameter entity is not declared.
- private void ImportAsPERef ()
- {
-     int peRefStart = currentTag.Length;
-     string appendStr;
-     ReadChar ();
-     string peName = ReadName ();
-     Expect (';');
-     DTDParameterEntityDeclaration peDecl =
-         this.parameterEntities [peName] as DTDParameterEntityDeclaration;
-     if (peDecl == null)
-         throw ReaderError ("Parameter entity " + peName + " not found.");
-     if (peDecl.SystemId != null) {
-         pushParserInput (peDecl.SystemId);
-         StringBuilder sb = new StringBuilder ();
-         // ReadChar returns an int; without the cast Append (int) would
-         // append the decimal digits of the code instead of the character.
-         while (PeekChar () != -1)
-             sb.Append ((char) ReadChar ());
-         popParserInput ();
-         appendStr = sb.ToString ();
-     } else {
-         appendStr = peDecl.Value;
-     }
-     // Drop what was recorded since the '%' and put the replacement there.
-     currentTag.Remove (peRefStart,
-         currentTag.Length - peRefStart);
-     currentTag.Append (Dereference (appendStr));
- }
- // The reader is positioned on the head of the name.
- // Reads a general entity declaration: either an external ID with an
- // optional NDATA notation name, or a quoted entity value.
- private DTDEntityDeclaration ReadEntityDecl ()
- {
-     DTDEntityDeclaration entity = new DTDEntityDeclaration ();
-     entity.Name = ReadName ();
-     SkipWhitespace ();
-     TryExpandPERef ();
-     SkipWhitespace ();
-     bool isExternal = PeekChar () == 'S' || PeekChar () == 'P';
-     if (!isExternal) {
-         // general entity
-         entity.EntityValue = ReadEntityValueDecl ();
-     } else {
-         // external entity: ids come from the attributes table entries
-         ReadExternalID ();
-         entity.PublicId = attributes ["PUBLIC"] as string;
-         entity.SystemId = attributes ["SYSTEM"] as string;
-         SkipWhitespace ();
-         if (PeekChar () == 'N') {
-             // NDataDecl
-             Expect ("NDATA");
-             SkipWhitespace ();
-             entity.NotationName = ReadName (); // ndata_name
-         }
-     }
-     SkipWhitespace ();
-     Expect ('>');
-     return entity;
- }
- // Reads a quoted entity value and returns its dereferenced text. The
- // text is taken from currentTag between the opening and closing quote;
- // parameter entity references inside it are replaced in place.
- private string ReadEntityValueDecl ()
- {
-     SkipWhitespace ();
-     // quotation char will be finally removed on unescaping
-     int quoteChar = ReadChar ();
-     int start = currentTag.Length;
-     bool isQuote = quoteChar == '\'' || quoteChar == '"';
-     if (!isQuote)
-         throw new XmlException ("quotation char was expected.");
-     for (;;) {
-         if (PeekChar () == quoteChar)
-             break;
-         int next = PeekChar ();
-         if (next == '%') {
-             this.ImportAsPERef ();
-         } else if (next == '&') {
-             ReadChar ();
-             ReadReference (true);
-         } else if (next == -1) {
-             throw new XmlException ("unexpected end of stream.");
-         } else {
-             ReadChar ();
-         }
-     }
-     string value = Dereference (currentTag.ToString (start, currentTag.Length - start));
-     Expect (quoteChar);
-     return value;
- }
- // Reads an ATTLIST declaration. When the current subset already holds a
- // declaration for the target element, that one is extended; otherwise a
- // new one is created. For each attribute name only the first definition
- // is kept.
- private DTDAttListDeclaration ReadAttListDecl ()
- {
-     SkipWhitespace ();
-     TryExpandPERef ();
-     string elementName = ReadName (); // target element name
-     DTDAttListDeclaration attList =
-         currentSubset.AttListDecls [elementName] as DTDAttListDeclaration;
-     if (attList == null)
-         attList = new DTDAttListDeclaration ();
-     attList.Name = elementName;
-     SkipWhitespace ();
-     TryExpandPERef ();
-     SkipWhitespace ();
-     for (;;) {
-         if (!XmlConstructs.IsName ((char) PeekChar ()))
-             break;
-         DTDAttributeDefinition def = ReadAttributeDefinition ();
-         bool isNew = attList.AttributeDefinitions [def.Name] == null;
-         if (isNew)
-             attList.AttributeDefinitions.Add (def.Name, def);
-         SkipWhitespace ();
-         TryExpandPERef ();
-         SkipWhitespace ();
-     }
-     SkipWhitespace ();
-     Expect ('>');
-     return attList;
- }
- // Reads one attribute definition of an ATTLIST declaration: the
- // attribute name, its type (CDATA, ID/IDREF/IDREFS, ENTITY/ENTITIES,
- // NMTOKEN/NMTOKENS, NOTATION or an enumeration) and its default
- // declaration (#REQUIRED, #IMPLIED, #FIXED value, or a plain value).
- private DTDAttributeDefinition ReadAttributeDefinition ()
- {
- DTDAttributeDefinition def = new DTDAttributeDefinition ();
- // attr_name
- TryExpandPERef ();
- def.Name = ReadName ();
- SkipWhitespace ();
- // attr_value
- TryExpandPERef ();
- // The type keyword is recognised by its first character.
- switch(PeekChar ()) {
- case 'C': // CDATA
- Expect ("CDATA");
- def.AttributeType = DTDAttributeType.CData;
- break;
- case 'I': // ID, IDREF, IDREFS
- Expect ("ID");
- if(PeekChar () == 'R') {
- Expect ("REF");
- if(PeekChar () == 'S') {
- // IDREFS
- ReadChar ();
- def.AttributeType = DTDAttributeType.IdRefs;
- }
- else // IDREF
- def.AttributeType = DTDAttributeType.IdRef;
- }
- else // ID
- def.AttributeType = DTDAttributeType.Id;
- break;
- case 'E': // ENTITY, ENTITIES
- Expect ("ENTIT");
- switch(ReadChar ()) {
- case 'Y': // ENTITY
- def.AttributeType = DTDAttributeType.Entity;
- break;
- case 'I': // ENTITIES
- Expect ("ES");
- def.AttributeType = DTDAttributeType.Entities;
- break;
- }
- break;
- case 'N': // NMTOKEN, NMTOKENS, NOTATION
- ReadChar ();
- switch(PeekChar ()) {
- case 'M':
- Expect ("MTOKEN");
- if(PeekChar ()=='S') { // NMTOKENS
- ReadChar ();
- def.AttributeType = DTDAttributeType.NmTokens;
- }
- else // NMTOKEN
- def.AttributeType = DTDAttributeType.NmToken;
- break;
- case 'O':
- Expect ("OTATION");
- def.AttributeType = DTDAttributeType.Notation;
- SkipWhitespace ();
- // "(name | name ...)" list of notation names
- Expect ('(');
- SkipWhitespace ();
- def.EnumeratedNotations.Add (ReadName ()); // notation name
- SkipWhitespace ();
- while(PeekChar () == '|') {
- ReadChar ();
- SkipWhitespace ();
- def.EnumeratedNotations.Add (ReadName ()); // notation name
- SkipWhitespace ();
- }
- Expect (')');
- break;
- default:
- throw new XmlException ("attribute declaration syntax error.");
- }
- break;
- default: // Enumerated Values
- // "(token | token ...)"; AttributeType is not assigned on this path.
- TryExpandPERef ();
- Expect ('(');
- SkipWhitespace ();
- def.EnumeratedAttributeDeclaration.Add (ReadNmToken ()); // enum value
- SkipWhitespace ();
- while(PeekChar () == '|') {
- ReadChar ();
- SkipWhitespace ();
- def.EnumeratedAttributeDeclaration.Add (ReadNmToken ()); // enum value
- SkipWhitespace ();
- }
- Expect (')');
- break;
- }
- SkipWhitespace ();
- TryExpandPERef ();
- // def_value
- if(PeekChar () == '#')
- {
- ReadChar ();
- switch(PeekChar ())
- {
- case 'R':
- Expect ("REQUIRED");
- def.OccurenceType = DTDAttributeOccurenceType.Required;
- break;
- case 'I':
- Expect ("IMPLIED");
- def.OccurenceType = DTDAttributeOccurenceType.Optional;
- break;
- case 'F':
- Expect ("FIXED");
- def.OccurenceType = DTDAttributeOccurenceType.Fixed;
- SkipWhitespace ();
- // ReadAttribute keeps the surrounding quote characters.
- def.UnresolvedDefaultValue = ReadAttribute ();
- break;
- }
- } else {
- // one of the enumerated value
- // NOTE(review): presumably covers a pushed input that ended right
- // before the default value; confirm against the callers.
- if (PeekChar () == -1) {
- popParserInput ();
- }
- SkipWhitespace ();
- def.UnresolvedDefaultValue = ReadAttribute ();
- }
- return def;
- }
- // Reads a NOTATION declaration: the name (split into prefix and local
- // name when namespaces are enabled) followed by a PUBLIC id with an
- // optional system literal, or by a SYSTEM id. Throws XmlException when
- // neither id ends up set.
- private DTDNotationDeclaration ReadNotationDecl()
- {
-     DTDNotationDeclaration notation = new DTDNotationDeclaration ();
-     SkipWhitespace ();
-     notation.Name = ReadName (); // notation name
-     // Without namespace support the whole name is the local name.
-     int colon = namespaces ? notation.Name.IndexOf (':') : -1;
-     if (colon != -1) {
-         notation.Prefix = notation.Name.Substring (0, colon);
-         notation.LocalName = notation.Name.Substring (colon + 1);
-     } else {
-         notation.Prefix = String.Empty;
-         notation.LocalName = notation.Name;
-     }
-     SkipWhitespace ();
-     if (PeekChar () == 'P') {
-         notation.PublicId = ReadPubidLiteral ();
-         SkipWhitespace ();
-         bool hasSystemLiteral = PeekChar () == '\'' || PeekChar () == '"';
-         if (hasSystemLiteral) {
-             notation.SystemId = ReadSystemLiteral (false);
-             SkipWhitespace ();
-         }
-     } else if (PeekChar () == 'S') {
-         notation.SystemId = ReadSystemLiteral (true);
-         SkipWhitespace ();
-     }
-     bool hasNoId = notation.PublicId == null && notation.SystemId == null;
-     if (hasNoId)
-         throw new XmlException ("public or system declaration required for \"NOTATION\" declaration.");
-     Expect ('>');
-     return notation;
- }
// If the next character is '%', consumes it and, when a name character
// follows, expands the parameter-entity reference that starts there.
// Does nothing when the next character is not '%'.
// NOTE: a '%' that is not followed by a name character is still consumed.
private void TryExpandPERef ()
{
    if (PeekChar () != '%')
        return;

    ReadChar ();
    if (XmlConstructs.IsName (PeekChar ()))
        ExpandPERef ();
}
- // reader is positioned on the first letter of the name.
// Convenience overload: expands the parameter-entity reference at the
// current position with the attachSpace option switched on.
private void ExpandPERef ()
{
    bool attachSpace = true;
    ExpandPERef (attachSpace);
}
// Reads the entity name and the terminating ';' of a parameter-entity
// reference (the '%' must already have been consumed), then expands the
// named entity. attachSpace is forwarded unchanged to ExpandNamedPERef.
private void ExpandPERef (bool attachSpace)
{
    string entityName = ReadName ();
    Expect (';');
    ExpandNamedPERef (entityName, attachSpace);
}
// Looks up the parameter entity named peName and makes its content the
// next input the parser reads.
//   - An entity that has a SystemId is pushed as a new parser input.
//   - Otherwise its Value is inserted into the current input's
//     parameter-entity buffer: passed through Dereference and wrapped in
//     one space on each side when attachSpace is true, inserted as-is
//     when attachSpace is false.
// Leading whitespace of whatever input follows is skipped afterwards.
// Throws XmlException when the lookup does not yield a
// DTDParameterEntityDeclaration.
// NOTE: a '%' reference that follows is not expanded recursively here.
private void ExpandNamedPERef (string peName, bool attachSpace)
{
    DTDParameterEntityDeclaration entity =
        parameterEntities [peName] as DTDParameterEntityDeclaration;
    if (entity == null)
        throw new XmlException ("undeclared parameter entity: '" + peName + "'");

    if (entity.SystemId == null) {
        // internal entity: add buffer
        string replacement;
        if (attachSpace)
            replacement = " " + Dereference (entity.Value) + " ";
        else
            replacement = entity.Value;
        currentInput.InsertParameterEntityBuffer (replacement);
    } else {
        pushParserInput (entity.SystemId);
    }
    SkipWhitespace (); // is it ok?
}
// Reads an external identifier and stores the result in the attributes
// table under the keys "PUBLIC" and "SYSTEM".
//   'S' -> SYSTEM form: "PUBLIC" is set to null, "SYSTEM" to the literal.
//   'P' -> PUBLIC form: the public id, whitespace, then a system literal
//          that carries no keyword of its own.
// Any other leading character leaves the table untouched.
private void ReadExternalID() {
    int keyword = PeekChar ();
    if (keyword == 'S') {
        attributes ["PUBLIC"] = null;
        attributes ["SYSTEM"] = ReadSystemLiteral (true);
    } else if (keyword == 'P') {
        attributes ["PUBLIC"] = ReadPubidLiteral ();
        SkipWhitespace ();
        attributes ["SYSTEM"] = ReadSystemLiteral (false);
    }
}
- // The reader is positioned on the first 'S' of "SYSTEM".
// Reads a quoted system literal and returns the text between the quotes.
//
// expectSYSTEM: when true, the keyword "SYSTEM" is consumed first; when
//               false, the reader is expected to be at (optional
//               whitespace before) the opening quote.
//
// The literal must be delimited by a matching pair of ' or " characters.
// Throws (via ReaderError) when the stream ends before the closing quote
// or when the first character is not a quote. Previously any character
// was accepted as the "quote", so malformed input such as
// SYSTEM foo.dtd> was silently mis-read up to the next matching letter.
private string ReadSystemLiteral (bool expectSYSTEM)
{
    if (expectSYSTEM)
        Expect ("SYSTEM");
    SkipWhitespace ();

    int quoteChar = ReadChar (); // apos or quot
    if (quoteChar < 0)
        throw ReaderError ("Unexpected end of stream in ExternalID.");
    if (quoteChar != '\'' && quoteChar != '"')
        throw ReaderError ("expected a quoted system literal but found '" + (char) quoteChar + "'");

    // The literal is sliced out of currentTag afterwards; this relies on
    // ReadChar recording every consumed character there (presumably so;
    // confirm against ReadChar).
    int startPos = currentTag.Length;
    int c = 0;
    while (c != quoteChar) {
        c = ReadChar ();
        if (c < 0)
            throw ReaderError ("Unexpected end of stream in ExternalID.");
    }
    // "- 1" drops the closing quote that was just consumed.
    return currentTag.ToString (startPos, currentTag.Length - 1 - startPos);
}
// Consumes the keyword "PUBLIC", optional whitespace and a quoted public
// identifier literal, and returns the text between the quotes.
//
// The literal must be delimited by a matching pair of ' or " characters
// and every character inside must satisfy XmlConstructs.IsPubid.
// Throws (via ReaderError) on end of stream, on a character that is not
// allowed in a public id, or when the first character is not a quote.
// Previously any character was accepted as the "quote", so an unquoted
// identifier was silently mis-read up to the next matching character.
private string ReadPubidLiteral()
{
    Expect ("PUBLIC");
    SkipWhitespace ();

    int quoteChar = ReadChar ();
    if (quoteChar < 0)
        throw ReaderError ("Unexpected end of stream in ExternalID.");
    if (quoteChar != '\'' && quoteChar != '"')
        throw ReaderError ("expected a quoted public identifier but found '" + (char) quoteChar + "'");

    // The literal is sliced out of currentTag afterwards; this relies on
    // ReadChar recording every consumed character there (presumably so;
    // confirm against ReadChar).
    int startPos = currentTag.Length;
    int c = 0;
    while (c != quoteChar) {
        c = ReadChar ();
        if (c < 0)
            throw ReaderError ("Unexpected end of stream in ExternalID.");
        if (c != quoteChar && !XmlConstructs.IsPubid (c))
            throw ReaderError ("character '" + (char) c + "' not allowed for PUBLIC ID");
    }
    // "- 1" drops the closing quote that was just consumed.
    return currentTag.ToString (startPos, currentTag.Length - 1 - startPos);
}
- // The reader is positioned on the first character
- // of the name.
// Reads an XML Name: the first character is checked with
// XmlConstructs.IsNameStart, the following ones with XmlConstructs.IsName.
internal string ReadName ()
{
    bool isNameToken = false;
    return ReadNameOrNmToken (isNameToken);
}
- // The reader is positioned on the first character
- // of the name.
// Reads an XML name token: unlike ReadName, the first character only has
// to satisfy XmlConstructs.IsName, the same test as every later character.
private string ReadNmToken ()
{
    bool isNameToken = true;
    return ReadNameOrNmToken (isNameToken);
}
// Shared implementation of ReadName and ReadNmToken.
//
// isNameToken: true  -> the first character must satisfy IsName
//              false -> the first character must satisfy IsNameStart
// In both cases the remaining characters are consumed for as long as
// XmlConstructs.IsName accepts them. Returns the collected string.
//
// Throws (via ReaderError) when the first character is not legal or when
// the input is already at end of stream. The error now says which kind
// of token was being read and reports end of stream explicitly, instead
// of formatting -1 as a character.
private string ReadNameOrNmToken(bool isNameToken)
{
    int ch = PeekChar ();
    if (ch < 0)
        throw ReaderError (isNameToken
            ? "Unexpected end of stream while reading a name token."
            : "Unexpected end of stream while reading a name.");

    bool legalStart = isNameToken
        ? XmlConstructs.IsName ((char) ch)
        : XmlConstructs.IsNameStart ((char) ch);
    if (!legalStart) {
        string kind = isNameToken ? "a name token" : "a name";
        throw ReaderError (String.Format ("{0} did not start with a legal character {1} ({2})", kind, ch, (char) ch));
    }

    // Restart the shared name buffer, then collect the validated first
    // character and every name character that follows it.
    nameLength = 0;
    AppendNameChar (ReadChar ());
    while (XmlConstructs.IsName (PeekChar ())) {
        AppendNameChar (ReadChar ());
    }
    return CreateNameString ();
}
- // Read the next character and compare it against the
- // specified character.
// Consumes one character and verifies that it equals 'expected'.
// Throws (via ReaderError) with both characters and their hexadecimal
// codes in the message when they differ. The character is consumed even
// when the check fails.
private void Expect (int expected)
{
    int actual = ReadChar ();
    if (actual == expected)
        return;

    string message = String.Format (
        "expected '{0}' ({1:X}) but found '{2}' ({3:X})",
        (char) expected,
        expected,
        (char) actual,
        actual);
    throw ReaderError (message);
}
// Consumes expected.Length characters and verifies, one by one and in
// order, that they spell out 'expected'. The first mismatch raises the
// error produced by the single-character Expect.
private void Expect (string expected)
{
    foreach (char wanted in expected)
        Expect (wanted);
}
- // Does not consume the first non-whitespace character.
// Consumes a run of whitespace characters (as judged by
// XmlConstructs.IsSpace) and stops in front of the first character that
// is not whitespace. Returns true when at least one character was skipped.
private bool SkipWhitespace ()
{
    //FIXME: Should not skip if whitespaceHandling == WhiteSpaceHandling.None
    bool skippedAny = false;
    while (XmlConstructs.IsSpace (PeekChar ())) {
        ReadChar ();
        skippedAny = true;
    }
    return skippedAny;
}
// Collects a run of whitespace into the value buffer. The first character
// is consumed unconditionally; further characters are consumed while
// they are whitespace.
//   - If the run is followed by anything other than '<' or end of input,
//     reading continues via ReadText (false).
//   - Otherwise the node is published as XmlNodeType.Whitespace with the
//     collected text as its value.
// Returns true while more input remains after the node.
private bool ReadWhitespace ()
{
    valueLength = 0;

    int next;
    do {
        AppendValueChar (ReadChar ());
        next = PeekChar ();
    } while (next != -1 && XmlConstructs.IsSpace (next));

    bool followedByText = next != -1 && next != '<';
    if (followedByText) {
        ReadText (false);
    } else {
        string whitespace = CreateValueString ();
        SetProperties (XmlNodeType.Whitespace,
            String.Empty,
            false,
            whitespace,
            true);
    }

    return PeekChar () != -1;
}
- // read entity reference from attribute string and if parsable then return the value.
// Resolves the reference that starts at attributeString [attributeValuePos]
// (expected to be the '&') and advances attributeValuePos past the
// terminating ';'.
//
// Returns:
//   - the referenced character(s) for a numeric character reference
//     ("&#NN;" decimal or "&#xHH;" hexadecimal); code points above U+FFFF
//     are returned as a UTF-16 surrogate pair instead of being truncated
//     to a single char;
//   - the literal character for the five predefined entities;
//   - null for any other name (including an empty name or a bare "#"),
//     which previously raised IndexOutOfRangeException.
//
// Throws XmlException when no ';' follows the reference (previously an
// ArgumentOutOfRangeException escaped from Substring). A malformed
// number still raises the exception thrown by int.Parse.
private string ReadAttributeValueReference ()
{
    int endEntityPosition = attributeString.IndexOf (';', attributeValuePos);
    if (endEntityPosition < 0)
        throw new XmlException ("entity reference in attribute value is not terminated by ';'.");

    string entityName = attributeString.Substring (attributeValuePos + 1,
        endEntityPosition - attributeValuePos - 1);
    attributeValuePos = endEntityPosition + 1;

    if (entityName.Length > 1 && entityName [0] == '#') {
        // character entity
        int codePoint;
        if (entityName [1] == 'x') {
            // hexadecimal
            codePoint = int.Parse ("0" + entityName.Substring (2),
                System.Globalization.NumberStyles.HexNumber,
                System.Globalization.CultureInfo.InvariantCulture);
        } else {
            // decimal
            codePoint = int.Parse (entityName.Substring (1),
                System.Globalization.CultureInfo.InvariantCulture);
        }

        if (codePoint > 0xFFFF && codePoint <= 0x10FFFF) {
            // Supplementary plane: encode as high + low surrogate.
            int offset = codePoint - 0x10000;
            char high = (char) (0xD800 + (offset >> 10));
            char low = (char) (0xDC00 + (offset & 0x3FF));
            return new string (new char [] { high, low });
        }
        return ((char) codePoint).ToString ();
    }

    switch (entityName) {
    case "lt": return "<";
    case "gt": return ">";
    case "amp": return "&";
    case "quot": return "\"";
    case "apos": return "'";
    default: return null;
    }
}
// Turns a raw, still-quoted attribute value into its resolved text:
// the first and last characters (the quotation marks) are removed and
// the remainder is passed through Dereference. A null input yields null.
private string UnescapeAttributeValue (string unresolved)
{
    if (unresolved != null) {
        // trim start/end edge of quotation character.
        int innerLength = unresolved.Length - 2;
        string inner = unresolved.Substring (1, innerLength);
        return Dereference (inner);
    }
    return null;
}
// Replaces character references and the five predefined entity references
// in 'unresolved' with the characters they stand for and returns the
// result. The input is returned unchanged when it contains no '&'.
//
//   "&#NN;" / "&#xHH;"  -> the referenced character; code points above
//                          U+FFFF become a UTF-16 surrogate pair instead
//                          of being truncated to one char.
//   lt, gt, amp, quot, apos -> the literal character.
//   any other name      -> left in place as "&name;". This includes an
//                          empty name and a bare "#", which previously
//                          raised IndexOutOfRangeException.
//   '&' without ';'     -> the rest of the string is copied verbatim
//                          (previously ArgumentOutOfRangeException).
//
// A malformed number still raises the exception thrown by int.Parse.
private string Dereference (string unresolved)
{
    int next = unresolved.IndexOf ('&');
    if (next < 0)
        return unresolved;

    StringBuilder resolved = new StringBuilder (unresolved.Length);
    int pos = 0; // start of the text not yet copied to 'resolved'
    while (next >= 0) {
        int endPos = unresolved.IndexOf (';', next + 1);
        if (endPos < 0)
            break; // unterminated reference: tail is appended as-is below

        // literal text between the previous reference and this one
        resolved.Append (unresolved, pos, next - pos);

        string entityName = unresolved.Substring (next + 1, endPos - next - 1);
        if (entityName.Length > 1 && entityName [0] == '#') {
            // character entity
            int codePoint;
            if (entityName [1] == 'x') {
                // hexadecimal
                codePoint = int.Parse ("0" + entityName.Substring (2),
                    System.Globalization.NumberStyles.HexNumber,
                    System.Globalization.CultureInfo.InvariantCulture);
            } else {
                // decimal
                codePoint = int.Parse (entityName.Substring (1),
                    System.Globalization.CultureInfo.InvariantCulture);
            }

            if (codePoint > 0xFFFF && codePoint <= 0x10FFFF) {
                // Supplementary plane: encode as high + low surrogate.
                int offset = codePoint - 0x10000;
                resolved.Append ((char) (0xD800 + (offset >> 10)));
                resolved.Append ((char) (0xDC00 + (offset & 0x3FF)));
            } else {
                resolved.Append ((char) codePoint);
            }
        } else {
            switch (entityName) {
            case "lt": resolved.Append ("<"); break;
            case "gt": resolved.Append (">"); break;
            case "amp": resolved.Append ("&"); break;
            case "quot": resolved.Append ("\""); break;
            case "apos": resolved.Append ("'"); break;
            // With respect to "Value", MS document is helpless
            // and the implementation returns inconsistent value
            // (e.g. XML: "&ent; &ent;" ---> Value: "&ent; &ent;".)
            default: resolved.Append ("&" + entityName + ";"); break;
            }
        }

        pos = endPos + 1;
        next = unresolved.IndexOf ('&', pos);
    }

    // whatever follows the last resolved reference
    resolved.Append (unresolved, pos, unresolved.Length - pos);
    return resolved.ToString ();
}
- #endregion
- }
- }
|