AngleSharp by Florian Rappl

<PackageReference Include="AngleSharp" Version="0.9.0" />

 HtmlDomBuilder

sealed class HtmlDomBuilder
Represents the Tree construction as specified in 8.2.5 Tree construction, on the following page: http://www.w3.org/html/wg/drafts/html/master/syntax.html
using AngleSharp.Dom; using AngleSharp.Dom.Html; using AngleSharp.Dom.Mathml; using AngleSharp.Dom.Svg; using AngleSharp.Extensions; using AngleSharp.Html; using AngleSharp.Network; using System; using System.Collections.Generic; using System.Diagnostics; using System.Text; using System.Threading; using System.Threading.Tasks; namespace AngleSharp.Parser.Html { [DebuggerStepThrough] internal sealed class HtmlDomBuilder { private readonly HtmlTokenizer _tokenizer; private readonly HtmlDocument _document; private readonly List<Element> _openElements; private readonly List<Element> _formattingElements; private readonly Stack<HtmlTreeMode> _templateModes; private HtmlFormElement _currentFormElement; private HtmlTreeMode _currentMode; private HtmlTreeMode _previousMode; private HtmlParserOptions _options; private Element _fragmentContext; private bool _foster; private bool _frameset; private Task _waiting; public bool IsFragmentCase => _fragmentContext != null; public Element AdjustedCurrentNode { get { if (_fragmentContext == null || _openElements.Count != 1) return CurrentNode; return _fragmentContext; } } public Element CurrentNode { get { if (_openElements.Count <= 0) return null; return _openElements[_openElements.Count - 1]; } } internal HtmlDomBuilder(HtmlDocument document) { _tokenizer = new HtmlTokenizer(document.Source, document.Options.Events); _document = document; _openElements = new List<Element>(); _templateModes = new Stack<HtmlTreeMode>(); _formattingElements = new List<Element>(); _frameset = true; _currentMode = HtmlTreeMode.Initial; } public async Task<HtmlDocument> ParseAsync(HtmlParserOptions options, CancellationToken cancelToken) { TextSource source = _document.Source; _options = options; HtmlToken token; do { if (source.Length - source.Index < 1024) await source.Prefetch(8192, cancelToken).ConfigureAwait(false); token = _tokenizer.Get(); Consume(token); if (_waiting != null) { await _waiting.ConfigureAwait(false); _waiting = null; } } while (token.Type != HtmlTokenType.EndOfFile); return _document; } public HtmlDocument Parse(HtmlParserOptions options) { HtmlToken htmlToken = null; _options = options; do { htmlToken = _tokenizer.Get(); Consume(htmlToken); if (_waiting != null) { _waiting.Wait(); _waiting = null; } } while (htmlToken.Type != HtmlTokenType.EndOfFile); return _document; } public HtmlDocument ParseFragment(HtmlParserOptions options, Element context) { if (context == null) throw new ArgumentNullException("context"); string localName = context.LocalName; if (localName.IsOneOf(Tags.Title, Tags.Textarea)) _tokenizer.State = HtmlParseMode.RCData; else if (localName.IsOneOf(Tags.Style, Tags.Xmp, Tags.Iframe, Tags.NoEmbed, Tags.NoFrames)) { _tokenizer.State = HtmlParseMode.Rawtext; } else if (localName.Is(Tags.Script)) { _tokenizer.State = HtmlParseMode.Script; } else if (localName.Is(Tags.Plaintext)) { _tokenizer.State = HtmlParseMode.Plaintext; } else if (localName.Is(Tags.NoScript) && options.IsScripting) { _tokenizer.State = HtmlParseMode.Rawtext; } HtmlHtmlElement htmlHtmlElement = new HtmlHtmlElement(_document, null); _document.AddNode(htmlHtmlElement); _openElements.Add(htmlHtmlElement); if (context is HtmlTemplateElement) _templateModes.Push(HtmlTreeMode.InTemplate); Reset(context); _fragmentContext = context; _tokenizer.IsAcceptingCharacterData = !AdjustedCurrentNode.Flags.HasFlag(NodeFlags.HtmlMember); do { if (context is HtmlFormElement) { _currentFormElement = (HtmlFormElement)context; break; } context = (context.ParentElement as Element); } while (context != null); return Parse(options); } private void Restart() { _currentMode = HtmlTreeMode.Initial; _tokenizer.State = HtmlParseMode.PCData; _document.ReplaceAll(null, true); _frameset = true; _openElements.Clear(); _formattingElements.Clear(); _templateModes.Clear(); } private void Reset(Element context = null) { bool flag = false; Element element = null; int num = _openElements.Count - 1; while (true) { if (num < 0) return; element = _openElements[num]; if (num == 0) { flag = true; element = (context ?? element); } string localName = element.LocalName; if (localName.Is(Tags.Select)) { _currentMode = HtmlTreeMode.InSelect; return; } if (Tags.AllTableCells.Contains(localName)) { _currentMode = (flag ? HtmlTreeMode.InBody : HtmlTreeMode.InCell); return; } if (localName.Is(Tags.Tr)) { _currentMode = HtmlTreeMode.InRow; return; } if (Tags.AllTableSections.Contains(localName)) { _currentMode = HtmlTreeMode.InTableBody; return; } if (localName.Is(Tags.Body)) { _currentMode = HtmlTreeMode.InBody; return; } if (localName.Is(Tags.Table)) { _currentMode = HtmlTreeMode.InTable; return; } if (localName.Is(Tags.Caption)) { _currentMode = HtmlTreeMode.InCaption; return; } if (localName.Is(Tags.Colgroup)) { _currentMode = HtmlTreeMode.InColumnGroup; return; } if (localName.Is(Tags.Template)) { _currentMode = _templateModes.Peek(); return; } if (localName.Is(Tags.Html)) { _currentMode = HtmlTreeMode.BeforeHead; return; } if (localName.Is(Tags.Head)) { _currentMode = (flag ? HtmlTreeMode.InBody : HtmlTreeMode.InHead); return; } if (localName.Is(Tags.Frameset)) { _currentMode = HtmlTreeMode.InFrameset; return; } if (flag) break; num--; } _currentMode = HtmlTreeMode.InBody; } private void Consume(HtmlToken token) { Element adjustedCurrentNode = AdjustedCurrentNode; if (adjustedCurrentNode == null || token.Type == HtmlTokenType.EndOfFile || adjustedCurrentNode.Flags.HasFlag(NodeFlags.HtmlMember) || (adjustedCurrentNode.Flags.HasFlag(NodeFlags.HtmlTip) && token.IsHtmlCompatible) || (adjustedCurrentNode.Flags.HasFlag(NodeFlags.MathTip) && token.IsMathCompatible) || (adjustedCurrentNode.Flags.HasFlag(NodeFlags.MathMember) && token.IsSvg && adjustedCurrentNode.LocalName.Is(Tags.AnnotationXml))) Home(token); else Foreign(token); } private void Home(HtmlToken token) { switch (_currentMode) { case HtmlTreeMode.Initial: Initial(token); break; case HtmlTreeMode.BeforeHtml: BeforeHtml(token); break; case HtmlTreeMode.BeforeHead: BeforeHead(token); break; case HtmlTreeMode.InHead: InHead(token); break; case HtmlTreeMode.InHeadNoScript: InHeadNoScript(token); break; case HtmlTreeMode.AfterHead: AfterHead(token); break; case HtmlTreeMode.InBody: InBody(token); break; case HtmlTreeMode.Text: Text(token); break; case HtmlTreeMode.InTable: InTable(token); break; case HtmlTreeMode.InCaption: InCaption(token); break; case HtmlTreeMode.InColumnGroup: InColumnGroup(token); break; case HtmlTreeMode.InTableBody: InTableBody(token); break; case HtmlTreeMode.InRow: InRow(token); break; case HtmlTreeMode.InCell: InCell(token); break; case HtmlTreeMode.InSelect: InSelect(token); break; case HtmlTreeMode.InSelectInTable: InSelectInTable(token); break; case HtmlTreeMode.InTemplate: InTemplate(token); break; case HtmlTreeMode.AfterBody: AfterBody(token); break; case HtmlTreeMode.InFrameset: InFrameset(token); break; case HtmlTreeMode.AfterFrameset: AfterFrameset(token); break; case HtmlTreeMode.AfterAfterBody: AfterAfterBody(token); break; case HtmlTreeMode.AfterAfterFrameset: AfterAfterFrameset(token); break; } } private void Initial(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Doctype: { HtmlDoctypeToken htmlDoctypeToken = (HtmlDoctypeToken)token; if (!htmlDoctypeToken.IsValid) RaiseErrorOccurred(HtmlParseError.DoctypeInvalid, token); _document.AddNode(new DocumentType(_document, htmlDoctypeToken.Name ?? string.Empty) { SystemIdentifier = htmlDoctypeToken.SystemIdentifier, PublicIdentifier = htmlDoctypeToken.PublicIdentifier }); if (htmlDoctypeToken.IsFullQuirks) _document.QuirksMode = QuirksMode.On; else if (htmlDoctypeToken.IsLimitedQuirks) { _document.QuirksMode = QuirksMode.Limited; } _currentMode = HtmlTreeMode.BeforeHtml; return; } case HtmlTokenType.Character: token.TrimStart(); if (token.IsEmpty) return; break; case HtmlTokenType.Comment: _document.AddComment(token); return; } if (!_options.IsEmbedded) { RaiseErrorOccurred(HtmlParseError.DoctypeMissing, token); _document.QuirksMode = QuirksMode.On; } _currentMode = HtmlTreeMode.BeforeHtml; BeforeHtml(token); } private void BeforeHtml(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: token.TrimStart(); if (token.IsEmpty) return; break; case HtmlTokenType.Comment: _document.AddComment(token); return; case HtmlTokenType.StartTag: if (token.Name.Is(Tags.Html)) { AddRoot(token.AsTag()); _currentMode = HtmlTreeMode.BeforeHead; return; } break; case HtmlTokenType.EndTag: if (!Tags.AllBeforeHead.Contains(token.Name)) { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); return; } break; case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); return; } BeforeHtml(HtmlTagToken.Open(Tags.Html)); BeforeHead(token); } private void BeforeHead(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: token.TrimStart(); if (token.IsEmpty) return; break; case HtmlTokenType.StartTag: { string name = token.Name; if (name.Is(Tags.Html)) { InBody(token); return; } if (name.Is(Tags.Head)) { AddElement(new HtmlHeadElement(_document, null), token.AsTag(), false); _currentMode = HtmlTreeMode.InHead; return; } break; } case HtmlTokenType.EndTag: if (!Tags.AllBeforeHead.Contains(token.Name)) { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); return; } break; case HtmlTokenType.Comment: CurrentNode.AddComment(token); return; case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); return; } BeforeHead(HtmlTagToken.Open(Tags.Head)); InHead(token); } private void InHead(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: { string text = token.TrimStart(); AddCharacters(text); if (token.IsEmpty) return; break; } case HtmlTokenType.Comment: CurrentNode.AddComment(token); return; case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); return; case HtmlTokenType.StartTag: { string name2 = token.Name; if (name2.Is(Tags.Html)) { InBody(token); return; } if (name2.Is(Tags.Meta)) { HtmlMetaElement htmlMetaElement = new HtmlMetaElement(_document, null); AddElement(htmlMetaElement, token.AsTag(), true); Encoding encoding = htmlMetaElement.GetEncoding(); CloseCurrentNode(); if (encoding != null) try { _document.Source.CurrentEncoding = encoding; } catch (NotSupportedException) { Restart(); } return; } if (Tags.AllHeadBase.Contains(name2)) { AddElement(token.AsTag(), true); CloseCurrentNode(); return; } if (name2.Is(Tags.Title)) { RCDataAlgorithm(token.AsTag()); return; } if (name2.IsOneOf(Tags.Style, Tags.NoFrames) || (_options.IsScripting && name2.Is(Tags.NoScript))) { RawtextAlgorithm(token.AsTag()); return; } if (name2.Is(Tags.NoScript)) { AddElement(token.AsTag(), false); _currentMode = HtmlTreeMode.InHeadNoScript; return; } if (name2.Is(Tags.Script)) { HtmlScriptElement htmlScriptElement = new HtmlScriptElement(_document, null); AddElement(htmlScriptElement, token.AsTag(), false); htmlScriptElement.SetStarted(IsFragmentCase); _tokenizer.State = HtmlParseMode.Script; _previousMode = _currentMode; _currentMode = HtmlTreeMode.Text; return; } if (name2.Is(Tags.Head)) { RaiseErrorOccurred(HtmlParseError.HeadTagMisplaced, token); return; } if (name2.Is(Tags.Template)) { AddElement(new HtmlTemplateElement(_document, null), token.AsTag(), false); _formattingElements.AddScopeMarker(); _frameset = false; _currentMode = HtmlTreeMode.InTemplate; _templateModes.Push(HtmlTreeMode.InTemplate); return; } break; } case HtmlTokenType.EndTag: { string name = token.Name; if (name.Is(Tags.Head)) { CloseCurrentNode(); _currentMode = HtmlTreeMode.AfterHead; _waiting = _document.WaitForReady(); return; } if (name.Is(Tags.Template)) { if (TagCurrentlyOpen(Tags.Template)) { GenerateImpliedEndTags(); if (!CurrentNode.LocalName.Is(Tags.Template)) RaiseErrorOccurred(HtmlParseError.TagClosingMismatch, token); CloseTemplate(); } else RaiseErrorOccurred(HtmlParseError.TagInappropriate, token); return; } if (!name.IsOneOf(Tags.Html, Tags.Body, Tags.Br)) { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); return; } break; } } CloseCurrentNode(); _currentMode = HtmlTreeMode.AfterHead; AfterHead(token); } private void InHeadNoScript(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: { string text = token.TrimStart(); AddCharacters(text); if (token.IsEmpty) return; break; } case HtmlTokenType.Comment: InHead(token); return; case HtmlTokenType.StartTag: { string name2 = token.Name; if (Tags.AllNoScript.Contains(name2)) { InHead(token); return; } if (name2.Is(Tags.Html)) { InBody(token); return; } if (name2.IsOneOf(Tags.Head, Tags.NoScript)) { RaiseErrorOccurred(HtmlParseError.TagInappropriate, token); return; } break; } case HtmlTokenType.EndTag: { string name = token.Name; if (name.Is(Tags.NoScript)) { CloseCurrentNode(); _currentMode = HtmlTreeMode.InHead; return; } if (!name.Is(Tags.Br)) { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); return; } break; } case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); return; } RaiseErrorOccurred(HtmlParseError.TokenNotPossible, token); CloseCurrentNode(); _currentMode = HtmlTreeMode.InHead; InHead(token); } private void AfterHead(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: { string text = token.TrimStart(); AddCharacters(text); if (token.IsEmpty) return; break; } case HtmlTokenType.Comment: CurrentNode.AddComment(token); return; case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); return; case HtmlTokenType.StartTag: { string name = token.Name; if (name.Is(Tags.Html)) { InBody(token); return; } if (name.Is(Tags.Body)) { AfterHeadStartTagBody(token.AsTag()); return; } if (name.Is(Tags.Frameset)) { AddElement(new HtmlFrameSetElement(_document, null), token.AsTag(), false); _currentMode = HtmlTreeMode.InFrameset; return; } if (Tags.AllHeadNoTemplate.Contains(name)) { RaiseErrorOccurred(HtmlParseError.TagMustBeInHead, token); int count = _openElements.Count; Element item = _document.Head as Element; _openElements.Add(item); InHead(token); _openElements.Remove(item); return; } if (name.Is(Tags.Head)) { RaiseErrorOccurred(HtmlParseError.HeadTagMisplaced, token); return; } break; } case HtmlTokenType.EndTag: if (!token.Name.IsOneOf(Tags.Html, Tags.Body, Tags.Br)) { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); return; } break; } AfterHeadStartTagBody(HtmlTagToken.Open(Tags.Body)); _frameset = true; Home(token); } private void InBodyStartTag(HtmlTagToken tag) { string name = tag.Name; if (name.Is(Tags.Div)) { if (IsInButtonScope()) InBodyEndTagParagraph(tag); AddElement(tag, false); } else if (name.Is(Tags.A)) { for (int num = _formattingElements.Count - 1; num >= 0; num--) { if (_formattingElements[num] == null) break; if (_formattingElements[num].LocalName.Is(Tags.A)) { Element item = _formattingElements[num]; RaiseErrorOccurred(HtmlParseError.AnchorNested, tag); HeisenbergAlgorithm(HtmlTagToken.Close(Tags.A)); _openElements.Remove(item); _formattingElements.Remove(item); break; } } ReconstructFormatting(); HtmlAnchorElement element = new HtmlAnchorElement(_document, null); AddElement(element, tag, false); _formattingElements.AddFormatting(element); } else if (name.Is(Tags.Span)) { ReconstructFormatting(); AddElement(tag, false); } else if (name.Is(Tags.Li)) { InBodyStartTagListItem(tag); } else if (name.Is(Tags.Img)) { InBodyStartTagBreakrow(tag); } else if (name.IsOneOf(Tags.Ul, Tags.P)) { if (IsInButtonScope()) InBodyEndTagParagraph(tag); AddElement(tag, false); } else if (Tags.AllSemanticFormatting.Contains(name)) { ReconstructFormatting(); _formattingElements.AddFormatting(AddElement(tag, false)); } else if (name.Is(Tags.Script)) { InHead(tag); } else if (Tags.AllHeadings.Contains(name)) { if (IsInButtonScope()) InBodyEndTagParagraph(tag); if (Tags.AllHeadings.Contains(CurrentNode.LocalName)) { RaiseErrorOccurred(HtmlParseError.HeadingNested, tag); CloseCurrentNode(); } AddElement(new HtmlHeadingElement(_document, name, null), tag, false); } else if (name.Is(Tags.Input)) { ReconstructFormatting(); AddElement(new HtmlInputElement(_document, null), tag, true); CloseCurrentNode(); if (!tag.GetAttribute(AttributeNames.Type).Isi(AttributeNames.Hidden)) _frameset = false; } else if (name.Is(Tags.Form)) { if (_currentFormElement == null) { if (IsInButtonScope()) InBodyEndTagParagraph(tag); _currentFormElement = new HtmlFormElement(_document, null); AddElement(_currentFormElement, tag, false); } else RaiseErrorOccurred(HtmlParseError.FormAlreadyOpen, tag); } else if (Tags.AllBody.Contains(name)) { if (IsInButtonScope()) InBodyEndTagParagraph(tag); AddElement(tag, false); } else if (Tags.AllClassicFormatting.Contains(name)) { ReconstructFormatting(); _formattingElements.AddFormatting(AddElement(tag, false)); } else if (Tags.AllHead.Contains(name)) { InHead(tag); } else if (name.IsOneOf(Tags.Pre, Tags.Listing)) { if (IsInButtonScope()) InBodyEndTagParagraph(tag); AddElement(tag, false); _frameset = false; PreventNewLine(); } else if (name.Is(Tags.Button)) { if (IsInScope(Tags.Button)) { RaiseErrorOccurred(HtmlParseError.ButtonInScope, tag); InBodyEndTagBlock(tag); InBody(tag); } else { ReconstructFormatting(); AddElement(new HtmlButtonElement(_document, null), tag, false); _frameset = false; } } else if (name.Is(Tags.Table)) { if (_document.QuirksMode != QuirksMode.On && IsInButtonScope()) InBodyEndTagParagraph(tag); AddElement(new HtmlTableElement(_document, null), tag, false); _frameset = false; _currentMode = HtmlTreeMode.InTable; } else if (Tags.AllBodyBreakrow.Contains(name)) { InBodyStartTagBreakrow(tag); } else if (Tags.AllBodyClosed.Contains(name)) { AddElement(tag, true); CloseCurrentNode(); } else if (name.Is(Tags.Hr)) { if (IsInButtonScope()) InBodyEndTagParagraph(tag); AddElement(new HtmlHrElement(_document, null), tag, true); CloseCurrentNode(); _frameset = false; } else if (name.Is(Tags.Textarea)) { AddElement(new HtmlTextAreaElement(_document, null), tag, false); _tokenizer.State = HtmlParseMode.RCData; _previousMode = _currentMode; _frameset = false; _currentMode = HtmlTreeMode.Text; PreventNewLine(); } else if (name.Is(Tags.Select)) { ReconstructFormatting(); AddElement(new HtmlSelectElement(_document, null), tag, false); _frameset = false; switch (_currentMode) { case HtmlTreeMode.InTable: case HtmlTreeMode.InCaption: case HtmlTreeMode.InTableBody: case HtmlTreeMode.InRow: case HtmlTreeMode.InCell: _currentMode = HtmlTreeMode.InSelectInTable; break; default: _currentMode = HtmlTreeMode.InSelect; break; } } else if (name.IsOneOf(Tags.Optgroup, Tags.Option)) { if (CurrentNode.LocalName.Is(Tags.Option)) InBodyEndTagAnythingElse(HtmlTagToken.Close(Tags.Option)); ReconstructFormatting(); AddElement(tag, false); } else if (name.IsOneOf(Tags.Dd, Tags.Dt)) { InBodyStartTagDefinitionItem(tag); } else if (name.Is(Tags.Iframe)) { _frameset = false; RawtextAlgorithm(tag); } else if (Tags.AllBodyObsolete.Contains(name)) { ReconstructFormatting(); AddElement(tag, false); _formattingElements.AddScopeMarker(); _frameset = false; } else if (name.Is(Tags.Image)) { RaiseErrorOccurred(HtmlParseError.ImageTagNamedWrong, tag); tag.Name = Tags.Img; InBodyStartTagBreakrow(tag); } else if (name.Is(Tags.NoBr)) { ReconstructFormatting(); if (IsInScope(Tags.NoBr)) { RaiseErrorOccurred(HtmlParseError.NobrInScope, tag); HeisenbergAlgorithm(tag); ReconstructFormatting(); } _formattingElements.AddFormatting(AddElement(tag, false)); } else if (name.Is(Tags.Xmp)) { if (IsInButtonScope()) InBodyEndTagParagraph(tag); ReconstructFormatting(); _frameset = false; RawtextAlgorithm(tag); } else if (name.IsOneOf(Tags.Rb, Tags.Rtc)) { if (IsInScope(Tags.Ruby)) { GenerateImpliedEndTags(); if (!CurrentNode.LocalName.Is(Tags.Ruby)) RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, tag); } AddElement(tag, false); } else if (name.IsOneOf(Tags.Rp, Tags.Rt)) { if (IsInScope(Tags.Ruby)) { GenerateImpliedEndTagsExceptFor(Tags.Rtc); if (!CurrentNode.LocalName.IsOneOf(Tags.Ruby, Tags.Rtc)) RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, tag); } AddElement(tag, false); } else if (name.Is(Tags.NoEmbed)) { RawtextAlgorithm(tag); } else if (name.Is(Tags.NoScript)) { if (_options.IsScripting) RawtextAlgorithm(tag); else { ReconstructFormatting(); AddElement(tag, false); } } else if (name.Is(Tags.Math)) { MathElement mathElement = new MathElement(_document, name, null, NodeFlags.None); ReconstructFormatting(); for (int i = 0; i < tag.Attributes.Count; i++) { string key = tag.Attributes[i].Key; string value = tag.Attributes[i].Value; mathElement.AdjustAttribute(key.AdjustToMathAttribute(), value); } AddElement(mathElement); if (tag.IsSelfClosing) _openElements.Remove(mathElement); } else if (name.Is(Tags.Svg)) { SvgElement svgElement = new SvgElement(_document, name, null, NodeFlags.None); ReconstructFormatting(); for (int j = 0; j < tag.Attributes.Count; j++) { string key2 = tag.Attributes[j].Key; string value2 = tag.Attributes[j].Value; svgElement.AdjustAttribute(key2.AdjustToSvgAttribute(), value2); } AddElement(svgElement); if (tag.IsSelfClosing) _openElements.Remove(svgElement); } else if (name.Is(Tags.Plaintext)) { if (IsInButtonScope()) InBodyEndTagParagraph(tag); AddElement(tag, false); _tokenizer.State = HtmlParseMode.Plaintext; } else if (name.Is(Tags.Frameset)) { RaiseErrorOccurred(HtmlParseError.FramesetMisplaced, tag); if (_openElements.Count != 1 && _openElements[1].LocalName.Is(Tags.Body) && _frameset) { _openElements[1].RemoveFromParent(); while (_openElements.Count > 1) { CloseCurrentNode(); } AddElement(new HtmlFrameSetElement(_document, null), tag, false); _currentMode = HtmlTreeMode.InFrameset; } } else if (name.Is(Tags.Html)) { RaiseErrorOccurred(HtmlParseError.HtmlTagMisplaced, tag); if (_templateModes.Count == 0) _openElements[0].SetUniqueAttributes(tag.Attributes); } else if (name.Is(Tags.Body)) { RaiseErrorOccurred(HtmlParseError.BodyTagMisplaced, tag); if (_templateModes.Count == 0 && _openElements.Count > 1 && _openElements[1].LocalName.Is(Tags.Body)) { _frameset = false; _openElements[1].SetUniqueAttributes(tag.Attributes); } } else if (name.Is(Tags.IsIndex)) { RaiseErrorOccurred(HtmlParseError.TagInappropriate, tag); if (_currentFormElement == null) { InBody(HtmlTagToken.Open(Tags.Form)); if (tag.GetAttribute(AttributeNames.Action).Length > 0) _currentFormElement.SetAttribute(AttributeNames.Action, tag.GetAttribute(AttributeNames.Action)); InBody(HtmlTagToken.Open(Tags.Hr)); InBody(HtmlTagToken.Open(Tags.Label)); if (tag.GetAttribute(AttributeNames.Prompt).Length > 0) AddCharacters(tag.GetAttribute(AttributeNames.Prompt)); else AddCharacters("This is a searchable index. Enter search keywords: "); HtmlTagToken htmlTagToken = HtmlTagToken.Open(Tags.Input); htmlTagToken.AddAttribute(AttributeNames.Name, Tags.IsIndex); for (int k = 0; k < tag.Attributes.Count; k++) { if (!tag.Attributes[k].Key.IsOneOf(AttributeNames.Name, AttributeNames.Action, AttributeNames.Prompt)) htmlTagToken.AddAttribute(tag.Attributes[k].Key, tag.Attributes[k].Value); } InBody(htmlTagToken); InBody(HtmlTagToken.Close(Tags.Label)); InBody(HtmlTagToken.Open(Tags.Hr)); InBody(HtmlTagToken.Close(Tags.Form)); } } else if (Tags.AllNested.Contains(name)) { RaiseErrorOccurred(HtmlParseError.TagCannotStartHere, tag); } else { ReconstructFormatting(); AddElement(tag, false); } } private void InBodyEndTag(HtmlTagToken tag) { string name = tag.Name; if (name.Is(Tags.Div)) InBodyEndTagBlock(tag); else if (name.Is(Tags.A)) { HeisenbergAlgorithm(tag); } else if (name.Is(Tags.Li)) { if (IsInListItemScope()) { GenerateImpliedEndTagsExceptFor(name); if (!CurrentNode.LocalName.Is(Tags.Li)) RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, tag); ClearStackBackTo(Tags.Li); CloseCurrentNode(); } else RaiseErrorOccurred(HtmlParseError.ListItemNotInScope, tag); } else if (name.Is(Tags.P)) { InBodyEndTagParagraph(tag); } else if (Tags.AllBlocks.Contains(name)) { InBodyEndTagBlock(tag); } else if (Tags.AllFormatting.Contains(name)) { HeisenbergAlgorithm(tag); } else if (name.Is(Tags.Form)) { HtmlFormElement currentFormElement = _currentFormElement; _currentFormElement = null; if (currentFormElement != null && IsInScope(currentFormElement.LocalName)) { GenerateImpliedEndTags(); if (CurrentNode != currentFormElement) RaiseErrorOccurred(HtmlParseError.FormClosedWrong, tag); _openElements.Remove(currentFormElement); } else RaiseErrorOccurred(HtmlParseError.FormNotInScope, tag); } else if (name.Is(Tags.Br)) { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, tag); InBodyStartTagBreakrow(HtmlTagToken.Open(Tags.Br)); } else if (Tags.AllHeadings.Contains(name)) { if (IsInScope(Tags.AllHeadings)) { GenerateImpliedEndTags(); if (!CurrentNode.LocalName.Is(name)) RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, tag); ClearStackBackTo(Tags.AllHeadings); CloseCurrentNode(); } else RaiseErrorOccurred(HtmlParseError.HeadingNotInScope, tag); } else if (name.IsOneOf(Tags.Dd, Tags.Dt)) { if (IsInScope(name)) { GenerateImpliedEndTagsExceptFor(name); if (!CurrentNode.LocalName.Is(name)) RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, tag); ClearStackBackTo(name); CloseCurrentNode(); } else RaiseErrorOccurred(HtmlParseError.ListItemNotInScope, tag); } else if (name.IsOneOf(Tags.Applet, Tags.Marquee, Tags.Object)) { if (IsInScope(name)) { GenerateImpliedEndTags(); if (!CurrentNode.LocalName.Is(name)) RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, tag); ClearStackBackTo(name); CloseCurrentNode(); _formattingElements.ClearFormatting(); } else RaiseErrorOccurred(HtmlParseError.ObjectNotInScope, tag); } else if (name.Is(Tags.Body)) { InBodyEndTagBody(tag); } else if (name.Is(Tags.Html)) { if (InBodyEndTagBody(tag)) AfterBody(tag); } else if (name.Is(Tags.Template)) { InHead(tag); } else { InBodyEndTagAnythingElse(tag); } } private void InBody(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: ReconstructFormatting(); AddCharacters(token.Data); if (token.HasContent) _frameset = false; break; case HtmlTokenType.StartTag: InBodyStartTag(token.AsTag()); break; case HtmlTokenType.EndTag: InBodyEndTag(token.AsTag()); break; case HtmlTokenType.Comment: CurrentNode.AddComment(token); break; case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); break; case HtmlTokenType.EndOfFile: CheckBodyOnClosing(token); if (_templateModes.Count != 0) InTemplate(token); else End(); break; } } private void Text(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Comment: break; case HtmlTokenType.Character: AddCharacters(token.Data); break; case HtmlTokenType.EndTag: if (!token.Name.Is(Tags.Script)) { CloseCurrentNode(); _currentMode = _previousMode; } else HandleScript(CurrentNode as HtmlScriptElement); break; case HtmlTokenType.EndOfFile: RaiseErrorOccurred(HtmlParseError.EOF, token); CloseCurrentNode(); _currentMode = _previousMode; Consume(token); break; } } private void InTable(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Comment: CurrentNode.AddComment(token); return; case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); return; case HtmlTokenType.StartTag: { string name2 = token.Name; if (name2.Is(Tags.Caption)) { ClearStackBackTo(Tags.Table); _formattingElements.AddScopeMarker(); AddElement(new HtmlTableCaptionElement(_document, null), token.AsTag(), false); _currentMode = HtmlTreeMode.InCaption; } else if (name2.Is(Tags.Colgroup)) { ClearStackBackTo(Tags.Table); AddElement(new HtmlTableColgroupElement(_document, null), token.AsTag(), false); _currentMode = HtmlTreeMode.InColumnGroup; } else if (name2.Is(Tags.Col)) { InTable(HtmlTagToken.Open(Tags.Colgroup)); InColumnGroup(token); } else if (Tags.AllTableSections.Contains(name2)) { ClearStackBackTo(Tags.Table); AddElement(new HtmlTableSectionElement(_document, name2, null), token.AsTag(), false); _currentMode = HtmlTreeMode.InTableBody; } else if (Tags.AllTableCellsRows.Contains(name2)) { InTable(HtmlTagToken.Open(Tags.Tbody)); InTableBody(token); } else if (name2.Is(Tags.Table)) { RaiseErrorOccurred(HtmlParseError.TableNesting, token); if (InTableEndTagTable(token)) Home(token); } else if (name2.Is(Tags.Input)) { HtmlTagToken htmlTagToken = token.AsTag(); if (htmlTagToken.GetAttribute(AttributeNames.Type).Isi(AttributeNames.Hidden)) { RaiseErrorOccurred(HtmlParseError.InputUnexpected, token); AddElement(new HtmlInputElement(_document, null), htmlTagToken, true); CloseCurrentNode(); } else { RaiseErrorOccurred(HtmlParseError.TokenNotPossible, token); InBodyWithFoster(token); } } else if (name2.Is(Tags.Form)) { RaiseErrorOccurred(HtmlParseError.FormInappropriate, token); if (_currentFormElement == null) { _currentFormElement = new HtmlFormElement(_document, null); AddElement(_currentFormElement, token.AsTag(), false); CloseCurrentNode(); } } else if (Tags.AllTableHead.Contains(name2)) { InHead(token); } else { RaiseErrorOccurred(HtmlParseError.IllegalElementInTableDetected, token); InBodyWithFoster(token); } return; } case HtmlTokenType.EndTag: { string name = token.Name; if (name.Is(Tags.Table)) InTableEndTagTable(token); else if (name.Is(Tags.Template)) { InHead(token); } else if (Tags.AllTableSpecial.Contains(name) || Tags.AllTableInner.Contains(name)) { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); } else { RaiseErrorOccurred(HtmlParseError.IllegalElementInTableDetected, token); InBodyWithFoster(token); } return; } case HtmlTokenType.EndOfFile: InBody(token); return; case HtmlTokenType.Character: if (Tags.AllTableMajor.Contains(CurrentNode.LocalName)) { InTableText(token); return; } break; } RaiseErrorOccurred(HtmlParseError.TokenNotPossible, token); InBodyWithFoster(token); } private void InTableText(HtmlToken token) { if (token.HasContent) { RaiseErrorOccurred(HtmlParseError.TokenNotPossible, token); InBodyWithFoster(token); } else AddCharacters(token.Data); } private void InCaption(HtmlToken token) { switch (token.Type) { case HtmlTokenType.EndTag: { string name2 = token.Name; if (name2.Is(Tags.Caption)) { InCaptionEndTagCaption(token); return; } if (Tags.AllCaptionStart.Contains(name2)) { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); return; } if (name2.Is(Tags.Table)) { RaiseErrorOccurred(HtmlParseError.TableNesting, token); if (InCaptionEndTagCaption(token)) InTable(token); return; } break; } case HtmlTokenType.StartTag: { string name = token.Name; if (Tags.AllCaptionEnd.Contains(name)) { RaiseErrorOccurred(HtmlParseError.TagCannotStartHere, token); if (InCaptionEndTagCaption(token)) InTable(token); return; } break; } } InBody(token); } private void InColumnGroup(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: { string text = token.TrimStart(); AddCharacters(text); if (token.IsEmpty) return; break; } case HtmlTokenType.Comment: CurrentNode.AddComment(token); return; case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); return; case HtmlTokenType.StartTag: { string name2 = token.Name; if (name2.Is(Tags.Html)) { InBody(token); return; } if (name2.Is(Tags.Col)) { AddElement(new HtmlTableColElement(_document, null), token.AsTag(), true); CloseCurrentNode(); return; } if (name2.Is(Tags.Template)) { InHead(token); return; } break; } case HtmlTokenType.EndTag: { string name = token.Name; if (name.Is(Tags.Colgroup)) { InColumnGroupEndTagColgroup(token); return; } if (name.Is(Tags.Col)) { RaiseErrorOccurred(HtmlParseError.TagClosedWrong, token); return; } if (name.Is(Tags.Template)) { InHead(token); return; } break; } case HtmlTokenType.EndOfFile: InBody(token); return; } if (InColumnGroupEndTagColgroup(token)) InTable(token); } private void InTableBody(HtmlToken token) { switch (token.Type) { case HtmlTokenType.StartTag: { string name2 = token.Name; if (name2.Is(Tags.Tr)) { ClearStackBackTo(Tags.AllTableSections); AddElement(new HtmlTableRowElement(_document, null), token.AsTag(), false); _currentMode = HtmlTreeMode.InRow; return; } if (Tags.AllTableCells.Contains(name2)) { InTableBody(HtmlTagToken.Open(Tags.Tr)); InRow(token); return; } if (Tags.AllTableGeneral.Contains(name2)) { InTableBodyCloseTable(token.AsTag()); return; } break; } case HtmlTokenType.EndTag: { string name = token.Name; if (Tags.AllTableSections.Contains(name)) { if (IsInTableScope(name)) { ClearStackBackTo(Tags.AllTableSections); CloseCurrentNode(); _currentMode = HtmlTreeMode.InTable; } else RaiseErrorOccurred(HtmlParseError.TableSectionNotInScope, token); return; } if (name.Is(Tags.Tr) || Tags.AllTableSpecial.Contains(name)) { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); return; } if (name.Is(Tags.Table)) { InTableBodyCloseTable(token.AsTag()); return; } break; } } InTable(token); } private void InRow(HtmlToken token) { switch (token.Type) { case HtmlTokenType.StartTag: { string name2 = token.Name; if (Tags.AllTableCells.Contains(name2)) { ClearStackBackTo(Tags.Tr); AddElement(token.AsTag(), false); _currentMode = HtmlTreeMode.InCell; _formattingElements.AddScopeMarker(); return; } if (name2.Is(Tags.Tr) || Tags.AllTableGeneral.Contains(name2)) { if (InRowEndTagTablerow(token)) InTableBody(token); return; } break; } case HtmlTokenType.EndTag: { string name = token.Name; if (name.Is(Tags.Tr)) { InRowEndTagTablerow(token); return; } if (name.Is(Tags.Table)) { if (InRowEndTagTablerow(token)) InTableBody(token); return; } if (Tags.AllTableSections.Contains(name)) { if (IsInTableScope(name)) { InRowEndTagTablerow(token); InTableBody(token); } else RaiseErrorOccurred(HtmlParseError.TableSectionNotInScope, token); return; } if (Tags.AllTableSpecial.Contains(name)) { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); return; } break; } } InTable(token); } private void InCell(HtmlToken token) { switch (token.Type) { case HtmlTokenType.StartTag: { string name2 = token.Name; if (Tags.AllTableCellsRows.Contains(name2) || Tags.AllTableGeneral.Contains(name2)) { if (IsInTableScope(Tags.AllTableCells)) { InCellEndTagCell(token); Home(token); } else RaiseErrorOccurred(HtmlParseError.TableCellNotInScope, token); return; } break; } case HtmlTokenType.EndTag: { string name = token.Name; if (Tags.AllTableCells.Contains(name)) InCellEndTagCell(token); else if (Tags.AllTableCore.Contains(name)) { if (IsInTableScope(name)) { InCellEndTagCell(token); Home(token); } else RaiseErrorOccurred(HtmlParseError.TableNotInScope, token); } else if (!Tags.AllTableSpecial.Contains(name)) { InBody(token); } else { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); } return; } } InBody(token); } private void InSelect(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: AddCharacters(token.Data); break; case HtmlTokenType.Comment: CurrentNode.AddComment(token); break; case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); break; case HtmlTokenType.StartTag: { string name2 = token.Name; if (name2.Is(Tags.Html)) InBody(token); else if (name2.Is(Tags.Option)) { if (CurrentNode.LocalName.Is(Tags.Option)) InSelectEndTagOption(token); AddElement(new HtmlOptionElement(_document, null), token.AsTag(), false); } else if (name2.Is(Tags.Optgroup)) { if (CurrentNode.LocalName.Is(Tags.Option)) InSelectEndTagOption(token); if (CurrentNode.LocalName.Is(Tags.Optgroup)) InSelectEndTagOptgroup(token); AddElement(new HtmlOptionsGroupElement(_document, null), token.AsTag(), false); } else if (name2.Is(Tags.Select)) { RaiseErrorOccurred(HtmlParseError.SelectNesting, token); InSelectEndTagSelect(); } else if (Tags.AllInput.Contains(name2)) { RaiseErrorOccurred(HtmlParseError.IllegalElementInSelectDetected, token); if (IsInSelectScope(Tags.Select)) { InSelectEndTagSelect(); Home(token); } } else if (name2.IsOneOf(Tags.Template, Tags.Script)) { InHead(token); } else { RaiseErrorOccurred(HtmlParseError.IllegalElementInSelectDetected, token); } break; } case HtmlTokenType.EndTag: { string name = token.Name; if (name.Is(Tags.Template)) InHead(token); else if (name.Is(Tags.Optgroup)) { InSelectEndTagOptgroup(token); } else if (name.Is(Tags.Option)) { InSelectEndTagOption(token); } else if (name.Is(Tags.Select) && IsInSelectScope(Tags.Select)) { InSelectEndTagSelect(); } else if (name.Is(Tags.Select)) { RaiseErrorOccurred(HtmlParseError.SelectNotInScope, token); } else { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); } break; } case HtmlTokenType.EndOfFile: InBody(token); break; default: RaiseErrorOccurred(HtmlParseError.TokenNotPossible, token); break; } } private void InSelectInTable(HtmlToken token) { switch (token.Type) { case HtmlTokenType.StartTag: { string name2 = token.Name; if (Tags.AllTableSelects.Contains(name2)) { RaiseErrorOccurred(HtmlParseError.IllegalElementInSelectDetected, token); InSelectEndTagSelect(); Home(token); return; } break; } case HtmlTokenType.EndTag: { string name = token.Name; if (Tags.AllTableSelects.Contains(name)) { RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); if (IsInTableScope(name)) { InSelectEndTagSelect(); Home(token); } return; } break; } } InSelect(token); } private void InTemplate(HtmlToken token) { switch (token.Type) { case HtmlTokenType.StartTag: { string name = token.Name; if (name.Is(Tags.Script) || Tags.AllHead.Contains(name)) InHead(token); else if (Tags.AllTableRoot.Contains(name)) { TemplateStep(token, HtmlTreeMode.InTable); } else if (name.Is(Tags.Col)) { TemplateStep(token, HtmlTreeMode.InColumnGroup); } else if (name.Is(Tags.Tr)) { TemplateStep(token, HtmlTreeMode.InTableBody); } else if (Tags.AllTableCells.Contains(name)) { TemplateStep(token, HtmlTreeMode.InRow); } else { TemplateStep(token, HtmlTreeMode.InBody); } break; } case HtmlTokenType.EndTag: if (token.Name.Is(Tags.Template)) InHead(token); else RaiseErrorOccurred(HtmlParseError.TagCannotEndHere, token); break; case HtmlTokenType.EndOfFile: if (TagCurrentlyOpen(Tags.Template)) { RaiseErrorOccurred(HtmlParseError.EOF, token); CloseTemplate(); Home(token); } else End(); break; default: InBody(token); break; } } private void AfterBody(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: { string text = token.TrimStart(); ReconstructFormatting(); AddCharacters(text); if (token.IsEmpty) return; break; } case HtmlTokenType.Comment: _openElements[0].AddComment(token); return; case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); return; case HtmlTokenType.StartTag: if (token.Name.Is(Tags.Html)) { InBody(token); return; } break; case HtmlTokenType.EndTag: if (token.Name.Is(Tags.Html)) { if (IsFragmentCase) RaiseErrorOccurred(HtmlParseError.TagInvalidInFragmentMode, token); else _currentMode = HtmlTreeMode.AfterAfterBody; return; } break; case HtmlTokenType.EndOfFile: End(); return; } RaiseErrorOccurred(HtmlParseError.TokenNotPossible, token); _currentMode = HtmlTreeMode.InBody; InBody(token); } private void InFrameset(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: { string text = token.TrimStart(); AddCharacters(text); if (token.IsEmpty) return; break; } case HtmlTokenType.Comment: CurrentNode.AddComment(token); return; case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); return; case HtmlTokenType.StartTag: { string name = token.Name; if (name.Is(Tags.Html)) { InBody(token); return; } if (name.Is(Tags.Frameset)) { AddElement(new HtmlFrameSetElement(_document, null), token.AsTag(), false); return; } if (name.Is(Tags.Frame)) { AddElement(new HtmlFrameElement(_document, null), token.AsTag(), true); CloseCurrentNode(); return; } if (name.Is(Tags.NoFrames)) { InHead(token); return; } break; } case HtmlTokenType.EndTag: if (token.Name.Is(Tags.Frameset)) { if (CurrentNode != _openElements[0]) { CloseCurrentNode(); if (!IsFragmentCase && !CurrentNode.LocalName.Is(Tags.Frameset)) _currentMode = HtmlTreeMode.AfterFrameset; } else RaiseErrorOccurred(HtmlParseError.CurrentNodeIsRoot, token); return; } break; case HtmlTokenType.EndOfFile: if (CurrentNode != _document.DocumentElement) RaiseErrorOccurred(HtmlParseError.CurrentNodeIsNotRoot, token); End(); return; } RaiseErrorOccurred(HtmlParseError.TokenNotPossible, token); } private void AfterFrameset(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: { string text = token.TrimStart(); AddCharacters(text); if (token.IsEmpty) return; break; } case HtmlTokenType.Comment: CurrentNode.AddComment(token); return; case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); return; case HtmlTokenType.StartTag: { string name = token.Name; if (name.Is(Tags.Html)) { InBody(token); return; } if (name.Is(Tags.NoFrames)) { InHead(token); return; } break; } case HtmlTokenType.EndTag: if (token.Name.Is(Tags.Html)) { _currentMode = HtmlTreeMode.AfterAfterFrameset; return; } break; case HtmlTokenType.EndOfFile: End(); return; } RaiseErrorOccurred(HtmlParseError.TokenNotPossible, token); } private void AfterAfterBody(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: { string text = token.TrimStart(); ReconstructFormatting(); AddCharacters(text); if (token.IsEmpty) return; break; } case HtmlTokenType.EndOfFile: End(); return; case HtmlTokenType.Comment: _document.AddComment(token); return; case HtmlTokenType.Doctype: InBody(token); return; case HtmlTokenType.StartTag: if (token.Name.Is(Tags.Html)) { InBody(token); return; } break; } RaiseErrorOccurred(HtmlParseError.TokenNotPossible, token); _currentMode = HtmlTreeMode.InBody; InBody(token); } private void AfterAfterFrameset(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Comment: _document.AddComment(token); return; case HtmlTokenType.Character: { string text = token.TrimStart(); ReconstructFormatting(); AddCharacters(text); if (token.IsEmpty) return; break; } case HtmlTokenType.Doctype: InBody(token); return; case HtmlTokenType.StartTag: { string name = token.Name; if (name.Is(Tags.Html)) { InBody(token); return; } if (name.Is(Tags.NoFrames)) { InHead(token); return; } break; } case HtmlTokenType.EndOfFile: End(); return; } RaiseErrorOccurred(HtmlParseError.TokenNotPossible, token); } private void TemplateStep(HtmlToken token, HtmlTreeMode mode) { _templateModes.Pop(); _templateModes.Push(mode); _currentMode = mode; Home(token); } private void CloseTemplate() { while (_openElements.Count > 0) { HtmlTemplateElement htmlTemplateElement = CurrentNode as HtmlTemplateElement; CloseCurrentNode(); if (htmlTemplateElement != null) { htmlTemplateElement.PopulateFragment(); break; } } _formattingElements.ClearFormatting(); _templateModes.Pop(); Reset(null); } private void InTableBodyCloseTable(HtmlTagToken tag) { if (IsInTableScope(Tags.AllTableSections)) { ClearStackBackTo(Tags.AllTableSections); CloseCurrentNode(); _currentMode = HtmlTreeMode.InTable; InTable(tag); } else RaiseErrorOccurred(HtmlParseError.TableSectionNotInScope, tag); } private void InSelectEndTagOption(HtmlToken token) { if (CurrentNode.LocalName.Is(Tags.Option)) CloseCurrentNode(); else RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, token); } private void InSelectEndTagOptgroup(HtmlToken token) { if (_openElements.Count > 1 && _openElements[_openElements.Count - 1].LocalName.Is(Tags.Option) && _openElements[_openElements.Count - 2].LocalName.Is(Tags.Optgroup)) CloseCurrentNode(); if (CurrentNode.LocalName.Is(Tags.Optgroup)) CloseCurrentNode(); else RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, token); } private bool InColumnGroupEndTagColgroup(HtmlToken token) { if (CurrentNode.LocalName.Is(Tags.Colgroup)) { CloseCurrentNode(); _currentMode = HtmlTreeMode.InTable; return true; } RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, token); return false; } private void AfterHeadStartTagBody(HtmlTagToken token) { AddElement(new HtmlBodyElement(_document, null), token, false); _frameset = false; _currentMode = HtmlTreeMode.InBody; } private void RawtextAlgorithm(HtmlTagToken tag) { AddElement(tag, false); _previousMode = _currentMode; _currentMode = HtmlTreeMode.Text; _tokenizer.State = HtmlParseMode.Rawtext; } private void RCDataAlgorithm(HtmlTagToken tag) { AddElement(tag, false); _previousMode = _currentMode; _currentMode = HtmlTreeMode.Text; _tokenizer.State = HtmlParseMode.RCData; } private void InBodyStartTagListItem(HtmlTagToken tag) { int num = _openElements.Count - 1; Element element = _openElements[num]; _frameset = false; while (true) { if (element.LocalName.Is(Tags.Li)) { InBody(HtmlTagToken.Close(element.LocalName)); break; } if (element.Flags.HasFlag(NodeFlags.Special) && !Tags.AllBasicBlocks.Contains(element.LocalName)) break; element = _openElements[--num]; } if (IsInButtonScope()) InBodyEndTagParagraph(tag); AddElement(tag, false); } private void InBodyStartTagDefinitionItem(HtmlTagToken tag) { _frameset = false; int num = _openElements.Count - 1; Element element = _openElements[num]; while (true) { if (element.LocalName.IsOneOf(Tags.Dd, Tags.Dt)) { InBody(HtmlTagToken.Close(element.LocalName)); break; } if (element.Flags.HasFlag(NodeFlags.Special) && !Tags.AllBasicBlocks.Contains(element.LocalName)) break; element = _openElements[--num]; } if (IsInButtonScope()) InBodyEndTagParagraph(tag); AddElement(tag, false); } private bool InBodyEndTagBlock(HtmlTagToken tag) { if (IsInScope(tag.Name)) { GenerateImpliedEndTags(); if (!CurrentNode.LocalName.Is(tag.Name)) RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, tag); ClearStackBackTo(tag.Name); CloseCurrentNode(); return true; } RaiseErrorOccurred(HtmlParseError.BlockNotInScope, tag); return false; } private void HeisenbergAlgorithm(HtmlTagToken tag) { int num = 0; int num2 = 0; int num3 = 0; int num4 = 0; Element element; Element element2; while (true) { if (num >= 8) return; element = null; element2 = null; num++; num4 = 0; num2 = 0; for (int num5 = _formattingElements.Count - 1; num5 >= 0; num5--) { if (_formattingElements[num5] == null) break; if (_formattingElements[num5].LocalName.Is(tag.Name)) { num4 = num5; element = _formattingElements[num5]; break; } } if (element == null) { InBodyEndTagAnythingElse(tag); return; } int num6 = _openElements.IndexOf(element); if (num6 == -1) { RaiseErrorOccurred(HtmlParseError.FormattingElementNotFound, tag); _formattingElements.Remove(element); return; } if (!IsInScope(element.LocalName)) { RaiseErrorOccurred(HtmlParseError.ElementNotInScope, tag); return; } if (num6 != _openElements.Count - 1) RaiseErrorOccurred(HtmlParseError.TagClosedWrong, tag); num3 = num4; for (int i = num6 + 1; i < _openElements.Count; i++) { if (_openElements[i].Flags.HasFlag(NodeFlags.Special)) { num4 = i; element2 = _openElements[i]; break; } } if (element2 == null) break; Element element3 = _openElements[num6 - 1]; Element element4 = element2; Element element5 = element2; while (true) { num2++; element4 = _openElements[--num4]; if (element4 == element) break; if (num2 > 3 && _formattingElements.Contains(element4)) _formattingElements.Remove(element4); if (!_formattingElements.Contains(element4)) _openElements.Remove(element4); else { Element element6 = CopyElement(element4); element3.AddNode(element6); _openElements[num4] = element6; for (int j = 0; j != _formattingElements.Count; j++) { if (_formattingElements[j] == element4) { _formattingElements[j] = element6; break; } } element4 = element6; if (element5 == element2) num3++; if (element5.Parent != null) element5.Parent.RemoveChild(element5); element4.AddNode(element5); element5 = element4; } } if (element5.Parent != null) element5.Parent.RemoveChild(element5); if (!Tags.AllTableMajor.Contains(element3.LocalName)) element3.AddNode(element5); else AddElementWithFoster(element5); Element element7 = CopyElement(element); while (element2.ChildNodes.Length > 0) { Node node = element2.ChildNodes[0]; element2.RemoveNode(0, node); element7.AddNode(node); } element2.AddNode(element7); _formattingElements.Remove(element); _formattingElements.Insert(num3, element7); _openElements.Remove(element); _openElements.Insert(_openElements.IndexOf(element2) + 1, element7); } do { element2 = CurrentNode; CloseCurrentNode(); } while (element2 != element); _formattingElements.Remove(element); } private Element CopyElement(Element element) { return (Element)element.Clone(false); } private void InBodyWithFoster(HtmlToken token) { _foster = true; InBody(token); _foster = false; } private void InBodyEndTagAnythingElse(HtmlTagToken tag) { int num = _openElements.Count - 1; Element element = CurrentNode; while (true) { if (element == null) return; if (element.LocalName.Is(tag.Name)) { GenerateImpliedEndTagsExceptFor(tag.Name); if (!element.LocalName.Is(tag.Name)) RaiseErrorOccurred(HtmlParseError.TagClosedWrong, tag); int num2 = _openElements.Count - 1; while (num <= num2) { CloseCurrentNode(); num2--; } return; } if (element.Flags.HasFlag(NodeFlags.Special)) break; element = _openElements[--num]; } RaiseErrorOccurred(HtmlParseError.TagClosedWrong, tag); } private bool InBodyEndTagBody(HtmlToken token) { if (IsInScope(Tags.Body)) { CheckBodyOnClosing(token); _currentMode = HtmlTreeMode.AfterBody; return true; } RaiseErrorOccurred(HtmlParseError.BodyNotInScope, token); return false; } private void InBodyStartTagBreakrow(HtmlTagToken tag) { ReconstructFormatting(); AddElement(tag, false); CloseCurrentNode(); _frameset = false; } private bool InBodyEndTagParagraph(HtmlToken token) { if (IsInButtonScope()) { GenerateImpliedEndTagsExceptFor(Tags.P); if (!CurrentNode.LocalName.Is(Tags.P)) RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, token); ClearStackBackTo(Tags.P); CloseCurrentNode(); return true; } RaiseErrorOccurred(HtmlParseError.ParagraphNotInScope, token); InBody(HtmlTagToken.Open(Tags.P)); InBodyEndTagParagraph(token); return false; } private bool InTableEndTagTable(HtmlToken token) { if (IsInTableScope(Tags.Table)) { ClearStackBackTo(Tags.Table); CloseCurrentNode(); Reset(null); return true; } RaiseErrorOccurred(HtmlParseError.TableNotInScope, token); return false; } private bool InRowEndTagTablerow(HtmlToken token) { if (IsInTableScope(Tags.Tr)) { ClearStackBackTo(Tags.Tr); CloseCurrentNode(); _currentMode = HtmlTreeMode.InTableBody; return true; } RaiseErrorOccurred(HtmlParseError.TableRowNotInScope, token); return false; } private void InSelectEndTagSelect() { ClearStackBackTo(Tags.Select); CloseCurrentNode(); Reset(null); } private bool InCaptionEndTagCaption(HtmlToken token) { if (IsInTableScope(Tags.Caption)) { GenerateImpliedEndTags(); if (!CurrentNode.LocalName.Is(Tags.Caption)) RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, token); ClearStackBackTo(Tags.Caption); CloseCurrentNode(); _formattingElements.ClearFormatting(); _currentMode = HtmlTreeMode.InTable; return true; } RaiseErrorOccurred(HtmlParseError.CaptionNotInScope, token); return false; } private bool InCellEndTagCell(HtmlToken token) { if (IsInTableScope(Tags.AllTableCells)) { GenerateImpliedEndTags(); if (!Tags.AllTableCells.Contains(CurrentNode.LocalName)) RaiseErrorOccurred(HtmlParseError.TagDoesNotMatchCurrentNode, token); ClearStackBackTo(Tags.AllTableCells); CloseCurrentNode(); _formattingElements.ClearFormatting(); _currentMode = HtmlTreeMode.InRow; return true; } RaiseErrorOccurred(HtmlParseError.TableCellNotInScope, token); return false; } private void Foreign(HtmlToken token) { switch (token.Type) { case HtmlTokenType.Character: AddCharacters(token.Data.Replace('', '�')); if (token.HasContent) _frameset = false; break; case HtmlTokenType.StartTag: { string name2 = token.Name; HtmlTagToken htmlTagToken = token.AsTag(); if (name2.Is(Tags.Font)) { for (int i = 0; i != htmlTagToken.Attributes.Count; i++) { if (htmlTagToken.Attributes[i].Key.IsOneOf(AttributeNames.Color, AttributeNames.Face, AttributeNames.Size)) { ForeignNormalTag(htmlTagToken); return; } } ForeignSpecialTag(htmlTagToken); } else if (Tags.AllForeignExceptions.Contains(name2)) { ForeignNormalTag(htmlTagToken); } else { ForeignSpecialTag(htmlTagToken); } break; } case HtmlTokenType.EndTag: { string name = token.Name; Element element = CurrentNode; HtmlScriptElement htmlScriptElement = element as HtmlScriptElement; if (htmlScriptElement != null) HandleScript(htmlScriptElement); else { if (!element.LocalName.Is(name)) RaiseErrorOccurred(HtmlParseError.TagClosingMismatch, token); int num = _openElements.Count - 1; while (true) { if (num <= 0) return; if (element.LocalName.Isi(name)) { _openElements.RemoveRange(num + 1, _openElements.Count - num - 1); CloseCurrentNode(); return; } element = _openElements[num - 1]; if (element.Flags.HasFlag(NodeFlags.HtmlMember)) break; num--; } Home(token); } break; } case HtmlTokenType.Comment: CurrentNode.AddComment(token); break; case HtmlTokenType.Doctype: RaiseErrorOccurred(HtmlParseError.DoctypeTagInappropriate, token); break; } } private void ForeignSpecialTag(HtmlTagToken tag) { Element element = CreateForeignElementFrom(tag); if (element != null) { CurrentNode.AddNode(element); if (!tag.IsSelfClosing) { _openElements.Add(element); _tokenizer.IsAcceptingCharacterData = true; } else if (tag.Name.Is(Tags.Script)) { Foreign(HtmlTagToken.Close(Tags.Script)); } } } private Element CreateForeignElementFrom(HtmlTagToken tag) { if (AdjustedCurrentNode.Flags.HasFlag(NodeFlags.MathMember)) { MathElement mathElement = Factory.MathElements.Create(_document, tag.Name, null); for (int i = 0; i < tag.Attributes.Count; i++) { string key = tag.Attributes[i].Key; string value = tag.Attributes[i].Value; mathElement.AdjustAttribute(key.AdjustToMathAttribute(), value); } return mathElement; } if (AdjustedCurrentNode.Flags.HasFlag(NodeFlags.SvgMember)) { SvgElement svgElement = Factory.SvgElements.CreateSanatized(_document, tag.Name); for (int j = 0; j < tag.Attributes.Count; j++) { string key2 = tag.Attributes[j].Key; string value2 = tag.Attributes[j].Value; svgElement.AdjustAttribute(key2.AdjustToSvgAttribute(), value2); } return svgElement; } return null; } private void ForeignNormalTag(HtmlTagToken tag) { RaiseErrorOccurred(HtmlParseError.TagCannotStartHere, tag); if (IsFragmentCase) ForeignSpecialTag(tag); else { Element currentNode = CurrentNode; do { if (currentNode.LocalName.Is(Tags.AnnotationXml)) { string attribute = currentNode.GetAttribute(null, AttributeNames.Encoding); if (attribute.Isi(MimeTypes.Html) || attribute.Isi(MimeTypes.ApplicationXHtml)) { AddElement(tag, false); return; } } CloseCurrentNode(); currentNode = CurrentNode; } while ((currentNode.Flags & (NodeFlags.HtmlMember | NodeFlags.HtmlTip | NodeFlags.MathTip)) == NodeFlags.None); Consume(tag); } } private bool IsInScope(string tagName) { for (int num = _openElements.Count - 1; num >= 0; num--) { Element element = _openElements[num]; if (element.LocalName.Is(tagName)) return true; if (element.Flags.HasFlag(NodeFlags.Scoped)) return false; } return false; } private bool IsInScope(HashSet<string> tags) { for (int num = _openElements.Count - 1; num >= 0; num--) { Element element = _openElements[num]; if (tags.Contains(element.LocalName)) return true; if (element.Flags.HasFlag(NodeFlags.Scoped)) return false; } return false; } private bool IsInListItemScope() { for (int num = _openElements.Count - 1; num >= 0; num--) { Element element = _openElements[num]; if (element.LocalName.Is(Tags.Li)) return true; if (element.Flags.HasFlag(NodeFlags.HtmlListScoped)) return false; } return false; } private bool IsInButtonScope() { for (int num = _openElements.Count - 1; num >= 0; num--) { Element element = _openElements[num]; if (element.LocalName.Is(Tags.P)) return true; if (element.Flags.HasFlag(NodeFlags.Scoped) || element.LocalName.Is(Tags.Button)) return false; } return false; } private bool IsInTableScope(HashSet<string> tags) { for (int num = _openElements.Count - 1; num >= 0; num--) { Element element = _openElements[num]; if (tags.Contains(element.LocalName)) return true; if (element.Flags.HasFlag(NodeFlags.HtmlTableScoped)) return false; } return false; } private bool IsInTableScope(string tagName) { for (int num = _openElements.Count - 1; num >= 0; num--) { Element element = _openElements[num]; if (element.LocalName.Is(tagName)) return true; if (element.Flags.HasFlag(NodeFlags.HtmlTableScoped)) return false; } return false; } private bool IsInSelectScope(string tagName) { for (int num = _openElements.Count - 1; num >= 0; num--) { Element element = _openElements[num]; if (element.LocalName.Is(tagName)) return true; if (!element.Flags.HasFlag(NodeFlags.HtmlSelectScoped)) return false; } return false; } private void HandleScript(HtmlScriptElement script) { if (script != null && !IsFragmentCase) { _document.PerformMicrotaskCheckpoint(); _document.ProvideStableState(); CloseCurrentNode(); _currentMode = _previousMode; if (script.Prepare()) _waiting = RunScript(script); } } private async Task RunScript(HtmlScriptElement script) { await _document.WaitForReady().ConfigureAwait(false); script.Run(); } private void CheckBodyOnClosing(HtmlToken token) { int num = 0; while (true) { if (num >= _openElements.Count) return; if (!_openElements[num].Flags.HasFlag(NodeFlags.ImplicitelyClosed)) break; num++; } RaiseErrorOccurred(HtmlParseError.BodyClosedWrong, token); } private bool TagCurrentlyOpen(string tagName) { for (int i = 0; i < _openElements.Count; i++) { if (_openElements[i].LocalName.Is(tagName)) return true; } return false; } private void PreventNewLine() { HtmlToken htmlToken = _tokenizer.Get(); if (htmlToken.Type == HtmlTokenType.Character) htmlToken.RemoveNewLine(); Home(htmlToken); } private void End() { while (_openElements.Count != 0) { CloseCurrentNode(); } if (_document.ReadyState == DocumentReadyState.Loading) _waiting = _document.FinishLoading(); } private void AddRoot(HtmlTagToken tag) { HtmlHtmlElement htmlHtmlElement = new HtmlHtmlElement(_document, null); _document.AddNode(htmlHtmlElement); SetupElement(htmlHtmlElement, tag, false); _openElements.Add(htmlHtmlElement); _tokenizer.IsAcceptingCharacterData = false; _document.ApplyManifest(); } private void CloseCurrentNode() { if (_openElements.Count > 0) { _openElements.RemoveAt(_openElements.Count - 1); Element adjustedCurrentNode = AdjustedCurrentNode; _tokenizer.IsAcceptingCharacterData = (adjustedCurrentNode != null && !adjustedCurrentNode.Flags.HasFlag(NodeFlags.HtmlMember)); } } private void SetupElement(Element element, HtmlTagToken tag, bool acknowledgeSelfClosing) { if (tag.IsSelfClosing && !acknowledgeSelfClosing) RaiseErrorOccurred(HtmlParseError.TagCannotBeSelfClosed, tag); element.SetAttributes(tag.Attributes); } private Element AddElement(HtmlTagToken tag, bool acknowledgeSelfClosing = false) { HtmlElement htmlElement = Factory.HtmlElements.Create(_document, tag.Name, null); SetupElement(htmlElement, tag, acknowledgeSelfClosing); AddElement(htmlElement); return htmlElement; } private void AddElement(Element element, HtmlTagToken tag, bool acknowledgeSelfClosing = false) { SetupElement(element, tag, acknowledgeSelfClosing); AddElement(element); } private void AddElement(Element element) { Element currentNode = CurrentNode; if (_foster && Tags.AllTableMajor.Contains(currentNode.LocalName)) AddElementWithFoster(element); else currentNode.AddNode(element); _openElements.Add(element); _tokenizer.IsAcceptingCharacterData = !element.Flags.HasFlag(NodeFlags.HtmlMember); } private void AddElementWithFoster(Element element) { bool flag = false; int num = _openElements.Count; while (--num != 0) { if (_openElements[num].LocalName.Is(Tags.Template)) { _openElements[num].AddNode(element); return; } if (_openElements[num].LocalName.Is(Tags.Table)) { flag = true; break; } } Node node = _openElements[num].Parent ?? _openElements[num + 1]; if (flag && _openElements[num].Parent != null) { int num2 = 0; while (true) { if (num2 >= node.ChildNodes.Length) return; if (node.ChildNodes[num2] == _openElements[num]) break; num2++; } node.InsertNode(num2, element); } else node.AddNode(element); } private void AddCharacters(string text) { if (!string.IsNullOrEmpty(text)) { Element currentNode = CurrentNode; if (_foster && Tags.AllTableMajor.Contains(currentNode.LocalName)) AddCharactersWithFoster(text); else currentNode.AppendText(text); } } private void AddCharactersWithFoster(string text) { bool flag = false; int num = _openElements.Count; while (--num != 0) { if (_openElements[num].LocalName.Is(Tags.Template)) { _openElements[num].AppendText(text); return; } if (_openElements[num].LocalName.Is(Tags.Table)) { flag = true; break; } } Node node = _openElements[num].Parent ?? _openElements[num + 1]; if (flag && _openElements[num].Parent != null) { int num2 = 0; while (true) { if (num2 >= node.ChildNodes.Length) return; if (node.ChildNodes[num2] == _openElements[num]) break; num2++; } node.InsertText(num2, text); } else node.AppendText(text); } private void ClearStackBackTo(string tagName) { Element currentNode = CurrentNode; while (!currentNode.LocalName.IsOneOf(tagName, Tags.Html, Tags.Template)) { CloseCurrentNode(); currentNode = CurrentNode; } } private void ClearStackBackTo(HashSet<string> tags) { Element currentNode = CurrentNode; while (!tags.Contains(currentNode.LocalName) && !currentNode.LocalName.IsOneOf(Tags.Html, Tags.Template)) { CloseCurrentNode(); currentNode = CurrentNode; } } private void GenerateImpliedEndTagsExceptFor(string tagName) { Element currentNode = CurrentNode; while (currentNode.Flags.HasFlag(NodeFlags.ImpliedEnd) && !currentNode.LocalName.Is(tagName)) { CloseCurrentNode(); currentNode = CurrentNode; } } private void GenerateImpliedEndTags() { while (CurrentNode.Flags.HasFlag(NodeFlags.ImpliedEnd)) { CloseCurrentNode(); } } private void ReconstructFormatting() { if (_formattingElements.Count != 0) { int i = _formattingElements.Count - 1; Element element = _formattingElements[i]; if (element != null && !_openElements.Contains(element)) { while (i > 0) { element = _formattingElements[--i]; if (element == null || _openElements.Contains(element)) { i++; break; } } for (; i < _formattingElements.Count; i++) { Element element2 = CopyElement(_formattingElements[i]); AddElement(element2); _formattingElements[i] = element2; } } } } private void RaiseErrorOccurred(HtmlParseError code, HtmlToken token) { _tokenizer.RaiseErrorOccurred(code, token.Position); } } }