1 /* This Source Code Form is subject to the terms of the Mozilla Public
2  * License, v. 2.0. If a copy of the MPL was not distributed with this
3  * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
4 
5 #include "nsHtml5StringParser.h"
6 #include "nsHtml5TreeOpExecutor.h"
7 #include "nsHtml5TreeBuilder.h"
8 #include "nsHtml5Tokenizer.h"
9 #include "nsIContent.h"
10 #include "nsIDocument.h"
11 #include "nsIDOMDocumentFragment.h"
12 #include "nsHtml5DependentUTF16Buffer.h"
13 
NS_IMPL_ISUPPORTS0(nsHtml5StringParser)14 NS_IMPL_ISUPPORTS0(nsHtml5StringParser)
15 
16 nsHtml5StringParser::nsHtml5StringParser()
17   : mBuilder(new nsHtml5OplessBuilder())
18   , mTreeBuilder(new nsHtml5TreeBuilder(mBuilder))
19   , mTokenizer(new nsHtml5Tokenizer(mTreeBuilder, false))
20 {
21   MOZ_COUNT_CTOR(nsHtml5StringParser);
22   mTokenizer->setInterner(&mAtomTable);
23 }
24 
~nsHtml5StringParser()25 nsHtml5StringParser::~nsHtml5StringParser()
26 {
27   MOZ_COUNT_DTOR(nsHtml5StringParser);
28 }
29 
30 nsresult
ParseFragment(const nsAString & aSourceBuffer,nsIContent * aTargetNode,nsIAtom * aContextLocalName,int32_t aContextNamespace,bool aQuirks,bool aPreventScriptExecution)31 nsHtml5StringParser::ParseFragment(const nsAString& aSourceBuffer,
32                                    nsIContent* aTargetNode,
33                                    nsIAtom* aContextLocalName,
34                                    int32_t aContextNamespace,
35                                    bool aQuirks,
36                                    bool aPreventScriptExecution)
37 {
38   NS_ENSURE_TRUE(aSourceBuffer.Length() <= INT32_MAX,
39                  NS_ERROR_OUT_OF_MEMORY);
40 
41   nsIDocument* doc = aTargetNode->OwnerDoc();
42   nsIURI* uri = doc->GetDocumentURI();
43   NS_ENSURE_TRUE(uri, NS_ERROR_NOT_AVAILABLE);
44 
45   mTreeBuilder->setFragmentContext(aContextLocalName,
46                                    aContextNamespace,
47                                    aTargetNode,
48                                    aQuirks);
49 
50 #ifdef DEBUG
51   if (!aPreventScriptExecution) {
52     NS_ASSERTION(!aTargetNode->IsInUncomposedDoc(),
53                  "If script execution isn't prevented, "
54                  "the target node must not be in doc.");
55     nsCOMPtr<nsIDOMDocumentFragment> domFrag = do_QueryInterface(aTargetNode);
56     NS_ASSERTION(domFrag,
57       "If script execution isn't prevented, must parse to DOM fragment.");
58   }
59 #endif
60 
61   mTreeBuilder->SetPreventScriptExecution(aPreventScriptExecution);
62 
63   return Tokenize(aSourceBuffer, doc, true);
64 }
65 
66 nsresult
ParseDocument(const nsAString & aSourceBuffer,nsIDocument * aTargetDoc,bool aScriptingEnabledForNoscriptParsing)67 nsHtml5StringParser::ParseDocument(const nsAString& aSourceBuffer,
68                                    nsIDocument* aTargetDoc,
69                                    bool aScriptingEnabledForNoscriptParsing)
70 {
71   MOZ_ASSERT(!aTargetDoc->GetFirstChild());
72 
73   NS_ENSURE_TRUE(aSourceBuffer.Length() <= INT32_MAX,
74                  NS_ERROR_OUT_OF_MEMORY);
75 
76   mTreeBuilder->setFragmentContext(nullptr,
77                                    kNameSpaceID_None,
78                                    nullptr,
79                                    false);
80 
81   mTreeBuilder->SetPreventScriptExecution(true);
82 
83   return Tokenize(aSourceBuffer, aTargetDoc, aScriptingEnabledForNoscriptParsing);
84 }
85 
86 nsresult
Tokenize(const nsAString & aSourceBuffer,nsIDocument * aDocument,bool aScriptingEnabledForNoscriptParsing)87 nsHtml5StringParser::Tokenize(const nsAString& aSourceBuffer,
88                               nsIDocument* aDocument,
89                               bool aScriptingEnabledForNoscriptParsing) {
90 
91   nsIURI* uri = aDocument->GetDocumentURI();
92 
93   mBuilder->Init(aDocument, uri, nullptr, nullptr);
94 
95   mBuilder->SetParser(this);
96   mBuilder->SetNodeInfoManager(aDocument->NodeInfoManager());
97 
98   // Mark the parser as *not* broken by passing NS_OK
99   nsresult rv = mBuilder->MarkAsBroken(NS_OK);
100 
101   mTreeBuilder->setScriptingEnabled(aScriptingEnabledForNoscriptParsing);
102   mTreeBuilder->setIsSrcdocDocument(aDocument->IsSrcdocDocument());
103   mBuilder->Start();
104   mTokenizer->start();
105   if (!aSourceBuffer.IsEmpty()) {
106     bool lastWasCR = false;
107     nsHtml5DependentUTF16Buffer buffer(aSourceBuffer);
108     while (buffer.hasMore()) {
109       buffer.adjust(lastWasCR);
110       lastWasCR = false;
111       if (buffer.hasMore()) {
112         if (!mTokenizer->EnsureBufferSpace(buffer.getLength())) {
113           rv = mBuilder->MarkAsBroken(NS_ERROR_OUT_OF_MEMORY);
114           break;
115         }
116         lastWasCR = mTokenizer->tokenizeBuffer(&buffer);
117         if (NS_FAILED(rv = mBuilder->IsBroken())) {
118           break;
119         }
120       }
121     }
122   }
123   if (NS_SUCCEEDED(rv)) {
124     mTokenizer->eof();
125   }
126   mTokenizer->end();
127   mBuilder->Finish();
128   mAtomTable.Clear();
129   return rv;
130 }
131