summaryrefslogtreecommitdiff
path: root/Source/WebCore/html/parser/HTMLSourceTracker.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'Source/WebCore/html/parser/HTMLSourceTracker.cpp')
-rw-r--r--Source/WebCore/html/parser/HTMLSourceTracker.cpp87
1 files changed, 87 insertions, 0 deletions
diff --git a/Source/WebCore/html/parser/HTMLSourceTracker.cpp b/Source/WebCore/html/parser/HTMLSourceTracker.cpp
new file mode 100644
index 000000000..e7c68764b
--- /dev/null
+++ b/Source/WebCore/html/parser/HTMLSourceTracker.cpp
@@ -0,0 +1,87 @@
+/*
+ * Copyright (C) 2010 Adam Barth. All Rights Reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY
+ * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+ * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR
+ * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
+ * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+ * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
+ * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
+ * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+ * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include "config.h"
+#include "HTMLSourceTracker.h"
+#include "HTMLTokenizer.h"
+#include <wtf/text/StringBuilder.h>
+
+namespace WebCore {
+
+HTMLSourceTracker::HTMLSourceTracker()
+{
+}
+
+void HTMLSourceTracker::start(const HTMLInputStream& input, HTMLTokenizer* tokenizer, HTMLToken& token)
+{
+ if (token.type() == HTMLTokenTypes::Uninitialized) {
+ m_previousSource.clear();
+ if (tokenizer->numberOfBufferedCharacters())
+ m_previousSource = tokenizer->bufferedCharacters();
+ } else
+ m_previousSource.append(m_currentSource);
+
+ m_currentSource = input.current();
+ token.setBaseOffset(m_currentSource.numberOfCharactersConsumed() - m_previousSource.length());
+}
+
+void HTMLSourceTracker::end(const HTMLInputStream& input, HTMLTokenizer* tokenizer, HTMLToken& token)
+{
+ m_cachedSourceForToken = String();
+
+ // FIXME: This work should really be done by the HTMLTokenizer.
+ token.end(input.current().numberOfCharactersConsumed() - tokenizer->numberOfBufferedCharacters());
+}
+
+String HTMLSourceTracker::sourceForToken(const HTMLToken& token)
+{
+ if (token.type() == HTMLTokenTypes::EndOfFile)
+ return String(); // Hides the null character we use to mark the end of file.
+
+ if (!m_cachedSourceForToken.isEmpty())
+ return m_cachedSourceForToken;
+
+ ASSERT(!token.startIndex());
+ size_t length = static_cast<size_t>(token.endIndex() - token.startIndex());
+
+ StringBuilder source;
+ source.reserveCapacity(length);
+
+ size_t i = 0;
+ for ( ; i < length && !m_previousSource.isEmpty(); ++i) {
+ source.append(*m_previousSource);
+ m_previousSource.advance();
+ }
+ for ( ; i < length; ++i) {
+ ASSERT(!m_currentSource.isEmpty());
+ source.append(*m_currentSource);
+ m_currentSource.advance();
+ }
+
+ m_cachedSourceForToken = source.toString();
+ return m_cachedSourceForToken;
+}
+
+}