1 /* 2 * Copyright (C) 2010 Adam Barth. All Rights Reserved. 3 * 4 * Redistribution and use in source and binary forms, with or without 5 * modification, are permitted provided that the following conditions 6 * are met: 7 * 1. Redistributions of source code must retain the above copyright 8 * notice, this list of conditions and the following disclaimer. 9 * 2. Redistributions in binary form must reproduce the above copyright 10 * notice, this list of conditions and the following disclaimer in the 11 * documentation and/or other materials provided with the distribution. 12 * 13 * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY 14 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 15 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 16 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR 17 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, 18 * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, 19 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR 20 * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY 21 * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 22 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 23 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 24 */ 25 26 #include "config.h" 27 #include "core/html/parser/HTMLSourceTracker.h" 28 29 #include "core/html/parser/HTMLTokenizer.h" 30 #include "wtf/text/StringBuilder.h" 31 32 namespace WebCore { 33 34 HTMLSourceTracker::HTMLSourceTracker() 35 { 36 } 37 38 void HTMLSourceTracker::start(SegmentedString& currentInput, HTMLTokenizer* tokenizer, HTMLToken& token) 39 { 40 if (token.type() == HTMLToken::Uninitialized) { 41 m_previousSource.clear(); 42 if (tokenizer->numberOfBufferedCharacters()) 43 m_previousSource = tokenizer->bufferedCharacters(); 44 } else 45 m_previousSource.append(m_currentSource); 46 47 m_currentSource = currentInput; 48 token.setBaseOffset(m_currentSource.numberOfCharactersConsumed() - m_previousSource.length()); 49 } 50 51 void HTMLSourceTracker::end(SegmentedString& currentInput, HTMLTokenizer* tokenizer, HTMLToken& token) 52 { 53 m_cachedSourceForToken = String(); 54 55 // FIXME: This work should really be done by the HTMLTokenizer. 56 token.end(currentInput.numberOfCharactersConsumed() - tokenizer->numberOfBufferedCharacters()); 57 } 58 59 String HTMLSourceTracker::sourceForToken(const HTMLToken& token) 60 { 61 if (!m_cachedSourceForToken.isEmpty()) 62 return m_cachedSourceForToken; 63 64 size_t length; 65 if (token.type() == HTMLToken::EndOfFile) { 66 // Consume the remainder of the input, omitting the null character we use to mark the end of the file. 67 length = m_previousSource.length() + m_currentSource.length() - 1; 68 } else { 69 ASSERT(!token.startIndex()); 70 length = static_cast<size_t>(token.endIndex() - token.startIndex()); 71 } 72 73 StringBuilder source; 74 source.reserveCapacity(length); 75 76 size_t i = 0; 77 for ( ; i < length && !m_previousSource.isEmpty(); ++i) { 78 source.append(m_previousSource.currentChar()); 79 m_previousSource.advance(); 80 } 81 for ( ; i < length; ++i) { 82 ASSERT(!m_currentSource.isEmpty()); 83 source.append(m_currentSource.currentChar()); 84 m_currentSource.advance(); 85 } 86 87 m_cachedSourceForToken = source.toString(); 88 return m_cachedSourceForToken; 89 } 90 91 } 92