blob: 5d8fae12e7f2bb08845b13c100431a4ce12411da [file] [log] [blame]
Torne (Richard Coles)51b29062013-11-28 11:56:03 +00001/*
2 * Copyright (C) 2003 Lars Knoll (knoll@kde.org)
3 * Copyright (C) 2004, 2005, 2006, 2008, 2009, 2010 Apple Inc. All rights reserved.
4 * Copyright (C) 2008 Eric Seidel <eric@webkit.org>
5 * Copyright (C) 2009 - 2010 Torch Mobile (Beijing) Co. Ltd. All rights reserved.
6 *
7 * This library is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Library General Public
9 * License as published by the Free Software Foundation; either
10 * version 2 of the License, or (at your option) any later version.
11 *
12 * This library is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Library General Public License for more details.
16 *
17 * You should have received a copy of the GNU Library General Public License
18 * along with this library; see the file COPYING.LIB. If not, write to
19 * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
20 * Boston, MA 02110-1301, USA.
21 */
22
23#ifndef CSSTokenizer_h
24#define CSSTokenizer_h
25
26#include "wtf/Noncopyable.h"
27#include "wtf/OwnPtr.h"
28#include "wtf/text/WTFString.h"
29
30namespace WebCore {
31
Torne (Richard Coles)09380292014-02-21 12:17:33 +000032class BisonCSSParser;
Torne (Richard Coles)51b29062013-11-28 11:56:03 +000033struct CSSParserLocation;
34struct CSSParserString;
35
36class CSSTokenizer {
37 WTF_MAKE_NONCOPYABLE(CSSTokenizer);
38public:
39 // FIXME: This should not be needed but there are still some ties between the 2 classes.
Torne (Richard Coles)09380292014-02-21 12:17:33 +000040 friend class BisonCSSParser;
Torne (Richard Coles)51b29062013-11-28 11:56:03 +000041
Torne (Richard Coles)09380292014-02-21 12:17:33 +000042 CSSTokenizer(BisonCSSParser& parser)
Torne (Richard Coles)51b29062013-11-28 11:56:03 +000043 : m_parser(parser)
44 , m_parsedTextPrefixLength(0)
45 , m_parsedTextSuffixLength(0)
46 , m_parsingMode(NormalMode)
47 , m_is8BitSource(false)
48 , m_length(0)
49 , m_token(0)
50 , m_lineNumber(0)
51 , m_tokenStartLineNumber(0)
52 , m_internal(true)
53 {
54 m_tokenStart.ptr8 = 0;
55 }
56
57 void setupTokenizer(const char* prefix, unsigned prefixLength, const String&, const char* suffix, unsigned suffixLength);
58
59 CSSParserLocation currentLocation();
60
61 inline int lex(void* yylval) { return (this->*m_lexFunc)(yylval); }
62
63 inline unsigned safeUserStringTokenOffset()
64 {
65 return std::min(tokenStartOffset(), static_cast<unsigned>(m_length - 1 - m_parsedTextSuffixLength)) - m_parsedTextPrefixLength;
66 }
67
68 bool is8BitSource() const { return m_is8BitSource; }
69
70 // FIXME: These 2 functions should be private so that we don't need the definitions below.
71 template <typename CharacterType>
72 inline CharacterType* tokenStart();
73
74 inline unsigned tokenStartOffset();
75
76private:
77 UChar*& currentCharacter16();
78
79 template <typename CharacterType>
80 inline CharacterType*& currentCharacter();
81
82 template <typename CharacterType>
83 inline CharacterType* dataStart();
84
85 template <typename CharacterType>
86 inline void setTokenStart(CharacterType*);
87
88 template <typename CharacterType>
89 inline bool isIdentifierStart();
90
91 template <typename CharacterType>
92 inline CSSParserLocation tokenLocation();
93
94 template <typename CharacterType>
95 unsigned parseEscape(CharacterType*&);
96 template <typename DestCharacterType>
97 inline void UnicodeToChars(DestCharacterType*&, unsigned);
98 template <typename SrcCharacterType, typename DestCharacterType>
99 inline bool parseIdentifierInternal(SrcCharacterType*&, DestCharacterType*&, bool&);
100
101 template <typename CharacterType>
102 inline void parseIdentifier(CharacterType*&, CSSParserString&, bool&);
103
104 template <typename SrcCharacterType, typename DestCharacterType>
105 inline bool parseStringInternal(SrcCharacterType*&, DestCharacterType*&, UChar);
106
107 template <typename CharacterType>
108 inline void parseString(CharacterType*&, CSSParserString& resultString, UChar);
109
110 template <typename CharacterType>
111 inline bool findURI(CharacterType*& start, CharacterType*& end, UChar& quote);
112
113 template <typename SrcCharacterType, typename DestCharacterType>
114 inline bool parseURIInternal(SrcCharacterType*&, DestCharacterType*&, UChar quote);
115
116 template <typename CharacterType>
117 inline void parseURI(CSSParserString&);
118 template <typename CharacterType>
119 inline bool parseUnicodeRange();
120 template <typename CharacterType>
121 bool parseNthChild();
122 template <typename CharacterType>
123 bool parseNthChildExtra();
124 template <typename CharacterType>
125 inline bool detectFunctionTypeToken(int);
126 template <typename CharacterType>
127 inline void detectMediaQueryToken(int);
128 template <typename CharacterType>
129 inline void detectNumberToken(CharacterType*, int);
130 template <typename CharacterType>
131 inline void detectDashToken(int);
132 template <typename CharacterType>
133 inline void detectAtToken(int, bool);
134 template <typename CharacterType>
135 inline void detectSupportsToken(int);
Torne (Richard Coles)51b29062013-11-28 11:56:03 +0000136
137 template <typename SourceCharacterType>
138 int realLex(void* yylval);
139
Torne (Richard Coles)09380292014-02-21 12:17:33 +0000140 BisonCSSParser& m_parser;
Torne (Richard Coles)51b29062013-11-28 11:56:03 +0000141
142 size_t m_parsedTextPrefixLength;
143 size_t m_parsedTextSuffixLength;
144
145 enum ParsingMode {
146 NormalMode,
147 MediaQueryMode,
148 SupportsMode,
149 NthChildMode
150 };
151
152 ParsingMode m_parsingMode;
153 bool m_is8BitSource;
154 OwnPtr<LChar[]> m_dataStart8;
155 OwnPtr<UChar[]> m_dataStart16;
156 LChar* m_currentCharacter8;
157 UChar* m_currentCharacter16;
158 union {
159 LChar* ptr8;
160 UChar* ptr16;
161 } m_tokenStart;
162 unsigned m_length;
163 int m_token;
164 int m_lineNumber;
165 int m_tokenStartLineNumber;
166
167 // FIXME: This boolean is misnamed. Also it would be nice if we could consolidate it
168 // with the CSSParserMode logic to determine if internal properties are allowed.
169 bool m_internal;
170
171 int (CSSTokenizer::*m_lexFunc)(void*);
172};
173
174inline unsigned CSSTokenizer::tokenStartOffset()
175{
176 if (is8BitSource())
177 return m_tokenStart.ptr8 - m_dataStart8.get();
178 return m_tokenStart.ptr16 - m_dataStart16.get();
179}
180
181template <>
182inline LChar* CSSTokenizer::tokenStart<LChar>()
183{
184 return m_tokenStart.ptr8;
185}
186
187template <>
188inline UChar* CSSTokenizer::tokenStart<UChar>()
189{
190 return m_tokenStart.ptr16;
191}
192
193} // namespace WebCore
194
195#endif // CSSTokenizer_h