Context Navigation

Lexer.h@ 67494

Visit:

Last change on this file since 67494 was 66962, checked in by [email protected], 15 years ago

Refactoring multiline comments in the lexer
https://bugs.webkit.org/show_bug.cgi?id=45289

Reviewed by Darin Adler.

MultiLine comment parsing is moved to a separate function.

Slight performance increase on --parse-only tests (from 33.6ms to 32.8ms)
SunSpider reports no change (from 523.1ms to 521.2ms).

parser/Lexer.cpp:

(JSC::Lexer::parseMultilineComment):
(JSC::Lexer::lex):

parser/Lexer.h:

Property svn:eol-style set to native

File size: 5.2 KB

Line
1	/*
2	* Copyright (C) 1999-2000 Harri Porten ([email protected])
3	* Copyright (C) 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009 Apple Inc. All rights reserved.
4	* Copyright (C) 2010 Zoltan Herczeg ([email protected])
5	*
6	* This library is free software; you can redistribute it and/or
7	* modify it under the terms of the GNU Library General Public
8	* License as published by the Free Software Foundation; either
9	* version 2 of the License, or (at your option) any later version.
10	*
11	* This library is distributed in the hope that it will be useful,
12	* but WITHOUT ANY WARRANTY; without even the implied warranty of
13	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14	* Library General Public License for more details.
15	*
16	* You should have received a copy of the GNU Library General Public License
17	* along with this library; see the file COPYING.LIB. If not, write to
18	* the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
19	* Boston, MA 02110-1301, USA.
20	*
21	*/
22
23	#ifndef Lexer_h
24	#define Lexer_h
25
26	#include "JSParser.h"
27	#include "Lookup.h"
28	#include "ParserArena.h"
29	#include "SourceCode.h"
30	#include <wtf/ASCIICType.h>
31	#include <wtf/AlwaysInline.h>
32	#include <wtf/SegmentedVector.h>
33	#include <wtf/Vector.h>
34	#include <wtf/unicode/Unicode.h>
35
36	namespace JSC {
37
38	class RegExp;
39
40	class Lexer : public Noncopyable {
41	public:
42	// Character manipulation functions.
43	static bool isWhiteSpace(int character);
44	static bool isLineTerminator(int character);
45	static unsigned char convertHex(int c1, int c2);
46	static UChar convertUnicode(int c1, int c2, int c3, int c4);
47
48	// Functions to set up parsing.
49	void setCode(const SourceCode&, ParserArena&);
50	void setIsReparsing() { m_isReparsing = true; }
51
52	// Functions for the parser itself.
53	enum LexType { IdentifyReservedWords, IgnoreReservedWords };
54	JSTokenType lex(JSTokenData* lvalp, JSTokenInfo* llocp, LexType);
55	int lineNumber() const { return m_lineNumber; }
56	void setLastLineNumber(int lastLineNumber) { m_lastLineNumber = lastLineNumber; }
57	int lastLineNumber() const { return m_lastLineNumber; }
58	bool prevTerminator() const { return m_terminator; }
59	SourceCode sourceCode(int openBrace, int closeBrace, int firstLine);
60	bool scanRegExp(const Identifier& pattern, const Identifier& flags, UChar patternPrefix = 0);
61	bool skipRegExp();
62
63	// Functions for use after parsing.
64	bool sawError() const { return m_error; }
65	void clear();
66	int currentOffset() { return m_code - m_codeStart; }
67	void setOffset(int offset)
68	{
69	m_code = m_codeStart + offset;
70	m_current = *m_code;
71	}
72
73	private:
74	friend class JSGlobalData;
75
76	Lexer(JSGlobalData*);
77	~Lexer();
78
79	void record8(int);
80	void record16(int);
81	void record16(UChar);
82
83	void copyCodeWithoutBOMs();
84
85	ALWAYS_INLINE void shift();
86	ALWAYS_INLINE int peek(int offset);
87	int getUnicodeCharacter();
88	void shiftLineTerminator();
89
90	ALWAYS_INLINE const UChar* currentCharacter() const;
91	ALWAYS_INLINE int currentOffset() const;
92
93	ALWAYS_INLINE const Identifier* makeIdentifier(const UChar* characters, size_t length);
94
95	ALWAYS_INLINE bool lastTokenWasRestrKeyword() const;
96
97	ALWAYS_INLINE JSTokenType parseIdentifier(JSTokenData*, LexType);
98	ALWAYS_INLINE bool parseString(JSTokenData* lvalp);
99	ALWAYS_INLINE void parseHex(double& returnValue);
100	ALWAYS_INLINE bool parseOctal(double& returnValue);
101	ALWAYS_INLINE bool parseDecimal(double& returnValue);
102	ALWAYS_INLINE void parseNumberAfterDecimalPoint();
103	ALWAYS_INLINE bool parseNumberAfterExponentIndicator();
104	ALWAYS_INLINE bool parseMultilineComment();
105
106	static const size_t initialReadBufferCapacity = 32;
107
108	int m_lineNumber;
109	int m_lastLineNumber;
110
111	Vector<char> m_buffer8;
112	Vector<UChar> m_buffer16;
113	bool m_terminator;
114	bool m_delimited; // encountered delimiter like "'" and "}" on last run
115	int m_lastToken;
116
117	const SourceCode* m_source;
118	const UChar* m_code;
119	const UChar* m_codeStart;
120	const UChar* m_codeEnd;
121	bool m_isReparsing;
122	bool m_atLineStart;
123	bool m_error;
124
125	// current and following unicode characters (int to allow for -1 for end-of-file marker)
126	int m_current;
127
128	IdentifierArena* m_arena;
129
130	JSGlobalData* m_globalData;
131
132	const HashTable m_keywordTable;
133	};
134
135	inline bool Lexer::isWhiteSpace(int ch)
136	{
137	return isASCII(ch) ? (ch == ' ' \|\| ch == '\t' \|\| ch == 0xB \|\| ch == 0xC) : (WTF::Unicode::isSeparatorSpace(ch) \|\| ch == 0xFEFF);
138	}
139
140	inline bool Lexer::isLineTerminator(int ch)
141	{
142	return ch == '\r' \|\| ch == '\n' \|\| (ch & ~1) == 0x2028;
143	}
144
145	inline unsigned char Lexer::convertHex(int c1, int c2)
146	{
147	return (toASCIIHexValue(c1) << 4) \| toASCIIHexValue(c2);
148	}
149
150	inline UChar Lexer::convertUnicode(int c1, int c2, int c3, int c4)
151	{
152	return (convertHex(c1, c2) << 8) \| convertHex(c3, c4);
153	}
154
155	} // namespace JSC
156
157	#endif // Lexer_h

Note: See TracBrowser for help on using the repository browser.

Context Navigation

source: webkit/trunk/JavaScriptCore/parser/Lexer.h@ 67494

Download in other formats: