Blame - test/cctest/test-parsing.cc - fp2-dev/platform/external/v8

blob: 6bcae7c308a4fd5fdcaa1a22ae566230d3310c68 [file] [log] [blame]

Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	1	// Copyright 2012 the V8 project authors. All rights reserved.
Steve Block	d0582a6	2009-12-15 09:54:21 +0000	[diff] [blame]	2	// Redistribution and use in source and binary forms, with or without
				3	// modification, are permitted provided that the following conditions are
				4	// met:
				5	//
				6	// * Redistributions of source code must retain the above copyright
				7	// notice, this list of conditions and the following disclaimer.
				8	// * Redistributions in binary form must reproduce the above
				9	// copyright notice, this list of conditions and the following
				10	// disclaimer in the documentation and/or other materials provided
				11	// with the distribution.
				12	// * Neither the name of Google Inc. nor the names of its
				13	// contributors may be used to endorse or promote products derived
				14	// from this software without specific prior written permission.
				15	//
				16	// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
				17	// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
				18	// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
				19	// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
				20	// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
				21	// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
				22	// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
				23	// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
				24	// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
				25	// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
				26	// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
				27
				28	#include <stdlib.h>
Teng-Hui Zhu	3e5fa29	2010-11-09 16:16:48 -0800	[diff] [blame]	29	#include <stdio.h>
Shimeng (Simon) Wang	8a31eba	2010-12-06 19:01:33 -0800	[diff] [blame]	30	#include <string.h>
Steve Block	d0582a6	2009-12-15 09:54:21 +0000	[diff] [blame]	31
				32	#include "v8.h"
				33
Steve Block	d0582a6	2009-12-15 09:54:21 +0000	[diff] [blame]	34	#include "cctest.h"
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	35	#include "compiler.h"
Ben Murdoch	589d697	2011-11-30 16:04:58 +0000	[diff] [blame]	36	#include "execution.h"
				37	#include "isolate.h"
				38	#include "parser.h"
				39	#include "preparser.h"
				40	#include "scanner-character-streams.h"
				41	#include "token.h"
				42	#include "utils.h"
Steve Block	d0582a6	2009-12-15 09:54:21 +0000	[diff] [blame]	43
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	44	TEST(ScanKeywords) {
Steve Block	d0582a6	2009-12-15 09:54:21 +0000	[diff] [blame]	45	struct KeywordToken {
				46	const char* keyword;
				47	i::Token::Value token;
				48	};
				49
				50	static const KeywordToken keywords[] = {
				51	#define KEYWORD(t, s, d) { s, i::Token::t },
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	52	TOKEN_LIST(IGNORE_TOKEN, KEYWORD)
Steve Block	d0582a6	2009-12-15 09:54:21 +0000	[diff] [blame]	53	#undef KEYWORD
				54	{ NULL, i::Token::IDENTIFIER }
				55	};
				56
Steve Block	d0582a6	2009-12-15 09:54:21 +0000	[diff] [blame]	57	KeywordToken key_token;
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	58	i::UnicodeCache unicode_cache;
				59	i::byte buffer[32];
Steve Block	d0582a6	2009-12-15 09:54:21 +0000	[diff] [blame]	60	for (int i = 0; (key_token = keywords[i]).keyword != NULL; i++) {
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	61	const i::byte* keyword =
				62	reinterpret_cast<const i::byte*>(key_token.keyword);
				63	int length = i::StrLength(key_token.keyword);
				64	CHECK(static_cast<int>(sizeof(buffer)) >= length);
				65	{
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	66	i::Utf8ToUtf16CharacterStream stream(keyword, length);
				67	i::Scanner scanner(&unicode_cache);
				68	// The scanner should parse Harmony keywords for this test.
				69	scanner.SetHarmonyScoping(true);
				70	scanner.SetHarmonyModules(true);
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	71	scanner.Initialize(&stream);
				72	CHECK_EQ(key_token.token, scanner.Next());
				73	CHECK_EQ(i::Token::EOS, scanner.Next());
Steve Block	d0582a6	2009-12-15 09:54:21 +0000	[diff] [blame]	74	}
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	75	// Removing characters will make keyword matching fail.
				76	{
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	77	i::Utf8ToUtf16CharacterStream stream(keyword, length - 1);
				78	i::Scanner scanner(&unicode_cache);
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	79	scanner.Initialize(&stream);
				80	CHECK_EQ(i::Token::IDENTIFIER, scanner.Next());
				81	CHECK_EQ(i::Token::EOS, scanner.Next());
Steve Block	d0582a6	2009-12-15 09:54:21 +0000	[diff] [blame]	82	}
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	83	// Adding characters will make keyword matching fail.
				84	static const char chars_to_append[] = { 'z', '0', '_' };
				85	for (int j = 0; j < static_cast<int>(ARRAY_SIZE(chars_to_append)); ++j) {
				86	memmove(buffer, keyword, length);
				87	buffer[length] = chars_to_append[j];
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	88	i::Utf8ToUtf16CharacterStream stream(buffer, length + 1);
				89	i::Scanner scanner(&unicode_cache);
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	90	scanner.Initialize(&stream);
				91	CHECK_EQ(i::Token::IDENTIFIER, scanner.Next());
				92	CHECK_EQ(i::Token::EOS, scanner.Next());
				93	}
				94	// Replacing characters will make keyword matching fail.
				95	{
				96	memmove(buffer, keyword, length);
				97	buffer[length - 1] = '_';
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	98	i::Utf8ToUtf16CharacterStream stream(buffer, length);
				99	i::Scanner scanner(&unicode_cache);
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	100	scanner.Initialize(&stream);
				101	CHECK_EQ(i::Token::IDENTIFIER, scanner.Next());
				102	CHECK_EQ(i::Token::EOS, scanner.Next());
				103	}
Steve Block	d0582a6	2009-12-15 09:54:21 +0000	[diff] [blame]	104	}
Steve Block	d0582a6	2009-12-15 09:54:21 +0000	[diff] [blame]	105	}
				106
Iain Merrick	9ac36c9	2010-09-13 15:29:50 +0100	[diff] [blame]	107
				108	TEST(ScanHTMLEndComments) {
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	109	v8::V8::Initialize();
				110
Iain Merrick	9ac36c9	2010-09-13 15:29:50 +0100	[diff] [blame]	111	// Regression test. See:
				112	// http://code.google.com/p/chromium/issues/detail?id=53548
				113	// Tests that --> is correctly interpreted as comment-to-end-of-line if there
Ben Murdoch	3fb3ca8	2011-12-02 17:19:32 +0000	[diff] [blame]	114	// is only whitespace before it on the line (with comments considered as
				115	// whitespace, even a multiline-comment containing a newline).
				116	// This was not the case if it occurred before the first real token
Iain Merrick	9ac36c9	2010-09-13 15:29:50 +0100	[diff] [blame]	117	// in the input.
				118	const char* tests[] = {
				119	// Before first real token.
				120	"--> is eol-comment\nvar y = 37;\n",
				121	"\n --> is eol-comment\nvar y = 37;\n",
				122	"/* precomment */ --> is eol-comment\nvar y = 37;\n",
				123	"\n/* precomment */ --> is eol-comment\nvar y = 37;\n",
				124	// After first real token.
				125	"var x = 42;\n--> is eol-comment\nvar y = 37;\n",
				126	"var x = 42;\n/* precomment */ --> is eol-comment\nvar y = 37;\n",
				127	NULL
				128	};
				129
Ben Murdoch	3fb3ca8	2011-12-02 17:19:32 +0000	[diff] [blame]	130	const char* fail_tests[] = {
				131	"x --> is eol-comment\nvar y = 37;\n",
				132	"\"\\n\" --> is eol-comment\nvar y = 37;\n",
				133	"x/* precomment */ --> is eol-comment\nvar y = 37;\n",
				134	"x/* precomment\n */ --> is eol-comment\nvar y = 37;\n",
				135	"var x = 42; --> is eol-comment\nvar y = 37;\n",
				136	"var x = 42; /* precomment\n */ --> is eol-comment\nvar y = 37;\n",
				137	NULL
				138	};
				139
Iain Merrick	9ac36c9	2010-09-13 15:29:50 +0100	[diff] [blame]	140	// Parser/Scanner needs a stack limit.
				141	int marker;
Steve Block	44f0eee	2011-05-26 01:26:41 +0100	[diff] [blame]	142	i::Isolate::Current()->stack_guard()->SetStackLimit(
Iain Merrick	9ac36c9	2010-09-13 15:29:50 +0100	[diff] [blame]	143	reinterpret_cast<uintptr_t>(&marker) - 128 * 1024);
				144
				145	for (int i = 0; tests[i]; i++) {
				146	v8::ScriptData* data =
Kristian Monsen	0d5e116	2010-09-30 15:31:59 +0100	[diff] [blame]	147	v8::ScriptData::PreCompile(tests[i], i::StrLength(tests[i]));
Iain Merrick	9ac36c9	2010-09-13 15:29:50 +0100	[diff] [blame]	148	CHECK(data != NULL && !data->HasError());
				149	delete data;
				150	}
Ben Murdoch	3fb3ca8	2011-12-02 17:19:32 +0000	[diff] [blame]	151
				152	for (int i = 0; fail_tests[i]; i++) {
				153	v8::ScriptData* data =
				154	v8::ScriptData::PreCompile(fail_tests[i], i::StrLength(fail_tests[i]));
				155	CHECK(data == NULL \|\| data->HasError());
				156	delete data;
				157	}
Iain Merrick	9ac36c9	2010-09-13 15:29:50 +0100	[diff] [blame]	158	}
				159
				160
				161	class ScriptResource : public v8::String::ExternalAsciiStringResource {
				162	public:
				163	ScriptResource(const char* data, size_t length)
				164	: data_(data), length_(length) { }
				165
				166	const char* data() const { return data_; }
				167	size_t length() const { return length_; }
				168
				169	private:
				170	const char* data_;
				171	size_t length_;
				172	};
				173
				174
				175	TEST(Preparsing) {
				176	v8::HandleScope handles;
				177	v8::Persistent<v8::Context> context = v8::Context::New();
				178	v8::Context::Scope context_scope(context);
				179	int marker;
Steve Block	44f0eee	2011-05-26 01:26:41 +0100	[diff] [blame]	180	i::Isolate::Current()->stack_guard()->SetStackLimit(
Iain Merrick	9ac36c9	2010-09-13 15:29:50 +0100	[diff] [blame]	181	reinterpret_cast<uintptr_t>(&marker) - 128 * 1024);
				182
				183	// Source containing functions that might be lazily compiled and all types
				184	// of symbols (string, propertyName, regexp).
				185	const char* source =
				186	"var x = 42;"
				187	"function foo(a) { return function nolazy(b) { return a + b; } }"
				188	"function bar(a) { if (a) return function lazy(b) { return b; } }"
				189	"var z = {'string': 'string literal', bareword: 'propertyName', "
				190	" 42: 'number literal', for: 'keyword as propertyName', "
				191	" f\\u006fr: 'keyword propertyname with escape'};"
				192	"var v = /RegExp Literal/;"
				193	"var w = /RegExp Literal\\u0020With Escape/gin;"
				194	"var y = { get getter() { return 42; }, "
				195	" set setter(v) { this.value = v; }};";
Kristian Monsen	0d5e116	2010-09-30 15:31:59 +0100	[diff] [blame]	196	int source_length = i::StrLength(source);
Iain Merrick	9ac36c9	2010-09-13 15:29:50 +0100	[diff] [blame]	197	const char* error_source = "var x = y z;";
Kristian Monsen	0d5e116	2010-09-30 15:31:59 +0100	[diff] [blame]	198	int error_source_length = i::StrLength(error_source);
Iain Merrick	9ac36c9	2010-09-13 15:29:50 +0100	[diff] [blame]	199
				200	v8::ScriptData* preparse =
				201	v8::ScriptData::PreCompile(source, source_length);
				202	CHECK(!preparse->HasError());
				203	bool lazy_flag = i::FLAG_lazy;
				204	{
				205	i::FLAG_lazy = true;
				206	ScriptResource* resource = new ScriptResource(source, source_length);
				207	v8::Local<v8::String> script_source = v8::String::NewExternal(resource);
				208	v8::Script::Compile(script_source, NULL, preparse);
				209	}
				210
				211	{
				212	i::FLAG_lazy = false;
				213
				214	ScriptResource* resource = new ScriptResource(source, source_length);
				215	v8::Local<v8::String> script_source = v8::String::NewExternal(resource);
				216	v8::Script::New(script_source, NULL, preparse, v8::Local<v8::String>());
				217	}
				218	delete preparse;
				219	i::FLAG_lazy = lazy_flag;
				220
				221	// Syntax error.
				222	v8::ScriptData* error_preparse =
				223	v8::ScriptData::PreCompile(error_source, error_source_length);
				224	CHECK(error_preparse->HasError());
				225	i::ScriptDataImpl *pre_impl =
				226	reinterpret_cast<i::ScriptDataImpl*>(error_preparse);
				227	i::Scanner::Location error_location =
				228	pre_impl->MessageLocation();
				229	// Error is at "z" in source, location 10..11.
				230	CHECK_EQ(10, error_location.beg_pos);
				231	CHECK_EQ(11, error_location.end_pos);
				232	// Should not crash.
				233	const char* message = pre_impl->BuildMessage();
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	234	pre_impl->BuildArgs();
Iain Merrick	9ac36c9	2010-09-13 15:29:50 +0100	[diff] [blame]	235	CHECK_GT(strlen(message), 0);
				236	}
Teng-Hui Zhu	3e5fa29	2010-11-09 16:16:48 -0800	[diff] [blame]	237
				238
				239	TEST(StandAlonePreParser) {
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	240	v8::V8::Initialize();
				241
Teng-Hui Zhu	3e5fa29	2010-11-09 16:16:48 -0800	[diff] [blame]	242	int marker;
Steve Block	44f0eee	2011-05-26 01:26:41 +0100	[diff] [blame]	243	i::Isolate::Current()->stack_guard()->SetStackLimit(
Teng-Hui Zhu	3e5fa29	2010-11-09 16:16:48 -0800	[diff] [blame]	244	reinterpret_cast<uintptr_t>(&marker) - 128 * 1024);
				245
				246	const char* programs[] = {
				247	"{label: 42}",
				248	"var x = 42;",
				249	"function foo(x, y) { return x + y; }",
Ben Murdoch	3fb3ca8	2011-12-02 17:19:32 +0000	[diff] [blame]	250	"%ArgleBargle(glop);",
Teng-Hui Zhu	3e5fa29	2010-11-09 16:16:48 -0800	[diff] [blame]	251	"var x = new new Function('this.x = 42');",
				252	NULL
				253	};
				254
Ben Murdoch	8b112d2	2011-06-08 16:22:53 +0100	[diff] [blame]	255	uintptr_t stack_limit = i::Isolate::Current()->stack_guard()->real_climit();
Teng-Hui Zhu	3e5fa29	2010-11-09 16:16:48 -0800	[diff] [blame]	256	for (int i = 0; programs[i]; i++) {
				257	const char* program = programs[i];
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	258	i::Utf8ToUtf16CharacterStream stream(
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	259	reinterpret_cast<const i::byte*>(program),
				260	static_cast<unsigned>(strlen(program)));
Teng-Hui Zhu	3e5fa29	2010-11-09 16:16:48 -0800	[diff] [blame]	261	i::CompleteParserRecorder log;
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	262	i::Scanner scanner(i::Isolate::Current()->unicode_cache());
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	263	scanner.Initialize(&stream);
				264
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	265	int flags = i::kAllowLazy \| i::kAllowNativesSyntax;
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	266	v8::preparser::PreParser::PreParseResult result =
				267	v8::preparser::PreParser::PreParseProgram(&scanner,
				268	&log,
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	269	flags,
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	270	stack_limit);
				271	CHECK_EQ(v8::preparser::PreParser::kPreParseSuccess, result);
Teng-Hui Zhu	3e5fa29	2010-11-09 16:16:48 -0800	[diff] [blame]	272	i::ScriptDataImpl data(log.ExtractData());
				273	CHECK(!data.has_error());
				274	}
				275	}
Shimeng (Simon) Wang	8a31eba	2010-12-06 19:01:33 -0800	[diff] [blame]	276
				277
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	278	TEST(StandAlonePreParserNoNatives) {
				279	v8::V8::Initialize();
				280
				281	int marker;
				282	i::Isolate::Current()->stack_guard()->SetStackLimit(
				283	reinterpret_cast<uintptr_t>(&marker) - 128 * 1024);
				284
				285	const char* programs[] = {
				286	"%ArgleBargle(glop);",
				287	"var x = %_IsSmi(42);",
				288	NULL
				289	};
				290
				291	uintptr_t stack_limit = i::Isolate::Current()->stack_guard()->real_climit();
				292	for (int i = 0; programs[i]; i++) {
				293	const char* program = programs[i];
				294	i::Utf8ToUtf16CharacterStream stream(
				295	reinterpret_cast<const i::byte*>(program),
				296	static_cast<unsigned>(strlen(program)));
				297	i::CompleteParserRecorder log;
				298	i::Scanner scanner(i::Isolate::Current()->unicode_cache());
				299	scanner.Initialize(&stream);
				300
				301	// Flags don't allow natives syntax.
				302	v8::preparser::PreParser::PreParseResult result =
				303	v8::preparser::PreParser::PreParseProgram(&scanner,
				304	&log,
				305	i::kAllowLazy,
				306	stack_limit);
				307	CHECK_EQ(v8::preparser::PreParser::kPreParseSuccess, result);
				308	i::ScriptDataImpl data(log.ExtractData());
				309	// Data contains syntax error.
				310	CHECK(data.has_error());
				311	}
				312	}
				313
				314
// Regression test for Chromium issue 62639.
// The program below fails parsing because an identifier is expected after
// "function". Before the fix, the parser didn't check *ok after
// Expect(Token::Identifier, ok), and then used the invalid currently scanned
// literal. This always failed in debug mode, and sometimes crashed in
// release mode.
TEST(RegressChromium62639) {
  v8::V8::Initialize();

  int marker;
  i::Isolate::Current()->stack_guard()->SetStackLimit(
      reinterpret_cast<uintptr_t>(&marker) - 128 * 1024);

  const char* program =
      "var x = 'something';\n"
      "escape: function() {}";
  const unsigned program_length = static_cast<unsigned>(strlen(program));

  i::Utf8ToUtf16CharacterStream stream(
      reinterpret_cast<const i::byte*>(program), program_length);
  i::ScriptDataImpl* data = i::ParserApi::PreParse(&stream, NULL, false);
  // Pre-parsing must report the syntax error.
  CHECK(data->HasError());
  delete data;
}
				337
				338
				339	TEST(Regress928) {
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	340	v8::V8::Initialize();
				341
Shimeng (Simon) Wang	8a31eba	2010-12-06 19:01:33 -0800	[diff] [blame]	342	// Preparsing didn't consider the catch clause of a try statement
				343	// as with-content, which made it assume that a function inside
				344	// the block could be lazily compiled, and an extra, unexpected,
				345	// entry was added to the data.
				346	int marker;
Ben Murdoch	8b112d2	2011-06-08 16:22:53 +0100	[diff] [blame]	347	i::Isolate::Current()->stack_guard()->SetStackLimit(
Shimeng (Simon) Wang	8a31eba	2010-12-06 19:01:33 -0800	[diff] [blame]	348	reinterpret_cast<uintptr_t>(&marker) - 128 * 1024);
				349
				350	const char* program =
				351	"try { } catch (e) { var foo = function () { /* first */ } }"
				352	"var bar = function () { /* second */ }";
				353
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	354	v8::HandleScope handles;
				355	i::Handle<i::String> source(
				356	FACTORY->NewStringFromAscii(i::CStrVector(program)));
				357	i::ScriptDataImpl* data = i::ParserApi::PartialPreParse(source, NULL, false);
Shimeng (Simon) Wang	8a31eba	2010-12-06 19:01:33 -0800	[diff] [blame]	358	CHECK(!data->HasError());
				359
				360	data->Initialize();
				361
Ben Murdoch	e0cee9b	2011-05-25 10:26:03 +0100	[diff] [blame]	362	int first_function =
				363	static_cast<int>(strstr(program, "function") - program);
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	364	int first_lbrace = first_function + i::StrLength("function () ");
Shimeng (Simon) Wang	8a31eba	2010-12-06 19:01:33 -0800	[diff] [blame]	365	CHECK_EQ('{', program[first_lbrace]);
				366	i::FunctionEntry entry1 = data->GetFunctionEntry(first_lbrace);
				367	CHECK(!entry1.is_valid());
				368
Ben Murdoch	e0cee9b	2011-05-25 10:26:03 +0100	[diff] [blame]	369	int second_function =
				370	static_cast<int>(strstr(program + first_lbrace, "function") - program);
				371	int second_lbrace =
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	372	second_function + i::StrLength("function () ");
Shimeng (Simon) Wang	8a31eba	2010-12-06 19:01:33 -0800	[diff] [blame]	373	CHECK_EQ('{', program[second_lbrace]);
				374	i::FunctionEntry entry2 = data->GetFunctionEntry(second_lbrace);
				375	CHECK(entry2.is_valid());
				376	CHECK_EQ('}', program[entry2.end_pos() - 1]);
				377	delete data;
				378	}
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	379
				380
				381	TEST(PreParseOverflow) {
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	382	v8::V8::Initialize();
				383
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	384	int marker;
Ben Murdoch	8b112d2	2011-06-08 16:22:53 +0100	[diff] [blame]	385	i::Isolate::Current()->stack_guard()->SetStackLimit(
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	386	reinterpret_cast<uintptr_t>(&marker) - 128 * 1024);
				387
				388	size_t kProgramSize = 1024 * 1024;
Ben Murdoch	589d697	2011-11-30 16:04:58 +0000	[diff] [blame]	389	i::SmartArrayPointer<char> program(
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	390	reinterpret_cast<char*>(malloc(kProgramSize + 1)));
				391	memset(*program, '(', kProgramSize);
				392	program[kProgramSize] = '\0';
				393
Ben Murdoch	8b112d2	2011-06-08 16:22:53 +0100	[diff] [blame]	394	uintptr_t stack_limit = i::Isolate::Current()->stack_guard()->real_climit();
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	395
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	396	i::Utf8ToUtf16CharacterStream stream(
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	397	reinterpret_cast<const i::byte>(program),
				398	static_cast<unsigned>(kProgramSize));
				399	i::CompleteParserRecorder log;
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	400	i::Scanner scanner(i::Isolate::Current()->unicode_cache());
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	401	scanner.Initialize(&stream);
				402
				403
				404	v8::preparser::PreParser::PreParseResult result =
				405	v8::preparser::PreParser::PreParseProgram(&scanner,
				406	&log,
				407	true,
				408	stack_limit);
				409	CHECK_EQ(v8::preparser::PreParser::kPreParseStackOverflow, result);
				410	}
				411
				412
				413	class TestExternalResource: public v8::String::ExternalStringResource {
				414	public:
				415	explicit TestExternalResource(uint16_t* data, int length)
				416	: data_(data), length_(static_cast<size_t>(length)) { }
				417
				418	~TestExternalResource() { }
				419
				420	const uint16_t* data() const {
				421	return data_;
				422	}
				423
				424	size_t length() const {
				425	return length_;
				426	}
				427	private:
				428	uint16_t* data_;
				429	size_t length_;
				430	};
				431
				432
				433	#define CHECK_EQU(v1, v2) CHECK_EQ(static_cast<int>(v1), static_cast<int>(v2))
				434
				435	void TestCharacterStream(const char* ascii_source,
				436	unsigned length,
				437	unsigned start = 0,
				438	unsigned end = 0) {
				439	if (end == 0) end = length;
				440	unsigned sub_length = end - start;
				441	i::HandleScope test_scope;
Ben Murdoch	589d697	2011-11-30 16:04:58 +0000	[diff] [blame]	442	i::SmartArrayPointer<i::uc16> uc16_buffer(new i::uc16[length]);
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	443	for (unsigned i = 0; i < length; i++) {
				444	uc16_buffer[i] = static_cast<i::uc16>(ascii_source[i]);
				445	}
				446	i::Vector<const char> ascii_vector(ascii_source, static_cast<int>(length));
				447	i::Handle<i::String> ascii_string(
Steve Block	44f0eee	2011-05-26 01:26:41 +0100	[diff] [blame]	448	FACTORY->NewStringFromAscii(ascii_vector));
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	449	TestExternalResource resource(*uc16_buffer, length);
				450	i::Handle<i::String> uc16_string(
Steve Block	44f0eee	2011-05-26 01:26:41 +0100	[diff] [blame]	451	FACTORY->NewExternalStringFromTwoByte(&resource));
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	452
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	453	i::ExternalTwoByteStringUtf16CharacterStream uc16_stream(
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	454	i::Handle<i::ExternalTwoByteString>::cast(uc16_string), start, end);
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	455	i::GenericStringUtf16CharacterStream string_stream(ascii_string, start, end);
				456	i::Utf8ToUtf16CharacterStream utf8_stream(
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	457	reinterpret_cast<const i::byte*>(ascii_source), end);
				458	utf8_stream.SeekForward(start);
				459
				460	unsigned i = start;
				461	while (i < end) {
				462	// Read streams one char at a time
				463	CHECK_EQU(i, uc16_stream.pos());
				464	CHECK_EQU(i, string_stream.pos());
				465	CHECK_EQU(i, utf8_stream.pos());
				466	int32_t c0 = ascii_source[i];
				467	int32_t c1 = uc16_stream.Advance();
				468	int32_t c2 = string_stream.Advance();
				469	int32_t c3 = utf8_stream.Advance();
				470	i++;
				471	CHECK_EQ(c0, c1);
				472	CHECK_EQ(c0, c2);
				473	CHECK_EQ(c0, c3);
				474	CHECK_EQU(i, uc16_stream.pos());
				475	CHECK_EQU(i, string_stream.pos());
				476	CHECK_EQU(i, utf8_stream.pos());
				477	}
				478	while (i > start + sub_length / 4) {
				479	// Pushback, re-read, pushback again.
				480	int32_t c0 = ascii_source[i - 1];
				481	CHECK_EQU(i, uc16_stream.pos());
				482	CHECK_EQU(i, string_stream.pos());
				483	CHECK_EQU(i, utf8_stream.pos());
				484	uc16_stream.PushBack(c0);
				485	string_stream.PushBack(c0);
				486	utf8_stream.PushBack(c0);
				487	i--;
				488	CHECK_EQU(i, uc16_stream.pos());
				489	CHECK_EQU(i, string_stream.pos());
				490	CHECK_EQU(i, utf8_stream.pos());
				491	int32_t c1 = uc16_stream.Advance();
				492	int32_t c2 = string_stream.Advance();
				493	int32_t c3 = utf8_stream.Advance();
				494	i++;
				495	CHECK_EQU(i, uc16_stream.pos());
				496	CHECK_EQU(i, string_stream.pos());
				497	CHECK_EQU(i, utf8_stream.pos());
				498	CHECK_EQ(c0, c1);
				499	CHECK_EQ(c0, c2);
				500	CHECK_EQ(c0, c3);
				501	uc16_stream.PushBack(c0);
				502	string_stream.PushBack(c0);
				503	utf8_stream.PushBack(c0);
				504	i--;
				505	CHECK_EQU(i, uc16_stream.pos());
				506	CHECK_EQU(i, string_stream.pos());
				507	CHECK_EQU(i, utf8_stream.pos());
				508	}
				509	unsigned halfway = start + sub_length / 2;
				510	uc16_stream.SeekForward(halfway - i);
				511	string_stream.SeekForward(halfway - i);
				512	utf8_stream.SeekForward(halfway - i);
				513	i = halfway;
				514	CHECK_EQU(i, uc16_stream.pos());
				515	CHECK_EQU(i, string_stream.pos());
				516	CHECK_EQU(i, utf8_stream.pos());
				517
				518	while (i < end) {
				519	// Read streams one char at a time
				520	CHECK_EQU(i, uc16_stream.pos());
				521	CHECK_EQU(i, string_stream.pos());
				522	CHECK_EQU(i, utf8_stream.pos());
				523	int32_t c0 = ascii_source[i];
				524	int32_t c1 = uc16_stream.Advance();
				525	int32_t c2 = string_stream.Advance();
				526	int32_t c3 = utf8_stream.Advance();
				527	i++;
				528	CHECK_EQ(c0, c1);
				529	CHECK_EQ(c0, c2);
				530	CHECK_EQ(c0, c3);
				531	CHECK_EQU(i, uc16_stream.pos());
				532	CHECK_EQU(i, string_stream.pos());
				533	CHECK_EQU(i, utf8_stream.pos());
				534	}
				535
				536	int32_t c1 = uc16_stream.Advance();
				537	int32_t c2 = string_stream.Advance();
				538	int32_t c3 = utf8_stream.Advance();
				539	CHECK_LT(c1, 0);
				540	CHECK_LT(c2, 0);
				541	CHECK_LT(c3, 0);
				542	}
				543
				544
				545	TEST(CharacterStreams) {
				546	v8::HandleScope handles;
				547	v8::Persistent<v8::Context> context = v8::Context::New();
				548	v8::Context::Scope context_scope(context);
				549
				550	TestCharacterStream("abc\0\n\r\x7f", 7);
				551	static const unsigned kBigStringSize = 4096;
				552	char buffer[kBigStringSize + 1];
				553	for (unsigned i = 0; i < kBigStringSize; i++) {
				554	buffer[i] = static_cast<char>(i & 0x7f);
				555	}
				556	TestCharacterStream(buffer, kBigStringSize);
				557
				558	TestCharacterStream(buffer, kBigStringSize, 576, 3298);
				559
				560	TestCharacterStream("\0", 1);
				561	TestCharacterStream("", 0);
				562	}
				563
				564
				565	TEST(Utf8CharacterStream) {
				566	static const unsigned kMaxUC16CharU = unibrow::Utf8::kMaxThreeByteChar;
				567	static const int kMaxUC16Char = static_cast<int>(kMaxUC16CharU);
				568
				569	static const int kAllUtf8CharsSize =
				570	(unibrow::Utf8::kMaxOneByteChar + 1) +
				571	(unibrow::Utf8::kMaxTwoByteChar - unibrow::Utf8::kMaxOneByteChar) * 2 +
				572	(unibrow::Utf8::kMaxThreeByteChar - unibrow::Utf8::kMaxTwoByteChar) * 3;
				573	static const unsigned kAllUtf8CharsSizeU =
				574	static_cast<unsigned>(kAllUtf8CharsSize);
				575
				576	char buffer[kAllUtf8CharsSizeU];
				577	unsigned cursor = 0;
				578	for (int i = 0; i <= kMaxUC16Char; i++) {
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	579	cursor += unibrow::Utf8::Encode(buffer + cursor,
				580	i,
				581	unibrow::Utf16::kNoPreviousCharacter);
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	582	}
				583	ASSERT(cursor == kAllUtf8CharsSizeU);
				584
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	585	i::Utf8ToUtf16CharacterStream stream(reinterpret_cast<const i::byte*>(buffer),
				586	kAllUtf8CharsSizeU);
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	587	for (int i = 0; i <= kMaxUC16Char; i++) {
				588	CHECK_EQU(i, stream.pos());
				589	int32_t c = stream.Advance();
				590	CHECK_EQ(i, c);
				591	CHECK_EQU(i + 1, stream.pos());
				592	}
				593	for (int i = kMaxUC16Char; i >= 0; i--) {
				594	CHECK_EQU(i + 1, stream.pos());
				595	stream.PushBack(i);
				596	CHECK_EQU(i, stream.pos());
				597	}
				598	int i = 0;
				599	while (stream.pos() < kMaxUC16CharU) {
				600	CHECK_EQU(i, stream.pos());
				601	unsigned progress = stream.SeekForward(12);
				602	i += progress;
				603	int32_t c = stream.Advance();
				604	if (i <= kMaxUC16Char) {
				605	CHECK_EQ(i, c);
				606	} else {
				607	CHECK_EQ(-1, c);
				608	}
				609	i += 1;
				610	CHECK_EQU(i, stream.pos());
				611	}
				612	}
				613
				614	#undef CHECK_EQU
				615
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	616	void TestStreamScanner(i::Utf16CharacterStream* stream,
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	617	i::Token::Value* expected_tokens,
				618	int skip_pos = 0, // Zero means not skipping.
				619	int skip_to = 0) {
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	620	i::Scanner scanner(i::Isolate::Current()->unicode_cache());
Steve Block	9fac840	2011-05-12 15:51:54 +0100	[diff] [blame]	621	scanner.Initialize(stream);
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	622
				623	int i = 0;
				624	do {
				625	i::Token::Value expected = expected_tokens[i];
				626	i::Token::Value actual = scanner.Next();
				627	CHECK_EQ(i::Token::String(expected), i::Token::String(actual));
				628	if (scanner.location().end_pos == skip_pos) {
				629	scanner.SeekForward(skip_to);
				630	}
				631	i++;
				632	} while (expected_tokens[i] != i::Token::ILLEGAL);
				633	}
				634
				635	TEST(StreamScanner) {
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	636	v8::V8::Initialize();
				637
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	638	const char* str1 = "{ foo get for : / <- \n\n /foo*/ bib";
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	639	i::Utf8ToUtf16CharacterStream stream1(reinterpret_cast<const i::byte*>(str1),
				640	static_cast<unsigned>(strlen(str1)));
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	641	i::Token::Value expectations1[] = {
				642	i::Token::LBRACE,
				643	i::Token::IDENTIFIER,
				644	i::Token::IDENTIFIER,
				645	i::Token::FOR,
				646	i::Token::COLON,
				647	i::Token::MUL,
				648	i::Token::DIV,
				649	i::Token::LT,
				650	i::Token::SUB,
				651	i::Token::IDENTIFIER,
				652	i::Token::EOS,
				653	i::Token::ILLEGAL
				654	};
				655	TestStreamScanner(&stream1, expectations1, 0, 0);
				656
				657	const char* str2 = "case default const {THIS\nPART\nSKIPPED} do";
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	658	i::Utf8ToUtf16CharacterStream stream2(reinterpret_cast<const i::byte*>(str2),
				659	static_cast<unsigned>(strlen(str2)));
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	660	i::Token::Value expectations2[] = {
				661	i::Token::CASE,
				662	i::Token::DEFAULT,
				663	i::Token::CONST,
				664	i::Token::LBRACE,
				665	// Skipped part here
				666	i::Token::RBRACE,
				667	i::Token::DO,
				668	i::Token::EOS,
				669	i::Token::ILLEGAL
				670	};
				671	ASSERT_EQ('{', str2[19]);
				672	ASSERT_EQ('}', str2[37]);
				673	TestStreamScanner(&stream2, expectations2, 20, 37);
				674
				675	const char* str3 = "{}}}}";
				676	i::Token::Value expectations3[] = {
				677	i::Token::LBRACE,
				678	i::Token::RBRACE,
				679	i::Token::RBRACE,
				680	i::Token::RBRACE,
				681	i::Token::RBRACE,
				682	i::Token::EOS,
				683	i::Token::ILLEGAL
				684	};
				685	// Skip zero-four RBRACEs.
				686	for (int i = 0; i <= 4; i++) {
				687	expectations3[6 - i] = i::Token::ILLEGAL;
				688	expectations3[5 - i] = i::Token::EOS;
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	689	i::Utf8ToUtf16CharacterStream stream3(
Ben Murdoch	b0fe162	2011-05-05 13:52:32 +0100	[diff] [blame]	690	reinterpret_cast<const i::byte*>(str3),
				691	static_cast<unsigned>(strlen(str3)));
				692	TestStreamScanner(&stream3, expectations3, 1, 1 + i);
				693	}
				694	}
Ben Murdoch	086aeea	2011-05-13 15:57:08 +0100	[diff] [blame]	695
				696
				697	void TestScanRegExp(const char* re_source, const char* expected) {
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	698	i::Utf8ToUtf16CharacterStream stream(
Ben Murdoch	086aeea	2011-05-13 15:57:08 +0100	[diff] [blame]	699	reinterpret_cast<const i::byte*>(re_source),
				700	static_cast<unsigned>(strlen(re_source)));
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	701	i::Scanner scanner(i::Isolate::Current()->unicode_cache());
Ben Murdoch	086aeea	2011-05-13 15:57:08 +0100	[diff] [blame]	702	scanner.Initialize(&stream);
				703
				704	i::Token::Value start = scanner.peek();
				705	CHECK(start == i::Token::DIV \|\| start == i::Token::ASSIGN_DIV);
				706	CHECK(scanner.ScanRegExpPattern(start == i::Token::ASSIGN_DIV));
				707	scanner.Next(); // Current token is now the regexp literal.
				708	CHECK(scanner.is_literal_ascii());
				709	i::Vector<const char> actual = scanner.literal_ascii_string();
				710	for (int i = 0; i < actual.length(); i++) {
				711	CHECK_NE('\0', expected[i]);
				712	CHECK_EQ(expected[i], actual[i]);
				713	}
				714	}
				715
				716
				717	TEST(RegExpScanning) {
Ben Murdoch	69a99ed	2011-11-30 16:03:39 +0000	[diff] [blame]	718	v8::V8::Initialize();
				719
Ben Murdoch	086aeea	2011-05-13 15:57:08 +0100	[diff] [blame]	720	// RegExp token with added garbage at the end. The scanner should only
				721	// scan the RegExp until the terminating slash just before "flipperwald".
				722	TestScanRegExp("/b/flipperwald", "b");
				723	// Incomplete escape sequences doesn't hide the terminating slash.
				724	TestScanRegExp("/\\x/flipperwald", "\\x");
				725	TestScanRegExp("/\\u/flipperwald", "\\u");
				726	TestScanRegExp("/\\u1/flipperwald", "\\u1");
				727	TestScanRegExp("/\\u12/flipperwald", "\\u12");
				728	TestScanRegExp("/\\u123/flipperwald", "\\u123");
				729	TestScanRegExp("/\\c/flipperwald", "\\c");
				730	TestScanRegExp("/\\c//flipperwald", "\\c");
				731	// Slashes inside character classes are not terminating.
				732	TestScanRegExp("/[/]/flipperwald", "[/]");
				733	TestScanRegExp("/[\\s-/]/flipperwald", "[\\s-/]");
				734	// Incomplete escape sequences inside a character class doesn't hide
				735	// the end of the character class.
				736	TestScanRegExp("/[\\c/]/flipperwald", "[\\c/]");
				737	TestScanRegExp("/[\\c]/flipperwald", "[\\c]");
				738	TestScanRegExp("/[\\x]/flipperwald", "[\\x]");
				739	TestScanRegExp("/[\\x1]/flipperwald", "[\\x1]");
				740	TestScanRegExp("/[\\u]/flipperwald", "[\\u]");
				741	TestScanRegExp("/[\\u1]/flipperwald", "[\\u1]");
				742	TestScanRegExp("/[\\u12]/flipperwald", "[\\u12]");
				743	TestScanRegExp("/[\\u123]/flipperwald", "[\\u123]");
				744	// Escaped ']'s wont end the character class.
				745	TestScanRegExp("/[\\]/]/flipperwald", "[\\]/]");
				746	// Escaped slashes are not terminating.
				747	TestScanRegExp("/\\//flipperwald", "\\/");
				748	// Starting with '=' works too.
				749	TestScanRegExp("/=/", "=");
				750	TestScanRegExp("/=?/", "=?");
				751	}
Ben Murdoch	692be65	2012-01-10 18:47:50 +0000	[diff] [blame]	752
				753
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	754	static int Utf8LengthHelper(const char* s) {
				755	int len = i::StrLength(s);
				756	int character_length = len;
				757	for (int i = 0; i < len; i++) {
				758	unsigned char c = s[i];
				759	int input_offset = 0;
				760	int output_adjust = 0;
				761	if (c > 0x7f) {
				762	if (c < 0xc0) continue;
				763	if (c >= 0xf0) {
				764	if (c >= 0xf8) {
				765	// 5 and 6 byte UTF-8 sequences turn into a kBadChar for each UTF-8
				766	// byte.
				767	continue; // Handle first UTF-8 byte.
				768	}
				769	if ((c & 7) == 0 && ((s[i + 1] & 0x30) == 0)) {
				770	// This 4 byte sequence could have been coded as a 3 byte sequence.
				771	// Record a single kBadChar for the first byte and continue.
				772	continue;
				773	}
				774	input_offset = 3;
				775	// 4 bytes of UTF-8 turn into 2 UTF-16 code units.
				776	character_length -= 2;
				777	} else if (c >= 0xe0) {
				778	if ((c & 0xf) == 0 && ((s[i + 1] & 0x20) == 0)) {
				779	// This 3 byte sequence could have been coded as a 2 byte sequence.
				780	// Record a single kBadChar for the first byte and continue.
				781	continue;
				782	}
				783	input_offset = 2;
				784	// 3 bytes of UTF-8 turn into 1 UTF-16 code unit.
				785	output_adjust = 2;
				786	} else {
				787	if ((c & 0x1e) == 0) {
				788	// This 2 byte sequence could have been coded as a 1 byte sequence.
				789	// Record a single kBadChar for the first byte and continue.
				790	continue;
				791	}
				792	input_offset = 1;
				793	// 2 bytes of UTF-8 turn into 1 UTF-16 code unit.
				794	output_adjust = 1;
				795	}
				796	bool bad = false;
				797	for (int j = 1; j <= input_offset; j++) {
				798	if ((s[i + j] & 0xc0) != 0x80) {
				799	// Bad UTF-8 sequence turns the first in the sequence into kBadChar,
				800	// which is a single UTF-16 code unit.
				801	bad = true;
				802	break;
				803	}
				804	}
				805	if (!bad) {
				806	i += input_offset;
				807	character_length -= output_adjust;
				808	}
				809	}
				810	}
				811	return character_length;
				812	}
				813
				814
				815	TEST(ScopePositions) {
				816	// Test the parser for correctly setting the start and end positions
				817	// of a scope. We check the scope positions of exactly one scope
				818	// nested in the global scope of a program. 'inner source' is the
				819	// source code that determines the part of the source belonging
				820	// to the nested scope. 'outer_prefix' and 'outer_suffix' are
				821	// parts of the source that belong to the global scope.
				822	struct SourceData {
				823	const char* outer_prefix;
				824	const char* inner_source;
				825	const char* outer_suffix;
				826	i::ScopeType scope_type;
				827	i::LanguageMode language_mode;
				828	};
				829
				830	const SourceData source_data[] = {
				831	{ " with ({}) ", "{ block; }", " more;", i::WITH_SCOPE, i::CLASSIC_MODE },
				832	{ " with ({}) ", "{ block; }", "; more;", i::WITH_SCOPE, i::CLASSIC_MODE },
				833	{ " with ({}) ", "{\n"
				834	" block;\n"
				835	" }", "\n"
				836	" more;", i::WITH_SCOPE, i::CLASSIC_MODE },
				837	{ " with ({}) ", "statement;", " more;", i::WITH_SCOPE, i::CLASSIC_MODE },
				838	{ " with ({}) ", "statement", "\n"
				839	" more;", i::WITH_SCOPE, i::CLASSIC_MODE },
				840	{ " with ({})\n"
				841	" ", "statement;", "\n"
				842	" more;", i::WITH_SCOPE, i::CLASSIC_MODE },
				843	{ " try {} catch ", "(e) { block; }", " more;",
				844	i::CATCH_SCOPE, i::CLASSIC_MODE },
				845	{ " try {} catch ", "(e) { block; }", "; more;",
				846	i::CATCH_SCOPE, i::CLASSIC_MODE },
				847	{ " try {} catch ", "(e) {\n"
				848	" block;\n"
				849	" }", "\n"
				850	" more;", i::CATCH_SCOPE, i::CLASSIC_MODE },
				851	{ " try {} catch ", "(e) { block; }", " finally { block; } more;",
				852	i::CATCH_SCOPE, i::CLASSIC_MODE },
				853	{ " start;\n"
				854	" ", "{ let block; }", " more;", i::BLOCK_SCOPE, i::EXTENDED_MODE },
				855	{ " start;\n"
				856	" ", "{ let block; }", "; more;", i::BLOCK_SCOPE, i::EXTENDED_MODE },
				857	{ " start;\n"
				858	" ", "{\n"
				859	" let block;\n"
				860	" }", "\n"
				861	" more;", i::BLOCK_SCOPE, i::EXTENDED_MODE },
				862	{ " start;\n"
				863	" function fun", "(a,b) { infunction; }", " more;",
				864	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				865	{ " start;\n"
				866	" function fun", "(a,b) {\n"
				867	" infunction;\n"
				868	" }", "\n"
				869	" more;", i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				870	{ " (function fun", "(a,b) { infunction; }", ")();",
				871	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				872	{ " for ", "(let x = 1 ; x < 10; ++ x) { block; }", " more;",
				873	i::BLOCK_SCOPE, i::EXTENDED_MODE },
				874	{ " for ", "(let x = 1 ; x < 10; ++ x) { block; }", "; more;",
				875	i::BLOCK_SCOPE, i::EXTENDED_MODE },
				876	{ " for ", "(let x = 1 ; x < 10; ++ x) {\n"
				877	" block;\n"
				878	" }", "\n"
				879	" more;", i::BLOCK_SCOPE, i::EXTENDED_MODE },
				880	{ " for ", "(let x = 1 ; x < 10; ++ x) statement;", " more;",
				881	i::BLOCK_SCOPE, i::EXTENDED_MODE },
				882	{ " for ", "(let x = 1 ; x < 10; ++ x) statement", "\n"
				883	" more;", i::BLOCK_SCOPE, i::EXTENDED_MODE },
				884	{ " for ", "(let x = 1 ; x < 10; ++ x)\n"
				885	" statement;", "\n"
				886	" more;", i::BLOCK_SCOPE, i::EXTENDED_MODE },
				887	{ " for ", "(let x in {}) { block; }", " more;",
				888	i::BLOCK_SCOPE, i::EXTENDED_MODE },
				889	{ " for ", "(let x in {}) { block; }", "; more;",
				890	i::BLOCK_SCOPE, i::EXTENDED_MODE },
				891	{ " for ", "(let x in {}) {\n"
				892	" block;\n"
				893	" }", "\n"
				894	" more;", i::BLOCK_SCOPE, i::EXTENDED_MODE },
				895	{ " for ", "(let x in {}) statement;", " more;",
				896	i::BLOCK_SCOPE, i::EXTENDED_MODE },
				897	{ " for ", "(let x in {}) statement", "\n"
				898	" more;", i::BLOCK_SCOPE, i::EXTENDED_MODE },
				899	{ " for ", "(let x in {})\n"
				900	" statement;", "\n"
				901	" more;", i::BLOCK_SCOPE, i::EXTENDED_MODE },
				902	// Check that 6-byte and 4-byte encodings of UTF-8 strings do not throw
				903	// the preparser off in terms of byte offsets.
				904	// 6 byte encoding.
				905	{ " 'foo\355\240\201\355\260\211';\n"
				906	" (function fun", "(a,b) { infunction; }", ")();",
				907	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				908	// 4 byte encoding.
				909	{ " 'foo\360\220\220\212';\n"
				910	" (function fun", "(a,b) { infunction; }", ")();",
				911	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				912	// 3 byte encoding of \u0fff.
				913	{ " 'foo\340\277\277';\n"
				914	" (function fun", "(a,b) { infunction; }", ")();",
				915	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				916	// Broken 6 byte encoding with missing last byte.
				917	{ " 'foo\355\240\201\355\211';\n"
				918	" (function fun", "(a,b) { infunction; }", ")();",
				919	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				920	// Broken 3 byte encoding of \u0fff with missing last byte.
				921	{ " 'foo\340\277';\n"
				922	" (function fun", "(a,b) { infunction; }", ")();",
				923	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				924	// Broken 3 byte encoding of \u0fff with missing 2 last bytes.
				925	{ " 'foo\340';\n"
				926	" (function fun", "(a,b) { infunction; }", ")();",
				927	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				928	// Broken 3 byte encoding of \u00ff should be a 2 byte encoding.
				929	{ " 'foo\340\203\277';\n"
				930	" (function fun", "(a,b) { infunction; }", ")();",
				931	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				932	// Broken 3 byte encoding of \u007f should be a 2 byte encoding.
				933	{ " 'foo\340\201\277';\n"
				934	" (function fun", "(a,b) { infunction; }", ")();",
				935	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				936	// Unpaired lead surrogate.
				937	{ " 'foo\355\240\201';\n"
				938	" (function fun", "(a,b) { infunction; }", ")();",
				939	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				940	// Unpaired lead surrogate where following code point is a 3 byte sequence.
				941	{ " 'foo\355\240\201\340\277\277';\n"
				942	" (function fun", "(a,b) { infunction; }", ")();",
				943	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				944	// Unpaired lead surrogate where following code point is a 4 byte encoding
				945	// of a trail surrogate.
				946	{ " 'foo\355\240\201\360\215\260\211';\n"
				947	" (function fun", "(a,b) { infunction; }", ")();",
				948	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				949	// Unpaired trail surrogate.
				950	{ " 'foo\355\260\211';\n"
				951	" (function fun", "(a,b) { infunction; }", ")();",
				952	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				953	// 2 byte encoding of \u00ff.
				954	{ " 'foo\303\277';\n"
				955	" (function fun", "(a,b) { infunction; }", ")();",
				956	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				957	// Broken 2 byte encoding of \u00ff with missing last byte.
				958	{ " 'foo\303';\n"
				959	" (function fun", "(a,b) { infunction; }", ")();",
				960	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				961	// Broken 2 byte encoding of \u007f should be a 1 byte encoding.
				962	{ " 'foo\301\277';\n"
				963	" (function fun", "(a,b) { infunction; }", ")();",
				964	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				965	// Illegal 5 byte encoding.
				966	{ " 'foo\370\277\277\277\277';\n"
				967	" (function fun", "(a,b) { infunction; }", ")();",
				968	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				969	// Illegal 6 byte encoding.
				970	{ " 'foo\374\277\277\277\277\277';\n"
				971	" (function fun", "(a,b) { infunction; }", ")();",
				972	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				973	// Illegal 0xfe byte
				974	{ " 'foo\376\277\277\277\277\277\277';\n"
				975	" (function fun", "(a,b) { infunction; }", ")();",
				976	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				977	// Illegal 0xff byte
				978	{ " 'foo\377\277\277\277\277\277\277\277';\n"
				979	" (function fun", "(a,b) { infunction; }", ")();",
				980	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				981	{ " 'foo';\n"
				982	" (function fun", "(a,b) { 'bar\355\240\201\355\260\213'; }", ")();",
				983	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				984	{ " 'foo';\n"
				985	" (function fun", "(a,b) { 'bar\360\220\220\214'; }", ")();",
				986	i::FUNCTION_SCOPE, i::CLASSIC_MODE },
				987	{ NULL, NULL, NULL, i::EVAL_SCOPE, i::CLASSIC_MODE }
				988	};
				989
				990	v8::HandleScope handles;
				991	v8::Persistent<v8::Context> context = v8::Context::New();
				992	v8::Context::Scope context_scope(context);
				993
				994	int marker;
				995	i::Isolate::Current()->stack_guard()->SetStackLimit(
				996	reinterpret_cast<uintptr_t>(&marker) - 128 * 1024);
				997	i::FLAG_harmony_scoping = true;
				998
				999	for (int i = 0; source_data[i].outer_prefix; i++) {
				1000	int kPrefixLen = Utf8LengthHelper(source_data[i].outer_prefix);
				1001	int kInnerLen = Utf8LengthHelper(source_data[i].inner_source);
				1002	int kSuffixLen = Utf8LengthHelper(source_data[i].outer_suffix);
				1003	int kPrefixByteLen = i::StrLength(source_data[i].outer_prefix);
				1004	int kInnerByteLen = i::StrLength(source_data[i].inner_source);
				1005	int kSuffixByteLen = i::StrLength(source_data[i].outer_suffix);
				1006	int kProgramSize = kPrefixLen + kInnerLen + kSuffixLen;
				1007	int kProgramByteSize = kPrefixByteLen + kInnerByteLen + kSuffixByteLen;
				1008	i::Vector<char> program = i::Vector<char>::New(kProgramByteSize + 1);
				1009	i::OS::SNPrintF(program, "%s%s%s",
				1010	source_data[i].outer_prefix,
				1011	source_data[i].inner_source,
				1012	source_data[i].outer_suffix);
				1013
				1014	// Parse program source.
				1015	i::Handle<i::String> source(
				1016	FACTORY->NewStringFromUtf8(i::CStrVector(program.start())));
				1017	CHECK_EQ(source->length(), kProgramSize);
				1018	i::Handle<i::Script> script = FACTORY->NewScript(source);
				1019	i::Parser parser(script, i::kAllowLazy \| i::EXTENDED_MODE, NULL, NULL);
				1020	i::CompilationInfo info(script);
				1021	info.MarkAsGlobal();
				1022	info.SetLanguageMode(source_data[i].language_mode);
				1023	i::FunctionLiteral* function = parser.ParseProgram(&info);
				1024	CHECK(function != NULL);
				1025
				1026	// Check scope types and positions.
				1027	i::Scope* scope = function->scope();
				1028	CHECK(scope->is_global_scope());
				1029	CHECK_EQ(scope->start_position(), 0);
				1030	CHECK_EQ(scope->end_position(), kProgramSize);
				1031	CHECK_EQ(scope->inner_scopes()->length(), 1);
				1032
				1033	i::Scope* inner_scope = scope->inner_scopes()->at(0);
				1034	CHECK_EQ(inner_scope->type(), source_data[i].scope_type);
				1035	CHECK_EQ(inner_scope->start_position(), kPrefixLen);
				1036	// The end position of a token is one position after the last
				1037	// character belonging to that token.
				1038	CHECK_EQ(inner_scope->end_position(), kPrefixLen + kInnerLen);
				1039	}
				1040	}
				1041
				1042
				1043	void TestParserSync(i::Handle<i::String> source, int flags) {
Ben Murdoch	692be65	2012-01-10 18:47:50 +0000	[diff] [blame]	1044	uintptr_t stack_limit = i::Isolate::Current()->stack_guard()->real_climit();
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	1045	bool harmony_scoping = ((i::kLanguageModeMask & flags) == i::EXTENDED_MODE);
Ben Murdoch	692be65	2012-01-10 18:47:50 +0000	[diff] [blame]	1046
				1047	// Preparse the data.
				1048	i::CompleteParserRecorder log;
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	1049	i::Scanner scanner(i::Isolate::Current()->unicode_cache());
				1050	i::GenericStringUtf16CharacterStream stream(source, 0, source->length());
				1051	scanner.SetHarmonyScoping(harmony_scoping);
Ben Murdoch	692be65	2012-01-10 18:47:50 +0000	[diff] [blame]	1052	scanner.Initialize(&stream);
				1053	v8::preparser::PreParser::PreParseResult result =
				1054	v8::preparser::PreParser::PreParseProgram(
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	1055	&scanner, &log, flags, stack_limit);
Ben Murdoch	692be65	2012-01-10 18:47:50 +0000	[diff] [blame]	1056	CHECK_EQ(v8::preparser::PreParser::kPreParseSuccess, result);
				1057	i::ScriptDataImpl data(log.ExtractData());
				1058
				1059	// Parse the data
				1060	i::Handle<i::Script> script = FACTORY->NewScript(source);
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	1061	bool save_harmony_scoping = i::FLAG_harmony_scoping;
				1062	i::FLAG_harmony_scoping = harmony_scoping;
				1063	i::Parser parser(script, flags, NULL, NULL);
				1064	i::CompilationInfo info(script);
				1065	info.MarkAsGlobal();
				1066	i::FunctionLiteral* function = parser.ParseProgram(&info);
				1067	i::FLAG_harmony_scoping = save_harmony_scoping;
Ben Murdoch	692be65	2012-01-10 18:47:50 +0000	[diff] [blame]	1068
				1069	i::String* type_string = NULL;
				1070	if (function == NULL) {
				1071	// Extract exception from the parser.
				1072	i::Handle<i::String> type_symbol = FACTORY->LookupAsciiSymbol("type");
				1073	CHECK(i::Isolate::Current()->has_pending_exception());
				1074	i::MaybeObject* maybe_object = i::Isolate::Current()->pending_exception();
				1075	i::JSObject* exception = NULL;
				1076	CHECK(maybe_object->To(&exception));
				1077
				1078	// Get the type string.
				1079	maybe_object = exception->GetProperty(*type_symbol);
				1080	CHECK(maybe_object->To(&type_string));
				1081	}
				1082
				1083	// Check that preparsing fails iff parsing fails.
				1084	if (data.has_error() && function != NULL) {
				1085	i::OS::Print(
				1086	"Preparser failed on:\n"
				1087	"\t%s\n"
				1088	"with error:\n"
				1089	"\t%s\n"
				1090	"However, the parser succeeded",
				1091	*source->ToCString(), data.BuildMessage());
				1092	CHECK(false);
				1093	} else if (!data.has_error() && function == NULL) {
				1094	i::OS::Print(
				1095	"Parser failed on:\n"
				1096	"\t%s\n"
				1097	"with error:\n"
				1098	"\t%s\n"
				1099	"However, the preparser succeeded",
				1100	source->ToCString(), type_string->ToCString());
				1101	CHECK(false);
				1102	}
				1103
				1104	// Check that preparser and parser produce the same error.
				1105	if (function == NULL) {
				1106	if (!type_string->IsEqualTo(i::CStrVector(data.BuildMessage()))) {
				1107	i::OS::Print(
				1108	"Expected parser and preparser to produce the same error on:\n"
				1109	"\t%s\n"
				1110	"However, found the following error messages\n"
				1111	"\tparser: %s\n"
				1112	"\tpreparser: %s\n",
				1113	source->ToCString(), type_string->ToCString(), data.BuildMessage());
				1114	CHECK(false);
				1115	}
				1116	}
				1117	}
				1118
				1119
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	1120	void TestParserSyncWithFlags(i::Handle<i::String> source) {
				1121	static const int kFlagsCount = 6;
				1122	const int flags[kFlagsCount] = {
				1123	i::kNoParsingFlags \| i::CLASSIC_MODE,
				1124	i::kNoParsingFlags \| i::STRICT_MODE,
				1125	i::kNoParsingFlags \| i::EXTENDED_MODE,
				1126	i::kAllowLazy \| i::CLASSIC_MODE,
				1127	i::kAllowLazy \| i::STRICT_MODE,
				1128	i::kAllowLazy \| i::EXTENDED_MODE
				1129	};
				1130
				1131	for (int k = 0; k < kFlagsCount; ++k) {
				1132	TestParserSync(source, flags[k]);
				1133	}
				1134	}
				1135
				1136
Ben Murdoch	692be65	2012-01-10 18:47:50 +0000	[diff] [blame]	1137	TEST(ParserSync) {
				1138	const char* context_data[][2] = {
				1139	{ "", "" },
				1140	{ "{", "}" },
				1141	{ "if (true) ", " else {}" },
				1142	{ "if (true) {} else ", "" },
				1143	{ "if (true) ", "" },
				1144	{ "do ", " while (false)" },
				1145	{ "while (false) ", "" },
				1146	{ "for (;;) ", "" },
				1147	{ "with ({})", "" },
				1148	{ "switch (12) { case 12: ", "}" },
				1149	{ "switch (12) { default: ", "}" },
				1150	{ "label2: ", "" },
				1151	{ NULL, NULL }
				1152	};
				1153
				1154	const char* statement_data[] = {
				1155	"{}",
				1156	"var x",
				1157	"var x = 1",
				1158	"const x",
				1159	"const x = 1",
				1160	";",
				1161	"12",
				1162	"if (false) {} else ;",
				1163	"if (false) {} else {}",
				1164	"if (false) {} else 12",
				1165	"if (false) ;"
				1166	"if (false) {}",
				1167	"if (false) 12",
				1168	"do {} while (false)",
				1169	"for (;;) ;",
				1170	"for (;;) {}",
				1171	"for (;;) 12",
				1172	"continue",
				1173	"continue label",
				1174	"continue\nlabel",
				1175	"break",
				1176	"break label",
				1177	"break\nlabel",
				1178	"return",
				1179	"return 12",
				1180	"return\n12",
				1181	"with ({}) ;",
				1182	"with ({}) {}",
				1183	"with ({}) 12",
				1184	"switch ({}) { default: }"
				1185	"label3: "
				1186	"throw",
				1187	"throw 12",
				1188	"throw\n12",
				1189	"try {} catch(e) {}",
				1190	"try {} finally {}",
				1191	"try {} catch(e) {} finally {}",
				1192	"debugger",
				1193	NULL
				1194	};
				1195
				1196	const char* termination_data[] = {
				1197	"",
				1198	";",
				1199	"\n",
				1200	";\n",
				1201	"\n;",
				1202	NULL
				1203	};
				1204
				1205	v8::HandleScope handles;
				1206	v8::Persistent<v8::Context> context = v8::Context::New();
				1207	v8::Context::Scope context_scope(context);
				1208
				1209	int marker;
				1210	i::Isolate::Current()->stack_guard()->SetStackLimit(
				1211	reinterpret_cast<uintptr_t>(&marker) - 128 * 1024);
				1212
				1213	for (int i = 0; context_data[i][0] != NULL; ++i) {
				1214	for (int j = 0; statement_data[j] != NULL; ++j) {
				1215	for (int k = 0; termination_data[k] != NULL; ++k) {
				1216	int kPrefixLen = i::StrLength(context_data[i][0]);
				1217	int kStatementLen = i::StrLength(statement_data[j]);
				1218	int kTerminationLen = i::StrLength(termination_data[k]);
				1219	int kSuffixLen = i::StrLength(context_data[i][1]);
				1220	int kProgramSize = kPrefixLen + kStatementLen + kTerminationLen
				1221	+ kSuffixLen + i::StrLength("label: for (;;) { }");
				1222
				1223	// Plug the source code pieces together.
				1224	i::Vector<char> program = i::Vector<char>::New(kProgramSize + 1);
				1225	int length = i::OS::SNPrintF(program,
				1226	"label: for (;;) { %s%s%s%s }",
				1227	context_data[i][0],
				1228	statement_data[j],
				1229	termination_data[k],
				1230	context_data[i][1]);
				1231	CHECK(length == kProgramSize);
				1232	i::Handle<i::String> source =
				1233	FACTORY->NewStringFromAscii(i::CStrVector(program.start()));
Ben Murdoch	3ef787d	2012-04-12 10:51:47 +0100	[diff] [blame^]	1234	TestParserSyncWithFlags(source);
Ben Murdoch	692be65	2012-01-10 18:47:50 +0000	[diff] [blame]	1235	}
				1236	}
				1237	}
				1238	}