blob: 850169945815c2bebe93eaed91d9da48e57ff03a [file] [log] [blame]
Ben Murdochb8a8cc12014-11-26 15:28:44 +00001// Copyright 2012 the V8 project authors. All rights reserved.
2// Redistribution and use in source and binary forms, with or without
3// modification, are permitted provided that the following conditions are
4// met:
5//
6// * Redistributions of source code must retain the above copyright
7// notice, this list of conditions and the following disclaimer.
8// * Redistributions in binary form must reproduce the above
9// copyright notice, this list of conditions and the following
10// disclaimer in the documentation and/or other materials provided
11// with the distribution.
12// * Neither the name of Google Inc. nor the names of its
13// contributors may be used to endorse or promote products derived
14// from this software without specific prior written permission.
15//
16// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
17// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
18// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
19// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
20// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
21// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
22// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
26// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27
28
29// Test that an optional capture is cleared between two matches.
30var str = "ABX X";
31str = str.replace(/(\w)?X/g, function(match, capture) {
32 assertTrue(match.indexOf(capture) >= 0 ||
33 capture === undefined);
34 return capture ? capture.toLowerCase() : "-";
35 });
36assertEquals("Ab -", str);
37
38// Test zero-length matches.
39str = "Als Gregor Samsa eines Morgens";
40str = str.replace(/\b/g, function(match, capture) {
41 return "/";
42 });
43assertEquals("/Als/ /Gregor/ /Samsa/ /eines/ /Morgens/", str);
44
45// Test zero-length matches that have non-zero-length sub-captures.
46str = "It was a pleasure to burn.";
47str = str.replace(/(?=(\w+))\b/g, function(match, capture) {
48 return capture.length;
49 });
50assertEquals("2It 3was 1a 8pleasure 2to 4burn.", str);
51
52// Test multiple captures.
53str = "Try not. Do, or do not. There is no try.";
54str = str.replace(/(not?)|(do)|(try)/gi,
55 function(match, c1, c2, c3) {
56 assertTrue((c1 === undefined && c2 === undefined) ||
57 (c2 === undefined && c3 === undefined) ||
58 (c1 === undefined && c3 === undefined));
59 if (c1) return "-";
60 if (c2) return "+";
61 if (c3) return "="
62 });
63assertEquals("= -. +, or + -. There is - =.", str);
64
65// Test multiple alternate captures.
66str = "FOUR LEGS GOOD, TWO LEGS BAD!";
67str = str.replace(/(FOUR|TWO) LEGS (GOOD|BAD)/g,
68 function(match, num_legs, likeability) {
69 assertTrue(num_legs !== undefined);
70 assertTrue(likeability !== undefined);
71 if (num_legs == "FOUR") assertTrue(likeability == "GOOD");
72 if (num_legs == "TWO") assertTrue(likeability == "BAD");
73 return match.length - 10;
74 });
75assertEquals("4, 2!", str);
76
77
78// The same tests with UC16.
79
80//Test that an optional capture is cleared between two matches.
81str = "AB\u1234 \u1234";
82str = str.replace(/(\w)?\u1234/g,
83 function(match, capture) {
84 assertTrue(match.indexOf(capture) >= 0 ||
85 capture === undefined);
86 return capture ? capture.toLowerCase() : "-";
87 });
88assertEquals("Ab -", str);
89
90// Test zero-length matches.
91str = "Als \u2623\u2642 eines Morgens";
92str = str.replace(/\b/g, function(match, capture) {
93 return "/";
94 });
95assertEquals("/Als/ \u2623\u2642 /eines/ /Morgens/", str);
96
97// Test zero-length matches that have non-zero-length sub-captures.
98str = "It was a pleasure to \u70e7.";
99str = str.replace(/(?=(\w+))\b/g, function(match, capture) {
100 return capture.length;
101 });
102assertEquals("2It 3was 1a 8pleasure 2to \u70e7.", str);
103
104// Test multiple captures.
105str = "Try not. D\u26aa, or d\u26aa not. There is no try.";
106str = str.replace(/(not?)|(d\u26aa)|(try)/gi,
107 function(match, c1, c2, c3) {
108 assertTrue((c1 === undefined && c2 === undefined) ||
109 (c2 === undefined && c3 === undefined) ||
110 (c1 === undefined && c3 === undefined));
111 if (c1) return "-";
112 if (c2) return "+";
113 if (c3) return "="
114 });
115assertEquals("= -. +, or + -. There is - =.", str);
116
117// Test multiple alternate captures.
118str = "FOUR \u817f GOOD, TWO \u817f BAD!";
119str = str.replace(/(FOUR|TWO) \u817f (GOOD|BAD)/g,
120 function(match, num_legs, likeability) {
121 assertTrue(num_legs !== undefined);
122 assertTrue(likeability !== undefined);
123 if (num_legs == "FOUR") assertTrue(likeability == "GOOD");
124 if (num_legs == "TWO") assertTrue(likeability == "BAD");
125 return match.length - 7;
126 });
127assertEquals("4, 2!", str);
128
129// Test capture that is a real substring.
130var str = "Beasts of England, beasts of Ireland";
131str = str.replace(/(.*)/g, function(match) { return '~'; });
132assertEquals("~~", str);
133
134// Test zero-length matches that have non-zero-length sub-captures that do not
135// start at the match start position.
136str = "up up up up";
137str = str.replace(/\b(?=u(p))/g, function(match, capture) {
138 return capture.length;
139 });
140
141assertEquals("1up 1up 1up 1up", str);
142
143
144// Create regexp that has a *lot* of captures.
145var re_string = "(a)";
146for (var i = 0; i < 500; i++) {
147 re_string = "(" + re_string + ")";
148}
149re_string = re_string + "1";
150// re_string = "(((...((a))...)))1"
151
152var regexps = new Array();
153var last_match_expectations = new Array();
154var first_capture_expectations = new Array();
155
156// Atomic regexp.
157regexps.push(/a1/g);
158last_match_expectations.push("a1");
159first_capture_expectations.push("");
160// Small regexp (no capture);
161regexps.push(/\w1/g);
162last_match_expectations.push("a1");
163first_capture_expectations.push("");
164// Small regexp (one capture).
165regexps.push(/(a)1/g);
166last_match_expectations.push("a1");
167first_capture_expectations.push("a");
168// Large regexp (a lot of captures).
169regexps.push(new RegExp(re_string, "g"));
170last_match_expectations.push("a1");
171first_capture_expectations.push("a");
172
173function test_replace(result_expectation,
174 subject,
175 regexp,
176 replacement) {
177 for (var i = 0; i < regexps.length; i++) {
178 // Overwrite last match info.
179 "deadbeef".replace(/(dead)beef/, "$1holeycow");
180 // Conduct tests.
181 assertEquals(result_expectation, subject.replace(regexps[i], replacement));
182 if (subject.length == 0) {
183 assertEquals("deadbeef", RegExp.lastMatch);
184 assertEquals("dead", RegExp["$1"]);
185 } else {
186 assertEquals(last_match_expectations[i], RegExp.lastMatch);
187 assertEquals(first_capture_expectations[i], RegExp["$1"]);
188 }
189 }
190}
191
192
193function test_match(result_expectation,
194 subject,
195 regexp) {
196 for (var i = 0; i < regexps.length; i++) {
197 // Overwrite last match info.
198 "deadbeef".replace(/(dead)beef/, "$1holeycow");
199 // Conduct tests.
200 if (result_expectation == null) {
201 assertNull(subject.match(regexps[i]));
202 } else {
203 assertArrayEquals(result_expectation, subject.match(regexps[i]));
204 }
205 if (subject.length == 0) {
206 assertEquals("deadbeef", RegExp.lastMatch);
207 assertEquals("dead", RegExp["$1"]);
208 } else {
209 assertEquals(last_match_expectations[i], RegExp.lastMatch);
210 assertEquals(first_capture_expectations[i], RegExp["$1"]);
211 }
212 }
213}
214
215
216// Test for different number of matches.
217for (var m = 0; m < 33; m++) {
218 // Create string that matches m times.
219 var subject = "";
220 var test_1_expectation = "";
221 var test_2_expectation = "";
222 var test_3_expectation = (m == 0) ? null : new Array();
223 for (var i = 0; i < m; i++) {
224 subject += "a11";
225 test_1_expectation += "x1";
226 test_2_expectation += "1";
227 test_3_expectation.push("a1");
228 }
229
230 // Test 1a: String.replace with string.
231 test_replace(test_1_expectation, subject, /a1/g, "x");
232
233 // Test 1b: String.replace with function.
234 function f() { return "x"; }
235 test_replace(test_1_expectation, subject, /a1/g, f);
236
237 // Test 2a: String.replace with empty string.
238 test_replace(test_2_expectation, subject, /a1/g, "");
239
240 // Test 3a: String.match.
241 test_match(test_3_expectation, subject, /a1/g);
242}
243
244
245// Test String hashing (compiling regular expression includes hashing).
246var crosscheck = "\x80";
247for (var i = 0; i < 12; i++) crosscheck += crosscheck;
248new RegExp(crosscheck);
249
250var subject = "ascii~only~string~here~";
251var replacement = "\x80";
252var result = subject.replace(/~/g, replacement);
253for (var i = 0; i < 5; i++) result += result;
254new RegExp(result);