erik.corry@gmail.com | bbceb57 | 2012-03-09 10:52:05 +0000 | [diff] [blame] | 1 | // Copyright 2012 the V8 project authors. All rights reserved. |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 2 | // Redistribution and use in source and binary forms, with or without |
| 3 | // modification, are permitted provided that the following conditions are |
| 4 | // met: |
| 5 | // |
| 6 | // * Redistributions of source code must retain the above copyright |
| 7 | // notice, this list of conditions and the following disclaimer. |
| 8 | // * Redistributions in binary form must reproduce the above |
| 9 | // copyright notice, this list of conditions and the following |
| 10 | // disclaimer in the documentation and/or other materials provided |
| 11 | // with the distribution. |
| 12 | // * Neither the name of Google Inc. nor the names of its |
| 13 | // contributors may be used to endorse or promote products derived |
| 14 | // from this software without specific prior written permission. |
| 15 | // |
| 16 | // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| 17 | // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| 18 | // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| 19 | // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
| 20 | // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| 21 | // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
| 22 | // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| 23 | // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| 24 | // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| 25 | // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| 26 | // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| 27 | |
| 28 | // Expect $Object = global.Object; |
| 29 | // Expect $Array = global.Array; |
| 30 | |
jkummerow@chromium.org | f7a5884 | 2012-02-21 10:08:21 +0000 | [diff] [blame] | 31 | var $RegExp = global.RegExp; |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 32 | |
| 33 | // A recursive descent parser for Patterns according to the grammar of |
| 34 | // ECMA-262 15.10.1, with deviations noted below. |
whesse@chromium.org | 023421e | 2010-12-21 12:19:12 +0000 | [diff] [blame] | 35 | function DoConstructRegExp(object, pattern, flags) { |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 36 | // RegExp : Called as constructor; see ECMA-262, section 15.10.4. |
| 37 | if (IS_REGEXP(pattern)) { |
| 38 | if (!IS_UNDEFINED(flags)) { |
| 39 | throw MakeTypeError('regexp_flags', []); |
| 40 | } |
| 41 | flags = (pattern.global ? 'g' : '') |
| 42 | + (pattern.ignoreCase ? 'i' : '') |
| 43 | + (pattern.multiline ? 'm' : ''); |
| 44 | pattern = pattern.source; |
| 45 | } |
| 46 | |
| 47 | pattern = IS_UNDEFINED(pattern) ? '' : ToString(pattern); |
| 48 | flags = IS_UNDEFINED(flags) ? '' : ToString(flags); |
| 49 | |
| 50 | var global = false; |
| 51 | var ignoreCase = false; |
| 52 | var multiline = false; |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 53 | for (var i = 0; i < flags.length; i++) { |
whesse@chromium.org | 7a392b3 | 2011-01-31 11:30:36 +0000 | [diff] [blame] | 54 | var c = %_CallFunction(flags, i, StringCharAt); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 55 | switch (c) { |
| 56 | case 'g': |
rossberg@chromium.org | 28a3708 | 2011-08-22 11:03:23 +0000 | [diff] [blame] | 57 | if (global) { |
| 58 | throw MakeSyntaxError("invalid_regexp_flags", [flags]); |
| 59 | } |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 60 | global = true; |
| 61 | break; |
| 62 | case 'i': |
rossberg@chromium.org | 28a3708 | 2011-08-22 11:03:23 +0000 | [diff] [blame] | 63 | if (ignoreCase) { |
| 64 | throw MakeSyntaxError("invalid_regexp_flags", [flags]); |
| 65 | } |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 66 | ignoreCase = true; |
| 67 | break; |
| 68 | case 'm': |
rossberg@chromium.org | 28a3708 | 2011-08-22 11:03:23 +0000 | [diff] [blame] | 69 | if (multiline) { |
| 70 | throw MakeSyntaxError("invalid_regexp_flags", [flags]); |
| 71 | } |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 72 | multiline = true; |
| 73 | break; |
| 74 | default: |
rossberg@chromium.org | 28a3708 | 2011-08-22 11:03:23 +0000 | [diff] [blame] | 75 | throw MakeSyntaxError("invalid_regexp_flags", [flags]); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 76 | } |
| 77 | } |
| 78 | |
lrn@chromium.org | 25156de | 2010-04-06 13:10:27 +0000 | [diff] [blame] | 79 | %RegExpInitializeObject(object, pattern, global, ignoreCase, multiline); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 80 | |
| 81 | // Call internal function to compile the pattern. |
| 82 | %RegExpCompile(object, pattern, flags); |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 83 | } |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 84 | |
| 85 | |
| 86 | function RegExpConstructor(pattern, flags) { |
kasperl@chromium.org | 2abc450 | 2009-07-02 07:00:29 +0000 | [diff] [blame] | 87 | if (%_IsConstructCall()) { |
whesse@chromium.org | 023421e | 2010-12-21 12:19:12 +0000 | [diff] [blame] | 88 | DoConstructRegExp(this, pattern, flags); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 89 | } else { |
| 90 | // RegExp : Called as function; see ECMA-262, section 15.10.3.1. |
| 91 | if (IS_REGEXP(pattern) && IS_UNDEFINED(flags)) { |
| 92 | return pattern; |
| 93 | } |
| 94 | return new $RegExp(pattern, flags); |
| 95 | } |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 96 | } |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 97 | |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 98 | // Deprecated RegExp.prototype.compile method. We behave like the constructor |
| 99 | // were called again. In SpiderMonkey, this method returns the regexp object. |
kasperl@chromium.org | 7be3c99 | 2009-03-12 07:19:55 +0000 | [diff] [blame] | 100 | // In JSC, it returns undefined. For compatibility with JSC, we match their |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 101 | // behavior. |
erik.corry@gmail.com | c3b670f | 2011-10-05 21:44:48 +0000 | [diff] [blame] | 102 | function RegExpCompile(pattern, flags) { |
kasperl@chromium.org | 7be3c99 | 2009-03-12 07:19:55 +0000 | [diff] [blame] | 103 | // Both JSC and SpiderMonkey treat a missing pattern argument as the |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 104 | // empty subject string, and an actual undefined value passed as the |
kasperl@chromium.org | 7be3c99 | 2009-03-12 07:19:55 +0000 | [diff] [blame] | 105 | // pattern as the string 'undefined'. Note that JSC is inconsistent |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 106 | // here, treating undefined values differently in |
| 107 | // RegExp.prototype.compile and in the constructor, where they are |
kasperl@chromium.org | 7be3c99 | 2009-03-12 07:19:55 +0000 | [diff] [blame] | 108 | // the empty string. For compatibility with JSC, we match their |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 109 | // behavior. |
erik.corry@gmail.com | c3b670f | 2011-10-05 21:44:48 +0000 | [diff] [blame] | 110 | if (this == $RegExp.prototype) { |
| 111 | // We don't allow recompiling RegExp.prototype. |
| 112 | throw MakeTypeError('incompatible_method_receiver', |
| 113 | ['RegExp.prototype.compile', this]); |
| 114 | } |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 115 | if (IS_UNDEFINED(pattern) && %_ArgumentsLength() != 0) { |
whesse@chromium.org | 023421e | 2010-12-21 12:19:12 +0000 | [diff] [blame] | 116 | DoConstructRegExp(this, 'undefined', flags); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 117 | } else { |
whesse@chromium.org | 023421e | 2010-12-21 12:19:12 +0000 | [diff] [blame] | 118 | DoConstructRegExp(this, pattern, flags); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 119 | } |
| 120 | } |
| 121 | |
| 122 | |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 123 | function DoRegExpExec(regexp, string, index) { |
fschneider@chromium.org | 013f3e1 | 2010-04-26 13:27:52 +0000 | [diff] [blame] | 124 | var result = %_RegExpExec(regexp, string, index, lastMatchInfo); |
| 125 | if (result !== null) lastMatchInfoOverride = null; |
| 126 | return result; |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 127 | } |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 128 | |
| 129 | |
whesse@chromium.org | b6e43bb | 2010-04-14 09:36:28 +0000 | [diff] [blame] | 130 | function BuildResultFromMatchInfo(lastMatchInfo, s) { |
| 131 | var numResults = NUMBER_OF_CAPTURES(lastMatchInfo) >> 1; |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 132 | var start = lastMatchInfo[CAPTURE0]; |
| 133 | var end = lastMatchInfo[CAPTURE1]; |
| 134 | var result = %_RegExpConstructResult(numResults, start, s); |
| 135 | if (start + 1 == end) { |
| 136 | result[0] = %_StringCharAt(s, start); |
whesse@chromium.org | b6e43bb | 2010-04-14 09:36:28 +0000 | [diff] [blame] | 137 | } else { |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 138 | result[0] = %_SubString(s, start, end); |
| 139 | } |
| 140 | var j = REGEXP_FIRST_CAPTURE + 2; |
| 141 | for (var i = 1; i < numResults; i++) { |
| 142 | start = lastMatchInfo[j++]; |
| 143 | end = lastMatchInfo[j++]; |
| 144 | if (end != -1) { |
| 145 | if (start + 1 == end) { |
| 146 | result[i] = %_StringCharAt(s, start); |
whesse@chromium.org | b6e43bb | 2010-04-14 09:36:28 +0000 | [diff] [blame] | 147 | } else { |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 148 | result[i] = %_SubString(s, start, end); |
whesse@chromium.org | b6e43bb | 2010-04-14 09:36:28 +0000 | [diff] [blame] | 149 | } |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 150 | } else { |
| 151 | // Make sure the element is present. Avoid reading the undefined |
| 152 | // property from the global object since this may change. |
| 153 | result[i] = void 0; |
whesse@chromium.org | b6e43bb | 2010-04-14 09:36:28 +0000 | [diff] [blame] | 154 | } |
| 155 | } |
| 156 | return result; |
| 157 | } |
| 158 | |
| 159 | |
| 160 | function RegExpExecNoTests(regexp, string, start) { |
| 161 | // Must be called with RegExp, string and positive integer as arguments. |
whesse@chromium.org | 023421e | 2010-12-21 12:19:12 +0000 | [diff] [blame] | 162 | var matchInfo = %_RegExpExec(regexp, string, start, lastMatchInfo); |
whesse@chromium.org | b6e43bb | 2010-04-14 09:36:28 +0000 | [diff] [blame] | 163 | if (matchInfo !== null) { |
whesse@chromium.org | 023421e | 2010-12-21 12:19:12 +0000 | [diff] [blame] | 164 | lastMatchInfoOverride = null; |
| 165 | return BuildResultFromMatchInfo(matchInfo, string); |
whesse@chromium.org | b6e43bb | 2010-04-14 09:36:28 +0000 | [diff] [blame] | 166 | } |
whesse@chromium.org | 023421e | 2010-12-21 12:19:12 +0000 | [diff] [blame] | 167 | return null; |
whesse@chromium.org | b6e43bb | 2010-04-14 09:36:28 +0000 | [diff] [blame] | 168 | } |
| 169 | |
| 170 | |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 171 | function RegExpExec(string) { |
fschneider@chromium.org | 086aac6 | 2010-03-17 13:18:24 +0000 | [diff] [blame] | 172 | if (!IS_REGEXP(this)) { |
| 173 | throw MakeTypeError('incompatible_method_receiver', |
| 174 | ['RegExp.prototype.exec', this]); |
| 175 | } |
| 176 | |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 177 | string = TO_STRING_INLINE(string); |
lrn@chromium.org | fa943b7 | 2010-11-03 08:14:36 +0000 | [diff] [blame] | 178 | var lastIndex = this.lastIndex; |
vegorov@chromium.org | f837290 | 2010-03-15 10:26:20 +0000 | [diff] [blame] | 179 | |
vegorov@chromium.org | 4284196 | 2010-10-18 11:18:59 +0000 | [diff] [blame] | 180 | // Conversion is required by the ES5 specification (RegExp.prototype.exec |
| 181 | // algorithm, step 5) even if the value is discarded for non-global RegExps. |
| 182 | var i = TO_INTEGER(lastIndex); |
lrn@chromium.org | fa943b7 | 2010-11-03 08:14:36 +0000 | [diff] [blame] | 183 | |
| 184 | var global = this.global; |
vegorov@chromium.org | 4284196 | 2010-10-18 11:18:59 +0000 | [diff] [blame] | 185 | if (global) { |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 186 | if (i < 0 || i > string.length) { |
vegorov@chromium.org | 4284196 | 2010-10-18 11:18:59 +0000 | [diff] [blame] | 187 | this.lastIndex = 0; |
| 188 | return null; |
| 189 | } |
| 190 | } else { |
| 191 | i = 0; |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 192 | } |
| 193 | |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 194 | %_Log('regexp', 'regexp-exec,%0r,%1S,%2i', [this, string, lastIndex]); |
kasperl@chromium.org | 7be3c99 | 2009-03-12 07:19:55 +0000 | [diff] [blame] | 195 | // matchIndices is either null or the lastMatchInfo array. |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 196 | var matchIndices = %_RegExpExec(this, string, i, lastMatchInfo); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 197 | |
vegorov@chromium.org | 4284196 | 2010-10-18 11:18:59 +0000 | [diff] [blame] | 198 | if (matchIndices === null) { |
erik.corry@gmail.com | 4a6c327 | 2010-11-18 12:04:40 +0000 | [diff] [blame] | 199 | if (global) this.lastIndex = 0; |
lrn@chromium.org | fa943b7 | 2010-11-03 08:14:36 +0000 | [diff] [blame] | 200 | return null; |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 201 | } |
vegorov@chromium.org | 4284196 | 2010-10-18 11:18:59 +0000 | [diff] [blame] | 202 | |
| 203 | // Successful match. |
fschneider@chromium.org | 013f3e1 | 2010-04-26 13:27:52 +0000 | [diff] [blame] | 204 | lastMatchInfoOverride = null; |
vegorov@chromium.org | 4284196 | 2010-10-18 11:18:59 +0000 | [diff] [blame] | 205 | if (global) { |
vegorov@chromium.org | f837290 | 2010-03-15 10:26:20 +0000 | [diff] [blame] | 206 | this.lastIndex = lastMatchInfo[CAPTURE1]; |
vegorov@chromium.org | f837290 | 2010-03-15 10:26:20 +0000 | [diff] [blame] | 207 | } |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 208 | return BuildResultFromMatchInfo(matchIndices, string); |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 209 | } |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 210 | |
| 211 | |
// One-element cache for the simplified test regexp, maintained by TrimRegExp:
// regexp_key is the regexp object the entry was built from and regexp_val is
// the trimmed regexp built from it.
var regexp_key;
var regexp_val;
| 215 | |
kasperl@chromium.org | 7be3c99 | 2009-03-12 07:19:55 +0000 | [diff] [blame] | 216 | // Section 15.10.6.3 doesn't actually make sense, but the intention seems to be |
ager@chromium.org | bb29dc9 | 2009-03-24 13:25:23 +0000 | [diff] [blame] | 217 | // that test is defined in terms of String.prototype.exec. However, it probably |
| 218 | // means the original value of String.prototype.exec, which is what everybody |
| 219 | // else implements. |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 220 | function RegExpTest(string) { |
kasperl@chromium.org | 7be3c99 | 2009-03-12 07:19:55 +0000 | [diff] [blame] | 221 | if (!IS_REGEXP(this)) { |
ager@chromium.org | ce5e87b | 2010-03-10 10:24:18 +0000 | [diff] [blame] | 222 | throw MakeTypeError('incompatible_method_receiver', |
kasperl@chromium.org | 7be3c99 | 2009-03-12 07:19:55 +0000 | [diff] [blame] | 223 | ['RegExp.prototype.test', this]); |
| 224 | } |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 225 | string = TO_STRING_INLINE(string); |
fschneider@chromium.org | 086aac6 | 2010-03-17 13:18:24 +0000 | [diff] [blame] | 226 | |
lrn@chromium.org | fa943b7 | 2010-11-03 08:14:36 +0000 | [diff] [blame] | 227 | var lastIndex = this.lastIndex; |
| 228 | |
vegorov@chromium.org | 4284196 | 2010-10-18 11:18:59 +0000 | [diff] [blame] | 229 | // Conversion is required by the ES5 specification (RegExp.prototype.exec |
| 230 | // algorithm, step 5) even if the value is discarded for non-global RegExps. |
| 231 | var i = TO_INTEGER(lastIndex); |
jkummerow@chromium.org | ddda9e8 | 2011-07-06 11:27:02 +0000 | [diff] [blame] | 232 | |
erik.corry@gmail.com | 4a6c327 | 2010-11-18 12:04:40 +0000 | [diff] [blame] | 233 | if (this.global) { |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 234 | if (i < 0 || i > string.length) { |
vegorov@chromium.org | 4284196 | 2010-10-18 11:18:59 +0000 | [diff] [blame] | 235 | this.lastIndex = 0; |
| 236 | return false; |
| 237 | } |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 238 | %_Log('regexp', 'regexp-exec,%0r,%1S,%2i', [this, string, lastIndex]); |
erik.corry@gmail.com | 4a6c327 | 2010-11-18 12:04:40 +0000 | [diff] [blame] | 239 | // matchIndices is either null or the lastMatchInfo array. |
ager@chromium.org | 5f0c45f | 2010-12-17 08:51:21 +0000 | [diff] [blame] | 240 | var matchIndices = %_RegExpExec(this, string, i, lastMatchInfo); |
erik.corry@gmail.com | 4a6c327 | 2010-11-18 12:04:40 +0000 | [diff] [blame] | 241 | if (matchIndices === null) { |
| 242 | this.lastIndex = 0; |
| 243 | return false; |
lrn@chromium.org | 1af7e1b | 2010-06-07 11:12:01 +0000 | [diff] [blame] | 244 | } |
erik.corry@gmail.com | 4a6c327 | 2010-11-18 12:04:40 +0000 | [diff] [blame] | 245 | lastMatchInfoOverride = null; |
| 246 | this.lastIndex = lastMatchInfo[CAPTURE1]; |
jkummerow@chromium.org | ddda9e8 | 2011-07-06 11:27:02 +0000 | [diff] [blame] | 247 | return true; |
erik.corry@gmail.com | 4a6c327 | 2010-11-18 12:04:40 +0000 | [diff] [blame] | 248 | } else { |
| 249 | // Non-global regexp. |
jkummerow@chromium.org | ddda9e8 | 2011-07-06 11:27:02 +0000 | [diff] [blame] | 250 | // Remove irrelevant preceeding '.*' in a non-global test regexp. |
| 251 | // The expression checks whether this.source starts with '.*' and |
erik.corry@gmail.com | 4a6c327 | 2010-11-18 12:04:40 +0000 | [diff] [blame] | 252 | // that the third char is not a '?'. |
rossberg@chromium.org | 2c067b1 | 2012-03-19 11:01:52 +0000 | [diff] [blame] | 253 | var regexp = this; |
| 254 | if (%_StringCharCodeAt(regexp.source, 0) == 46 && // '.' |
| 255 | %_StringCharCodeAt(regexp.source, 1) == 42 && // '*' |
| 256 | %_StringCharCodeAt(regexp.source, 2) != 63) { // '?' |
| 257 | regexp = TrimRegExp(regexp); |
jkummerow@chromium.org | ddda9e8 | 2011-07-06 11:27:02 +0000 | [diff] [blame] | 258 | } |
rossberg@chromium.org | 2c067b1 | 2012-03-19 11:01:52 +0000 | [diff] [blame] | 259 | %_Log('regexp', 'regexp-exec,%0r,%1S,%2i', [regexp, string, lastIndex]); |
erik.corry@gmail.com | 4a6c327 | 2010-11-18 12:04:40 +0000 | [diff] [blame] | 260 | // matchIndices is either null or the lastMatchInfo array. |
rossberg@chromium.org | 2c067b1 | 2012-03-19 11:01:52 +0000 | [diff] [blame] | 261 | var matchIndices = %_RegExpExec(regexp, string, 0, lastMatchInfo); |
erik.corry@gmail.com | 4a6c327 | 2010-11-18 12:04:40 +0000 | [diff] [blame] | 262 | if (matchIndices === null) return false; |
| 263 | lastMatchInfoOverride = null; |
| 264 | return true; |
lrn@chromium.org | 1af7e1b | 2010-06-07 11:12:01 +0000 | [diff] [blame] | 265 | } |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 266 | } |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 267 | |
rossberg@chromium.org | 2c067b1 | 2012-03-19 11:01:52 +0000 | [diff] [blame] | 268 | function TrimRegExp(regexp) { |
| 269 | if (!%_ObjectEquals(regexp_key, regexp)) { |
| 270 | regexp_key = regexp; |
| 271 | regexp_val = |
| 272 | new $RegExp(SubString(regexp.source, 2, regexp.source.length), |
| 273 | (regexp.ignoreCase ? regexp.multiline ? "im" : "i" |
| 274 | : regexp.multiline ? "m" : "")); |
| 275 | } |
| 276 | return regexp_val; |
| 277 | } |
| 278 | |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 279 | |
// RegExp.prototype.toString: returns '/' + source + '/' followed by the
// letters 'g', 'i' and 'm' (in that order) for each flag that is set.
// Throws a TypeError if the receiver is not a RegExp.
function RegExpToString() {
  if (!IS_REGEXP(this)) {
    throw MakeTypeError('incompatible_method_receiver',
                        ['RegExp.prototype.toString', this]);
  }
  var body = '/' + this.source + '/';
  var suffix = (this.global ? 'g' : '') +
               (this.ignoreCase ? 'i' : '') +
               (this.multiline ? 'm' : '');
  return body + suffix;
}
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 291 | |
| 292 | |
| 293 | // Getters for the static properties lastMatch, lastParen, leftContext, and |
| 294 | // rightContext of the RegExp constructor. The properties are computed based |
| 295 | // on the captures array of the last successful match and the subject string |
| 296 | // of the last successful match. |
// Getter for the text of the last successful match. An active
// lastMatchInfoOverride takes precedence over lastMatchInfo.
function RegExpGetLastMatch() {
  if (lastMatchInfoOverride === null) {
    return SubString(LAST_SUBJECT(lastMatchInfo),
                     lastMatchInfo[CAPTURE0],
                     lastMatchInfo[CAPTURE1]);
  }
  return OVERRIDE_MATCH(lastMatchInfoOverride);
}
| 306 | |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 307 | |
// Getter for the text of the last capture group of the last successful match,
// or '' if there were no captures or the last one did not participate.
function RegExpGetLastParen() {
  var override = lastMatchInfoOverride;
  if (override) {
    var overrideLength = override.length;
    // With three or fewer elements the override holds no captures.
    return overrideLength <= 3 ? '' : override[overrideLength - 3];
  }
  var captureSlots = NUMBER_OF_CAPTURES(lastMatchInfo);
  if (captureSlots <= 2) return '';  // There were no captures.
  // We match the SpiderMonkey behavior: return the substring defined by the
  // last pair (after the first pair) of elements of the capture array even if
  // it is empty.
  var start = lastMatchInfo[CAPTURE(captureSlots - 2)];
  var end = lastMatchInfo[CAPTURE(captureSlots - 1)];
  if (start == -1 || end == -1) {
    return "";
  }
  return SubString(LAST_SUBJECT(lastMatchInfo), start, end);
}
| 327 | |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 328 | |
// Getter for the part of the last subject string that precedes the last
// successful match. An active lastMatchInfoOverride takes precedence.
function RegExpGetLeftContext() {
  var override = lastMatchInfoOverride;
  if (override) {
    return SubString(OVERRIDE_SUBJECT(override), 0, OVERRIDE_POS(override));
  }
  return SubString(LAST_SUBJECT(lastMatchInfo), 0, lastMatchInfo[CAPTURE0]);
}
| 342 | |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 343 | |
// Getter for the part of the last subject string that follows the last
// successful match. An active lastMatchInfoOverride takes precedence.
function RegExpGetRightContext() {
  var override = lastMatchInfoOverride;
  if (override) {
    var overrideSubject = OVERRIDE_SUBJECT(override);
    // The match ends at its start position plus the length of its text.
    var overrideEnd = OVERRIDE_POS(override) + OVERRIDE_MATCH(override).length;
    return SubString(overrideSubject, overrideEnd, overrideSubject.length);
  }
  var lastSubject = LAST_SUBJECT(lastMatchInfo);
  return SubString(lastSubject, lastMatchInfo[CAPTURE1], lastSubject.length);
}
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 358 | |
| 359 | |
// The properties $1..$9 are the first nine capturing substrings of the last
// successful match, or ''. RegExpMakeCaptureGetter returns the getter for
// capture number n and will be called with indices from 1 to 9.
function RegExpMakeCaptureGetter(n) {
  return function() {
    var override = lastMatchInfoOverride;
    if (override) {
      // The last two override elements are not captures.
      return (n < override.length - 2) ? OVERRIDE_CAPTURE(override, n) : '';
    }
    var slot = n * 2;
    if (slot >= NUMBER_OF_CAPTURES(lastMatchInfo)) {
      return '';
    }
    var captureStart = lastMatchInfo[CAPTURE(slot)];
    var captureEnd = lastMatchInfo[CAPTURE(slot + 1)];
    if (captureStart == -1 || captureEnd == -1) {
      return '';
    }
    return SubString(LAST_SUBJECT(lastMatchInfo), captureStart, captureEnd);
  };
}
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 379 | |
| 380 | |
// Property of the builtins object for recording the result of the last
// regexp match. The property lastMatchInfo includes the matchIndices
// array of the last successful regexp match (an array of start/end index
// pairs for the match and all the captured substrings); the invariant is
// that there are at least two capture indices. The array also contains
// the subject string for the last successful match.
// Initial contents, in order:
//   2       REGEXP_NUMBER_OF_CAPTURES
//   ""      Last subject.
//   void 0  Last input - settable with RegExpSetInput.
//   0       REGEXP_FIRST_CAPTURE + 0
//   0       REGEXP_FIRST_CAPTURE + 1
var lastMatchInfo = new InternalArray(2, "", void 0, 0, 0);
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 394 | |
// Overrides the last match info with an array of actual substrings, or is
// null when no override is active. Used internally by replace regexp with
// function; the array has the format of an "apply" argument for a
// replacement function.
var lastMatchInfoOverride = null;
| 400 | |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 401 | // ------------------------------------------------------------------- |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 402 | |
fschneider@chromium.org | 1805e21 | 2011-09-05 10:49:12 +0000 | [diff] [blame] | 403 | function SetUpRegExp() { |
| 404 | %CheckIsBootstrapping(); |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 405 | %FunctionSetInstanceClassName($RegExp, 'RegExp'); |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 406 | %SetProperty($RegExp.prototype, 'constructor', $RegExp, DONT_ENUM); |
| 407 | %SetCode($RegExp, RegExpConstructor); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 408 | |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 409 | InstallFunctions($RegExp.prototype, DONT_ENUM, $Array( |
| 410 | "exec", RegExpExec, |
| 411 | "test", RegExpTest, |
| 412 | "toString", RegExpToString, |
erik.corry@gmail.com | c3b670f | 2011-10-05 21:44:48 +0000 | [diff] [blame] | 413 | "compile", RegExpCompile |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 414 | )); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 415 | |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 416 | // The length of compile is 1 in SpiderMonkey. |
| 417 | %FunctionSetLength($RegExp.prototype.compile, 1); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 418 | |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 419 | // The properties input, $input, and $_ are aliases for each other. When this |
lrn@chromium.org | 25156de | 2010-04-06 13:10:27 +0000 | [diff] [blame] | 420 | // value is set the value it is set to is coerced to a string. |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 421 | // Getter and setter for the input. |
jkummerow@chromium.org | f7a5884 | 2012-02-21 10:08:21 +0000 | [diff] [blame] | 422 | var RegExpGetInput = function() { |
kasperl@chromium.org | 7be3c99 | 2009-03-12 07:19:55 +0000 | [diff] [blame] | 423 | var regExpInput = LAST_INPUT(lastMatchInfo); |
ager@chromium.org | a74f0da | 2008-12-03 16:05:52 +0000 | [diff] [blame] | 424 | return IS_UNDEFINED(regExpInput) ? "" : regExpInput; |
jkummerow@chromium.org | f7a5884 | 2012-02-21 10:08:21 +0000 | [diff] [blame] | 425 | }; |
// Setter for the input accessor: converts the assigned value with ToString
// and stores the result in LAST_INPUT(lastMatchInfo).
// NOTE(review): assigning to LAST_INPUT(...) only parses if LAST_INPUT is a
// macro expanded before compilation - confirm against the macro definitions.
| 426 | var RegExpSetInput = function(string) { |
ager@chromium.org | bb29dc9 | 2009-03-24 13:25:23 +0000 | [diff] [blame] | 427 | LAST_INPUT(lastMatchInfo) = ToString(string); |
jkummerow@chromium.org | f7a5884 | 2012-02-21 10:08:21 +0000 | [diff] [blame] | 428 | }; |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 429 | |
// The count 22 passed to the first call equals the number of accessors defined
// on $RegExp from here down to the %ToFastProperties call: 3 input aliases,
// 2 multiline aliases, 8 last-match properties and $1 through $9. Keep the
// count in sync when adding or removing any of them.
// NOTE(review): the precise effect of the hint is internal to the runtime
// function and not visible in this chunk.
// The three accessors below share one getter and one setter. input is defined
// with DONT_DELETE only, while $_ and $input also get DONT_ENUM.
svenpanne@chromium.org | 830d30c | 2012-05-29 13:20:14 +0000 | [diff] [blame] | 430 | %OptimizeObjectForAddingMultipleProperties($RegExp, 22); |
erik.corry@gmail.com | bbceb57 | 2012-03-09 10:52:05 +0000 | [diff] [blame] | 431 | %DefineOrRedefineAccessorProperty($RegExp, 'input', RegExpGetInput, |
| 432 | RegExpSetInput, DONT_DELETE); |
| 433 | %DefineOrRedefineAccessorProperty($RegExp, '$_', RegExpGetInput, |
| 434 | RegExpSetInput, DONT_ENUM | DONT_DELETE); |
| 435 | %DefineOrRedefineAccessorProperty($RegExp, '$input', RegExpGetInput, |
| 436 | RegExpSetInput, DONT_ENUM | DONT_DELETE); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 437 | |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 438 | // The properties multiline and $* are aliases for each other. When this |
| 439 | // value is set in SpiderMonkey, the value it is set to is coerced to a |
| 440 | // boolean. We mimic that behavior with a slight difference: in SpiderMonkey |
| 441 | // the value of the expression 'RegExp.multiline = null' (for instance) is the |
ulan@chromium.org | 2efb900 | 2012-01-19 15:36:35 +0000 | [diff] [blame] | 442 | // boolean false (i.e., the value after coercion), while in V8 it is the value |
| 443 | // null (i.e., the value before coercion). |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 444 | |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 445 | // Getter and setter for multiline. |
// Backing state for the multiline accessor pair; it starts out false.
// RegExpGetMultiline returns the stored flag unchanged. RegExpSetMultiline
// normalizes whatever is assigned to a strict boolean (true or false) before
// storing it, so the getter never returns a non-boolean.
| 446 | var multiline = false; |
jkummerow@chromium.org | f7a5884 | 2012-02-21 10:08:21 +0000 | [diff] [blame] | 447 | var RegExpGetMultiline = function() { return multiline; }; |
| 448 | var RegExpSetMultiline = function(flag) { multiline = flag ? true : false; }; |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 449 | |
// Expose the multiline flag under two names that share the same getter and
// setter. multiline is defined with DONT_DELETE only; the $* alias also gets
// DONT_ENUM.
erik.corry@gmail.com | bbceb57 | 2012-03-09 10:52:05 +0000 | [diff] [blame] | 450 | %DefineOrRedefineAccessorProperty($RegExp, 'multiline', RegExpGetMultiline, |
kmillikin@chromium.org | be6bd10 | 2012-02-23 08:45:21 +0000 | [diff] [blame] | 451 | RegExpSetMultiline, DONT_DELETE); |
erik.corry@gmail.com | bbceb57 | 2012-03-09 10:52:05 +0000 | [diff] [blame] | 452 | %DefineOrRedefineAccessorProperty($RegExp, '$*', RegExpGetMultiline, |
| 453 | RegExpSetMultiline, |
kmillikin@chromium.org | be6bd10 | 2012-02-23 08:45:21 +0000 | [diff] [blame] | 454 | DONT_ENUM | DONT_DELETE); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 455 | |
| 456 | |
// Setter that accepts one argument and does nothing with it. It is passed as
// the setter for the accessors defined after this point in the function, so
// assignments to those properties have no effect.
jkummerow@chromium.org | f7a5884 | 2012-02-21 10:08:21 +0000 | [diff] [blame] | 457 | var NoOpSetter = function(ignored) {}; |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 458 | |
| 459 | |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 460 | // Static properties set by a successful match. |
// Four long-named properties, each followed by a dollar alias that shares its
// getter. The long names are defined with DONT_DELETE only; the aliases also
// get DONT_ENUM. All eight use NoOpSetter, whose body is empty, so writes to
// them are ignored.
// NOTE(review): the four getters are defined outside this chunk.
erik.corry@gmail.com | bbceb57 | 2012-03-09 10:52:05 +0000 | [diff] [blame] | 461 | %DefineOrRedefineAccessorProperty($RegExp, 'lastMatch', RegExpGetLastMatch, |
| 462 | NoOpSetter, DONT_DELETE); |
| 463 | %DefineOrRedefineAccessorProperty($RegExp, '$&', RegExpGetLastMatch, |
| 464 | NoOpSetter, DONT_ENUM | DONT_DELETE); |
| 465 | %DefineOrRedefineAccessorProperty($RegExp, 'lastParen', RegExpGetLastParen, |
| 466 | NoOpSetter, DONT_DELETE); |
| 467 | %DefineOrRedefineAccessorProperty($RegExp, '$+', RegExpGetLastParen, |
| 468 | NoOpSetter, DONT_ENUM | DONT_DELETE); |
| 469 | %DefineOrRedefineAccessorProperty($RegExp, 'leftContext', |
| 470 | RegExpGetLeftContext, NoOpSetter, |
kmillikin@chromium.org | be6bd10 | 2012-02-23 08:45:21 +0000 | [diff] [blame] | 471 | DONT_DELETE); |
erik.corry@gmail.com | bbceb57 | 2012-03-09 10:52:05 +0000 | [diff] [blame] | 472 | %DefineOrRedefineAccessorProperty($RegExp, '$`', RegExpGetLeftContext, |
| 473 | NoOpSetter, DONT_ENUM | DONT_DELETE); |
| 474 | %DefineOrRedefineAccessorProperty($RegExp, 'rightContext', |
| 475 | RegExpGetRightContext, NoOpSetter, |
kmillikin@chromium.org | be6bd10 | 2012-02-23 08:45:21 +0000 | [diff] [blame] | 476 | DONT_DELETE); |
erik.corry@gmail.com | bbceb57 | 2012-03-09 10:52:05 +0000 | [diff] [blame] | 477 | %DefineOrRedefineAccessorProperty($RegExp, "$'", RegExpGetRightContext, |
| 478 | NoOpSetter, DONT_ENUM | DONT_DELETE); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 479 | |
// Define $1 through $9 on $RegExp. Each gets its own getter built by
// RegExpMakeCaptureGetter(i) and the no-op setter. Unlike the other dollar
// aliases in this function, these are defined with DONT_DELETE only.
// The %ToFastProperties call ends the batch of definitions that began at the
// %OptimizeObjectForAddingMultipleProperties call earlier in this function.
// NOTE(review): presumably it returns $RegExp to a fast property
// representation - confirm against the runtime function.
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 480 | for (var i = 1; i < 10; ++i) { |
erik.corry@gmail.com | bbceb57 | 2012-03-09 10:52:05 +0000 | [diff] [blame] | 481 | %DefineOrRedefineAccessorProperty($RegExp, '$' + i, |
| 482 | RegExpMakeCaptureGetter(i), NoOpSetter, |
kmillikin@chromium.org | be6bd10 | 2012-02-23 08:45:21 +0000 | [diff] [blame] | 483 | DONT_DELETE); |
christian.plesner.hansen | 43d26ec | 2008-07-03 15:10:15 +0000 | [diff] [blame] | 484 | } |
svenpanne@chromium.org | 830d30c | 2012-05-29 13:20:14 +0000 | [diff] [blame] | 485 | %ToFastProperties($RegExp); |
kasperl@chromium.org | 41044eb | 2008-10-06 08:24:46 +0000 | [diff] [blame] | 486 | } |
| 487 | |
// Invoke the setup function whose body ends just above, so the properties it
// defines are installed as soon as this statement runs.
fschneider@chromium.org | 1805e21 | 2011-09-05 10:49:12 +0000 | [diff] [blame] | 488 | SetUpRegExp(); |