1// Copyright 2012 the V8 project authors. All rights reserved.
2// Redistribution and use in source and binary forms, with or without
3// modification, are permitted provided that the following conditions are
4// met:
5//
6//     * Redistributions of source code must retain the above copyright
7//       notice, this list of conditions and the following disclaimer.
8//     * Redistributions in binary form must reproduce the above
9//       copyright notice, this list of conditions and the following
10//       disclaimer in the documentation and/or other materials provided
11//       with the distribution.
12//     * Neither the name of Google Inc. nor the names of its
13//       contributors may be used to endorse or promote products derived
14//       from this software without specific prior written permission.
15//
16// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
17// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
18// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
19// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
20// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
21// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
22// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
26// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27
28
29// Test that an optional capture is cleared between two matches.
30var str = "ABX X";
31str = str.replace(/(\w)?X/g, function(match, capture) {
32                               assertTrue(match.indexOf(capture) >= 0 ||
33                                           capture === undefined);
34                               return capture ? capture.toLowerCase() : "-";
35                             });
36assertEquals("Ab -", str);
37
38// Test zero-length matches.
39str = "Als Gregor Samsa eines Morgens";
40str = str.replace(/\b/g, function(match, capture) {
41                           return "/";
42                         });
43assertEquals("/Als/ /Gregor/ /Samsa/ /eines/ /Morgens/", str);
44
45// Test zero-length matches that have non-zero-length sub-captures.
46str = "It was a pleasure to burn.";
47str = str.replace(/(?=(\w+))\b/g, function(match, capture) {
48                                    return capture.length;
49                                  });
50assertEquals("2It 3was 1a 8pleasure 2to 4burn.", str);
51
52// Test multiple captures.
53str = "Try not. Do, or do not. There is no try.";
54str = str.replace(/(not?)|(do)|(try)/gi,
55                  function(match, c1, c2, c3) {
56                    assertTrue((c1 === undefined && c2 === undefined) ||
57                               (c2 === undefined && c3 === undefined) ||
58                               (c1 === undefined && c3 === undefined));
59                    if (c1) return "-";
60                    if (c2) return "+";
61                    if (c3) return "="
62                  });
63assertEquals("= -. +, or + -. There is - =.", str);
64
65// Test multiple alternate captures.
66str = "FOUR LEGS GOOD, TWO LEGS BAD!";
67str = str.replace(/(FOUR|TWO) LEGS (GOOD|BAD)/g,
68                  function(match, num_legs, likeability) {
69                    assertTrue(num_legs !== undefined);
70                    assertTrue(likeability !== undefined);
71                    if (num_legs == "FOUR") assertTrue(likeability == "GOOD");
72                    if (num_legs == "TWO") assertTrue(likeability == "BAD");
73                    return match.length - 10;
74                  });
75assertEquals("4, 2!", str);
76
77
78// The same tests with UC16.
79
80//Test that an optional capture is cleared between two matches.
81str = "AB\u1234 \u1234";
82str = str.replace(/(\w)?\u1234/g,
83                  function(match, capture) {
84                    assertTrue(match.indexOf(capture) >= 0 ||
85                               capture === undefined);
86                    return capture ? capture.toLowerCase() : "-";
87                  });
88assertEquals("Ab -", str);
89
90// Test zero-length matches.
91str = "Als \u2623\u2642 eines Morgens";
92str = str.replace(/\b/g, function(match, capture) {
93                           return "/";
94                         });
95assertEquals("/Als/ \u2623\u2642 /eines/ /Morgens/", str);
96
97// Test zero-length matches that have non-zero-length sub-captures.
98str = "It was a pleasure to \u70e7.";
99str = str.replace(/(?=(\w+))\b/g, function(match, capture) {
100                                    return capture.length;
101                                  });
102assertEquals("2It 3was 1a 8pleasure 2to \u70e7.", str);
103
104// Test multiple captures.
105str = "Try not. D\u26aa, or d\u26aa not. There is no try.";
106str = str.replace(/(not?)|(d\u26aa)|(try)/gi,
107                  function(match, c1, c2, c3) {
108                    assertTrue((c1 === undefined && c2 === undefined) ||
109                               (c2 === undefined && c3 === undefined) ||
110                               (c1 === undefined && c3 === undefined));
111                    if (c1) return "-";
112                    if (c2) return "+";
113                    if (c3) return "="
114                  });
115assertEquals("= -. +, or + -. There is - =.", str);
116
117// Test multiple alternate captures.
118str = "FOUR \u817f GOOD, TWO \u817f BAD!";
119str = str.replace(/(FOUR|TWO) \u817f (GOOD|BAD)/g,
120                  function(match, num_legs, likeability) {
121                    assertTrue(num_legs !== undefined);
122                    assertTrue(likeability !== undefined);
123                    if (num_legs == "FOUR") assertTrue(likeability == "GOOD");
124                    if (num_legs == "TWO") assertTrue(likeability == "BAD");
125                    return match.length - 7;
126                  });
127assertEquals("4, 2!", str);
128
129// Test capture that is a real substring.
130var str = "Beasts of England, beasts of Ireland";
131str = str.replace(/(.*)/g, function(match) { return '~'; });
132assertEquals("~~", str);
133
134// Test zero-length matches that have non-zero-length sub-captures that do not
135// start at the match start position.
136str = "up up up up";
137str = str.replace(/\b(?=u(p))/g, function(match, capture) {
138                                    return capture.length;
139                                  });
140
141assertEquals("1up 1up 1up 1up", str);
142
143
144// Create regexp that has a *lot* of captures.
145var re_string = "(a)";
146for (var i = 0; i < 500; i++) {
147  re_string = "(" + re_string + ")";
148}
149re_string = re_string + "1";
150// re_string = "(((...((a))...)))1"
151
152var regexps = new Array();
153var last_match_expectations = new Array();
154var first_capture_expectations = new Array();
155
156// Atomic regexp.
157regexps.push(/a1/g);
158last_match_expectations.push("a1");
159first_capture_expectations.push("");
160// Small regexp (no capture);
161regexps.push(/\w1/g);
162last_match_expectations.push("a1");
163first_capture_expectations.push("");
164// Small regexp (one capture).
165regexps.push(/(a)1/g);
166last_match_expectations.push("a1");
167first_capture_expectations.push("a");
168// Large regexp (a lot of captures).
169regexps.push(new RegExp(re_string, "g"));
170last_match_expectations.push("a1");
171first_capture_expectations.push("a");
172
173function test_replace(result_expectation,
174                      subject,
175                      regexp,
176                      replacement) {
177  for (var i = 0; i < regexps.length; i++) {
178    // Overwrite last match info.
179    "deadbeef".replace(/(dead)beef/, "$1holeycow");
180    // Conduct tests.
181    assertEquals(result_expectation, subject.replace(regexps[i], replacement));
182    if (subject.length == 0) {
183      assertEquals("deadbeef", RegExp.lastMatch);
184      assertEquals("dead", RegExp["$1"]);
185    } else {
186      assertEquals(last_match_expectations[i], RegExp.lastMatch);
187      assertEquals(first_capture_expectations[i], RegExp["$1"]);
188    }
189  }
190}
191
192
193function test_match(result_expectation,
194                    subject,
195                    regexp) {
196  for (var i = 0; i < regexps.length; i++) {
197    // Overwrite last match info.
198    "deadbeef".replace(/(dead)beef/, "$1holeycow");
199    // Conduct tests.
200    if (result_expectation == null) {
201      assertNull(subject.match(regexps[i]));
202    } else {
203      assertArrayEquals(result_expectation, subject.match(regexps[i]));
204    }
205    if (subject.length == 0) {
206      assertEquals("deadbeef", RegExp.lastMatch);
207      assertEquals("dead", RegExp["$1"]);
208    } else {
209      assertEquals(last_match_expectations[i], RegExp.lastMatch);
210      assertEquals(first_capture_expectations[i], RegExp["$1"]);
211    }
212  }
213}
214
215
216// Test for different number of matches.
217for (var m = 0; m < 33; m++) {
218  // Create string that matches m times.
219  var subject = "";
220  var test_1_expectation = "";
221  var test_2_expectation = "";
222  var test_3_expectation = (m == 0) ? null : new Array();
223  for (var i = 0; i < m; i++) {
224    subject += "a11";
225    test_1_expectation += "x1";
226    test_2_expectation += "1";
227    test_3_expectation.push("a1");
228  }
229
230  // Test 1a: String.replace with string.
231  test_replace(test_1_expectation, subject, /a1/g, "x");
232
233  // Test 1b: String.replace with function.
234  function f() { return "x"; }
235  test_replace(test_1_expectation, subject, /a1/g, f);
236
237  // Test 2a: String.replace with empty string.
238  test_replace(test_2_expectation, subject, /a1/g, "");
239
240  // Test 3a: String.match.
241  test_match(test_3_expectation, subject, /a1/g);
242}
243
244
245// Test String hashing (compiling regular expression includes hashing).
246var crosscheck = "\x80";
247for (var i = 0; i < 12; i++) crosscheck += crosscheck;
248new RegExp(crosscheck);
249
250var subject = "ascii~only~string~here~";
251var replacement = "\x80";
252var result = subject.replace(/~/g, replacement);
253for (var i = 0; i < 5; i++) result += result;
254new RegExp(result);
255