зеркало из https://github.com/mozilla/pjs.git
274 строки
10 KiB
JavaScript
274 строки
10 KiB
JavaScript
/* ***** BEGIN LICENSE BLOCK *****
|
|
* Version: MPL 1.1/GPL 2.0/LGPL 2.1
|
|
*
|
|
* The contents of this file are subject to the Mozilla Public License Version
|
|
* 1.1 (the "License"); you may not use this file except in compliance with
|
|
* the License. You may obtain a copy of the License at
|
|
* http://www.mozilla.org/MPL/
|
|
*
|
|
* Software distributed under the License is distributed on an "AS IS" basis,
|
|
* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
|
|
* for the specific language governing rights and limitations under the
|
|
* License.
|
|
*
|
|
* The Original Code is JavaScript Engine testing utilities.
|
|
*
|
|
* The Initial Developer of the Original Code is
|
|
* Netscape Communications Corp.
|
|
* Portions created by the Initial Developer are Copyright (C) 2002
|
|
* the Initial Developer. All Rights Reserved.
|
|
*
|
|
* Contributor(s):
|
|
* rogerl@netscape.com, pschwartau@netscape.com
|
|
*
|
|
* Alternatively, the contents of this file may be used under the terms of
|
|
* either the GNU General Public License Version 2 or later (the "GPL"), or
|
|
* the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
|
|
* in which case the provisions of the GPL or the LGPL are applicable instead
|
|
* of those above. If you wish to allow use of your version of this file only
|
|
* under the terms of either the GPL or the LGPL, and not to allow others to
|
|
* use your version of this file under the terms of the MPL, indicate your
|
|
* decision by deleting the provisions above and replace them with the notice
|
|
* and other provisions required by the GPL or the LGPL. If you do not delete
|
|
* the provisions above, a recipient may use your version of this file under
|
|
* the terms of any one of the MPL, the GPL or the LGPL.
|
|
*
|
|
* ***** END LICENSE BLOCK *****
|
|
*
|
|
*
|
|
* Date: 14 Feb 2002
|
|
* SUMMARY: Performance: Regexp performance degraded from 4.7
|
|
* See http://bugzilla.mozilla.org/show_bug.cgi?id=85721
|
|
*
|
|
* Adjust this testcase if necessary. The FAST constant defines
|
|
* an upper bound in milliseconds for any execution to take.
|
|
*
|
|
*/
|
|
//-----------------------------------------------------------------------------
|
|
var bug = 85721;
|
|
var summary = 'Performance: execution of regular expression';
|
|
var FAST = 100; // execution should be 100 ms or less to pass the test
|
|
var MSG_FAST = 'Execution took less than ' + FAST + ' ms';
|
|
var MSG_SLOW = 'Execution took ';
|
|
var MSG_MS = ' ms';
|
|
var str = '';
|
|
var re = '';
|
|
var status = '';
|
|
var actual = '';
|
|
var expect= '';
|
|
|
|
printBugNumber (bug);
|
|
printStatus (summary);
|
|
|
|
|
|
function elapsedTime(startTime)
|
|
{
|
|
return new Date() - startTime;
|
|
}
|
|
|
|
|
|
function isThisFast(ms)
|
|
{
|
|
if (ms <= FAST)
|
|
return MSG_FAST;
|
|
return MSG_SLOW + ms + MSG_MS;
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
* The first regexp. We'll test for performance (Section 1) and accuracy (Section 2).
|
|
*/
|
|
str='<sql:connection id="conn1"> <sql:url>www.m.com</sql:url> <sql:driver>drive.class</sql:driver>\n<sql:userId>foo</sql:userId> <sql:password>goo</sql:password> </sql:connection>';
|
|
re = /<sql:connection id="([^\r\n]*?)">\s*<sql:url>\s*([^\r\n]*?)\s*<\/sql:url>\s*<sql:driver>\s*([^\r\n]*?)\s*<\/sql:driver>\s*(\s*<sql:userId>\s*([^\r\n]*?)\s*<\/sql:userId>\s*)?\s*(\s*<sql:password>\s*([^\r\n]*?)\s*<\/sql:password>\s*)?\s*<\/sql:connection>/;
|
|
expect = Array("<sql:connection id=\"conn1\"> <sql:url>www.m.com</sql:url> <sql:driver>drive.class</sql:driver>\n<sql:userId>foo</sql:userId> <sql:password>goo</sql:password> </sql:connection>","conn1","www.m.com","drive.class","<sql:userId>foo</sql:userId> ","foo","<sql:password>goo</sql:password> ","goo");
|
|
|
|
/*
|
|
* Check performance -
|
|
*/
|
|
status = inSection(1);
|
|
var start = new Date();
|
|
var result = re.exec(str);
|
|
actual = elapsedTime(start);
|
|
reportCompare(isThisFast(FAST), isThisFast(actual), status);
|
|
|
|
/*
|
|
* Check accuracy -
|
|
*/
|
|
status = inSection(2);
|
|
testRegExp([status], [re], [str], [result], [expect]);
|
|
|
|
|
|
|
|
/*
|
|
* The second regexp (HUGE!). We'll test for performance (Section 3) and accuracy (Section 4).
|
|
* It comes from the O'Reilly book "Mastering Regular Expressions" by Jeffrey Friedl, Appendix B
|
|
*/
|
|
|
|
//# Some things for avoiding backslashitis later on.
|
|
$esc = '\\\\';
|
|
$Period = '\.';
|
|
$space = '\040'; $tab = '\t';
|
|
$OpenBR = '\\['; $CloseBR = '\\]';
|
|
$OpenParen = '\\('; $CloseParen = '\\)';
|
|
$NonASCII = '\x80-\xff'; $ctrl = '\000-\037';
|
|
$CRlist = '\n\015'; //# note: this should really be only \015.
|
|
// Items 19, 20, 21
|
|
$qtext = '[^' + $esc + $NonASCII + $CRlist + '\"]'; // # for within "..."
|
|
$dtext = '[^' + $esc + $NonASCII + $CRlist + $OpenBR + $CloseBR + ']'; // # for within [...]
|
|
$quoted_pair = $esc + '[^' + $NonASCII + ']'; // # an escaped character
|
|
|
|
//##############################################################################
|
|
//# Items 22 and 23, comment.
|
|
//# Impossible to do properly with a regex, I make do by allowing at most one level of nesting.
|
|
$ctext = '[^' + $esc + $NonASCII + $CRlist + '()]';
|
|
|
|
//# $Cnested matches one non-nested comment.
|
|
//# It is unrolled, with normal of $ctext, special of $quoted_pair.
|
|
$Cnested =
|
|
$OpenParen + // # (
|
|
$ctext + '*' + // # normal*
|
|
'(?:' + $quoted_pair + $ctext + '*)*' + // # (special normal*)*
|
|
$CloseParen; // # )
|
|
|
|
|
|
//# $comment allows one level of nested parentheses
|
|
//# It is unrolled, with normal of $ctext, special of ($quoted_pair|$Cnested)
|
|
$comment =
|
|
$OpenParen + // # (
|
|
$ctext + '*' + // # normal*
|
|
'(?:' + // # (
|
|
'(?:' + $quoted_pair + '|' + $Cnested + ')' + // # special
|
|
$ctext + '*' + // # normal*
|
|
')*' + // # )*
|
|
$CloseParen; // # )
|
|
|
|
|
|
//##############################################################################
|
|
//# $X is optional whitespace/comments.
|
|
$X =
|
|
'[' + $space + $tab + ']*' + // # Nab whitespace.
|
|
'(?:' + $comment + '[' + $space + $tab + ']*)*'; // # If comment found, allow more spaces.
|
|
|
|
|
|
//# Item 10: atom
|
|
$atom_char = '[^(' + $space + '<>\@,;:\".' + $esc + $OpenBR + $CloseBR + $ctrl + $NonASCII + ']';
|
|
$atom =
|
|
$atom_char + '+' + // # some number of atom characters...
|
|
'(?!' + $atom_char + ')'; // # ..not followed by something that could be part of an atom
|
|
|
|
// # Item 11: doublequoted string, unrolled.
|
|
$quoted_str =
|
|
'\"' + // # "
|
|
$qtext + '*' + // # normal
|
|
'(?:' + $quoted_pair + $qtext + '*)*' + // # ( special normal* )*
|
|
'\"'; // # "
|
|
|
|
//# Item 7: word is an atom or quoted string
|
|
$word =
|
|
'(?:' +
|
|
$atom + // # Atom
|
|
'|' + // # or
|
|
$quoted_str + // # Quoted string
|
|
')'
|
|
|
|
//# Item 12: domain-ref is just an atom
|
|
$domain_ref = $atom;
|
|
|
|
//# Item 13: domain-literal is like a quoted string, but [...] instead of "..."
|
|
$domain_lit =
|
|
$OpenBR + // # [
|
|
'(?:' + $dtext + '|' + $quoted_pair + ')*' + // # stuff
|
|
$CloseBR; // # ]
|
|
|
|
// # Item 9: sub-domain is a domain-ref or domain-literal
|
|
$sub_domain =
|
|
'(?:' +
|
|
$domain_ref +
|
|
'|' +
|
|
$domain_lit +
|
|
')' +
|
|
$X; // # optional trailing comments
|
|
|
|
// # Item 6: domain is a list of subdomains separated by dots.
|
|
$domain =
|
|
$sub_domain +
|
|
'(?:' +
|
|
$Period + $X + $sub_domain +
|
|
')*';
|
|
|
|
//# Item 8: a route. A bunch of "@ $domain" separated by commas, followed by a colon.
|
|
$route =
|
|
'\@' + $X + $domain +
|
|
'(?:,' + $X + '\@' + $X + $domain + ')*' + // # additional domains
|
|
':' +
|
|
$X; // # optional trailing comments
|
|
|
|
//# Item 6: local-part is a bunch of $word separated by periods
|
|
$local_part =
|
|
$word + $X
|
|
'(?:' +
|
|
$Period + $X + $word + $X + // # additional words
|
|
')*';
|
|
|
|
// # Item 2: addr-spec is local@domain
|
|
$addr_spec =
|
|
$local_part + '\@' + $X + $domain;
|
|
|
|
//# Item 4: route-addr is <route? addr-spec>
|
|
$route_addr =
|
|
'<' + $X + // # <
|
|
'(?:' + $route + ')?' + // # optional route
|
|
$addr_spec + // # address spec
|
|
'>'; // # >
|
|
|
|
//# Item 3: phrase........
|
|
$phrase_ctrl = '\000-\010\012-\037'; // # like ctrl, but without tab
|
|
|
|
//# Like atom-char, but without listing space, and uses phrase_ctrl.
|
|
//# Since the class is negated, this matches the same as atom-char plus space and tab
|
|
$phrase_char =
|
|
'[^()<>\@,;:\".' + $esc + $OpenBR + $CloseBR + $NonASCII + $phrase_ctrl + ']';
|
|
|
|
// # We've worked it so that $word, $comment, and $quoted_str to not consume trailing $X
|
|
// # because we take care of it manually.
|
|
$phrase =
|
|
$word + // # leading word
|
|
$phrase_char + '*' + // # "normal" atoms and/or spaces
|
|
'(?:' +
|
|
'(?:' + $comment + '|' + $quoted_str + ')' + // # "special" comment or quoted string
|
|
$phrase_char + '*' + // # more "normal"
|
|
')*';
|
|
|
|
// ## Item #1: mailbox is an addr_spec or a phrase/route_addr
|
|
$mailbox =
|
|
$X + // # optional leading comment
|
|
'(?:' +
|
|
$phrase + $route_addr + // # name and address
|
|
'|' + // # or
|
|
$addr_spec + // # address
|
|
')';
|
|
|
|
|
|
//###########################################################################
|
|
|
|
|
|
re = new RegExp($mailbox, "g");
|
|
str = 'Jeffy<"That Tall Guy"@ora.com (this address is no longer active)>';
|
|
expect = Array('Jeffy<"That Tall Guy"@ora.com (this address is no longer active)>');
|
|
|
|
/*
|
|
* Check performance -
|
|
*/
|
|
status = inSection(3);
|
|
var start = new Date();
|
|
var result = re.exec(str);
|
|
actual = elapsedTime(start);
|
|
reportCompare(isThisFast(FAST), isThisFast(actual), status);
|
|
|
|
/*
|
|
* Check accuracy -
|
|
*/
|
|
status = inSection(4);
|
|
testRegExp([status], [re], [str], [result], [expect]);
|