tests/mozilla/ecma_3/Unicode/uc-005.js

   1 /* ***** BEGIN LICENSE BLOCK *****
   2 * Version: NPL 1.1/GPL 2.0/LGPL 2.1
   3 *
   4 * The contents of this file are subject to the Netscape Public License
   5 * Version 1.1 (the "License"); you may not use this file except in
   6 * compliance with the License. You may obtain a copy of the License at
   7 * http://www.mozilla.org/NPL/
   8 *
   9 * Software distributed under the License is distributed on an "AS IS" basis,
  10 * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
  11 * for the specific language governing rights and limitations under the
  12 * License.
  13 *
  14 * The Original Code is JavaScript Engine testing utilities.
  15 *
  16 * The Initial Developer of the Original Code is Netscape Communications Corp.
  17 * Portions created by the Initial Developer are Copyright (C) 2002
  18 * the Initial Developer. All Rights Reserved.
  19 *
  20 * Contributor(s): rogerl@netscape.com, pschwartau@netscape.com
  21 *
  22 * Alternatively, the contents of this file may be used under the terms of
  23 * either the GNU General Public License Version 2 or later (the "GPL"), or
  24 * the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
  25 * in which case the provisions of the GPL or the LGPL are applicable instead
  26 * of those above. If you wish to allow use of your version of this file only
  27 * under the terms of either the GPL or the LGPL, and not to allow others to
  28 * use your version of this file under the terms of the NPL, indicate your
  29 * decision by deleting the provisions above and replace them with the notice
  30 * and other provisions required by the GPL or the LGPL. If you do not delete
  31 * the provisions above, a recipient may use your version of this file under
  32 * the terms of any one of the NPL, the GPL or the LGPL.
  33 *
  34 * ***** END LICENSE BLOCK *****
  35 *
  36 *
  37 * Date:    15 July 2002
  38 * SUMMARY: Testing identifiers with double-byte names
  39 * See http://bugzilla.mozilla.org/show_bug.cgi?id=58274
  40 *
  41 * Here is a sample of the problem:
  42 *
  43 *    js> function f\u02B1 () {}
  44 *
  45 *    js> f\u02B1.toSource();
  46 *    function f¦() {}
  47 *
  48 *    js> f\u02B1.toSource().toSource();
  49 *    (new String("function f\xB1() {}"))
  50 *
  51 *
  52 * See how the high-byte information (the 02) has been lost?
  53 * The same thing was happening with the toString() method:
  54 *
  55 *    js> f\u02B1.toString();
  56 *
  57 *    function f¦() {
  58 *    }
  59 *
  60 *    js> f\u02B1.toString().toSource();
  61 *    (new String("\nfunction f\xB1() {\n}\n"))
  62 *
  63 */
  64 //-----------------------------------------------------------------------------
  65 var UBound = 0;
  66 var bug = 58274;
  67 var summary = 'Testing identifiers with double-byte names';
  68 var status = '';
  69 var statusitems = [];
  70 var actual = '';
  71 var actualvalues = [];
  72 var expect= '';
  73 var expectedvalues = [];
  74
  75
  76 /*
  77  * Define a function that uses double-byte identifiers in
  78  * "every possible way"
  79  *
  80  * Then recover each double-byte identifier via f.toString().
  81  * To make this easier, put a 'Z' token before every one.
  82  *
  83  * Our eval string will be:
  84  *
  85  * sEval = "function Z\u02b1(Z\u02b2, b) {
  86  *          try { Z\u02b3 : var Z\u02b4 = Z\u02b1; }
  87  *          catch (Z\u02b5) { for (var Z\u02b6 in Z\u02b5)
  88  *          {for (1; 1<0; Z\u02b7++) {new Array()[Z\u02b6] = 1;} };} }";
  89  *
  90  * It will be helpful to build this string in stages:
  91  */
  92 var s0 =  'function Z';
  93 var s1 =  '\u02b1(Z';
  94 var s2 =  '\u02b2, b) {try { Z';
  95 var s3 =  '\u02b3 : var Z';
  96 var s4 =  '\u02b4 = Z';
  97 var s5 =  '\u02b1; } catch (Z'
  98 var s6 =  '\u02b5) { for (var Z';
  99 var s7 =  '\u02b6 in Z';
 100 var s8 =  '\u02b5){for (1; 1<0; Z';
 101 var s9 =  '\u02b7++) {new Array()[Z';
 102 var s10 = '\u02b6] = 1;} };} }';
 103
 104
 105 /*
 106  * Concatenate these and eval() to create the function Z\u02b1
 107  */
 108 var sEval = s0 + s1 + s2 + s3 + s4 + s5 + s6 + s7 + s8 + s9 + s10;
 109 eval(sEval);
 110
 111
 112 /*
 113  * Recover all the double-byte identifiers via Z\u02b1.toString().
 114  * We'll recover the 1st one as arrID[1], the 2nd one as arrID[2],
 115  * and so on ...
 116  */
 117 var arrID = getIdentifiers(Z\u02b1);
 118
 119
 120 /*
 121  * Now check that we got back what we put in -
 122  */
 123 status = inSection(1);
 124 actual = arrID[1];
 125 expect = s1.charAt(0);
 126 addThis();
 127
 128 status = inSection(2);
 129 actual = arrID[2];
 130 expect = s2.charAt(0);
 131 addThis();
 132
 133 status = inSection(3);
 134 actual = arrID[3];
 135 expect = s3.charAt(0);
 136 addThis();
 137
 138 status = inSection(4);
 139 actual = arrID[4];
 140 expect = s4.charAt(0);
 141 addThis();
 142
 143 status = inSection(5);
 144 actual = arrID[5];
 145 expect = s5.charAt(0);
 146 addThis();
 147
 148 status = inSection(6);
 149 actual = arrID[6];
 150 expect = s6.charAt(0);
 151 addThis();
 152
 153 status = inSection(7);
 154 actual = arrID[7];
 155 expect = s7.charAt(0);
 156 addThis();
 157
 158 status = inSection(8);
 159 actual = arrID[8];
 160 expect = s8.charAt(0);
 161 addThis();
 162
 163 status = inSection(9);
 164 actual = arrID[9];
 165 expect = s9.charAt(0);
 166 addThis();
 167
 168 status = inSection(10);
 169 actual = arrID[10];
 170 expect = s10.charAt(0);
 171 addThis();
 172
 173
 174
 175
 176 //-----------------------------------------------------------------------------
 177 test();
 178 //-----------------------------------------------------------------------------
 179
 180
 181
 182 /*
 183  * Goal: recover the double-byte identifiers from f.toString()
 184  * by getting the very next character after each 'Z' token.
 185  *
 186  * The return value will be an array |arr| indexed such that
 187  * |arr[1]| is the 1st identifier, |arr[2]| the 2nd, and so on.
 188  *
 189  * Note, however, f.toString() is implementation-independent.
 190  * For example, it may begin with '\nfunction' instead of 'function'.
 191  *
 192  * Rhino uses a Unicode representation for f.toString(); whereas
 193  * SpiderMonkey uses an ASCII representation, putting escape sequences
 194  * for non-ASCII characters. For example, if a function is called f\u02B1,
 195  * then in Rhino the toString() method will present a 2-character Unicode
 196  * string for its name, whereas SpiderMonkey will present a 7-character
 197  * ASCII string for its name: the string literal 'f\u02B1'.
 198  *
 199  * So we force the lexer to condense the string before we use it.
 200  * This will give uniform results in Rhino and SpiderMonkey.
 201  */
 202 function getIdentifiers(f)
 203 {
 204   var str = condenseStr(f.toString());
 205   var arr = str.split('Z');
 206
 207   /*
 208    * The identifiers are the 1st char of each split substring
 209    * EXCEPT the first one, which is just ('\n' +) 'function '.
 210    *
 211    * Thus note the 1st identifier will be stored in |arr[1]|,
 212    * the 2nd one in |arr[2]|, etc., making the indexing easy -
 213    */
 214   for (i in arr)
 215     arr[i] = arr[i].charAt(0);
 216   return arr;
 217 }
 218
 219
 220 /*
 221  * This function is the opposite of a functions like escape(), which take
 222  * Unicode characters and return escape sequences for them. Here, we force
 223  * the lexer to turn escape sequences back into single characters.
 224  *
 225  * Note we can't simply do |eval(str)|, since in practice |str| will be an
 226  * identifier somewhere in the program (e.g. a function name); thus |eval(str)|
 227  * would return the object that the identifier represents: not what we want.
 228  *
 229  * So we surround |str| lexicographically with quotes to force the lexer to
 230  * evaluate it as a string. Have to strip out any linefeeds first, however -
 231  */
 232 function condenseStr(str)
 233 {
 234   /*
 235    * You won't be able to do the next step if |str| has
 236    * any carriage returns or linefeeds in it. For example:
 237    *
 238    *  js> eval("'" + '\nHello' + "'");
 239    *  1: SyntaxError: unterminated string literal:
 240    *  1: '
 241    *  1: ^
 242    *
 243    * So replace them with the empty string -
 244    */
 245   str = str.replace(/[\r\n]/g, '')
 246   return eval("'" + str + "'")
 247 }
 248
 249
 250 function addThis()
 251 {
 252   statusitems[UBound] = status;
 253   actualvalues[UBound] = actual;
 254   expectedvalues[UBound] = expect;
 255   UBound++;
 256 }
 257
 258
 259 function test()
 260 {
 261   enterFunc('test');
 262   printBugNumber(bug);
 263   printStatus(summary);
 264
 265   for (var i=0; i<UBound; i++)
 266   {
 267     reportCompare(expectedvalues[i], actualvalues[i], statusitems[i]);
 268   }
 269
 270   exitFunc ('test');
 271 }