rt/emul/mini/src/main/java/java/lang/String.java
author Jaroslav Tulach <jaroslav.tulach@apidesign.org>
Mon, 09 Sep 2013 15:26:12 +0200
changeset 1272 3ee4ec9577bc
parent 926 e5fe6bfca579
child 1310 635ee75d82a5
permissions -rw-r--r--
Basic implementation of String.split
jaroslav@49
     1
/*
jaroslav@49
     2
 * Copyright (c) 1994, 2010, Oracle and/or its affiliates. All rights reserved.
jaroslav@49
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
jaroslav@49
     4
 *
jaroslav@49
     5
 * This code is free software; you can redistribute it and/or modify it
jaroslav@49
     6
 * under the terms of the GNU General Public License version 2 only, as
jaroslav@49
     7
 * published by the Free Software Foundation.  Oracle designates this
jaroslav@49
     8
 * particular file as subject to the "Classpath" exception as provided
jaroslav@49
     9
 * by Oracle in the LICENSE file that accompanied this code.
jaroslav@49
    10
 *
jaroslav@49
    11
 * This code is distributed in the hope that it will be useful, but WITHOUT
jaroslav@49
    12
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
jaroslav@49
    13
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
jaroslav@49
    14
 * version 2 for more details (a copy is included in the LICENSE file that
jaroslav@49
    15
 * accompanied this code).
jaroslav@49
    16
 *
jaroslav@49
    17
 * You should have received a copy of the GNU General Public License version
jaroslav@49
    18
 * 2 along with this work; if not, write to the Free Software Foundation,
jaroslav@49
    19
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
jaroslav@49
    20
 *
jaroslav@49
    21
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
jaroslav@49
    22
 * or visit www.oracle.com if you need additional information or have any
jaroslav@49
    23
 * questions.
jaroslav@49
    24
 */
jaroslav@49
    25
jaroslav@49
    26
package java.lang;
jaroslav@49
    27
jaroslav@608
    28
import java.io.UnsupportedEncodingException;
jaroslav@240
    29
import java.util.Comparator;
jaroslav@93
    30
import org.apidesign.bck2brwsr.core.ExtraJavaScript;
jaroslav@240
    31
import org.apidesign.bck2brwsr.core.JavaScriptBody;
jaroslav@240
    32
import org.apidesign.bck2brwsr.core.JavaScriptOnly;
jaroslav@240
    33
import org.apidesign.bck2brwsr.core.JavaScriptPrototype;
jaroslav@560
    34
import org.apidesign.bck2brwsr.emul.lang.System;
jaroslav@49
    35
jaroslav@49
    36
/**
jaroslav@49
    37
 * The <code>String</code> class represents character strings. All
jaroslav@49
    38
 * string literals in Java programs, such as <code>"abc"</code>, are
jaroslav@49
    39
 * implemented as instances of this class.
jaroslav@49
    40
 * <p>
jaroslav@49
    41
 * Strings are constant; their values cannot be changed after they
jaroslav@49
    42
 * are created. String buffers support mutable strings.
jaroslav@49
    43
 * Because String objects are immutable they can be shared. For example:
jaroslav@49
    44
 * <p><blockquote><pre>
jaroslav@49
    45
 *     String str = "abc";
jaroslav@49
    46
 * </pre></blockquote><p>
jaroslav@49
    47
 * is equivalent to:
jaroslav@49
    48
 * <p><blockquote><pre>
jaroslav@49
    49
 *     char data[] = {'a', 'b', 'c'};
jaroslav@49
    50
 *     String str = new String(data);
jaroslav@49
    51
 * </pre></blockquote><p>
jaroslav@49
    52
 * Here are some more examples of how strings can be used:
jaroslav@49
    53
 * <p><blockquote><pre>
jaroslav@49
    54
 *     System.out.println("abc");
jaroslav@49
    55
 *     String cde = "cde";
jaroslav@49
    56
 *     System.out.println("abc" + cde);
jaroslav@49
    57
 *     String c = "abc".substring(2,3);
jaroslav@49
    58
 *     String d = cde.substring(1, 2);
jaroslav@49
    59
 * </pre></blockquote>
jaroslav@49
    60
 * <p>
jaroslav@49
    61
 * The class <code>String</code> includes methods for examining
jaroslav@49
    62
 * individual characters of the sequence, for comparing strings, for
jaroslav@49
    63
 * searching strings, for extracting substrings, and for creating a
jaroslav@49
    64
 * copy of a string with all characters translated to uppercase or to
jaroslav@49
    65
 * lowercase. Case mapping is based on the Unicode Standard version
jaroslav@49
    66
 * specified by the {@link java.lang.Character Character} class.
jaroslav@49
    67
 * <p>
jaroslav@49
    68
 * The Java language provides special support for the string
jaroslav@49
    69
 * concatenation operator (&nbsp;+&nbsp;), and for conversion of
jaroslav@49
    70
 * other objects to strings. String concatenation is implemented
jaroslav@49
    71
 * through the <code>StringBuilder</code>(or <code>StringBuffer</code>)
jaroslav@49
    72
 * class and its <code>append</code> method.
jaroslav@49
    73
 * String conversions are implemented through the method
jaroslav@49
    74
 * <code>toString</code>, defined by <code>Object</code> and
jaroslav@49
    75
 * inherited by all classes in Java. For additional information on
jaroslav@49
    76
 * string concatenation and conversion, see Gosling, Joy, and Steele,
jaroslav@49
    77
 * <i>The Java Language Specification</i>.
jaroslav@49
    78
 *
jaroslav@49
    79
 * <p> Unless otherwise noted, passing a <tt>null</tt> argument to a constructor
jaroslav@49
    80
 * or method in this class will cause a {@link NullPointerException} to be
jaroslav@49
    81
 * thrown.
jaroslav@49
    82
 *
jaroslav@49
    83
 * <p>A <code>String</code> represents a string in the UTF-16 format
jaroslav@49
    84
 * in which <em>supplementary characters</em> are represented by <em>surrogate
jaroslav@49
    85
 * pairs</em> (see the section <a href="Character.html#unicode">Unicode
jaroslav@49
    86
 * Character Representations</a> in the <code>Character</code> class for
jaroslav@49
    87
 * more information).
jaroslav@49
    88
 * Index values refer to <code>char</code> code units, so a supplementary
jaroslav@49
    89
 * character uses two positions in a <code>String</code>.
jaroslav@49
    90
 * <p>The <code>String</code> class provides methods for dealing with
jaroslav@49
    91
 * Unicode code points (i.e., characters), in addition to those for
jaroslav@49
    92
 * dealing with Unicode code units (i.e., <code>char</code> values).
jaroslav@49
    93
 *
jaroslav@49
    94
 * @author  Lee Boynton
jaroslav@49
    95
 * @author  Arthur van Hoff
jaroslav@49
    96
 * @author  Martin Buchholz
jaroslav@49
    97
 * @author  Ulf Zibis
jaroslav@49
    98
 * @see     java.lang.Object#toString()
jaroslav@49
    99
 * @see     java.lang.StringBuffer
jaroslav@49
   100
 * @see     java.lang.StringBuilder
jaroslav@49
   101
 * @see     java.nio.charset.Charset
jaroslav@49
   102
 * @since   JDK1.0
jaroslav@49
   103
 */
jaroslav@49
   104
jaroslav@93
   105
@ExtraJavaScript(
jaroslav@555
   106
    resource="/org/apidesign/vm4brwsr/emul/lang/java_lang_String.js",
jaroslav@240
   107
    processByteCode=true
jaroslav@93
   108
)
jaroslav@240
   109
@JavaScriptPrototype(container = "String.prototype", prototype = "new String")
jaroslav@49
   110
public final class String
jaroslav@49
   111
    implements java.io.Serializable, Comparable<String>, CharSequence
jaroslav@49
   112
{
jaroslav@240
   113
    /** real string to delegate to */
jaroslav@240
   114
    private Object r;
jaroslav@49
   115
jaroslav@49
   116
    /** use serialVersionUID from JDK 1.0.2 for interoperability */
jaroslav@49
   117
    private static final long serialVersionUID = -6849794470754667710L;
jaroslav@787
   118
jaroslav@787
   119
    // Runs once at class initialization: installs the JavaScript-side
    // toString/valueOf functions defined by registerToString().
    static {
        String.registerToString();
    }
jaroslav@787
   122
    @JavaScriptBody(args = {}, body = 
jaroslav@787
   123
          "var p = vm.java_lang_String(false);\n"
jaroslav@787
   124
        + "p.toString = function() {\nreturn this._r().toString();\n};\n"
jaroslav@787
   125
        + "p.valueOf = function() {\nreturn this._r().valueOf();\n}\n"
jaroslav@787
   126
    )
jaroslav@787
   127
    private static native void registerToString();
jaroslav@240
   128
    
jaroslav@49
   129
    /**
jaroslav@49
   130
     * Class String is special cased within the Serialization Stream Protocol.
jaroslav@49
   131
     *
jaroslav@49
   132
     * A String instance is written initially into an ObjectOutputStream in the
jaroslav@49
   133
     * following format:
jaroslav@49
   134
     * <pre>
jaroslav@49
   135
     *      <code>TC_STRING</code> (utf String)
jaroslav@49
   136
     * </pre>
jaroslav@49
   137
     * The String is written by method <code>DataOutput.writeUTF</code>.
jaroslav@49
   138
     * A new handle is generated to  refer to all future references to the
jaroslav@49
   139
     * string instance within the stream.
jaroslav@49
   140
     */
jaroslav@65
   141
//    private static final ObjectStreamField[] serialPersistentFields =
jaroslav@65
   142
//        new ObjectStreamField[0];
jaroslav@49
   143
jaroslav@49
   144
    /**
jaroslav@49
   145
     * Initializes a newly created {@code String} object so that it represents
jaroslav@49
   146
     * an empty character sequence.  Note that use of this constructor is
jaroslav@49
   147
     * unnecessary since Strings are immutable.
jaroslav@49
   148
     */
jaroslav@49
   149
    public String() {
jaroslav@241
   150
        this.r = "";
jaroslav@49
   151
    }
jaroslav@49
   152
jaroslav@49
   153
    /**
jaroslav@49
   154
     * Initializes a newly created {@code String} object so that it represents
jaroslav@49
   155
     * the same sequence of characters as the argument; in other words, the
jaroslav@49
   156
     * newly created string is a copy of the argument string. Unless an
jaroslav@49
   157
     * explicit copy of {@code original} is needed, use of this constructor is
jaroslav@49
   158
     * unnecessary since Strings are immutable.
jaroslav@49
   159
     *
jaroslav@49
   160
     * @param  original
jaroslav@49
   161
     *         A {@code String}
jaroslav@49
   162
     */
jaroslav@49
   163
    public String(String original) {
jaroslav@241
   164
        this.r = original.toString();
jaroslav@49
   165
    }
jaroslav@49
   166
jaroslav@49
   167
    /**
jaroslav@49
   168
     * Allocates a new {@code String} so that it represents the sequence of
jaroslav@49
   169
     * characters currently contained in the character array argument. The
jaroslav@49
   170
     * contents of the character array are copied; subsequent modification of
jaroslav@49
   171
     * the character array does not affect the newly created string.
jaroslav@49
   172
     *
jaroslav@49
   173
     * @param  value
jaroslav@49
   174
     *         The initial value of the string
jaroslav@49
   175
     */
jaroslav@443
   176
    @JavaScriptBody(args = { "charArr" }, body=
jaroslav@240
   177
        "for (var i = 0; i < charArr.length; i++) {\n"
jaroslav@240
   178
      + "  if (typeof charArr[i] === 'number') charArr[i] = String.fromCharCode(charArr[i]);\n"
jaroslav@240
   179
      + "}\n"
jaroslav@592
   180
      + "this._r(charArr.join(''));\n"
jaroslav@240
   181
    )
jaroslav@49
   182
    public String(char value[]) {
jaroslav@49
   183
    }
jaroslav@49
   184
jaroslav@49
   185
    /**
jaroslav@49
   186
     * Allocates a new {@code String} that contains characters from a subarray
jaroslav@49
   187
     * of the character array argument. The {@code offset} argument is the
jaroslav@49
   188
     * index of the first character of the subarray and the {@code count}
jaroslav@49
   189
     * argument specifies the length of the subarray. The contents of the
jaroslav@49
   190
     * subarray are copied; subsequent modification of the character array does
jaroslav@49
   191
     * not affect the newly created string.
jaroslav@49
   192
     *
jaroslav@49
   193
     * @param  value
jaroslav@49
   194
     *         Array that is the source of characters
jaroslav@49
   195
     *
jaroslav@49
   196
     * @param  offset
jaroslav@49
   197
     *         The initial offset
jaroslav@49
   198
     *
jaroslav@49
   199
     * @param  count
jaroslav@49
   200
     *         The length
jaroslav@49
   201
     *
jaroslav@49
   202
     * @throws  IndexOutOfBoundsException
jaroslav@49
   203
     *          If the {@code offset} and {@code count} arguments index
jaroslav@49
   204
     *          characters outside the bounds of the {@code value} array
jaroslav@49
   205
     */
jaroslav@611
   206
    public String(char value[], int offset, int count) {
        // Enforce the documented IndexOutOfBoundsException contract; the
        // native helper below does not validate the requested range itself.
        if (offset < 0) {
            throw new StringIndexOutOfBoundsException(offset);
        }
        if (count < 0) {
            throw new StringIndexOutOfBoundsException(count);
        }
        // Compare against length - count so that offset + count cannot overflow.
        if (offset > value.length - count) {
            throw new StringIndexOutOfBoundsException(offset + count);
        }
        initFromCharArray(value, offset, count);
    }
jaroslav@611
   209
    
jaroslav@443
   210
    @JavaScriptBody(args = { "charArr", "off", "cnt" }, body =
jaroslav@240
   211
        "var up = off + cnt;\n" +
jaroslav@240
   212
        "for (var i = off; i < up; i++) {\n" +
jaroslav@240
   213
        "  if (typeof charArr[i] === 'number') charArr[i] = String.fromCharCode(charArr[i]);\n" +
jaroslav@240
   214
        "}\n" +
jaroslav@592
   215
        "this._r(charArr.slice(off, up).join(\"\"));\n"
jaroslav@240
   216
    )
jaroslav@611
   217
    private native void initFromCharArray(char value[], int offset, int count);
jaroslav@49
   218
jaroslav@49
   219
    /**
jaroslav@49
   220
     * Allocates a new {@code String} that contains characters from a subarray
jaroslav@49
   221
     * of the <a href="Character.html#unicode">Unicode code point</a> array
jaroslav@49
   222
     * argument.  The {@code offset} argument is the index of the first code
jaroslav@49
   223
     * point of the subarray and the {@code count} argument specifies the
jaroslav@49
   224
     * length of the subarray.  The contents of the subarray are converted to
jaroslav@49
   225
     * {@code char}s; subsequent modification of the {@code int} array does not
jaroslav@49
   226
     * affect the newly created string.
jaroslav@49
   227
     *
jaroslav@49
   228
     * @param  codePoints
jaroslav@49
   229
     *         Array that is the source of Unicode code points
jaroslav@49
   230
     *
jaroslav@49
   231
     * @param  offset
jaroslav@49
   232
     *         The initial offset
jaroslav@49
   233
     *
jaroslav@49
   234
     * @param  count
jaroslav@49
   235
     *         The length
jaroslav@49
   236
     *
jaroslav@49
   237
     * @throws  IllegalArgumentException
jaroslav@49
   238
     *          If any invalid Unicode code point is found in {@code
jaroslav@49
   239
     *          codePoints}
jaroslav@49
   240
     *
jaroslav@49
   241
     * @throws  IndexOutOfBoundsException
jaroslav@49
   242
     *          If the {@code offset} and {@code count} arguments index
jaroslav@49
   243
     *          characters outside the bounds of the {@code codePoints} array
jaroslav@49
   244
     *
jaroslav@49
   245
     * @since  1.5
jaroslav@49
   246
     */
jaroslav@49
   247
    public String(int[] codePoints, int offset, int count) {
        if (offset < 0) {
            throw new StringIndexOutOfBoundsException(offset);
        }
        if (count < 0) {
            throw new StringIndexOutOfBoundsException(count);
        }
        // Note: offset or count might be near -1>>>1, so compare against
        // length - count instead of computing offset + count first.
        if (offset > codePoints.length - count) {
            throw new StringIndexOutOfBoundsException(offset + count);
        }

        final int end = offset + count;

        // Pass 1: compute the precise size of the char[]. Every code point
        // outside the BMP needs one extra slot; invalid ones are rejected.
        int n = count;
        for (int i = offset; i < end; i++) {
            final int c = codePoints[i];
            if (Character.isBmpCodePoint(c)) {
                continue;
            }
            if (!Character.isValidCodePoint(c)) {
                throw new IllegalArgumentException(Integer.toString(c));
            }
            n++;
        }

        // Pass 2: allocate and fill in the char[].
        final char[] v = new char[n];
        for (int i = offset, j = 0; i < end; i++, j++) {
            final int c = codePoints[i];
            if (Character.isBmpCodePoint(c)) {
                v[j] = (char) c;
            } else {
                // A supplementary code point occupies two slots (see pass 1),
                // hence the additional j++ on top of the loop increment.
                Character.toSurrogates(c, v, j++);
            }
        }

        // Initialize the delegate directly, like the other constructors do,
        // instead of storing another String wrapper object in r.
        initFromCharArray(v, 0, n);
    }
jaroslav@49
   285
jaroslav@49
   286
    /**
jaroslav@49
   287
     * Allocates a new {@code String} constructed from a subarray of an array
jaroslav@49
   288
     * of 8-bit integer values.
jaroslav@49
   289
     *
jaroslav@49
   290
     * <p> The {@code offset} argument is the index of the first byte of the
jaroslav@49
   291
     * subarray, and the {@code count} argument specifies the length of the
jaroslav@49
   292
     * subarray.
jaroslav@49
   293
     *
jaroslav@49
   294
     * <p> Each {@code byte} in the subarray is converted to a {@code char} as
jaroslav@49
   295
     * specified in the method above.
jaroslav@49
   296
     *
jaroslav@49
   297
     * @deprecated This method does not properly convert bytes into characters.
jaroslav@49
   298
     * As of JDK&nbsp;1.1, the preferred way to do this is via the
jaroslav@49
   299
     * {@code String} constructors that take a {@link
jaroslav@49
   300
     * java.nio.charset.Charset}, charset name, or that use the platform's
jaroslav@49
   301
     * default charset.
jaroslav@49
   302
     *
jaroslav@49
   303
     * @param  ascii
jaroslav@49
   304
     *         The bytes to be converted to characters
jaroslav@49
   305
     *
jaroslav@49
   306
     * @param  hibyte
jaroslav@49
   307
     *         The top 8 bits of each 16-bit Unicode code unit
jaroslav@49
   308
     *
jaroslav@49
   309
     * @param  offset
jaroslav@49
   310
     *         The initial offset
jaroslav@49
   311
     * @param  count
jaroslav@49
   312
     *         The length
jaroslav@49
   313
     *
jaroslav@49
   314
     * @throws  IndexOutOfBoundsException
jaroslav@49
   315
     *          If the {@code offset} or {@code count} argument is invalid
jaroslav@49
   316
     *
jaroslav@49
   317
     * @see  #String(byte[], int)
jaroslav@49
   318
     * @see  #String(byte[], int, int, java.lang.String)
jaroslav@49
   319
     * @see  #String(byte[], int, int, java.nio.charset.Charset)
jaroslav@49
   320
     * @see  #String(byte[], int, int)
jaroslav@49
   321
     * @see  #String(byte[], java.lang.String)
jaroslav@49
   322
     * @see  #String(byte[], java.nio.charset.Charset)
jaroslav@49
   323
     * @see  #String(byte[])
jaroslav@49
   324
     */
jaroslav@49
   325
    @Deprecated
jaroslav@49
   326
    public String(byte ascii[], int hibyte, int offset, int count) {
jaroslav@49
   327
        checkBounds(ascii, offset, count);
jaroslav@49
   328
        char value[] = new char[count];
jaroslav@49
   329
jaroslav@49
   330
        if (hibyte == 0) {
jaroslav@49
   331
            for (int i = count ; i-- > 0 ;) {
jaroslav@49
   332
                value[i] = (char) (ascii[i + offset] & 0xff);
jaroslav@49
   333
            }
jaroslav@49
   334
        } else {
jaroslav@49
   335
            hibyte <<= 8;
jaroslav@49
   336
            for (int i = count ; i-- > 0 ;) {
jaroslav@49
   337
                value[i] = (char) (hibyte | (ascii[i + offset] & 0xff));
jaroslav@49
   338
            }
jaroslav@49
   339
        }
jaroslav@670
   340
        initFromCharArray(value, offset, count);
jaroslav@49
   341
    }
jaroslav@49
   342
jaroslav@49
   343
    /**
jaroslav@49
   344
     * Allocates a new {@code String} containing characters constructed from
jaroslav@49
   345
     * an array of 8-bit integer values. Each character <i>c</i> in the
jaroslav@49
   346
     * resulting string is constructed from the corresponding component
jaroslav@49
   347
     * <i>b</i> in the byte array such that:
jaroslav@49
   348
     *
jaroslav@49
   349
     * <blockquote><pre>
jaroslav@49
   350
     *     <b><i>c</i></b> == (char)(((hibyte &amp; 0xff) &lt;&lt; 8)
jaroslav@49
   351
     *                         | (<b><i>b</i></b> &amp; 0xff))
jaroslav@49
   352
     * </pre></blockquote>
jaroslav@49
   353
     *
jaroslav@49
   354
     * @deprecated  This method does not properly convert bytes into
jaroslav@49
   355
     * characters.  As of JDK&nbsp;1.1, the preferred way to do this is via the
jaroslav@49
   356
     * {@code String} constructors that take a {@link
jaroslav@49
   357
     * java.nio.charset.Charset}, charset name, or that use the platform's
jaroslav@49
   358
     * default charset.
jaroslav@49
   359
     *
jaroslav@49
   360
     * @param  ascii
jaroslav@49
   361
     *         The bytes to be converted to characters
jaroslav@49
   362
     *
jaroslav@49
   363
     * @param  hibyte
jaroslav@49
   364
     *         The top 8 bits of each 16-bit Unicode code unit
jaroslav@49
   365
     *
jaroslav@49
   366
     * @see  #String(byte[], int, int, java.lang.String)
jaroslav@49
   367
     * @see  #String(byte[], int, int, java.nio.charset.Charset)
jaroslav@49
   368
     * @see  #String(byte[], int, int)
jaroslav@49
   369
     * @see  #String(byte[], java.lang.String)
jaroslav@49
   370
     * @see  #String(byte[], java.nio.charset.Charset)
jaroslav@49
   371
     * @see  #String(byte[])
jaroslav@49
   372
     */
jaroslav@49
   373
    @Deprecated
    public String(byte[] ascii, int hibyte) {
        // Whole-array variant: delegates with offset 0 and the full length.
        this(ascii, hibyte, 0, ascii.length);
    }
jaroslav@49
   377
jaroslav@49
   378
    /* Common private utility method used to bounds check the byte array
jaroslav@49
   379
     * and requested offset & length values used by the String(byte[],..)
jaroslav@49
   380
     * constructors.
jaroslav@49
   381
     */
jaroslav@49
   382
    private static void checkBounds(byte[] bytes, int offset, int length) {
jaroslav@49
   383
        if (length < 0)
jaroslav@49
   384
            throw new StringIndexOutOfBoundsException(length);
jaroslav@49
   385
        if (offset < 0)
jaroslav@49
   386
            throw new StringIndexOutOfBoundsException(offset);
jaroslav@49
   387
        if (offset > bytes.length - length)
jaroslav@49
   388
            throw new StringIndexOutOfBoundsException(offset + length);
jaroslav@49
   389
    }
jaroslav@49
   390
jaroslav@49
   391
    /**
jaroslav@49
   392
     * Constructs a new {@code String} by decoding the specified subarray of
jaroslav@49
   393
     * bytes using the specified charset.  The length of the new {@code String}
jaroslav@49
   394
     * is a function of the charset, and hence may not be equal to the length
jaroslav@49
   395
     * of the subarray.
jaroslav@49
   396
     *
jaroslav@49
   397
     * <p> The behavior of this constructor when the given bytes are not valid
jaroslav@49
   398
     * in the given charset is unspecified.  The {@link
jaroslav@49
   399
     * java.nio.charset.CharsetDecoder} class should be used when more control
jaroslav@49
   400
     * over the decoding process is required.
jaroslav@49
   401
     *
jaroslav@49
   402
     * @param  bytes
jaroslav@49
   403
     *         The bytes to be decoded into characters
jaroslav@49
   404
     *
jaroslav@49
   405
     * @param  offset
jaroslav@49
   406
     *         The index of the first byte to decode
jaroslav@49
   407
     *
jaroslav@49
   408
     * @param  length
jaroslav@49
   409
     *         The number of bytes to decode
jaroslav@49
   410
jaroslav@49
   411
     * @param  charsetName
jaroslav@49
   412
     *         The name of a supported {@linkplain java.nio.charset.Charset
jaroslav@49
   413
     *         charset}
jaroslav@49
   414
     *
jaroslav@49
   415
     * @throws  UnsupportedEncodingException
jaroslav@49
   416
     *          If the named charset is not supported
jaroslav@49
   417
     *
jaroslav@49
   418
     * @throws  IndexOutOfBoundsException
jaroslav@49
   419
     *          If the {@code offset} and {@code length} arguments index
jaroslav@49
   420
     *          characters outside the bounds of the {@code bytes} array
jaroslav@49
   421
     *
jaroslav@49
   422
     * @since  JDK1.1
jaroslav@49
   423
     */
jaroslav@608
   424
    public String(byte[] bytes, int offset, int length, String charsetName)
            throws UnsupportedEncodingException {
        // checkUTF8 is declared elsewhere in this class; the array it returns
        // is decoded by the (byte[], int, int) constructor.
        this(checkUTF8(bytes, charsetName), offset, length);
    }
jaroslav@49
   429
jaroslav@49
   430
    /**
jaroslav@49
   431
     * Constructs a new {@code String} by decoding the specified subarray of
jaroslav@49
   432
     * bytes using the specified {@linkplain java.nio.charset.Charset charset}.
jaroslav@49
   433
     * The length of the new {@code String} is a function of the charset, and
jaroslav@49
   434
     * hence may not be equal to the length of the subarray.
jaroslav@49
   435
     *
jaroslav@49
   436
     * <p> This method always replaces malformed-input and unmappable-character
jaroslav@49
   437
     * sequences with this charset's default replacement string.  The {@link
jaroslav@49
   438
     * java.nio.charset.CharsetDecoder} class should be used when more control
jaroslav@49
   439
     * over the decoding process is required.
jaroslav@49
   440
     *
jaroslav@49
   441
     * @param  bytes
jaroslav@49
   442
     *         The bytes to be decoded into characters
jaroslav@49
   443
     *
jaroslav@49
   444
     * @param  offset
jaroslav@49
   445
     *         The index of the first byte to decode
jaroslav@49
   446
     *
jaroslav@49
   447
     * @param  length
jaroslav@49
   448
     *         The number of bytes to decode
jaroslav@49
   449
     *
jaroslav@49
   450
     * @param  charset
jaroslav@49
   451
     *         The {@linkplain java.nio.charset.Charset charset} to be used to
jaroslav@49
   452
     *         decode the {@code bytes}
jaroslav@49
   453
     *
jaroslav@49
   454
     * @throws  IndexOutOfBoundsException
jaroslav@49
   455
     *          If the {@code offset} and {@code length} arguments index
jaroslav@49
   456
     *          characters outside the bounds of the {@code bytes} array
jaroslav@49
   457
     *
jaroslav@49
   458
     * @since  1.6
jaroslav@49
   459
     */
jaroslav@61
   460
    /* don't want dependency on Charset
jaroslav@49
   461
    public String(byte bytes[], int offset, int length, Charset charset) {
jaroslav@49
   462
        if (charset == null)
jaroslav@49
   463
            throw new NullPointerException("charset");
jaroslav@49
   464
        checkBounds(bytes, offset, length);
jaroslav@49
   465
        char[] v = StringCoding.decode(charset, bytes, offset, length);
jaroslav@49
   466
        this.offset = 0;
jaroslav@49
   467
        this.count = v.length;
jaroslav@49
   468
        this.value = v;
jaroslav@49
   469
    }
jaroslav@61
   470
    */
jaroslav@49
   471
jaroslav@49
   472
    /**
jaroslav@49
   473
     * Constructs a new {@code String} by decoding the specified array of bytes
jaroslav@49
   474
     * using the specified {@linkplain java.nio.charset.Charset charset}.  The
jaroslav@49
   475
     * length of the new {@code String} is a function of the charset, and hence
jaroslav@49
   476
     * may not be equal to the length of the byte array.
jaroslav@49
   477
     *
jaroslav@49
   478
     * <p> The behavior of this constructor when the given bytes are not valid
jaroslav@49
   479
     * in the given charset is unspecified.  The {@link
jaroslav@49
   480
     * java.nio.charset.CharsetDecoder} class should be used when more control
jaroslav@49
   481
     * over the decoding process is required.
jaroslav@49
   482
     *
jaroslav@49
   483
     * @param  bytes
jaroslav@49
   484
     *         The bytes to be decoded into characters
jaroslav@49
   485
     *
jaroslav@49
   486
     * @param  charsetName
jaroslav@49
   487
     *         The name of a supported {@linkplain java.nio.charset.Charset
jaroslav@49
   488
     *         charset}
jaroslav@49
   489
     *
jaroslav@49
   490
     * @throws  UnsupportedEncodingException
jaroslav@49
   491
     *          If the named charset is not supported
jaroslav@49
   492
     *
jaroslav@49
   493
     * @since  JDK1.1
jaroslav@49
   494
     */
jaroslav@608
   495
    public String(byte[] bytes, String charsetName)
            throws UnsupportedEncodingException {
        // Whole-array variant: delegates with offset 0 and the full length.
        this(bytes, 0, bytes.length, charsetName);
    }
jaroslav@49
   500
jaroslav@49
   501
    /**
jaroslav@49
   502
     * Constructs a new {@code String} by decoding the specified array of
jaroslav@49
   503
     * bytes using the specified {@linkplain java.nio.charset.Charset charset}.
jaroslav@49
   504
     * The length of the new {@code String} is a function of the charset, and
jaroslav@49
   505
     * hence may not be equal to the length of the byte array.
jaroslav@49
   506
     *
jaroslav@49
   507
     * <p> This method always replaces malformed-input and unmappable-character
jaroslav@49
   508
     * sequences with this charset's default replacement string.  The {@link
jaroslav@49
   509
     * java.nio.charset.CharsetDecoder} class should be used when more control
jaroslav@49
   510
     * over the decoding process is required.
jaroslav@49
   511
     *
jaroslav@49
   512
     * @param  bytes
jaroslav@49
   513
     *         The bytes to be decoded into characters
jaroslav@49
   514
     *
jaroslav@49
   515
     * @param  charset
jaroslav@49
   516
     *         The {@linkplain java.nio.charset.Charset charset} to be used to
jaroslav@49
   517
     *         decode the {@code bytes}
jaroslav@49
   518
     *
jaroslav@49
   519
     * @since  1.6
jaroslav@49
   520
     */
jaroslav@61
   521
    /* don't want dep on Charset
jaroslav@49
   522
    public String(byte bytes[], Charset charset) {
jaroslav@49
   523
        this(bytes, 0, bytes.length, charset);
jaroslav@49
   524
    }
jaroslav@61
   525
    */
jaroslav@49
   526
jaroslav@49
   527
    /**
jaroslav@49
   528
     * Constructs a new {@code String} by decoding the specified subarray of
jaroslav@49
   529
     * bytes using the platform's default charset.  The length of the new
jaroslav@49
   530
     * {@code String} is a function of the charset, and hence may not be equal
jaroslav@49
   531
     * to the length of the subarray.
jaroslav@49
   532
     *
jaroslav@49
   533
     * <p> The behavior of this constructor when the given bytes are not valid
jaroslav@49
   534
     * in the default charset is unspecified.  The {@link
jaroslav@49
   535
     * java.nio.charset.CharsetDecoder} class should be used when more control
jaroslav@49
   536
     * over the decoding process is required.
jaroslav@49
   537
     *
jaroslav@49
   538
     * @param  bytes
jaroslav@49
   539
     *         The bytes to be decoded into characters
jaroslav@49
   540
     *
jaroslav@49
   541
     * @param  offset
jaroslav@49
   542
     *         The index of the first byte to decode
jaroslav@49
   543
     *
jaroslav@49
   544
     * @param  length
jaroslav@49
   545
     *         The number of bytes to decode
jaroslav@49
   546
     *
jaroslav@49
   547
     * @throws  IndexOutOfBoundsException
jaroslav@49
   548
     *          If the {@code offset} and the {@code length} arguments index
jaroslav@49
   549
     *          characters outside the bounds of the {@code bytes} array
jaroslav@49
   550
     *
jaroslav@49
   551
     * @since  JDK1.1
jaroslav@49
   552
     */
jaroslav@49
   553
    public String(byte bytes[], int offset, int length) {
jaroslav@49
   554
        checkBounds(bytes, offset, length);
jaroslav@75
   555
        char[] v  = new char[length];
jaroslav@608
   556
        int[] at = { offset };
jaroslav@608
   557
        int end = offset + length;
jaroslav@608
   558
        int chlen = 0;
jaroslav@608
   559
        while (at[0] < end) {
jaroslav@608
   560
            int ch = nextChar(bytes, at);
jaroslav@608
   561
            v[chlen++] = (char)ch;
jaroslav@75
   562
        }
jaroslav@611
   563
        initFromCharArray(v, 0, chlen);
jaroslav@49
   564
    }
jaroslav@49
   565
jaroslav@49
   566
    /**
jaroslav@49
   567
     * Constructs a new {@code String} by decoding the specified array of bytes
jaroslav@49
   568
     * using the platform's default charset.  The length of the new {@code
jaroslav@49
   569
     * String} is a function of the charset, and hence may not be equal to the
jaroslav@49
   570
     * length of the byte array.
jaroslav@49
   571
     *
jaroslav@49
   572
     * <p> The behavior of this constructor when the given bytes are not valid
jaroslav@49
   573
     * in the default charset is unspecified.  The {@link
jaroslav@49
   574
     * java.nio.charset.CharsetDecoder} class should be used when more control
jaroslav@49
   575
     * over the decoding process is required.
jaroslav@49
   576
     *
jaroslav@49
   577
     * @param  bytes
jaroslav@49
   578
     *         The bytes to be decoded into characters
jaroslav@49
   579
     *
jaroslav@49
   580
     * @since  JDK1.1
jaroslav@49
   581
     */
jaroslav@49
   582
    public String(byte bytes[]) {
        // Whole-array variant: decode from index 0 across every byte.
        this(bytes, 0, bytes.length);
    }
jaroslav@49
   585
jaroslav@49
   586
    /**
jaroslav@49
   587
     * Allocates a new string that contains the sequence of characters
jaroslav@49
   588
     * currently contained in the string buffer argument. The contents of the
jaroslav@49
   589
     * string buffer are copied; subsequent modification of the string buffer
jaroslav@49
   590
     * does not affect the newly created string.
jaroslav@49
   591
     *
jaroslav@49
   592
     * @param  buffer
jaroslav@49
   593
     *         A {@code StringBuffer}
jaroslav@49
   594
     */
jaroslav@49
   595
    public String(StringBuffer buffer) {
jaroslav@241
   596
        this.r = buffer.toString();
jaroslav@49
   597
    }
jaroslav@49
   598
jaroslav@49
   599
    /**
jaroslav@49
   600
     * Allocates a new string that contains the sequence of characters
jaroslav@49
   601
     * currently contained in the string builder argument. The contents of the
jaroslav@49
   602
     * string builder are copied; subsequent modification of the string builder
jaroslav@49
   603
     * does not affect the newly created string.
jaroslav@49
   604
     *
jaroslav@49
   605
     * <p> This constructor is provided to ease migration to {@code
jaroslav@49
   606
     * StringBuilder}. Obtaining a string from a string builder via the {@code
jaroslav@49
   607
     * toString} method is likely to run faster and is generally preferred.
jaroslav@49
   608
     *
jaroslav@49
   609
     * @param   builder
jaroslav@49
   610
     *          A {@code StringBuilder}
jaroslav@49
   611
     *
jaroslav@49
   612
     * @since  1.5
jaroslav@49
   613
     */
jaroslav@49
   614
    public String(StringBuilder builder) {
jaroslav@241
   615
        this.r = builder.toString();
jaroslav@49
   616
    }
jaroslav@49
   617
jaroslav@49
   618
    /**
jaroslav@49
   619
     * Returns the length of this string.
jaroslav@49
   620
     * The length is equal to the number of <a href="Character.html#unicode">Unicode
jaroslav@49
   621
     * code units</a> in the string.
jaroslav@49
   622
     *
jaroslav@49
   623
     * @return  the length of the sequence of characters represented by this
jaroslav@49
   624
     *          object.
jaroslav@49
   625
     */
jaroslav@443
   626
    @JavaScriptBody(args = {}, body = "return this.toString().length;")
jaroslav@49
   627
    public int length() {
jaroslav@241
   628
        throw new UnsupportedOperationException();
jaroslav@49
   629
    }
jaroslav@49
   630
jaroslav@49
   631
    /**
jaroslav@49
   632
     * Returns <tt>true</tt> if, and only if, {@link #length()} is <tt>0</tt>.
jaroslav@49
   633
     *
jaroslav@49
   634
     * @return <tt>true</tt> if {@link #length()} is <tt>0</tt>, otherwise
jaroslav@49
   635
     * <tt>false</tt>
jaroslav@49
   636
     *
jaroslav@49
   637
     * @since 1.6
jaroslav@49
   638
     */
jaroslav@443
   639
    @JavaScriptBody(args = {}, body="return this.toString().length === 0;")
jaroslav@49
   640
    public boolean isEmpty() {
jaroslav@241
   641
        return length() == 0;
jaroslav@49
   642
    }
jaroslav@49
   643
jaroslav@49
   644
    /**
jaroslav@49
   645
     * Returns the <code>char</code> value at the
jaroslav@49
   646
     * specified index. An index ranges from <code>0</code> to
jaroslav@49
   647
     * <code>length() - 1</code>. The first <code>char</code> value of the sequence
jaroslav@49
   648
     * is at index <code>0</code>, the next at index <code>1</code>,
jaroslav@49
   649
     * and so on, as for array indexing.
jaroslav@49
   650
     *
jaroslav@49
   651
     * <p>If the <code>char</code> value specified by the index is a
jaroslav@49
   652
     * <a href="Character.html#unicode">surrogate</a>, the surrogate
jaroslav@49
   653
     * value is returned.
jaroslav@49
   654
     *
jaroslav@49
   655
     * @param      index   the index of the <code>char</code> value.
jaroslav@49
   656
     * @return     the <code>char</code> value at the specified index of this string.
jaroslav@49
   657
     *             The first <code>char</code> value is at index <code>0</code>.
jaroslav@49
   658
     * @exception  IndexOutOfBoundsException  if the <code>index</code>
jaroslav@49
   659
     *             argument is negative or not less than the length of this
jaroslav@49
   660
     *             string.
jaroslav@49
   661
     */
jaroslav@443
   662
    @JavaScriptBody(args = { "index" }, 
jaroslav@443
   663
        body = "return this.toString().charCodeAt(index);"
jaroslav@240
   664
    )
jaroslav@49
   665
    public char charAt(int index) {
jaroslav@241
   666
        throw new UnsupportedOperationException();
jaroslav@49
   667
    }
jaroslav@49
   668
jaroslav@49
   669
    /**
jaroslav@49
   670
     * Returns the character (Unicode code point) at the specified
jaroslav@49
   671
     * index. The index refers to <code>char</code> values
jaroslav@49
   672
     * (Unicode code units) and ranges from <code>0</code> to
jaroslav@49
   673
     * {@link #length()}<code> - 1</code>.
jaroslav@49
   674
     *
jaroslav@49
   675
     * <p> If the <code>char</code> value specified at the given index
jaroslav@49
   676
     * is in the high-surrogate range, the following index is less
jaroslav@49
   677
     * than the length of this <code>String</code>, and the
jaroslav@49
   678
     * <code>char</code> value at the following index is in the
jaroslav@49
   679
     * low-surrogate range, then the supplementary code point
jaroslav@49
   680
     * corresponding to this surrogate pair is returned. Otherwise,
jaroslav@49
   681
     * the <code>char</code> value at the given index is returned.
jaroslav@49
   682
     *
jaroslav@49
   683
     * @param      index the index to the <code>char</code> values
jaroslav@49
   684
     * @return     the code point value of the character at the
jaroslav@49
   685
     *             <code>index</code>
jaroslav@49
   686
     * @exception  IndexOutOfBoundsException  if the <code>index</code>
jaroslav@49
   687
     *             argument is negative or not less than the length of this
jaroslav@49
   688
     *             string.
jaroslav@49
   689
     * @since      1.5
jaroslav@49
   690
     */
jaroslav@49
   691
    public int codePointAt(int index) {
jaroslav@241
   692
        if ((index < 0) || (index >= length())) {
jaroslav@49
   693
            throw new StringIndexOutOfBoundsException(index);
jaroslav@49
   694
        }
jaroslav@241
   695
        return Character.codePointAtImpl(toCharArray(), offset() + index, offset() + length());
jaroslav@49
   696
    }
jaroslav@49
   697
jaroslav@49
   698
    /**
jaroslav@49
   699
     * Returns the character (Unicode code point) before the specified
jaroslav@49
   700
     * index. The index refers to <code>char</code> values
jaroslav@49
   701
     * (Unicode code units) and ranges from <code>1</code> to {@link
jaroslav@49
   702
     * CharSequence#length() length}.
jaroslav@49
   703
     *
jaroslav@49
   704
     * <p> If the <code>char</code> value at <code>(index - 1)</code>
jaroslav@49
   705
     * is in the low-surrogate range, <code>(index - 2)</code> is not
jaroslav@49
   706
     * negative, and the <code>char</code> value at <code>(index -
jaroslav@49
   707
     * 2)</code> is in the high-surrogate range, then the
jaroslav@49
   708
     * supplementary code point value of the surrogate pair is
jaroslav@49
   709
     * returned. If the <code>char</code> value at <code>index -
jaroslav@49
   710
     * 1</code> is an unpaired low-surrogate or a high-surrogate, the
jaroslav@49
   711
     * surrogate value is returned.
jaroslav@49
   712
     *
jaroslav@49
   713
     * @param     index the index following the code point that should be returned
jaroslav@49
   714
     * @return    the Unicode code point value before the given index.
jaroslav@49
   715
     * @exception IndexOutOfBoundsException if the <code>index</code>
jaroslav@49
   716
     *            argument is less than 1 or greater than the length
jaroslav@49
   717
     *            of this string.
jaroslav@49
   718
     * @since     1.5
jaroslav@49
   719
     */
jaroslav@49
   720
    public int codePointBefore(int index) {
jaroslav@49
   721
        int i = index - 1;
jaroslav@241
   722
        if ((i < 0) || (i >= length())) {
jaroslav@49
   723
            throw new StringIndexOutOfBoundsException(index);
jaroslav@49
   724
        }
jaroslav@241
   725
        return Character.codePointBeforeImpl(toCharArray(), offset() + index, offset());
jaroslav@49
   726
    }
jaroslav@49
   727
jaroslav@49
   728
    /**
jaroslav@49
   729
     * Returns the number of Unicode code points in the specified text
jaroslav@49
   730
     * range of this <code>String</code>. The text range begins at the
jaroslav@49
   731
     * specified <code>beginIndex</code> and extends to the
jaroslav@49
   732
     * <code>char</code> at index <code>endIndex - 1</code>. Thus the
jaroslav@49
   733
     * length (in <code>char</code>s) of the text range is
jaroslav@49
   734
     * <code>endIndex-beginIndex</code>. Unpaired surrogates within
jaroslav@49
   735
     * the text range count as one code point each.
jaroslav@49
   736
     *
jaroslav@49
   737
     * @param beginIndex the index to the first <code>char</code> of
jaroslav@49
   738
     * the text range.
jaroslav@49
   739
     * @param endIndex the index after the last <code>char</code> of
jaroslav@49
   740
     * the text range.
jaroslav@49
   741
     * @return the number of Unicode code points in the specified text
jaroslav@49
   742
     * range
jaroslav@49
   743
     * @exception IndexOutOfBoundsException if the
jaroslav@49
   744
     * <code>beginIndex</code> is negative, or <code>endIndex</code>
jaroslav@49
   745
     * is larger than the length of this <code>String</code>, or
jaroslav@49
   746
     * <code>beginIndex</code> is larger than <code>endIndex</code>.
jaroslav@49
   747
     * @since  1.5
jaroslav@49
   748
     */
jaroslav@49
   749
    public int codePointCount(int beginIndex, int endIndex) {
jaroslav@241
   750
        if (beginIndex < 0 || endIndex > length() || beginIndex > endIndex) {
jaroslav@49
   751
            throw new IndexOutOfBoundsException();
jaroslav@49
   752
        }
jaroslav@241
   753
        return Character.codePointCountImpl(toCharArray(), offset()+beginIndex, endIndex-beginIndex);
jaroslav@49
   754
    }
jaroslav@49
   755
jaroslav@49
   756
    /**
jaroslav@49
   757
     * Returns the index within this <code>String</code> that is
jaroslav@49
   758
     * offset from the given <code>index</code> by
jaroslav@49
   759
     * <code>codePointOffset</code> code points. Unpaired surrogates
jaroslav@49
   760
     * within the text range given by <code>index</code> and
jaroslav@49
   761
     * <code>codePointOffset</code> count as one code point each.
jaroslav@49
   762
     *
jaroslav@49
   763
     * @param index the index to be offset
jaroslav@49
   764
     * @param codePointOffset the offset in code points
jaroslav@49
   765
     * @return the index within this <code>String</code>
jaroslav@49
   766
     * @exception IndexOutOfBoundsException if <code>index</code>
jaroslav@49
   767
     *   is negative or larger than the length of this
jaroslav@49
   768
     *   <code>String</code>, or if <code>codePointOffset</code> is positive
jaroslav@49
   769
     *   and the substring starting with <code>index</code> has fewer
jaroslav@49
   770
     *   than <code>codePointOffset</code> code points,
jaroslav@49
   771
     *   or if <code>codePointOffset</code> is negative and the substring
jaroslav@49
   772
     *   before <code>index</code> has fewer than the absolute value
jaroslav@49
   773
     *   of <code>codePointOffset</code> code points.
jaroslav@49
   774
     * @since 1.5
jaroslav@49
   775
     */
jaroslav@49
   776
    public int offsetByCodePoints(int index, int codePointOffset) {
jaroslav@241
   777
        if (index < 0 || index > length()) {
jaroslav@49
   778
            throw new IndexOutOfBoundsException();
jaroslav@49
   779
        }
jaroslav@241
   780
        return Character.offsetByCodePointsImpl(toCharArray(), offset(), length(),
jaroslav@241
   781
                                                offset()+index, codePointOffset) - offset();
jaroslav@49
   782
    }
jaroslav@49
   783
jaroslav@49
   784
    /**
jaroslav@49
   785
     * Copy characters from this string into dst starting at dstBegin.
jaroslav@49
   786
     * This method doesn't perform any range checking.
jaroslav@49
   787
     */
jaroslav@443
   788
    @JavaScriptBody(args = { "arr", "to" }, body = 
jaroslav@443
   789
        "var s = this.toString();\n" +
jaroslav@240
   790
        "for (var i = 0; i < s.length; i++) {\n" +
jaroslav@240
   791
        "   arr[to++] = s[i];\n" +
jaroslav@240
   792
        "}"
jaroslav@240
   793
    )
jaroslav@49
   794
    void getChars(char dst[], int dstBegin) {
jaroslav@560
   795
        System.arraycopy(toCharArray(), offset(), dst, dstBegin, length());
jaroslav@49
   796
    }
jaroslav@49
   797
jaroslav@49
   798
    /**
jaroslav@49
   799
     * Copies characters from this string into the destination character
jaroslav@49
   800
     * array.
jaroslav@49
   801
     * <p>
jaroslav@49
   802
     * The first character to be copied is at index <code>srcBegin</code>;
jaroslav@49
   803
     * the last character to be copied is at index <code>srcEnd-1</code>
jaroslav@49
   804
     * (thus the total number of characters to be copied is
jaroslav@49
   805
     * <code>srcEnd-srcBegin</code>). The characters are copied into the
jaroslav@49
   806
     * subarray of <code>dst</code> starting at index <code>dstBegin</code>
jaroslav@49
   807
     * and ending at index:
jaroslav@49
   808
     * <p><blockquote><pre>
jaroslav@49
   809
     *     dstBegin + (srcEnd-srcBegin) - 1
jaroslav@49
   810
     * </pre></blockquote>
jaroslav@49
   811
     *
jaroslav@49
   812
     * @param      srcBegin   index of the first character in the string
jaroslav@49
   813
     *                        to copy.
jaroslav@49
   814
     * @param      srcEnd     index after the last character in the string
jaroslav@49
   815
     *                        to copy.
jaroslav@49
   816
     * @param      dst        the destination array.
jaroslav@49
   817
     * @param      dstBegin   the start offset in the destination array.
jaroslav@49
   818
     * @exception IndexOutOfBoundsException If any of the following
jaroslav@49
   819
     *            is true:
jaroslav@49
   820
     *            <ul><li><code>srcBegin</code> is negative.
jaroslav@49
   821
     *            <li><code>srcBegin</code> is greater than <code>srcEnd</code>
jaroslav@49
   822
     *            <li><code>srcEnd</code> is greater than the length of this
jaroslav@49
   823
     *                string
jaroslav@49
   824
     *            <li><code>dstBegin</code> is negative
jaroslav@49
   825
     *            <li><code>dstBegin+(srcEnd-srcBegin)</code> is larger than
jaroslav@49
   826
     *                <code>dst.length</code></ul>
jaroslav@49
   827
     */
jaroslav@443
   828
    @JavaScriptBody(args = { "beg", "end", "arr", "dst" }, body=
jaroslav@443
   829
        "var s = this.toString();\n" +
jaroslav@240
   830
        "while (beg < end) {\n" +
jaroslav@572
   831
        "  arr[dst++] = s.charCodeAt(beg++);\n" +
jaroslav@240
   832
        "}\n"
jaroslav@240
   833
    )
jaroslav@49
   834
    public void getChars(int srcBegin, int srcEnd, char dst[], int dstBegin) {
jaroslav@49
   835
        if (srcBegin < 0) {
jaroslav@49
   836
            throw new StringIndexOutOfBoundsException(srcBegin);
jaroslav@49
   837
        }
jaroslav@241
   838
        if (srcEnd > length()) {
jaroslav@49
   839
            throw new StringIndexOutOfBoundsException(srcEnd);
jaroslav@49
   840
        }
jaroslav@49
   841
        if (srcBegin > srcEnd) {
jaroslav@49
   842
            throw new StringIndexOutOfBoundsException(srcEnd - srcBegin);
jaroslav@49
   843
        }
jaroslav@560
   844
        System.arraycopy(toCharArray(), offset() + srcBegin, dst, dstBegin,
jaroslav@49
   845
             srcEnd - srcBegin);
jaroslav@49
   846
    }
jaroslav@49
   847
jaroslav@49
   848
    /**
jaroslav@49
   849
     * Copies characters from this string into the destination byte array. Each
jaroslav@49
   850
     * byte receives the 8 low-order bits of the corresponding character. The
jaroslav@49
   851
     * eight high-order bits of each character are not copied and do not
jaroslav@49
   852
     * participate in the transfer in any way.
jaroslav@49
   853
     *
jaroslav@49
   854
     * <p> The first character to be copied is at index {@code srcBegin}; the
jaroslav@49
   855
     * last character to be copied is at index {@code srcEnd-1}.  The total
jaroslav@49
   856
     * number of characters to be copied is {@code srcEnd-srcBegin}. The
jaroslav@49
   857
     * characters, converted to bytes, are copied into the subarray of {@code
jaroslav@49
   858
     * dst} starting at index {@code dstBegin} and ending at index:
jaroslav@49
   859
     *
jaroslav@49
   860
     * <blockquote><pre>
jaroslav@49
   861
     *     dstBegin + (srcEnd-srcBegin) - 1
jaroslav@49
   862
     * </pre></blockquote>
jaroslav@49
   863
     *
jaroslav@49
   864
     * @deprecated  This method does not properly convert characters into
jaroslav@49
   865
     * bytes.  As of JDK&nbsp;1.1, the preferred way to do this is via the
jaroslav@49
   866
     * {@link #getBytes()} method, which uses the platform's default charset.
jaroslav@49
   867
     *
jaroslav@49
   868
     * @param  srcBegin
jaroslav@49
   869
     *         Index of the first character in the string to copy
jaroslav@49
   870
     *
jaroslav@49
   871
     * @param  srcEnd
jaroslav@49
   872
     *         Index after the last character in the string to copy
jaroslav@49
   873
     *
jaroslav@49
   874
     * @param  dst
jaroslav@49
   875
     *         The destination array
jaroslav@49
   876
     *
jaroslav@49
   877
     * @param  dstBegin
jaroslav@49
   878
     *         The start offset in the destination array
jaroslav@49
   879
     *
jaroslav@49
   880
     * @throws  IndexOutOfBoundsException
jaroslav@49
   881
     *          If any of the following is true:
jaroslav@49
   882
     *          <ul>
jaroslav@49
   883
     *            <li> {@code srcBegin} is negative
jaroslav@49
   884
     *            <li> {@code srcBegin} is greater than {@code srcEnd}
jaroslav@49
   885
     *            <li> {@code srcEnd} is greater than the length of this String
jaroslav@49
   886
     *            <li> {@code dstBegin} is negative
jaroslav@49
   887
     *            <li> {@code dstBegin+(srcEnd-srcBegin)} is larger than {@code
jaroslav@49
   888
     *                 dst.length}
jaroslav@49
   889
     *          </ul>
jaroslav@49
   890
     */
jaroslav@49
   891
    @Deprecated
jaroslav@49
   892
    public void getBytes(int srcBegin, int srcEnd, byte dst[], int dstBegin) {
jaroslav@49
   893
        if (srcBegin < 0) {
jaroslav@49
   894
            throw new StringIndexOutOfBoundsException(srcBegin);
jaroslav@49
   895
        }
jaroslav@241
   896
        if (srcEnd > length()) {
jaroslav@49
   897
            throw new StringIndexOutOfBoundsException(srcEnd);
jaroslav@49
   898
        }
jaroslav@49
   899
        if (srcBegin > srcEnd) {
jaroslav@49
   900
            throw new StringIndexOutOfBoundsException(srcEnd - srcBegin);
jaroslav@49
   901
        }
jaroslav@49
   902
        int j = dstBegin;
jaroslav@241
   903
        int n = offset() + srcEnd;
jaroslav@241
   904
        int i = offset() + srcBegin;
jaroslav@241
   905
        char[] val = toCharArray();   /* avoid getfield opcode */
jaroslav@49
   906
jaroslav@49
   907
        while (i < n) {
jaroslav@49
   908
            dst[j++] = (byte)val[i++];
jaroslav@49
   909
        }
jaroslav@49
   910
    }
jaroslav@49
   911
jaroslav@49
   912
    /**
jaroslav@49
   913
     * Encodes this {@code String} into a sequence of bytes using the named
jaroslav@49
   914
     * charset, storing the result into a new byte array.
jaroslav@49
   915
     *
jaroslav@49
   916
     * <p> The behavior of this method when this string cannot be encoded in
jaroslav@49
   917
     * the given charset is unspecified.  The {@link
jaroslav@49
   918
     * java.nio.charset.CharsetEncoder} class should be used when more control
jaroslav@49
   919
     * over the encoding process is required.
jaroslav@49
   920
     *
jaroslav@49
   921
     * @param  charsetName
jaroslav@49
   922
     *         The name of a supported {@linkplain java.nio.charset.Charset
jaroslav@49
   923
     *         charset}
jaroslav@49
   924
     *
jaroslav@49
   925
     * @return  The resultant byte array
jaroslav@49
   926
     *
jaroslav@49
   927
     * @throws  UnsupportedEncodingException
jaroslav@49
   928
     *          If the named charset is not supported
jaroslav@49
   929
     *
jaroslav@49
   930
     * @since  JDK1.1
jaroslav@49
   931
     */
jaroslav@608
   932
    public byte[] getBytes(String charsetName)
jaroslav@608
   933
        throws UnsupportedEncodingException
jaroslav@608
   934
    {
jaroslav@608
   935
        checkUTF8(null, charsetName);
jaroslav@608
   936
        return getBytes();
jaroslav@608
   937
    }
jaroslav@49
   938
jaroslav@49
   939
    /**
jaroslav@49
   940
     * Encodes this {@code String} into a sequence of bytes using the given
jaroslav@49
   941
     * {@linkplain java.nio.charset.Charset charset}, storing the result into a
jaroslav@49
   942
     * new byte array.
jaroslav@49
   943
     *
jaroslav@49
   944
     * <p> This method always replaces malformed-input and unmappable-character
jaroslav@49
   945
     * sequences with this charset's default replacement byte array.  The
jaroslav@49
   946
     * {@link java.nio.charset.CharsetEncoder} class should be used when more
jaroslav@49
   947
     * control over the encoding process is required.
jaroslav@49
   948
     *
jaroslav@49
   949
     * @param  charset
jaroslav@49
   950
     *         The {@linkplain java.nio.charset.Charset} to be used to encode
jaroslav@49
   951
     *         the {@code String}
jaroslav@49
   952
     *
jaroslav@49
   953
     * @return  The resultant byte array
jaroslav@49
   954
     *
jaroslav@49
   955
     * @since  1.6
jaroslav@49
   956
     */
jaroslav@61
   957
    /* don't want dep on Charset
jaroslav@49
   958
    public byte[] getBytes(Charset charset) {
jaroslav@49
   959
        if (charset == null) throw new NullPointerException();
jaroslav@49
   960
        return StringCoding.encode(charset, value, offset, count);
jaroslav@49
   961
    }
jaroslav@61
   962
    */
jaroslav@49
   963
jaroslav@49
   964
    /**
jaroslav@49
   965
     * Encodes this {@code String} into a sequence of bytes using the
jaroslav@49
   966
     * platform's default charset, storing the result into a new byte array.
jaroslav@49
   967
     *
jaroslav@49
   968
     * <p> The behavior of this method when this string cannot be encoded in
jaroslav@49
   969
     * the default charset is unspecified.  The {@link
jaroslav@49
   970
     * java.nio.charset.CharsetEncoder} class should be used when more control
jaroslav@49
   971
     * over the encoding process is required.
jaroslav@49
   972
     *
jaroslav@49
   973
     * @return  The resultant byte array
jaroslav@49
   974
     *
jaroslav@49
   975
     * @since      JDK1.1
jaroslav@49
   976
     */
jaroslav@49
   977
    public byte[] getBytes() {
jaroslav@595
   978
        int len = length();
jaroslav@595
   979
        byte[] arr = new byte[len];
jaroslav@595
   980
        for (int i = 0, j = 0; j < len; j++) {
jaroslav@595
   981
            final int v = charAt(j);
jaroslav@595
   982
            if (v < 128) {
jaroslav@595
   983
                arr[i++] = (byte) v;
jaroslav@595
   984
                continue;
jaroslav@595
   985
            }
jaroslav@595
   986
            if (v < 0x0800) {
jaroslav@595
   987
                arr = System.expandArray(arr, i + 1);
jaroslav@595
   988
                arr[i++] = (byte) (0xC0 | (v >> 6));
jaroslav@595
   989
                arr[i++] = (byte) (0x80 | (0x3F & v));
jaroslav@595
   990
                continue;
jaroslav@595
   991
            }
jaroslav@595
   992
            arr = System.expandArray(arr, i + 2);
jaroslav@595
   993
            arr[i++] = (byte) (0xE0 | (v >> 12));
jaroslav@595
   994
            arr[i++] = (byte) (0x80 | ((v >> 6) & 0x7F));
jaroslav@595
   995
            arr[i++] = (byte) (0x80 | (0x3F & v));
jaroslav@75
   996
        }
jaroslav@75
   997
        return arr;
jaroslav@49
   998
    }
jaroslav@49
   999
jaroslav@49
  1000
    /**
jaroslav@49
  1001
     * Compares this string to the specified object.  The result is {@code
jaroslav@49
  1002
     * true} if and only if the argument is not {@code null} and is a {@code
jaroslav@49
  1003
     * String} object that represents the same sequence of characters as this
jaroslav@49
  1004
     * object.
jaroslav@49
  1005
     *
jaroslav@49
  1006
     * @param  anObject
jaroslav@49
  1007
     *         The object to compare this {@code String} against
jaroslav@49
  1008
     *
jaroslav@49
  1009
     * @return  {@code true} if the given object represents a {@code String}
jaroslav@49
  1010
     *          equivalent to this string, {@code false} otherwise
jaroslav@49
  1011
     *
jaroslav@49
  1012
     * @see  #compareTo(String)
jaroslav@49
  1013
     * @see  #equalsIgnoreCase(String)
jaroslav@49
  1014
     */
jaroslav@443
  1015
    @JavaScriptBody(args = { "obj" }, body = 
jaroslav@501
  1016
        "return obj != null && obj.$instOf_java_lang_String && "
jaroslav@443
  1017
        + "this.toString() === obj.toString();"
jaroslav@240
  1018
    )
jaroslav@49
  1019
    public boolean equals(Object anObject) {
jaroslav@49
  1020
        if (this == anObject) {
jaroslav@49
  1021
            return true;
jaroslav@49
  1022
        }
jaroslav@49
  1023
        if (anObject instanceof String) {
jaroslav@49
  1024
            String anotherString = (String)anObject;
jaroslav@241
  1025
            int n = length();
jaroslav@241
  1026
            if (n == anotherString.length()) {
jaroslav@241
  1027
                char v1[] = toCharArray();
jaroslav@241
  1028
                char v2[] = anotherString.toCharArray();
jaroslav@241
  1029
                int i = offset();
jaroslav@241
  1030
                int j = anotherString.offset();
jaroslav@49
  1031
                while (n-- != 0) {
jaroslav@49
  1032
                    if (v1[i++] != v2[j++])
jaroslav@49
  1033
                        return false;
jaroslav@49
  1034
                }
jaroslav@49
  1035
                return true;
jaroslav@49
  1036
            }
jaroslav@49
  1037
        }
jaroslav@49
  1038
        return false;
jaroslav@49
  1039
    }
jaroslav@49
  1040
jaroslav@49
  1041
    /**
jaroslav@49
  1042
     * Compares this string to the specified {@code StringBuffer}.  The result
jaroslav@49
  1043
     * is {@code true} if and only if this {@code String} represents the same
jaroslav@49
  1044
     * sequence of characters as the specified {@code StringBuffer}.
jaroslav@49
  1045
     *
jaroslav@49
  1046
     * @param  sb
jaroslav@49
  1047
     *         The {@code StringBuffer} to compare this {@code String} against
jaroslav@49
  1048
     *
jaroslav@49
  1049
     * @return  {@code true} if this {@code String} represents the same
jaroslav@49
  1050
     *          sequence of characters as the specified {@code StringBuffer},
jaroslav@49
  1051
     *          {@code false} otherwise
jaroslav@49
  1052
     *
jaroslav@49
  1053
     * @since  1.4
jaroslav@49
  1054
     */
jaroslav@49
  1055
    public boolean contentEquals(StringBuffer sb) {
jaroslav@49
  1056
        synchronized(sb) {
jaroslav@49
  1057
            return contentEquals((CharSequence)sb);
jaroslav@49
  1058
        }
jaroslav@49
  1059
    }
jaroslav@49
  1060
jaroslav@49
  1061
    /**
jaroslav@49
  1062
     * Compares this string to the specified {@code CharSequence}.  The result
jaroslav@49
  1063
     * is {@code true} if and only if this {@code String} represents the same
jaroslav@49
  1064
     * sequence of char values as the specified sequence.
jaroslav@49
  1065
     *
jaroslav@49
  1066
     * @param  cs
jaroslav@49
  1067
     *         The sequence to compare this {@code String} against
jaroslav@49
  1068
     *
jaroslav@49
  1069
     * @return  {@code true} if this {@code String} represents the same
jaroslav@49
  1070
     *          sequence of char values as the specified sequence, {@code
jaroslav@49
  1071
     *          false} otherwise
jaroslav@49
  1072
     *
jaroslav@49
  1073
     * @since  1.5
jaroslav@49
  1074
     */
jaroslav@49
  1075
    public boolean contentEquals(CharSequence cs) {
jaroslav@241
  1076
        if (length() != cs.length())
jaroslav@49
  1077
            return false;
jaroslav@49
  1078
        // Argument is a StringBuffer, StringBuilder
jaroslav@49
  1079
        if (cs instanceof AbstractStringBuilder) {
jaroslav@241
  1080
            char v1[] = toCharArray();
jaroslav@49
  1081
            char v2[] = ((AbstractStringBuilder)cs).getValue();
jaroslav@241
  1082
            int i = offset();
jaroslav@49
  1083
            int j = 0;
jaroslav@241
  1084
            int n = length();
jaroslav@49
  1085
            while (n-- != 0) {
jaroslav@49
  1086
                if (v1[i++] != v2[j++])
jaroslav@49
  1087
                    return false;
jaroslav@49
  1088
            }
jaroslav@49
  1089
            return true;
jaroslav@49
  1090
        }
jaroslav@49
  1091
        // Argument is a String
jaroslav@49
  1092
        if (cs.equals(this))
jaroslav@49
  1093
            return true;
jaroslav@49
  1094
        // Argument is a generic CharSequence
jaroslav@241
  1095
        char v1[] = toCharArray();
jaroslav@241
  1096
        int i = offset();
jaroslav@49
  1097
        int j = 0;
jaroslav@241
  1098
        int n = length();
jaroslav@49
  1099
        while (n-- != 0) {
jaroslav@49
  1100
            if (v1[i++] != cs.charAt(j++))
jaroslav@49
  1101
                return false;
jaroslav@49
  1102
        }
jaroslav@49
  1103
        return true;
jaroslav@49
  1104
    }
jaroslav@49
  1105
jaroslav@49
  1106
    /**
jaroslav@49
  1107
     * Compares this {@code String} to another {@code String}, ignoring case
jaroslav@49
  1108
     * considerations.  Two strings are considered equal ignoring case if they
jaroslav@49
  1109
     * are of the same length and corresponding characters in the two strings
jaroslav@49
  1110
     * are equal ignoring case.
jaroslav@49
  1111
     *
jaroslav@49
  1112
     * <p> Two characters {@code c1} and {@code c2} are considered the same
jaroslav@49
  1113
     * ignoring case if at least one of the following is true:
jaroslav@49
  1114
     * <ul>
jaroslav@49
  1115
     *   <li> The two characters are the same (as compared by the
jaroslav@49
  1116
     *        {@code ==} operator)
jaroslav@49
  1117
     *   <li> Applying the method {@link
jaroslav@49
  1118
     *        java.lang.Character#toUpperCase(char)} to each character
jaroslav@49
  1119
     *        produces the same result
jaroslav@49
  1120
     *   <li> Applying the method {@link
jaroslav@49
  1121
     *        java.lang.Character#toLowerCase(char)} to each character
jaroslav@49
  1122
     *        produces the same result
jaroslav@49
  1123
     * </ul>
jaroslav@49
  1124
     *
jaroslav@49
  1125
     * @param  anotherString
jaroslav@49
  1126
     *         The {@code String} to compare this {@code String} against
jaroslav@49
  1127
     *
jaroslav@49
  1128
     * @return  {@code true} if the argument is not {@code null} and it
jaroslav@49
  1129
     *          represents an equivalent {@code String} ignoring case; {@code
jaroslav@49
  1130
     *          false} otherwise
jaroslav@49
  1131
     *
jaroslav@49
  1132
     * @see  #equals(Object)
jaroslav@49
  1133
     */
jaroslav@49
  1134
    public boolean equalsIgnoreCase(String anotherString) {
jaroslav@49
  1135
        return (this == anotherString) ? true :
jaroslav@241
  1136
               (anotherString != null) && (anotherString.length() == length()) &&
jaroslav@241
  1137
               regionMatches(true, 0, anotherString, 0, length());
jaroslav@49
  1138
    }
jaroslav@49
  1139
jaroslav@49
  1140
    /**
jaroslav@49
  1141
     * Compares two strings lexicographically.
jaroslav@49
  1142
     * The comparison is based on the Unicode value of each character in
jaroslav@49
  1143
     * the strings. The character sequence represented by this
jaroslav@49
  1144
     * <code>String</code> object is compared lexicographically to the
jaroslav@49
  1145
     * character sequence represented by the argument string. The result is
jaroslav@49
  1146
     * a negative integer if this <code>String</code> object
jaroslav@49
  1147
     * lexicographically precedes the argument string. The result is a
jaroslav@49
  1148
     * positive integer if this <code>String</code> object lexicographically
jaroslav@49
  1149
     * follows the argument string. The result is zero if the strings
jaroslav@49
  1150
     * are equal; <code>compareTo</code> returns <code>0</code> exactly when
jaroslav@49
  1151
     * the {@link #equals(Object)} method would return <code>true</code>.
jaroslav@49
  1152
     * <p>
jaroslav@49
  1153
     * This is the definition of lexicographic ordering. If two strings are
jaroslav@49
  1154
     * different, then either they have different characters at some index
jaroslav@49
  1155
     * that is a valid index for both strings, or their lengths are different,
jaroslav@49
  1156
     * or both. If they have different characters at one or more index
jaroslav@49
  1157
     * positions, let <i>k</i> be the smallest such index; then the string
jaroslav@49
  1158
     * whose character at position <i>k</i> has the smaller value, as
jaroslav@49
  1159
     * determined by using the &lt; operator, lexicographically precedes the
jaroslav@49
  1160
     * other string. In this case, <code>compareTo</code> returns the
jaroslav@49
  1161
     * difference of the two character values at position <code>k</code> in
jaroslav@49
  1162
     * the two string -- that is, the value:
jaroslav@49
  1163
     * <blockquote><pre>
jaroslav@49
  1164
     * this.charAt(k)-anotherString.charAt(k)
jaroslav@49
  1165
     * </pre></blockquote>
jaroslav@49
  1166
     * If there is no index position at which they differ, then the shorter
jaroslav@49
  1167
     * string lexicographically precedes the longer string. In this case,
jaroslav@49
  1168
     * <code>compareTo</code> returns the difference of the lengths of the
jaroslav@49
  1169
     * strings -- that is, the value:
jaroslav@49
  1170
     * <blockquote><pre>
jaroslav@49
  1171
     * this.length()-anotherString.length()
jaroslav@49
  1172
     * </pre></blockquote>
jaroslav@49
  1173
     *
jaroslav@49
  1174
     * @param   anotherString   the <code>String</code> to be compared.
jaroslav@49
  1175
     * @return  the value <code>0</code> if the argument string is equal to
jaroslav@49
  1176
     *          this string; a value less than <code>0</code> if this string
jaroslav@49
  1177
     *          is lexicographically less than the string argument; and a
jaroslav@49
  1178
     *          value greater than <code>0</code> if this string is
jaroslav@49
  1179
     *          lexicographically greater than the string argument.
jaroslav@49
  1180
     */
jaroslav@49
  1181
    public int compareTo(String anotherString) {
jaroslav@241
  1182
        int len1 = length();
jaroslav@241
  1183
        int len2 = anotherString.length();
jaroslav@49
  1184
        int n = Math.min(len1, len2);
jaroslav@241
  1185
        char v1[] = toCharArray();
jaroslav@241
  1186
        char v2[] = anotherString.toCharArray();
jaroslav@241
  1187
        int i = offset();
jaroslav@241
  1188
        int j = anotherString.offset();
jaroslav@49
  1189
jaroslav@49
  1190
        if (i == j) {
jaroslav@49
  1191
            int k = i;
jaroslav@49
  1192
            int lim = n + i;
jaroslav@49
  1193
            while (k < lim) {
jaroslav@49
  1194
                char c1 = v1[k];
jaroslav@49
  1195
                char c2 = v2[k];
jaroslav@49
  1196
                if (c1 != c2) {
jaroslav@49
  1197
                    return c1 - c2;
jaroslav@49
  1198
                }
jaroslav@49
  1199
                k++;
jaroslav@49
  1200
            }
jaroslav@49
  1201
        } else {
jaroslav@49
  1202
            while (n-- != 0) {
jaroslav@49
  1203
                char c1 = v1[i++];
jaroslav@49
  1204
                char c2 = v2[j++];
jaroslav@49
  1205
                if (c1 != c2) {
jaroslav@49
  1206
                    return c1 - c2;
jaroslav@49
  1207
                }
jaroslav@49
  1208
            }
jaroslav@49
  1209
        }
jaroslav@49
  1210
        return len1 - len2;
jaroslav@49
  1211
    }
jaroslav@49
  1212
jaroslav@49
  1213
    /**
jaroslav@49
  1214
     * A Comparator that orders <code>String</code> objects as by
jaroslav@49
  1215
     * <code>compareToIgnoreCase</code>. This comparator is serializable.
jaroslav@49
  1216
     * <p>
jaroslav@49
  1217
     * Note that this Comparator does <em>not</em> take locale into account,
jaroslav@49
  1218
     * and will result in an unsatisfactory ordering for certain locales.
jaroslav@49
  1219
     * The java.text package provides <em>Collators</em> to allow
jaroslav@49
  1220
     * locale-sensitive ordering.
jaroslav@49
  1221
     *
jaroslav@49
  1222
     * @see     java.text.Collator#compare(String, String)
jaroslav@49
  1223
     * @since   1.2
jaroslav@49
  1224
     */
jaroslav@49
  1225
    public static final Comparator<String> CASE_INSENSITIVE_ORDER
jaroslav@49
  1226
                                         = new CaseInsensitiveComparator();
jaroslav@241
  1227
jaroslav@241
  1228
    private static int offset() {
jaroslav@241
  1229
        return 0;
jaroslav@241
  1230
    }
jaroslav@608
  1231
jaroslav@49
  1232
    private static class CaseInsensitiveComparator
jaroslav@49
  1233
                         implements Comparator<String>, java.io.Serializable {
jaroslav@49
  1234
        // use serialVersionUID from JDK 1.2.2 for interoperability
jaroslav@49
  1235
        private static final long serialVersionUID = 8575799808933029326L;
jaroslav@49
  1236
jaroslav@49
  1237
        public int compare(String s1, String s2) {
jaroslav@49
  1238
            int n1 = s1.length();
jaroslav@49
  1239
            int n2 = s2.length();
jaroslav@49
  1240
            int min = Math.min(n1, n2);
jaroslav@49
  1241
            for (int i = 0; i < min; i++) {
jaroslav@49
  1242
                char c1 = s1.charAt(i);
jaroslav@49
  1243
                char c2 = s2.charAt(i);
jaroslav@49
  1244
                if (c1 != c2) {
jaroslav@49
  1245
                    c1 = Character.toUpperCase(c1);
jaroslav@49
  1246
                    c2 = Character.toUpperCase(c2);
jaroslav@49
  1247
                    if (c1 != c2) {
jaroslav@49
  1248
                        c1 = Character.toLowerCase(c1);
jaroslav@49
  1249
                        c2 = Character.toLowerCase(c2);
jaroslav@49
  1250
                        if (c1 != c2) {
jaroslav@49
  1251
                            // No overflow because of numeric promotion
jaroslav@49
  1252
                            return c1 - c2;
jaroslav@49
  1253
                        }
jaroslav@49
  1254
                    }
jaroslav@49
  1255
                }
jaroslav@49
  1256
            }
jaroslav@49
  1257
            return n1 - n2;
jaroslav@49
  1258
        }
jaroslav@49
  1259
    }
jaroslav@49
  1260
jaroslav@49
  1261
    /**
jaroslav@49
  1262
     * Compares two strings lexicographically, ignoring case
jaroslav@49
  1263
     * differences. This method returns an integer whose sign is that of
jaroslav@49
  1264
     * calling <code>compareTo</code> with normalized versions of the strings
jaroslav@49
  1265
     * where case differences have been eliminated by calling
jaroslav@49
  1266
     * <code>Character.toLowerCase(Character.toUpperCase(character))</code> on
jaroslav@49
  1267
     * each character.
jaroslav@49
  1268
     * <p>
jaroslav@49
  1269
     * Note that this method does <em>not</em> take locale into account,
jaroslav@49
  1270
     * and will result in an unsatisfactory ordering for certain locales.
jaroslav@49
  1271
     * The java.text package provides <em>collators</em> to allow
jaroslav@49
  1272
     * locale-sensitive ordering.
jaroslav@49
  1273
     *
jaroslav@49
  1274
     * @param   str   the <code>String</code> to be compared.
jaroslav@49
  1275
     * @return  a negative integer, zero, or a positive integer as the
jaroslav@49
  1276
     *          specified String is greater than, equal to, or less
jaroslav@49
  1277
     *          than this String, ignoring case considerations.
jaroslav@49
  1278
     * @see     java.text.Collator#compare(String, String)
jaroslav@49
  1279
     * @since   1.2
jaroslav@49
  1280
     */
jaroslav@49
  1281
    public int compareToIgnoreCase(String str) {
jaroslav@49
  1282
        return CASE_INSENSITIVE_ORDER.compare(this, str);
jaroslav@49
  1283
    }
jaroslav@49
  1284
jaroslav@49
  1285
    /**
jaroslav@49
  1286
     * Tests if two string regions are equal.
jaroslav@49
  1287
     * <p>
jaroslav@49
  1288
     * A substring of this <tt>String</tt> object is compared to a substring
jaroslav@49
  1289
     * of the argument other. The result is true if these substrings
jaroslav@49
  1290
     * represent identical character sequences. The substring of this
jaroslav@49
  1291
     * <tt>String</tt> object to be compared begins at index <tt>toffset</tt>
jaroslav@49
  1292
     * and has length <tt>len</tt>. The substring of other to be compared
jaroslav@49
  1293
     * begins at index <tt>ooffset</tt> and has length <tt>len</tt>. The
jaroslav@49
  1294
     * result is <tt>false</tt> if and only if at least one of the following
jaroslav@49
  1295
     * is true:
jaroslav@49
  1296
     * <ul><li><tt>toffset</tt> is negative.
jaroslav@49
  1297
     * <li><tt>ooffset</tt> is negative.
jaroslav@49
  1298
     * <li><tt>toffset+len</tt> is greater than the length of this
jaroslav@49
  1299
     * <tt>String</tt> object.
jaroslav@49
  1300
     * <li><tt>ooffset+len</tt> is greater than the length of the other
jaroslav@49
  1301
     * argument.
jaroslav@49
  1302
     * <li>There is some nonnegative integer <i>k</i> less than <tt>len</tt>
jaroslav@49
  1303
     * such that:
jaroslav@49
  1304
     * <tt>this.charAt(toffset+<i>k</i>)&nbsp;!=&nbsp;other.charAt(ooffset+<i>k</i>)</tt>
jaroslav@49
  1305
     * </ul>
jaroslav@49
  1306
     *
jaroslav@49
  1307
     * @param   toffset   the starting offset of the subregion in this string.
jaroslav@49
  1308
     * @param   other     the string argument.
jaroslav@49
  1309
     * @param   ooffset   the starting offset of the subregion in the string
jaroslav@49
  1310
     *                    argument.
jaroslav@49
  1311
     * @param   len       the number of characters to compare.
jaroslav@49
  1312
     * @return  <code>true</code> if the specified subregion of this string
jaroslav@49
  1313
     *          exactly matches the specified subregion of the string argument;
jaroslav@49
  1314
     *          <code>false</code> otherwise.
jaroslav@49
  1315
     */
jaroslav@49
  1316
    public boolean regionMatches(int toffset, String other, int ooffset,
jaroslav@49
  1317
                                 int len) {
jaroslav@241
  1318
        char ta[] = toCharArray();
jaroslav@241
  1319
        int to = offset() + toffset;
jaroslav@241
  1320
        char pa[] = other.toCharArray();
jaroslav@241
  1321
        int po = other.offset() + ooffset;
jaroslav@49
  1322
        // Note: toffset, ooffset, or len might be near -1>>>1.
jaroslav@241
  1323
        if ((ooffset < 0) || (toffset < 0) || (toffset > (long)length() - len)
jaroslav@241
  1324
            || (ooffset > (long)other.length() - len)) {
jaroslav@49
  1325
            return false;
jaroslav@49
  1326
        }
jaroslav@49
  1327
        while (len-- > 0) {
jaroslav@49
  1328
            if (ta[to++] != pa[po++]) {
jaroslav@49
  1329
                return false;
jaroslav@49
  1330
            }
jaroslav@49
  1331
        }
jaroslav@49
  1332
        return true;
jaroslav@49
  1333
    }
jaroslav@49
  1334
jaroslav@49
  1335
    /**
jaroslav@49
  1336
     * Tests if two string regions are equal.
jaroslav@49
  1337
     * <p>
jaroslav@49
  1338
     * A substring of this <tt>String</tt> object is compared to a substring
jaroslav@49
  1339
     * of the argument <tt>other</tt>. The result is <tt>true</tt> if these
jaroslav@49
  1340
     * substrings represent character sequences that are the same, ignoring
jaroslav@49
  1341
     * case if and only if <tt>ignoreCase</tt> is true. The substring of
jaroslav@49
  1342
     * this <tt>String</tt> object to be compared begins at index
jaroslav@49
  1343
     * <tt>toffset</tt> and has length <tt>len</tt>. The substring of
jaroslav@49
  1344
     * <tt>other</tt> to be compared begins at index <tt>ooffset</tt> and
jaroslav@49
  1345
     * has length <tt>len</tt>. The result is <tt>false</tt> if and only if
jaroslav@49
  1346
     * at least one of the following is true:
jaroslav@49
  1347
     * <ul><li><tt>toffset</tt> is negative.
jaroslav@49
  1348
     * <li><tt>ooffset</tt> is negative.
jaroslav@49
  1349
     * <li><tt>toffset+len</tt> is greater than the length of this
jaroslav@49
  1350
     * <tt>String</tt> object.
jaroslav@49
  1351
     * <li><tt>ooffset+len</tt> is greater than the length of the other
jaroslav@49
  1352
     * argument.
jaroslav@49
  1353
     * <li><tt>ignoreCase</tt> is <tt>false</tt> and there is some nonnegative
jaroslav@49
  1354
     * integer <i>k</i> less than <tt>len</tt> such that:
jaroslav@49
  1355
     * <blockquote><pre>
jaroslav@49
  1356
     * this.charAt(toffset+k) != other.charAt(ooffset+k)
jaroslav@49
  1357
     * </pre></blockquote>
jaroslav@49
  1358
     * <li><tt>ignoreCase</tt> is <tt>true</tt> and there is some nonnegative
jaroslav@49
  1359
     * integer <i>k</i> less than <tt>len</tt> such that:
jaroslav@49
  1360
     * <blockquote><pre>
jaroslav@49
  1361
     * Character.toLowerCase(this.charAt(toffset+k)) !=
jaroslav@49
  1362
     *         Character.toLowerCase(other.charAt(ooffset+k))
jaroslav@49
  1363
     * </pre></blockquote>
jaroslav@49
  1364
     * and:
jaroslav@49
  1365
     * <blockquote><pre>
jaroslav@49
  1366
     * Character.toUpperCase(this.charAt(toffset+k)) !=
jaroslav@49
  1367
     *         Character.toUpperCase(other.charAt(ooffset+k))
jaroslav@49
  1368
     * </pre></blockquote>
jaroslav@49
  1369
     * </ul>
jaroslav@49
  1370
     *
jaroslav@49
  1371
     * @param   ignoreCase   if <code>true</code>, ignore case when comparing
jaroslav@49
  1372
     *                       characters.
jaroslav@49
  1373
     * @param   toffset      the starting offset of the subregion in this
jaroslav@49
  1374
     *                       string.
jaroslav@49
  1375
     * @param   other        the string argument.
jaroslav@49
  1376
     * @param   ooffset      the starting offset of the subregion in the string
jaroslav@49
  1377
     *                       argument.
jaroslav@49
  1378
     * @param   len          the number of characters to compare.
jaroslav@49
  1379
     * @return  <code>true</code> if the specified subregion of this string
jaroslav@49
  1380
     *          matches the specified subregion of the string argument;
jaroslav@49
  1381
     *          <code>false</code> otherwise. Whether the matching is exact
jaroslav@49
  1382
     *          or case insensitive depends on the <code>ignoreCase</code>
jaroslav@49
  1383
     *          argument.
jaroslav@49
  1384
     */
jaroslav@49
  1385
    public boolean regionMatches(boolean ignoreCase, int toffset,
jaroslav@49
  1386
                           String other, int ooffset, int len) {
jaroslav@241
  1387
        char ta[] = toCharArray();
jaroslav@241
  1388
        int to = offset() + toffset;
jaroslav@241
  1389
        char pa[] = other.toCharArray();
jaroslav@241
  1390
        int po = other.offset() + ooffset;
jaroslav@49
  1391
        // Note: toffset, ooffset, or len might be near -1>>>1.
jaroslav@241
  1392
        if ((ooffset < 0) || (toffset < 0) || (toffset > (long)length() - len) ||
jaroslav@241
  1393
                (ooffset > (long)other.length() - len)) {
jaroslav@49
  1394
            return false;
jaroslav@49
  1395
        }
jaroslav@49
  1396
        while (len-- > 0) {
jaroslav@49
  1397
            char c1 = ta[to++];
jaroslav@49
  1398
            char c2 = pa[po++];
jaroslav@49
  1399
            if (c1 == c2) {
jaroslav@49
  1400
                continue;
jaroslav@49
  1401
            }
jaroslav@49
  1402
            if (ignoreCase) {
jaroslav@49
  1403
                // If characters don't match but case may be ignored,
jaroslav@49
  1404
                // try converting both characters to uppercase.
jaroslav@49
  1405
                // If the results match, then the comparison scan should
jaroslav@49
  1406
                // continue.
jaroslav@49
  1407
                char u1 = Character.toUpperCase(c1);
jaroslav@49
  1408
                char u2 = Character.toUpperCase(c2);
jaroslav@49
  1409
                if (u1 == u2) {
jaroslav@49
  1410
                    continue;
jaroslav@49
  1411
                }
jaroslav@49
  1412
                // Unfortunately, conversion to uppercase does not work properly
jaroslav@49
  1413
                // for the Georgian alphabet, which has strange rules about case
jaroslav@49
  1414
                // conversion.  So we need to make one last check before
jaroslav@49
  1415
                // exiting.
jaroslav@49
  1416
                if (Character.toLowerCase(u1) == Character.toLowerCase(u2)) {
jaroslav@49
  1417
                    continue;
jaroslav@49
  1418
                }
jaroslav@49
  1419
            }
jaroslav@49
  1420
            return false;
jaroslav@49
  1421
        }
jaroslav@49
  1422
        return true;
jaroslav@49
  1423
    }
jaroslav@49
  1424
jaroslav@49
  1425
    /**
jaroslav@49
  1426
     * Tests if the substring of this string beginning at the
jaroslav@49
  1427
     * specified index starts with the specified prefix.
jaroslav@49
  1428
     *
jaroslav@49
  1429
     * @param   prefix    the prefix.
jaroslav@49
  1430
     * @param   toffset   where to begin looking in this string.
jaroslav@49
  1431
     * @return  <code>true</code> if the character sequence represented by the
jaroslav@49
  1432
     *          argument is a prefix of the substring of this object starting
jaroslav@49
  1433
     *          at index <code>toffset</code>; <code>false</code> otherwise.
jaroslav@49
  1434
     *          The result is <code>false</code> if <code>toffset</code> is
jaroslav@49
  1435
     *          negative or greater than the length of this
jaroslav@49
  1436
     *          <code>String</code> object; otherwise the result is the same
jaroslav@49
  1437
     *          as the result of the expression
jaroslav@49
  1438
     *          <pre>
jaroslav@49
  1439
     *          this.substring(toffset).startsWith(prefix)
jaroslav@49
  1440
     *          </pre>
jaroslav@49
  1441
     */
jaroslav@443
  1442
    @JavaScriptBody(args = { "find", "from" }, body=
jaroslav@240
  1443
        "find = find.toString();\n" +
jaroslav@443
  1444
        "return this.toString().substring(from, from + find.length) === find;\n"
jaroslav@240
  1445
    )
jaroslav@49
  1446
    public boolean startsWith(String prefix, int toffset) {
jaroslav@241
  1447
        char ta[] = toCharArray();
jaroslav@241
  1448
        int to = offset() + toffset;
jaroslav@241
  1449
        char pa[] = prefix.toCharArray();
jaroslav@241
  1450
        int po = prefix.offset();
jaroslav@241
  1451
        int pc = prefix.length();
jaroslav@49
  1452
        // Note: toffset might be near -1>>>1.
jaroslav@241
  1453
        if ((toffset < 0) || (toffset > length() - pc)) {
jaroslav@49
  1454
            return false;
jaroslav@49
  1455
        }
jaroslav@49
  1456
        while (--pc >= 0) {
jaroslav@49
  1457
            if (ta[to++] != pa[po++]) {
jaroslav@49
  1458
                return false;
jaroslav@49
  1459
            }
jaroslav@49
  1460
        }
jaroslav@49
  1461
        return true;
jaroslav@49
  1462
    }
jaroslav@49
  1463
jaroslav@49
  1464
    /**
jaroslav@49
  1465
     * Tests if this string starts with the specified prefix.
jaroslav@49
  1466
     *
jaroslav@49
  1467
     * @param   prefix   the prefix.
jaroslav@49
  1468
     * @return  <code>true</code> if the character sequence represented by the
jaroslav@49
  1469
     *          argument is a prefix of the character sequence represented by
jaroslav@49
  1470
     *          this string; <code>false</code> otherwise.
jaroslav@49
  1471
     *          Note also that <code>true</code> will be returned if the
jaroslav@49
  1472
     *          argument is an empty string or is equal to this
jaroslav@49
  1473
     *          <code>String</code> object as determined by the
jaroslav@49
  1474
     *          {@link #equals(Object)} method.
jaroslav@49
  1475
     * @since   1.0
jaroslav@49
  1476
     */
jaroslav@49
  1477
    public boolean startsWith(String prefix) {
jaroslav@49
  1478
        return startsWith(prefix, 0);
jaroslav@49
  1479
    }
jaroslav@49
  1480
jaroslav@49
  1481
    /**
jaroslav@49
  1482
     * Tests if this string ends with the specified suffix.
jaroslav@49
  1483
     *
jaroslav@49
  1484
     * @param   suffix   the suffix.
jaroslav@49
  1485
     * @return  <code>true</code> if the character sequence represented by the
jaroslav@49
  1486
     *          argument is a suffix of the character sequence represented by
jaroslav@49
  1487
     *          this object; <code>false</code> otherwise. Note that the
jaroslav@49
  1488
     *          result will be <code>true</code> if the argument is the
jaroslav@49
  1489
     *          empty string or is equal to this <code>String</code> object
jaroslav@49
  1490
     *          as determined by the {@link #equals(Object)} method.
jaroslav@49
  1491
     */
jaroslav@49
  1492
    public boolean endsWith(String suffix) {
jaroslav@241
  1493
        return startsWith(suffix, length() - suffix.length());
jaroslav@49
  1494
    }
jaroslav@49
  1495
jaroslav@49
  1496
    /**
jaroslav@49
  1497
     * Returns a hash code for this string. The hash code for a
jaroslav@49
  1498
     * <code>String</code> object is computed as
jaroslav@49
  1499
     * <blockquote><pre>
jaroslav@49
  1500
     * s[0]*31^(n-1) + s[1]*31^(n-2) + ... + s[n-1]
jaroslav@49
  1501
     * </pre></blockquote>
jaroslav@49
  1502
     * using <code>int</code> arithmetic, where <code>s[i]</code> is the
jaroslav@49
  1503
     * <i>i</i>th character of the string, <code>n</code> is the length of
jaroslav@49
  1504
     * the string, and <code>^</code> indicates exponentiation.
jaroslav@49
  1505
     * (The hash value of the empty string is zero.)
jaroslav@49
  1506
     *
jaroslav@49
  1507
     * @return  a hash code value for this object.
jaroslav@49
  1508
     */
jaroslav@49
  1509
    public int hashCode() {
jaroslav@429
  1510
        return super.hashCode();
jaroslav@429
  1511
    }
jaroslav@429
  1512
    int computeHashCode() {
jaroslav@429
  1513
        int h = 0;
jaroslav@241
  1514
        if (h == 0 && length() > 0) {
jaroslav@241
  1515
            int off = offset();
jaroslav@241
  1516
            int len = length();
jaroslav@49
  1517
jaroslav@49
  1518
            for (int i = 0; i < len; i++) {
jaroslav@429
  1519
                h = 31*h + charAt(off++);
jaroslav@49
  1520
            }
jaroslav@49
  1521
        }
jaroslav@49
  1522
        return h;
jaroslav@49
  1523
    }
jaroslav@49
  1524
jaroslav@49
  1525
    /**
jaroslav@49
  1526
     * Returns the index within this string of the first occurrence of
jaroslav@49
  1527
     * the specified character. If a character with value
jaroslav@49
  1528
     * <code>ch</code> occurs in the character sequence represented by
jaroslav@49
  1529
     * this <code>String</code> object, then the index (in Unicode
jaroslav@49
  1530
     * code units) of the first such occurrence is returned. For
jaroslav@49
  1531
     * values of <code>ch</code> in the range from 0 to 0xFFFF
jaroslav@49
  1532
     * (inclusive), this is the smallest value <i>k</i> such that:
jaroslav@49
  1533
     * <blockquote><pre>
jaroslav@49
  1534
     * this.charAt(<i>k</i>) == ch
jaroslav@49
  1535
     * </pre></blockquote>
jaroslav@49
  1536
     * is true. For other values of <code>ch</code>, it is the
jaroslav@49
  1537
     * smallest value <i>k</i> such that:
jaroslav@49
  1538
     * <blockquote><pre>
jaroslav@49
  1539
     * this.codePointAt(<i>k</i>) == ch
jaroslav@49
  1540
     * </pre></blockquote>
jaroslav@49
  1541
     * is true. In either case, if no such character occurs in this
jaroslav@49
  1542
     * string, then <code>-1</code> is returned.
jaroslav@49
  1543
     *
jaroslav@49
  1544
     * @param   ch   a character (Unicode code point).
jaroslav@49
  1545
     * @return  the index of the first occurrence of the character in the
jaroslav@49
  1546
     *          character sequence represented by this object, or
jaroslav@49
  1547
     *          <code>-1</code> if the character does not occur.
jaroslav@49
  1548
     */
jaroslav@49
  1549
    public int indexOf(int ch) {
jaroslav@49
  1550
        return indexOf(ch, 0);
jaroslav@49
  1551
    }
jaroslav@49
  1552
jaroslav@49
  1553
    /**
jaroslav@49
  1554
     * Returns the index within this string of the first occurrence of the
jaroslav@49
  1555
     * specified character, starting the search at the specified index.
jaroslav@49
  1556
     * <p>
jaroslav@49
  1557
     * If a character with value <code>ch</code> occurs in the
jaroslav@49
  1558
     * character sequence represented by this <code>String</code>
jaroslav@49
  1559
     * object at an index no smaller than <code>fromIndex</code>, then
jaroslav@49
  1560
     * the index of the first such occurrence is returned. For values
jaroslav@49
  1561
     * of <code>ch</code> in the range from 0 to 0xFFFF (inclusive),
jaroslav@49
  1562
     * this is the smallest value <i>k</i> such that:
jaroslav@49
  1563
     * <blockquote><pre>
jaroslav@49
  1564
     * (this.charAt(<i>k</i>) == ch) {@code &&} (<i>k</i> &gt;= fromIndex)
jaroslav@49
  1565
     * </pre></blockquote>
jaroslav@49
  1566
     * is true. For other values of <code>ch</code>, it is the
jaroslav@49
  1567
     * smallest value <i>k</i> such that:
jaroslav@49
  1568
     * <blockquote><pre>
jaroslav@49
  1569
     * (this.codePointAt(<i>k</i>) == ch) {@code &&} (<i>k</i> &gt;= fromIndex)
jaroslav@49
  1570
     * </pre></blockquote>
jaroslav@49
  1571
     * is true. In either case, if no such character occurs in this
jaroslav@49
  1572
     * string at or after position <code>fromIndex</code>, then
jaroslav@49
  1573
     * <code>-1</code> is returned.
jaroslav@49
  1574
     *
jaroslav@49
  1575
     * <p>
jaroslav@49
  1576
     * There is no restriction on the value of <code>fromIndex</code>. If it
jaroslav@49
  1577
     * is negative, it has the same effect as if it were zero: this entire
jaroslav@49
  1578
     * string may be searched. If it is greater than the length of this
jaroslav@49
  1579
     * string, it has the same effect as if it were equal to the length of
jaroslav@49
  1580
     * this string: <code>-1</code> is returned.
jaroslav@49
  1581
     *
jaroslav@49
  1582
     * <p>All indices are specified in <code>char</code> values
jaroslav@49
  1583
     * (Unicode code units).
jaroslav@49
  1584
     *
jaroslav@49
  1585
     * @param   ch          a character (Unicode code point).
jaroslav@49
  1586
     * @param   fromIndex   the index to start the search from.
jaroslav@49
  1587
     * @return  the index of the first occurrence of the character in the
jaroslav@49
  1588
     *          character sequence represented by this object that is greater
jaroslav@49
  1589
     *          than or equal to <code>fromIndex</code>, or <code>-1</code>
jaroslav@49
  1590
     *          if the character does not occur.
jaroslav@49
  1591
     */
jaroslav@443
  1592
    @JavaScriptBody(args = { "ch", "from" }, body = 
jaroslav@240
  1593
        "if (typeof ch === 'number') ch = String.fromCharCode(ch);\n" +
jaroslav@443
  1594
        "return this.toString().indexOf(ch, from);\n"
jaroslav@240
  1595
    )
jaroslav@49
  1596
    public int indexOf(int ch, int fromIndex) {
jaroslav@49
  1597
        if (fromIndex < 0) {
jaroslav@49
  1598
            fromIndex = 0;
jaroslav@241
  1599
        } else if (fromIndex >= length()) {
jaroslav@49
  1600
            // Note: fromIndex might be near -1>>>1.
jaroslav@49
  1601
            return -1;
jaroslav@49
  1602
        }
jaroslav@49
  1603
jaroslav@49
  1604
        if (ch < Character.MIN_SUPPLEMENTARY_CODE_POINT) {
jaroslav@49
  1605
            // handle most cases here (ch is a BMP code point or a
jaroslav@49
  1606
            // negative value (invalid code point))
jaroslav@241
  1607
            final char[] value = this.toCharArray();
jaroslav@241
  1608
            final int offset = this.offset();
jaroslav@241
  1609
            final int max = offset + length();
jaroslav@49
  1610
            for (int i = offset + fromIndex; i < max ; i++) {
jaroslav@49
  1611
                if (value[i] == ch) {
jaroslav@49
  1612
                    return i - offset;
jaroslav@49
  1613
                }
jaroslav@49
  1614
            }
jaroslav@49
  1615
            return -1;
jaroslav@49
  1616
        } else {
jaroslav@49
  1617
            return indexOfSupplementary(ch, fromIndex);
jaroslav@49
  1618
        }
jaroslav@49
  1619
    }
jaroslav@49
  1620
jaroslav@49
  1621
    /**
jaroslav@49
  1622
     * Handles (rare) calls of indexOf with a supplementary character.
jaroslav@49
  1623
     */
jaroslav@49
  1624
    private int indexOfSupplementary(int ch, int fromIndex) {
jaroslav@49
  1625
        if (Character.isValidCodePoint(ch)) {
jaroslav@241
  1626
            final char[] value = this.toCharArray();
jaroslav@241
  1627
            final int offset = this.offset();
jaroslav@49
  1628
            final char hi = Character.highSurrogate(ch);
jaroslav@49
  1629
            final char lo = Character.lowSurrogate(ch);
jaroslav@241
  1630
            final int max = offset + length() - 1;
jaroslav@49
  1631
            for (int i = offset + fromIndex; i < max; i++) {
jaroslav@49
  1632
                if (value[i] == hi && value[i+1] == lo) {
jaroslav@49
  1633
                    return i - offset;
jaroslav@49
  1634
                }
jaroslav@49
  1635
            }
jaroslav@49
  1636
        }
jaroslav@49
  1637
        return -1;
jaroslav@49
  1638
    }
jaroslav@49
  1639
jaroslav@49
  1640
    /**
jaroslav@49
  1641
     * Returns the index within this string of the last occurrence of
jaroslav@49
  1642
     * the specified character. For values of <code>ch</code> in the
jaroslav@49
  1643
     * range from 0 to 0xFFFF (inclusive), the index (in Unicode code
jaroslav@49
  1644
     * units) returned is the largest value <i>k</i> such that:
jaroslav@49
  1645
     * <blockquote><pre>
jaroslav@49
  1646
     * this.charAt(<i>k</i>) == ch
jaroslav@49
  1647
     * </pre></blockquote>
jaroslav@49
  1648
     * is true. For other values of <code>ch</code>, it is the
jaroslav@49
  1649
     * largest value <i>k</i> such that:
jaroslav@49
  1650
     * <blockquote><pre>
jaroslav@49
  1651
     * this.codePointAt(<i>k</i>) == ch
jaroslav@49
  1652
     * </pre></blockquote>
jaroslav@49
  1653
     * is true.  In either case, if no such character occurs in this
jaroslav@49
  1654
     * string, then <code>-1</code> is returned.  The
jaroslav@49
  1655
     * <code>String</code> is searched backwards starting at the last
jaroslav@49
  1656
     * character.
jaroslav@49
  1657
     *
jaroslav@49
  1658
     * @param   ch   a character (Unicode code point).
jaroslav@49
  1659
     * @return  the index of the last occurrence of the character in the
jaroslav@49
  1660
     *          character sequence represented by this object, or
jaroslav@49
  1661
     *          <code>-1</code> if the character does not occur.
jaroslav@49
  1662
     */
jaroslav@49
  1663
    public int lastIndexOf(int ch) {
jaroslav@241
  1664
        return lastIndexOf(ch, length() - 1);
jaroslav@49
  1665
    }
jaroslav@49
  1666
jaroslav@49
  1667
    /**
jaroslav@49
  1668
     * Returns the index within this string of the last occurrence of
jaroslav@49
  1669
     * the specified character, searching backward starting at the
jaroslav@49
  1670
     * specified index. For values of <code>ch</code> in the range
jaroslav@49
  1671
     * from 0 to 0xFFFF (inclusive), the index returned is the largest
jaroslav@49
  1672
     * value <i>k</i> such that:
jaroslav@49
  1673
     * <blockquote><pre>
jaroslav@49
  1674
     * (this.charAt(<i>k</i>) == ch) && (<i>k</i> &lt;= fromIndex)
jaroslav@49
  1675
     * </pre></blockquote>
jaroslav@49
  1676
     * is true. For other values of <code>ch</code>, it is the
jaroslav@49
  1677
     * largest value <i>k</i> such that:
jaroslav@49
  1678
     * <blockquote><pre>
jaroslav@49
  1679
     * (this.codePointAt(<i>k</i>) == ch) && (<i>k</i> &lt;= fromIndex)
jaroslav@49
  1680
     * </pre></blockquote>
jaroslav@49
  1681
     * is true. In either case, if no such character occurs in this
jaroslav@49
  1682
     * string at or before position <code>fromIndex</code>, then
jaroslav@49
  1683
     * <code>-1</code> is returned.
jaroslav@49
  1684
     *
jaroslav@49
  1685
     * <p>All indices are specified in <code>char</code> values
jaroslav@49
  1686
     * (Unicode code units).
jaroslav@49
  1687
     *
jaroslav@49
  1688
     * @param   ch          a character (Unicode code point).
jaroslav@49
  1689
     * @param   fromIndex   the index to start the search from. There is no
jaroslav@49
  1690
     *          restriction on the value of <code>fromIndex</code>. If it is
jaroslav@49
  1691
     *          greater than or equal to the length of this string, it has
jaroslav@49
  1692
     *          the same effect as if it were equal to one less than the
jaroslav@49
  1693
     *          length of this string: this entire string may be searched.
jaroslav@49
  1694
     *          If it is negative, it has the same effect as if it were -1:
jaroslav@49
  1695
     *          -1 is returned.
jaroslav@49
  1696
     * @return  the index of the last occurrence of the character in the
jaroslav@49
  1697
     *          character sequence represented by this object that is less
jaroslav@49
  1698
     *          than or equal to <code>fromIndex</code>, or <code>-1</code>
jaroslav@49
  1699
     *          if the character does not occur before that point.
jaroslav@49
  1700
     */
jaroslav@443
  1701
    @JavaScriptBody(args = { "ch", "from" }, body = 
jaroslav@249
  1702
        "if (typeof ch === 'number') ch = String.fromCharCode(ch);\n" +
jaroslav@443
  1703
        "return this.toString().lastIndexOf(ch, from);"
jaroslav@249
  1704
    )
jaroslav@49
  1705
    public int lastIndexOf(int ch, int fromIndex) {
jaroslav@49
  1706
        if (ch < Character.MIN_SUPPLEMENTARY_CODE_POINT) {
jaroslav@49
  1707
            // handle most cases here (ch is a BMP code point or a
jaroslav@49
  1708
            // negative value (invalid code point))
jaroslav@241
  1709
            final char[] value = this.toCharArray();
jaroslav@241
  1710
            final int offset = this.offset();
jaroslav@241
  1711
            int i = offset + Math.min(fromIndex, length() - 1);
jaroslav@49
  1712
            for (; i >= offset ; i--) {
jaroslav@49
  1713
                if (value[i] == ch) {
jaroslav@49
  1714
                    return i - offset;
jaroslav@49
  1715
                }
jaroslav@49
  1716
            }
jaroslav@49
  1717
            return -1;
jaroslav@49
  1718
        } else {
jaroslav@49
  1719
            return lastIndexOfSupplementary(ch, fromIndex);
jaroslav@49
  1720
        }
jaroslav@49
  1721
    }
jaroslav@49
  1722
jaroslav@49
  1723
    /**
jaroslav@49
  1724
     * Handles (rare) calls of lastIndexOf with a supplementary character.
jaroslav@49
  1725
     */
jaroslav@49
  1726
    private int lastIndexOfSupplementary(int ch, int fromIndex) {
jaroslav@49
  1727
        if (Character.isValidCodePoint(ch)) {
jaroslav@241
  1728
            final char[] value = this.toCharArray();
jaroslav@241
  1729
            final int offset = this.offset();
jaroslav@49
  1730
            char hi = Character.highSurrogate(ch);
jaroslav@49
  1731
            char lo = Character.lowSurrogate(ch);
jaroslav@241
  1732
            int i = offset + Math.min(fromIndex, length() - 2);
jaroslav@49
  1733
            for (; i >= offset; i--) {
jaroslav@49
  1734
                if (value[i] == hi && value[i+1] == lo) {
jaroslav@49
  1735
                    return i - offset;
jaroslav@49
  1736
                }
jaroslav@49
  1737
            }
jaroslav@49
  1738
        }
jaroslav@49
  1739
        return -1;
jaroslav@49
  1740
    }
jaroslav@49
  1741
jaroslav@49
  1742
    /**
jaroslav@49
  1743
     * Returns the index within this string of the first occurrence of the
jaroslav@49
  1744
     * specified substring.
jaroslav@49
  1745
     *
jaroslav@49
  1746
     * <p>The returned index is the smallest value <i>k</i> for which:
jaroslav@49
  1747
     * <blockquote><pre>
jaroslav@49
  1748
     * this.startsWith(str, <i>k</i>)
jaroslav@49
  1749
     * </pre></blockquote>
jaroslav@49
  1750
     * If no such value of <i>k</i> exists, then {@code -1} is returned.
jaroslav@49
  1751
     *
jaroslav@49
  1752
     * @param   str   the substring to search for.
jaroslav@49
  1753
     * @return  the index of the first occurrence of the specified substring,
jaroslav@49
  1754
     *          or {@code -1} if there is no such occurrence.
jaroslav@49
  1755
     */
jaroslav@49
  1756
    public int indexOf(String str) {
jaroslav@49
  1757
        return indexOf(str, 0);
jaroslav@49
  1758
    }
jaroslav@49
  1759
jaroslav@49
  1760
    /**
jaroslav@49
  1761
     * Returns the index within this string of the first occurrence of the
jaroslav@49
  1762
     * specified substring, starting at the specified index.
jaroslav@49
  1763
     *
jaroslav@49
  1764
     * <p>The returned index is the smallest value <i>k</i> for which:
jaroslav@49
  1765
     * <blockquote><pre>
jaroslav@49
  1766
     * <i>k</i> &gt;= fromIndex && this.startsWith(str, <i>k</i>)
jaroslav@49
  1767
     * </pre></blockquote>
jaroslav@49
  1768
     * If no such value of <i>k</i> exists, then {@code -1} is returned.
jaroslav@49
  1769
     *
jaroslav@49
  1770
     * @param   str         the substring to search for.
jaroslav@49
  1771
     * @param   fromIndex   the index from which to start the search.
jaroslav@49
  1772
     * @return  the index of the first occurrence of the specified substring,
jaroslav@49
  1773
     *          starting at the specified index,
jaroslav@49
  1774
     *          or {@code -1} if there is no such occurrence.
jaroslav@49
  1775
     */
jaroslav@443
  1776
    @JavaScriptBody(args = { "str", "fromIndex" }, body =
jaroslav@443
  1777
        "return this.toString().indexOf(str.toString(), fromIndex);"
jaroslav@240
  1778
    )
jaroslav@403
  1779
    public native int indexOf(String str, int fromIndex);
jaroslav@49
  1780
jaroslav@49
  1781
    /**
jaroslav@49
  1782
     * Returns the index within this string of the last occurrence of the
jaroslav@49
  1783
     * specified substring.  The last occurrence of the empty string ""
jaroslav@49
  1784
     * is considered to occur at the index value {@code this.length()}.
jaroslav@49
  1785
     *
jaroslav@49
  1786
     * <p>The returned index is the largest value <i>k</i> for which:
jaroslav@49
  1787
     * <blockquote><pre>
jaroslav@49
  1788
     * this.startsWith(str, <i>k</i>)
jaroslav@49
  1789
     * </pre></blockquote>
jaroslav@49
  1790
     * If no such value of <i>k</i> exists, then {@code -1} is returned.
jaroslav@49
  1791
     *
jaroslav@49
  1792
     * @param   str   the substring to search for.
jaroslav@49
  1793
     * @return  the index of the last occurrence of the specified substring,
jaroslav@49
  1794
     *          or {@code -1} if there is no such occurrence.
jaroslav@49
  1795
     */
jaroslav@49
  1796
    public int lastIndexOf(String str) {
jaroslav@241
  1797
        return lastIndexOf(str, length());
jaroslav@49
  1798
    }
jaroslav@49
  1799
jaroslav@49
  1800
    /**
jaroslav@49
  1801
     * Returns the index within this string of the last occurrence of the
jaroslav@49
  1802
     * specified substring, searching backward starting at the specified index.
jaroslav@49
  1803
     *
jaroslav@49
  1804
     * <p>The returned index is the largest value <i>k</i> for which:
jaroslav@49
  1805
     * <blockquote><pre>
jaroslav@49
  1806
     * <i>k</i> &lt;= fromIndex && this.startsWith(str, <i>k</i>)
jaroslav@49
  1807
     * </pre></blockquote>
jaroslav@49
  1808
     * If no such value of <i>k</i> exists, then {@code -1} is returned.
jaroslav@49
  1809
     *
jaroslav@49
  1810
     * @param   str         the substring to search for.
jaroslav@49
  1811
     * @param   fromIndex   the index to start the search from.
jaroslav@49
  1812
     * @return  the index of the last occurrence of the specified substring,
jaroslav@49
  1813
     *          searching backward from the specified index,
jaroslav@49
  1814
     *          or {@code -1} if there is no such occurrence.
jaroslav@49
  1815
     */
jaroslav@443
  1816
    @JavaScriptBody(args = { "s", "from" }, body = 
jaroslav@443
  1817
        "return this.toString().lastIndexOf(s.toString(), from);"
jaroslav@249
  1818
    )
jaroslav@49
  1819
    public int lastIndexOf(String str, int fromIndex) {
jaroslav@241
  1820
        return lastIndexOf(toCharArray(), offset(), length(), str.toCharArray(), str.offset(), str.length(), fromIndex);
jaroslav@49
  1821
    }
jaroslav@49
  1822
jaroslav@49
  1823
    /**
jaroslav@49
  1824
     * Code shared by String and StringBuffer to do searches. The
jaroslav@49
  1825
     * source is the character array being searched, and the target
jaroslav@49
  1826
     * is the string being searched for.
jaroslav@49
  1827
     *
jaroslav@49
  1828
     * @param   source       the characters being searched.
jaroslav@49
  1829
     * @param   sourceOffset offset of the source string.
jaroslav@49
  1830
     * @param   sourceCount  count of the source string.
jaroslav@49
  1831
     * @param   target       the characters being searched for.
jaroslav@49
  1832
     * @param   targetOffset offset of the target string.
jaroslav@49
  1833
     * @param   targetCount  count of the target string.
jaroslav@49
  1834
     * @param   fromIndex    the index to begin searching from.
jaroslav@49
  1835
     */
jaroslav@49
  1836
    static int lastIndexOf(char[] source, int sourceOffset, int sourceCount,
jaroslav@49
  1837
                           char[] target, int targetOffset, int targetCount,
jaroslav@49
  1838
                           int fromIndex) {
jaroslav@49
  1839
        /*
jaroslav@49
  1840
         * Check arguments; return immediately where possible. For
jaroslav@49
  1841
         * consistency, don't check for null str.
jaroslav@49
  1842
         */
jaroslav@49
  1843
        int rightIndex = sourceCount - targetCount;
jaroslav@49
  1844
        if (fromIndex < 0) {
jaroslav@49
  1845
            return -1;
jaroslav@49
  1846
        }
jaroslav@49
  1847
        if (fromIndex > rightIndex) {
jaroslav@49
  1848
            fromIndex = rightIndex;
jaroslav@49
  1849
        }
jaroslav@49
  1850
        /* Empty string always matches. */
jaroslav@49
  1851
        if (targetCount == 0) {
jaroslav@49
  1852
            return fromIndex;
jaroslav@49
  1853
        }
jaroslav@49
  1854
jaroslav@49
  1855
        int strLastIndex = targetOffset + targetCount - 1;
jaroslav@49
  1856
        char strLastChar = target[strLastIndex];
jaroslav@49
  1857
        int min = sourceOffset + targetCount - 1;
jaroslav@49
  1858
        int i = min + fromIndex;
jaroslav@49
  1859
jaroslav@49
  1860
    startSearchForLastChar:
jaroslav@49
  1861
        while (true) {
jaroslav@49
  1862
            while (i >= min && source[i] != strLastChar) {
jaroslav@49
  1863
                i--;
jaroslav@49
  1864
            }
jaroslav@49
  1865
            if (i < min) {
jaroslav@49
  1866
                return -1;
jaroslav@49
  1867
            }
jaroslav@49
  1868
            int j = i - 1;
jaroslav@49
  1869
            int start = j - (targetCount - 1);
jaroslav@49
  1870
            int k = strLastIndex - 1;
jaroslav@49
  1871
jaroslav@49
  1872
            while (j > start) {
jaroslav@49
  1873
                if (source[j--] != target[k--]) {
jaroslav@49
  1874
                    i--;
jaroslav@49
  1875
                    continue startSearchForLastChar;
jaroslav@49
  1876
                }
jaroslav@49
  1877
            }
jaroslav@49
  1878
            return start - sourceOffset + 1;
jaroslav@49
  1879
        }
jaroslav@49
  1880
    }
jaroslav@49
  1881
jaroslav@49
  1882
    /**
jaroslav@49
  1883
     * Returns a new string that is a substring of this string. The
jaroslav@49
  1884
     * substring begins with the character at the specified index and
jaroslav@49
  1885
     * extends to the end of this string. <p>
jaroslav@49
  1886
     * Examples:
jaroslav@49
  1887
     * <blockquote><pre>
jaroslav@49
  1888
     * "unhappy".substring(2) returns "happy"
jaroslav@49
  1889
     * "Harbison".substring(3) returns "bison"
jaroslav@49
  1890
     * "emptiness".substring(9) returns "" (an empty string)
jaroslav@49
  1891
     * </pre></blockquote>
jaroslav@49
  1892
     *
jaroslav@49
  1893
     * @param      beginIndex   the beginning index, inclusive.
jaroslav@49
  1894
     * @return     the specified substring.
jaroslav@49
  1895
     * @exception  IndexOutOfBoundsException  if
jaroslav@49
  1896
     *             <code>beginIndex</code> is negative or larger than the
jaroslav@49
  1897
     *             length of this <code>String</code> object.
jaroslav@49
  1898
     */
jaroslav@49
  1899
    public String substring(int beginIndex) {
jaroslav@241
  1900
        return substring(beginIndex, length());
jaroslav@49
  1901
    }
jaroslav@49
  1902
jaroslav@49
  1903
    /**
jaroslav@49
  1904
     * Returns a new string that is a substring of this string. The
jaroslav@49
  1905
     * substring begins at the specified <code>beginIndex</code> and
jaroslav@49
  1906
     * extends to the character at index <code>endIndex - 1</code>.
jaroslav@49
  1907
     * Thus the length of the substring is <code>endIndex-beginIndex</code>.
jaroslav@49
  1908
     * <p>
jaroslav@49
  1909
     * Examples:
jaroslav@49
  1910
     * <blockquote><pre>
jaroslav@49
  1911
     * "hamburger".substring(4, 8) returns "urge"
jaroslav@49
  1912
     * "smiles".substring(1, 5) returns "mile"
jaroslav@49
  1913
     * </pre></blockquote>
jaroslav@49
  1914
     *
jaroslav@49
  1915
     * @param      beginIndex   the beginning index, inclusive.
jaroslav@49
  1916
     * @param      endIndex     the ending index, exclusive.
jaroslav@49
  1917
     * @return     the specified substring.
jaroslav@49
  1918
     * @exception  IndexOutOfBoundsException  if the
jaroslav@49
  1919
     *             <code>beginIndex</code> is negative, or
jaroslav@49
  1920
     *             <code>endIndex</code> is larger than the length of
jaroslav@49
  1921
     *             this <code>String</code> object, or
jaroslav@49
  1922
     *             <code>beginIndex</code> is larger than
jaroslav@49
  1923
     *             <code>endIndex</code>.
jaroslav@49
  1924
     */
jaroslav@443
  1925
    @JavaScriptBody(args = { "beginIndex", "endIndex" }, body = 
jaroslav@443
  1926
        "return this.toString().substring(beginIndex, endIndex);"
jaroslav@240
  1927
    )
jaroslav@49
  1928
    public String substring(int beginIndex, int endIndex) {
jaroslav@49
  1929
        if (beginIndex < 0) {
jaroslav@49
  1930
            throw new StringIndexOutOfBoundsException(beginIndex);
jaroslav@49
  1931
        }
jaroslav@241
  1932
        if (endIndex > length()) {
jaroslav@49
  1933
            throw new StringIndexOutOfBoundsException(endIndex);
jaroslav@49
  1934
        }
jaroslav@49
  1935
        if (beginIndex > endIndex) {
jaroslav@49
  1936
            throw new StringIndexOutOfBoundsException(endIndex - beginIndex);
jaroslav@49
  1937
        }
jaroslav@241
  1938
        return ((beginIndex == 0) && (endIndex == length())) ? this :
jaroslav@241
  1939
            new String(toCharArray(), offset() + beginIndex, endIndex - beginIndex);
jaroslav@49
  1940
    }
jaroslav@49
  1941
jaroslav@49
  1942
    /**
jaroslav@49
  1943
     * Returns a new character sequence that is a subsequence of this sequence.
jaroslav@49
  1944
     *
jaroslav@49
  1945
     * <p> An invocation of this method of the form
jaroslav@49
  1946
     *
jaroslav@49
  1947
     * <blockquote><pre>
jaroslav@49
  1948
     * str.subSequence(begin,&nbsp;end)</pre></blockquote>
jaroslav@49
  1949
     *
jaroslav@49
  1950
     * behaves in exactly the same way as the invocation
jaroslav@49
  1951
     *
jaroslav@49
  1952
     * <blockquote><pre>
jaroslav@49
  1953
     * str.substring(begin,&nbsp;end)</pre></blockquote>
jaroslav@49
  1954
     *
jaroslav@49
  1955
     * This method is defined so that the <tt>String</tt> class can implement
jaroslav@49
  1956
     * the {@link CharSequence} interface. </p>
jaroslav@49
  1957
     *
jaroslav@49
  1958
     * @param      beginIndex   the begin index, inclusive.
jaroslav@49
  1959
     * @param      endIndex     the end index, exclusive.
jaroslav@49
  1960
     * @return     the specified subsequence.
jaroslav@49
  1961
     *
jaroslav@49
  1962
     * @throws  IndexOutOfBoundsException
jaroslav@49
  1963
     *          if <tt>beginIndex</tt> or <tt>endIndex</tt> are negative,
jaroslav@49
  1964
     *          if <tt>endIndex</tt> is greater than <tt>length()</tt>,
jaroslav@49
  1965
     *          or if <tt>beginIndex</tt> is greater than <tt>endIndex</tt>
jaroslav@49
  1966
     *
jaroslav@49
  1967
     * @since 1.4
jaroslav@49
  1968
     * @spec JSR-51
jaroslav@49
  1969
     */
jaroslav@49
  1970
    public CharSequence subSequence(int beginIndex, int endIndex) {
jaroslav@49
  1971
        return this.substring(beginIndex, endIndex);
jaroslav@49
  1972
    }
jaroslav@49
  1973
jaroslav@49
  1974
    /**
jaroslav@49
  1975
     * Concatenates the specified string to the end of this string.
jaroslav@49
  1976
     * <p>
jaroslav@49
  1977
     * If the length of the argument string is <code>0</code>, then this
jaroslav@49
  1978
     * <code>String</code> object is returned. Otherwise, a new
jaroslav@49
  1979
     * <code>String</code> object is created, representing a character
jaroslav@49
  1980
     * sequence that is the concatenation of the character sequence
jaroslav@49
  1981
     * represented by this <code>String</code> object and the character
jaroslav@49
  1982
     * sequence represented by the argument string.<p>
jaroslav@49
  1983
     * Examples:
jaroslav@49
  1984
     * <blockquote><pre>
jaroslav@49
  1985
     * "cares".concat("s") returns "caress"
jaroslav@49
  1986
     * "to".concat("get").concat("her") returns "together"
jaroslav@49
  1987
     * </pre></blockquote>
jaroslav@49
  1988
     *
jaroslav@49
  1989
     * @param   str   the <code>String</code> that is concatenated to the end
jaroslav@49
  1990
     *                of this <code>String</code>.
jaroslav@49
  1991
     * @return  a string that represents the concatenation of this object's
jaroslav@49
  1992
     *          characters followed by the string argument's characters.
jaroslav@49
  1993
     */
jaroslav@49
  1994
    public String concat(String str) {
jaroslav@49
  1995
        int otherLen = str.length();
jaroslav@49
  1996
        if (otherLen == 0) {
jaroslav@49
  1997
            return this;
jaroslav@49
  1998
        }
jaroslav@241
  1999
        char buf[] = new char[length() + otherLen];
jaroslav@241
  2000
        getChars(0, length(), buf, 0);
jaroslav@241
  2001
        str.getChars(0, otherLen, buf, length());
jaroslav@241
  2002
        return new String(buf, 0, length() + otherLen);
jaroslav@49
  2003
    }
jaroslav@49
  2004
jaroslav@49
  2005
    /**
jaroslav@49
  2006
     * Returns a new string resulting from replacing all occurrences of
jaroslav@49
  2007
     * <code>oldChar</code> in this string with <code>newChar</code>.
jaroslav@49
  2008
     * <p>
jaroslav@49
  2009
     * If the character <code>oldChar</code> does not occur in the
jaroslav@49
  2010
     * character sequence represented by this <code>String</code> object,
jaroslav@49
  2011
     * then a reference to this <code>String</code> object is returned.
jaroslav@49
  2012
     * Otherwise, a new <code>String</code> object is created that
jaroslav@49
  2013
     * represents a character sequence identical to the character sequence
jaroslav@49
  2014
     * represented by this <code>String</code> object, except that every
jaroslav@49
  2015
     * occurrence of <code>oldChar</code> is replaced by an occurrence
jaroslav@49
  2016
     * of <code>newChar</code>.
jaroslav@49
  2017
     * <p>
jaroslav@49
  2018
     * Examples:
jaroslav@49
  2019
     * <blockquote><pre>
jaroslav@49
  2020
     * "mesquite in your cellar".replace('e', 'o')
jaroslav@49
  2021
     *         returns "mosquito in your collar"
jaroslav@49
  2022
     * "the war of baronets".replace('r', 'y')
jaroslav@49
  2023
     *         returns "the way of bayonets"
jaroslav@49
  2024
     * "sparring with a purple porpoise".replace('p', 't')
jaroslav@49
  2025
     *         returns "starring with a turtle tortoise"
jaroslav@49
  2026
     * "JonL".replace('q', 'x') returns "JonL" (no change)
jaroslav@49
  2027
     * </pre></blockquote>
jaroslav@49
  2028
     *
jaroslav@49
  2029
     * @param   oldChar   the old character.
jaroslav@49
  2030
     * @param   newChar   the new character.
jaroslav@49
  2031
     * @return  a string derived from this string by replacing every
jaroslav@49
  2032
     *          occurrence of <code>oldChar</code> with <code>newChar</code>.
jaroslav@49
  2033
     */
jaroslav@443
  2034
    @JavaScriptBody(args = { "arg1", "arg2" }, body =
jaroslav@240
  2035
        "if (typeof arg1 === 'number') arg1 = String.fromCharCode(arg1);\n" +
jaroslav@240
  2036
        "if (typeof arg2 === 'number') arg2 = String.fromCharCode(arg2);\n" +
jaroslav@443
  2037
        "var s = this.toString();\n" +
jaroslav@240
  2038
        "for (;;) {\n" +
jaroslav@240
  2039
        "  var ret = s.replace(arg1, arg2);\n" +
jaroslav@240
  2040
        "  if (ret === s) {\n" +
jaroslav@240
  2041
        "    return ret;\n" +
jaroslav@240
  2042
        "  }\n" +
jaroslav@240
  2043
        "  s = ret;\n" +
jaroslav@240
  2044
        "}"
jaroslav@240
  2045
    )
jaroslav@49
  2046
    public String replace(char oldChar, char newChar) {
jaroslav@49
  2047
        if (oldChar != newChar) {
jaroslav@241
  2048
            int len = length();
jaroslav@49
  2049
            int i = -1;
jaroslav@241
  2050
            char[] val = toCharArray(); /* avoid getfield opcode */
jaroslav@241
  2051
            int off = offset();   /* avoid getfield opcode */
jaroslav@49
  2052
jaroslav@49
  2053
            while (++i < len) {
jaroslav@49
  2054
                if (val[off + i] == oldChar) {
jaroslav@49
  2055
                    break;
jaroslav@49
  2056
                }
jaroslav@49
  2057
            }
jaroslav@49
  2058
            if (i < len) {
jaroslav@49
  2059
                char buf[] = new char[len];
jaroslav@49
  2060
                for (int j = 0 ; j < i ; j++) {
jaroslav@49
  2061
                    buf[j] = val[off+j];
jaroslav@49
  2062
                }
jaroslav@49
  2063
                while (i < len) {
jaroslav@49
  2064
                    char c = val[off + i];
jaroslav@49
  2065
                    buf[i] = (c == oldChar) ? newChar : c;
jaroslav@49
  2066
                    i++;
jaroslav@49
  2067
                }
jaroslav@179
  2068
                return new String(buf, 0, len);
jaroslav@49
  2069
            }
jaroslav@49
  2070
        }
jaroslav@49
  2071
        return this;
jaroslav@49
  2072
    }
jaroslav@49
  2073
jaroslav@49
  2074
    /**
jaroslav@49
  2075
     * Tells whether or not this string matches the given <a
jaroslav@49
  2076
     * href="../util/regex/Pattern.html#sum">regular expression</a>.
jaroslav@49
  2077
     *
jaroslav@49
  2078
     * <p> An invocation of this method of the form
jaroslav@49
  2079
     * <i>str</i><tt>.matches(</tt><i>regex</i><tt>)</tt> yields exactly the
jaroslav@49
  2080
     * same result as the expression
jaroslav@49
  2081
     *
jaroslav@49
  2082
     * <blockquote><tt> {@link java.util.regex.Pattern}.{@link
jaroslav@49
  2083
     * java.util.regex.Pattern#matches(String,CharSequence)
jaroslav@49
  2084
     * matches}(</tt><i>regex</i><tt>,</tt> <i>str</i><tt>)</tt></blockquote>
jaroslav@49
  2085
     *
jaroslav@49
  2086
     * @param   regex
jaroslav@49
  2087
     *          the regular expression to which this string is to be matched
jaroslav@49
  2088
     *
jaroslav@49
  2089
     * @return  <tt>true</tt> if, and only if, this string matches the
jaroslav@49
  2090
     *          given regular expression
jaroslav@49
  2091
     *
jaroslav@49
  2092
     * @throws  PatternSyntaxException
jaroslav@49
  2093
     *          if the regular expression's syntax is invalid
jaroslav@49
  2094
     *
jaroslav@49
  2095
     * @see java.util.regex.Pattern
jaroslav@49
  2096
     *
jaroslav@49
  2097
     * @since 1.4
jaroslav@49
  2098
     * @spec JSR-51
jaroslav@49
  2099
     */
jaroslav@443
  2100
    @JavaScriptBody(args = { "regex" }, body = 
jaroslav@443
  2101
          "var self = this.toString();\n"
jaroslav@326
  2102
        + "var re = new RegExp(regex.toString());\n"
jaroslav@326
  2103
        + "var r = re.exec(self);\n"
jaroslav@326
  2104
        + "return r != null && r.length > 0 && self.length == r[0].length;"
jaroslav@326
  2105
    )
jaroslav@49
  2106
    public boolean matches(String regex) {
jaroslav@64
  2107
        throw new UnsupportedOperationException();
jaroslav@49
  2108
    }
jaroslav@49
  2109
jaroslav@49
  2110
    /**
jaroslav@49
  2111
     * Returns true if and only if this string contains the specified
jaroslav@49
  2112
     * sequence of char values.
jaroslav@49
  2113
     *
jaroslav@49
  2114
     * @param s the sequence to search for
jaroslav@49
  2115
     * @return true if this string contains <code>s</code>, false otherwise
jaroslav@49
  2116
     * @throws NullPointerException if <code>s</code> is <code>null</code>
jaroslav@49
  2117
     * @since 1.5
jaroslav@49
  2118
     */
jaroslav@49
  2119
    public boolean contains(CharSequence s) {
jaroslav@49
  2120
        return indexOf(s.toString()) > -1;
jaroslav@49
  2121
    }
jaroslav@49
  2122
jaroslav@49
  2123
    /**
jaroslav@49
  2124
     * Replaces the first substring of this string that matches the given <a
jaroslav@49
  2125
     * href="../util/regex/Pattern.html#sum">regular expression</a> with the
jaroslav@49
  2126
     * given replacement.
jaroslav@49
  2127
     *
jaroslav@49
  2128
     * <p> An invocation of this method of the form
jaroslav@49
  2129
     * <i>str</i><tt>.replaceFirst(</tt><i>regex</i><tt>,</tt> <i>repl</i><tt>)</tt>
jaroslav@49
  2130
     * yields exactly the same result as the expression
jaroslav@49
  2131
     *
jaroslav@49
  2132
     * <blockquote><tt>
jaroslav@49
  2133
     * {@link java.util.regex.Pattern}.{@link java.util.regex.Pattern#compile
jaroslav@49
  2134
     * compile}(</tt><i>regex</i><tt>).{@link
jaroslav@49
  2135
     * java.util.regex.Pattern#matcher(java.lang.CharSequence)
jaroslav@49
  2136
     * matcher}(</tt><i>str</i><tt>).{@link java.util.regex.Matcher#replaceFirst
jaroslav@49
  2137
     * replaceFirst}(</tt><i>repl</i><tt>)</tt></blockquote>
jaroslav@49
  2138
     *
jaroslav@49
  2139
     *<p>
jaroslav@49
  2140
     * Note that backslashes (<tt>\</tt>) and dollar signs (<tt>$</tt>) in the
jaroslav@49
  2141
     * replacement string may cause the results to be different than if it were
jaroslav@49
  2142
     * being treated as a literal replacement string; see
jaroslav@49
  2143
     * {@link java.util.regex.Matcher#replaceFirst}.
jaroslav@49
  2144
     * Use {@link java.util.regex.Matcher#quoteReplacement} to suppress the special
jaroslav@49
  2145
     * meaning of these characters, if desired.
jaroslav@49
  2146
     *
jaroslav@49
  2147
     * @param   regex
jaroslav@49
  2148
     *          the regular expression to which this string is to be matched
jaroslav@49
  2149
     * @param   replacement
jaroslav@49
  2150
     *          the string to be substituted for the first match
jaroslav@49
  2151
     *
jaroslav@49
  2152
     * @return  The resulting <tt>String</tt>
jaroslav@49
  2153
     *
jaroslav@49
  2154
     * @throws  PatternSyntaxException
jaroslav@49
  2155
     *          if the regular expression's syntax is invalid
jaroslav@49
  2156
     *
jaroslav@49
  2157
     * @see java.util.regex.Pattern
jaroslav@49
  2158
     *
jaroslav@49
  2159
     * @since 1.4
jaroslav@49
  2160
     * @spec JSR-51
jaroslav@49
  2161
     */
jaroslav@49
  2162
    public String replaceFirst(String regex, String replacement) {
jaroslav@64
  2163
        throw new UnsupportedOperationException();
jaroslav@49
  2164
    }
jaroslav@49
  2165
jaroslav@49
  2166
    /**
jaroslav@49
  2167
     * Replaces each substring of this string that matches the given <a
jaroslav@49
  2168
     * href="../util/regex/Pattern.html#sum">regular expression</a> with the
jaroslav@49
  2169
     * given replacement.
jaroslav@49
  2170
     *
jaroslav@49
  2171
     * <p> An invocation of this method of the form
jaroslav@49
  2172
     * <i>str</i><tt>.replaceAll(</tt><i>regex</i><tt>,</tt> <i>repl</i><tt>)</tt>
jaroslav@49
  2173
     * yields exactly the same result as the expression
jaroslav@49
  2174
     *
jaroslav@49
  2175
     * <blockquote><tt>
jaroslav@49
  2176
     * {@link java.util.regex.Pattern}.{@link java.util.regex.Pattern#compile
jaroslav@49
  2177
     * compile}(</tt><i>regex</i><tt>).{@link
jaroslav@49
  2178
     * java.util.regex.Pattern#matcher(java.lang.CharSequence)
jaroslav@49
  2179
     * matcher}(</tt><i>str</i><tt>).{@link java.util.regex.Matcher#replaceAll
jaroslav@49
  2180
     * replaceAll}(</tt><i>repl</i><tt>)</tt></blockquote>
jaroslav@49
  2181
     *
jaroslav@49
  2182
     *<p>
jaroslav@49
  2183
     * Note that backslashes (<tt>\</tt>) and dollar signs (<tt>$</tt>) in the
jaroslav@49
  2184
     * replacement string may cause the results to be different than if it were
jaroslav@49
  2185
     * being treated as a literal replacement string; see
jaroslav@49
  2186
     * {@link java.util.regex.Matcher#replaceAll Matcher.replaceAll}.
jaroslav@49
  2187
     * Use {@link java.util.regex.Matcher#quoteReplacement} to suppress the special
jaroslav@49
  2188
     * meaning of these characters, if desired.
jaroslav@49
  2189
     *
jaroslav@49
  2190
     * @param   regex
jaroslav@49
  2191
     *          the regular expression to which this string is to be matched
jaroslav@49
  2192
     * @param   replacement
jaroslav@49
  2193
     *          the string to be substituted for each match
jaroslav@49
  2194
     *
jaroslav@49
  2195
     * @return  The resulting <tt>String</tt>
jaroslav@49
  2196
     *
jaroslav@49
  2197
     * @throws  PatternSyntaxException
jaroslav@49
  2198
     *          if the regular expression's syntax is invalid
jaroslav@49
  2199
     *
jaroslav@49
  2200
     * @see java.util.regex.Pattern
jaroslav@49
  2201
     *
jaroslav@49
  2202
     * @since 1.4
jaroslav@49
  2203
     * @spec JSR-51
jaroslav@49
  2204
     */
jaroslav@49
  2205
    public String replaceAll(String regex, String replacement) {
jaroslav@64
  2206
        throw new UnsupportedOperationException();
jaroslav@49
  2207
    }
jaroslav@49
  2208
jaroslav@49
  2209
    /**
jaroslav@49
  2210
     * Replaces each substring of this string that matches the literal target
jaroslav@49
  2211
     * sequence with the specified literal replacement sequence. The
jaroslav@49
  2212
     * replacement proceeds from the beginning of the string to the end, for
jaroslav@49
  2213
     * example, replacing "aa" with "b" in the string "aaa" will result in
jaroslav@49
  2214
     * "ba" rather than "ab".
jaroslav@49
  2215
     *
jaroslav@49
  2216
     * @param  target The sequence of char values to be replaced
jaroslav@49
  2217
     * @param  replacement The replacement sequence of char values
jaroslav@49
  2218
     * @return  The resulting string
jaroslav@49
  2219
     * @throws NullPointerException if <code>target</code> or
jaroslav@49
  2220
     *         <code>replacement</code> is <code>null</code>.
jaroslav@49
  2221
     * @since 1.5
jaroslav@49
  2222
     */
jaroslav@926
  2223
    @JavaScriptBody(args = { "target", "replacement" }, body = 
jaroslav@926
  2224
          "var s = this.toString();\n"
jaroslav@926
  2225
        + "target = target.toString();\n"
jaroslav@926
  2226
        + "replacement = replacement.toString();\n"
jaroslav@926
  2227
        + "for (;;) {\n"
jaroslav@926
  2228
        + "  var ret = s.replace(target, replacement);\n"
jaroslav@926
  2229
        + "  if (ret === s) {\n"
jaroslav@926
  2230
        + "    return ret;\n"
jaroslav@926
  2231
        + "  }\n"
jaroslav@926
  2232
        + "  s = ret;\n"
jaroslav@926
  2233
        + "}"
jaroslav@926
  2234
    )
jaroslav@926
  2235
    public native String replace(CharSequence target, CharSequence replacement);
jaroslav@49
  2236
jaroslav@49
  2237
    /**
jaroslav@49
  2238
     * Splits this string around matches of the given
jaroslav@49
  2239
     * <a href="../util/regex/Pattern.html#sum">regular expression</a>.
jaroslav@49
  2240
     *
jaroslav@49
  2241
     * <p> The array returned by this method contains each substring of this
jaroslav@49
  2242
     * string that is terminated by another substring that matches the given
jaroslav@49
  2243
     * expression or is terminated by the end of the string.  The substrings in
jaroslav@49
  2244
     * the array are in the order in which they occur in this string.  If the
jaroslav@49
  2245
     * expression does not match any part of the input then the resulting array
jaroslav@49
  2246
     * has just one element, namely this string.
jaroslav@49
  2247
     *
jaroslav@49
  2248
     * <p> The <tt>limit</tt> parameter controls the number of times the
jaroslav@49
  2249
     * pattern is applied and therefore affects the length of the resulting
jaroslav@49
  2250
     * array.  If the limit <i>n</i> is greater than zero then the pattern
jaroslav@49
  2251
     * will be applied at most <i>n</i>&nbsp;-&nbsp;1 times, the array's
jaroslav@49
  2252
     * length will be no greater than <i>n</i>, and the array's last entry
jaroslav@49
  2253
     * will contain all input beyond the last matched delimiter.  If <i>n</i>
jaroslav@49
  2254
     * is non-positive then the pattern will be applied as many times as
jaroslav@49
  2255
     * possible and the array can have any length.  If <i>n</i> is zero then
jaroslav@49
  2256
     * the pattern will be applied as many times as possible, the array can
jaroslav@49
  2257
     * have any length, and trailing empty strings will be discarded.
jaroslav@49
  2258
     *
jaroslav@49
  2259
     * <p> The string <tt>"boo:and:foo"</tt>, for example, yields the
jaroslav@49
  2260
     * following results with these parameters:
jaroslav@49
  2261
     *
jaroslav@49
  2262
     * <blockquote><table cellpadding=1 cellspacing=0 summary="Split example showing regex, limit, and result">
jaroslav@49
  2263
     * <tr>
jaroslav@49
  2264
     *     <th>Regex</th>
jaroslav@49
  2265
     *     <th>Limit</th>
jaroslav@49
  2266
     *     <th>Result</th>
jaroslav@49
  2267
     * </tr>
jaroslav@49
  2268
     * <tr><td align=center>:</td>
jaroslav@49
  2269
     *     <td align=center>2</td>
jaroslav@49
  2270
     *     <td><tt>{ "boo", "and:foo" }</tt></td></tr>
jaroslav@49
  2271
     * <tr><td align=center>:</td>
jaroslav@49
  2272
     *     <td align=center>5</td>
jaroslav@49
  2273
     *     <td><tt>{ "boo", "and", "foo" }</tt></td></tr>
jaroslav@49
  2274
     * <tr><td align=center>:</td>
jaroslav@49
  2275
     *     <td align=center>-2</td>
jaroslav@49
  2276
     *     <td><tt>{ "boo", "and", "foo" }</tt></td></tr>
jaroslav@49
  2277
     * <tr><td align=center>o</td>
jaroslav@49
  2278
     *     <td align=center>5</td>
jaroslav@49
  2279
     *     <td><tt>{ "b", "", ":and:f", "", "" }</tt></td></tr>
jaroslav@49
  2280
     * <tr><td align=center>o</td>
jaroslav@49
  2281
     *     <td align=center>-2</td>
jaroslav@49
  2282
     *     <td><tt>{ "b", "", ":and:f", "", "" }</tt></td></tr>
jaroslav@49
  2283
     * <tr><td align=center>o</td>
jaroslav@49
  2284
     *     <td align=center>0</td>
jaroslav@49
  2285
     *     <td><tt>{ "b", "", ":and:f" }</tt></td></tr>
jaroslav@49
  2286
     * </table></blockquote>
jaroslav@49
  2287
     *
jaroslav@49
  2288
     * <p> An invocation of this method of the form
jaroslav@49
  2289
     * <i>str.</i><tt>split(</tt><i>regex</i><tt>,</tt>&nbsp;<i>n</i><tt>)</tt>
jaroslav@49
  2290
     * yields the same result as the expression
jaroslav@49
  2291
     *
jaroslav@49
  2292
     * <blockquote>
jaroslav@49
  2293
     * {@link java.util.regex.Pattern}.{@link java.util.regex.Pattern#compile
jaroslav@49
  2294
     * compile}<tt>(</tt><i>regex</i><tt>)</tt>.{@link
jaroslav@49
  2295
     * java.util.regex.Pattern#split(java.lang.CharSequence,int)
jaroslav@49
  2296
     * split}<tt>(</tt><i>str</i><tt>,</tt>&nbsp;<i>n</i><tt>)</tt>
jaroslav@49
  2297
     * </blockquote>
jaroslav@49
  2298
     *
jaroslav@49
  2299
     *
jaroslav@49
  2300
     * @param  regex
jaroslav@49
  2301
     *         the delimiting regular expression
jaroslav@49
  2302
     *
jaroslav@49
  2303
     * @param  limit
jaroslav@49
  2304
     *         the result threshold, as described above
jaroslav@49
  2305
     *
jaroslav@49
  2306
     * @return  the array of strings computed by splitting this string
jaroslav@49
  2307
     *          around matches of the given regular expression
jaroslav@49
  2308
     *
jaroslav@49
  2309
     * @throws  PatternSyntaxException
jaroslav@49
  2310
     *          if the regular expression's syntax is invalid
jaroslav@49
  2311
     *
jaroslav@49
  2312
     * @see java.util.regex.Pattern
jaroslav@49
  2313
     *
jaroslav@49
  2314
     * @since 1.4
jaroslav@49
  2315
     * @spec JSR-51
jaroslav@49
  2316
     */
jaroslav@49
  2317
    public String[] split(String regex, int limit) {
jaroslav@1272
  2318
        if (limit <= 0) {
jaroslav@1272
  2319
            Object[] arr = splitImpl(this, regex, Integer.MAX_VALUE);
jaroslav@1272
  2320
            int to = arr.length;
jaroslav@1272
  2321
            if (limit == 0) {
jaroslav@1272
  2322
                while (to > 1 && ((String)arr[--to]).isEmpty()) {
jaroslav@1272
  2323
                }
jaroslav@1272
  2324
                to++;
jaroslav@1272
  2325
            }
jaroslav@1272
  2326
            String[] ret = new String[to];
jaroslav@1272
  2327
            System.arraycopy(arr, 0, ret, 0, to);
jaroslav@1272
  2328
            return ret;
jaroslav@1272
  2329
        } else {
jaroslav@1272
  2330
            Object[] arr = splitImpl(this, regex, limit);
jaroslav@1272
  2331
            String[] ret = new String[arr.length];
jaroslav@1272
  2332
            int pos = 0;
jaroslav@1272
  2333
            for (int i = 0; i < arr.length; i++) {
jaroslav@1272
  2334
                final String s = (String)arr[i];
jaroslav@1272
  2335
                ret[i] = s;
jaroslav@1272
  2336
                pos = indexOf(s, pos) + s.length();
jaroslav@1272
  2337
            }
jaroslav@1272
  2338
            ret[arr.length - 1] += substring(pos);
jaroslav@1272
  2339
            return ret;
jaroslav@1272
  2340
        }
jaroslav@49
  2341
    }
jaroslav@1272
  2342
    
jaroslav@1272
  2343
    @JavaScriptBody(args = { "str", "regex", "limit"}, body = 
jaroslav@1272
  2344
        "return str.split(new RegExp(regex), limit);"
jaroslav@1272
  2345
    )
jaroslav@1272
  2346
    private static native Object[] splitImpl(String str, String regex, int limit);
jaroslav@49
  2347
jaroslav@49
  2348
    /**
jaroslav@49
  2349
     * Splits this string around matches of the given <a
jaroslav@49
  2350
     * href="../util/regex/Pattern.html#sum">regular expression</a>.
jaroslav@49
  2351
     *
jaroslav@49
  2352
     * <p> This method works as if by invoking the two-argument {@link
jaroslav@49
  2353
     * #split(String, int) split} method with the given expression and a limit
jaroslav@49
  2354
     * argument of zero.  Trailing empty strings are therefore not included in
jaroslav@49
  2355
     * the resulting array.
jaroslav@49
  2356
     *
jaroslav@49
  2357
     * <p> The string <tt>"boo:and:foo"</tt>, for example, yields the following
jaroslav@49
  2358
     * results with these expressions:
jaroslav@49
  2359
     *
jaroslav@49
  2360
     * <blockquote><table cellpadding=1 cellspacing=0 summary="Split examples showing regex and result">
jaroslav@49
  2361
     * <tr>
jaroslav@49
  2362
     *  <th>Regex</th>
jaroslav@49
  2363
     *  <th>Result</th>
jaroslav@49
  2364
     * </tr>
jaroslav@49
  2365
     * <tr><td align=center>:</td>
jaroslav@49
  2366
     *     <td><tt>{ "boo", "and", "foo" }</tt></td></tr>
jaroslav@49
  2367
     * <tr><td align=center>o</td>
jaroslav@49
  2368
     *     <td><tt>{ "b", "", ":and:f" }</tt></td></tr>
jaroslav@49
  2369
     * </table></blockquote>
jaroslav@49
  2370
     *
jaroslav@49
  2371
     *
jaroslav@49
  2372
     * @param  regex
jaroslav@49
  2373
     *         the delimiting regular expression
jaroslav@49
  2374
     *
jaroslav@49
  2375
     * @return  the array of strings computed by splitting this string
jaroslav@49
  2376
     *          around matches of the given regular expression
jaroslav@49
  2377
     *
jaroslav@49
  2378
     * @throws  PatternSyntaxException
jaroslav@49
  2379
     *          if the regular expression's syntax is invalid
jaroslav@49
  2380
     *
jaroslav@49
  2381
     * @see java.util.regex.Pattern
jaroslav@49
  2382
     *
jaroslav@49
  2383
     * @since 1.4
jaroslav@49
  2384
     * @spec JSR-51
jaroslav@49
  2385
     */
jaroslav@49
  2386
    public String[] split(String regex) {
jaroslav@49
  2387
        return split(regex, 0);
jaroslav@49
  2388
    }
jaroslav@49
  2389
jaroslav@49
  2390
    /**
jaroslav@49
  2391
     * Converts all of the characters in this <code>String</code> to lower
jaroslav@49
  2392
     * case using the rules of the given <code>Locale</code>.  Case mapping is based
jaroslav@49
  2393
     * on the Unicode Standard version specified by the {@link java.lang.Character Character}
jaroslav@49
  2394
     * class. Since case mappings are not always 1:1 char mappings, the resulting
jaroslav@49
  2395
     * <code>String</code> may be a different length than the original <code>String</code>.
jaroslav@49
  2396
     * <p>
jaroslav@49
  2397
     * Examples of lowercase  mappings are in the following table:
jaroslav@49
  2398
     * <table border="1" summary="Lowercase mapping examples showing language code of locale, upper case, lower case, and description">
jaroslav@49
  2399
     * <tr>
jaroslav@49
  2400
     *   <th>Language Code of Locale</th>
jaroslav@49
  2401
     *   <th>Upper Case</th>
jaroslav@49
  2402
     *   <th>Lower Case</th>
jaroslav@49
  2403
     *   <th>Description</th>
jaroslav@49
  2404
     * </tr>
jaroslav@49
  2405
     * <tr>
jaroslav@49
  2406
     *   <td>tr (Turkish)</td>
jaroslav@49
  2407
     *   <td>&#92;u0130</td>
jaroslav@49
  2408
     *   <td>&#92;u0069</td>
jaroslav@49
  2409
     *   <td>capital letter I with dot above -&gt; small letter i</td>
jaroslav@49
  2410
     * </tr>
jaroslav@49
  2411
     * <tr>
jaroslav@49
  2412
     *   <td>tr (Turkish)</td>
jaroslav@49
  2413
     *   <td>&#92;u0049</td>
jaroslav@49
  2414
     *   <td>&#92;u0131</td>
jaroslav@49
  2415
     *   <td>capital letter I -&gt; small letter dotless i </td>
jaroslav@49
  2416
     * </tr>
jaroslav@49
  2417
     * <tr>
jaroslav@49
  2418
     *   <td>(all)</td>
jaroslav@49
  2419
     *   <td>French Fries</td>
jaroslav@49
  2420
     *   <td>french fries</td>
jaroslav@49
  2421
     *   <td>lowercased all chars in String</td>
jaroslav@49
  2422
     * </tr>
jaroslav@49
  2423
     * <tr>
jaroslav@49
  2424
     *   <td>(all)</td>
jaroslav@49
  2425
     *   <td><img src="doc-files/capiota.gif" alt="capiota"><img src="doc-files/capchi.gif" alt="capchi">
jaroslav@49
  2426
     *       <img src="doc-files/captheta.gif" alt="captheta"><img src="doc-files/capupsil.gif" alt="capupsil">
jaroslav@49
  2427
     *       <img src="doc-files/capsigma.gif" alt="capsigma"></td>
jaroslav@49
  2428
     *   <td><img src="doc-files/iota.gif" alt="iota"><img src="doc-files/chi.gif" alt="chi">
jaroslav@49
  2429
     *       <img src="doc-files/theta.gif" alt="theta"><img src="doc-files/upsilon.gif" alt="upsilon">
jaroslav@49
  2430
     *       <img src="doc-files/sigma1.gif" alt="sigma"></td>
jaroslav@49
  2431
     *   <td>lowercased all chars in String</td>
jaroslav@49
  2432
     * </tr>
jaroslav@49
  2433
     * </table>
jaroslav@49
  2434
     *
jaroslav@49
  2435
     * @param locale use the case transformation rules for this locale
jaroslav@49
  2436
     * @return the <code>String</code>, converted to lowercase.
jaroslav@49
  2437
     * @see     java.lang.String#toLowerCase()
jaroslav@49
  2438
     * @see     java.lang.String#toUpperCase()
jaroslav@49
  2439
     * @see     java.lang.String#toUpperCase(Locale)
jaroslav@49
  2440
     * @since   1.1
jaroslav@49
  2441
     */
jaroslav@61
  2442
//    public String toLowerCase(Locale locale) {
jaroslav@61
  2443
//        if (locale == null) {
jaroslav@61
  2444
//            throw new NullPointerException();
jaroslav@61
  2445
//        }
jaroslav@61
  2446
//
jaroslav@61
  2447
//        int     firstUpper;
jaroslav@61
  2448
//
jaroslav@61
  2449
//        /* Now check if there are any characters that need to be changed. */
jaroslav@61
  2450
//        scan: {
jaroslav@61
  2451
//            for (firstUpper = 0 ; firstUpper < count; ) {
jaroslav@61
  2452
//                char c = value[offset+firstUpper];
jaroslav@61
  2453
//                if ((c >= Character.MIN_HIGH_SURROGATE) &&
jaroslav@61
  2454
//                    (c <= Character.MAX_HIGH_SURROGATE)) {
jaroslav@61
  2455
//                    int supplChar = codePointAt(firstUpper);
jaroslav@61
  2456
//                    if (supplChar != Character.toLowerCase(supplChar)) {
jaroslav@61
  2457
//                        break scan;
jaroslav@61
  2458
//                    }
jaroslav@61
  2459
//                    firstUpper += Character.charCount(supplChar);
jaroslav@61
  2460
//                } else {
jaroslav@61
  2461
//                    if (c != Character.toLowerCase(c)) {
jaroslav@61
  2462
//                        break scan;
jaroslav@61
  2463
//                    }
jaroslav@61
  2464
//                    firstUpper++;
jaroslav@61
  2465
//                }
jaroslav@61
  2466
//            }
jaroslav@61
  2467
//            return this;
jaroslav@61
  2468
//        }
jaroslav@61
  2469
//
jaroslav@61
  2470
//        char[]  result = new char[count];
jaroslav@61
  2471
//        int     resultOffset = 0;  /* result may grow, so i+resultOffset
jaroslav@61
  2472
//                                    * is the write location in result */
jaroslav@61
  2473
//
jaroslav@61
  2474
//        /* Just copy the first few lowerCase characters. */
jaroslav@560
  2475
//        System.arraycopy(value, offset, result, 0, firstUpper);
jaroslav@61
  2476
//
jaroslav@61
  2477
//        String lang = locale.getLanguage();
jaroslav@61
  2478
//        boolean localeDependent =
jaroslav@61
  2479
//            (lang == "tr" || lang == "az" || lang == "lt");
jaroslav@61
  2480
//        char[] lowerCharArray;
jaroslav@61
  2481
//        int lowerChar;
jaroslav@61
  2482
//        int srcChar;
jaroslav@61
  2483
//        int srcCount;
jaroslav@61
  2484
//        for (int i = firstUpper; i < count; i += srcCount) {
jaroslav@61
  2485
//            srcChar = (int)value[offset+i];
jaroslav@61
  2486
//            if ((char)srcChar >= Character.MIN_HIGH_SURROGATE &&
jaroslav@61
  2487
//                (char)srcChar <= Character.MAX_HIGH_SURROGATE) {
jaroslav@61
  2488
//                srcChar = codePointAt(i);
jaroslav@61
  2489
//                srcCount = Character.charCount(srcChar);
jaroslav@61
  2490
//            } else {
jaroslav@61
  2491
//                srcCount = 1;
jaroslav@61
  2492
//            }
jaroslav@61
  2493
//            if (localeDependent || srcChar == '\u03A3') { // GREEK CAPITAL LETTER SIGMA
jaroslav@61
  2494
//                lowerChar = ConditionalSpecialCasing.toLowerCaseEx(this, i, locale);
jaroslav@61
  2495
//            } else if (srcChar == '\u0130') { // LATIN CAPITAL LETTER I DOT
jaroslav@61
  2496
//                lowerChar = Character.ERROR;
jaroslav@61
  2497
//            } else {
jaroslav@61
  2498
//                lowerChar = Character.toLowerCase(srcChar);
jaroslav@61
  2499
//            }
jaroslav@61
  2500
//            if ((lowerChar == Character.ERROR) ||
jaroslav@61
  2501
//                (lowerChar >= Character.MIN_SUPPLEMENTARY_CODE_POINT)) {
jaroslav@61
  2502
//                if (lowerChar == Character.ERROR) {
jaroslav@61
  2503
//                     if (!localeDependent && srcChar == '\u0130') {
jaroslav@61
  2504
//                         lowerCharArray =
jaroslav@61
  2505
//                             ConditionalSpecialCasing.toLowerCaseCharArray(this, i, Locale.ENGLISH);
jaroslav@61
  2506
//                     } else {
jaroslav@61
  2507
//                        lowerCharArray =
jaroslav@61
  2508
//                            ConditionalSpecialCasing.toLowerCaseCharArray(this, i, locale);
jaroslav@61
  2509
//                     }
jaroslav@61
  2510
//                } else if (srcCount == 2) {
jaroslav@61
  2511
//                    resultOffset += Character.toChars(lowerChar, result, i + resultOffset) - srcCount;
jaroslav@61
  2512
//                    continue;
jaroslav@61
  2513
//                } else {
jaroslav@61
  2514
//                    lowerCharArray = Character.toChars(lowerChar);
jaroslav@61
  2515
//                }
jaroslav@61
  2516
//
jaroslav@61
  2517
//                /* Grow result if needed */
jaroslav@61
  2518
//                int mapLen = lowerCharArray.length;
jaroslav@61
  2519
//                if (mapLen > srcCount) {
jaroslav@61
  2520
//                    char[] result2 = new char[result.length + mapLen - srcCount];
jaroslav@560
  2521
//                    System.arraycopy(result, 0, result2, 0,
jaroslav@61
  2522
//                        i + resultOffset);
jaroslav@61
  2523
//                    result = result2;
jaroslav@61
  2524
//                }
jaroslav@61
  2525
//                for (int x=0; x<mapLen; ++x) {
jaroslav@61
  2526
//                    result[i+resultOffset+x] = lowerCharArray[x];
jaroslav@61
  2527
//                }
jaroslav@61
  2528
//                resultOffset += (mapLen - srcCount);
jaroslav@61
  2529
//            } else {
jaroslav@61
  2530
//                result[i+resultOffset] = (char)lowerChar;
jaroslav@61
  2531
//            }
jaroslav@61
  2532
//        }
jaroslav@61
  2533
//        return new String(0, count+resultOffset, result);
jaroslav@61
  2534
//    }
jaroslav@49
  2535
jaroslav@49
  2536
    /**
jaroslav@49
  2537
     * Converts all of the characters in this <code>String</code> to lower
jaroslav@49
  2538
     * case using the rules of the default locale. This is equivalent to calling
jaroslav@49
  2539
     * <code>toLowerCase(Locale.getDefault())</code>.
jaroslav@49
  2540
     * <p>
jaroslav@49
  2541
     * <b>Note:</b> This method is locale sensitive, and may produce unexpected
jaroslav@49
  2542
     * results if used for strings that are intended to be interpreted locale
jaroslav@49
  2543
     * independently.
jaroslav@49
  2544
     * Examples are programming language identifiers, protocol keys, and HTML
jaroslav@49
  2545
     * tags.
jaroslav@49
  2546
     * For instance, <code>"TITLE".toLowerCase()</code> in a Turkish locale
jaroslav@49
  2547
     * returns <code>"t\u005Cu0131tle"</code>, where '\u005Cu0131' is the
jaroslav@49
  2548
     * LATIN SMALL LETTER DOTLESS I character.
jaroslav@49
  2549
     * To obtain correct results for locale insensitive strings, use
jaroslav@49
  2550
     * <code>toLowerCase(Locale.ENGLISH)</code>.
jaroslav@49
  2551
     * <p>
jaroslav@49
  2552
     * @return  the <code>String</code>, converted to lowercase.
jaroslav@49
  2553
     * @see     java.lang.String#toLowerCase(Locale)
jaroslav@49
  2554
     */
jaroslav@443
  2555
    @JavaScriptBody(args = {}, body = "return this.toLowerCase();")
jaroslav@49
  2556
    public String toLowerCase() {
jaroslav@64
  2557
        throw new UnsupportedOperationException("Should be supported but without connection to locale");
jaroslav@49
  2558
    }
jaroslav@49
  2559
jaroslav@49
  2560
    /**
jaroslav@49
  2561
     * Converts all of the characters in this <code>String</code> to upper
jaroslav@49
  2562
     * case using the rules of the given <code>Locale</code>. Case mapping is based
jaroslav@49
  2563
     * on the Unicode Standard version specified by the {@link java.lang.Character Character}
jaroslav@49
  2564
     * class. Since case mappings are not always 1:1 char mappings, the resulting
jaroslav@49
  2565
     * <code>String</code> may be a different length than the original <code>String</code>.
jaroslav@49
  2566
     * <p>
jaroslav@49
  2567
     * Examples of locale-sensitive and 1:M case mappings are in the following table.
jaroslav@49
  2568
     * <p>
jaroslav@49
  2569
     * <table border="1" summary="Examples of locale-sensitive and 1:M case mappings. Shows Language code of locale, lower case, upper case, and description.">
jaroslav@49
  2570
     * <tr>
jaroslav@49
  2571
     *   <th>Language Code of Locale</th>
jaroslav@49
  2572
     *   <th>Lower Case</th>
jaroslav@49
  2573
     *   <th>Upper Case</th>
jaroslav@49
  2574
     *   <th>Description</th>
jaroslav@49
  2575
     * </tr>
jaroslav@49
  2576
     * <tr>
jaroslav@49
  2577
     *   <td>tr (Turkish)</td>
jaroslav@49
  2578
     *   <td>&#92;u0069</td>
jaroslav@49
  2579
     *   <td>&#92;u0130</td>
jaroslav@49
  2580
     *   <td>small letter i -&gt; capital letter I with dot above</td>
jaroslav@49
  2581
     * </tr>
jaroslav@49
  2582
     * <tr>
jaroslav@49
  2583
     *   <td>tr (Turkish)</td>
jaroslav@49
  2584
     *   <td>&#92;u0131</td>
jaroslav@49
  2585
     *   <td>&#92;u0049</td>
jaroslav@49
  2586
     *   <td>small letter dotless i -&gt; capital letter I</td>
jaroslav@49
  2587
     * </tr>
jaroslav@49
  2588
     * <tr>
jaroslav@49
  2589
     *   <td>(all)</td>
jaroslav@49
  2590
     *   <td>&#92;u00df</td>
jaroslav@49
  2591
     *   <td>&#92;u0053 &#92;u0053</td>
jaroslav@49
  2592
     *   <td>small letter sharp s -&gt; two letters: SS</td>
jaroslav@49
  2593
     * </tr>
jaroslav@49
  2594
     * <tr>
jaroslav@49
  2595
     *   <td>(all)</td>
jaroslav@49
  2596
     *   <td>Fahrvergn&uuml;gen</td>
jaroslav@49
  2597
     *   <td>FAHRVERGN&Uuml;GEN</td>
jaroslav@49
  2598
     *   <td></td>
jaroslav@49
  2599
     * </tr>
jaroslav@49
  2600
     * </table>
jaroslav@49
  2601
     * @param locale use the case transformation rules for this locale
jaroslav@49
  2602
     * @return the <code>String</code>, converted to uppercase.
jaroslav@49
  2603
     * @see     java.lang.String#toUpperCase()
jaroslav@49
  2604
     * @see     java.lang.String#toLowerCase()
jaroslav@49
  2605
     * @see     java.lang.String#toLowerCase(Locale)
jaroslav@49
  2606
     * @since   1.1
jaroslav@49
  2607
     */
jaroslav@61
  2608
    /* not for javascript 
jaroslav@49
  2609
    public String toUpperCase(Locale locale) {
jaroslav@49
  2610
        if (locale == null) {
jaroslav@49
  2611
            throw new NullPointerException();
jaroslav@49
  2612
        }
jaroslav@49
  2613
jaroslav@49
  2614
        int     firstLower;
jaroslav@49
  2615
jaroslav@61
  2616
        // Now check if there are any characters that need to be changed. 
jaroslav@49
  2617
        scan: {
jaroslav@49
  2618
            for (firstLower = 0 ; firstLower < count; ) {
jaroslav@49
  2619
                int c = (int)value[offset+firstLower];
jaroslav@49
  2620
                int srcCount;
jaroslav@49
  2621
                if ((c >= Character.MIN_HIGH_SURROGATE) &&
jaroslav@49
  2622
                    (c <= Character.MAX_HIGH_SURROGATE)) {
jaroslav@49
  2623
                    c = codePointAt(firstLower);
jaroslav@49
  2624
                    srcCount = Character.charCount(c);
jaroslav@49
  2625
                } else {
jaroslav@49
  2626
                    srcCount = 1;
jaroslav@49
  2627
                }
jaroslav@49
  2628
                int upperCaseChar = Character.toUpperCaseEx(c);
jaroslav@49
  2629
                if ((upperCaseChar == Character.ERROR) ||
jaroslav@49
  2630
                    (c != upperCaseChar)) {
jaroslav@49
  2631
                    break scan;
jaroslav@49
  2632
                }
jaroslav@49
  2633
                firstLower += srcCount;
jaroslav@49
  2634
            }
jaroslav@49
  2635
            return this;
jaroslav@49
  2636
        }
jaroslav@49
  2637
jaroslav@61
  2638
        char[]  result       = new char[count]; /* may grow *
jaroslav@49
  2639
        int     resultOffset = 0;  /* result may grow, so i+resultOffset
jaroslav@61
  2640
                                    * is the write location in result *
jaroslav@49
  2641
jaroslav@61
  2642
        /* Just copy the first few upperCase characters. *
jaroslav@560
  2643
        System.arraycopy(value, offset, result, 0, firstLower);
jaroslav@49
  2644
jaroslav@49
  2645
        String lang = locale.getLanguage();
jaroslav@49
  2646
        boolean localeDependent =
jaroslav@49
  2647
            (lang == "tr" || lang == "az" || lang == "lt");
jaroslav@49
  2648
        char[] upperCharArray;
jaroslav@49
  2649
        int upperChar;
jaroslav@49
  2650
        int srcChar;
jaroslav@49
  2651
        int srcCount;
jaroslav@49
  2652
        for (int i = firstLower; i < count; i += srcCount) {
jaroslav@49
  2653
            srcChar = (int)value[offset+i];
jaroslav@49
  2654
            if ((char)srcChar >= Character.MIN_HIGH_SURROGATE &&
jaroslav@49
  2655
                (char)srcChar <= Character.MAX_HIGH_SURROGATE) {
jaroslav@49
  2656
                srcChar = codePointAt(i);
jaroslav@49
  2657
                srcCount = Character.charCount(srcChar);
jaroslav@49
  2658
            } else {
jaroslav@49
  2659
                srcCount = 1;
jaroslav@49
  2660
            }
jaroslav@49
  2661
            if (localeDependent) {
jaroslav@49
  2662
                upperChar = ConditionalSpecialCasing.toUpperCaseEx(this, i, locale);
jaroslav@49
  2663
            } else {
jaroslav@49
  2664
                upperChar = Character.toUpperCaseEx(srcChar);
jaroslav@49
  2665
            }
jaroslav@49
  2666
            if ((upperChar == Character.ERROR) ||
jaroslav@49
  2667
                (upperChar >= Character.MIN_SUPPLEMENTARY_CODE_POINT)) {
jaroslav@49
  2668
                if (upperChar == Character.ERROR) {
jaroslav@49
  2669
                    if (localeDependent) {
jaroslav@49
  2670
                        upperCharArray =
jaroslav@49
  2671
                            ConditionalSpecialCasing.toUpperCaseCharArray(this, i, locale);
jaroslav@49
  2672
                    } else {
jaroslav@49
  2673
                        upperCharArray = Character.toUpperCaseCharArray(srcChar);
jaroslav@49
  2674
                    }
jaroslav@49
  2675
                } else if (srcCount == 2) {
jaroslav@49
  2676
                    resultOffset += Character.toChars(upperChar, result, i + resultOffset) - srcCount;
jaroslav@49
  2677
                    continue;
jaroslav@49
  2678
                } else {
jaroslav@49
  2679
                    upperCharArray = Character.toChars(upperChar);
jaroslav@49
  2680
                }
jaroslav@49
  2681
jaroslav@61
  2682
                /* Grow result if needed *
jaroslav@49
  2683
                int mapLen = upperCharArray.length;
jaroslav@49
  2684
                if (mapLen > srcCount) {
jaroslav@49
  2685
                    char[] result2 = new char[result.length + mapLen - srcCount];
jaroslav@560
  2686
                    System.arraycopy(result, 0, result2, 0,
jaroslav@49
  2687
                        i + resultOffset);
jaroslav@49
  2688
                    result = result2;
jaroslav@49
  2689
                }
jaroslav@49
  2690
                for (int x=0; x<mapLen; ++x) {
jaroslav@49
  2691
                    result[i+resultOffset+x] = upperCharArray[x];
jaroslav@49
  2692
                }
jaroslav@49
  2693
                resultOffset += (mapLen - srcCount);
jaroslav@49
  2694
            } else {
jaroslav@49
  2695
                result[i+resultOffset] = (char)upperChar;
jaroslav@49
  2696
            }
jaroslav@49
  2697
        }
jaroslav@49
  2698
        return new String(0, count+resultOffset, result);
jaroslav@49
  2699
    }
jaroslav@61
  2700
    */
jaroslav@49
  2701
jaroslav@49
  2702
    /**
jaroslav@49
  2703
     * Converts all of the characters in this <code>String</code> to upper
jaroslav@49
  2704
     * case using the rules of the default locale. This method is equivalent to
jaroslav@49
  2705
     * <code>toUpperCase(Locale.getDefault())</code>.
jaroslav@49
  2706
     * <p>
jaroslav@49
  2707
     * <b>Note:</b> This method is locale sensitive, and may produce unexpected
jaroslav@49
  2708
     * results if used for strings that are intended to be interpreted locale
jaroslav@49
  2709
     * independently.
jaroslav@49
  2710
     * Examples are programming language identifiers, protocol keys, and HTML
jaroslav@49
  2711
     * tags.
jaroslav@49
  2712
     * For instance, <code>"title".toUpperCase()</code> in a Turkish locale
jaroslav@49
  2713
     * returns <code>"T\u005Cu0130TLE"</code>, where '\u005Cu0130' is the
jaroslav@49
  2714
     * LATIN CAPITAL LETTER I WITH DOT ABOVE character.
jaroslav@49
  2715
     * To obtain correct results for locale insensitive strings, use
jaroslav@49
  2716
     * <code>toUpperCase(Locale.ENGLISH)</code>.
jaroslav@49
  2717
     * <p>
jaroslav@49
  2718
     * @return  the <code>String</code>, converted to uppercase.
jaroslav@49
  2719
     * @see     java.lang.String#toUpperCase(Locale)
jaroslav@49
  2720
     */
jaroslav@443
  2721
    @JavaScriptBody(args = {}, body = "return this.toUpperCase();")
jaroslav@49
  2722
    public String toUpperCase() {
jaroslav@61
  2723
        throw new UnsupportedOperationException();
jaroslav@49
  2724
    }
jaroslav@49
  2725
jaroslav@49
  2726
    /**
jaroslav@49
  2727
     * Returns a copy of the string, with leading and trailing whitespace
jaroslav@49
  2728
     * omitted.
jaroslav@49
  2729
     * <p>
jaroslav@49
  2730
     * If this <code>String</code> object represents an empty character
jaroslav@49
  2731
     * sequence, or the first and last characters of character sequence
jaroslav@49
  2732
     * represented by this <code>String</code> object both have codes
jaroslav@49
  2733
     * greater than <code>'&#92;u0020'</code> (the space character), then a
jaroslav@49
  2734
     * reference to this <code>String</code> object is returned.
jaroslav@49
  2735
     * <p>
jaroslav@49
  2736
     * Otherwise, if there is no character with a code greater than
jaroslav@49
  2737
     * <code>'&#92;u0020'</code> in the string, then a new
jaroslav@49
  2738
     * <code>String</code> object representing an empty string is created
jaroslav@49
  2739
     * and returned.
jaroslav@49
  2740
     * <p>
jaroslav@49
  2741
     * Otherwise, let <i>k</i> be the index of the first character in the
jaroslav@49
  2742
     * string whose code is greater than <code>'&#92;u0020'</code>, and let
jaroslav@49
  2743
     * <i>m</i> be the index of the last character in the string whose code
jaroslav@49
  2744
     * is greater than <code>'&#92;u0020'</code>. A new <code>String</code>
jaroslav@49
  2745
     * object is created, representing the substring of this string that
jaroslav@49
  2746
     * begins with the character at index <i>k</i> and ends with the
jaroslav@49
  2747
     * character at index <i>m</i>&mdash;that is, the result of
jaroslav@49
  2748
     * <code>this.substring(<i>k</i>,&nbsp;<i>m</i>+1)</code>.
jaroslav@49
  2749
     * <p>
jaroslav@49
  2750
     * This method may be used to trim whitespace (as defined above) from
jaroslav@49
  2751
     * the beginning and end of a string.
jaroslav@49
  2752
     *
jaroslav@49
  2753
     * @return  A copy of this string with leading and trailing white
jaroslav@49
  2754
     *          space removed, or this string if it has no leading or
jaroslav@49
  2755
     *          trailing white space.
jaroslav@49
  2756
     */
jaroslav@49
  2757
    public String trim() {
jaroslav@241
  2758
        int len = length();
jaroslav@49
  2759
        int st = 0;
jaroslav@241
  2760
        int off = offset();      /* avoid getfield opcode */
jaroslav@241
  2761
        char[] val = toCharArray();    /* avoid getfield opcode */
jaroslav@49
  2762
jaroslav@49
  2763
        while ((st < len) && (val[off + st] <= ' ')) {
jaroslav@49
  2764
            st++;
jaroslav@49
  2765
        }
jaroslav@49
  2766
        while ((st < len) && (val[off + len - 1] <= ' ')) {
jaroslav@49
  2767
            len--;
jaroslav@49
  2768
        }
jaroslav@241
  2769
        return ((st > 0) || (len < length())) ? substring(st, len) : this;
jaroslav@49
  2770
    }
jaroslav@49
  2771
jaroslav@49
  2772
    /**
jaroslav@49
  2773
     * This object (which is already a string!) is itself returned.
jaroslav@49
  2774
     *
jaroslav@49
  2775
     * @return  the string itself.
jaroslav@49
  2776
     */
jaroslav@443
  2777
    @JavaScriptBody(args = {}, body = "return this.toString();")
jaroslav@49
  2778
    public String toString() {
jaroslav@49
  2779
        return this;
jaroslav@49
  2780
    }
jaroslav@49
  2781
jaroslav@49
  2782
    /**
jaroslav@49
  2783
     * Converts this string to a new character array.
jaroslav@49
  2784
     *
jaroslav@49
  2785
     * @return  a newly allocated character array whose length is the length
jaroslav@49
  2786
     *          of this string and whose contents are initialized to contain
jaroslav@49
  2787
     *          the character sequence represented by this string.
jaroslav@49
  2788
     */
jaroslav@49
  2789
    public char[] toCharArray() {
jaroslav@241
  2790
        char result[] = new char[length()];
jaroslav@241
  2791
        getChars(0, length(), result, 0);
jaroslav@49
  2792
        return result;
jaroslav@49
  2793
    }
jaroslav@49
  2794
jaroslav@49
  2795
    /**
jaroslav@49
  2796
     * Returns a formatted string using the specified format string and
jaroslav@49
  2797
     * arguments.
jaroslav@49
  2798
     *
jaroslav@49
  2799
     * <p> The locale always used is the one returned by {@link
jaroslav@49
  2800
     * java.util.Locale#getDefault() Locale.getDefault()}.
jaroslav@49
  2801
     *
jaroslav@49
  2802
     * @param  format
jaroslav@49
  2803
     *         A <a href="../util/Formatter.html#syntax">format string</a>
jaroslav@49
  2804
     *
jaroslav@49
  2805
     * @param  args
jaroslav@49
  2806
     *         Arguments referenced by the format specifiers in the format
jaroslav@49
  2807
     *         string.  If there are more arguments than format specifiers, the
jaroslav@49
  2808
     *         extra arguments are ignored.  The number of arguments is
jaroslav@49
  2809
     *         variable and may be zero.  The maximum number of arguments is
jaroslav@49
  2810
     *         limited by the maximum dimension of a Java array as defined by
jaroslav@49
  2811
     *         <cite>The Java&trade; Virtual Machine Specification</cite>.
jaroslav@49
  2812
     *         The behaviour on a
jaroslav@49
  2813
     *         <tt>null</tt> argument depends on the <a
jaroslav@49
  2814
     *         href="../util/Formatter.html#syntax">conversion</a>.
jaroslav@49
  2815
     *
jaroslav@49
  2816
     * @throws  IllegalFormatException
jaroslav@49
  2817
     *          If a format string contains an illegal syntax, a format
jaroslav@49
  2818
     *          specifier that is incompatible with the given arguments,
jaroslav@49
  2819
     *          insufficient arguments given the format string, or other
jaroslav@49
  2820
     *          illegal conditions.  For specification of all possible
jaroslav@49
  2821
     *          formatting errors, see the <a
jaroslav@49
  2822
     *          href="../util/Formatter.html#detail">Details</a> section of the
jaroslav@49
  2823
     *          formatter class specification.
jaroslav@49
  2824
     *
jaroslav@49
  2825
     * @throws  NullPointerException
jaroslav@49
  2826
     *          If the <tt>format</tt> is <tt>null</tt>
jaroslav@49
  2827
     *
jaroslav@49
  2828
     * @return  A formatted string
jaroslav@49
  2829
     *
jaroslav@49
  2830
     * @see  java.util.Formatter
jaroslav@49
  2831
     * @since  1.5
jaroslav@49
  2832
     */
jaroslav@49
  2833
    public static String format(String format, Object ... args) {
jaroslav@64
  2834
        throw new UnsupportedOperationException();
jaroslav@49
  2835
    }
jaroslav@49
  2836
jaroslav@49
  2837
    /**
jaroslav@49
  2838
     * Returns a formatted string using the specified locale, format string,
jaroslav@49
  2839
     * and arguments.
jaroslav@49
  2840
     *
jaroslav@49
  2841
     * @param  l
jaroslav@49
  2842
     *         The {@linkplain java.util.Locale locale} to apply during
jaroslav@49
  2843
     *         formatting.  If <tt>l</tt> is <tt>null</tt> then no localization
jaroslav@49
  2844
     *         is applied.
jaroslav@49
  2845
     *
jaroslav@49
  2846
     * @param  format
jaroslav@49
  2847
     *         A <a href="../util/Formatter.html#syntax">format string</a>
jaroslav@49
  2848
     *
jaroslav@49
  2849
     * @param  args
jaroslav@49
  2850
     *         Arguments referenced by the format specifiers in the format
jaroslav@49
  2851
     *         string.  If there are more arguments than format specifiers, the
jaroslav@49
  2852
     *         extra arguments are ignored.  The number of arguments is
jaroslav@49
  2853
     *         variable and may be zero.  The maximum number of arguments is
jaroslav@49
  2854
     *         limited by the maximum dimension of a Java array as defined by
jaroslav@49
  2855
     *         <cite>The Java&trade; Virtual Machine Specification</cite>.
jaroslav@49
  2856
     *         The behaviour on a
jaroslav@49
  2857
     *         <tt>null</tt> argument depends on the <a
jaroslav@49
  2858
     *         href="../util/Formatter.html#syntax">conversion</a>.
jaroslav@49
  2859
     *
jaroslav@49
  2860
     * @throws  IllegalFormatException
jaroslav@49
  2861
     *          If a format string contains an illegal syntax, a format
jaroslav@49
  2862
     *          specifier that is incompatible with the given arguments,
jaroslav@49
  2863
     *          insufficient arguments given the format string, or other
jaroslav@49
  2864
     *          illegal conditions.  For specification of all possible
jaroslav@49
  2865
     *          formatting errors, see the <a
jaroslav@49
  2866
     *          href="../util/Formatter.html#detail">Details</a> section of the
jaroslav@49
  2867
     *          formatter class specification
jaroslav@49
  2868
     *
jaroslav@49
  2869
     * @throws  NullPointerException
jaroslav@49
  2870
     *          If the <tt>format</tt> is <tt>null</tt>
jaroslav@49
  2871
     *
jaroslav@49
  2872
     * @return  A formatted string
jaroslav@49
  2873
     *
jaroslav@49
  2874
     * @see  java.util.Formatter
jaroslav@49
  2875
     * @since  1.5
jaroslav@49
  2876
     */
jaroslav@61
  2877
//    public static String format(Locale l, String format, Object ... args) {
jaroslav@61
  2878
//        return new Formatter(l).format(format, args).toString();
jaroslav@61
  2879
//    }
jaroslav@49
  2880
jaroslav@49
  2881
    /**
jaroslav@49
  2882
     * Returns the string representation of the <code>Object</code> argument.
jaroslav@49
  2883
     *
jaroslav@49
  2884
     * @param   obj   an <code>Object</code>.
jaroslav@49
  2885
     * @return  if the argument is <code>null</code>, then a string equal to
jaroslav@49
  2886
     *          <code>"null"</code>; otherwise, the value of
jaroslav@49
  2887
     *          <code>obj.toString()</code> is returned.
jaroslav@49
  2888
     * @see     java.lang.Object#toString()
jaroslav@49
  2889
     */
jaroslav@49
  2890
    public static String valueOf(Object obj) {
jaroslav@49
  2891
        return (obj == null) ? "null" : obj.toString();
jaroslav@49
  2892
    }
jaroslav@49
  2893
jaroslav@49
  2894
    /**
jaroslav@49
  2895
     * Returns the string representation of the <code>char</code> array
jaroslav@49
  2896
     * argument. The contents of the character array are copied; subsequent
jaroslav@49
  2897
     * modification of the character array does not affect the newly
jaroslav@49
  2898
     * created string.
jaroslav@49
  2899
     *
jaroslav@49
  2900
     * @param   data   a <code>char</code> array.
jaroslav@49
  2901
     * @return  a newly allocated string representing the same sequence of
jaroslav@49
  2902
     *          characters contained in the character array argument.
jaroslav@49
  2903
     */
jaroslav@49
  2904
    public static String valueOf(char data[]) {
jaroslav@49
  2905
        return new String(data);
jaroslav@49
  2906
    }
jaroslav@49
  2907
jaroslav@49
  2908
    /**
jaroslav@49
  2909
     * Returns the string representation of a specific subarray of the
jaroslav@49
  2910
     * <code>char</code> array argument.
jaroslav@49
  2911
     * <p>
jaroslav@49
  2912
     * The <code>offset</code> argument is the index of the first
jaroslav@49
  2913
     * character of the subarray. The <code>count</code> argument
jaroslav@49
  2914
     * specifies the length of the subarray. The contents of the subarray
jaroslav@49
  2915
     * are copied; subsequent modification of the character array does not
jaroslav@49
  2916
     * affect the newly created string.
jaroslav@49
  2917
     *
jaroslav@49
  2918
     * @param   data     the character array.
jaroslav@49
  2919
     * @param   offset   the initial offset into the value of the
jaroslav@49
  2920
     *                  <code>String</code>.
jaroslav@49
  2921
     * @param   count    the length of the value of the <code>String</code>.
jaroslav@49
  2922
     * @return  a string representing the sequence of characters contained
jaroslav@49
  2923
     *          in the subarray of the character array argument.
jaroslav@49
  2924
     * @exception IndexOutOfBoundsException if <code>offset</code> is
jaroslav@49
  2925
     *          negative, or <code>count</code> is negative, or
jaroslav@49
  2926
     *          <code>offset+count</code> is larger than
jaroslav@49
  2927
     *          <code>data.length</code>.
jaroslav@49
  2928
     */
jaroslav@49
  2929
    public static String valueOf(char data[], int offset, int count) {
jaroslav@49
  2930
        return new String(data, offset, count);
jaroslav@49
  2931
    }
jaroslav@49
  2932
jaroslav@49
  2933
    /**
jaroslav@49
  2934
     * Returns a String that represents the character sequence in the
jaroslav@49
  2935
     * array specified.
jaroslav@49
  2936
     *
jaroslav@49
  2937
     * @param   data     the character array.
jaroslav@49
  2938
     * @param   offset   initial offset of the subarray.
jaroslav@49
  2939
     * @param   count    length of the subarray.
jaroslav@49
  2940
     * @return  a <code>String</code> that contains the characters of the
jaroslav@49
  2941
     *          specified subarray of the character array.
jaroslav@49
  2942
     */
jaroslav@49
  2943
    public static String copyValueOf(char data[], int offset, int count) {
jaroslav@49
  2944
        // All public String constructors now copy the data.
jaroslav@49
  2945
        return new String(data, offset, count);
jaroslav@49
  2946
    }
jaroslav@49
  2947
jaroslav@49
  2948
    /**
jaroslav@49
  2949
     * Returns a String that represents the character sequence in the
jaroslav@49
  2950
     * array specified.
jaroslav@49
  2951
     *
jaroslav@49
  2952
     * @param   data   the character array.
jaroslav@49
  2953
     * @return  a <code>String</code> that contains the characters of the
jaroslav@49
  2954
     *          character array.
jaroslav@49
  2955
     */
jaroslav@49
  2956
    public static String copyValueOf(char data[]) {
jaroslav@49
  2957
        return copyValueOf(data, 0, data.length);
jaroslav@49
  2958
    }
jaroslav@49
  2959
jaroslav@49
  2960
    /**
jaroslav@49
  2961
     * Returns the string representation of the <code>boolean</code> argument.
jaroslav@49
  2962
     *
jaroslav@49
  2963
     * @param   b   a <code>boolean</code>.
jaroslav@49
  2964
     * @return  if the argument is <code>true</code>, a string equal to
jaroslav@49
  2965
     *          <code>"true"</code> is returned; otherwise, a string equal to
jaroslav@49
  2966
     *          <code>"false"</code> is returned.
jaroslav@49
  2967
     */
jaroslav@49
  2968
    public static String valueOf(boolean b) {
jaroslav@49
  2969
        return b ? "true" : "false";
jaroslav@49
  2970
    }
jaroslav@49
  2971
jaroslav@49
  2972
    /**
jaroslav@49
  2973
     * Returns the string representation of the <code>char</code>
jaroslav@49
  2974
     * argument.
jaroslav@49
  2975
     *
jaroslav@49
  2976
     * @param   c   a <code>char</code>.
jaroslav@49
  2977
     * @return  a string of length <code>1</code> containing
jaroslav@49
  2978
     *          as its single character the argument <code>c</code>.
jaroslav@49
  2979
     */
jaroslav@49
  2980
    public static String valueOf(char c) {
jaroslav@49
  2981
        char data[] = {c};
jaroslav@179
  2982
        return new String(data, 0, 1);
jaroslav@49
  2983
    }
jaroslav@49
  2984
jaroslav@49
  2985
    /**
jaroslav@49
  2986
     * Returns the string representation of the <code>int</code> argument.
jaroslav@49
  2987
     * <p>
jaroslav@49
  2988
     * The representation is exactly the one returned by the
jaroslav@49
  2989
     * <code>Integer.toString</code> method of one argument.
jaroslav@49
  2990
     *
jaroslav@49
  2991
     * @param   i   an <code>int</code>.
jaroslav@49
  2992
     * @return  a string representation of the <code>int</code> argument.
jaroslav@49
  2993
     * @see     java.lang.Integer#toString(int, int)
jaroslav@49
  2994
     */
jaroslav@49
  2995
    public static String valueOf(int i) {
jaroslav@49
  2996
        return Integer.toString(i);
jaroslav@49
  2997
    }
jaroslav@49
  2998
jaroslav@49
  2999
    /**
jaroslav@49
  3000
     * Returns the string representation of the <code>long</code> argument.
jaroslav@49
  3001
     * <p>
jaroslav@49
  3002
     * The representation is exactly the one returned by the
jaroslav@49
  3003
     * <code>Long.toString</code> method of one argument.
jaroslav@49
  3004
     *
jaroslav@49
  3005
     * @param   l   a <code>long</code>.
jaroslav@49
  3006
     * @return  a string representation of the <code>long</code> argument.
jaroslav@49
  3007
     * @see     java.lang.Long#toString(long)
jaroslav@49
  3008
     */
jaroslav@49
  3009
    public static String valueOf(long l) {
jaroslav@49
  3010
        return Long.toString(l);
jaroslav@49
  3011
    }
jaroslav@49
  3012
jaroslav@49
  3013
    /**
jaroslav@49
  3014
     * Returns the string representation of the <code>float</code> argument.
jaroslav@49
  3015
     * <p>
jaroslav@49
  3016
     * The representation is exactly the one returned by the
jaroslav@49
  3017
     * <code>Float.toString</code> method of one argument.
jaroslav@49
  3018
     *
jaroslav@49
  3019
     * @param   f   a <code>float</code>.
jaroslav@49
  3020
     * @return  a string representation of the <code>float</code> argument.
jaroslav@49
  3021
     * @see     java.lang.Float#toString(float)
jaroslav@49
  3022
     */
jaroslav@49
  3023
    public static String valueOf(float f) {
jaroslav@49
  3024
        return Float.toString(f);
jaroslav@49
  3025
    }
jaroslav@49
  3026
jaroslav@49
  3027
    /**
jaroslav@49
  3028
     * Returns the string representation of the <code>double</code> argument.
jaroslav@49
  3029
     * <p>
jaroslav@49
  3030
     * The representation is exactly the one returned by the
jaroslav@49
  3031
     * <code>Double.toString</code> method of one argument.
jaroslav@49
  3032
     *
jaroslav@49
  3033
     * @param   d   a <code>double</code>.
jaroslav@49
  3034
     * @return  a  string representation of the <code>double</code> argument.
jaroslav@49
  3035
     * @see     java.lang.Double#toString(double)
jaroslav@49
  3036
     */
jaroslav@49
  3037
    public static String valueOf(double d) {
jaroslav@49
  3038
        return Double.toString(d);
jaroslav@49
  3039
    }
jaroslav@49
  3040
jaroslav@49
  3041
    /**
jaroslav@49
  3042
     * Returns a canonical representation for the string object.
jaroslav@49
  3043
     * <p>
jaroslav@49
  3044
     * A pool of strings, initially empty, is maintained privately by the
jaroslav@49
  3045
     * class <code>String</code>.
jaroslav@49
  3046
     * <p>
jaroslav@49
  3047
     * When the intern method is invoked, if the pool already contains a
jaroslav@49
  3048
     * string equal to this <code>String</code> object as determined by
jaroslav@49
  3049
     * the {@link #equals(Object)} method, then the string from the pool is
jaroslav@49
  3050
     * returned. Otherwise, this <code>String</code> object is added to the
jaroslav@49
  3051
     * pool and a reference to this <code>String</code> object is returned.
jaroslav@49
  3052
     * <p>
jaroslav@49
  3053
     * It follows that for any two strings <code>s</code> and <code>t</code>,
jaroslav@49
  3054
     * <code>s.intern()&nbsp;==&nbsp;t.intern()</code> is <code>true</code>
jaroslav@49
  3055
     * if and only if <code>s.equals(t)</code> is <code>true</code>.
jaroslav@49
  3056
     * <p>
jaroslav@49
  3057
     * All literal strings and string-valued constant expressions are
jaroslav@49
  3058
     * interned. String literals are defined in section 3.10.5 of the
jaroslav@49
  3059
     * <cite>The Java&trade; Language Specification</cite>.
jaroslav@49
  3060
     *
jaroslav@49
  3061
     * @return  a string that has the same contents as this string, but is
jaroslav@49
  3062
     *          guaranteed to be from a pool of unique strings.
jaroslav@49
  3063
     */
jaroslav@49
  3064
    public native String intern(); // declared native: no Java body exists in this source file
jaroslav@608
  3065
    
jaroslav@608
  3066
    
jaroslav@608
  3067
    private static <T> T checkUTF8(T data, String charsetName)
jaroslav@608
  3068
        throws UnsupportedEncodingException {
jaroslav@608
  3069
        if (charsetName == null) {
jaroslav@608
  3070
            throw new NullPointerException("charsetName");
jaroslav@608
  3071
        }
jaroslav@608
  3072
        if (!charsetName.equalsIgnoreCase("UTF-8")
jaroslav@608
  3073
            && !charsetName.equalsIgnoreCase("UTF8")) {
jaroslav@608
  3074
            throw new UnsupportedEncodingException(charsetName);
jaroslav@608
  3075
        }
jaroslav@608
  3076
        return data;
jaroslav@608
  3077
    }
jaroslav@608
  3078
    
jaroslav@608
  3079
    private static int nextChar(byte[] arr, int[] index) throws IndexOutOfBoundsException {
jaroslav@608
  3080
        int c = arr[index[0]++] & 0xff;
jaroslav@608
  3081
        switch (c >> 4) {
jaroslav@608
  3082
            case 0:
jaroslav@608
  3083
            case 1:
jaroslav@608
  3084
            case 2:
jaroslav@608
  3085
            case 3:
jaroslav@608
  3086
            case 4:
jaroslav@608
  3087
            case 5:
jaroslav@608
  3088
            case 6:
jaroslav@608
  3089
            case 7:
jaroslav@608
  3090
                /* 0xxxxxxx*/
jaroslav@608
  3091
                return c;
jaroslav@608
  3092
            case 12:
jaroslav@608
  3093
            case 13: {
jaroslav@608
  3094
                /* 110x xxxx   10xx xxxx*/
jaroslav@608
  3095
                int char2 = (int) arr[index[0]++];
jaroslav@608
  3096
                if ((char2 & 0xC0) != 0x80) {
jaroslav@608
  3097
                    throw new IndexOutOfBoundsException("malformed input");
jaroslav@608
  3098
                }
jaroslav@608
  3099
                return (((c & 0x1F) << 6) | (char2 & 0x3F));
jaroslav@608
  3100
            }
jaroslav@608
  3101
            case 14: {
jaroslav@608
  3102
                /* 1110 xxxx  10xx xxxx  10xx xxxx */
jaroslav@608
  3103
                int char2 = arr[index[0]++];
jaroslav@608
  3104
                int char3 = arr[index[0]++];
jaroslav@608
  3105
                if (((char2 & 0xC0) != 0x80) || ((char3 & 0xC0) != 0x80)) {
jaroslav@608
  3106
                    throw new IndexOutOfBoundsException("malformed input");
jaroslav@608
  3107
                }
jaroslav@608
  3108
                return (((c & 0x0F) << 12)
jaroslav@608
  3109
                    | ((char2 & 0x3F) << 6)
jaroslav@608
  3110
                    | ((char3 & 0x3F) << 0));
jaroslav@608
  3111
            }
jaroslav@608
  3112
            default:
jaroslav@608
  3113
                /* 10xx xxxx,  1111 xxxx */
jaroslav@608
  3114
                throw new IndexOutOfBoundsException("malformed input");
jaroslav@608
  3115
        }
jaroslav@608
  3116
        
jaroslav@608
  3117
    }
jaroslav@49
  3118
}