Monitoring JavaMelody sur /demo

1 /*

2  * Copyright (c) 2003, 2018, Oracle and/or its affiliates. All rights reserved.

3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.

4  *

5  * This code is free software; you can redistribute it and/or modify it

6  * under the terms of the GNU General Public License version 2 only, as

7  * published by the Free Software Foundation.  Oracle designates this

8  * particular file as subject to the "Classpath" exception as provided

9  * by Oracle in the LICENSE file that accompanied this code.

10  *

11  * This code is distributed in the hope that it will be useful, but WITHOUT

12  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or

13  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License

14  * version 2 for more details (a copy is included in the LICENSE file that

15  * accompanied this code).

16  *

17  * You should have received a copy of the GNU General Public License version

18  * 2 along with this work; if not, write to the Free Software Foundation,

19  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.

20  *

21  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA

22  * or visit www.oracle.com if you need additional information or have any

23  * questions.

24  */

25 

26 package java.util;

27 

28 import java.io.*;

29 import java.math.*;

30 import java.nio.*;

31 import java.nio.channels.*;

32 import java.nio.charset.*;

33 import java.nio.file.Path;

34 import java.nio.file.Files;

35 import java.text.*;

36 import java.text.spi.NumberFormatProvider;

37 import java.util.function.Consumer;

38 import java.util.regex.*;

39 import java.util.stream.Stream;

40 import java.util.stream.StreamSupport;

41 import sun.util.locale.provider.LocaleProviderAdapter;

42 import sun.util.locale.provider.ResourceBundleBasedAdapter;

43 

44 /**

45  * A simple text scanner which can parse primitive types and strings using

46  * regular expressions.

47  *

48  * <p>A {@code Scanner} breaks its input into tokens using a

49  * delimiter pattern, which by default matches whitespace. The resulting

50  * tokens may then be converted into values of different types using the

51  * various {@code next} methods.

52  *

53  * <p>For example, this code allows a user to read a number from

54  * {@code System.in}:

55  * <blockquote><pre>{@code

56  *     Scanner sc = new Scanner(System.in);

57  *     int i = sc.nextInt();

58  * }</pre></blockquote>

59  *

60  * <p>As another example, this code allows {@code long} types to be

61  * assigned from entries in a file {@code myNumbers}:

62  * <blockquote><pre>{@code

63  *      Scanner sc = new Scanner(new File("myNumbers"));

64  *      while (sc.hasNextLong()) {

65  *          long aLong = sc.nextLong();

66  *      }

67  * }</pre></blockquote>

68  *

69  * <p>The scanner can also use delimiters other than whitespace. This

70  * example reads several items in from a string:

71  * <blockquote><pre>{@code

72  *     String input = "1 fish 2 fish red fish blue fish";

73  *     Scanner s = new Scanner(input).useDelimiter("\\s*fish\\s*");

74  *     System.out.println(s.nextInt());

75  *     System.out.println(s.nextInt());

76  *     System.out.println(s.next());

77  *     System.out.println(s.next());

78  *     s.close();

79  * }</pre></blockquote>

80  * <p>

81  * prints the following output:

82  * <blockquote><pre>{@code

83  *     1

84  *     2

85  *     red

86  *     blue

87  * }</pre></blockquote>

88  *

89  * <p>The same output can be generated with this code, which uses a regular

90  * expression to parse all four tokens at once:

91  * <blockquote><pre>{@code

92  *     String input = "1 fish 2 fish red fish blue fish";

93  *     Scanner s = new Scanner(input);

94  *     s.findInLine("(\\d+) fish (\\d+) fish (\\w+) fish (\\w+)");

95  *     MatchResult result = s.match();

96  *     for (int i=1; i<=result.groupCount(); i++)

97  *         System.out.println(result.group(i));

98  *     s.close();

99  * }</pre></blockquote>

100  *

101  * <p>The <a id="default-delimiter">default whitespace delimiter</a> used

102  * by a scanner is as recognized by {@link Character#isWhitespace(char)

103  * Character.isWhitespace()}. The {@link #reset reset()}

104  * method will reset the value of the scanner's delimiter to the default

105  * whitespace delimiter regardless of whether it was previously changed.

106  *

107  * <p>A scanning operation may block waiting for input.

108  *

109  * <p>The {@link #next} and {@link #hasNext} methods and their

110  * companion methods (such as {@link #nextInt} and

111  * {@link #hasNextInt}) first skip any input that matches the delimiter

112  * pattern, and then attempt to return the next token. Both {@code hasNext()}

113  * and {@code next()} methods may block waiting for further input.  Whether a

114  * {@code hasNext()} method blocks has no connection to whether or not its

115  * associated {@code next()} method will block. The {@link #tokens} method

116  * may also block waiting for input.

117  *

118  * <p>The {@link #findInLine findInLine()},

119  * {@link #findWithinHorizon findWithinHorizon()},

120  * {@link #skip skip()}, and {@link #findAll findAll()}

121  * methods operate independently of the delimiter pattern. These methods will

122  * attempt to match the specified pattern with no regard to delimiters in the

123  * input and thus can be used in special circumstances where delimiters are

124  * not relevant. These methods may block waiting for more input.

125  *

126  * <p>When a scanner throws an {@link InputMismatchException}, the scanner

127  * will not pass the token that caused the exception, so that it may be

128  * retrieved or skipped via some other method.

129  *

130  * <p>Depending upon the type of delimiting pattern, empty tokens may be

131  * returned. For example, the pattern {@code "\\s+"} will return no empty

132  * tokens since it matches multiple instances of the delimiter. The delimiting

133  * pattern {@code "\\s"} could return empty tokens since it only passes one

134  * space at a time.

135  *

136  * <p> A scanner can read text from any object which implements the {@link

137  * java.lang.Readable} interface.  If an invocation of the underlying

138  * readable's {@link java.lang.Readable#read read()} method throws an {@link

139  * java.io.IOException} then the scanner assumes that the end of the input

140  * has been reached.  The most recent {@code IOException} thrown by the

141  * underlying readable can be retrieved via the {@link #ioException} method.

142  *

143  * <p>When a {@code Scanner} is closed, it will close its input source

144  * if the source implements the {@link java.io.Closeable} interface.

145  *

146  * <p>A {@code Scanner} is not safe for multithreaded use without

147  * external synchronization.

148  *

149  * <p>Unless otherwise mentioned, passing a {@code null} parameter into

150  * any method of a {@code Scanner} will cause a

151  * {@code NullPointerException} to be thrown.

152  *

153  * <p>A scanner will default to interpreting numbers as decimal unless a

154  * different radix has been set by using the {@link #useRadix} method. The

155  * {@link #reset} method will reset the value of the scanner's radix to

156  * {@code 10} regardless of whether it was previously changed.

157  *

158  * <h3> <a id="localized-numbers">Localized numbers</a> </h3>

159  *

160  * <p> An instance of this class is capable of scanning numbers in the standard

161  * formats as well as in the formats of the scanner's locale. A scanner's

162  * <a id="initial-locale">initial locale </a>is the value returned by the {@link

163  * java.util.Locale#getDefault(Locale.Category)

164  * Locale.getDefault(Locale.Category.FORMAT)} method; it may be changed via the {@link

165  * #useLocale useLocale()} method. The {@link #reset} method will reset the value of the

166  * scanner's locale to the initial locale regardless of whether it was

167  * previously changed.

168  *

169  * <p>The localized formats are defined in terms of the following parameters,

170  * which for a particular locale are taken from that locale's {@link

171  * java.text.DecimalFormat DecimalFormat} object, {@code df}, and its

172  * {@link java.text.DecimalFormatSymbols DecimalFormatSymbols} object,

173  * {@code dfs}.

174  *

175  * <blockquote><dl>

176  *     <dt><i>LocalGroupSeparator&nbsp;&nbsp;</i>

177  *         <dd>The character used to separate thousands groups,

178  *         <i>i.e.,</i>&nbsp;{@code dfs.}{@link

179  *         java.text.DecimalFormatSymbols#getGroupingSeparator

180  *         getGroupingSeparator()}

181  *     <dt><i>LocalDecimalSeparator&nbsp;&nbsp;</i>

182  *         <dd>The character used for the decimal point,

183  *     <i>i.e.,</i>&nbsp;{@code dfs.}{@link

184  *     java.text.DecimalFormatSymbols#getDecimalSeparator

185  *     getDecimalSeparator()}

186  *     <dt><i>LocalPositivePrefix&nbsp;&nbsp;</i>

187  *         <dd>The string that appears before a positive number (may

188  *         be empty), <i>i.e.,</i>&nbsp;{@code df.}{@link

189  *         java.text.DecimalFormat#getPositivePrefix

190  *         getPositivePrefix()}

191  *     <dt><i>LocalPositiveSuffix&nbsp;&nbsp;</i>

192  *         <dd>The string that appears after a positive number (may be

193  *         empty), <i>i.e.,</i>&nbsp;{@code df.}{@link

194  *         java.text.DecimalFormat#getPositiveSuffix

195  *         getPositiveSuffix()}

196  *     <dt><i>LocalNegativePrefix&nbsp;&nbsp;</i>

197  *         <dd>The string that appears before a negative number (may

198  *         be empty), <i>i.e.,</i>&nbsp;{@code df.}{@link

199  *         java.text.DecimalFormat#getNegativePrefix

200  *         getNegativePrefix()}

201  *     <dt><i>LocalNegativeSuffix&nbsp;&nbsp;</i>

202  *         <dd>The string that appears after a negative number (may be

203  *         empty), <i>i.e.,</i>&nbsp;{@code df.}{@link

204  *     java.text.DecimalFormat#getNegativeSuffix

205  *     getNegativeSuffix()}

206  *     <dt><i>LocalNaN&nbsp;&nbsp;</i>

207  *         <dd>The string that represents not-a-number for

208  *         floating-point values,

209  *         <i>i.e.,</i>&nbsp;{@code dfs.}{@link

210  *         java.text.DecimalFormatSymbols#getNaN

211  *         getNaN()}

212  *     <dt><i>LocalInfinity&nbsp;&nbsp;</i>

213  *         <dd>The string that represents infinity for floating-point

214  *         values, <i>i.e.,</i>&nbsp;{@code dfs.}{@link

215  *         java.text.DecimalFormatSymbols#getInfinity

216  *         getInfinity()}

217  * </dl></blockquote>

218  *

219  * <h4> <a id="number-syntax">Number syntax</a> </h4>

220  *

221  * <p> The strings that can be parsed as numbers by an instance of this class

222  * are specified in terms of the following regular-expression grammar, where

223  * Rmax is the highest digit in the radix being used (for example, Rmax is 9 in base 10).

224  *

225  * <dl>

226  *   <dt><i>NonAsciiDigit</i>:

227  *       <dd>A non-ASCII character c for which

228  *            {@link java.lang.Character#isDigit Character.isDigit}{@code (c)}

229  *                        returns&nbsp;true

230  *

231  *   <dt><i>Non0Digit</i>:

232  *       <dd>{@code [1-}<i>Rmax</i>{@code ] | }<i>NonAsciiDigit</i>

233  *

234  *   <dt><i>Digit</i>:

235  *       <dd>{@code [0-}<i>Rmax</i>{@code ] | }<i>NonAsciiDigit</i>

236  *

237  *   <dt><i>GroupedNumeral</i>:

238  *       <dd><code>(&nbsp;</code><i>Non0Digit</i>

239  *                   <i>Digit</i>{@code ?

240  *                   }<i>Digit</i>{@code ?}

241  *       <dd>&nbsp;&nbsp;&nbsp;&nbsp;<code>(&nbsp;</code><i>LocalGroupSeparator</i>

242  *                         <i>Digit</i>

243  *                         <i>Digit</i>

244  *                         <i>Digit</i>{@code  )+ )}

245  *

246  *   <dt><i>Numeral</i>:

247  *       <dd>{@code ( ( }<i>Digit</i>{@code + )

248  *               | }<i>GroupedNumeral</i>{@code  )}

249  *

250  *   <dt><a id="Integer-regex"><i>Integer</i>:</a>

251  *       <dd>{@code ( [-+]? ( }<i>Numeral</i>{@code

252  *                               ) )}

253  *       <dd>{@code | }<i>LocalPositivePrefix</i> <i>Numeral</i>

254  *                      <i>LocalPositiveSuffix</i>

255  *       <dd>{@code | }<i>LocalNegativePrefix</i> <i>Numeral</i>

256  *                 <i>LocalNegativeSuffix</i>

257  *

258  *   <dt><i>DecimalNumeral</i>:

259  *       <dd><i>Numeral</i>

260  *       <dd>{@code | }<i>Numeral</i>

261  *                 <i>LocalDecimalSeparator</i>

262  *                 <i>Digit</i>{@code *}

263  *       <dd>{@code | }<i>LocalDecimalSeparator</i>

264  *                 <i>Digit</i>{@code +}

265  *

266  *   <dt><i>Exponent</i>:

267  *       <dd>{@code ( [eE] [+-]? }<i>Digit</i>{@code + )}

268  *

269  *   <dt><a id="Decimal-regex"><i>Decimal</i>:</a>

270  *       <dd>{@code ( [-+]? }<i>DecimalNumeral</i>

271  *                         <i>Exponent</i>{@code ? )}

272  *       <dd>{@code | }<i>LocalPositivePrefix</i>

273  *                 <i>DecimalNumeral</i>

274  *                 <i>LocalPositiveSuffix</i>

275  *                 <i>Exponent</i>{@code ?}

276  *       <dd>{@code | }<i>LocalNegativePrefix</i>

277  *                 <i>DecimalNumeral</i>

278  *                 <i>LocalNegativeSuffix</i>

279  *                 <i>Exponent</i>{@code ?}

280  *

281  *   <dt><i>HexFloat</i>:

282  *       <dd>{@code [-+]? 0[xX][0-9a-fA-F]*\.[0-9a-fA-F]+

283  *                 ([pP][-+]?[0-9]+)?}

284  *

285  *   <dt><i>NonNumber</i>:

286  *       <dd>{@code NaN

287  *                          | }<i>LocalNaN</i>{@code

288  *                          | Infinity

289  *                          | }<i>LocalInfinity</i>

290  *

291  *   <dt><i>SignedNonNumber</i>:

292  *       <dd>{@code ( [-+]? }<i>NonNumber</i>{@code  )}

293  *       <dd>{@code | }<i>LocalPositivePrefix</i>

294  *                 <i>NonNumber</i>

295  *                 <i>LocalPositiveSuffix</i>

296  *       <dd>{@code | }<i>LocalNegativePrefix</i>

297  *                 <i>NonNumber</i>

298  *                 <i>LocalNegativeSuffix</i>

299  *

300  *   <dt><a id="Float-regex"><i>Float</i></a>:

301  *       <dd><i>Decimal</i>

302  *           {@code | }<i>HexFloat</i>

303  *           {@code | }<i>SignedNonNumber</i>

304  *

305  * </dl>

306  * <p>Whitespace is not significant in the above regular expressions.

307  *

308  * @since   1.5

309  */

310 public final class Scanner implements Iterator<String>, Closeable {

311 

312     // Internal buffer used to hold input

313     private CharBuffer buf;

314 

315     // Size of internal character buffer

316     private static final int BUFFER_SIZE = 1024; // change to 1024;

317 

318     // The index into the buffer currently held by the Scanner

319     private int position;

320 

321     // Internal matcher used for finding delimiters

322     private Matcher matcher;

323 

324     // Pattern used to delimit tokens

325     private Pattern delimPattern;

326 

327     // Pattern found in last hasNext operation

328     private Pattern hasNextPattern;

329 

330     // Position after last hasNext operation

331     private int hasNextPosition;

332 

333     // Result after last hasNext operation

334     private String hasNextResult;

335 

336     // The input source

337     private Readable source;

338 

339     // Boolean is true if source is done

340     private boolean sourceClosed = false;

341 

342     // Boolean indicating more input is required

343     private boolean needInput = false;

344 

345     // Boolean indicating if a delim has been skipped this operation

346     private boolean skipped = false;

347 

348     // A store of a position that the scanner may fall back to

349     private int savedScannerPosition = -1;

350 

351     // A cache of the last primitive type scanned

352     private Object typeCache = null;

353 

354     // Boolean indicating if a match result is available

355     private boolean matchValid = false;

356 

357     // Boolean indicating if this scanner has been closed

358     private boolean closed = false;

359 

360     // The current radix used by this scanner

361     private int radix = 10;

362 

363     // The default radix for this scanner

364     private int defaultRadix = 10;

365 

366     // The locale used by this scanner

367     private Locale locale = null;

368 

369     // A cache of the last few recently used Patterns

370     private PatternLRUCache patternCache = new PatternLRUCache(7);

371 

372     // A holder of the last IOException encountered

373     private IOException lastException;

374 

375     // Number of times this scanner's state has been modified.

376     // Generally incremented on most public APIs and checked

377     // within spliterator implementations.

378     int modCount;

379 

380     // A pattern for java whitespace

381     private static Pattern WHITESPACE_PATTERN = Pattern.compile(

382                                                 "\\p{javaWhitespace}+");

383 

384     // A pattern for any token

385     private static Pattern FIND_ANY_PATTERN = Pattern.compile("(?s).*");

386 

387     // A pattern for non-ASCII digits

388     private static Pattern NON_ASCII_DIGIT = Pattern.compile(

389         "[\\p{javaDigit}&&[^0-9]]");

390 

391     // Fields and methods to support scanning primitive types

392 

393     /**

394      * Locale dependent values used to scan numbers

395      */

396     private String groupSeparator = "\\,";

397     private String decimalSeparator = "\\.";

398     private String nanString = "NaN";

399     private String infinityString = "Infinity";

400     private String positivePrefix = "";

401     private String negativePrefix = "\\-";

402     private String positiveSuffix = "";

403     private String negativeSuffix = "";

404 

405     /**

406      * Fields and an accessor method to match booleans

407      */

408     private static volatile Pattern boolPattern;

409     private static final String BOOLEAN_PATTERN = "true|false";

410     private static Pattern boolPattern() {

411         Pattern bp = boolPattern;

412         if (bp == null)

413             boolPattern = bp = Pattern.compile(BOOLEAN_PATTERN,

414                                           Pattern.CASE_INSENSITIVE);

415         return bp;

416     }

417 

418     /**

419      * Fields and methods to match bytes, shorts, ints, and longs

420      */

421     private Pattern integerPattern;

422     private String digits = "0123456789abcdefghijklmnopqrstuvwxyz";

423     private String non0Digit = "[\\p{javaDigit}&&[^0]]";

424     private int SIMPLE_GROUP_INDEX = 5;

425     private String buildIntegerPatternString() {

426         String radixDigits = digits.substring(0, radix);

427         // \\p{javaDigit} is not guaranteed to be appropriate

428         // here but what can we do? The final authority will be

429         // whatever parse method is invoked, so ultimately the

430         // Scanner will do the right thing

431         String digit = "((?i)["+radixDigits+"]|\\p{javaDigit})";

432         String groupedNumeral = "("+non0Digit+digit+"?"+digit+"?("+

433                                 groupSeparator+digit+digit+digit+")+)";

434         // digit++ is the possessive form which is necessary for reducing

435         // backtracking that would otherwise cause unacceptable performance

436         String numeral = "(("+ digit+"++)|"+groupedNumeral+")";

437         String javaStyleInteger = "([-+]?(" + numeral + "))";

438         String negativeInteger = negativePrefix + numeral + negativeSuffix;

439         String positiveInteger = positivePrefix + numeral + positiveSuffix;

440         return "("+ javaStyleInteger + ")|(" +

441             positiveInteger + ")|(" +

442             negativeInteger + ")";

443     }

444     private Pattern integerPattern() {

445         if (integerPattern == null) {

446             integerPattern = patternCache.forName(buildIntegerPatternString());

447         }

448         return integerPattern;

449     }

450 

451     /**

452      * Fields and an accessor method to match line separators

453      */

454     private static volatile Pattern separatorPattern;

455     private static volatile Pattern linePattern;

456     private static final String LINE_SEPARATOR_PATTERN =

457                                            "\r\n|[\n\r\u2028\u2029\u0085]";

458     private static final String LINE_PATTERN = ".*("+LINE_SEPARATOR_PATTERN+")|.+$";

459 

460     private static Pattern separatorPattern() {

461         Pattern sp = separatorPattern;

462         if (sp == null)

463             separatorPattern = sp = Pattern.compile(LINE_SEPARATOR_PATTERN);

464         return sp;

465     }

466 

467     private static Pattern linePattern() {

468         Pattern lp = linePattern;

469         if (lp == null)

470             linePattern = lp = Pattern.compile(LINE_PATTERN);

471         return lp;

472     }

473 

474     /**

475      * Fields and methods to match floats and doubles

476      */

477     private Pattern floatPattern;

478     private Pattern decimalPattern;

479     private void buildFloatAndDecimalPattern() {

480         // \\p{javaDigit} may not be perfect, see above

481         String digit = "([0-9]|(\\p{javaDigit}))";

482         String exponent = "([eE][+-]?"+digit+"+)?";

483         String groupedNumeral = "("+non0Digit+digit+"?"+digit+"?("+

484                                 groupSeparator+digit+digit+digit+")+)";

485         // Once again digit++ is used for performance, as above

486         String numeral = "(("+digit+"++)|"+groupedNumeral+")";

487         String decimalNumeral = "("+numeral+"|"+numeral +

488             decimalSeparator + digit + "*+|"+ decimalSeparator +

489             digit + "++)";

490         String nonNumber = "(NaN|"+nanString+"|Infinity|"+

491                                infinityString+")";

492         String positiveFloat = "(" + positivePrefix + decimalNumeral +

493                             positiveSuffix + exponent + ")";

494         String negativeFloat = "(" + negativePrefix + decimalNumeral +

495                             negativeSuffix + exponent + ")";

496         String decimal = "(([-+]?" + decimalNumeral + exponent + ")|"+

497             positiveFloat + "|" + negativeFloat + ")";

498         String hexFloat =

499             "[-+]?0[xX][0-9a-fA-F]*\\.[0-9a-fA-F]+([pP][-+]?[0-9]+)?";

500         String positiveNonNumber = "(" + positivePrefix + nonNumber +

501                             positiveSuffix + ")";

502         String negativeNonNumber = "(" + negativePrefix + nonNumber +

503                             negativeSuffix + ")";

504         String signedNonNumber = "(([-+]?"+nonNumber+")|" +

505                                  positiveNonNumber + "|" +

506                                  negativeNonNumber + ")";

507         floatPattern = Pattern.compile(decimal + "|" + hexFloat + "|" +

508                                        signedNonNumber);

509         decimalPattern = Pattern.compile(decimal);

510     }

511     private Pattern floatPattern() {

512         if (floatPattern == null) {

513             buildFloatAndDecimalPattern();

514         }

515         return floatPattern;

516     }

517     private Pattern decimalPattern() {

518         if (decimalPattern == null) {

519             buildFloatAndDecimalPattern();

520         }

521         return decimalPattern;

522     }

523 

524     // Constructors

525 

526     /**

527      * Constructs a {@code Scanner} that returns values scanned

528      * from the specified source delimited by the specified pattern.

529      *

530      * @param source A character source implementing the Readable interface

531      * @param pattern A delimiting pattern

532      */

533     private Scanner(Readable source, Pattern pattern) {

534         assert source != null : "source should not be null";

535         assert pattern != null : "pattern should not be null";

536         this.source = source;

537         delimPattern = pattern;

538         buf = CharBuffer.allocate(BUFFER_SIZE);

539         buf.limit(0);

540         matcher = delimPattern.matcher(buf);

541         matcher.useTransparentBounds(true);

542         matcher.useAnchoringBounds(false);

543         useLocale(Locale.getDefault(Locale.Category.FORMAT));

544     }

545 

/**
 * Constructs a new {@code Scanner} that produces values scanned
 * from the specified source, using the default whitespace delimiter.
 *
 * @param  source A character source implementing the {@link Readable}
 *         interface
 * @throws NullPointerException if {@code source} is {@code null}
 */
public Scanner(Readable source) {
    this(Objects.requireNonNull(source, "source"),
         WHITESPACE_PATTERN);
}

556 

/**
 * Constructs a new {@code Scanner} that produces values scanned
 * from the specified input stream. Bytes from the stream are converted
 * into characters using the underlying platform's
 * {@linkplain java.nio.charset.Charset#defaultCharset() default charset}.
 *
 * @param  source An input stream to be scanned
 * @throws NullPointerException if {@code source} is {@code null}
 */
public Scanner(InputStream source) {
    // Reject null explicitly and by name, as Scanner(InputStream, Charset)
    // does, instead of relying on InputStreamReader to fail.
    this(new InputStreamReader(Objects.requireNonNull(source, "source")),
         WHITESPACE_PATTERN);
}

568 

/**
 * Constructs a new {@code Scanner} that produces values scanned
 * from the specified input stream, decoding its bytes with the
 * charset named by {@code charsetName}.
 *
 * @param  source An input stream to be scanned
 * @param  charsetName The encoding type used to convert bytes from the
 *         stream into characters to be scanned
 * @throws IllegalArgumentException if the specified character set
 *         does not exist
 */
public Scanner(InputStream source, String charsetName) {
    // The name is resolved to a Charset before delegating.
    this(source,
         toCharset(charsetName));
}

583 

/**
 * Constructs a new {@code Scanner} that produces values scanned
 * from the specified input stream, decoding its bytes with the
 * specified charset.
 *
 * @param  source an input stream to be scanned
 * @param  charset the charset used to convert bytes from the stream
 *         into characters to be scanned
 * @since  10
 */
public Scanner(InputStream source, Charset charset) {
    // source is null-checked here; charset is null-checked inside makeReadable.
    this(makeReadable(Objects.requireNonNull(source, "source"), charset), WHITESPACE_PATTERN);
}

598 

599     /**

600      * Returns a charset object for the given charset name.

601      * @throws NullPointerException          is csn is null

602      * @throws IllegalArgumentException      if the charset is not supported

603      */

604     private static Charset toCharset(String csn) {

605         Objects.requireNonNull(csn, "charsetName");

606         try {

607             return Charset.forName(csn);

608         } catch (IllegalCharsetNameException|UnsupportedCharsetException e) {

609             // IllegalArgumentException should be thrown

610             throw new IllegalArgumentException(e);

611         }

612     }

613 

614     /*

615      * This method is added so that null-check on charset can be performed before

616      * creating InputStream as an existing test required it.

617     */

618     private static Readable makeReadable(Path source, Charset charset)

619             throws IOException {

620         Objects.requireNonNull(charset, "charset");

621         return makeReadable(Files.newInputStream(source), charset);

622     }

623 

624     private static Readable makeReadable(InputStream source, Charset charset) {

625         Objects.requireNonNull(charset, "charset");

626         return new InputStreamReader(source, charset);

627     }

628 

/**
 * Constructs a new {@code Scanner} that produces values scanned
 * from the specified file. Bytes from the file are converted into
 * characters using the underlying platform's
 * {@linkplain java.nio.charset.Charset#defaultCharset() default charset}.
 *
 * @param  source A file to be scanned
 * @throws FileNotFoundException if source is not found
 */
public Scanner(File source) throws FileNotFoundException {
    // The file is opened as a stream and scanned through its channel.
    this((ReadableByteChannel) new FileInputStream(source).getChannel());
}

641 

/**
 * Constructs a new {@code Scanner} that produces values scanned
 * from the specified file, decoding its bytes with the charset named
 * by {@code charsetName}.
 *
 * @param  source A file to be scanned
 * @param  charsetName The encoding type used to convert bytes from the file
 *         into characters to be scanned
 * @throws FileNotFoundException if source is not found
 * @throws IllegalArgumentException if the specified encoding is
 *         not found
 */
public Scanner(File source, String charsetName) throws FileNotFoundException {
    // source is null-checked first, then the charset name is resolved to a decoder.
    this(Objects.requireNonNull(source),
         toDecoder(charsetName));
}

659 

/**
 * Constructs a new {@code Scanner} that produces values scanned
 * from the specified file. Bytes from the file are converted into
 * characters using the specified charset.
 *
 * @param  source A file to be scanned
 * @param  charset The charset used to convert bytes from the file
 *         into characters to be scanned
 * @throws IOException
 *         if an I/O error occurs opening the source
 * @throws NullPointerException
 *         if {@code source} or {@code charset} is {@code null}
 * @since  10
 */
public Scanner(File source, Charset charset) throws IOException {
    // Both arguments are null-checked by name, source first, so a null
    // charset no longer fails with an anonymous NPE from newDecoder().
    this(Objects.requireNonNull(source, "source"),
         Objects.requireNonNull(charset, "charset").newDecoder());
}

675 

/*
 * Opens the file as a stream and scans its channel, decoding bytes
 * with the supplied decoder.
 */
private Scanner(File source, CharsetDecoder dec) throws FileNotFoundException {
    this(makeReadable(
            (ReadableByteChannel) new FileInputStream(source).getChannel(),
            dec));
}

681 

682     private static CharsetDecoder toDecoder(String charsetName) {

683         Objects.requireNonNull(charsetName, "charsetName");

684         try {

685             return Charset.forName(charsetName).newDecoder();

686         } catch (IllegalCharsetNameException|UnsupportedCharsetException unused) {

687             throw new IllegalArgumentException(charsetName);

688         }

689     }

690 

691     private static Readable makeReadable(ReadableByteChannel source,

692                                          CharsetDecoder dec) {

693         return Channels.newReader(source, dec, -1);

694     }

695 

696     private static Readable makeReadable(ReadableByteChannel source,

697                                          Charset charset) {

698         Objects.requireNonNull(charset, "charset");

699         return Channels.newReader(source, charset);

700     }

701 

/**
 * Constructs a new {@code Scanner} that produces values scanned
 * from the specified file. Bytes from the file are converted into
 * characters using the underlying platform's
 * {@linkplain java.nio.charset.Charset#defaultCharset() default charset}.
 *
 * @param   source
 *          the path to the file to be scanned
 * @throws  IOException
 *          if an I/O error occurs opening source
 *
 * @since   1.7
 */
public Scanner(Path source) throws IOException {
    // Opens the file and delegates to the InputStream constructor.
    this(Files.newInputStream(source));
}

720 

/**
 * Creates a {@code Scanner} whose input is the content of the given file,
 * decoding the file's bytes with the charset named by
 * {@code charsetName}.
 *
 * @param   source
 *          the path to the file to be scanned
 * @param   charsetName
 *          the name of the encoding used to convert bytes from the file
 *          into characters to be scanned
 * @throws  IOException
 *          if an I/O error occurs opening source
 * @throws  IllegalArgumentException
 *          if the specified encoding is not found
 * @since   1.7
 */
public Scanner(Path source, String charsetName)
    throws IOException
{
    this(Objects.requireNonNull(source), toCharset(charsetName));
}

740 

/**
 * Creates a {@code Scanner} whose input is the content of the given file,
 * decoding the file's bytes with the given charset.
 *
 * @param   source
 *          the path to the file to be scanned
 * @param   charset
 *          the charset used to convert bytes from the file
 *          into characters to be scanned
 * @throws  IOException
 *          if an I/O error occurs opening the source
 * @since   10
 */
public Scanner(Path source, Charset charset)
    throws IOException
{
    this(makeReadable(source, charset));
}

758 

/**
 * Creates a {@code Scanner} that reads its input from the characters of
 * the given string.
 *
 * @param  source the string to scan
 */
public Scanner(String source) {
    this(new StringReader(source),
         WHITESPACE_PATTERN);
}

768 

/**
 * Creates a {@code Scanner} that reads its input from the given channel.
 * The channel's bytes are decoded with the platform's
 * {@linkplain java.nio.charset.Charset#defaultCharset() default charset}.
 *
 * @param  source the channel to scan
 */
public Scanner(ReadableByteChannel source) {
    this(makeReadable(Objects.requireNonNull(source, "source")), WHITESPACE_PATTERN);
}

781 

782     private static Readable makeReadable(ReadableByteChannel source) {

783         return makeReadable(source, Charset.defaultCharset().newDecoder());

784     }

785 

/**
 * Creates a {@code Scanner} that reads its input from the given channel,
 * decoding the channel's bytes with the charset named by
 * {@code charsetName}.
 *
 * @param  source the channel to scan
 * @param  charsetName the name of the encoding used to convert bytes from
 *         the channel into characters to be scanned
 * @throws IllegalArgumentException if the specified character set
 *         does not exist
 */
public Scanner(ReadableByteChannel source, String charsetName) {
    this(makeReadable(Objects.requireNonNull(source, "source"),
                      toDecoder(charsetName)),
         WHITESPACE_PATTERN);
}

801 

/**
 * Creates a {@code Scanner} that reads its input from the given channel,
 * decoding the channel's bytes with the given charset.
 *
 * @param source the channel to scan
 * @param charset the charset used to convert bytes from the
 *        channel into characters to be scanned
 * @since 10
 */
public Scanner(ReadableByteChannel source, Charset charset) {
    this(makeReadable(Objects.requireNonNull(source, "source"),
                      charset),
         WHITESPACE_PATTERN);
}

816 

817     // Private primitives used to support scanning

818 

819     private void saveState() {

820         savedScannerPosition = position;

821     }

822 

823     private void revertState() {

824         this.position = savedScannerPosition;

825         savedScannerPosition = -1;

826         skipped = false;

827     }

828 

829     private boolean revertState(boolean b) {

830         this.position = savedScannerPosition;

831         savedScannerPosition = -1;

832         skipped = false;

833         return b;

834     }

835 

836     private void cacheResult() {

837         hasNextResult = matcher.group();

838         hasNextPosition = matcher.end();

839         hasNextPattern = matcher.pattern();

840     }

841 

842     private void cacheResult(String result) {

843         hasNextResult = result;

844         hasNextPosition = matcher.end();

845         hasNextPattern = matcher.pattern();

846     }

847 

848     // Clears both regular cache and type cache

849     private void clearCaches() {

850         hasNextPattern = null;

851         typeCache = null;

852     }

853 

854     // Also clears both the regular cache and the type cache

855     private String getCachedResult() {

856         position = hasNextPosition;

857         hasNextPattern = null;

858         typeCache = null;

859         return hasNextResult;

860     }

861 

862     // Also clears both the regular cache and the type cache

863     private void useTypeCache() {

864         if (closed)

865             throw new IllegalStateException("Scanner closed");

866         position = hasNextPosition;

867         hasNextPattern = null;

868         typeCache = null;

869     }

870 

871     // Tries to read more input. May block.

872     private void readInput() {

873         if (buf.limit() == buf.capacity())

874             makeSpace();

875         // Prepare to receive data

876         int p = buf.position();

877         buf.position(buf.limit());

878         buf.limit(buf.capacity());

879 

880         int n = 0;

881         try {

882             n = source.read(buf);

883         } catch (IOException ioe) {

884             lastException = ioe;

885             n = -1;

886         }

887         if (n == -1) {

888             sourceClosed = true;

889             needInput = false;

890         }

891         if (n > 0)

892             needInput = false;

893         // Restore current position and limit for reading

894         buf.limit(buf.position());

895         buf.position(p);

896     }

897 

898     // After this method is called there will either be an exception

899     // or else there will be space in the buffer

900     private boolean makeSpace() {

901         clearCaches();

902         int offset = savedScannerPosition == -1 ?

903             position : savedScannerPosition;

904         buf.position(offset);

905         // Gain space by compacting buffer

906         if (offset > 0) {

907             buf.compact();

908             translateSavedIndexes(offset);

909             position -= offset;

910             buf.flip();

911             return true;

912         }

913         // Gain space by growing buffer

914         int newSize = buf.capacity() * 2;

915         CharBuffer newBuf = CharBuffer.allocate(newSize);

916         newBuf.put(buf);

917         newBuf.flip();

918         translateSavedIndexes(offset);

919         position -= offset;

920         buf = newBuf;

921         matcher.reset(buf);

922         return true;

923     }

924 

925     // When a buffer compaction/reallocation occurs the saved indexes must

926     // be modified appropriately

927     private void translateSavedIndexes(int offset) {

928         if (savedScannerPosition != -1)

929             savedScannerPosition -= offset;

930     }

931 

932     // If we are at the end of input then NoSuchElement;

933     // If there is still input left then InputMismatch

934     private void throwFor() {

935         skipped = false;

936         if ((sourceClosed) && (position == buf.limit()))

937             throw new NoSuchElementException();

938         else

939             throw new InputMismatchException();

940     }

941 

942     // Returns true if a complete token or partial token is in the buffer.

943     // It is not necessary to find a complete token since a partial token

944     // means that there will be another token with or without more input.

945     private boolean hasTokenInBuffer() {

946         matchValid = false;

947         matcher.usePattern(delimPattern);

948         matcher.region(position, buf.limit());

949         // Skip delims first

950         if (matcher.lookingAt()) {

951             if (matcher.hitEnd() && !sourceClosed) {

952                 // more input might change the match of delims, in which

953                 // might change whether or not if there is token left in

954                 // buffer (don't update the "position" in this case)

955                 needInput = true;

956                 return false;

957             }

958             position = matcher.end();

959         }

960         // If we are sitting at the end, no more tokens in buffer

961         if (position == buf.limit())

962             return false;

963         return true;

964     }

965 

966     /*

967      * Returns a "complete token" that matches the specified pattern

968      *

969      * A token is complete if surrounded by delims; a partial token

970      * is prefixed by delims but not postfixed by them

971      *

972      * The position is advanced to the end of that complete token

973      *

974      * Pattern == null means accept any token at all

975      *

976      * Triple return:

977      * 1. valid string means it was found

978      * 2. null with needInput=false means we won't ever find it

979      * 3. null with needInput=true means try again after readInput

980      */

981     private String getCompleteTokenInBuffer(Pattern pattern) {

982         matchValid = false;

983         // Skip delims first

984         matcher.usePattern(delimPattern);

985         if (!skipped) { // Enforcing only one skip of leading delims

986             matcher.region(position, buf.limit());

987             if (matcher.lookingAt()) {

988                 // If more input could extend the delimiters then we must wait

989                 // for more input

990                 if (matcher.hitEnd() && !sourceClosed) {

991                     needInput = true;

992                     return null;

993                 }

994                 // The delims were whole and the matcher should skip them

995                 skipped = true;

996                 position = matcher.end();

997             }

998         }

999 

1000         // If we are sitting at the end, no more tokens in buffer

1001         if (position == buf.limit()) {

1002             if (sourceClosed)

1003                 return null;

1004             needInput = true;

1005             return null;

1006         }

1007         // Must look for next delims. Simply attempting to match the

1008         // pattern at this point may find a match but it might not be

1009         // the first longest match because of missing input, or it might

1010         // match a partial token instead of the whole thing.

1011 

1012         // Then look for next delims

1013         matcher.region(position, buf.limit());

1014         boolean foundNextDelim = matcher.find();

1015         if (foundNextDelim && (matcher.end() == position)) {

1016             // Zero length delimiter match; we should find the next one

1017             // using the automatic advance past a zero length match;

1018             // Otherwise we have just found the same one we just skipped

1019             foundNextDelim = matcher.find();

1020         }

1021         if (foundNextDelim) {

1022             // In the rare case that more input could cause the match

1023             // to be lost and there is more input coming we must wait

1024             // for more input. Note that hitting the end is okay as long

1025             // as the match cannot go away. It is the beginning of the

1026             // next delims we want to be sure about, we don't care if

1027             // they potentially extend further.

1028             if (matcher.requireEnd() && !sourceClosed) {

1029                 needInput = true;

1030                 return null;

1031             }

1032             int tokenEnd = matcher.start();

1033             // There is a complete token.

1034             if (pattern == null) {

1035                 // Must continue with match to provide valid MatchResult

1036                 pattern = FIND_ANY_PATTERN;

1037             }

1038             //  Attempt to match against the desired pattern

1039             matcher.usePattern(pattern);

1040             matcher.region(position, tokenEnd);

1041             if (matcher.matches()) {

1042                 String s = matcher.group();

1043                 position = matcher.end();

1044                 return s;

1045             } else { // Complete token but it does not match

1046                 return null;

1047             }

1048         }

1049 

1050         // If we can't find the next delims but no more input is coming,

1051         // then we can treat the remainder as a whole token

1052         if (sourceClosed) {

1053             if (pattern == null) {

1054                 // Must continue with match to provide valid MatchResult

1055                 pattern = FIND_ANY_PATTERN;

1056             }

1057             // Last token; Match the pattern here or throw

1058             matcher.usePattern(pattern);

1059             matcher.region(position, buf.limit());

1060             if (matcher.matches()) {

1061                 String s = matcher.group();

1062                 position = matcher.end();

1063                 return s;

1064             }

1065             // Last piece does not match

1066             return null;

1067         }

1068 

1069         // There is a partial token in the buffer; must read more

1070         // to complete it

1071         needInput = true;

1072         return null;

1073     }

1074 

1075     // Finds the specified pattern in the buffer up to horizon.

1076     // Returns true if the specified input pattern was matched,

1077     // and leaves the matcher field with the current match state.

1078     private boolean findPatternInBuffer(Pattern pattern, int horizon) {

1079         matchValid = false;

1080         matcher.usePattern(pattern);

1081         int bufferLimit = buf.limit();

1082         int horizonLimit = -1;

1083         int searchLimit = bufferLimit;

1084         if (horizon > 0) {

1085             horizonLimit = position + horizon;

1086             if (horizonLimit < bufferLimit)

1087                 searchLimit = horizonLimit;

1088         }

1089         matcher.region(position, searchLimit);

1090         if (matcher.find()) {

1091             if (matcher.hitEnd() && (!sourceClosed)) {

1092                 // The match may be longer if didn't hit horizon or real end

1093                 if (searchLimit != horizonLimit) {

1094                      // Hit an artificial end; try to extend the match

1095                     needInput = true;

1096                     return false;

1097                 }

1098                 // The match could go away depending on what is next

1099                 if ((searchLimit == horizonLimit) && matcher.requireEnd()) {

1100                     // Rare case: we hit the end of input and it happens

1101                     // that it is at the horizon and the end of input is

1102                     // required for the match.

1103                     needInput = true;

1104                     return false;

1105                 }

1106             }

1107             // Did not hit end, or hit real end, or hit horizon

1108             position = matcher.end();

1109             return true;

1110         }

1111 

1112         if (sourceClosed)

1113             return false;

1114 

1115         // If there is no specified horizon, or if we have not searched

1116         // to the specified horizon yet, get more input

1117         if ((horizon == 0) || (searchLimit != horizonLimit))

1118             needInput = true;

1119         return false;

1120     }

1121 

1122     // Attempts to match a pattern anchored at the current position.

1123     // Returns true if the specified input pattern was matched,

1124     // and leaves the matcher field with the current match state.

1125     private boolean matchPatternInBuffer(Pattern pattern) {

1126         matchValid = false;

1127         matcher.usePattern(pattern);

1128         matcher.region(position, buf.limit());

1129         if (matcher.lookingAt()) {

1130             if (matcher.hitEnd() && (!sourceClosed)) {

1131                 // Get more input and try again

1132                 needInput = true;

1133                 return false;

1134             }

1135             position = matcher.end();

1136             return true;

1137         }

1138 

1139         if (sourceClosed)

1140             return false;

1141 

1142         // Read more to find pattern

1143         needInput = true;

1144         return false;

1145     }

1146 

1147     // Throws if the scanner is closed

1148     private void ensureOpen() {

1149         if (closed)

1150             throw new IllegalStateException("Scanner closed");

1151     }

1152 

1153     // Public methods

1154 

1155     /**

1156      * Closes this scanner.

1157      *

1158      * <p> If this scanner has not yet been closed then if its underlying

1159      * {@linkplain java.lang.Readable readable} also implements the {@link

1160      * java.io.Closeable} interface then the readable's {@code close} method

1161      * will be invoked.  If this scanner is already closed then invoking this

1162      * method will have no effect.

1163      *

1164      * <p>Attempting to perform search operations after a scanner has

1165      * been closed will result in an {@link IllegalStateException}.

1166      *

1167      */

1168     public void close() {

1169         if (closed)

1170             return;

1171         if (source instanceof Closeable) {

1172             try {

1173                 ((Closeable)source).close();

1174             } catch (IOException ioe) {

1175                 lastException = ioe;

1176             }

1177         }

1178         sourceClosed = true;

1179         source = null;

1180         closed = true;

1181     }

1182 

1183     /**

1184      * Returns the {@code IOException} last thrown by this

1185      * {@code Scanner}'s underlying {@code Readable}. This method

1186      * returns {@code null} if no such exception exists.

1187      *

1188      * @return the last exception thrown by this scanner's readable

1189      */

1190     public IOException ioException() {

1191         return lastException;

1192     }

1193 

1194     /**

1195      * Returns the {@code Pattern} this {@code Scanner} is currently

1196      * using to match delimiters.

1197      *

1198      * @return this scanner's delimiting pattern.

1199      */

1200     public Pattern delimiter() {

1201         return delimPattern;

1202     }

1203 

1204     /**

1205      * Sets this scanner's delimiting pattern to the specified pattern.

1206      *

1207      * @param pattern A delimiting pattern

1208      * @return this scanner

1209      */

1210     public Scanner useDelimiter(Pattern pattern) {

1211         modCount++;

1212         delimPattern = pattern;

1213         return this;

1214     }

1215 

1216     /**

1217      * Sets this scanner's delimiting pattern to a pattern constructed from

1218      * the specified {@code String}.

1219      *

1220      * <p> An invocation of this method of the form

1221      * {@code useDelimiter(pattern)} behaves in exactly the same way as the

1222      * invocation {@code useDelimiter(Pattern.compile(pattern))}.

1223      *

1224      * <p> Invoking the {@link #reset} method will set the scanner's delimiter

1225      * to the <a href= "#default-delimiter">default</a>.

1226      *

1227      * @param pattern A string specifying a delimiting pattern

1228      * @return this scanner

1229      */

1230     public Scanner useDelimiter(String pattern) {

1231         modCount++;

1232         delimPattern = patternCache.forName(pattern);

1233         return this;

1234     }

1235 

1236     /**

1237      * Returns this scanner's locale.

1238      *

1239      * <p>A scanner's locale affects many elements of its default

1240      * primitive matching regular expressions; see

1241      * <a href= "#localized-numbers">localized numbers</a> above.

1242      *

1243      * @return this scanner's locale

1244      */

1245     public Locale locale() {

1246         return this.locale;

1247     }

1248 

1249     /**

1250      * Sets this scanner's locale to the specified locale.

1251      *

1252      * <p>A scanner's locale affects many elements of its default

1253      * primitive matching regular expressions; see

1254      * <a href= "#localized-numbers">localized numbers</a> above.

1255      *

1256      * <p>Invoking the {@link #reset} method will set the scanner's locale to

1257      * the <a href= "#initial-locale">initial locale</a>.

1258      *

1259      * @param locale A string specifying the locale to use

1260      * @return this scanner

1261      */

1262     public Scanner useLocale(Locale locale) {

1263         if (locale.equals(this.locale))

1264             return this;

1265 

1266         modCount++;

1267         this.locale = locale;

1268 

1269         DecimalFormat df = null;

1270         NumberFormat nf = NumberFormat.getNumberInstance(locale);

1271         DecimalFormatSymbols dfs = DecimalFormatSymbols.getInstance(locale);

1272         if (nf instanceof DecimalFormat) {

1273              df = (DecimalFormat) nf;

1274         } else {

1275 

1276             // In case where NumberFormat.getNumberInstance() returns

1277             // other instance (non DecimalFormat) based on the provider

1278             // used and java.text.spi.NumberFormatProvider implementations,

1279             // DecimalFormat constructor is used to obtain the instance

1280             LocaleProviderAdapter adapter = LocaleProviderAdapter

1281                     .getAdapter(NumberFormatProvider.class, locale);

1282             if (!(adapter instanceof ResourceBundleBasedAdapter)) {

1283                 adapter = LocaleProviderAdapter.getResourceBundleBased();

1284             }

1285             String[] all = adapter.getLocaleResources(locale)

1286                     .getNumberPatterns();

1287             df = new DecimalFormat(all[0], dfs);

1288         }

1289 

1290         // These must be literalized to avoid collision with regex

1291         // metacharacters such as dot or parenthesis

1292         groupSeparator =   "\\" + dfs.getGroupingSeparator();

1293         decimalSeparator = "\\" + dfs.getDecimalSeparator();

1294 

1295         // Quoting the nonzero length locale-specific things

1296         // to avoid potential conflict with metacharacters

1297         nanString = "\\Q" + dfs.getNaN() + "\\E";

1298         infinityString = "\\Q" + dfs.getInfinity() + "\\E";

1299         positivePrefix = df.getPositivePrefix();

1300         if (!positivePrefix.isEmpty())

1301             positivePrefix = "\\Q" + positivePrefix + "\\E";

1302         negativePrefix = df.getNegativePrefix();

1303         if (!negativePrefix.isEmpty())

1304             negativePrefix = "\\Q" + negativePrefix + "\\E";

1305         positiveSuffix = df.getPositiveSuffix();

1306         if (!positiveSuffix.isEmpty())

1307             positiveSuffix = "\\Q" + positiveSuffix + "\\E";

1308         negativeSuffix = df.getNegativeSuffix();

1309         if (!negativeSuffix.isEmpty())

1310             negativeSuffix = "\\Q" + negativeSuffix + "\\E";

1311 

1312         // Force rebuilding and recompilation of locale dependent

1313         // primitive patterns

1314         integerPattern = null;

1315         floatPattern = null;

1316 

1317         return this;

1318     }

1319 

1320     /**

1321      * Returns this scanner's default radix.

1322      *

1323      * <p>A scanner's radix affects elements of its default

1324      * number matching regular expressions; see

1325      * <a href= "#localized-numbers">localized numbers</a> above.

1326      *

1327      * @return the default radix of this scanner

1328      */

1329     public int radix() {

1330         return this.defaultRadix;

1331     }

1332 

1333     /**

1334      * Sets this scanner's default radix to the specified radix.

1335      *

1336      * <p>A scanner's radix affects elements of its default

1337      * number matching regular expressions; see

1338      * <a href= "#localized-numbers">localized numbers</a> above.

1339      *

1340      * <p>If the radix is less than {@link Character#MIN_RADIX Character.MIN_RADIX}

1341      * or greater than {@link Character#MAX_RADIX Character.MAX_RADIX}, then an

1342      * {@code IllegalArgumentException} is thrown.

1343      *

1344      * <p>Invoking the {@link #reset} method will set the scanner's radix to

1345      * {@code 10}.

1346      *

1347      * @param radix The radix to use when scanning numbers

1348      * @return this scanner

1349      * @throws IllegalArgumentException if radix is out of range

1350      */

1351     public Scanner useRadix(int radix) {

1352         if ((radix < Character.MIN_RADIX) || (radix > Character.MAX_RADIX))

1353             throw new IllegalArgumentException("radix:"+radix);

1354 

1355         if (this.defaultRadix == radix)

1356             return this;

1357         modCount++;

1358         this.defaultRadix = radix;

1359         // Force rebuilding and recompilation of radix dependent patterns

1360         integerPattern = null;

1361         return this;

1362     }

1363 

1364     // The next operation should occur in the specified radix but

1365     // the default is left untouched.

1366     private void setRadix(int radix) {

1367         if ((radix < Character.MIN_RADIX) || (radix > Character.MAX_RADIX))

1368             throw new IllegalArgumentException("radix:"+radix);

1369 

1370         if (this.radix != radix) {

1371             // Force rebuilding and recompilation of radix dependent patterns

1372             integerPattern = null;

1373             this.radix = radix;

1374         }

1375     }

1376 

1377     /**

1378      * Returns the match result of the last scanning operation performed

1379      * by this scanner. This method throws {@code IllegalStateException}

1380      * if no match has been performed, or if the last match was

1381      * not successful.

1382      *

1383      * <p>The various {@code next} methods of {@code Scanner}

1384      * make a match result available if they complete without throwing an

1385      * exception. For instance, after an invocation of the {@link #nextInt}

1386      * method that returned an int, this method returns a

1387      * {@code MatchResult} for the search of the

1388      * <a href="#Integer-regex"><i>Integer</i></a> regular expression

1389      * defined above. Similarly the {@link #findInLine findInLine()},

1390      * {@link #findWithinHorizon findWithinHorizon()}, and {@link #skip skip()}

1391      * methods will make a match available if they succeed.

1392      *

1393      * @return a match result for the last match operation

1394      * @throws IllegalStateException  If no match result is available

1395      */

1396     public MatchResult match() {

1397         if (!matchValid)

1398             throw new IllegalStateException("No match result available");

1399         return matcher.toMatchResult();

1400     }

1401 

1402     /**

1403      * <p>Returns the string representation of this {@code Scanner}. The

1404      * string representation of a {@code Scanner} contains information

1405      * that may be useful for debugging. The exact format is unspecified.

1406      *

1407      * @return  The string representation of this scanner

1408      */

1409     public String toString() {

1410         StringBuilder sb = new StringBuilder();

1411         sb.append("java.util.Scanner");

1412         sb.append("[delimiters=" + delimPattern + "]");

1413         sb.append("[position=" + position + "]");

1414         sb.append("[match valid=" + matchValid + "]");

1415         sb.append("[need input=" + needInput + "]");

1416         sb.append("[source closed=" + sourceClosed + "]");

1417         sb.append("[skipped=" + skipped + "]");

1418         sb.append("[group separator=" + groupSeparator + "]");

1419         sb.append("[decimal separator=" + decimalSeparator + "]");

1420         sb.append("[positive prefix=" + positivePrefix + "]");

1421         sb.append("[negative prefix=" + negativePrefix + "]");

1422         sb.append("[positive suffix=" + positiveSuffix + "]");

1423         sb.append("[negative suffix=" + negativeSuffix + "]");

1424         sb.append("[NaN string=" + nanString + "]");

1425         sb.append("[infinity string=" + infinityString + "]");

1426         return sb.toString();

1427     }

1428 

1429     /**

1430      * Returns true if this scanner has another token in its input.

1431      * This method may block while waiting for input to scan.

1432      * The scanner does not advance past any input.

1433      *

1434      * @return true if and only if this scanner has another token

1435      * @throws IllegalStateException if this scanner is closed

1436      * @see java.util.Iterator

1437      */

1438     public boolean hasNext() {

1439         ensureOpen();

1440         saveState();

1441         modCount++;

1442         while (!sourceClosed) {

1443             if (hasTokenInBuffer()) {

1444                 return revertState(true);

1445             }

1446             readInput();

1447         }

1448         boolean result = hasTokenInBuffer();

1449         return revertState(result);

1450     }

1451 

1452     /**

1453      * Finds and returns the next complete token from this scanner.

1454      * A complete token is preceded and followed by input that matches

1455      * the delimiter pattern. This method may block while waiting for input

1456      * to scan, even if a previous invocation of {@link #hasNext} returned

1457      * {@code true}.

1458      *

1459      * @return the next token

1460      * @throws NoSuchElementException if no more tokens are available

1461      * @throws IllegalStateException if this scanner is closed

1462      * @see java.util.Iterator

1463      */

1464     public String next() {

1465         ensureOpen();

1466         clearCaches();

1467         modCount++;

1468         while (true) {

1469             String token = getCompleteTokenInBuffer(null);

1470             if (token != null) {

1471                 matchValid = true;

1472                 skipped = false;

1473                 return token;

1474             }

1475             if (needInput)

1476                 readInput();

1477             else

1478                 throwFor();

1479         }

1480     }

1481 

1482     /**

1483      * The remove operation is not supported by this implementation of

1484      * {@code Iterator}.

1485      *

1486      * @throws UnsupportedOperationException if this method is invoked.

1487      * @see java.util.Iterator

1488      */

1489     public void remove() {

1490         throw new UnsupportedOperationException();

1491     }

1492 

1493     /**

1494      * Returns true if the next token matches the pattern constructed from the

1495      * specified string. The scanner does not advance past any input.

1496      *

1497      * <p> An invocation of this method of the form {@code hasNext(pattern)}

1498      * behaves in exactly the same way as the invocation

1499      * {@code hasNext(Pattern.compile(pattern))}.

1500      *

1501      * @param pattern a string specifying the pattern to scan

1502      * @return true if and only if this scanner has another token matching

1503      *         the specified pattern

1504      * @throws IllegalStateException if this scanner is closed

1505      */

1506     public boolean hasNext(String pattern)  {

1507         return hasNext(patternCache.forName(pattern));

1508     }

1509 

1510     /**

1511      * Returns the next token if it matches the pattern constructed from the

1512      * specified string.  If the match is successful, the scanner advances

1513      * past the input that matched the pattern.

1514      *

1515      * <p> An invocation of this method of the form {@code next(pattern)}

1516      * behaves in exactly the same way as the invocation

1517      * {@code next(Pattern.compile(pattern))}.

1518      *

1519      * @param pattern a string specifying the pattern to scan

1520      * @return the next token

1521      * @throws NoSuchElementException if no such tokens are available

1522      * @throws IllegalStateException if this scanner is closed

1523      */

1524     public String next(String pattern)  {

1525         return next(patternCache.forName(pattern));

1526     }

1527 

1528     /**

1529      * Returns true if the next complete token matches the specified pattern.

1530      * A complete token is prefixed and postfixed by input that matches

1531      * the delimiter pattern. This method may block while waiting for input.

1532      * The scanner does not advance past any input.

1533      *

1534      * @param pattern the pattern to scan for

1535      * @return true if and only if this scanner has another token matching

1536      *         the specified pattern

1537      * @throws IllegalStateException if this scanner is closed

1538      */

1539     public boolean hasNext(Pattern pattern) {

1540         ensureOpen();

1541         if (pattern == null)

1542             throw new NullPointerException();

1543         hasNextPattern = null;

1544         saveState();

1545         modCount++;

1546 

1547         while (true) {

1548             if (getCompleteTokenInBuffer(pattern) != null) {

1549                 matchValid = true;

1550                 cacheResult();

1551                 return revertState(true);

1552             }

1553             if (needInput)

1554                 readInput();

1555             else

1556                 return revertState(false);

1557         }

1558     }

1559 

1560     /**

1561      * Returns the next token if it matches the specified pattern. This

1562      * method may block while waiting for input to scan, even if a previous

1563      * invocation of {@link #hasNext(Pattern)} returned {@code true}.

1564      * If the match is successful, the scanner advances past the input that

1565      * matched the pattern.

1566      *

1567      * @param pattern the pattern to scan for

1568      * @return the next token

1569      * @throws NoSuchElementException if no more tokens are available

1570      * @throws IllegalStateException if this scanner is closed

1571      */

1572     public String next(Pattern pattern) {

1573         ensureOpen();

1574         if (pattern == null)

1575             throw new NullPointerException();

1576 

1577         modCount++;

1578         // Did we already find this pattern?

1579         if (hasNextPattern == pattern)

1580             return getCachedResult();

1581         clearCaches();

1582 

1583         // Search for the pattern

1584         while (true) {

1585             String token = getCompleteTokenInBuffer(pattern);

1586             if (token != null) {

1587                 matchValid = true;

1588                 skipped = false;

1589                 return token;

1590             }

1591             if (needInput)

1592                 readInput();

1593             else

1594                 throwFor();

1595         }

1596     }

1597 

1598     /**

1599      * Returns true if there is another line in the input of this scanner.

1600      * This method may block while waiting for input. The scanner does not

1601      * advance past any input.

1602      *

1603      * @return true if and only if this scanner has another line of input

1604      * @throws IllegalStateException if this scanner is closed

1605      */

1606     public boolean hasNextLine() {

1607         saveState();

1608 

1609         modCount++;

1610         String result = findWithinHorizon(linePattern(), 0);

1611         if (result != null) {

1612             MatchResult mr = this.match();

1613             String lineSep = mr.group(1);

1614             if (lineSep != null) {

1615                 result = result.substring(0, result.length() -

1616                                           lineSep.length());

1617                 cacheResult(result);

1618 

1619             } else {

1620                 cacheResult();

1621             }

1622         }

1623         revertState();

1624         return (result != null);

1625     }

1626 

1627     /**

1628      * Advances this scanner past the current line and returns the input

1629      * that was skipped.

1630      *

1631      * This method returns the rest of the current line, excluding any line

1632      * separator at the end. The position is set to the beginning of the next

1633      * line.

1634      *

1635      * <p>Since this method continues to search through the input looking

1636      * for a line separator, it may buffer all of the input searching for

1637      * the line to skip if no line separators are present.

1638      *

1639      * @return the line that was skipped

1640      * @throws NoSuchElementException if no line was found

1641      * @throws IllegalStateException if this scanner is closed

1642      */

1643     public String nextLine() {

1644         modCount++;

1645         if (hasNextPattern == linePattern())

1646             return getCachedResult();

1647         clearCaches();

1648 

1649         String result = findWithinHorizon(linePattern, 0);

1650         if (result == null)

1651             throw new NoSuchElementException("No line found");

1652         MatchResult mr = this.match();

1653         String lineSep = mr.group(1);

1654         if (lineSep != null)

1655             result = result.substring(0, result.length() - lineSep.length());

1656         if (result == null)

1657             throw new NoSuchElementException();

1658         else

1659             return result;

1660     }

1661 

1662     // Public methods that ignore delimiters

1663 

1664     /**

1665      * Attempts to find the next occurrence of a pattern constructed from the

1666      * specified string, ignoring delimiters.

1667      *

1668      * <p>An invocation of this method of the form {@code findInLine(pattern)}

1669      * behaves in exactly the same way as the invocation

1670      * {@code findInLine(Pattern.compile(pattern))}.

1671      *

1672      * @param pattern a string specifying the pattern to search for

1673      * @return the text that matched the specified pattern

1674      * @throws IllegalStateException if this scanner is closed

1675      */

1676     public String findInLine(String pattern) {

1677         return findInLine(patternCache.forName(pattern));

1678     }

1679 

1680     /**

1681      * Attempts to find the next occurrence of the specified pattern ignoring

1682      * delimiters. If the pattern is found before the next line separator, the

1683      * scanner advances past the input that matched and returns the string that

1684      * matched the pattern.

1685      * If no such pattern is detected in the input up to the next line

1686      * separator, then {@code null} is returned and the scanner's

1687      * position is unchanged. This method may block waiting for input that

1688      * matches the pattern.

1689      *

1690      * <p>Since this method continues to search through the input looking

1691      * for the specified pattern, it may buffer all of the input searching for

1692      * the desired token if no line separators are present.

1693      *

1694      * @param pattern the pattern to scan for

1695      * @return the text that matched the specified pattern

1696      * @throws IllegalStateException if this scanner is closed

1697      */

1698     public String findInLine(Pattern pattern) {

1699         ensureOpen();

1700         if (pattern == null)

1701             throw new NullPointerException();

1702         clearCaches();

1703         modCount++;

1704         // Expand buffer to include the next newline or end of input

1705         int endPosition = 0;

1706         saveState();

1707         while (true) {

1708             if (findPatternInBuffer(separatorPattern(), 0)) {

1709                 endPosition = matcher.start();

1710                 break; // up to next newline

1711             }

1712             if (needInput) {

1713                 readInput();

1714             } else {

1715                 endPosition = buf.limit();

1716                 break; // up to end of input

1717             }

1718         }

1719         revertState();

1720         int horizonForLine = endPosition - position;

1721         // If there is nothing between the current pos and the next

1722         // newline simply return null, invoking findWithinHorizon

1723         // with "horizon=0" will scan beyond the line bound.

1724         if (horizonForLine == 0)

1725             return null;

1726         // Search for the pattern

1727         return findWithinHorizon(pattern, horizonForLine);

1728     }

1729 

1730     /**

1731      * Attempts to find the next occurrence of a pattern constructed from the

1732      * specified string, ignoring delimiters.

1733      *

1734      * <p>An invocation of this method of the form

1735      * {@code findWithinHorizon(pattern, horizon)} behaves in exactly the same way as

1736      * the invocation

1737      * {@code findWithinHorizon(Pattern.compile(pattern), horizon)}.

1738      *

1739      * @param pattern a string specifying the pattern to search for

1740      * @param horizon the search horizon

1741      * @return the text that matched the specified pattern

1742      * @throws IllegalStateException if this scanner is closed

1743      * @throws IllegalArgumentException if horizon is negative

1744      */

1745     public String findWithinHorizon(String pattern, int horizon) {

1746         return findWithinHorizon(patternCache.forName(pattern), horizon);

1747     }

1748 

1749     /**

1750      * Attempts to find the next occurrence of the specified pattern.

1751      *

1752      * <p>This method searches through the input up to the specified

1753      * search horizon, ignoring delimiters. If the pattern is found the

1754      * scanner advances past the input that matched and returns the string

1755      * that matched the pattern. If no such pattern is detected then

1756      * {@code null} is returned and the scanner's position remains unchanged. This

1757      * method may block waiting for input that matches the pattern.

1758      *

1759      * <p>A scanner will never search more than {@code horizon} code

1760      * points beyond its current position. Note that a match may be clipped

1761      * by the horizon; that is, an arbitrary match result may have been

1762      * different if the horizon had been larger. The scanner treats the

1763      * horizon as a transparent, non-anchoring bound (see {@link

1764      * Matcher#useTransparentBounds} and {@link Matcher#useAnchoringBounds}).

1765      *

1766      * <p>If horizon is {@code 0}, then the horizon is ignored and

1767      * this method continues to search through the input looking for the

1768      * specified pattern without bound. In this case it may buffer all of

1769      * the input searching for the pattern.

1770      *

1771      * <p>If horizon is negative, then an IllegalArgumentException is

1772      * thrown.

1773      *

1774      * @param pattern the pattern to scan for

1775      * @param horizon the search horizon

1776      * @return the text that matched the specified pattern

1777      * @throws IllegalStateException if this scanner is closed

1778      * @throws IllegalArgumentException if horizon is negative

1779      */

1780     public String findWithinHorizon(Pattern pattern, int horizon) {

1781         ensureOpen();

1782         if (pattern == null)

1783             throw new NullPointerException();

1784         if (horizon < 0)

1785             throw new IllegalArgumentException("horizon < 0");

1786         clearCaches();

1787         modCount++;

1788 

1789         // Search for the pattern

1790         while (true) {

1791             if (findPatternInBuffer(pattern, horizon)) {

1792                 matchValid = true;

1793                 return matcher.group();

1794             }

1795             if (needInput)

1796                 readInput();

1797             else

1798                 break; // up to end of input

1799         }

1800         return null;

1801     }

1802 

1803     /**

1804      * Skips input that matches the specified pattern, ignoring delimiters.

1805      * This method will skip input if an anchored match of the specified

1806      * pattern succeeds.

1807      *

1808      * <p>If a match to the specified pattern is not found at the

1809      * current position, then no input is skipped and a

1810      * {@code NoSuchElementException} is thrown.

1811      *

1812      * <p>Since this method seeks to match the specified pattern starting at

1813      * the scanner's current position, patterns that can match a lot of

1814      * input (".*", for example) may cause the scanner to buffer a large

1815      * amount of input.

1816      *

1817      * <p>Note that it is possible to skip something without risking a

1818      * {@code NoSuchElementException} by using a pattern that can

1819      * match nothing, e.g., {@code sc.skip("[ \t]*")}.

1820      *

1821      * @param pattern the pattern to skip over

1822      * @return this scanner

1823      * @throws NoSuchElementException if the specified pattern is not found

1824      * @throws IllegalStateException if this scanner is closed

1825      */

1826     public Scanner skip(Pattern pattern) {

1827         ensureOpen();

1828         if (pattern == null)

1829             throw new NullPointerException();

1830         clearCaches();

1831         modCount++;

1832 

1833         // Search for the pattern

1834         while (true) {

1835             if (matchPatternInBuffer(pattern)) {

1836                 matchValid = true;

1837                 position = matcher.end();

1838                 return this;

1839             }

1840             if (needInput)

1841                 readInput();

1842             else

1843                 throw new NoSuchElementException();

1844         }

1845     }

1846 

1847     /**

1848      * Skips input that matches a pattern constructed from the specified

1849      * string.

1850      *

1851      * <p> An invocation of this method of the form {@code skip(pattern)}

1852      * behaves in exactly the same way as the invocation

1853      * {@code skip(Pattern.compile(pattern))}.

1854      *

1855      * @param pattern a string specifying the pattern to skip over

1856      * @return this scanner

1857      * @throws IllegalStateException if this scanner is closed

1858      */

1859     public Scanner skip(String pattern) {

1860         return skip(patternCache.forName(pattern));

1861     }

1862 

1863     // Convenience methods for scanning primitives

1864 

1865     /**

1866      * Returns true if the next token in this scanner's input can be

1867      * interpreted as a boolean value using a case insensitive pattern

1868      * created from the string "true|false".  The scanner does not

1869      * advance past the input that matched.

1870      *

1871      * @return true if and only if this scanner's next token is a valid

1872      *         boolean value

1873      * @throws IllegalStateException if this scanner is closed

1874      */

1875     public boolean hasNextBoolean()  {

1876         return hasNext(boolPattern());

1877     }

1878 

1879     /**

1880      * Scans the next token of the input into a boolean value and returns

1881      * that value. This method will throw {@code InputMismatchException}

1882      * if the next token cannot be translated into a valid boolean value.

1883      * If the match is successful, the scanner advances past the input that

1884      * matched.

1885      *

1886      * @return the boolean scanned from the input

1887      * @throws InputMismatchException if the next token is not a valid boolean

1888      * @throws NoSuchElementException if input is exhausted

1889      * @throws IllegalStateException if this scanner is closed

1890      */

1891     public boolean nextBoolean()  {

1892         clearCaches();

1893         return Boolean.parseBoolean(next(boolPattern()));

1894     }

1895 

1896     /**

1897      * Returns true if the next token in this scanner's input can be

1898      * interpreted as a byte value in the default radix using the

1899      * {@link #nextByte} method. The scanner does not advance past any input.

1900      *

1901      * @return true if and only if this scanner's next token is a valid

1902      *         byte value

1903      * @throws IllegalStateException if this scanner is closed

1904      */

1905     public boolean hasNextByte() {

1906         return hasNextByte(defaultRadix);

1907     }

1908 

1909     /**

1910      * Returns true if the next token in this scanner's input can be

1911      * interpreted as a byte value in the specified radix using the

1912      * {@link #nextByte} method. The scanner does not advance past any input.

1913      *

1914      * <p>If the radix is less than {@link Character#MIN_RADIX Character.MIN_RADIX}

1915      * or greater than {@link Character#MAX_RADIX Character.MAX_RADIX}, then an

1916      * {@code IllegalArgumentException} is thrown.

1917      *

1918      * @param radix the radix used to interpret the token as a byte value

1919      * @return true if and only if this scanner's next token is a valid

1920      *         byte value

1921      * @throws IllegalStateException if this scanner is closed

1922      * @throws IllegalArgumentException if the radix is out of range

1923      */

1924     public boolean hasNextByte(int radix) {

1925         setRadix(radix);

1926         boolean result = hasNext(integerPattern());

1927         if (result) { // Cache it

1928             try {

1929                 String s = (matcher.group(SIMPLE_GROUP_INDEX) == null) ?

1930                     processIntegerToken(hasNextResult) :

1931                     hasNextResult;

1932                 typeCache = Byte.parseByte(s, radix);

1933             } catch (NumberFormatException nfe) {

1934                 result = false;

1935             }

1936         }

1937         return result;

1938     }

1939 

1940     /**

1941      * Scans the next token of the input as a {@code byte}.

1942      *

1943      * <p> An invocation of this method of the form

1944      * {@code nextByte()} behaves in exactly the same way as the

1945      * invocation {@code nextByte(radix)}, where {@code radix}

1946      * is the default radix of this scanner.

1947      *

1948      * @return the {@code byte} scanned from the input

1949      * @throws InputMismatchException

1950      *         if the next token does not match the <i>Integer</i>

1951      *         regular expression, or is out of range

1952      * @throws NoSuchElementException if input is exhausted

1953      * @throws IllegalStateException if this scanner is closed

1954      */

1955     public byte nextByte() {

1956          return nextByte(defaultRadix);

1957     }

1958 

1959     /**

1960      * Scans the next token of the input as a {@code byte}.

1961      * This method will throw {@code InputMismatchException}

1962      * if the next token cannot be translated into a valid byte value as

1963      * described below. If the translation is successful, the scanner advances

1964      * past the input that matched.

1965      *

1966      * <p> If the next token matches the <a

1967      * href="#Integer-regex"><i>Integer</i></a> regular expression defined

1968      * above then the token is converted into a {@code byte} value as if by

1969      * removing all locale specific prefixes, group separators, and locale

1970      * specific suffixes, then mapping non-ASCII digits into ASCII

1971      * digits via {@link Character#digit Character.digit}, prepending a

1972      * negative sign (-) if the locale specific negative prefixes and suffixes

1973      * were present, and passing the resulting string to

1974      * {@link Byte#parseByte(String, int) Byte.parseByte} with the

1975      * specified radix.

1976      *

1977      * <p>If the radix is less than {@link Character#MIN_RADIX Character.MIN_RADIX}

1978      * or greater than {@link Character#MAX_RADIX Character.MAX_RADIX}, then an

1979      * {@code IllegalArgumentException} is thrown.

1980      *

1981      * @param radix the radix used to interpret the token as a byte value

1982      * @return the {@code byte} scanned from the input

1983      * @throws InputMismatchException

1984      *         if the next token does not match the <i>Integer</i>

1985      *         regular expression, or is out of range

1986      * @throws NoSuchElementException if input is exhausted

1987      * @throws IllegalStateException if this scanner is closed

1988      * @throws IllegalArgumentException if the radix is out of range

1989      */

1990     public byte nextByte(int radix) {

1991         // Check cached result

1992         if ((typeCache != null) && (typeCache instanceof Byte)

1993             && this.radix == radix) {

1994             byte val = ((Byte)typeCache).byteValue();

1995             useTypeCache();

1996             return val;

1997         }

1998         setRadix(radix);

1999         clearCaches();

2000         // Search for next byte

2001         try {

2002             String s = next(integerPattern());

2003             if (matcher.group(SIMPLE_GROUP_INDEX) == null)

2004                 s = processIntegerToken(s);

2005             return Byte.parseByte(s, radix);

2006         } catch (NumberFormatException nfe) {

2007             position = matcher.start(); // don't skip bad token

2008             throw new InputMismatchException(nfe.getMessage());

2009         }

2010     }

2011 

2012     /**

2013      * Returns true if the next token in this scanner's input can be

2014      * interpreted as a short value in the default radix using the

2015      * {@link #nextShort} method. The scanner does not advance past any input.

2016      *

2017      * @return true if and only if this scanner's next token is a valid

2018      *         short value in the default radix

2019      * @throws IllegalStateException if this scanner is closed

2020      */

2021     public boolean hasNextShort() {

2022         return hasNextShort(defaultRadix);

2023     }

2024 

2025     /**

2026      * Returns true if the next token in this scanner's input can be

2027      * interpreted as a short value in the specified radix using the

2028      * {@link #nextShort} method. The scanner does not advance past any input.

2029      *

2030      * <p>If the radix is less than {@link Character#MIN_RADIX Character.MIN_RADIX}

2031      * or greater than {@link Character#MAX_RADIX Character.MAX_RADIX}, then an

2032      * {@code IllegalArgumentException} is thrown.

2033      *

2034      * @param radix the radix used to interpret the token as a short value

2035      * @return true if and only if this scanner's next token is a valid

2036      *         short value in the specified radix

2037      * @throws IllegalStateException if this scanner is closed

2038      * @throws IllegalArgumentException if the radix is out of range

2039      */

2040     public boolean hasNextShort(int radix) {

2041         setRadix(radix);

2042         boolean result = hasNext(integerPattern());

2043         if (result) { // Cache it

2044             try {

2045                 String s = (matcher.group(SIMPLE_GROUP_INDEX) == null) ?

2046                     processIntegerToken(hasNextResult) :

2047                     hasNextResult;

2048                 typeCache = Short.parseShort(s, radix);

2049             } catch (NumberFormatException nfe) {

2050                 result = false;

2051             }

2052         }

2053         return result;

2054     }

2055 

2056     /**

2057      * Scans the next token of the input as a {@code short}.

2058      *

2059      * <p> An invocation of this method of the form

2060      * {@code nextShort()} behaves in exactly the same way as the

2061      * invocation {@link #nextShort(int) nextShort(radix)}, where {@code radix}

2062      * is the default radix of this scanner.

2063      *

2064      * @return the {@code short} scanned from the input

2065      * @throws InputMismatchException

2066      *         if the next token does not match the <i>Integer</i>

2067      *         regular expression, or is out of range

2068      * @throws NoSuchElementException if input is exhausted

2069      * @throws IllegalStateException if this scanner is closed

2070      */

2071     public short nextShort() {

2072         return nextShort(defaultRadix);

2073     }

2074 

2075     /**

2076      * Scans the next token of the input as a {@code short}.

2077      * This method will throw {@code InputMismatchException}

2078      * if the next token cannot be translated into a valid short value as

2079      * described below. If the translation is successful, the scanner advances

2080      * past the input that matched.

2081      *

2082      * <p> If the next token matches the <a

2083      * href="#Integer-regex"><i>Integer</i></a> regular expression defined

2084      * above then the token is converted into a {@code short} value as if by

2085      * removing all locale specific prefixes, group separators, and locale

2086      * specific suffixes, then mapping non-ASCII digits into ASCII

2087      * digits via {@link Character#digit Character.digit}, prepending a

2088      * negative sign (-) if the locale specific negative prefixes and suffixes

2089      * were present, and passing the resulting string to

2090      * {@link Short#parseShort(String, int) Short.parseShort} with the

2091      * specified radix.

2092      *

2093      * <p>If the radix is less than {@link Character#MIN_RADIX Character.MIN_RADIX}

2094      * or greater than {@link Character#MAX_RADIX Character.MAX_RADIX}, then an

2095      * {@code IllegalArgumentException} is thrown.

2096      *

2097      * @param radix the radix used to interpret the token as a short value

2098      * @return the {@code short} scanned from the input

2099      * @throws InputMismatchException

2100      *         if the next token does not match the <i>Integer</i>

2101      *         regular expression, or is out of range

2102      * @throws NoSuchElementException if input is exhausted

2103      * @throws IllegalStateException if this scanner is closed

2104      * @throws IllegalArgumentException if the radix is out of range

2105      */

2106     public short nextShort(int radix) {

2107         // Check cached result

2108         if ((typeCache != null) && (typeCache instanceof Short)

2109             && this.radix == radix) {

2110             short val = ((Short)typeCache).shortValue();

2111             useTypeCache();

2112             return val;

2113         }

2114         setRadix(radix);

2115         clearCaches();

2116         // Search for next short

2117         try {

2118             String s = next(integerPattern());

2119             if (matcher.group(SIMPLE_GROUP_INDEX) == null)

2120                 s = processIntegerToken(s);

2121             return Short.parseShort(s, radix);

2122         } catch (NumberFormatException nfe) {

2123             position = matcher.start(); // don't skip bad token

2124             throw new InputMismatchException(nfe.getMessage());

2125         }

2126     }

2127 

2128     /**

2129      * Returns true if the next token in this scanner's input can be

2130      * interpreted as an int value in the default radix using the

2131      * {@link #nextInt} method. The scanner does not advance past any input.

2132      *

2133      * @return true if and only if this scanner's next token is a valid

2134      *         int value

2135      * @throws IllegalStateException if this scanner is closed

2136      */

2137     public boolean hasNextInt() {

2138         return hasNextInt(defaultRadix);

2139     }

2140 

2141     /**

2142      * Returns true if the next token in this scanner's input can be

2143      * interpreted as an int value in the specified radix using the

2144      * {@link #nextInt} method. The scanner does not advance past any input.

2145      *

2146      * <p>If the radix is less than {@link Character#MIN_RADIX Character.MIN_RADIX}

2147      * or greater than {@link Character#MAX_RADIX Character.MAX_RADIX}, then an

2148      * {@code IllegalArgumentException} is thrown.

2149      *

2150      * @param radix the radix used to interpret the token as an int value

2151      * @return true if and only if this scanner's next token is a valid

2152      *         int value

2153      * @throws IllegalStateException if this scanner is closed

2154      * @throws IllegalArgumentException if the radix is out of range

2155      */

2156     public boolean hasNextInt(int radix) {

2157         setRadix(radix);

2158         boolean result = hasNext(integerPattern());

2159         if (result) { // Cache it

2160             try {

2161                 String s = (matcher.group(SIMPLE_GROUP_INDEX) == null) ?

2162                     processIntegerToken(hasNextResult) :

2163                     hasNextResult;

2164                 typeCache = Integer.parseInt(s, radix);

2165             } catch (NumberFormatException nfe) {

2166                 result = false;

2167             }

2168         }

2169         return result;

2170     }

2171 

2172     /**

2173      * The integer token must be stripped of prefixes, group separators,

2174      * and suffixes, non ascii digits must be converted into ascii digits

2175      * before parse will accept it.

2176      */

2177     private String processIntegerToken(String token) {

2178         String result = token.replaceAll(""+groupSeparator, "");

2179         boolean isNegative = false;

2180         int preLen = negativePrefix.length();

2181         if ((preLen > 0) && result.startsWith(negativePrefix)) {

2182             isNegative = true;

2183             result = result.substring(preLen);

2184         }

2185         int sufLen = negativeSuffix.length();

2186         if ((sufLen > 0) && result.endsWith(negativeSuffix)) {

2187             isNegative = true;

2188             result = result.substring(result.length() - sufLen,

2189                                       result.length());

2190         }

2191         if (isNegative)

2192             result = "-" + result;

2193         return result;

2194     }

2195 

2196     /**

2197      * Scans the next token of the input as an {@code int}.

2198      *

2199      * <p> An invocation of this method of the form

2200      * {@code nextInt()} behaves in exactly the same way as the

2201      * invocation {@code nextInt(radix)}, where {@code radix}

2202      * is the default radix of this scanner.

2203      *

2204      * @return the {@code int} scanned from the input

2205      * @throws InputMismatchException

2206      *         if the next token does not match the <i>Integer</i>

2207      *         regular expression, or is out of range

2208      * @throws NoSuchElementException if input is exhausted

2209      * @throws IllegalStateException if this scanner is closed

2210      */

2211     public int nextInt() {

2212         return nextInt(defaultRadix);

2213     }

2214 

2215     /**

2216      * Scans the next token of the input as an {@code int}.

2217      * This method will throw {@code InputMismatchException}

2218      * if the next token cannot be translated into a valid int value as

2219      * described below. If the translation is successful, the scanner advances

2220      * past the input that matched.

2221      *

2222      * <p> If the next token matches the <a

2223      * href="#Integer-regex"><i>Integer</i></a> regular expression defined

2224      * above then the token is converted into an {@code int} value as if by

2225      * removing all locale specific prefixes, group separators, and locale

2226      * specific suffixes, then mapping non-ASCII digits into ASCII

2227      * digits via {@link Character#digit Character.digit}, prepending a

2228      * negative sign (-) if the locale specific negative prefixes and suffixes

2229      * were present, and passing the resulting string to

2230      * {@link Integer#parseInt(String, int) Integer.parseInt} with the

2231      * specified radix.

2232      *

2233      * <p>If the radix is less than {@link Character#MIN_RADIX Character.MIN_RADIX}

2234      * or greater than {@link Character#MAX_RADIX Character.MAX_RADIX}, then an

2235      * {@code IllegalArgumentException} is thrown.

2236      *

2237      * @param radix the radix used to interpret the token as an int value

2238      * @return the {@code int} scanned from the input

2239      * @throws InputMismatchException

2240      *         if the next token does not match the <i>Integer</i>

2241      *         regular expression, or is out of range

2242      * @throws NoSuchElementException if input is exhausted

2243      * @throws IllegalStateException if this scanner is closed

2244      * @throws IllegalArgumentException if the radix is out of range

2245      */

2246     public int nextInt(int radix) {

2247         // Check cached result

2248         if ((typeCache != null) && (typeCache instanceof Integer)

2249             && this.radix == radix) {

2250             int val = ((Integer)typeCache).intValue();

2251             useTypeCache();

2252             return val;

2253         }

2254         setRadix(radix);

2255         clearCaches();

2256         // Search for next int

2257         try {

2258             String s = next(integerPattern());

2259             if (matcher.group(SIMPLE_GROUP_INDEX) == null)

2260                 s = processIntegerToken(s);

2261             return Integer.parseInt(s, radix);

2262         } catch (NumberFormatException nfe) {

2263             position = matcher.start(); // don't skip bad token

2264             throw new InputMismatchException(nfe.getMessage());

2265         }

2266     }

2267 

2268     /**

2269      * Returns true if the next token in this scanner's input can be

2270      * interpreted as a long value in the default radix using the

2271      * {@link #nextLong} method. The scanner does not advance past any input.

2272      *

2273      * @return true if and only if this scanner's next token is a valid

2274      *         long value

2275      * @throws IllegalStateException if this scanner is closed

2276      */

2277     public boolean hasNextLong() {

2278         return hasNextLong(defaultRadix);

2279     }

2280 

2281     /**

2282      * Returns true if the next token in this scanner's input can be

2283      * interpreted as a long value in the specified radix using the

2284      * {@link #nextLong} method. The scanner does not advance past any input.

2285      *

2286      * <p>If the radix is less than {@link Character#MIN_RADIX Character.MIN_RADIX}

2287      * or greater than {@link Character#MAX_RADIX Character.MAX_RADIX}, then an

2288      * {@code IllegalArgumentException} is thrown.

2289      *

2290      * @param radix the radix used to interpret the token as a long value

2291      * @return true if and only if this scanner's next token is a valid

2292      *         long value

2293      * @throws IllegalStateException if this scanner is closed

2294      * @throws IllegalArgumentException if the radix is out of range

2295      */

2296     public boolean hasNextLong(int radix) {

2297         setRadix(radix);

2298         boolean result = hasNext(integerPattern());

2299         if (result) { // Cache it

2300             try {

2301                 String s = (matcher.group(SIMPLE_GROUP_INDEX) == null) ?

2302                     processIntegerToken(hasNextResult) :

2303                     hasNextResult;

2304                 typeCache = Long.parseLong(s, radix);

2305             } catch (NumberFormatException nfe) {

2306                 result = false;

2307             }

2308         }

2309         return result;

2310     }

2311 

2312     /**

2313      * Scans the next token of the input as a {@code long}.

2314      *

2315      * <p> An invocation of this method of the form

2316      * {@code nextLong()} behaves in exactly the same way as the

2317      * invocation {@code nextLong(radix)}, where {@code radix}

2318      * is the default radix of this scanner.

2319      *

2320      * @return the {@code long} scanned from the input

2321      * @throws InputMismatchException

2322      *         if the next token does not match the <i>Integer</i>

2323      *         regular expression, or is out of range

2324      * @throws NoSuchElementException if input is exhausted

2325      * @throws IllegalStateException if this scanner is closed

2326      */

2327     public long nextLong() {

2328         return nextLong(defaultRadix);

2329     }

2330 

2331     /**

2332      * Scans the next token of the input as a {@code long}.

2333      * This method will throw {@code InputMismatchException}

2334      * if the next token cannot be translated into a valid long value as

2335      * described below. If the translation is successful, the scanner advances

2336      * past the input that matched.

2337      *

2338      * <p> If the next token matches the <a

2339      * href="#Integer-regex"><i>Integer</i></a> regular expression defined

2340      * above then the token is converted into a {@code long} value as if by

2341      * removing all locale specific prefixes, group separators, and locale

2342      * specific suffixes, then mapping non-ASCII digits into ASCII

2343      * digits via {@link Character#digit Character.digit}, prepending a

2344      * negative sign (-) if the locale specific negative prefixes and suffixes

2345      * were present, and passing the resulting string to

2346      * {@link Long#parseLong(String, int) Long.parseLong} with the

2347      * specified radix.

2348      *

2349      * <p>If the radix is less than {@link Character#MIN_RADIX Character.MIN_RADIX}

2350      * or greater than {@link Character#MAX_RADIX Character.MAX_RADIX}, then an

2351      * {@code IllegalArgumentException} is thrown.

2352      *

2353      * @param radix the radix used to interpret the token as a long value

2354      * @return the {@code long} scanned from the input

2355      * @throws InputMismatchException

2356      *         if the next token does not match the <i>Integer</i>

2357      *         regular expression, or is out of range

2358      * @throws NoSuchElementException if input is exhausted

2359      * @throws IllegalStateException if this scanner is closed

2360      * @throws IllegalArgumentException if the radix is out of range

2361      */

2362     public long nextLong(int radix) {

2363         // Check cached result

2364         if ((typeCache != null) && (typeCache instanceof Long)

2365             && this.radix == radix) {

2366             long val = ((Long)typeCache).longValue();

2367             useTypeCache();

2368             return val;

2369         }

2370         setRadix(radix);

2371         clearCaches();

2372         try {

2373             String s = next(integerPattern());

2374             if (matcher.group(SIMPLE_GROUP_INDEX) == null)

2375                 s = processIntegerToken(s);

2376             return Long.parseLong(s, radix);

2377         } catch (NumberFormatException nfe) {

2378             position = matcher.start(); // don't skip bad token

2379             throw new InputMismatchException(nfe.getMessage());

2380         }

2381     }

2382 

2383     /**

2384      * The float token must be stripped of prefixes, group separators,

2385      * and suffixes, non ascii digits must be converted into ascii digits

2386      * before parseFloat will accept it.

2387      *

2388      * If there are non-ascii digits in the token these digits must

2389      * be processed before the token is passed to parseFloat.

2390      */

2391     private String processFloatToken(String token) {

2392         String result = token.replaceAll(groupSeparator, "");

2393         if (!decimalSeparator.equals("\\."))

2394             result = result.replaceAll(decimalSeparator, ".");

2395         boolean isNegative = false;

2396         int preLen = negativePrefix.length();

2397         if ((preLen > 0) && result.startsWith(negativePrefix)) {

2398             isNegative = true;

2399             result = result.substring(preLen);

2400         }

2401         int sufLen = negativeSuffix.length();

2402         if ((sufLen > 0) && result.endsWith(negativeSuffix)) {

2403             isNegative = true;

2404             result = result.substring(result.length() - sufLen,

2405                                       result.length());

2406         }

2407         if (result.equals(nanString))

2408             result = "NaN";

2409         if (result.equals(infinityString))

2410             result = "Infinity";

2411         if (isNegative)

2412             result = "-" + result;

2413 

2414         // Translate non-ASCII digits

2415         Matcher m = NON_ASCII_DIGIT.matcher(result);

2416         if (m.find()) {

2417             StringBuilder inASCII = new StringBuilder();

2418             for (int i=0; i<result.length(); i++) {

2419                 char nextChar = result.charAt(i);

2420                 if (Character.isDigit(nextChar)) {

2421                     int d = Character.digit(nextChar, 10);

2422                     if (d != -1)

2423                         inASCII.append(d);

2424                     else

2425                         inASCII.append(nextChar);

2426                 } else {

2427                     inASCII.append(nextChar);

2428                 }

2429             }

2430             result = inASCII.toString();

2431         }

2432 

2433         return result;

2434     }

2435 

2436     /**

2437      * Returns true if the next token in this scanner's input can be

2438      * interpreted as a float value using the {@link #nextFloat}

2439      * method. The scanner does not advance past any input.

2440      *

2441      * @return true if and only if this scanner's next token is a valid

2442      *         float value

2443      * @throws IllegalStateException if this scanner is closed

2444      */

2445     public boolean hasNextFloat() {

2446         setRadix(10);

2447         boolean result = hasNext(floatPattern());

2448         if (result) { // Cache it

2449             try {

2450                 String s = processFloatToken(hasNextResult);

2451                 typeCache = Float.valueOf(Float.parseFloat(s));

2452             } catch (NumberFormatException nfe) {

2453                 result = false;

2454             }

2455         }

2456         return result;

2457     }

2458 

2459     /**

2460      * Scans the next token of the input as a {@code float}.

2461      * This method will throw {@code InputMismatchException}

2462      * if the next token cannot be translated into a valid float value as

2463      * described below. If the translation is successful, the scanner advances

2464      * past the input that matched.

2465      *

2466      * <p> If the next token matches the <a

2467      * href="#Float-regex"><i>Float</i></a> regular expression defined above

2468      * then the token is converted into a {@code float} value as if by

2469      * removing all locale specific prefixes, group separators, and locale

2470      * specific suffixes, then mapping non-ASCII digits into ASCII

2471      * digits via {@link Character#digit Character.digit}, prepending a

2472      * negative sign (-) if the locale specific negative prefixes and suffixes

2473      * were present, and passing the resulting string to

2474      * {@link Float#parseFloat Float.parseFloat}. If the token matches

2475      * the localized NaN or infinity strings, then either "NaN" or "Infinity"

2476      * is passed to {@link Float#parseFloat(String) Float.parseFloat} as

2477      * appropriate.

2478      *

2479      * @return the {@code float} scanned from the input

2480      * @throws InputMismatchException

2481      *         if the next token does not match the <i>Float</i>

2482      *         regular expression, or is out of range

2483      * @throws NoSuchElementException if input is exhausted

2484      * @throws IllegalStateException if this scanner is closed

2485      */

2486     public float nextFloat() {

2487         // Check cached result

2488         if ((typeCache != null) && (typeCache instanceof Float)) {

2489             float val = ((Float)typeCache).floatValue();

2490             useTypeCache();

2491             return val;

2492         }

2493         setRadix(10);

2494         clearCaches();

2495         try {

2496             return Float.parseFloat(processFloatToken(next(floatPattern())));

2497         } catch (NumberFormatException nfe) {

2498             position = matcher.start(); // don't skip bad token

2499             throw new InputMismatchException(nfe.getMessage());

2500         }

2501     }

2502 

2503     /**

2504      * Returns true if the next token in this scanner's input can be

2505      * interpreted as a double value using the {@link #nextDouble}

2506      * method. The scanner does not advance past any input.

2507      *

2508      * @return true if and only if this scanner's next token is a valid

2509      *         double value

2510      * @throws IllegalStateException if this scanner is closed

2511      */

2512     public boolean hasNextDouble() {

2513         setRadix(10);

2514         boolean result = hasNext(floatPattern());

2515         if (result) { // Cache it

2516             try {

2517                 String s = processFloatToken(hasNextResult);

2518                 typeCache = Double.valueOf(Double.parseDouble(s));

2519             } catch (NumberFormatException nfe) {

2520                 result = false;

2521             }

2522         }

2523         return result;

2524     }

2525 

2526     /**

2527      * Scans the next token of the input as a {@code double}.

2528      * This method will throw {@code InputMismatchException}

2529      * if the next token cannot be translated into a valid double value.

2530      * If the translation is successful, the scanner advances past the input

2531      * that matched.

2532      *

2533      * <p> If the next token matches the <a

2534      * href="#Float-regex"><i>Float</i></a> regular expression defined above

2535      * then the token is converted into a {@code double} value as if by

2536      * removing all locale specific prefixes, group separators, and locale

2537      * specific suffixes, then mapping non-ASCII digits into ASCII

2538      * digits via {@link Character#digit Character.digit}, prepending a

2539      * negative sign (-) if the locale specific negative prefixes and suffixes

2540      * were present, and passing the resulting string to

2541      * {@link Double#parseDouble Double.parseDouble}. If the token matches

2542      * the localized NaN or infinity strings, then either "NaN" or "Infinity"

2543      * is passed to {@link Double#parseDouble(String) Double.parseDouble} as

2544      * appropriate.

2545      *

2546      * @return the {@code double} scanned from the input

2547      * @throws InputMismatchException

2548      *         if the next token does not match the <i>Float</i>

2549      *         regular expression, or is out of range

2550      * @throws NoSuchElementException if the input is exhausted

2551      * @throws IllegalStateException if this scanner is closed

2552      */

2553     public double nextDouble() {

2554         // Check cached result

2555         if ((typeCache != null) && (typeCache instanceof Double)) {

2556             double val = ((Double)typeCache).doubleValue();

2557             useTypeCache();

2558             return val;

2559         }

2560         setRadix(10);

2561         clearCaches();

2562         // Search for next float

2563         try {

2564             return Double.parseDouble(processFloatToken(next(floatPattern())));

2565         } catch (NumberFormatException nfe) {

2566             position = matcher.start(); // don't skip bad token

2567             throw new InputMismatchException(nfe.getMessage());

2568         }

2569     }

2570 

2571     // Convenience methods for scanning multi precision numbers

2572 

2573     /**

2574      * Returns true if the next token in this scanner's input can be

2575      * interpreted as a {@code BigInteger} in the default radix using the

2576      * {@link #nextBigInteger} method. The scanner does not advance past any

2577      * input.

2578      *

2579      * @return true if and only if this scanner's next token is a valid

2580      *         {@code BigInteger}

2581      * @throws IllegalStateException if this scanner is closed

2582      */

2583     public boolean hasNextBigInteger() {

2584         return hasNextBigInteger(defaultRadix);

2585     }

2586 

2587     /**

2588      * Returns true if the next token in this scanner's input can be

2589      * interpreted as a {@code BigInteger} in the specified radix using

2590      * the {@link #nextBigInteger} method. The scanner does not advance past

2591      * any input.

2592      *

2593      * <p>If the radix is less than {@link Character#MIN_RADIX Character.MIN_RADIX}

2594      * or greater than {@link Character#MAX_RADIX Character.MAX_RADIX}, then an

2595      * {@code IllegalArgumentException} is thrown.

2596      *

2597      * @param radix the radix used to interpret the token as an integer

2598      * @return true if and only if this scanner's next token is a valid

2599      *         {@code BigInteger}

2600      * @throws IllegalStateException if this scanner is closed

2601      * @throws IllegalArgumentException if the radix is out of range

2602      */

2603     public boolean hasNextBigInteger(int radix) {

2604         setRadix(radix);

2605         boolean result = hasNext(integerPattern());

2606         if (result) { // Cache it

2607             try {

2608                 String s = (matcher.group(SIMPLE_GROUP_INDEX) == null) ?

2609                     processIntegerToken(hasNextResult) :

2610                     hasNextResult;

2611                 typeCache = new BigInteger(s, radix);

2612             } catch (NumberFormatException nfe) {

2613                 result = false;

2614             }

2615         }

2616         return result;

2617     }

2618 

2619     /**

2620      * Scans the next token of the input as a {@link java.math.BigInteger

2621      * BigInteger}.

2622      *

2623      * <p> An invocation of this method of the form

2624      * {@code nextBigInteger()} behaves in exactly the same way as the

2625      * invocation {@code nextBigInteger(radix)}, where {@code radix}

2626      * is the default radix of this scanner.

2627      *

2628      * @return the {@code BigInteger} scanned from the input

2629      * @throws InputMismatchException

2630      *         if the next token does not match the <i>Integer</i>

2631      *         regular expression, or is out of range

2632      * @throws NoSuchElementException if the input is exhausted

2633      * @throws IllegalStateException if this scanner is closed

2634      */

2635     public BigInteger nextBigInteger() {

2636         return nextBigInteger(defaultRadix);

2637     }

2638 

2639     /**

2640      * Scans the next token of the input as a {@link java.math.BigInteger

2641      * BigInteger}.

2642      *

2643      * <p> If the next token matches the <a

2644      * href="#Integer-regex"><i>Integer</i></a> regular expression defined

2645      * above then the token is converted into a {@code BigInteger} value as if

2646      * by removing all group separators, mapping non-ASCII digits into ASCII

2647      * digits via the {@link Character#digit Character.digit}, and passing the

2648      * resulting string to the {@link

2649      * java.math.BigInteger#BigInteger(java.lang.String, int)

2650      * BigInteger(String, int)} constructor with the specified radix.

2651      *

2652      * <p>If the radix is less than {@link Character#MIN_RADIX Character.MIN_RADIX}

2653      * or greater than {@link Character#MAX_RADIX Character.MAX_RADIX}, then an

2654      * {@code IllegalArgumentException} is thrown.

2655      *

2656      * @param radix the radix used to interpret the token

2657      * @return the {@code BigInteger} scanned from the input

2658      * @throws InputMismatchException

2659      *         if the next token does not match the <i>Integer</i>

2660      *         regular expression, or is out of range

2661      * @throws NoSuchElementException if the input is exhausted

2662      * @throws IllegalStateException if this scanner is closed

2663      * @throws IllegalArgumentException if the radix is out of range

2664      */

2665     public BigInteger nextBigInteger(int radix) {

2666         // Check cached result

2667         if ((typeCache != null) && (typeCache instanceof BigInteger)

2668             && this.radix == radix) {

2669             BigInteger val = (BigInteger)typeCache;

2670             useTypeCache();

2671             return val;

2672         }

2673         setRadix(radix);

2674         clearCaches();

2675         // Search for next int

2676         try {

2677             String s = next(integerPattern());

2678             if (matcher.group(SIMPLE_GROUP_INDEX) == null)

2679                 s = processIntegerToken(s);

2680             return new BigInteger(s, radix);

2681         } catch (NumberFormatException nfe) {

2682             position = matcher.start(); // don't skip bad token

2683             throw new InputMismatchException(nfe.getMessage());

2684         }

2685     }

2686 

2687     /**

2688      * Returns true if the next token in this scanner's input can be

2689      * interpreted as a {@code BigDecimal} using the

2690      * {@link #nextBigDecimal} method. The scanner does not advance past any

2691      * input.

2692      *

2693      * @return true if and only if this scanner's next token is a valid

2694      *         {@code BigDecimal}

2695      * @throws IllegalStateException if this scanner is closed

2696      */

2697     public boolean hasNextBigDecimal() {

2698         setRadix(10);

2699         boolean result = hasNext(decimalPattern());

2700         if (result) { // Cache it

2701             try {

2702                 String s = processFloatToken(hasNextResult);

2703                 typeCache = new BigDecimal(s);

2704             } catch (NumberFormatException nfe) {

2705                 result = false;

2706             }

2707         }

2708         return result;

2709     }

2710 

2711     /**

2712      * Scans the next token of the input as a {@link java.math.BigDecimal

2713      * BigDecimal}.

2714      *

2715      * <p> If the next token matches the <a

2716      * href="#Decimal-regex"><i>Decimal</i></a> regular expression defined

2717      * above then the token is converted into a {@code BigDecimal} value as if

2718      * by removing all group separators, mapping non-ASCII digits into ASCII

2719      * digits via the {@link Character#digit Character.digit}, and passing the

2720      * resulting string to the {@link

2721      * java.math.BigDecimal#BigDecimal(java.lang.String) BigDecimal(String)}

2722      * constructor.

2723      *

2724      * @return the {@code BigDecimal} scanned from the input

2725      * @throws InputMismatchException

2726      *         if the next token does not match the <i>Decimal</i>

2727      *         regular expression, or is out of range

2728      * @throws NoSuchElementException if the input is exhausted

2729      * @throws IllegalStateException if this scanner is closed

2730      */

2731     public BigDecimal nextBigDecimal() {

2732         // Check cached result

2733         if ((typeCache != null) && (typeCache instanceof BigDecimal)) {

2734             BigDecimal val = (BigDecimal)typeCache;

2735             useTypeCache();

2736             return val;

2737         }

2738         setRadix(10);

2739         clearCaches();

2740         // Search for next float

2741         try {

2742             String s = processFloatToken(next(decimalPattern()));

2743             return new BigDecimal(s);

2744         } catch (NumberFormatException nfe) {

2745             position = matcher.start(); // don't skip bad token

2746             throw new InputMismatchException(nfe.getMessage());

2747         }

2748     }

2749 

2750     /**

2751      * Resets this scanner.

2752      *

2753      * <p> Resetting a scanner discards all of its explicit state

2754      * information which may have been changed by invocations of

2755      * {@link #useDelimiter useDelimiter()},

2756      * {@link #useLocale useLocale()}, or

2757      * {@link #useRadix useRadix()}.

2758      *

2759      * <p> An invocation of this method of the form

2760      * {@code scanner.reset()} behaves in exactly the same way as the

2761      * invocation

2762      *

2763      * <blockquote><pre>{@code

2764      *   scanner.useDelimiter("\\p{javaWhitespace}+")

2765      *          .useLocale(Locale.getDefault(Locale.Category.FORMAT))

2766      *          .useRadix(10);

2767      * }</pre></blockquote>

2768      *

2769      * @return this scanner

2770      *

2771      * @since 1.6

2772      */

2773     public Scanner reset() {

2774         delimPattern = WHITESPACE_PATTERN;

2775         useLocale(Locale.getDefault(Locale.Category.FORMAT));

2776         useRadix(10);

2777         clearCaches();

2778         modCount++;

2779         return this;

2780     }

2781 

2782     /**

2783      * Returns a stream of delimiter-separated tokens from this scanner. The

2784      * stream contains the same tokens that would be returned, starting from

2785      * this scanner's current state, by calling the {@link #next} method

2786      * repeatedly until the {@link #hasNext} method returns false.

2787      *

2788      * <p>The resulting stream is sequential and ordered. All stream elements are

2789      * non-null.

2790      *

2791      * <p>Scanning starts upon initiation of the terminal stream operation, using the

2792      * current state of this scanner. Subsequent calls to any methods on this scanner

2793      * other than {@link #close} and {@link #ioException} may return undefined results

2794      * or may cause undefined effects on the returned stream. The returned stream's source

2795      * {@code Spliterator} is <em>fail-fast</em> and will, on a best-effort basis, throw a

2796      * {@link java.util.ConcurrentModificationException} if any such calls are detected

2797      * during stream pipeline execution.

2798      *

2799      * <p>After stream pipeline execution completes, this scanner is left in an indeterminate

2800      * state and cannot be reused.

2801      *

2802      * <p>If this scanner contains a resource that must be released, this scanner

2803      * should be closed, either by calling its {@link #close} method, or by

2804      * closing the returned stream. Closing the stream will close the underlying scanner.

2805      * {@code IllegalStateException} is thrown if the scanner has been closed when this

2806      * method is called, or if this scanner is closed during stream pipeline execution.

2807      *

2808      * <p>This method might block waiting for more input.

2809      *

2810      * @apiNote

2811      * For example, the following code will create a list of

2812      * comma-delimited tokens from a string:

2813      *

2814      * <pre>{@code

2815      * List<String> result = new Scanner("abc,def,,ghi")

2816      *     .useDelimiter(",")

2817      *     .tokens()

2818      *     .collect(Collectors.toList());

2819      * }</pre>

2820      *

2821      * <p>The resulting list would contain {@code "abc"}, {@code "def"},

2822      * the empty string, and {@code "ghi"}.

2823      *

2824      * @return a sequential stream of token strings

2825      * @throws IllegalStateException if this scanner is closed

2826      * @since 9

2827      */

2828     public Stream<String> tokens() {

2829         ensureOpen();

2830         Stream<String> stream = StreamSupport.stream(new TokenSpliterator(), false);

2831         return stream.onClose(this::close);

2832     }

2833 

2834     class TokenSpliterator extends Spliterators.AbstractSpliterator<String> {

2835         int expectedCount = -1;

2836 

2837         TokenSpliterator() {

2838             super(Long.MAX_VALUE,

2839                   Spliterator.IMMUTABLE | Spliterator.NONNULL | Spliterator.ORDERED);

2840         }

2841 

2842         @Override

2843         public boolean tryAdvance(Consumer<? super String> cons) {

2844             if (expectedCount >= 0 && expectedCount != modCount) {

2845                 throw new ConcurrentModificationException();

2846             }

2847 

2848             if (hasNext()) {

2849                 String token = next();

2850                 expectedCount = modCount;

2851                 cons.accept(token);

2852                 if (expectedCount != modCount) {

2853                     throw new ConcurrentModificationException();

2854                 }

2855                 return true;

2856             } else {

2857                 expectedCount = modCount;

2858                 return false;

2859             }

2860         }

2861     }

2862 

2863     /**

2864      * Returns a stream of match results from this scanner. The stream

2865      * contains the same results in the same order that would be returned by

2866      * calling {@code findWithinHorizon(pattern, 0)} and then {@link #match}

2867      * successively as long as {@link #findWithinHorizon findWithinHorizon()}

2868      * finds matches.

2869      *

2870      * <p>The resulting stream is sequential and ordered. All stream elements are

2871      * non-null.

2872      *

2873      * <p>Scanning starts upon initiation of the terminal stream operation, using the

2874      * current state of this scanner. Subsequent calls to any methods on this scanner

2875      * other than {@link #close} and {@link #ioException} may return undefined results

2876      * or may cause undefined effects on the returned stream. The returned stream's source

2877      * {@code Spliterator} is <em>fail-fast</em> and will, on a best-effort basis, throw a

2878      * {@link java.util.ConcurrentModificationException} if any such calls are detected

2879      * during stream pipeline execution.

2880      *

2881      * <p>After stream pipeline execution completes, this scanner is left in an indeterminate

2882      * state and cannot be reused.

2883      *

2884      * <p>If this scanner contains a resource that must be released, this scanner

2885      * should be closed, either by calling its {@link #close} method, or by

2886      * closing the returned stream. Closing the stream will close the underlying scanner.

2887      * {@code IllegalStateException} is thrown if the scanner has been closed when this

2888      * method is called, or if this scanner is closed during stream pipeline execution.

2889      *

2890      * <p>As with the {@link #findWithinHorizon findWithinHorizon()} methods, this method

2891      * might block waiting for additional input, and it might buffer an unbounded amount of

2892      * input searching for a match.

2893      *

2894      * @apiNote

2895      * For example, the following code will read a file and return a list

2896      * of all sequences of characters consisting of seven or more Latin capital

2897      * letters:

2898      *

2899      * <pre>{@code

2900      * try (Scanner sc = new Scanner(Path.of("input.txt"))) {

2901      *     Pattern pat = Pattern.compile("[A-Z]{7,}");

2902      *     List<String> capWords = sc.findAll(pat)

2903      *                               .map(MatchResult::group)

2904      *                               .collect(Collectors.toList());

2905      * }

2906      * }</pre>

2907      *

2908      * @param pattern the pattern to be matched

2909      * @return a sequential stream of match results

2910      * @throws NullPointerException if pattern is null

2911      * @throws IllegalStateException if this scanner is closed

2912      * @since 9

2913      */

2914     public Stream<MatchResult> findAll(Pattern pattern) {

2915         Objects.requireNonNull(pattern);

2916         ensureOpen();

2917         Stream<MatchResult> stream = StreamSupport.stream(new FindSpliterator(pattern), false);

2918         return stream.onClose(this::close);

2919     }

2920 

2921     /**

2922      * Returns a stream of match results that match the provided pattern string.

2923      * The effect is equivalent to the following code:

2924      *

2925      * <pre>{@code

2926      *     scanner.findAll(Pattern.compile(patString))

2927      * }</pre>

2928      *

2929      * @param patString the pattern string

2930      * @return a sequential stream of match results

2931      * @throws NullPointerException if patString is null

2932      * @throws IllegalStateException if this scanner is closed

2933      * @throws PatternSyntaxException if the regular expression's syntax is invalid

2934      * @since 9

2935      * @see java.util.regex.Pattern

2936      */

2937     public Stream<MatchResult> findAll(String patString) {

2938         Objects.requireNonNull(patString);

2939         ensureOpen();

2940         return findAll(patternCache.forName(patString));

2941     }

2942 

2943     class FindSpliterator extends Spliterators.AbstractSpliterator<MatchResult> {

2944         final Pattern pattern;

2945         int expectedCount = -1;

2946         private boolean advance = false; // true if we need to auto-advance

2947 

2948         FindSpliterator(Pattern pattern) {

2949             super(Long.MAX_VALUE,

2950                   Spliterator.IMMUTABLE | Spliterator.NONNULL | Spliterator.ORDERED);

2951             this.pattern = pattern;

2952         }

2953 

2954         @Override

2955         public boolean tryAdvance(Consumer<? super MatchResult> cons) {

2956             ensureOpen();

2957             if (expectedCount >= 0) {

2958                 if (expectedCount != modCount) {

2959                     throw new ConcurrentModificationException();

2960                 }

2961             } else {

2962                 // init

2963                 matchValid = false;

2964                 matcher.usePattern(pattern);

2965                 expectedCount = modCount;

2966             }

2967 

2968             while (true) {

2969                 // assert expectedCount == modCount

2970                 if (nextInBuffer()) { // doesn't increment modCount

2971                     cons.accept(matcher.toMatchResult());

2972                     if (expectedCount != modCount) {

2973                         throw new ConcurrentModificationException();

2974                     }

2975                     return true;

2976                 }

2977                 if (needInput)

2978                     readInput(); // doesn't increment modCount

2979                 else

2980                     return false; // reached end of input

2981             }

2982         }

2983 

2984         // reimplementation of findPatternInBuffer with auto-advance on zero-length matches

2985         private boolean nextInBuffer() {

2986             if (advance) {

2987                 if (position + 1 > buf.limit()) {

2988                     if (!sourceClosed)

2989                         needInput = true;

2990                     return false;

2991                 }

2992                 position++;

2993                 advance = false;

2994             }

2995             matcher.region(position, buf.limit());

2996             if (matcher.find() && (!matcher.hitEnd() || sourceClosed)) {

2997                  // Did not hit end, or hit real end

2998                  position = matcher.end();

2999                  advance = matcher.start() == position;

3000                  return true;

3001             }

3002             if (!sourceClosed)

3003                 needInput = true;

3004             return false;

3005         }

3006     }

3007 

3008     /** Small LRU cache of Patterns. */

3009     private static class PatternLRUCache {

3010 

3011         private Pattern[] oa = null;

3012         private final int size;

3013 

3014         PatternLRUCache(int size) {

3015             this.size = size;

3016         }

3017 

3018         boolean hasName(Pattern p, String s) {

3019             return p.pattern().equals(s);

3020         }

3021 

3022         void moveToFront(Object[] oa, int i) {

3023             Object ob = oa[i];

3024             for (int j = i; j > 0; j--)

3025                 oa[j] = oa[j - 1];

3026             oa[0] = ob;

3027         }

3028 

3029         Pattern forName(String name) {

3030             if (oa == null) {

3031                 Pattern[] temp = new Pattern[size];

3032                 oa = temp;

3033             } else {

3034                 for (int i = 0; i < oa.length; i++) {

3035                     Pattern ob = oa[i];

3036                     if (ob == null)

3037                         continue;

3038                     if (hasName(ob, name)) {

3039                         if (i > 0)

3040                             moveToFront(oa, i);

3041                         return ob;

3042                     }

3043                 }

3044             }

3045 

3046             // Create a new object

3047             Pattern ob = Pattern.compile(name);

3048             oa[oa.length - 1] = ob;

3049             moveToFront(oa, oa.length - 1);

3050             return ob;

3051         }

3052     }

3053 }

3054