Java 1.2 How-To

home *** CD-ROM | disk | FTP | other *** search

/ Java 1.2 How-To / JavaHowTo.iso / 3rdParty / jbuilder / unsupported / JDK1.2beta3 / SOURCE / SRC.ZIP / java / util / StringTokenizer.java < prev next >

Wrap

Java Source | 1998-03-20 | 9.0 KB | 272 lines

/* * @(#)StringTokenizer.java 1.19 98/03/18 * * Copyright 1994-1998 by Sun Microsystems, Inc., * 901 San Antonio Road, Palo Alto, California, 94303, U.S.A. * All rights reserved. * * This software is the confidential and proprietary information * of Sun Microsystems, Inc. ("Confidential Information"). You * shall not disclose such Confidential Information and shall use * it only in accordance with the terms of the license agreement * you entered into with Sun. */ package java.util; import java.lang.*; /** * The string tokenizer class allows an application to break a * string into tokens. The tokenization method is much simpler than * the one used by the <code>StreamTokenizer</code> class. The * <code>StringTokenizer</code> methods do not distinguish among * identifiers, numbers, and quoted strings, nor do they recognize * and skip comments. * * The set of delimiters (the characters that separate tokens) may * be specified either at creation time or on a per-token basis. * * An instance of <code>StringTokenizer</code> behaves in one of two * ways, depending on whether it was created with the * <code>returnTokens</code> flag having the value <code>true</code> * or <code>false</code>: * <ul> * <li>If the flag is <code>false</code>, delimiter characters serve to * separate tokens. A token is a maximal sequence of consecutive * characters that are not delimiters. * <li>If the flag is <code>true</code>, delimiter characters are themselves * considered to be tokens. A token is thus either one delimiter * character, or a maximal sequence of consecutive characters that are * not delimiters. * </ul> * A <tt>StringTokenizer</tt> object internally maintains a current * position within the string to be tokenized. Some operations advance this * current position past the characters processed. * A token is returned by taking a substring of the string that was used to * create the <tt>StringTokenizer</tt> object. * * The following is one example of the use of the tokenizer. The code: * <blockquote><pre> * StringTokenizer st = new StringTokenizer("this is a test"); * while (st.hasMoreTokens()) { * println(st.nextToken()); * } * </pre></blockquote> * * prints the following output: * <blockquote><pre> * this * is * a * test * </pre></blockquote> * * @author unascribed * @version 1.19, 03/18/98 * @see java.io.StreamTokenizer * @since JDK1.0 */ public class StringTokenizer implements Enumeration { private int currentPosition; private int maxPosition; private String str; private String delimiters; private boolean retTokens; /** * Constructs a string tokenizer for the specified string. All * characters in the <code>delim</code> argument are the delimiters * for separating tokens. * * If the <code>returnTokens</code> flag is <code>true</code>, then * the delimiter characters are also returned as tokens. Each * delimiter is returned as a string of length one. If the flag is * <code>false</code>, the delimiter characters are skipped and only * serve as separators between tokens. * * @param str a string to be parsed. * @param delim the delimiters. * @param returnTokens flag indicating whether to return the delimiters * as tokens. */ public StringTokenizer(String str, String delim, boolean returnTokens) { currentPosition = 0; this.str = str; maxPosition = str.length(); delimiters = delim; retTokens = returnTokens; } /** * Constructs a string tokenizer for the specified string. The * characters in the <code>delim</code> argument are the delimiters * for separating tokens. Delimiter characters themselves will not * be treated as tokens. * * @param str a string to be parsed. * @param delim the delimiters. */ public StringTokenizer(String str, String delim) { this(str, delim, false); } /** * Constructs a string tokenizer for the specified string. The * tokenizer uses the default delimiter set, which is * <code>"\t\n\r\f"</code>: the space character, the tab * character, the newline character, the carriage-return character, * and the form-feed character. Delimiter characters themselves will * not be treated as tokens. * * @param str a string to be parsed. */ public StringTokenizer(String str) { this(str, " \t\n\r\f", false); } /** * Skips delimiters. */ private void skipDelimiters() { while (!retTokens && (currentPosition < maxPosition) && (delimiters.indexOf(str.charAt(currentPosition)) >= 0)) { currentPosition++; } } /** * Tests if there are more tokens available from this tokenizer's string. * If this method returns <tt>true</tt>, then a subsequent call to * <tt>nextToken</tt> with no argument will successfully return a token. * * @return <code>true</code> if and only if there is at least one token * in the string after the current position; <code>false</code> * otherwise. */ public boolean hasMoreTokens() { skipDelimiters(); return (currentPosition < maxPosition); } /** * Returns the next token from this string tokenizer. * * @return the next token from this string tokenizer. * @exception NoSuchElementException if there are no more tokens in this * tokenizer's string. */ public String nextToken() { skipDelimiters(); if (currentPosition >= maxPosition) { throw new NoSuchElementException(); } int start = currentPosition; while ((currentPosition < maxPosition) && (delimiters.indexOf(str.charAt(currentPosition)) < 0)) { currentPosition++; } if (retTokens && (start == currentPosition) && (delimiters.indexOf(str.charAt(currentPosition)) >= 0)) { currentPosition++; } return str.substring(start, currentPosition); } /** * Returns the next token in this string tokenizer's string. First, * the set of characters considered to be delimiters by this * <tt>StringTokenizer</tt> object is changed to be the characters in * the string <tt>delim</tt>. Then the next token in the string * after the current position is returned. The current position is * advanced beyond the recognized token. The new delimiter set * remains the default after this call. * * @param delim the new delimiters. * @return the next token, after switching to the new delimiter set. * @exception NoSuchElementException if there are no more tokens in this * tokenizer's string. */ public String nextToken(String delim) { delimiters = delim; return nextToken(); } /** * Returns the same value as the <code>hasMoreTokens</code> * method. It exists so that this class can implement the * <code>Enumeration</code> interface. * * @return <code>true</code> if there are more tokens; * <code>false</code> otherwise. * @see java.util.Enumeration * @see java.util.StringTokenizer#hasMoreTokens() */ public boolean hasMoreElements() { return hasMoreTokens(); } /** * Returns the same value as the <code>nextToken</code> method, * except that its declared return value is <code>Object</code> rather than * <code>String</code>. It exists so that this class can implement the * <code>Enumeration</code> interface. * * @return the next token in the string. * @exception NoSuchElementException if there are no more tokens in this * tokenizer's string. * @see java.util.Enumeration * @see java.util.StringTokenizer#nextToken() */ public Object nextElement() { return nextToken(); } /** * Calculates the number of times that this tokenizer's * <code>nextToken</code> method can be called before it generates an * exception. The current position is not advanced. * * @return the number of tokens remaining in the string using the current * delimiter set. * @see java.util.StringTokenizer#nextToken() */ public int countTokens() { int count = 0; int currpos = currentPosition; while (currpos < maxPosition) { /* * This is just skipDelimiters(); but it does not affect * currentPosition. */ while (!retTokens && (currpos < maxPosition) && (delimiters.indexOf(str.charAt(currpos)) >= 0)) { currpos++; } if (currpos >= maxPosition) { break; } int start = currpos; while ((currpos < maxPosition) && (delimiters.indexOf(str.charAt(currpos)) < 0)) { currpos++; } if (retTokens && (start == currpos) && (delimiters.indexOf(str.charAt(currpos)) >= 0)) { currpos++; } count++; } return count; } }