luni/src/main/java/java/util/StringTokenizer.java - platform/libcore - Git at Google

 /*
  *  Licensed to the Apache Software Foundation (ASF) under one or more
  *  contributor license agreements.  See the NOTICE file distributed with
  *  this work for additional information regarding copyright ownership.
  *  The ASF licenses this file to You under the Apache License, Version 2.0
  *  (the "License"); you may not use this file except in compliance with
  *  the License.  You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  *  Unless required by applicable law or agreed to in writing, software
  *  distributed under the License is distributed on an "AS IS" BASIS,
  *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  *  See the License for the specific language governing permissions and
  *  limitations under the License.
  */

 package java.util;

 /**
  * The {@code StringTokenizer} class allows an application to break a string
  * into tokens by performing code point comparison. The {@code StringTokenizer}
  * methods do not distinguish among identifiers, numbers, and quoted strings,
  * nor do they recognize and skip comments.
  * <p>
  * The set of delimiters (the codepoints that separate tokens) may be specified
  * either at creation time or on a per-token basis.
  * <p>
  * An instance of {@code StringTokenizer} behaves in one of three ways,
  * depending on whether it was created with the {@code returnDelimiters} flag
  * having the value {@code true} or {@code false}:
  * <ul>
  * <li>If returnDelims is {@code false}, delimiter code points serve to separate
  * tokens. A token is a maximal sequence of consecutive code points that are not
  * delimiters.
  * <li>If returnDelims is {@code true}, delimiter code points are themselves
  * considered to be tokens. In this case a token will be received for each
  * delimiter code point.
  * </ul>
  * <p>
  * A token is thus either one delimiter code point, or a maximal sequence of
  * consecutive code points that are not delimiters.
  * <p>
  * A {@code StringTokenizer} object internally maintains a current position
  * within the string to be tokenized. Some operations advance this current
  * position past the code point processed.
  * <p>
  * A token is returned by taking a substring of the string that was used to
  * create the {@code StringTokenizer} object.
  * <p>
  * Here's an example of the use of the default delimiter {@code StringTokenizer}
  * : <blockquote>
  *
  * <pre>
  * StringTokenizer st = new StringTokenizer(&quot;this is a test&quot;);
  * while (st.hasMoreTokens()) {
  *     println(st.nextToken());
  * }
  * </pre>
  *
  * </blockquote>
  * <p>
  * This prints the following output: <blockquote>
  *
  * <pre>
  *     this
  *     is
  *     a
  *     test
  * </pre>
  *
  * </blockquote>
  * <p>
  * Here's an example of how to use a {@code StringTokenizer} with a user
  * specified delimiter: <blockquote>
  *
  * <pre>
  * StringTokenizer st = new StringTokenizer(
  *         &quot;this is a test with supplementary characters \ud800\ud800\udc00\udc00&quot;,
  *         &quot; \ud800\udc00&quot;);
  * while (st.hasMoreTokens()) {
  *     println(st.nextToken());
  * }
  * </pre>
  *
  * </blockquote>
  * <p>
  * This prints the following output: <blockquote>
  *
  * <pre>
  *     this
  *     is
  *     a
  *     test
  *     with
  *     supplementary
  *     characters
  *     \ud800
  *     \udc00
  * </pre>
  *
  * </blockquote>
  */
 public class StringTokenizer implements Enumeration<Object> {

     private String string;

     private String delimiters;

     private boolean returnDelimiters;

     private int position;

     /**
      * Constructs a new {@code StringTokenizer} for the parameter string using
      * whitespace as the delimiter. The {@code returnDelimiters} flag is set to
      * {@code false}.
      *
      * @param string
      *            the string to be tokenized.
      */
     public StringTokenizer(String string) {
         this(string, " \t\n\r\f", false);
     }

     /**
      * Constructs a new {@code StringTokenizer} for the parameter string using
      * the specified delimiters. The {@code returnDelimiters} flag is set to
      * {@code false}. If {@code delimiters} is {@code null}, this constructor
      * doesn't throw an {@code Exception}, but later calls to some methods might
      * throw a {@code NullPointerException}.
      *
      * @param string
      *            the string to be tokenized.
      * @param delimiters
      *            the delimiters to use.
      */
     public StringTokenizer(String string, String delimiters) {
         this(string, delimiters, false);
     }

     /**
      * Constructs a new {@code StringTokenizer} for the parameter string using
      * the specified delimiters, returning the delimiters as tokens if the
      * parameter {@code returnDelimiters} is {@code true}. If {@code delimiters}
      * is null this constructor doesn't throw an {@code Exception}, but later
      * calls to some methods might throw a {@code NullPointerException}.
      *
      * @param string
      *            the string to be tokenized.
      * @param delimiters
      *            the delimiters to use.
      * @param returnDelimiters
      *            {@code true} to return each delimiter as a token.
      */
     public StringTokenizer(String string, String delimiters,
             boolean returnDelimiters) {
         if (string != null) {
             this.string = string;
             this.delimiters = delimiters;
             this.returnDelimiters = returnDelimiters;
             this.position = 0;
         } else
             throw new NullPointerException();
     }

     /**
      * Returns the number of unprocessed tokens remaining in the string.
      *
      * @return number of tokens that can be retreived before an {@code
      *         Exception} will result from a call to {@code nextToken()}.
      */
     public int countTokens() {
         int count = 0;
         boolean inToken = false;
         for (int i = position, length = string.length(); i < length; i++) {
             if (delimiters.indexOf(string.charAt(i), 0) >= 0) {
                 if (returnDelimiters)
                     count++;
                 if (inToken) {
                     count++;
                     inToken = false;
                 }
             } else {
                 inToken = true;
             }
         }
         if (inToken)
             count++;
         return count;
     }

     /**
      * Returns {@code true} if unprocessed tokens remain. This method is
      * implemented in order to satisfy the {@code Enumeration} interface.
      *
      * @return {@code true} if unprocessed tokens remain.
      */
     public boolean hasMoreElements() {
         return hasMoreTokens();
     }

     /**
      * Returns {@code true} if unprocessed tokens remain.
      *
      * @return {@code true} if unprocessed tokens remain.
      */
     public boolean hasMoreTokens() {
         if (delimiters == null) {
             throw new NullPointerException();
         }
         int length = string.length();
         if (position < length) {
             if (returnDelimiters)
                 return true; // there is at least one character and even if
             // it is a delimiter it is a token

             // otherwise find a character which is not a delimiter
             for (int i = position; i < length; i++)
                 if (delimiters.indexOf(string.charAt(i), 0) == -1)
                     return true;
         }
         return false;
     }

     /**
      * Returns the next token in the string as an {@code Object}. This method is
      * implemented in order to satisfy the {@code Enumeration} interface.
      *
      * @return next token in the string as an {@code Object}
      * @throws NoSuchElementException
      *                if no tokens remain.
      */
     public Object nextElement() {
         return nextToken();
     }

     /**
      * Returns the next token in the string as a {@code String}.
      *
      * @return next token in the string as a {@code String}.
      * @throws NoSuchElementException
      *                if no tokens remain.
      */
     public String nextToken() {
         if (delimiters == null) {
             throw new NullPointerException();
         }
         int i = position;
         int length = string.length();

         if (i < length) {
             if (returnDelimiters) {
                 if (delimiters.indexOf(string.charAt(position), 0) >= 0)
                     return String.valueOf(string.charAt(position++));
                 for (position++; position < length; position++)
                     if (delimiters.indexOf(string.charAt(position), 0) >= 0)
                         return string.substring(i, position);
                 return string.substring(i);
             }

             while (i < length && delimiters.indexOf(string.charAt(i), 0) >= 0)
                 i++;
             position = i;
             if (i < length) {
                 for (position++; position < length; position++)
                     if (delimiters.indexOf(string.charAt(position), 0) >= 0)
                         return string.substring(i, position);
                 return string.substring(i);
             }
         }
         throw new NoSuchElementException();
     }

     /**
      * Returns the next token in the string as a {@code String}. The delimiters
      * used are changed to the specified delimiters.
      *
      * @param delims
      *            the new delimiters to use.
      * @return next token in the string as a {@code String}.
      * @throws NoSuchElementException
      *                if no tokens remain.
      */
     public String nextToken(String delims) {
         this.delimiters = delims;
         return nextToken();
     }
 }
	/*
	* Licensed to the Apache Software Foundation (ASF) under one or more
	* contributor license agreements. See the NOTICE file distributed with
	* this work for additional information regarding copyright ownership.
	* The ASF licenses this file to You under the Apache License, Version 2.0
	* (the "License"); you may not use this file except in compliance with
	* the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	package java.util;

	/**
	* The {@code StringTokenizer} class allows an application to break a string
	* into tokens by performing code point comparison. The {@code StringTokenizer}
	* methods do not distinguish among identifiers, numbers, and quoted strings,
	* nor do they recognize and skip comments.
	* <p>
	* The set of delimiters (the codepoints that separate tokens) may be specified
	* either at creation time or on a per-token basis.
	* <p>
	* An instance of {@code StringTokenizer} behaves in one of three ways,
	* depending on whether it was created with the {@code returnDelimiters} flag
	* having the value {@code true} or {@code false}:
	* <ul>
	* <li>If returnDelims is {@code false}, delimiter code points serve to separate
	* tokens. A token is a maximal sequence of consecutive code points that are not
	* delimiters.
	* <li>If returnDelims is {@code true}, delimiter code points are themselves
	* considered to be tokens. In this case a token will be received for each
	* delimiter code point.
	* </ul>
	* <p>
	* A token is thus either one delimiter code point, or a maximal sequence of
	* consecutive code points that are not delimiters.
	* <p>
	* A {@code StringTokenizer} object internally maintains a current position
	* within the string to be tokenized. Some operations advance this current
	* position past the code point processed.
	* <p>
	* A token is returned by taking a substring of the string that was used to
	* create the {@code StringTokenizer} object.
	* <p>
	* Here's an example of the use of the default delimiter {@code StringTokenizer}
	* : <blockquote>
	*
	* <pre>
	* StringTokenizer st = new StringTokenizer("this is a test");
	* while (st.hasMoreTokens()) {
	* println(st.nextToken());
	* }
	* </pre>
	*
	* </blockquote>
	* <p>
	* This prints the following output: <blockquote>
	*
	* <pre>
	* this
	* is
	* a
	* test
	* </pre>
	*
	* </blockquote>
	* <p>
	* Here's an example of how to use a {@code StringTokenizer} with a user
	* specified delimiter: <blockquote>
	*
	* <pre>
	* StringTokenizer st = new StringTokenizer(
	* "this is a test with supplementary characters \ud800\ud800\udc00\udc00",
	* " \ud800\udc00");
	* while (st.hasMoreTokens()) {
	* println(st.nextToken());
	* }
	* </pre>
	*
	* </blockquote>
	* <p>
	* This prints the following output: <blockquote>
	*
	* <pre>
	* this
	* is
	* a
	* test
	* with
	* supplementary
	* characters
	* \ud800
	* \udc00
	* </pre>
	*
	* </blockquote>
	*/
	public class StringTokenizer implements Enumeration<Object> {

	private String string;

	private String delimiters;

	private boolean returnDelimiters;

	private int position;

	/**
	* Constructs a new {@code StringTokenizer} for the parameter string using
	* whitespace as the delimiter. The {@code returnDelimiters} flag is set to
	* {@code false}.
	*
	* @param string
	* the string to be tokenized.
	*/
	public StringTokenizer(String string) {
	this(string, " \t\n\r\f", false);
	}

	/**
	* Constructs a new {@code StringTokenizer} for the parameter string using
	* the specified delimiters. The {@code returnDelimiters} flag is set to
	* {@code false}. If {@code delimiters} is {@code null}, this constructor
	* doesn't throw an {@code Exception}, but later calls to some methods might
	* throw a {@code NullPointerException}.
	*
	* @param string
	* the string to be tokenized.
	* @param delimiters
	* the delimiters to use.
	*/
	public StringTokenizer(String string, String delimiters) {
	this(string, delimiters, false);
	}

	/**
	* Constructs a new {@code StringTokenizer} for the parameter string using
	* the specified delimiters, returning the delimiters as tokens if the
	* parameter {@code returnDelimiters} is {@code true}. If {@code delimiters}
	* is null this constructor doesn't throw an {@code Exception}, but later
	* calls to some methods might throw a {@code NullPointerException}.
	*
	* @param string
	* the string to be tokenized.
	* @param delimiters
	* the delimiters to use.
	* @param returnDelimiters
	* {@code true} to return each delimiter as a token.
	*/
	public StringTokenizer(String string, String delimiters,
	boolean returnDelimiters) {
	if (string != null) {
	this.string = string;
	this.delimiters = delimiters;
	this.returnDelimiters = returnDelimiters;
	this.position = 0;
	} else
	throw new NullPointerException();
	}

	/**
	* Returns the number of unprocessed tokens remaining in the string.
	*
	* @return number of tokens that can be retreived before an {@code
	* Exception} will result from a call to {@code nextToken()}.
	*/
	public int countTokens() {
	int count = 0;
	boolean inToken = false;
	for (int i = position, length = string.length(); i < length; i++) {
	if (delimiters.indexOf(string.charAt(i), 0) >= 0) {
	if (returnDelimiters)
	count++;
	if (inToken) {
	count++;
	inToken = false;
	}
	} else {
	inToken = true;
	}
	}
	if (inToken)
	count++;
	return count;
	}

	/**
	* Returns {@code true} if unprocessed tokens remain. This method is
	* implemented in order to satisfy the {@code Enumeration} interface.
	*
	* @return {@code true} if unprocessed tokens remain.
	*/
	public boolean hasMoreElements() {
	return hasMoreTokens();
	}

	/**
	* Returns {@code true} if unprocessed tokens remain.
	*
	* @return {@code true} if unprocessed tokens remain.
	*/
	public boolean hasMoreTokens() {
	if (delimiters == null) {
	throw new NullPointerException();
	}
	int length = string.length();
	if (position < length) {
	if (returnDelimiters)
	return true; // there is at least one character and even if
	// it is a delimiter it is a token

	// otherwise find a character which is not a delimiter
	for (int i = position; i < length; i++)
	if (delimiters.indexOf(string.charAt(i), 0) == -1)
	return true;
	}
	return false;
	}

	/**
	* Returns the next token in the string as an {@code Object}. This method is
	* implemented in order to satisfy the {@code Enumeration} interface.
	*
	* @return next token in the string as an {@code Object}
	* @throws NoSuchElementException
	* if no tokens remain.
	*/
	public Object nextElement() {
	return nextToken();
	}

	/**
	* Returns the next token in the string as a {@code String}.
	*
	* @return next token in the string as a {@code String}.
	* @throws NoSuchElementException
	* if no tokens remain.
	*/
	public String nextToken() {
	if (delimiters == null) {
	throw new NullPointerException();
	}
	int i = position;
	int length = string.length();

	if (i < length) {
	if (returnDelimiters) {
	if (delimiters.indexOf(string.charAt(position), 0) >= 0)
	return String.valueOf(string.charAt(position++));
	for (position++; position < length; position++)
	if (delimiters.indexOf(string.charAt(position), 0) >= 0)
	return string.substring(i, position);
	return string.substring(i);
	}

	while (i < length && delimiters.indexOf(string.charAt(i), 0) >= 0)
	i++;
	position = i;
	if (i < length) {
	for (position++; position < length; position++)
	if (delimiters.indexOf(string.charAt(position), 0) >= 0)
	return string.substring(i, position);
	return string.substring(i);
	}
	}
	throw new NoSuchElementException();
	}

	/**
	* Returns the next token in the string as a {@code String}. The delimiters
	* used are changed to the specified delimiters.
	*
	* @param delims
	* the new delimiters to use.
	* @return next token in the string as a {@code String}.
	* @throws NoSuchElementException
	* if no tokens remain.
	*/
	public String nextToken(String delims) {
	this.delimiters = delims;
	return nextToken();
	}
	}