1 files changed, 204 insertions, 127 deletions
diff --git a/libjava/java/util/StringTokenizer.java b/libjava/java/util/StringTokenizer.java
index 1686a03..ee29940 100644
--- a/libjava/java/util/StringTokenizer.java
+++ b/libjava/java/util/StringTokenizer.java
@@ -1,76 +1,236 @@
-/* Copyright (C) 1998, 1999  Free Software Foundation
+/* java.util.StringTokenizer
+   Copyright (C) 1998, 1999, 2001 Free Software Foundation, Inc.
 
-   This file is part of libgcj.
+This file is part of GNU Classpath.
+
+GNU Classpath is free software; you can redistribute it and/or modify
+it under the terms of the GNU General Public License as published by
+the Free Software Foundation; either version 2, or (at your option)
+any later version.
+
+GNU Classpath is distributed in the hope that it will be useful, but
+WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with GNU Classpath; see the file COPYING.  If not, write to the
+Free Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
+02111-1307 USA.
+
+As a special exception, if you link this library with other files to
+produce an executable, this library does not by itself cause the
+resulting executable to be covered by the GNU General Public License.
+This exception does not however invalidate any other reasons why the
+executable file might be covered by the GNU General Public License. */
 
-This software is copyrighted work licensed under the terms of the
-Libgcj License.  Please consult the file "LIBGCJ_LICENSE" for
-details.  */
 
 package java.util;
 
 /**
+ * This class splits a string into tokens.  The caller can set on which 
+ * delimiters the string should be split and if the delimiters should be
+ * returned.
+ *
+ * You may change the delimiter set on the fly by calling
+ * nextToken(String).  But the semantic is quite difficult; it even
+ * depends on calling <code>hasMoreTokens()</code>.  You should call
+ * <code>hasMoreTokens()</code> before, otherwise the old delimiters
+ * after the last token are returned.
+ *
+ * If you want to get the delimiters, you have to use the three argument
+ * constructor.  The delimiters are returned as token consisting of a
+ * single character.  
+ *
+ * @author Jochen Hoenicke
  * @author Warren Levy <warrenl@cygnus.com>
- * @date August 24, 1998.
- */
-/* Written using "Java Class Libraries", 2nd edition, ISBN 0-201-31002-3
- * "The Java Language Specification", ISBN 0-201-63451-1
- * plus online API docs for JDK 1.2 beta from http://www.javasoft.com.
- * Status:  Believed complete and correct
  */
-
 public class StringTokenizer implements Enumeration
 {
-  /* String to be parsed */
-  private String inputString;
+  /**
+   * The position in the str, where we currently are.
+   */
+  private int pos;
+  /**
+   * The string that should be split into tokens.
+   */
+  private String str;
+  /**
+   * The string containing the delimiter characters.
+   */
+  private String delim;
+  /**
+   * Tells, if we should return the delimiters.
+   */
+  private boolean retDelims;
+
+  /*{ 
+     invariant {
+     pos >= 0 :: "position is negative";
+     pos <= str.length() :: "position is out of string";
+     str != null :: "String is null";
+     delim != null :: "Delimiters are null";
+     }
+     } */
+
+  /**
+   * Creates a new StringTokenizer for the string <code>str</code>,
+   * that should split on the default delimiter set (space, tap,
+   * newline, return and formfeed), and which doesn't return the
+   * delimiters.
+   * @param str The string to split.
+   */
+  public StringTokenizer(String str)
+    /*{ require { str != null :: "str must not be null"; } } */
+  {
+    this(str, " \t\n\r\f", false);
+  }
 
-  /* String to be parsed put into a char array for efficient access */
-  private char[] chArray;
+  /**
+   * Create a new StringTokenizer, that splits the given string on 
+   * the given delimiter characters.  It doesn't return the delimiter
+   * characters.
+   *
+   * @param str The string to split.
+   * @param delim A string containing all delimiter characters.
+   */
+  public StringTokenizer(String str, String delim)
+    /*{ require { str != null :: "str must not be null";
+       delim != null :: "delim must not be null"; } } */
+  {
+    this(str, delim, false);
+  }
 
-  /* Set of delimiter characters for separating tokens */
-  private String delimiters;
+  /**
+   * Create a new StringTokenizer, that splits the given string on
+   * the given delimiter characters.  If you set
+   * <code>returnDelims</code> to <code>true</code>, the delimiter
+   * characters are returned as tokens of their own.  The delimiter
+   * tokens always consist of a single character.
+   *
+   * @param str The string to split.
+   * @param delim A string containing all delimiter characters.
+   * @param returnDelims Tells, if you want to get the delimiters.
+   */
+  public StringTokenizer(String str, String delim, boolean returnDelims)
+    /*{ require { str != null :: "str must not be null";
+       delim != null :: "delim must not be null"; } } */
+  {
+    this.str = str;
+    this.delim = delim;
+    this.retDelims = returnDelims;
+    this.pos = 0;
+  }
 
-  /* Whether delimiters in this instance are treated as tokens themselves */
-  private boolean returnDelimiters;
+  /**
+   * Tells if there are more tokens.
+   * @return True, if the next call of nextToken() succeeds, false otherwise.
+   */
+  public boolean hasMoreTokens()
+  {
+    if (!retDelims)
+      {
+	while (pos < str.length() && delim.indexOf(str.charAt(pos)) > -1)
+	  {
+	    pos++;
+	  }
+      }
+    return pos < str.length();
+  }
 
-  /* Index into the input string to start parsing for the next token */
-  private int inputStringIndex;
+  /**
+   * Returns the nextToken, changing the delimiter set to the given
+   * <code>delim</code>.  The change of the delimiter set is
+   * permanent, ie. the next call of nextToken(), uses the same
+   * delimiter set.
+   * @param delim a string containing the new delimiter characters.
+   * @return the next token with respect to the new delimiter characters.
+   * @exception NoSuchElementException if there are no more tokens.
+   */
+  public String nextToken(String delim) throws NoSuchElementException
+    /*{ require { hasMoreTokens() :: "no more Tokens available";
+       ensure { $return != null && $return.length() > 0; } } */
+  {
+    this.delim = delim;
+    return nextToken();
+  }
 
-  public StringTokenizer(String str)
+  /**
+   * Returns the nextToken of the string.
+   * @param delim a string containing the new delimiter characters.
+   * @return the next token with respect to the new delimiter characters.
+   * @exception NoSuchElementException if there are no more tokens.
+   */
+  public String nextToken() throws NoSuchElementException
+    /*{ require { hasMoreTokens() :: "no more Tokens available";
+       ensure { $return != null && $return.length() > 0; } } */
   {
-    this(str, " \t\n\r", false);
+    if (pos < str.length() && delim.indexOf(str.charAt(pos)) > -1)
+      {
+	if (retDelims)
+	  return str.substring(pos, ++pos);
+
+	while (++pos < str.length() && delim.indexOf(str.charAt(pos)) > -1)
+	  {
+	    /* empty */
+	  }
+      }
+    if (pos < str.length())
+      {
+	int start = pos;
+	while (++pos < str.length() && delim.indexOf(str.charAt(pos)) == -1)
+	  {
+	    /* empty */
+	  }
+	return str.substring(start, pos);
+      }
+    throw new NoSuchElementException();
   }
 
-  public StringTokenizer(String str, String delims)
+  /**
+   * This does the same as hasMoreTokens. This is the
+   * <code>Enumeration</code interface method.
+   * @return True, if the next call of nextElement() succeeds, false
+   * otherwise.  
+   * @see #hasMoreTokens
+   */
+  public boolean hasMoreElements()
   {
-    this(str, delims, false);
+    return hasMoreTokens();
   }
 
-  public StringTokenizer(String str, String delims, boolean retDelim)
+  /**
+   * This does the same as nextTokens. This is the
+   * <code>Enumeration</code interface method.
+   * @return the next token with respect to the new delimiter characters.
+   * @exception NoSuchElementException if there are no more tokens.
+   * @see #nextToken
+   */
+  public Object nextElement() throws NoSuchElementException
   {
-    inputString = str;
-    delimiters = delims;
-    returnDelimiters = retDelim;
-    inputStringIndex = 0;
-
-    // Work on a copy of the remaining string in a char array
-    // to gain efficiency of using primitives
-    chArray = new char[inputString.length()];
-    inputString.getChars(0, inputString.length(), chArray, 0);
+    return nextToken();
   }
 
+  /**
+   * This counts the number of remaining tokens in the string, with
+   * respect to the current delimiter set.
+   * @return the number of times <code>nextTokens()</code> will
+   * succeed.  
+   * @see #nextToken
+   */
   public int countTokens()
   {
     int count = 0;
     int delimiterCount = 0;
     boolean tokenFound = false;		// Set when a non-delimiter is found
-    int offset = inputStringIndex;
+    int tmpPos = pos;
 
     // Note for efficiency, we count up the delimiters rather than check
-    // returnDelimiters every time we encounter one.  That way, we can
+    // retDelims every time we encounter one.  That way, we can
     // just do the conditional once at the end of the method
-    while (offset < chArray.length)
+    while (tmpPos < str.length())
       {
-	if (isDelimiter(chArray[offset++]))
+	if (delim.indexOf(str.charAt(tmpPos++)) > -1)
 	  {
 	    if (tokenFound)
 	      {
@@ -86,8 +246,9 @@ public class StringTokenizer implements Enumeration
 	    tokenFound = true;
 
 	    // Get to the end of the token
-	    while (offset < chArray.length && !isDelimiter(chArray[offset]))
-	      offset++;
+	    while (tmpPos < str.length()
+		   && delim.indexOf(str.charAt(tmpPos)) == -1)
+	      ++tmpPos;
 	  }
       }
 
@@ -96,90 +257,6 @@ public class StringTokenizer implements Enumeration
       count++;
 
     // if counting delmiters add them into the token count
-    return returnDelimiters ? count + delimiterCount : count;
-  }
-
-  public boolean hasMoreElements()
-  {
-    return hasMoreTokens();
-  }
-
-  public boolean hasMoreTokens()
-  {
-    int offset = inputStringIndex;
-
-    while (offset < chArray.length)
-      if (!isDelimiter(chArray[offset++]) || returnDelimiters)
-	{
-	  // update the current position with the start of the next token
-	  inputStringIndex = --offset;
-
-	  return true;
-	}
-
-    return false;
-  }
-
-  public Object nextElement()
-  {
-    return nextToken();
-  }
-
-  public String nextToken()
-  {
-    int offset = inputStringIndex;
-    int startSubstr = -1;
-
-    // Make sure we have more chars left to parse
-    // and then find the start of the next token
-    while (offset < chArray.length && startSubstr < 0)
-      {
-	// Find the start of the token; skipping initial delimiters
-	if (!isDelimiter(chArray[offset++]))
-	  startSubstr = offset - 1;
-	else if (returnDelimiters)
-	  {
-	    // The single char delimiter is treated as a token
-	    inputStringIndex = offset;		// update the current position
-
-	    return inputString.substring(offset - 1, inputStringIndex);
-	  }
-      }
-
-    // Now look for the end of the token
-    while (offset < chArray.length)
-      {
-	if (isDelimiter(chArray[offset++]))
-	  {
-	    // Found the end of token
-            inputStringIndex = offset - 1;	// update the current position
-
-            return inputString.substring(startSubstr, inputStringIndex);
-	  }
-      }
-
-    // Got to the end of the string without finding the start of a token
-    if (startSubstr < 0)
-      throw new NoSuchElementException();
-
-    // Got to the end of the string before a delimiter
-    inputStringIndex = offset;		// update the current position
-
-    return inputString.substring(startSubstr, inputStringIndex);
-  }
-
-  public String nextToken(String delims)
-  {
-    // First replace with new set of delimiters
-    delimiters = delims;
-
-    return nextToken();
-  }
-
-  // This private method could be inlined but the other methods are
-  // more readable this way, so we'll take the hit on efficiency.
-  private boolean isDelimiter(char ch)
-  {
-    return delimiters.indexOf(ch, 0) >= 0;
+    return retDelims ? count + delimiterCount : count;
   }
 }