Context Navigation

← Previous Change
Next Change →

HTMLStringTokenizer.java

Timestamp:

2003-05-27T15:40:47+12:00 (21 years ago)

Author:

mdewsnip

Message:

Fixed tabbing.

File:

1 edited

trunk/gli/src/org/greenstone/gatherer/util/HTMLStringTokenizer.java (modified) (1 diff)

Legend:

Unmodified
Added
Removed

trunk/gli/src/org/greenstone/gatherer/util/HTMLStringTokenizer.java

-              r4293
+              r4364
 /** This class functions much like a <strong>StringTokenizer</strong> in that it splits a long string into tokens; however, this tokenizer also recognizes HTML formatting tags and returns each tag as a single token. */
 public class HTMLStringTokenizer {
      /** The current position in the source string. */
      private int pos = 0;
      /** The current token, usually created by the last nextToken call. */
      private String current = null;
      /** The previous token. */
      private String previous = null;
      /** The string to be tokenized, including any HTML markup. */
      private String source = null;
      /** Constructor.
       * @param source The source <strong>String</strong> to be tokenized.
+    /** The current position in the source string. */
+    private int pos = 0;
+    /** The current token, usually created by the last nextToken call. */
+    private String current = null;
+    /** The previous token. */
+    private String previous = null;
+    /** The string to be tokenized, including any HTML markup. */
+    private String source = null;
+    /** Constructor.
+     * @param source The source <strong>String</strong> to be tokenized.
       */
      public HTMLStringTokenizer(String source) {
           this.source = source;
           // Parse the first token.
           parseToken();
+     }
      /** Determines if there are still tokens remaining unparsed in the source.
+    public HTMLStringTokenizer(String source) {
+    this.source = source;
+    // Parse the first token.
+    parseToken();
+    }
+    /** Determines if there are still tokens remaining unparsed in the source.
       * @return A <strong>boolean</strong> which is <i>true</i> if there are more tokens.
       */
      public boolean hasMoreTokens() {
           if(current != null && current.length() > 0) {
                 return true;
+          }
           return false;
+     }
      /** Determines if the token currently being returned by sameToken is a tag.
+    public boolean hasMoreTokens() {
+    if(current != null && current.length() > 0) {
+        return true;
+    }
+    return false;
+    }
+    /** Determines if the token currently being returned by sameToken is a tag.
       * @return A <strong>boolean</strong> indicating if the token is a tag.
       */
      public boolean isTag() {
           if(previous.startsWith("<") && previous.endsWith(">")) {
                 return true;
+          }
           return false;
+     }
      /** Retrieves the next token.
+    public boolean isTag() {
+    if(previous.startsWith("<") && previous.endsWith(">")) {
+        return true;
+    }
+    return false;
+    }
+    /** Retrieves the next token.
       * @return A <strong>String</strong> representing the token.
       */
      public String nextToken() {
           previous = current;
           // Get the next token.
           parseToken();
           // Return previous.
           return previous;
+     }
      /** Repeats the result of the last <i>nextToken()</i>.
+    public String nextToken() {
+    previous = current;
+    // Get the next token.
+    parseToken();
+    // Return previous.
+    return previous;
+    }
+    /** Repeats the result of the last <i>nextToken()</i>.
       * @return A <strong>String</strong> representing the token.
       */
      public String sameToken() {
           return previous;
+     }
      /** Parses the next token and stores it in current.
+    public String sameToken() {
+    return previous;
+    }
+    /** Parses the next token and stores it in current.
       */
      private void parseToken() {
           boolean found = false;
           boolean tag = false;
           boolean text = false;
           // Reset current
           current = "";
           // Parse away
           dumpWhiteSpace();
           while(pos < source.length() && !found) {
                 char c = (char)source.charAt(pos);
                 if(!tag && !text) {
                      if(c == '<') {
                           tag = true;
+                     }
                      else {
                           text = true;
+                     }
                      current = current + c;
+                }
+    private void parseToken() {
+    boolean found = false;
+    boolean tag = false;
+    boolean text = false;
+    // Reset current
+    current = "";
+    // Parse away
+    dumpWhiteSpace();
+    while(pos < source.length() && !found) {
+        char c = (char)source.charAt(pos);
+        if(!tag && !text) {
+        if(c == '<') {
+            tag = true;
+        }
+        else {
+            text = true;
+        }
+        current = current + c;
+        }
                 // Reading a tag. Watch only for '>'.
                 else if(tag) {
                      if(c == '>') {
                           found = true;
+                     }
                      current = current + c;
+                }
+        else if(tag) {
+        if(c == '>') {
+            found = true;
+        }
+        current = current + c;
+        }
                 // Reading text. Watch for ' ' and '<'. Rollback '<'.
                 else if(text) {
                      if(c == ' ') {
                           found = true;
+                     }
                      else if(c == '<') {
                           found = true;
                           pos--;
+                     }
                      else {
                           current = current + c;
+                     }
+                }
                 pos++;
+          }
+     }
      /** Method to ignore whitespace in the source.
+        else if(text) {
+        if(c == ' ') {
+            found = true;
+        }
+        else if(c == '<') {
+            found = true;
+            pos--;
+        }
+        else {
+            current = current + c;
+        }
+        }
+        pos++;
+    }
+    }
+    /** Method to ignore whitespace in the source.
       */
      private void dumpWhiteSpace() {
           while(pos < source.length() && source.charAt(pos) == ' ') {
                 pos++;
+          }
+     }
+    private void dumpWhiteSpace() {
+    while(pos < source.length() && source.charAt(pos) == ' ') {
+        pos++;
+    }
+    }
      static public void main(String args[]) {
           String init = "<HTML>Where material to be imported is found. Defaults to <i>GSDLHOME/collection/col_name/gimport</i></HTML>";
           ///ystem.err.println("Before: " + init);
           String result = Utility.formatHTMLWidth(init, 40);
           ///ystem.err.println("After: " + result);
+     }
+    static public void main(String args[]) {
+    String init = "<HTML>Where material to be imported is found. Defaults to <i>GSDLHOME/collection/col_name/gimport</i></HTML>";
+    ///ystem.err.println("Before: " + init);
+    String result = Utility.formatHTMLWidth(init, 40);
+    ///ystem.err.println("After: " + result);
+    }
+}

Note: See TracChangeset for help on using the changeset viewer.

Context Navigation

Changeset 4364 for trunk/gli/src/org/greenstone/gatherer/util/HTMLStringTokenizer.java

Legend:

trunk/gli/src/org/greenstone/gatherer/util/HTMLStringTokenizer.java

Download in other formats: