Changeset 5670 for trunk


Ignore:
Timestamp:
2003-10-17T04:47:32+13:00 (21 years ago)
Author:
jmt12
Message:

Added a new transform to replace square brackets with the appropriate Unicode character references (&#091; and &#093;).

File:
1 edited

Legend:

Unmodified
Added
Removed
  • trunk/gli/src/org/greenstone/gatherer/util/Codec.java

    r5372 r5670  
    3838public class Codec {
    3939   
    40     static final public String DOM_TO_GREENSTONE = "DOM_TO_GREENSTONE";
    41     static final public String DOM_TO_TEXT = "DOM_TO_TEXT";
    42     static final public String GREENSTONE_TO_DOM = "GREENSTONE_TO_DOM";
    43     static final public String GREENSTONE_TO_TEXT = "GREENSTONE_TO_TEXT";
    44     static final public String TEXT_TO_DOM = "TEXT_TO_DOM";
    45     static final public String TEXT_TO_GREENSTONE = "TEXT_TO_GREENSTONE";
    46     static final public String TEXT_TO_SHELL_UNIX = "TEXT_TO_SHELL_UNIX";
    47     static final public String TEXT_TO_SHELL_WINDOWS = "TEXT_TO_SHELL_WINDOWS";
     40   static final public String DOM_TO_GREENSTONE = "DOM_TO_GREENSTONE";
     41   static final public String DOM_TO_TEXT = "DOM_TO_TEXT";
     42   static final public String GREENSTONE_TO_DOM = "GREENSTONE_TO_DOM";
     43   static final public String GREENSTONE_TO_TEXT = "GREENSTONE_TO_TEXT";
     44   static final public String REMOVE_SQUARE_BRACKET = "REMOVE_SQUARE_BRACKET";
     45   static final public String TEXT_TO_DOM = "TEXT_TO_DOM";
     46   static final public String TEXT_TO_GREENSTONE = "TEXT_TO_GREENSTONE";
     47   static final public String TEXT_TO_SHELL_UNIX = "TEXT_TO_SHELL_UNIX";
     48   static final public String TEXT_TO_SHELL_WINDOWS = "TEXT_TO_SHELL_WINDOWS";
    4849
    4950    static final private int MAX_CACHE_SIZE = 100;
     
    7172    // Transform DOM encoded text into plain text
    7273    String[] dom_to_text = {
    73         "'", "\'",
    74         ">", ">",
    75         "&lt;", "<",
    76         "&quot;", "\"",
    77         "&amp;", "&"
     74       "&amp;#091;", "\\[",
     75       "&amp;#093;", "\\]",
     76       "&apos;", "\'",
     77       "&gt;", ">",
     78       "&lt;", "<",
     79       "&quot;", "\"",
     80       "&amp;", "&"
    7881    };
    7982    TRANSFORMS.put(DOM_TO_TEXT, dom_to_text);
     
    99102        "&quot;", "\"",
    100103        "&apos;", "\'",
    101         "\\\\\\[", "\\[",
    102         "\\\\\\]", "\\]",
     104        "&#091;", "\\[",
     105        "&#093;", "\\]",
    103106        "\\\\\\\\", "\\\\"
    104107    };
     
    106109    greenstone_to_text = null;
    107110
     111    // Transform text into text, but without [ and ]
     112    String[] remove_square_bracket = {
     113        "\\[", "&amp;#091;",
     114        "\\]", "&amp;#093;"
     115    };
     116    TRANSFORMS.put(REMOVE_SQUARE_BRACKET, remove_square_bracket);
     117    remove_square_bracket = null;
     118   
    108119    // Transform plain html text into something that can be placed in a DOM
    109120    String[] text_to_dom = {
     
    120131    String[] text_to_greenstone = {
    121132        "\\\\", "\\\\\\\\",
    122         "\\[", "\\\\[",
    123         "\\]", "\\\\]",
     133        "\\[", "&#091;",
     134        "\\]", "&#093;",
    124135        "\"", "&quot;",
    125136        "\'", "&apos;",
     
    162173        }
    163174        }
    164         //Gatherer.println("*** Transform: " + transform + " ***");
    165         //Gatherer.println("*** Raw      : '" + raw + "'");
    166         //Gatherer.println("*** Processed: '" + processed + "'");
     175        Gatherer.println("*** Transform: " + transform + " ***");
     176        Gatherer.println("*** Raw      : '" + raw + "'");
     177        Gatherer.println("*** Processed: '" + processed + "'");
    167178        // If cache is at maximum size, empty it and start again
    168179        if(CACHE.size() == MAX_CACHE_SIZE) {
     
    235246        index++;
    236247    }
    237    
    238248    return processed.toString();
    239249    }
Note: See TracChangeset for help on using the changeset viewer.