All Downloads are FREE. Search and download functionalities are using the official Maven repository.

gov.nih.nlm.nls.lvg.Util.StrTokenObject Maven / Gradle / Ivy

The newest version!
package gov.nih.nlm.nls.lvg.Util;
/*****************************************************************************
* This class creates a fundamental string token object for the strip function.
* The strip function becomes complicated when it is combined with punctuation.
* This class, along with StripToken, handles such cases.
*
* <p><b>History:</b>
*
* @author NLM NLS Development Team
*
* @see StripToken
*
* @version V-2010
****************************************************************************/
public class StrTokenObject
{
    // public constructor
    /**
    * Creates a string token object, using token string and token type.
    * The token string is stored as given (no validation or copying).
    *
    * @param tokenStr  the token string
    * @param tokenType  the type of token (one of the token type constants
    * declared in this class, e.g. {@link #TOKEN})
    */
    public StrTokenObject(String tokenStr, int tokenType)
    {
        tokenStr_ = tokenStr;
        tokenType_ = tokenType;
    }

    // public methods
    /**
    * Set the token type of this string token object.
    *
    * @param tokenType  token type
    */
    public void SetTokenType(int tokenType)
    {
        tokenType_ = tokenType;
    }

    /**
    * Get the token type of this token object.
    *
    * @return an integer that represents the type of the token
    */
    public int GetTokenType()
    {
        return tokenType_;
    }

    /**
    * Get the token object in a String format.
    *
    * @return token string
    */
    public String GetTokenStr()
    {
        return tokenStr_;
    }

    // data members
    /** token type: None */
    public static final int NONE = 0;
    /** token type: it is a token, not a delimiter */
    public static final int TOKEN = 1;
    /** token type: space token, such as " \t" */
    public static final int SPACE_D = 2;
    /** token type: token is stripped, won't be restored while restoring */
    public static final int STRIPPED = 3;
    /** token type: delimiters will be kept while restoring */
    public static final int RESTORE_D = 4;
    /** token type: delimiters that strip the previous character if its token
    * type is STRIPPED or it is in the conflict list */
    public static final int STRIPPING_D = 5;
    /** token type: delimiters that will be stripped if the previous token
    * type is STRIPPED */
    public static final int STRIPABLE_D = 6;

    /** delimiter string: space */
    public static final String SPACE_D_STR = " \t";
    /** delimiter string: restore it after tokenizing */
    public static final String RESTORE_D_STR = "({[<\"'";
    /** delimiter string: strip out */
    public static final String STRIPPING_D_STR = ")}]>!?";
    /** delimiter string: can be stripped */
    public static final String STRIPABLE_D_STR = ",.:;";
    /** delimiter string: conflict list string for removing character */
    public static final String CONFLICT_STR = " -,:;";
    /** delimiter string: should not be at the end of the string */
    public static final String BAD_END_STR = " -,:;";

    // private data members
    private int tokenType_ = NONE;      // delimiter type
    private final String tokenStr_;     // the token in String format
}





© 2015 - 2025 Weber Informatics LLC | Privacy Policy