org.itc.irst.tcc.sre.util
Class Orthographic
java.lang.Object
org.itc.irst.tcc.sre.util.Orthographic
public class Orthographic
- extends java.lang.Object
TO DO
- Since:
- 1.0
- Version:
- %I%, %G%
- Author:
- Claudio Giuliano
Methods inherited from class java.lang.Object
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
logger
static org.apache.log4j.Logger logger
- Define a static logger variable so that it references the Logger instance named "Orthographic".
WORD_FORM
public static final java.lang.String WORD_FORM
- See Also:
- Constant Field Values
LEMMA
public static final java.lang.String LEMMA
- See Also:
- Constant Field Values
PART_OF_SPEECH
public static final java.lang.String PART_OF_SPEECH
- See Also:
- Constant Field Values
STEM
public static final java.lang.String STEM
- See Also:
- Constant Field Values
UPPER_CASE
public static final java.lang.String UPPER_CASE
- See Also:
- Constant Field Values
LOWER_CASE
public static final java.lang.String LOWER_CASE
- See Also:
- Constant Field Values
CAPITALIZED
public static final java.lang.String CAPITALIZED
- See Also:
- Constant Field Values
NUMERIC
public static final java.lang.String NUMERIC
- See Also:
- Constant Field Values
ALPHANUMERIC
public static final java.lang.String ALPHANUMERIC
- See Also:
- Constant Field Values
PUNCTUATION
public static final java.lang.String PUNCTUATION
- See Also:
- Constant Field Values
PARENTHESIS
public static final java.lang.String PARENTHESIS
- See Also:
- Constant Field Values
QUOTE
public static final java.lang.String QUOTE
- See Also:
- Constant Field Values
ALL_DIGITS
public static final java.lang.String ALL_DIGITS
- See Also:
- Constant Field Values
ENDS_WITH_DOTS
public static final java.lang.String ENDS_WITH_DOTS
- See Also:
- Constant Field Values
SINGLE_LETTER
public static final java.lang.String SINGLE_LETTER
- See Also:
- Constant Field Values
SINGLE_DIGIT
public static final java.lang.String SINGLE_DIGIT
- See Also:
- Constant Field Values
ROMAN_NUMBER
public static final java.lang.String ROMAN_NUMBER
- See Also:
- Constant Field Values
GREEK_LETTER
public static final java.lang.String GREEK_LETTER
- See Also:
- Constant Field Values
ALL_CONSONANTS
public static final java.lang.String ALL_CONSONANTS
- See Also:
- Constant Field Values
ALL_VOWELS
public static final java.lang.String ALL_VOWELS
- See Also:
- Constant Field Values
CONTAINS_DASH
public static final java.lang.String CONTAINS_DASH
- See Also:
- Constant Field Values
CONTAINS_SYMBOLS
public static final java.lang.String CONTAINS_SYMBOLS
- See Also:
- Constant Field Values
PERCENTAGE
public static final java.lang.String PERCENTAGE
- See Also:
- Constant Field Values
PART
public static final java.lang.String PART
- See Also:
- Constant Field Values
romans
private static final java.lang.String[] romans
greekLetters
private static final java.lang.String[] greekLetters
consonants
private static final char[] consonants
vowels
private static final char[] vowels
Orthographic
public Orthographic()
characterNGram
public static java.lang.Object[] characterNGram(java.lang.String s,
int b,
int e)
prefixes
public static java.lang.Object[] prefixes(java.lang.String s,
int b,
int e)
suffixes
public static java.lang.Object[] suffixes(java.lang.String s,
int b,
int e)
isNumeric
public static final boolean isNumeric(java.lang.String s)
allDigits
public static final boolean allDigits(java.lang.String s)
endsWithDots
public static final boolean endsWithDots(java.lang.String s)
isUpperCase
public static final boolean isUpperCase(java.lang.String s)
isLowerCase
public static final boolean isLowerCase(java.lang.String s)
isAlphanumeric
public static final boolean isAlphanumeric(java.lang.String s)
isCapitalized
public static final boolean isCapitalized(java.lang.String s)
isPunctuation
public static final boolean isPunctuation(java.lang.String s)
isParenthesis
public static final boolean isParenthesis(java.lang.String s)
isQuote
public static final boolean isQuote(java.lang.String s)
isSingleLetter
public static final boolean isSingleLetter(java.lang.String s)
isSingleDigit
public static final boolean isSingleDigit(java.lang.String s)
wordShape
public static final java.lang.String wordShape(java.lang.String s)
wordShape2
public static final java.lang.String wordShape2(java.lang.String s)
isRomanNumber
public static final boolean isRomanNumber(java.lang.String s)
allConsonants
public static final boolean allConsonants(java.lang.String s)
isConsonant
public static final boolean isConsonant(char c)
allVowels
public static final boolean allVowels(java.lang.String s)
isVowel
public static final boolean isVowel(char c)
isGreekLetter
public static final boolean isGreekLetter(java.lang.String s)
containsGreekLetter
public static final boolean containsGreekLetter(java.lang.String s)
isAcronym
public static final boolean isAcronym(java.lang.String s)
isCapAndCap
public static final boolean isCapAndCap(java.lang.String s)
isRealNumber
public static final boolean isRealNumber(java.lang.String s)
isNaturalNumber
public static final boolean isNaturalNumber(java.lang.String s)
containsDots
public static final boolean containsDots(java.lang.String s)
containsDigits
public static final boolean containsDigits(java.lang.String s)
containsDash
public static final boolean containsDash(java.lang.String s)
isSymbol
public static final boolean isSymbol(java.lang.String s)
isPercentage
public static final boolean isPercentage(java.lang.String s)
isSymbol
public static final boolean isSymbol(char c)
containsSymbols
public static final boolean containsSymbols(java.lang.String s)
test
public static void test(java.lang.String t)
throws java.lang.Exception
- Throws:
java.lang.Exception
infix
public static final java.lang.Object[] infix(java.lang.String s)
split
public static final java.lang.Object[] split(java.lang.String s)
main
public static void main(java.lang.String[] args)
throws java.lang.Exception
- Throws:
java.lang.Exception