org.itc.irst.tcc.sre.util
Class Orthographic

java.lang.Object
  extended by org.itc.irst.tcc.sre.util.Orthographic

public class Orthographic
extends java.lang.Object

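TO DO: write the class description. Judging from the members listed below, this appears to be a utility class of static methods that test orthographic properties of a string (case, digits, punctuation, symbols, Roman numbers, Greek letters) and derive related features such as character n-grams, prefixes, suffixes and word shapes.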

Since:
1.0
Version:
%I%, %G% (unexpanded SCCS version and date keywords)
Author:
Claudio Giuliano

Field Summary
static java.lang.String ALL_CONSONANTS
           
static java.lang.String ALL_DIGITS
           
static java.lang.String ALL_VOWELS
           
static java.lang.String ALPHANUMERIC
           
static java.lang.String CAPITALIZED
           
private static char[] consonants
           
static java.lang.String CONTAINS_DASH
           
static java.lang.String CONTAINS_SYMBOLS
           
static java.lang.String ENDS_WITH_DOTS
           
static java.lang.String GREEK_LETTER
           
private static java.lang.String[] greekLetters
           
static java.lang.String LEMMA
           
(package private) static org.apache.log4j.Logger logger
          Static logger for this class; it references the Logger instance named Orthographic.
static java.lang.String LOWER_CASE
           
static java.lang.String NUMERIC
           
static java.lang.String PARENTHESIS
           
static java.lang.String PART
           
static java.lang.String PART_OF_SPEECH
           
static java.lang.String PERCENTAGE
           
static java.lang.String PUNCTUATION
           
static java.lang.String QUOTE
           
static java.lang.String ROMAN_NUMBER
           
private static java.lang.String[] romans
           
static java.lang.String SINGLE_DIGIT
           
static java.lang.String SINGLE_LETTER
           
static java.lang.String STEM
           
static java.lang.String UPPER_CASE
           
private static char[] vowels
           
static java.lang.String WORD_FORM
           
 
Constructor Summary
Orthographic()
           
 
Method Summary
static boolean allConsonants(java.lang.String s)
           
static boolean allDigits(java.lang.String s)
           
static boolean allVowels(java.lang.String s)
           
static java.lang.Object[] characterNGram(java.lang.String s, int b, int e)
           
static boolean containsDash(java.lang.String s)
           
static boolean containsDigits(java.lang.String s)
           
static boolean containsDots(java.lang.String s)
           
static boolean containsGreekLetter(java.lang.String s)
           
static boolean containsSymbols(java.lang.String s)
           
static boolean endsWithDots(java.lang.String s)
           
static java.lang.Object[] infix(java.lang.String s)
           
static boolean isAcronym(java.lang.String s)
           
static boolean isAlphanumeric(java.lang.String s)
           
static boolean isCapAndCap(java.lang.String s)
           
static boolean isCapitalized(java.lang.String s)
           
static boolean isConsonant(char c)
           
static boolean isGreekLetter(java.lang.String s)
           
static boolean isLowerCase(java.lang.String s)
           
static boolean isNaturalNumber(java.lang.String s)
           
static boolean isNumeric(java.lang.String s)
           
static boolean isParenthesis(java.lang.String s)
           
static boolean isPercentage(java.lang.String s)
           
static boolean isPunctuation(java.lang.String s)
           
static boolean isQuote(java.lang.String s)
           
static boolean isRealNumber(java.lang.String s)
           
static boolean isRomanNumber(java.lang.String s)
           
static boolean isSingleDigit(java.lang.String s)
           
static boolean isSingleLetter(java.lang.String s)
           
static boolean isSymbol(char c)
           
static boolean isSymbol(java.lang.String s)
           
static boolean isUpperCase(java.lang.String s)
           
static boolean isVowel(char c)
           
static void main(java.lang.String[] args)
           
static java.lang.Object[] prefixes(java.lang.String s, int b, int e)
           
static java.lang.Object[] split(java.lang.String s)
           
static java.lang.Object[] suffixes(java.lang.String s, int b, int e)
           
static void test(java.lang.String t)
           
static java.lang.String wordShape(java.lang.String s)
           
static java.lang.String wordShape2(java.lang.String s)
           
 
Methods inherited from class java.lang.Object
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
 

Field Detail

logger

static org.apache.log4j.Logger logger
Static logger for this class; it references the Logger instance named Orthographic.


WORD_FORM

public static final java.lang.String WORD_FORM
See Also:
Constant Field Values

LEMMA

public static final java.lang.String LEMMA
See Also:
Constant Field Values

PART_OF_SPEECH

public static final java.lang.String PART_OF_SPEECH
See Also:
Constant Field Values

STEM

public static final java.lang.String STEM
See Also:
Constant Field Values

UPPER_CASE

public static final java.lang.String UPPER_CASE
See Also:
Constant Field Values

LOWER_CASE

public static final java.lang.String LOWER_CASE
See Also:
Constant Field Values

CAPITALIZED

public static final java.lang.String CAPITALIZED
See Also:
Constant Field Values

NUMERIC

public static final java.lang.String NUMERIC
See Also:
Constant Field Values

ALPHANUMERIC

public static final java.lang.String ALPHANUMERIC
See Also:
Constant Field Values

PUNCTUATION

public static final java.lang.String PUNCTUATION
See Also:
Constant Field Values

PARENTHESIS

public static final java.lang.String PARENTHESIS
See Also:
Constant Field Values

QUOTE

public static final java.lang.String QUOTE
See Also:
Constant Field Values

ALL_DIGITS

public static final java.lang.String ALL_DIGITS
See Also:
Constant Field Values

ENDS_WITH_DOTS

public static final java.lang.String ENDS_WITH_DOTS
See Also:
Constant Field Values

SINGLE_LETTER

public static final java.lang.String SINGLE_LETTER
See Also:
Constant Field Values

SINGLE_DIGIT

public static final java.lang.String SINGLE_DIGIT
See Also:
Constant Field Values

ROMAN_NUMBER

public static final java.lang.String ROMAN_NUMBER
See Also:
Constant Field Values

GREEK_LETTER

public static final java.lang.String GREEK_LETTER
See Also:
Constant Field Values

ALL_CONSONANTS

public static final java.lang.String ALL_CONSONANTS
See Also:
Constant Field Values

ALL_VOWELS

public static final java.lang.String ALL_VOWELS
See Also:
Constant Field Values

CONTAINS_DASH

public static final java.lang.String CONTAINS_DASH
See Also:
Constant Field Values

CONTAINS_SYMBOLS

public static final java.lang.String CONTAINS_SYMBOLS
See Also:
Constant Field Values

PERCENTAGE

public static final java.lang.String PERCENTAGE
See Also:
Constant Field Values

PART

public static final java.lang.String PART
See Also:
Constant Field Values

romans

private static final java.lang.String[] romans

greekLetters

private static final java.lang.String[] greekLetters

consonants

private static final char[] consonants

vowels

private static final char[] vowels
Constructor Detail

Orthographic

public Orthographic()
Method Detail

characterNGram

public static java.lang.Object[] characterNGram(java.lang.String s,
                                                int b,
                                                int e)

prefixes

public static java.lang.Object[] prefixes(java.lang.String s,
                                          int b,
                                          int e)

suffixes

public static java.lang.Object[] suffixes(java.lang.String s,
                                          int b,
                                          int e)

isNumeric

public static final boolean isNumeric(java.lang.String s)

allDigits

public static final boolean allDigits(java.lang.String s)

endsWithDots

public static final boolean endsWithDots(java.lang.String s)

isUpperCase

public static final boolean isUpperCase(java.lang.String s)

isLowerCase

public static final boolean isLowerCase(java.lang.String s)

isAlphanumeric

public static final boolean isAlphanumeric(java.lang.String s)

isCapitalized

public static final boolean isCapitalized(java.lang.String s)

isPunctuation

public static final boolean isPunctuation(java.lang.String s)

isParenthesis

public static final boolean isParenthesis(java.lang.String s)

isQuote

public static final boolean isQuote(java.lang.String s)

isSingleLetter

public static final boolean isSingleLetter(java.lang.String s)

isSingleDigit

public static final boolean isSingleDigit(java.lang.String s)

wordShape

public static final java.lang.String wordShape(java.lang.String s)

wordShape2

public static final java.lang.String wordShape2(java.lang.String s)

isRomanNumber

public static final boolean isRomanNumber(java.lang.String s)

allConsonants

public static final boolean allConsonants(java.lang.String s)

isConsonant

public static final boolean isConsonant(char c)

allVowels

public static final boolean allVowels(java.lang.String s)

isVowel

public static final boolean isVowel(char c)

isGreekLetter

public static final boolean isGreekLetter(java.lang.String s)

containsGreekLetter

public static final boolean containsGreekLetter(java.lang.String s)

isAcronym

public static final boolean isAcronym(java.lang.String s)

isCapAndCap

public static final boolean isCapAndCap(java.lang.String s)

isRealNumber

public static final boolean isRealNumber(java.lang.String s)

isNaturalNumber

public static final boolean isNaturalNumber(java.lang.String s)

containsDots

public static final boolean containsDots(java.lang.String s)

containsDigits

public static final boolean containsDigits(java.lang.String s)

containsDash

public static final boolean containsDash(java.lang.String s)

isSymbol

public static final boolean isSymbol(java.lang.String s)

isPercentage

public static final boolean isPercentage(java.lang.String s)

isSymbol

public static final boolean isSymbol(char c)

containsSymbols

public static final boolean containsSymbols(java.lang.String s)

test

public static void test(java.lang.String t)
                 throws java.lang.Exception
Throws:
java.lang.Exception

infix

public static final java.lang.Object[] infix(java.lang.String s)

split

public static final java.lang.Object[] split(java.lang.String s)

main

public static void main(java.lang.String[] args)
                 throws java.lang.Exception
Throws:
java.lang.Exception