public class WordNetUtilities
extends java.lang.Object
Modifier and Type | Field and Description |
---|---|
static int |
TPTPidCounter |
protected static java.util.ArrayList<java.lang.String> |
WordNetRelations |
Constructor and Description |
---|
WordNetUtilities() |
Modifier and Type | Method and Description |
---|---|
static void |
commentSentiment(java.lang.String fileWithPath)
Take a file of
|
static java.util.ArrayList<java.lang.String> |
convertTermList(java.lang.String termList)
Convert a list of Terms in the format "&%term1 &%term2" to an ArrayList
of bare term Strings
|
static java.lang.String |
convertWordNetPointer(java.lang.String ptr) |
static void |
deduceMissingLinks()
Use the WordNet hyper-/hypo-nym links to deduce a likely link
for a SUMO term that has not yet been manually linked.
|
static void |
extractMeronyms()
A utility to extract meronym relations as relations between
SUMO terms.
|
static java.lang.String |
formatWords(java.util.TreeMap<java.lang.String,java.lang.String> words,
java.lang.String kbName)
HTML format a TreeMap of word senses and their associated synset
|
static java.lang.String |
formatWordsList(java.util.TreeMap<java.lang.String,java.util.ArrayList<java.lang.String>> words,
java.lang.String kbName)
HTML format a TreeMap of ArrayLists of word senses
|
static java.lang.String |
getBareSUMOTerm(java.lang.String term)
Get a SUMO term minus its &% prefix and one character mapping
suffix.
|
static java.lang.String |
getPOSfromKey(java.lang.String senseKey)
Extract the POS from a word_POS_num sense key.
|
static char |
getSUMOMappingSuffix(java.lang.String term)
Get a SUMO term mapping suffix.
|
static java.lang.String |
getWordFromKey(java.lang.String senseKey)
Extract the word from a word_POS_num sense key.
|
void |
imageNetLinks()
Import links from www.image-net.org that are linked to
WordNet and link them to SUMO terms when the synset has a
directly equivalent SUMO term.
|
static void |
main(java.lang.String[] args)
A main method, used only for testing.
|
static java.lang.String |
mappingCharToName(char mappingType) |
static void |
mergeUpdates()
Read in a file with a nine-digit synset number followed by a space
and a SUMO term.
|
static java.lang.String |
posLettersToNumber(java.lang.String pos)
Convert a part of speech in the two letter format used by
the WordNet sense index code to its number.
|
static char |
posLetterToNumber(char POS) |
static char |
posNumberToLetter(char POS) |
static java.lang.String |
posNumberToLetters(java.lang.String pos)
Convert a part of speech number to the two letter format used by
the WordNet sense index code.
|
static java.lang.String |
printStatistics() |
static void |
processMissingLinks(java.lang.String fileName,
java.lang.String pattern,
java.lang.String posNum)
This is a utility routine that should not be called during
normal Sigma operation.
|
static java.lang.String |
removeTermPrefixes(java.lang.String formula) |
static void |
searchCoherence(java.lang.String fileWithPath)
Take a file of
|
static int |
sensePOS(java.lang.String sense)
Take a WordNet sense identifier, and return the integer part of
speech code.
|
static java.lang.String |
subst(java.lang.String result,
java.lang.String match,
java.lang.String subst)
A utility function that mimics the functionality of the perl
substitution feature (s/match/replacement/).
|
static boolean |
substTest(java.lang.String result,
java.lang.String match,
java.lang.String subst,
java.util.Hashtable<java.lang.String,java.lang.String> hash)
A utility function that mimics the functionality of the perl
substitution feature (s/match/replacement/) but rather than
returning the result of the substitution, just tests whether the
result is a key in a hashtable.
|
void |
updateWNversion()
Port the mappings from one version of WordNet to another.
|
void |
updateWNversionProcess(java.lang.String fileName,
java.lang.String pattern,
java.lang.String posNum)
This is a utility routine that should not be called during
normal Sigma operation.
|
void |
updateWNversionReading(java.lang.String fileName,
java.lang.String pattern,
java.lang.String posNum)
Read the version mapping files and store in the HashMap
called "mappings".
|
static java.lang.String |
verbPlural(java.lang.String verb)
Return the plural form of the verb.
|
static void |
writeTPTPWordNet(java.io.PrintWriter pw)
Write TPTP format for WordNet
|
public static int TPTPidCounter
protected static java.util.ArrayList<java.lang.String> WordNetRelations
public static java.lang.String getBareSUMOTerm(java.lang.String term)
public static java.lang.String getPOSfromKey(java.lang.String senseKey)
public static java.lang.String getWordFromKey(java.lang.String senseKey)
public static java.lang.String removeTermPrefixes(java.lang.String formula)
public static java.util.ArrayList<java.lang.String> convertTermList(java.lang.String termList)
public static char getSUMOMappingSuffix(java.lang.String term)
public static java.lang.String convertWordNetPointer(java.lang.String ptr)
public static char posLetterToNumber(char POS)
public static char posNumberToLetter(char POS)
public static java.lang.String posNumberToLetters(java.lang.String pos)
public static java.lang.String posLettersToNumber(java.lang.String pos)
public static int sensePOS(java.lang.String sense)
public static java.lang.String mappingCharToName(char mappingType)
public static java.lang.String subst(java.lang.String result, java.lang.String match, java.lang.String subst)
result - is the string on which the substitution is performed.
match - is the substring to be found and replaced.
subst - is the string replacement for match.
public static boolean substTest(java.lang.String result, java.lang.String match, java.lang.String subst, java.util.Hashtable<java.lang.String,java.lang.String> hash)
result - is the string on which the substitution is performed.
match - is the substring to be found and replaced.
subst - is the string replacement for match.
hash - is a hashtable to be checked against the result.
public static java.lang.String verbPlural(java.lang.String verb)
public static java.lang.String formatWords(java.util.TreeMap<java.lang.String,java.lang.String> words, java.lang.String kbName)
public static java.lang.String formatWordsList(java.util.TreeMap<java.lang.String,java.util.ArrayList<java.lang.String>> words, java.lang.String kbName)
public static void mergeUpdates() throws java.io.IOException
java.io.IOException
public static void processMissingLinks(java.lang.String fileName, java.lang.String pattern, java.lang.String posNum) throws java.io.IOException
java.io.IOException
public static void deduceMissingLinks() throws java.io.IOException
java.io.IOException
public void updateWNversionProcess(java.lang.String fileName, java.lang.String pattern, java.lang.String posNum) throws java.io.IOException
java.io.IOException
public void updateWNversionReading(java.lang.String fileName, java.lang.String pattern, java.lang.String posNum) throws java.io.IOException
java.io.IOException
public void updateWNversion() throws java.io.IOException
java.io.IOException
public static java.lang.String printStatistics()
public void imageNetLinks() throws java.io.IOException
java.io.IOException
public static void extractMeronyms()
public static void searchCoherence(java.lang.String fileWithPath)
public static void commentSentiment(java.lang.String fileWithPath)
public static void writeTPTPWordNet(java.io.PrintWriter pw) throws java.io.IOException
java.io.IOException
public static void main(java.lang.String[] args)