|
||||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |
java.lang.Object
gate.util.AbstractFeatureBearer
gate.creole.AbstractResource
gate.creole.AbstractProcessingResource
gate.creole.AbstractLanguageAnalyser
gate.creole.orthomatcher.OrthoMatcher
Field Summary | |
static String |
OM_ANN_SET_PARAMETER_NAME
|
static String |
OM_ANN_TYPES_PARAMETER_NAME
|
static String |
OM_CASE_SENSITIVE_PARAMETER_NAME
|
static String |
OM_DOCUMENT_PARAMETER_NAME
|
static String |
OM_EXT_LISTS_PARAMETER_NAME
|
static String |
OM_ORG_TYPE_PARAMETER_NAME
|
static String |
OM_PERSON_TYPE_PARAMETER_NAME
|
Constructor Summary | |
OrthoMatcher()
|
Method Summary | |
void |
execute()
Run the resource. |
String |
getAnnotationSetName()
get the name of the annotation set |
List |
getAnnotationTypes()
get the types of the annotation |
Boolean |
getCaseSensitive()
Are we running in a case-sensitive mode? |
URL |
getDefinitionFileURL()
|
String |
getEncoding()
|
Boolean |
getExtLists()
|
String |
getOrganizationType()
|
String |
getPersonType()
|
Boolean |
getProcessUnknown()
Return whether or not we're processing the Unknown annotations |
Resource |
init()
Initialise this resource, and return it. |
boolean |
matchRule0(String s1,
String s2)
RULE #0: If the two names are listed in the table of spurious matches then they do NOT match. Condition(s): - Applied to: all name annotations |
boolean |
matchRule1(String s1,
String s2,
boolean matchCase)
RULE #1: If the two names are identical then they are the same. No longer used, because the check for the same string is done via the hash table of previous annotations. Condition(s): depend on case. Applied to: all name annotations |
boolean |
matchRule10(String s1,
String s2)
RULE #10: is one name the reverse of the other reversing around prepositions only? e.g. |
boolean |
matchRule11(String s1,
String s2)
RULE #11: does one name consist of contractions of the first two tokens of the other name? e.g. |
boolean |
matchRule12(String s1,
String s2)
RULE #12: do the first and last tokens of one name match the first and last tokens of the other? Condition(s): case-sensitive match. Applied to: organisation annotations only |
boolean |
matchRule13(String s1,
String s2)
RULE #13: do multi-word names match except for one token e.g. |
boolean |
matchRule14(String s1,
String s2)
RULE #14: if the last token of one name matches the second name e.g. |
boolean |
matchRule15(String s1,
String s2)
RULE #15: does one token from a Person name appear as the other token? Note that this rule has NOT been used in LaSIE's 1.5 namematcher; added for ACE by Di's request. |
boolean |
matchRule2(String s1,
String s2)
RULE #2: if the two names are listed as equivalent in the lookup table (alias) then they match. Condition(s): - Applied to: all name annotations |
boolean |
matchRule3(String s1,
String s2)
RULE #3: adding a possessive at the end of one name causes a match e.g. |
boolean |
matchRule4(String s1,
String s2)
RULE #4: Do all tokens other than the punctuation marks "," and "." match? |
boolean |
matchRule5(String s1,
String s2)
RULE #5: if the 1st token of one name matches the second name e.g. |
boolean |
matchRule6(String s1,
String s2)
RULE #6: if one name is the acronym of the other e.g. |
boolean |
matchRule7(String s1,
String s2)
RULE #7: if one of the tokens in one of the names is in the list of separators e.g. |
boolean |
matchRule8(String s1,
String s2)
This rule is now obsolete, as "The" and the trailing CDG are stripped before matching. |
boolean |
matchRule9(String s1,
String s2)
RULE #9: does one of the names match the token just before a trailing company designator in the other name? The company designator has already been chopped off, so the token before it, is in fact the last token e.g. |
String |
regularExpressions(String text,
String replacement,
String regEx)
substitute all multiple spaces, tabs and newlines with a single space |
void |
setAnnotationSetName(String newAnnotationSetName)
set the annotation set name |
void |
setAnnotationTypes(List newType)
set the types of the annotations |
void |
setCaseSensitive(Boolean newCase)
set the caseSensitive flag |
void |
setDefinitionFileURL(URL definitionFileURL)
|
void |
setEncoding(String encoding)
|
void |
setExtLists(Boolean newExtLists)
set the extLists flag |
void |
setOrganizationType(String newOrganizationType)
|
void |
setPersonType(String newPersonType)
|
void |
setProcessUnknown(Boolean processOrNot)
set whether to process the Unknown annotations |
Methods inherited from class gate.creole.AbstractLanguageAnalyser |
getCorpus, getDocument, setCorpus, setDocument |
Methods inherited from class gate.creole.AbstractProcessingResource |
addProgressListener, addStatusListener, cleanup, interrupt, isInterrupted, reInit, removeProgressListener, removeStatusListener |
Methods inherited from class gate.creole.AbstractResource |
checkParameterValues, getName, getParameterValue, getParameterValue, removeResourceListeners, setName, setParameterValue, setParameterValue, setParameterValues, setParameterValues, setResourceListeners |
Methods inherited from class gate.util.AbstractFeatureBearer |
getFeatures, setFeatures |
Methods inherited from class java.lang.Object |
equals, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
Methods inherited from interface gate.ProcessingResource |
reInit |
Methods inherited from interface gate.Resource |
cleanup, getParameterValue, setParameterValue, setParameterValues |
Methods inherited from interface gate.util.FeatureBearer |
getFeatures, setFeatures |
Methods inherited from interface gate.util.NameBearer |
getName, setName |
Methods inherited from interface gate.Executable |
interrupt, isInterrupted |
Field Detail |
public static final String OM_DOCUMENT_PARAMETER_NAME
public static final String OM_ANN_SET_PARAMETER_NAME
public static final String OM_CASE_SENSITIVE_PARAMETER_NAME
public static final String OM_ANN_TYPES_PARAMETER_NAME
public static final String OM_ORG_TYPE_PARAMETER_NAME
public static final String OM_PERSON_TYPE_PARAMETER_NAME
public static final String OM_EXT_LISTS_PARAMETER_NAME
Constructor Detail |
public OrthoMatcher()
Method Detail |
public Resource init() throws ResourceInstantiationException
init
in interface Resource
init
in class AbstractProcessingResource
ResourceInstantiationException
public void execute() throws ExecutionException
execute
in interface Executable
execute
in class AbstractProcessingResource
ExecutionException
public void setExtLists(Boolean newExtLists)
public void setCaseSensitive(Boolean newCase)
public void setAnnotationSetName(String newAnnotationSetName)
public void setAnnotationTypes(List newType)
public void setProcessUnknown(Boolean processOrNot)
public void setOrganizationType(String newOrganizationType)
public void setPersonType(String newPersonType)
public String getAnnotationSetName()
public List getAnnotationTypes()
public String getOrganizationType()
public String getPersonType()
public Boolean getExtLists()
public Boolean getCaseSensitive()
public Boolean getProcessUnknown()
public boolean matchRule0(String s1, String s2)
public boolean matchRule1(String s1, String s2, boolean matchCase)
public boolean matchRule2(String s1, String s2)
public boolean matchRule3(String s1, String s2)
public boolean matchRule4(String s1, String s2)
public boolean matchRule5(String s1, String s2)
public boolean matchRule6(String s1, String s2)
public boolean matchRule7(String s1, String s2)
public boolean matchRule8(String s1, String s2)
public boolean matchRule9(String s1, String s2)
public boolean matchRule10(String s1, String s2)
public boolean matchRule11(String s1, String s2)
public boolean matchRule12(String s1, String s2)
public boolean matchRule13(String s1, String s2)
public boolean matchRule14(String s1, String s2)
public boolean matchRule15(String s1, String s2)
public String regularExpressions(String text, String replacement, String regEx)
public void setDefinitionFileURL(URL definitionFileURL)
public URL getDefinitionFileURL()
public void setEncoding(String encoding)
public String getEncoding()
|
||||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |