gate.creole
Class GazetteerListsCollector

java.lang.Object
  extended by gate.util.AbstractFeatureBearer
      extended by gate.creole.AbstractResource
          extended by gate.creole.AbstractProcessingResource
              extended by gate.creole.AbstractLanguageAnalyser
                  extended by gate.creole.GazetteerListsCollector
All Implemented Interfaces:
ANNIEConstants, Executable, FeatureBearer, LanguageAnalyser, NameBearer, ProcessingResource, Resource, Serializable

public class GazetteerListsCollector
extends AbstractLanguageAnalyser

See Also:
Serialized Form

Nested Class Summary
 
Nested classes inherited from class gate.creole.AbstractProcessingResource
AbstractProcessingResource.InternalStatusListener, AbstractProcessingResource.IntervalProgressListener
 
Field Summary
private  AnnotationSet allAnnots
           
private  List annotationTypes
           
private  Gazetteer gazetteer
           
private  String markupSetName
           
private static String PERSON_ANNOT_NAME
           
private  HashMap statsPerType
           
private  String theLanguage
           
 
Fields inherited from class gate.creole.AbstractLanguageAnalyser
corpus, document
 
Fields inherited from class gate.creole.AbstractProcessingResource
interrupted
 
Fields inherited from class gate.creole.AbstractResource
name, serialVersionUID
 
Fields inherited from class gate.util.AbstractFeatureBearer
features
 
Fields inherited from interface gate.creole.ANNIEConstants
ANNOTATION_COREF_FEATURE_NAME, DATE_ANNOTATION_TYPE, DOCUMENT_COREF_FEATURE_NAME, LOCATION_ANNOTATION_TYPE, LOOKUP_ANNOTATION_TYPE, LOOKUP_CLASS_FEATURE_NAME, LOOKUP_MAJOR_TYPE_FEATURE_NAME, LOOKUP_MINOR_TYPE_FEATURE_NAME, LOOKUP_ONTOLOGY_FEATURE_NAME, MONEY_ANNOTATION_TYPE, ORGANIZATION_ANNOTATION_TYPE, PERSON_ANNOTATION_TYPE, PERSON_GENDER_FEATURE_NAME, PR_NAMES, SENTENCE_ANNOTATION_TYPE, SPACE_TOKEN_ANNOTATION_TYPE, TOKEN_ANNOTATION_TYPE, TOKEN_CATEGORY_FEATURE_NAME, TOKEN_KIND_FEATURE_NAME, TOKEN_LENGTH_FEATURE_NAME, TOKEN_ORTH_FEATURE_NAME, TOKEN_STRING_FEATURE_NAME
 
Constructor Summary
GazetteerListsCollector()
           
 
Method Summary
protected  boolean alreadyPresentInGazetteer(String token)
          The idea is to have this method check if an item is already present in the gazetteer under this type, and if so, not to add it.
protected  void collectLists(AnnotationSet annots, String annotType)
           
 void execute()
          Starts the execution of this executable
 List getAnnotationTypes()
          Gets the types of the annotations.
 Gazetteer getGazetteer()
           
 String getMarkupASName()
           
 String getTheLanguage()
           
protected  void printStats()
           
 void setAnnotationTypes(List newType)
          Sets the types of the annotations.
 void setGazetteer(Gazetteer theGaz)
           
 void setMarkupASName(String newMarkupASName)
           
 void setTheLanguage(String language)
           
 
Methods inherited from class gate.creole.AbstractLanguageAnalyser
getCorpus, getDocument, setCorpus, setDocument
 
Methods inherited from class gate.creole.AbstractProcessingResource
addProgressListener, addStatusListener, cleanup, fireProcessFinished, fireProgressChanged, fireStatusChanged, init, interrupt, isInterrupted, reInit, removeProgressListener, removeStatusListener
 
Methods inherited from class gate.creole.AbstractResource
checkParameterValues, getName, getParameterValue, getParameterValue, removeResourceListeners, setName, setParameterValue, setParameterValue, setParameterValues, setParameterValues, setResourceListeners
 
Methods inherited from class gate.util.AbstractFeatureBearer
getFeatures, setFeatures
 
Methods inherited from class java.lang.Object
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
 
Methods inherited from interface gate.ProcessingResource
reInit
 
Methods inherited from interface gate.Resource
cleanup, getParameterValue, init, setParameterValue, setParameterValues
 
Methods inherited from interface gate.util.FeatureBearer
getFeatures, setFeatures
 
Methods inherited from interface gate.util.NameBearer
getName, setName
 
Methods inherited from interface gate.Executable
interrupt, isInterrupted
 

Field Detail

PERSON_ANNOT_NAME

private static String PERSON_ANNOT_NAME

markupSetName

private String markupSetName

allAnnots

private AnnotationSet allAnnots

annotationTypes

private List annotationTypes

gazetteer

private Gazetteer gazetteer

theLanguage

private String theLanguage

statsPerType

private HashMap statsPerType
Constructor Detail

GazetteerListsCollector

public GazetteerListsCollector()
Method Detail

execute

public void execute()
             throws ExecutionException
Description copied from interface: Executable
Starts the execution of this executable

Specified by:
execute in interface Executable
Overrides:
execute in class AbstractProcessingResource
Throws:
ExecutionException

setMarkupASName

public void setMarkupASName(String newMarkupASName)

getMarkupASName

public String getMarkupASName()

getAnnotationTypes

public List getAnnotationTypes()
Gets the types of the annotations.


setAnnotationTypes

public void setAnnotationTypes(List newType)
Sets the types of the annotations.


getGazetteer

public Gazetteer getGazetteer()

setGazetteer

public void setGazetteer(Gazetteer theGaz)

setTheLanguage

public void setTheLanguage(String language)

getTheLanguage

public String getTheLanguage()

collectLists

protected void collectLists(AnnotationSet annots,
                            String annotType)

printStats

protected void printStats()

alreadyPresentInGazetteer

protected boolean alreadyPresentInGazetteer(String token)
This method is intended to check whether an item is already present in the gazetteer under this type and, if so, prevent it from being added again. It is not implemented yet.