/**
 * Reduces the part-of-speech ambiguity of the words in {@code span} of {@code doc} by
 * discarding 'constit' annotations that disagree with the output of a part-of-speech tagger.
 *
 * <p>On entry each word is expected to carry several 'constit' annotations produced by
 * dictionary look-up, one per possible part of speech. The method works in two steps:
 *
 * <ol>
 *   <li>every word receives a 'tagger' annotation whose feature {@code cat} is a Penn tag;
 *   <li>'constit' annotations that are not consistent with that Penn tag are removed.
 * </ol>
 *
 * @param doc the document whose annotations are updated
 * @param span the portion of {@code doc} to be processed
 */
public void prune(Document doc, Span span) {
  final String taggerAnnotationType = "tagger";

  // Step 1: record the tagger's decision for each word as a 'tagger' annotation.
  annotate(doc, span, taggerAnnotationType);

  // Step 2: drop the dictionary 'constit' annotations that contradict the tagger.
  Retagger.pruneConstit(doc, span);
}
/**
 * Assigns Jet part-of-speech tags to the words in {@code span} of {@code doc}.
 *
 * <p>The method works in two steps:
 *
 * <ol>
 *   <li>every word receives a 'tagger' annotation whose feature {@code cat} is a Penn tag;
 *   <li>the Penn tags are mapped to the Jet part-of-speech set, and 'constit' annotations
 *       with {@code cat} = a Jet part-of-speech tag are added.
 * </ol>
 *
 * @param doc the document whose annotations are updated
 * @param span the portion of {@code doc} to be tagged
 */
public void tagJet(Document doc, Span span) {
  final String taggerAnnotationType = "tagger";

  // Step 1: record the tagger's decision for each word as a 'tagger' annotation.
  annotate(doc, span, taggerAnnotationType);

  // Step 2: translate the Penn tags into Jet tags, adding the 'constit' annotations.
  Retagger.mapConstit(doc, span);
}