Java PosTagger.tokensToLinePosTagged示例

编程语言: Java

命名空间/包名称: pltag.util

类/类型: PosTagger

方法/功能: tokensToLinePosTagged

hotexamples.com的示例: 1

Java PosTagger.tokensToLinePosTagged - 已找到1个示例。以下是从开源项目中提取的、评价最高的 pltag.util.PosTagger.tokensToLinePosTagged 真实Java示例。您可以对示例进行评分，以帮助我们提高示例质量。

常用方法

显示隐藏

posTagLine(1)

posTagLineToArray(1)

tokensToLinePosTagged(1)

示例#1

显示文件

文件： Example.java 项目： sinantie/PLTAG

 /**
  * Reads one example in Dundee-corpus format: {@code RC_label|w_1 id_1 w_2 id_2 ...}.
  *
  * <p>Any text before the first {@code '|'} is stored in {@code sentenceRc}. The remainder is
  * either a bracketed tree (it starts with {@code '('}) or a flat, space-separated sequence of
  * alternating word / word-id tokens.
  *
  * <p>For flat input this method fills {@code wordIds} and {@code sentence}. When
  * {@code opts.goldPosTags} is set, the sentence is run through {@link PosTagger} and the result
  * is passed to {@code readPosTagged}; otherwise {@code posTagged} receives tab-separated
  * {@code "N/A word"} placeholder entries.
  *
  * @param line raw input line; must not be {@code null}
  */
 private void readDundeeInput(String line) {
   int index = line.indexOf("|");
   if (index > -1) {
     sentenceRc = line.substring(0, index);
   }
   // With no separator index is -1, so substring(0) keeps the whole line.
   line = line.substring(index + 1);
   StringBuilder sent = new StringBuilder();
   boolean usePosTagger = opts.goldPosTags;
   StringBuilder posTagDummy = new StringBuilder();
   // startsWith instead of charAt(0): an empty remainder (e.g. "label|") must not throw
   // StringIndexOutOfBoundsException; it falls through to the flat-token branch instead.
   if (line.startsWith("(")) // some examples may contain already parsed input in tree format
   {
     List<Word> words = Tree.valueOf(treeProcessDundeeIds(line)).yieldWords();
     // NOTE(review): sent and posTagDummy are filled here but this method never copies them
     // into sentence / posTagged on this path - confirm whether that is intentional.
     for (Word word : words) {
       sent.append(word).append(" ");
       if (!usePosTagger) {
         posTagDummy.append("N/A ").append(word).append("\t");
       }
     }
   } else {
     // Clean the raw text with the quote and parenthesis helpers before tokenising.
     line = replaceParenthesesDundee(removeQuotesDundee(line).trim()).trim();
     String[] tokens = line.split(" ");
     // Tokens alternate word, id - so there are half as many ids as tokens.
     wordIds = new String[tokens.length / 2];
     for (int i = 0; i < tokens.length - 1; i += 2) {
       // Without the tagger, digits are stripped from each word up front; with the tagger
       // the untouched word is kept and digits are removed only after tagging (below).
       String word = !usePosTagger ? wordRemoveDigits(tokens[i]) : tokens[i];
       sent.append(word).append(" ");
       if (!usePosTagger) {
         posTagDummy.append("N/A ").append(word).append("\t");
       }
       wordIds[i / 2] = tokens[i + 1];
     }
     sentence = sent.toString().trim();
     if (usePosTagger) {
       Pair<String, String>[] posWords = PosTagger.posTagLineToArray(sentence);
       // One or more words has been expanded due to PTB-compliant splitting.
       // For each new constituent assign the word-id of the original word.
       if (posWords.length != wordIds.length) {
         adjustWordIdsDundee(posWords, sentence.split(" "));
       }
       sentence = sentRemoveDigits(sentence);
       readPosTagged(wordRemoveDigits(PosTagger.tokensToLinePosTagged(posWords)));
     } else {
       posTagged = posTagDummy.toString().trim();
     }
   }
 }