Java Document.text Beispiele

Programmiersprache: Java

Klasse / Typ: Document

Methode / Funktion: text

Beispiele auf hotexamples.com: 12

Java Document.text – 12 Beispiele gefunden. Dies sind die am besten bewerteten Java-Beispiele für Document.text, die aus Open-Source-Projekten extrahiert wurden. Sie können Beispiele bewerten, um die Qualität der Beispiele zu verbessern.

Häufig verwendete Methoden

Anzeigen Verbergen

createElement(30)

createTextNode(30)

select(30)

get(30)

insertString(30)

getTextLength(30)

getCharsSequence(30)

getText(30)

appendChild(30)

getRootElement(30)

getDocumentElement(30)

getLineStartOffset(30)

add(30)

getElementsByTagName(30)

getLineEndOffset(29)

getLength(23)

getLineNumber(22)

getLineCount(19)

createRangeMarker(18)

createElementNS(16)

getContent(15)

getElementById(15)

importNode(12)

text(12)

body(11)

save(11)

replaceString(10)

deleteString(10)

remove(10)

createDivElement(9)

getDefaultRootElement(8)

check(8)

getId(8)

replaceItemValue(7)

open(7)

getGamma(7)

close(7)

getNumberOfTypes(7)

getNumberOfTopics(7)

getNumberOfTokens(7)

getFirstChild(7)

getChildNodes(7)

getHtml(6)

html(6)

getBody(6)

getName(6)

getSentence(6)

annotate(6)

toString(6)

setRootElement(6)

Beispiel #1

Datei anzeigen

Datei: ElementTest.java Projekt: haggisandchips/jsoup

  /**
   * A {@code <br>} between two words must show up as exactly one space in the extracted text,
   * whether or not the markup already has whitespace around the break.
   */
  @Test
  public void testBrHasSpace() {
    // No whitespace around the break in the markup.
    Document tight = Jsoup.parse("<p>Hello<br>there</p>");
    assertEquals("Hello there", tight.text());
    assertEquals("Hello there", tight.select("p").first().ownText());

    // Whitespace on both sides of the break in the markup.
    Document padded = Jsoup.parse("<p>Hello <br> there</p>");
    assertEquals("Hello there", padded.text());
  }

Beispiel #2

Datei anzeigen

Datei: DocumentTest.java Projekt: testIT-LivingDoc/livingdoc-core

  /**
   * Parses two bracket-notation tables with a {@code ****} line between them, executes the
   * resulting document and checks the accumulated right/wrong counts in its statistics.
   */
  @Test
  public void testInterpretsASequenceOfTables() {
    String firstTable =
        "["
            + RuleForInterpreter.class.getName()
            + "]["
            + AlternateCalculator.class.getName()
            + "]\n"
            + "[a][b][sum?]\n"
            + "[6][2][8]\n"
            + "[5][2][8]\n";
    String secondTable =
        "["
            + SetOfInterpreter.class.getName()
            + "]["
            + RowFixtureTarget.class.getName()
            + "]\n"
            + "[a][b][c]\n"
            + "[1][2][3]";
    tables = parse(firstTable + "****\n" + secondTable);

    Document document = Document.text(tables);
    execute(document);

    assertEquals(2, document.getStatistics().rightCount());
    assertEquals(3, document.getStatistics().wrongCount());
  }

Beispiel #3

Datei anzeigen

Datei: KariyerParser.java Projekt: eguller/mujobo-crawler

 /**
  * Extracts city names from a job posting document.
  *
  * <p>First looks in the plain text of the {@code div#divIlanDetay} element for a line containing
  * one of the location labels; the text after the first {@code ':'} is trimmed, cut at the first
  * space and split on commas. If that yields nothing, the tokens of the whole document text are
  * checked against a small table of known city names instead.
  *
  * @param doc the parsed posting
  * @return the cities found, possibly empty
  */
 public List<String> extractCities(Document doc) {
   // Fallback table of known city names (key and value are the same spelling).
   HashMap<String, String> knownCities = new HashMap<String, String>();
   knownCities.put("Adana", "Adana");
   knownCities.put("Konya", "Konya");
   knownCities.put("Tekirda\u011f", "Tekirda\u011f");

   List<String> cities = new ArrayList<String>();
   Element detail = doc.select("div#divIlanDetay").first();
   Matcher labelLine =
       Pattern.compile(".*(\u015eehir/\u00dclke|City/Country|Location).*")
           .matcher(getPlainText(detail));

   if (labelLine.find()) {
     String[] labelAndValue = labelLine.group().split(":");
     if (labelAndValue.length > 1) {
       // Only the first space-delimited chunk after the label is treated as the city list.
       String firstChunk = labelAndValue[1].trim().split(" ")[0];
       for (String city : firstChunk.split(",")) {
         cities.add(trim(city));
       }
     }
   }

   if (cities.isEmpty()) {
     for (String token : tokenize(doc.text())) {
       if (knownCities.containsKey(token)) {
         cities.add(trim(knownCities.get(token)));
       }
     }
   }
   return cities;
 }

Beispiel #4

Datei anzeigen

Datei: NewAnnotationAction.java Projekt: rgrishman/jet

 /**
  * Performs the action: creates an Annotation of this action's {@code type} over a span and adds
  * it to the document.
  *
  * <p>The span is chosen as follows:
  *
  * <ul>
  *   <li>no span variable: from the pattern's start position to its best position;
  *   <li>span variable named {@code "0"}: an empty span at the pattern's start position;
  *   <li>otherwise: the Span (or the span of the Annotation) bound to the span variable.
  * </ul>
  *
  * <p>Before the annotation is added, {@code hideAnnotations} is invoked for this action's type
  * and for {@code "token"} over the chosen span. If a binding variable is set, the new annotation
  * is stored in the bindings under that variable's name.
  *
  * @param doc the document that receives the annotation
  * @param patap the pattern application supplying positions and variable bindings
  * @return the end position of the annotated span, or -1 if the span variable is bound to a value
  *     that is neither a Span nor an Annotation
  */
 @Override
 public int perform(Document doc, PatternApplication patap) {
   Span span;
   HashMap bindings = patap.bestBindings;
   if (spanVariable == null) {
     span = new Span(patap.startPosition, patap.bestPosition);
   } else if ("0".equals(spanVariable.name.toString())) {
     // Compare by content: '==' on strings only tests reference identity and can miss a
     // non-interned "0".
     span = new Span(patap.startPosition, patap.startPosition);
   } else {
     Object value = bindings.get(spanVariable.name);
     if (value instanceof Span) {
       span = (Span) value;
     } else if (value instanceof Annotation) {
       span = ((Annotation) value).span();
     } else {
       System.out.println("Value of " + spanVariable.toString() + " is not a span.or annotation");
       return -1;
     }
   }
   if (Pat.trace) {
     Console.println(
         "Annotating "
             + doc.text(span)
             + " as "
             + type
             + " "
             + features.substitute(bindings).toSGMLString());
   }
   hideAnnotations(doc, type, span);
   hideAnnotations(doc, "token", span);
   Annotation newAnnotation = new Annotation(type, span, features.substitute(bindings));
   doc.addAnnotation(newAnnotation);
   if (bindingVariable != null) {
     bindings.put(bindingVariable.name, newAnnotation);
   }
   return span.end();
 }

Beispiel #5

Datei anzeigen

Datei: ElementTest.java Projekt: haggisandchips/jsoup

 /**
  * Text inside {@code <pre><code>} must keep its newlines, both in the extracted text and in the
  * re-serialised body HTML.
  */
 @Test
 public void testKeepsPreTextInCode() {
   String markup = "<pre><code>code\n\ncode</code></pre>";
   Document parsed = Jsoup.parse(markup);

   String extracted = parsed.text();
   assertEquals("code\n\ncode", extracted);

   String bodyHtml = parsed.body().html();
   assertEquals("<pre><code>code\n\ncode</code></pre>", bodyHtml);
 }

Beispiel #6

Datei anzeigen

Datei: ElementTest.java Projekt: haggisandchips/jsoup

 /**
  * Whitespace runs and line breaks spread across paragraphs and inline tags must come out as
  * single spaces in the document text.
  */
 @Test
 public void testNormalisesText() {
   Document parsed =
       Jsoup.parse("<p>Hello<p>There.</p> \n <p>Here <b>is</b> \n s<b>om</b>e text.");
   assertEquals("Hello There. Here is some text.", parsed.text());
 }

Beispiel #7

Datei anzeigen

Datei: PTBReader.java Projekt: keeyon2/NYU-School-Shizzle

  /**
   * Aligns the terminal nodes of a parse tree with the document text and then annotates the
   * document with the tree structure.
   *
   * <p>For each terminal, in order: leading whitespace is skipped, then at most one entry of
   * {@code skip} found at the current offset (plus the whitespace after it), and the terminal's
   * word is matched against the text. On a match the terminal's {@code start} and {@code end} are
   * set, with {@code end} placed after any trailing whitespace. If a word cannot be matched, a
   * diagnostic is written to {@code System.err} and the method returns without annotating.
   *
   * @param tree the parse tree (for a portion of Document doc)
   * @param doc the document
   * @param span the portion of doc covered by the parse tree
   * @param jetCategories if true, use Jet categories as terminal categories (if false, use
   *     categories read from parse trees)
   */
  public void addAnnotations(ParseTreeNode tree, Document doc, Span span, boolean jetCategories) {
    List<ParseTreeNode> leaves = getTerminalNodes(tree);
    String docText = doc.text();
    int cursor = span.start();

    for (ParseTreeNode leaf : leaves) {
      // Skip whitespace in front of the next word.
      while (cursor < span.end() && Character.isWhitespace(docText.charAt(cursor))) {
        cursor++;
      }
      // Skip at most one skippable string found here, plus the whitespace that follows it.
      for (String skippable : skip) {
        if (!docText.startsWith(skippable, cursor)) {
          continue;
        }
        cursor += skippable.length();
        while (cursor < span.end() && Character.isWhitespace(docText.charAt(cursor))) {
          cursor++;
        }
        break;
      }

      // Match the next terminal node against the next word in the text.
      int matched = matchTextToTree(docText, cursor, leaf.word);
      if (matched <= 0) {
        System.err.println(
            "PTBReader.addAnnotations:  Cannot determine parse tree offset for word " + leaf.word);
        System.err.println("  at document offset " + cursor + " in sentence");
        System.err.println("  " + doc.text(span));
        return;
      }

      // The terminal's extent includes the whitespace following the word.
      int wordEnd = cursor + matched;
      while (wordEnd < span.end() && Character.isWhitespace(docText.charAt(wordEnd))) {
        wordEnd++;
      }
      leaf.start = cursor;
      leaf.end = wordEnd;
      cursor = wordEnd;
    }

    if (!jetCategories) {
      determineNonTerminalSpans(tree, span.start());
      setAnnotations(tree, doc);
    } else {
      setJetAnnotations(tree, span, doc);
      StatParser.deleteUnusedConstits(doc, span, tree.ann);
    }
  }

Beispiel #8

Datei anzeigen

Datei: ElementTest.java Projekt: haggisandchips/jsoup

  /**
   * Setting the text of an element replaces all of its children: after the call the element
   * reports the new text and the nested {@code <p>} can no longer be selected.
   */
  @Test
  public void testSetText() {
    Document parsed = Jsoup.parse("<div id=1>Hello <p>there <b>now</b></p></div>");

    // Text before the change, for the whole document and for the nested paragraph.
    assertEquals("Hello there now", parsed.text());
    assertEquals("there now", parsed.select("p").get(0).text());

    Element replaced = parsed.getElementById("1").text("Gone");

    assertEquals("Gone", replaced.text());
    assertEquals(0, parsed.select("p").size());
  }

Beispiel #9

Datei anzeigen

Datei: PTBReader.java Projekt: keeyon2/NYU-School-Shizzle

  /**
   * Converts a set of Penn TreeBank files into text documents. Invoked by: PTBReader inputDir
   * outputDir. Converts all files with extension .mrg in inputDir to text documents, and writes
   * them into outputDir, keeping each file's path relative to inputDir (with its suffix removed).
   *
   * <p>Prints a usage line and exits with status 1 unless exactly two arguments are given.
   *
   * @param args {@code args[0]} is the input directory, {@code args[1]} the output directory
   * @throws Exception if a file cannot be loaded or written
   */
  public static void main(String[] args) throws Exception {
    if (args.length != 2) {
      // Name the two expected arguments so the usage line is actually usable.
      System.out.println("usage: java " + PTBReader.class.getName() + " <inputDir> <outputDir>");
      System.exit(1);
    }

    File inputDir = new File(args[0]);
    File outputDir = new File(args[1]);
    PTBReader parser = new PTBReader();
    for (File file : getFiles(inputDir, ".mrg")) {
      String outFilename = removeSuffix(getRelativePath(inputDir, file));
      File outFile = new File(outputDir, outFilename);
      outFile.getParentFile().mkdirs();

      Writer out = new FileWriter(outFile);
      try {
        Document doc = parser.load(file).getDocument();
        out.write(doc.text());
      } finally {
        // Close even when loading or writing fails, so the file handle is not leaked.
        out.close();
      }
    }
  }

Beispiel #10

Datei anzeigen

Datei: DocumentTest.java Projekt: testIT-LivingDoc/livingdoc-core

 /** Builds a Document from the current {@code tables} fixture via {@code Document.text}. */
 private Document document() {
   Document fromTables = Document.text(tables);
   return fromTables;
 }

Beispiel #11

Datei anzeigen

Datei: ElementTest.java Projekt: haggisandchips/jsoup

 /**
  * Whitespace inside a paragraph is collapsed in the document text, while whitespace inside
  * {@code <pre>} is kept as written.
  */
 @Test
 public void testKeepsPreText() {
   Document parsed =
       Jsoup.parse("<p>Hello \n \n there.</p> <div><pre>  What's \n\n  that?</pre>");
   String extracted = parsed.text();
   assertEquals("Hello there.   What's \n\n  that?", extracted);
 }

Beispiel #12

Datei anzeigen

Datei: ElementTest.java Projekt: haggisandchips/jsoup

 /**
  * Checks the text of the whole {@code reference} document and of its second {@code <p>}
  * element.
  */
 @Test
 public void testGetText() {
   Document parsed = Jsoup.parse(reference);

   String wholeText = parsed.text();
   assertEquals("Hello Another element", wholeText);

   String secondParagraph = parsed.getElementsByTag("p").get(1).text();
   assertEquals("Another element", secondParagraph);
 }