public static void main(String[] args) throws Exception { // The path to the documents directory. String dataDir = "src/programmersguide/workingwithasposepdf/workingwithtext/searchandgettextfrompagesofpdf/data/"; // open document com.aspose.pdf.Document pdfDocument = new com.aspose.pdf.Document(dataDir + "input.pdf"); // create TextAbsorber object to find all instances of the input search phrase com.aspose.pdf.TextFragmentAbsorber textFragmentAbsorber = new com.aspose.pdf.TextFragmentAbsorber("sample"); // accept the absorber for all the pages pdfDocument.getPages().accept(textFragmentAbsorber); // In order to search a text an get properties associated with it, please provide the page index // against which you need to get the information. Take a look over following code line. // accept the absorber for first page of document // pdfDocument.getPages().get_Item(1).accept(textFragmentAbsorber); // get the extracted text fragments into collection com.aspose.pdf.TextFragmentCollection textFragmentCollection = textFragmentAbsorber.getTextFragments(); // loop through the fragments for (com.aspose.pdf.TextFragment textFragment : (Iterable<com.aspose.pdf.TextFragment>) textFragmentCollection) { System.out.println("Text :- " + textFragment.getText()); System.out.println("Position :- " + textFragment.getPosition()); System.out.println("XIndent :- " + textFragment.getPosition().getXIndent()); System.out.println("YIndent :- " + textFragment.getPosition().getYIndent()); System.out.println("Font - Name :- " + textFragment.getTextState().getFont().getFontName()); System.out.println( "Font - IsAccessible :- " + textFragment.getTextState().getFont().isAccessible()); System.out.println( "Font - IsEmbedded - " + textFragment.getTextState().getFont().isEmbedded()); System.out.println("Font - IsSubset :- " + textFragment.getTextState().getFont().isSubset()); System.out.println("Font Size :- " + textFragment.getTextState().getFontSize()); System.out.println("Foreground Color :- " + textFragment.getTextState().getForegroundColor()); System.out.println("\n"); } // Print message System.out.println("Successfully finished."); }
public static void main(String[] args) throws Exception { // The path to the documents directory. String dataDir = Utils.getDataDir(SearchGetTextPage.class); // open document com.aspose.pdf.Document pdfDocument = new com.aspose.pdf.Document(dataDir + "input.pdf"); // create TextAbsorber object to find all instances of the input search phrase com.aspose.pdf.TextFragmentAbsorber textFragmentAbsorber = new com.aspose.pdf.TextFragmentAbsorber("sample"); // accept the absorber for first page of document pdfDocument.getPages().get_Item(1).accept(textFragmentAbsorber); // get the extracted text fragments into collection com.aspose.pdf.TextFragmentCollection textFragmentCollection = textFragmentAbsorber.getTextFragments(); // loop through the fragments for (com.aspose.pdf.TextFragment textFragment : (Iterable<com.aspose.pdf.TextFragment>) textFragmentCollection) { System.out.println("Text :- " + textFragment.getText()); System.out.println("Position :- " + textFragment.getPosition()); System.out.println("XIndent :- " + textFragment.getPosition().getXIndent()); System.out.println("YIndent :- " + textFragment.getPosition().getYIndent()); System.out.println("Font - Name :- " + textFragment.getTextState().getFont().getFontName()); System.out.println( "Font - IsAccessible :- " + textFragment.getTextState().getFont().isAccessible()); System.out.println( "Font - IsEmbedded - " + textFragment.getTextState().getFont().isEmbedded()); System.out.println("Font - IsSubset :- " + textFragment.getTextState().getFont().isSubset()); System.out.println("Font Size :- " + textFragment.getTextState().getFontSize()); System.out.println("Foreground Color :- " + textFragment.getTextState().getForegroundColor()); System.out.println("\n"); } // Print message System.out.println("Successfully finished."); }