package com.aspose.pdf.examples.AsposePdfExamples.Text;
import com.aspose.pdf.Document;
import com.aspose.pdf.TextFragment;
import com.aspose.pdf.TextFragmentAbsorber;
import com.aspose.pdf.TextFragmentCollection;
import com.aspose.pdf.TextSegment;
/**
 * Example: searches a PDF for a phrase and prints details of every text
 * segment that belongs to a matching text fragment.
 *
 * <p>The program opens {@code input.pdf}, runs a {@link TextFragmentAbsorber}
 * configured with the phrase {@code "sample"} over the document's page
 * collection, and writes each segment's text, position, font properties,
 * font size and foreground color to standard output.
 */
public class SearchAndGetTextSegmentsFromPagesOfPDF {

    /**
     * Runs the example.
     *
     * @param args command-line arguments (not used)
     */
    public static void main(String[] args) {
        // Open document
        Document pdfDocument = new Document("input.pdf");
        try {
            // Create TextFragmentAbsorber object to find all instances of the input search phrase
            TextFragmentAbsorber textFragmentAbsorber = new TextFragmentAbsorber("sample");
            // Accept the absorber on the page collection (all pages), not just a single page
            pdfDocument.getPages().accept(textFragmentAbsorber);
            // Get the extracted text fragments into collection
            TextFragmentCollection textFragmentCollection = textFragmentAbsorber.getTextFragments();
            // Loop through the text fragments
            for (TextFragment textFragment : (Iterable<TextFragment>) textFragmentCollection) {
                // Iterate through the text segments of the current fragment
                for (TextSegment textSegment : (Iterable<TextSegment>) textFragment.getSegments()) {
                    printSegmentDetails(textSegment);
                }
            }
            /*
            // ExStart:Info
            // Accept the absorber for the first page of document.
            pdfDocument.getPages().get_Item(1).accept(textFragmentAbsorber);
            // ExEnd:Info
            */
        } finally {
            // Release the resources held by the document even if the search or printing fails
            pdfDocument.close();
        }
    }

    /**
     * Prints the text, position, font details, font size and foreground color
     * of a single text segment to standard output.
     *
     * @param textSegment the segment whose properties are printed
     */
    private static void printSegmentDetails(TextSegment textSegment) {
        System.out.println("Text :- " + textSegment.getText());
        System.out.println("Position :- " + textSegment.getPosition());
        System.out.println("XIndent :- " + textSegment.getPosition().getXIndent());
        System.out.println("YIndent :- " + textSegment.getPosition().getYIndent());
        System.out.println("Font - Name :- " + textSegment.getTextState().getFont().getFontName());
        System.out.println("Font - IsAccessible :- " + textSegment.getTextState().getFont().isAccessible());
        System.out.println("Font - IsEmbedded - " + textSegment.getTextState().getFont().isEmbedded());
        System.out.println("Font - IsSubset :- " + textSegment.getTextState().getFont().isSubset());
        System.out.println("Font Size :- " + textSegment.getTextState().getFontSize());
        System.out.println("Foreground Color :- " + textSegment.getTextState().getForegroundColor());
    }
}