List of usage examples for the constructor RegionTextRenderFilter(Rectangle) of class com.itextpdf.text.pdf.parser.RegionTextRenderFilter
public RegionTextRenderFilter(Rectangle filterRect)
From source file:javaapplication1.JavaApplication1.java
/** * Parses a specific area of a PDF to a plain text file. * @param pdf the original PDF//from w w w . j a v a 2s. co m * @param txt the resulting text * @throws IOException */ public String mycheckline(PdfReader reader, int pheight, int pwidth, int lh, int page) throws IOException { // PrintWriter out = new PrintWriter(new FileOutputStream(txt)); Rectangle rect = new Rectangle(0, pheight - lh, pwidth / 3, pheight - lh - fontchecksize); RenderFilter filter = new RegionTextRenderFilter(rect); TextExtractionStrategy strategy = new FilteredTextRenderListener(new LocationTextExtractionStrategy(), filter); return (PdfTextExtractor.getTextFromPage(reader, page, strategy)); }
From source file:Project.data.preparation.ExtractPageContentArea.java
public void parsePdf(String pdf, int pageNum, int upper_x, int upper_y, int lower_x, int lower_y) throws IOException { PdfReader reader = new PdfReader(pdf); // System.out.println("(" + upper_x + " , " + upper_y + ") to ( " + lower_x + " , " + lower_y + ")"); rect = new Rectangle(upper_x, upper_y, lower_x, lower_y); RenderFilter filter = new RegionTextRenderFilter(getRect()); TextExtractionStrategy strategy;/*from ww w . ja v a 2 s .c o m*/ strategy = new FilteredTextRenderListener(new LocationTextExtractionStrategy(), filter); TextCropped = PdfTextExtractor.getTextFromPage(reader, pageNum, strategy); setTextCropped(TextCropped); reader.close(); }