org.ujmp.pdfbox.PdfUtil.java Source code

Java tutorial

Introduction

Here is the source code for org.ujmp.pdfbox.PdfUtil.java

Source

/*
 * Copyright (C) 2008-2015 by Holger Arndt
 *
 * This file is part of the Universal Java Matrix Package (UJMP).
 * See the NOTICE file distributed with this work for additional
 * information regarding copyright ownership and licensing.
 *
 * UJMP is free software; you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as
 * published by the Free Software Foundation; either version 2
 * of the License, or (at your option) any later version.
 *
 * UJMP is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with UJMP; if not, write to the
 * Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,
 * Boston, MA  02110-1301  USA
 */

package org.ujmp.pdfbox;

import java.io.ByteArrayInputStream;
import java.io.File;
import java.io.IOException;
import java.io.InputStream;

import org.apache.pdfbox.pdmodel.PDDocument;
import org.apache.pdfbox.util.PDFTextStripper;

/**
 * Static helpers for extracting the plain text of a PDF document with
 * PDFBox. Each public method loads a {@link PDDocument}, runs a
 * default-constructed {@link PDFTextStripper} over it and closes the
 * document again before returning.
 */
public abstract class PdfUtil {

    /**
     * Extracts the text of the PDF stored in the given file.
     *
     * @param file
     *            the PDF file to read
     * @return the text produced by {@link PDFTextStripper#getText(PDDocument)}
     * @throws IOException
     *             if loading the document, extracting its text or closing
     *             the document fails
     */
    public static final String getTextFromFile(File file) throws IOException {
        return extractTextAndClose(PDDocument.load(file));
    }

    /**
     * Extracts the text of the PDF read from the given stream.
     * <p>
     * This method does not itself close {@code inputStream}; only the
     * {@link PDDocument} created from it is closed.
     *
     * @param inputStream
     *            stream providing the PDF data
     * @return the text produced by {@link PDFTextStripper#getText(PDDocument)}
     * @throws IOException
     *             if loading the document, extracting its text or closing
     *             the document fails
     */
    public static final String getTextFromStream(InputStream inputStream) throws IOException {
        return extractTextAndClose(PDDocument.load(inputStream));
    }

    /**
     * Extracts the text of the PDF held in the given byte array by wrapping
     * it in a {@link ByteArrayInputStream} and delegating to
     * {@link #getTextFromStream(InputStream)}.
     *
     * @param data
     *            the raw bytes of the PDF
     * @return the extracted text
     * @throws IOException
     *             if {@link #getTextFromStream(InputStream)} fails
     */
    public static final String getTextFromBytes(byte[] data) throws IOException {
        ByteArrayInputStream is = new ByteArrayInputStream(data);
        return getTextFromStream(is);
    }

    /**
     * Runs a new {@link PDFTextStripper} over the document and always closes
     * the document afterwards.
     */
    private static String extractTextAndClose(PDDocument pdd) throws IOException {
        try {
            // The stripper is created inside the try block so that a failure
            // in its constructor also leads to the document being closed.
            PDFTextStripper pts = new PDFTextStripper();
            return pts.getText(pdd);
        } finally {
            // Close on both the normal and the exceptional path; previously
            // the document stayed open whenever text extraction threw.
            pdd.close();
        }
    }

}