Package org.apache.pdfbox.util

Source Code of org.apache.pdfbox.util.TestPDFToImage

/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements.  See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License.  You may obtain a copy of the License at
*
*      http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.pdfbox.util;

import java.io.File;
import java.io.FileInputStream;
import java.io.FilenameFilter;
import java.io.IOException;

import junit.framework.Test;
import junit.framework.TestCase;
import junit.framework.TestSuite;

import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.pdfbox.pdmodel.PDDocument;

/**
* Test suite for PDFTextStripper.
*
* FILE SET VALIDATION
*
* This test suite is designed to test PDFToImage using a set of PDF
* files and known good output for each.  The default mode of testAll()
* is to process each *.pdf file in "test/input".  An output file is
* created in "test/output" with the same name as the PDF file, plus an
* additional ".jpg" suffix.
*
* The output file is then tested against a known good result file from
* the input directory (again, with the same name as the tested PDF file,
* but with the additional ".jpg" suffix).
*
* Currently, testing against known output is simply a byte-for-byte comparison
*
*In the future, testing against the known output may be accomplished using PerceptualDiff
*  http://sourceforge.net/projects/pdiff
*
*
* @author <a href="mailto:DanielWilson@Users.Sourceforge.net">Daniel Wilson</a>
* @author <a href="mailto:ben@benlitchfield.com">Ben Litchfield</a>
* @version $Revision: 1.1 $
*/
public class TestPDFToImage extends TestCase
{

    /**
     * Logger instance.
     */
    private static final Log log = LogFactory.getLog(TestPDFToImage.class);

    private boolean bFail = false;
    private PDFImageWriter writer = null;
    private File mcurFile = null;

    /**
     * Test class constructor.
     *
     * @param name The name of the test class.
     *
     * @throws IOException If there is an error creating the test.
     */
    public TestPDFToImage( String name ) throws IOException
    {
        super( name );
        writer = new PDFImageWriter();
    }

    /**
     * Test suite setup.
     */
    public void setUp()
    {
        // If you want to test a single file using DEBUG logging, from an IDE,
        // you can do something like this:
        //
        // System.setProperty("org.apache.pdfbox.util.TextStripper.file", "FVS318Ref.pdf");
    }

    /**
     * Validate text extraction on a single file.
     *
     * @param file The file to validate
     * @param bLogResult Whether to log the extracted text
     * @param inDir Name of the input directory
     * @param outDir Name of the output directory
     * @throws Exception when there is an exception
     */
    public void doTestFile(File file, boolean bLogResult, String inDir, String outDir)
        throws Exception
    {
        PDDocument document = null;

        log.info("Preparing to convert " + file.getName());
        try
        {
            document =  PDDocument.load(file);
            writer.writeImage(document, "png", "", 1, Integer.MAX_VALUE, outDir + file.getName() + "-");
        }
        catch(Exception e)
        {
            this.bFail=true;
            log.error("Error converting file " + file.getName(), e);
        }
        finally
        {
            document.close();
        }

        //Now check the resulting files ... did we get identical PNG(s)?
        try
        {
            mcurFile = file;

            File[] outFiles = new File(outDir).listFiles(new FilenameFilter()
              {
                public boolean accept(File dir, String name)
                {
                    return (name.endsWith(".png") && name.startsWith(mcurFile.getName(),0));
                }
              });
                for (int n = 0; n < outFiles.length; n++)
                {
                    File inFile = new File(inDir + outFiles[n].getName());
                    if (!inFile.exists() ||
                        !filesAreIdentical(outFiles[n], inFile))
                    {
                        this.bFail=true;
                        log.info("Input and output not identical for file: " + inFile.getName());
                    }
                }
        }
        catch(Exception e)
        {
            this.bFail=true;
            log.error("Error comparing file output for " + file.getName(), e);
        }

    }

    /**
     * Test to validate image rendering of file set.
     *
     * @throws Exception when there is an exception
     */
    public void testRenderImage()
        throws Exception
    {
        String filename = System.getProperty("org.apache.pdfbox.util.TextStripper.file");
        String inDir = "src/test/resources/input/rendering";
        String outDir = "target/test-output/rendering/";
        String inDirExt = "target/test-input-ext/rendering";
        String outDirExt = "target/test-output-ext/rendering";

            if ((filename == null) || (filename.length() == 0))
            {
                File[] testFiles = new File(inDir).listFiles(new FilenameFilter()
                {
                    public boolean accept(File dir, String name)
                    {
                        return (name.endsWith(".pdf") || name.endsWith(".ai"));
                    }
                });

                for (int n = 0; n < testFiles.length; n++)
                {
                    doTestFile(testFiles[n], false, inDir, outDir);
                }
                testFiles = new File(inDirExt).listFiles(new FilenameFilter()
                {
                    public boolean accept(File dir, String name)
                    {
                        return (name.endsWith(".pdf") || name.endsWith(".ai"));
                    }
                });
                if (testFiles != null)
                {
                    for (int n = 0; n < testFiles.length; n++)
                    {
                        doTestFile(testFiles[n], false, inDirExt, outDirExt);
                    }
                }
            }
            else
            {
                doTestFile(new File(inDir, filename), true, inDir, outDir);
            }

            if (this.bFail)
            {
                fail("One or more failures, see test log for details");
            }
    }

    /**
     * Set the tests in the suite for this test class.
     *
     * @return the Suite.
     */
    public static Test suite()
    {
        return new TestSuite( TestPDFToImage.class );
    }

    /**
     * Command line execution.
     *
     * @param args Command line arguments.
     */
    public static void main( String[] args )
    {
        String[] arg = {TestPDFToImage.class.getName() };
        junit.textui.TestRunner.main( arg );
    }

    private boolean filesAreIdentical(File left, File right) throws IOException
    {
        //http://forum.java.sun.com/thread.jspa?threadID=688105&messageID=4003259

        /* -- I reworked ASSERT's into IF statement -- dwilson
        assert left != null;
        assert right != null;
        assert left.exists();
        assert right.exists();
        */
        if(left != null && right != null && left.exists() && right.exists())
        {
            if (left.length() != right.length())
            {
                return false;
            }

            FileInputStream lin = new FileInputStream(left);
            FileInputStream rin = new FileInputStream(right);
            try
            {
                byte[] lbuffer = new byte[4096];
                byte[] rbuffer = new byte[lbuffer.length];
                for (int lcount = 0; (lcount = lin.read(lbuffer)) > 0;)
                {
                    int bytesRead = 0;
                    for (int rcount = 0; (rcount = rin.read(rbuffer, bytesRead, lcount - bytesRead)) > 0;)
                    {
                        bytesRead += rcount;
                    }
                    for (int byteIndex = 0; byteIndex < lcount; byteIndex++)
                    {
                        if (lbuffer[byteIndex] != rbuffer[byteIndex])
                        {
                            return false;
                        }
                    }
                }
            }
            finally
            {
                lin.close();
                rin.close();
            }
            return true;
        }
        else
        {
            return false;
        }
    }

}
TOP

Related Classes of org.apache.pdfbox.util.TestPDFToImage

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.