Source Code of org.jpedal.objects.structuredtext.MarkedContentGenerator

/**
* ===========================================
* Java Pdf Extraction Decoding Access Library
* ===========================================
*
* Project Info:  http://www.jpedal.org
* (C) Copyright 1997-2012, IDRsolutions and Contributors.
*
*   This file is part of JPedal
*
    This library is free software; you can redistribute it and/or
    modify it under the terms of the GNU Lesser General Public
    License as published by the Free Software Foundation; either
    version 2.1 of the License, or (at your option) any later version.


    This library is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
    Lesser General Public License for more details.


    You should have received a copy of the GNU Lesser General Public
    License along with this library; if not, write to the Free Software
    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA




*
* ---------------
* MarkedContentGenerator.java
* ---------------
*/
package org.jpedal.objects.structuredtext;


import org.jpedal.PdfDecoder;
import org.jpedal.io.ObjectStore;
import org.jpedal.io.PdfObjectReader;
import org.jpedal.objects.PageLookup;
import org.jpedal.objects.PdfPageData;
import org.jpedal.objects.PdfResources;
import org.jpedal.objects.layers.PdfLayerList;
import org.jpedal.objects.raw.PageObject;
import org.jpedal.objects.raw.PdfDictionary;
import org.jpedal.objects.raw.PdfObject;
import org.jpedal.objects.raw.MCObject;


import org.jpedal.parser.PdfStreamDecoder;
import org.jpedal.parser.ValueTypes;
import org.jpedal.utils.LogWriter;
import org.jpedal.utils.repositories.Vector_Int;
import org.jpedal.utils.repositories.Vector_Rectangle;
import org.w3c.dom.Document;
import org.w3c.dom.Element;


import org.w3c.dom.Text;


import javax.xml.parsers.DocumentBuilder;
import javax.xml.parsers.DocumentBuilderFactory;
import javax.xml.parsers.ParserConfigurationException;
import java.awt.*;
import java.util.HashMap;
import java.util.Map;


/**
 * extract as marked content
 */
public class MarkedContentGenerator {
  
  private PdfObjectReader currentPdfFile;


    private DocumentBuilder db=null;


    private Document doc;


    private Element root;


    private Map pageStreams=new HashMap();


  private PdfObject structTreeRootObj;


    private PdfResources res;


    private PdfLayerList layers;


    private PdfPageData pdfPageData;


    private boolean isDecoding=false;


  /**
   * main entry paint
   */
  public Document getMarkedContentTree(PdfResources res, PdfPageData pdfPageData, PdfObjectReader currentPdfFile) {


        this.structTreeRootObj=res.getPdfObject(PdfResources.StructTreeRootObj);
        //PdfObject markInfoObj=res.getPdfObject(PdfResources.MarkInfoObj);  //not used at present


        this.res=res;
        this.layers=res.getPdfLayerList();;


        this.pdfPageData=pdfPageData;


        return null;
        /**/


  }




    /**
     * extract marked content - not yet live
     */
    final synchronized private void decodePageForMarkedContent(int pageNumber, PdfObject pdfObject, Object pageStream) throws Exception {


        if (isDecoding) {


            if(LogWriter.isOutput())
                LogWriter.writeLog("[PDF]WARNING - this file is being decoded already");


        } else {


            //if no tree use page
            if(pdfObject==null){
                String currentPageOffset = (String) currentPdfFile.getReferenceforPage(pageNumber);


                pdfObject=new PageObject(currentPageOffset);
                currentPdfFile.readObject(pdfObject);


            }else{
                pageNumber=currentPdfFile.convertObjectToPageNumber(new String(pdfObject.getUnresolvedData()));
                currentPdfFile.checkResolved(pdfObject);
            }


            try{
                isDecoding=true;


                /** read page or next pages */
                if (pdfObject != null) {


                    /** the ObjectStore for this file */
                    ObjectStore objectStoreRef = new ObjectStore();


                    PdfStreamDecoder current = new PdfStreamDecoder(currentPdfFile, false, layers);
                    current.setParameters(true, false, 0,PdfDecoder.TEXT + PdfDecoder.RAWIMAGES + PdfDecoder.FINALIMAGES);
                    current.setXMLExtraction(false);
                    current.setObjectValue(ValueTypes.Name, "markedContent");
                    current.setObjectValue(ValueTypes.ObjectStore,objectStoreRef);
                    current.setObjectValue(ValueTypes.StatusBar, null);
                    current.setObjectValue(ValueTypes.PDFPageData,pdfPageData);
                    current.setIntValue(ValueTypes.PageNum, pageNumber);


                    res.setupResources(current, false, pdfObject.getDictionary(PdfDictionary.Resources), pageNumber, currentPdfFile);


                    current.setObjectValue(ValueTypes.MarkedContent,pageStream);


                    current.decodePageContent(pdfObject);


                    objectStoreRef.flush();


                }
            }catch(Exception e){
                e.printStackTrace();
            }finally {
                isDecoding=false;
            }
        }
    }
}
Source Code of org.jpedal.objects.structuredtext.MarkedContentGenerator

Related Classes of org.jpedal.objects.structuredtext.MarkedContentGenerator