/** * Copyright (c) 2004, www.pdfbox.org * All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions are met: * * 1. Redistributions of source code must retain the above copyright notice, * this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright notice, * this list of conditions and the following disclaimer in the documentation * and/or other materials provided with the distribution. * 3. Neither the name of pdfbox; nor the names of its * contributors may be used to endorse or promote products derived from this * software without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. * * http://www.pdfbox.org * */ package org.pdfbox; import java.io.IOException; import java.io.InputStream; import java.io.FileInputStream; import java.io.FileOutputStream; import java.util.List; import org.pdfbox.exceptions.InvalidPasswordException; import org.pdfbox.exceptions.COSVisitorException; import org.pdfbox.pdfparser.PDFParser; import org.pdfbox.pdmodel.PDDocument; import org.pdfbox.pdfwriter.COSWriter; import org.pdfbox.util.Splitter; /** * This is the main program that will take a pdf document and split it into * a number of other documents. * * @author Ben Litchfield (ben@csh.rit.edu) * @version $Revision: 1.5 $ */ public class PDFSplit { private static final String PASSWORD = "-password"; private static final String SPLIT = "-split"; /** * Infamous main method. * * @param args Command line arguments, should be one and a reference to a file. * * @throws Exception If there is an error parsing the document. */ public static void main( String[] args ) throws Exception { PDFSplit split = new PDFSplit(); split.split( args ); } private void split( String[] args ) throws Exception { String password = ""; String split = "1"; Splitter splitter = new Splitter(); String pdfFile = null; for( int i=0; i<args.length; i++ ) { if( args[i].equals( PASSWORD ) ) { i++; if( i >= args.length ) { usage(); } password = args[i]; } else if( args[i].equals( SPLIT ) ) { i++; if( i >= args.length ) { usage(); } split = args[i]; } else { if( pdfFile == null ) { pdfFile = args[i]; } } } if( pdfFile == null ) { usage(); } InputStream input = null; PDDocument document = null; List documents = null; try { input = new FileInputStream( pdfFile ); document = parseDocument( input ); if( document.isEncrypted() ) { try { document.decrypt( password ); } catch( InvalidPasswordException e ) { if( args.length == 4 )//they supplied the wrong password { System.err.println( "Error: The supplied password is incorrect." ); System.exit( 2 ); } else { //they didn't suppply a password and the default of "" was wrong. System.err.println( "Error: The document is encrypted." ); usage(); } } } splitter.setSplitAtPage( Integer.parseInt( split ) ); documents = splitter.split( document ); for( int i=0; i<documents.size(); i++ ) { PDDocument doc = (PDDocument)documents.get( i ); String fileName = pdfFile.substring(0, pdfFile.length()-4 ) + "-" + i + ".pdf"; writeDocument( doc, fileName ); doc.close(); } } finally { if( input != null ) { input.close(); } if( document != null ) { document.close(); } for( int i=0; documents != null && i<documents.size(); i++ ) { PDDocument doc = (PDDocument)documents.get( i ); doc.close(); } } } private static final void writeDocument( PDDocument doc, String fileName ) throws IOException, COSVisitorException { FileOutputStream output = null; COSWriter writer = null; try { output = new FileOutputStream( fileName ); writer = new COSWriter( output ); writer.write( doc ); } finally { if( output != null ) { output.close(); } if( writer != null ) { writer.close(); } } } /** * This will parse a document. * * @param input The input stream for the document. * * @return The document. * * @throws IOException If there is an error parsing the document. */ private static PDDocument parseDocument( InputStream input )throws IOException { PDFParser parser = new PDFParser( input ); parser.parse(); return parser.getPDDocument(); } /** * This will print the usage requirements and exit. */ private static void usage() { System.err.println( "Usage: java org.pdfbox.PDFSplit [OPTIONS] <PDF file>\n" + " -password <password> Password to decrypt document\n" + " -split <integer> split after this many pages\n" + " <PDF file> The PDF document to use\n" ); System.exit( 1 ); } }