aboutsummaryrefslogtreecommitdiff
path: root/src/main/java/test
diff options
context:
space:
mode:
authortknall <tknall@7b5415b0-85f9-ee4d-85bd-d5d0c3b42d1c>2008-11-25 12:03:13 +0000
committertknall <tknall@7b5415b0-85f9-ee4d-85bd-d5d0c3b42d1c>2008-11-25 12:03:13 +0000
commitc68ad0ec056b37c82debebcecfcde1866d61b4d9 (patch)
tree9e3ec28a87a5c29d1087fd03cc4c77899e2c758c /src/main/java/test
parent2eae233bf806c076acb8afea41eb16552687bcea (diff)
downloadpdf-as-3-c68ad0ec056b37c82debebcecfcde1866d61b4d9.tar.gz
pdf-as-3-c68ad0ec056b37c82debebcecfcde1866d61b4d9.tar.bz2
pdf-as-3-c68ad0ec056b37c82debebcecfcde1866d61b4d9.zip
Removing pdfbox from source.
git-svn-id: https://joinup.ec.europa.eu/svn/pdf-as/trunk@301 7b5415b0-85f9-ee4d-85bd-d5d0c3b42d1c
Diffstat (limited to 'src/main/java/test')
-rw-r--r--src/main/java/test/pdfbox/TestAll.java88
-rw-r--r--src/main/java/test/pdfbox/cos/TestCOSString.java92
-rw-r--r--src/main/java/test/pdfbox/cos/package.html9
-rw-r--r--src/main/java/test/pdfbox/encryption/TestEncryption.java179
-rw-r--r--src/main/java/test/pdfbox/encryption/package.html9
-rw-r--r--src/main/java/test/pdfbox/filter/TestFilters.java182
-rw-r--r--src/main/java/test/pdfbox/filter/package.html9
-rw-r--r--src/main/java/test/pdfbox/package.html9
-rw-r--r--src/main/java/test/pdfbox/pdfparser/TestPDFParser.java126
-rw-r--r--src/main/java/test/pdfbox/pdfparser/package.html9
-rw-r--r--src/main/java/test/pdfbox/pdmodel/TestFDF.java292
-rw-r--r--src/main/java/test/pdfbox/pdmodel/interactive/form/TestFields.java144
-rw-r--r--src/main/java/test/pdfbox/pdmodel/interactive/form/package.html9
-rw-r--r--src/main/java/test/pdfbox/pdmodel/package.html9
-rw-r--r--src/main/java/test/pdfbox/util/TestTextStripper.java371
-rw-r--r--src/main/java/test/pdfbox/util/TestTextStripperPerformance.java173
-rw-r--r--src/main/java/test/pdfbox/util/package.html9
17 files changed, 0 insertions, 1719 deletions
diff --git a/src/main/java/test/pdfbox/TestAll.java b/src/main/java/test/pdfbox/TestAll.java
deleted file mode 100644
index c1882fc..0000000
--- a/src/main/java/test/pdfbox/TestAll.java
+++ /dev/null
@@ -1,88 +0,0 @@
-/**
- * Copyright (c) 2003-2004, www.pdfbox.org
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions are met:
- *
- * 1. Redistributions of source code must retain the above copyright notice,
- * this list of conditions and the following disclaimer.
- * 2. Redistributions in binary form must reproduce the above copyright notice,
- * this list of conditions and the following disclaimer in the documentation
- * and/or other materials provided with the distribution.
- * 3. Neither the name of pdfbox; nor the names of its
- * contributors may be used to endorse or promote products derived from this
- * software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
- * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
- * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
- * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
- * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
- * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
- * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * http://www.pdfbox.org
- *
- */
-package test.pdfbox;
-
-import test.pdfbox.cos.TestCOSString;
-import test.pdfbox.encryption.TestEncryption;
-import test.pdfbox.filter.TestFilters;
-import test.pdfbox.pdmodel.TestFDF;
-import test.pdfbox.pdmodel.interactive.form.TestFields;
-import junit.framework.Test;
-import junit.framework.TestCase;
-import junit.framework.TestSuite;
-
-/**
- * This is a holder for all test cases in the pdfbox system.
- *
- * @author Ben Litchfield (ben@csh.rit.edu)
- * @version $Revision: 1.6 $
- */
-public class TestAll extends TestCase
-{
-
- /**
- * Constructor.
- *
- * @param name The name of the test to run.
- */
- public TestAll( String name )
- {
- super( name );
- }
-
- /**
- * The main method to run tests.
- *
- * @param args The command line arguments.
- */
- public static void main( String[] args )
- {
- String[] arg = {TestAll.class.getName() };
- junit.textui.TestRunner.main( arg );
- }
-
- /**
- * This will get the suite of test that this class holds.
- *
- * @return All of the tests that this class holds.
- */
- public static Test suite()
- {
- TestSuite suite = new TestSuite();
- suite.addTest( TestFilters.suite() );
- suite.addTest( TestFDF.suite() );
- suite.addTest( TestFields.suite() );
- suite.addTest( TestEncryption.suite() );
- suite.addTest( TestFDF.suite() );
- suite.addTest( TestCOSString.suite() );
- return suite;
- }
-} \ No newline at end of file
diff --git a/src/main/java/test/pdfbox/cos/TestCOSString.java b/src/main/java/test/pdfbox/cos/TestCOSString.java
deleted file mode 100644
index 19b3ca0..0000000
--- a/src/main/java/test/pdfbox/cos/TestCOSString.java
+++ /dev/null
@@ -1,92 +0,0 @@
-/**
- * Copyright (c) 2003-2004, www.pdfbox.org
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions are met:
- *
- * 1. Redistributions of source code must retain the above copyright notice,
- * this list of conditions and the following disclaimer.
- * 2. Redistributions in binary form must reproduce the above copyright notice,
- * this list of conditions and the following disclaimer in the documentation
- * and/or other materials provided with the distribution.
- * 3. Neither the name of pdfbox; nor the names of its
- * contributors may be used to endorse or promote products derived from this
- * software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
- * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
- * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
- * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
- * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
- * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
- * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * http://www.pdfbox.org
- *
- */
-package test.pdfbox.cos;
-
-import java.io.IOException;
-
-import junit.framework.Test;
-import junit.framework.TestCase;
-import junit.framework.TestSuite;
-
-import org.pdfbox.cos.COSString;
-
-/**
- * This will test all of the filters in the PDFBox system.
- *
- * @author Ben Litchfield (ben@csh.rit.edu)
- * @version $Revision$
- */
-public class TestCOSString extends TestCase
-{
-
- /**
- * Constructor.
- *
- * @param name The name of the test to run.
- */
- public TestCOSString( String name )
- {
- super( name );
- }
-
- /**
- * This will get the suite of test that this class holds.
- *
- * @return All of the tests that this class holds.
- */
- public static Test suite()
- {
- return new TestSuite( TestCOSString.class );
- }
-
- /**
- * infamous main method.
- *
- * @param args The command line arguments.
- */
- public static void main( String[] args )
- {
- String[] arg = {TestCOSString.class.getName() };
- junit.textui.TestRunner.main( arg );
- }
-
- /**
- * This will test all of the filters in the system.
- *
- * @throws IOException If there is an exception while encoding.
- */
- public void testUnicode() throws IOException
- {
- String theString = "\u4e16";
- COSString string = new COSString( theString );
- assertTrue( string.getString().equals( theString ) );
- }
-} \ No newline at end of file
diff --git a/src/main/java/test/pdfbox/cos/package.html b/src/main/java/test/pdfbox/cos/package.html
deleted file mode 100644
index c64f742..0000000
--- a/src/main/java/test/pdfbox/cos/package.html
+++ /dev/null
@@ -1,9 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 3.2 Final//EN">
-<html>
-<head>
-
-</head>
-<body>
-These classes will be used to test the various COS objects that make up the core of PDFBox.
-</body>
-</html>
diff --git a/src/main/java/test/pdfbox/encryption/TestEncryption.java b/src/main/java/test/pdfbox/encryption/TestEncryption.java
deleted file mode 100644
index e13de2a..0000000
--- a/src/main/java/test/pdfbox/encryption/TestEncryption.java
+++ /dev/null
@@ -1,179 +0,0 @@
-/**
- * Copyright (c) 2004, www.pdfbox.org
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions are met:
- *
- * 1. Redistributions of source code must retain the above copyright notice,
- * this list of conditions and the following disclaimer.
- * 2. Redistributions in binary form must reproduce the above copyright notice,
- * this list of conditions and the following disclaimer in the documentation
- * and/or other materials provided with the distribution.
- * 3. Neither the name of pdfbox; nor the names of its
- * contributors may be used to endorse or promote products derived from this
- * software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
- * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
- * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
- * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
- * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
- * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
- * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * http://www.pdfbox.org
- *
- */
-package test.pdfbox.encryption;
-
-import java.io.ByteArrayInputStream;
-import java.io.ByteArrayOutputStream;
-
-import junit.framework.Test;
-import junit.framework.TestCase;
-import junit.framework.TestSuite;
-
-import org.apache.log4j.Logger;
-
-import org.pdfbox.encryption.PDFEncryption;
-
-/**
- * This will test the encryption algorithms in PDFBox.
- *
- * @author Ben Litchfield (ben@csh.rit.edu)
- * @version $Revision: 1.3 $
- */
-public class TestEncryption extends TestCase
-{
- private static Logger log = Logger.getLogger(TestEncryption.class);
-
- /**
- * Constructor.
- *
- * @param name The name of the test to run.
- */
- public TestEncryption( String name )
- {
- super( name );
- }
-
- /**
- * This will get the suite of test that this class holds.
- *
- * @return All of the tests that this class holds.
- */
- public static Test suite()
- {
- return new TestSuite( TestEncryption.class );
- }
-
- /**
- * infamous main method.
- *
- * @param args The command line arguments.
- */
- public static void main( String[] args )
- {
- String[] arg = {TestEncryption.class.getName() };
- junit.textui.TestRunner.main( arg );
- }
-
- /**
- * This will test some simple encryption.
- *
- * @throws Exception If there is an exception while encrypting.
- */
- public void testEncryption() throws Exception
- {
- byte[] key={0x65, 0x3d, 0x4f, 0x70, 0x0c };
- byte[] data={0x31, 0x20, 0x30, 0x20, 0x30, 0x20, 0x72, 0x67, 0x20, 0x30,
- 0x20, 0x30, 0x20, 0x33, 0x30, 0x38, 0x2e, 0x34, 0x37, 0x34,
- 0x37, 0x20, 0x35, 0x37, 0x2e, 0x36, 0x32, 0x37, 0x31, 0x20,
- 0x72, 0x65, 0x20, 0x66, 0x20, 0x30, 0x20, 0x47, 0x20, 0x31,
- 0x20, 0x77, 0x20, 0x30, 0x2e, 0x35, 0x20, 0x30, 0x2e, 0x35,
- 0x20, 0x33, 0x30, 0x37, 0x2e, 0x34, 0x37, 0x34, 0x37, 0x20,
- 0x35, 0x36, 0x2e, 0x36, 0x32, 0x37, 0x31, 0x20, 0x72, 0x65,
- 0x20, 0x73, 0x20, 0x2f, 0x54, 0x78, 0x20, 0x42, 0x4d, 0x43,
- 0x20, 0x71, 0x20, 0x31, 0x20, 0x31, 0x20, 0x33, 0x30, 0x36,
- 0x2e, 0x34, 0x37, 0x34, 0x37, 0x20, 0x35, 0x35, 0x2e, 0x36,
- 0x32, 0x37, 0x31, 0x20, 0x72, 0x65, 0x20, 0x57, 0x20, 0x6e,
- 0x20, 0x30, 0x20, 0x67, 0x20, 0x42, 0x54, 0x0a, 0x2f, 0x48,
- 0x65, 0x6c, 0x76, 0x20, 0x31, 0x30, 0x20, 0x54, 0x66, 0x0a,
- 0x32, 0x20, 0x32, 0x35, 0x2e, 0x31, 0x30, 0x33, 0x35, 0x20,
- 0x54, 0x64, 0x0a, 0x31, 0x31, 0x2e, 0x35, 0x35, 0x39, 0x39,
- 0x20, 0x54, 0x4c, 0x0a, 0x28, 0x2d, 0x2d, 0x5c, 0x30, 0x34,
- 0x30, 0x44, 0x65, 0x66, 0x61, 0x75, 0x6c, 0x74, 0x5c, 0x30,
- 0x34, 0x30, 0x66, 0x69, 0x65, 0x6c, 0x64, 0x5c, 0x30, 0x34,
- 0x30, 0x76, 0x61, 0x6c, 0x75, 0x65, 0x5c, 0x30, 0x34, 0x30,
- 0x2d, 0x2d, 0x29, 0x20, 0x54, 0x6a, 0x0a, 0x45, 0x54, 0x0a,
- 0x20, 0x51, 0x20, 0x45, 0x4d, 0x43, (byte)0x8a, 0x0d, 0x0a
- };
- PDFEncryption enc = new PDFEncryption();
- ByteArrayOutputStream output = new ByteArrayOutputStream();
- enc.encryptData( 43, 0, key, new ByteArrayInputStream( data ), output );
-
- byte[] encrypted = output.toByteArray();
- printHexString( encrypted );
-
- ByteArrayOutputStream sameAsInput = new ByteArrayOutputStream();
- enc.encryptData( 43, 0, key, new ByteArrayInputStream( encrypted ), sameAsInput );
- byte[] dataAgain = sameAsInput.toByteArray();
- cmpArray( data, dataAgain );
- }
-
- /**
- * This will compare a couple of arrays and fail if they do not match.
- *
- * @param firstArray The first array.
- * @param secondArray The second array.
- */
- private void cmpArray( byte[] firstArray, byte[] secondArray )
- {
- if( firstArray.length != secondArray.length )
- {
- fail( "The array lengths do not match for " +
- ", firstArray length was: " + firstArray.length +
- ", secondArray length was: " + secondArray.length);
- }
-
- for( int i=0; i<firstArray.length; i++ )
- {
- if( firstArray[i] != secondArray[i] )
- {
- fail( "Array data does not match " );
- }
- }
- }
-
- /**
- * This will print a byte array as a hex string to standard output.
- *
- * @param data The array to print.
- */
- private void printHexString( byte[] data )
- {
- for( int i=0; i<data.length; i++ )
- {
- int nextByte = (data[i] + 256)%256;
- String hexString = Integer.toHexString( nextByte );
- if( hexString.length() < 2 )
- {
- hexString = "0" + hexString;
- }
- System.out.print( hexString );
- if( i != 0 && (i+1) % 2 == 0 )
- {
- System.out.print( " " );
- }
- else if( i!= 0 &&i % 20 == 0 )
- {
- System.out.println();
- }
- }
- System.out.println();
- }
-} \ No newline at end of file
diff --git a/src/main/java/test/pdfbox/encryption/package.html b/src/main/java/test/pdfbox/encryption/package.html
deleted file mode 100644
index 1dcaad7..0000000
--- a/src/main/java/test/pdfbox/encryption/package.html
+++ /dev/null
@@ -1,9 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 3.2 Final//EN">
-<html>
-<head>
-
-</head>
-<body>
-These classes will be used to test the various encryption algorithms that are used in PDFBox.
-</body>
-</html>
diff --git a/src/main/java/test/pdfbox/filter/TestFilters.java b/src/main/java/test/pdfbox/filter/TestFilters.java
deleted file mode 100644
index db124eb..0000000
--- a/src/main/java/test/pdfbox/filter/TestFilters.java
+++ /dev/null
@@ -1,182 +0,0 @@
-/**
- * Copyright (c) 2003-2004, www.pdfbox.org
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions are met:
- *
- * 1. Redistributions of source code must retain the above copyright notice,
- * this list of conditions and the following disclaimer.
- * 2. Redistributions in binary form must reproduce the above copyright notice,
- * this list of conditions and the following disclaimer in the documentation
- * and/or other materials provided with the distribution.
- * 3. Neither the name of pdfbox; nor the names of its
- * contributors may be used to endorse or promote products derived from this
- * software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
- * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
- * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
- * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
- * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
- * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
- * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * http://www.pdfbox.org
- *
- */
-package test.pdfbox.filter;
-
-import java.io.ByteArrayInputStream;
-import java.io.ByteArrayOutputStream;
-import java.io.IOException;
-import java.io.File;
-import java.io.FileInputStream;
-
-import java.util.Collection;
-import java.util.Iterator;
-
-import junit.framework.Test;
-import junit.framework.TestCase;
-import junit.framework.TestSuite;
-
-import org.apache.log4j.Logger;
-
-import org.pdfbox.cos.COSDictionary;
-
-import org.pdfbox.filter.DCTFilter;
-import org.pdfbox.filter.CCITTFaxDecodeFilter;
-import org.pdfbox.filter.Filter;
-import org.pdfbox.filter.FilterManager;
-import org.pdfbox.filter.RunLengthDecodeFilter;
-
-/**
- * This will test all of the filters in the PDFBox system.
- *
- * @author Ben Litchfield (ben@csh.rit.edu)
- * @version $Revision: 1.5 $
- */
-public class TestFilters extends TestCase
-{
- private static Logger log = Logger.getLogger(TestFilters.class);
-
- private static final int BUFFER_SIZE = 2048;
- private static final COSDictionary EMPTY_DICTIONARY = new COSDictionary();
-
- /**
- * Constructor.
- *
- * @param name The name of the test to run.
- */
- public TestFilters( String name )
- {
- super( name );
- }
-
- /**
- * This will get the suite of test that this class holds.
- *
- * @return All of the tests that this class holds.
- */
- public static Test suite()
- {
- return new TestSuite( TestFilters.class );
- }
-
- /**
- * This will test all of the filters in the system.
- *
- * @throws IOException If there is an exception while encoding.
- */
- public void testFilters() throws IOException
- {
- FilterManager manager = new FilterManager();
- Collection filters = manager.getFilters();
-
- Iterator filterIter = filters.iterator();
- while( filterIter.hasNext() )
- {
- long start = System.currentTimeMillis();
- Filter filter = (Filter)filterIter.next();
- if( !(filter instanceof DCTFilter ||
- filter instanceof CCITTFaxDecodeFilter ||
- filter instanceof RunLengthDecodeFilter))
- {
- checkFilter( new File( "classes" ), filter );
- long stop = System.currentTimeMillis();
- System.out.println( "Time for filter " + filter.getClass().getName() + "=" + (stop-start) );
- }
- }
- }
-
- /**
- * This will check the filter.
- *
- * @param file The file or directory to test.
- * @param filter The filter to check.
- *
- * @throws IOException If there is an exception while encoding.
- */
- private void checkFilter( File file, Filter filter ) throws IOException
- {
- if( file.isDirectory() )
- {
- File[] subFiles = file.listFiles();
- for( int i=0; i<subFiles.length; i++ )
- {
- checkFilter( subFiles[i], filter );
- }
- }
- else
- {
- log.debug("Checking filter: " + filter + ", with file: " + file.getAbsolutePath());
- ByteArrayOutputStream output = new ByteArrayOutputStream();
-
- ByteArrayOutputStream encoded = new ByteArrayOutputStream();
- ByteArrayOutputStream decoded = new ByteArrayOutputStream();
- FileInputStream fin = new FileInputStream( file );
- int amountRead = 0;
- byte[] buffer = new byte[ BUFFER_SIZE ];
- while( (amountRead = fin.read( buffer, 0, BUFFER_SIZE )) != -1 )
- {
- output.write( buffer, 0, amountRead );
- }
- fin.close();
- byte[] original = output.toByteArray();
- filter.encode( new ByteArrayInputStream( original ), encoded, EMPTY_DICTIONARY );
- filter.decode( new ByteArrayInputStream( encoded.toByteArray() ), decoded, EMPTY_DICTIONARY );
-
- cmpArray( original, decoded.toByteArray(), filter, file );
- }
- }
-
- /**
- * This will compare a couple of arrays and fail if they do not match.
- *
- * @param firstArray The first array.
- * @param secondArray The second array.
- * @param filter The filter that did the encoding.
- * @param file The file that was encoded.
- */
- private void cmpArray( byte[] firstArray, byte[] secondArray, Filter filter, File file )
- {
- String fileMsg = filter.getClass().getName() + " " + file.getAbsolutePath();
- if( firstArray.length != secondArray.length )
- {
- fail( "The array lengths do not match for " + fileMsg +
- ", firstArray length was: " + firstArray.length +
- ", secondArray length was: " + secondArray.length);
- }
-
- for( int i=0; i<firstArray.length; i++ )
- {
- if( firstArray[i] != secondArray[i] )
- {
- fail( "Array data does not match " + fileMsg );
- }
- }
- }
-} \ No newline at end of file
diff --git a/src/main/java/test/pdfbox/filter/package.html b/src/main/java/test/pdfbox/filter/package.html
deleted file mode 100644
index 41556d1..0000000
--- a/src/main/java/test/pdfbox/filter/package.html
+++ /dev/null
@@ -1,9 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 3.2 Final//EN">
-<html>
-<head>
-
-</head>
-<body>
-These classes will be used to test the various filters that are available with PDFBox.
-</body>
-</html>
diff --git a/src/main/java/test/pdfbox/package.html b/src/main/java/test/pdfbox/package.html
deleted file mode 100644
index 2d5d590..0000000
--- a/src/main/java/test/pdfbox/package.html
+++ /dev/null
@@ -1,9 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 3.2 Final//EN">
-<html>
-<head>
-
-</head>
-<body>
-This holds classes that will be used to test all of PDFBox.
-</body>
-</html>
diff --git a/src/main/java/test/pdfbox/pdfparser/TestPDFParser.java b/src/main/java/test/pdfbox/pdfparser/TestPDFParser.java
deleted file mode 100644
index e935af3..0000000
--- a/src/main/java/test/pdfbox/pdfparser/TestPDFParser.java
+++ /dev/null
@@ -1,126 +0,0 @@
-/**
- * Copyright (c) 2005, www.pdfbox.org
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions are met:
- *
- * 1. Redistributions of source code must retain the above copyright notice,
- * this list of conditions and the following disclaimer.
- * 2. Redistributions in binary form must reproduce the above copyright notice,
- * this list of conditions and the following disclaimer in the documentation
- * and/or other materials provided with the distribution.
- * 3. Neither the name of pdfbox; nor the names of its
- * contributors may be used to endorse or promote products derived from this
- * software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
- * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
- * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
- * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
- * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
- * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
- * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * http://www.pdfbox.org
- *
- */
-package test.pdfbox.pdfparser;
-
-import java.io.ByteArrayInputStream;
-import java.io.IOException;
-import java.io.InputStream;
-
-import junit.framework.Test;
-import junit.framework.TestCase;
-import junit.framework.TestSuite;
-
-import org.pdfbox.cos.COSName;
-
-import org.pdfbox.pdfparser.BaseParser;
-
-
-/**
- * This will test the PDF parsing in PDFBox.
- *
- * @author Ben Litchfield (ben@benlitchfield.com)
- * @version $Revision: 1.1 $
- */
-public class TestPDFParser extends TestCase
-{
- //private static Logger log = Logger.getLogger(TestFDF.class);
-
- /**
- * Constructor.
- *
- * @param name The name of the test to run.
- */
- public TestPDFParser( String name )
- {
- super( name );
- }
-
- /**
- * This will get the suite of test that this class holds.
- *
- * @return All of the tests that this class holds.
- */
- public static Test suite()
- {
- return new TestSuite( TestPDFParser.class );
- }
-
- /**
- * infamous main method.
- *
- * @param args The command line arguments.
- */
- public static void main( String[] args )
- {
- String[] arg = {TestPDFParser.class.getName() };
- junit.textui.TestRunner.main( arg );
- }
-
- /**
- * This will test some cos name parsing.
- *
- * @throws Exception If there is an exception while parsing.
- */
- public void testCOSName() throws Exception
- {
- TestParser parser = new TestParser(new ByteArrayInputStream( "/PANTONE#20116#20CV".getBytes() ) );
- COSName name = parser.parseCOSName();
- assertTrue("Failed to parse COSName",name.getName().equals( "PANTONE 116 CV" ));
-
- }
-
- /**
- * A simple class used to test parsing of the cos name.
- */
- private class TestParser extends BaseParser
- {
- /**
- * Constructor.
- * @param input The input stream.
- * @throws IOException If there is an error during parsing.
- */
- public TestParser( InputStream input) throws IOException
- {
- super( input );
- }
-
- /**
- * Expose the parseCOSName as public.
- *
- * @return The parsed cos name.
- * @throws IOException If there is an error parsing the COSName.
- */
- public COSName parseCOSName() throws IOException
- {
- return super.parseCOSName();
- }
- }
-} \ No newline at end of file
diff --git a/src/main/java/test/pdfbox/pdfparser/package.html b/src/main/java/test/pdfbox/pdfparser/package.html
deleted file mode 100644
index d723694..0000000
--- a/src/main/java/test/pdfbox/pdfparser/package.html
+++ /dev/null
@@ -1,9 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 3.2 Final//EN">
-<html>
-<head>
-
-</head>
-<body>
-This holds classes that will be used to test the pdf parsing classes.
-</body>
-</html>
diff --git a/src/main/java/test/pdfbox/pdmodel/TestFDF.java b/src/main/java/test/pdfbox/pdmodel/TestFDF.java
deleted file mode 100644
index d17ed11..0000000
--- a/src/main/java/test/pdfbox/pdmodel/TestFDF.java
+++ /dev/null
@@ -1,292 +0,0 @@
-/**
- * Copyright (c) 2005, www.pdfbox.org
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions are met:
- *
- * 1. Redistributions of source code must retain the above copyright notice,
- * this list of conditions and the following disclaimer.
- * 2. Redistributions in binary form must reproduce the above copyright notice,
- * this list of conditions and the following disclaimer in the documentation
- * and/or other materials provided with the distribution.
- * 3. Neither the name of pdfbox; nor the names of its
- * contributors may be used to endorse or promote products derived from this
- * software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
- * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
- * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
- * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
- * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
- * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
- * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * http://www.pdfbox.org
- *
- */
-package test.pdfbox.pdmodel;
-
-import java.io.ByteArrayInputStream;
-import java.io.IOException;
-import java.util.List;
-import java.util.Map;
-
-import junit.framework.Test;
-import junit.framework.TestCase;
-import junit.framework.TestSuite;
-
-import org.pdfbox.cos.COSStream;
-import org.pdfbox.cos.COSString;
-import org.pdfbox.pdfparser.PDFStreamParser;
-import org.pdfbox.pdmodel.PDDocument;
-import org.pdfbox.pdmodel.fdf.FDFDocument;
-import org.pdfbox.pdmodel.interactive.annotation.PDAppearanceStream;
-import org.pdfbox.pdmodel.interactive.annotation.PDAnnotationWidget;
-import org.pdfbox.pdmodel.interactive.form.PDAcroForm;
-import org.pdfbox.pdmodel.interactive.form.PDField;
-import org.pdfbox.pdmodel.interactive.form.PDRadioCollection;
-import org.pdfbox.pdmodel.interactive.form.PDTextbox;
-
-/**
- * This will test the FDF algorithms in PDFBox.
- *
- * @author Ben Litchfield (ben@csh.rit.edu)
- * @version $Revision: 1.5 $
- */
-public class TestFDF extends TestCase
-{
- //private static Logger log = Logger.getLogger(TestFDF.class);
-
- /**
- * Constructor.
- *
- * @param name The name of the test to run.
- */
- public TestFDF( String name )
- {
- super( name );
- }
-
- /**
- * This will get the suite of test that this class holds.
- *
- * @return All of the tests that this class holds.
- */
- public static Test suite()
- {
- return new TestSuite( TestFDF.class );
- }
-
- /**
- * infamous main method.
- *
- * @param args The command line arguments.
- */
- public static void main( String[] args )
- {
- String[] arg = {TestFDF.class.getName() };
- junit.textui.TestRunner.main( arg );
- }
-
- /**
- * This will test some simple field setting.
- *
- * @throws Exception If there is an exception while encrypting.
- */
- public void testFDFfdeb() throws Exception
- {
- PDDocument fdeb = null;
- try
- {
- fdeb = PDDocument.load( "test/input/fdeb.pdf" );
- PDAcroForm form = fdeb.getDocumentCatalog().getAcroForm();
- PDTextbox field = (PDTextbox)form.getField( "f67_1" );
- field.setValue( "2" );
-
- String expected =
- "/Tx BMC " +
- "BT " +
- "/Helv 9 Tf " +
- " 0 g " +
- " 2 1.985585 Td " +
- "2.07698 0 Td " +
- "(2) Tj " +
- "ET " +
- "EMC";
-
- testContentStreams( fdeb, field, expected );
- }
- finally
- {
- fdeb.close();
- }
-
- }
-
- /**
- * This will test a pdf with lots of fields.
- *
- * @throws Exception If there is an exception while encrypting.
- */
- public void testFDFPDFWithLotsOfFields() throws Exception
- {
- PDDocument fdeb = null;
- try
- {
- fdeb = PDDocument.load( "test/input/pdf_with_lots_of_fields.pdf" );
- PDAcroForm form = fdeb.getDocumentCatalog().getAcroForm();
- PDTextbox feld2 = (PDTextbox)form.getField( "Feld.2" );
- feld2.setValue( "Benjamin" );
-
- String expected =
- "1 1 0.8000000119 rg " +
- " 0 0 127.5 19.8299999237 re " +
- " f " +
- " 0 0 0 RG " +
- " 1 w " +
- " 0.5 0.5 126.5 18.8299999237 re " +
- " S " +
- " 0.5 g " +
- " 1 1 m " +
- " 1 18.8299999237 l " +
- " 126.5 18.8299999237 l " +
- " 125.5 17.8299999237 l " +
- " 2 17.8299999237 l " +
- " 2 2 l " +
- " 1 1 l " +
- " f " +
- " 0.75 g " +
- " 1 1 m " +
- " 126.5 1 l " +
- " 126.5 18.8299999237 l " +
- " 125.5 17.8299999237 l " +
- " 125.5 2 l " +
- " 2 2 l " +
- " 1 1 l " +
- " f " +
- " /Tx BMC " +
- "BT " +
- "/Helv 14 Tf " +
- " 0 0 0 rg " +
- " 4 4.721 Td " +
- "(Benjamin) Tj " +
- "ET " +
- "EMC";
-
- testContentStreams( fdeb, feld2, expected );
-
- PDRadioCollection feld3 = (PDRadioCollection)form.getField( "Feld.3" );
- feld3.setValue("RB1");
- assertEquals( "RB1", feld3.getValue() );
- //assertEquals( ((PDCheckbox)feld3.getKids().get( 0 )).getValue(), "RB1" );
-
- }
- finally
- {
- fdeb.close();
- }
- }
-
- /**
- * This will test the Freedom pdf.
- *
- * @throws Exception If there is an error while testing.
- */
- public void testFDFFreedomExpressions() throws Exception
- {
- PDDocument freedom = null;
- FDFDocument fdf = null;
- try
- {
- freedom = PDDocument.load( "test/input/FreedomExpressions.pdf" );
- fdf = FDFDocument.load( "test/input/FreedomExpressions.fdf" );
- PDAcroForm form = freedom.getDocumentCatalog().getAcroForm();
- form.importFDF( fdf );
- PDTextbox feld2 = (PDTextbox)form.getField( "eeFirstName" );
- List kids = feld2.getKids();
- PDField firstKid = (PDField)kids.get( 0 );
- PDField secondKid = (PDField)kids.get( 1 );
- testContentStreamContains( freedom, firstKid, "Steve" );
- testContentStreamContains( freedom, secondKid, "Steve" );
-
- //the appearance stream is suppose to be null because there
- //is an F action in the AA dictionary that populates that field.
- PDField totalAmt = form.getField( "eeSuppTotalAmt" );
- assertTrue( totalAmt.getDictionary().getDictionaryObject( "AP" ) == null );
-
- }
- finally
- {
- if( freedom != null )
- {
- freedom.close();
- }
- if( fdf != null )
- {
- fdf.close();
- }
- }
- }
-
- private void testContentStreamContains( PDDocument doc, PDField field, String expected ) throws Exception
- {
- PDAnnotationWidget widget = field.getWidget();
- Map normalAppearance = widget.getAppearance().getNormalAppearance();
- PDAppearanceStream appearanceStream = (PDAppearanceStream)normalAppearance.get( "default" );
- COSStream actual = appearanceStream.getStream();
-
- List actualTokens = getStreamTokens( doc, actual );
- assertTrue( actualTokens.contains( new COSString( expected ) ) );
- }
-
- private void testContentStreams( PDDocument doc, PDField field, String expected ) throws Exception
- {
- PDAnnotationWidget widget = field.getWidget();
- Map normalAppearance = widget.getAppearance().getNormalAppearance();
- PDAppearanceStream appearanceStream = (PDAppearanceStream)normalAppearance.get( "default" );
- COSStream actual = appearanceStream.getStream();
-
- List actualTokens = getStreamTokens( doc, actual );
- List expectedTokens = getStreamTokens( doc, expected );
- assertEquals( actualTokens.size(), expectedTokens.size() );
- for( int i=0; i<actualTokens.size(); i++ )
- {
- Object actualToken = actualTokens.get( i );
- Object expectedToken = expectedTokens.get( i );
- assertEquals( actualToken, expectedToken );
- }
- }
-
- private List getStreamTokens( PDDocument doc, String string ) throws IOException
- {
- PDFStreamParser parser;
-
- List tokens = null;
- if( string != null )
- {
- ByteArrayInputStream stream = new ByteArrayInputStream( string.getBytes() );
- parser = new PDFStreamParser( stream, doc.getDocument().getScratchFile() );
- parser.parse();
- tokens = parser.getTokens();
- }
- return tokens;
- }
-
- private List getStreamTokens( PDDocument doc, COSStream stream ) throws IOException
- {
- PDFStreamParser parser;
-
- List tokens = null;
- if( stream != null )
- {
- parser = new PDFStreamParser( stream );
- parser.parse();
- tokens = parser.getTokens();
- }
- return tokens;
- }
-} \ No newline at end of file
diff --git a/src/main/java/test/pdfbox/pdmodel/interactive/form/TestFields.java b/src/main/java/test/pdfbox/pdmodel/interactive/form/TestFields.java
deleted file mode 100644
index 8453fbc..0000000
--- a/src/main/java/test/pdfbox/pdmodel/interactive/form/TestFields.java
+++ /dev/null
@@ -1,144 +0,0 @@
-/**
- * Copyright (c) 2005, www.pdfbox.org
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions are met:
- *
- * 1. Redistributions of source code must retain the above copyright notice,
- * this list of conditions and the following disclaimer.
- * 2. Redistributions in binary form must reproduce the above copyright notice,
- * this list of conditions and the following disclaimer in the documentation
- * and/or other materials provided with the distribution.
- * 3. Neither the name of pdfbox; nor the names of its
- * contributors may be used to endorse or promote products derived from this
- * software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
- * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
- * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
- * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
- * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
- * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
- * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * http://www.pdfbox.org
- *
- */
-package test.pdfbox.pdmodel.interactive.form;
-
-import java.io.IOException;
-
-import junit.framework.Test;
-import junit.framework.TestCase;
-import junit.framework.TestSuite;
-
-import org.pdfbox.pdmodel.PDDocument;
-import org.pdfbox.pdmodel.interactive.form.PDAcroForm;
-import org.pdfbox.pdmodel.interactive.form.PDTextbox;
-
-/**
- * This will test the form fields in PDFBox.
- *
- * @author Ben Litchfield (ben@benlitchfield.com)
- * @version $Revision: 1.3 $
- */
-public class TestFields extends TestCase
-{
- //private static Logger log = Logger.getLogger(TestFDF.class);
-
- /**
- * Constructor.
- *
- * @param name The name of the test to run.
- */
- public TestFields( String name )
- {
- super( name );
- }
-
- /**
- * This will get the suite of test that this class holds.
- *
- * @return All of the tests that this class holds.
- */
- public static Test suite()
- {
- return new TestSuite( TestFields.class );
- }
-
- /**
- * infamous main method.
- *
- * @param args The command line arguments.
- */
- public static void main( String[] args )
- {
- String[] arg = {TestFields.class.getName() };
- junit.textui.TestRunner.main( arg );
- }
-
- /**
- * This will test setting field flags on the PDField.
- *
- * @throws IOException If there is an error creating the field.
- */
- public void testFlags() throws IOException
- {
- PDDocument doc = null;
- try
- {
- doc = new PDDocument();
- PDAcroForm form = new PDAcroForm( doc );
- PDTextbox textBox = new PDTextbox(form);
-
- //assert that default is false.
- assertFalse( textBox.shouldComb() );
-
- //try setting and clearing a single field
- textBox.setComb( true );
- assertTrue( textBox.shouldComb() );
- textBox.setComb( false );
- assertFalse( textBox.shouldComb() );
-
- //try setting and clearing multiple fields
- textBox.setComb( true );
- textBox.setDoNotScroll( true );
- assertTrue( textBox.shouldComb() );
- assertTrue( textBox.doNotScroll() );
-
- textBox.setComb( false );
- textBox.setDoNotScroll( false );
- assertFalse( textBox.shouldComb() );
- assertFalse( textBox.doNotScroll() );
-
- //assert that setting a field to false multiple times works
- textBox.setComb( false );
- assertFalse( textBox.shouldComb() );
- textBox.setComb( false );
- assertFalse( textBox.shouldComb() );
-
- //assert that setting a field to true multiple times works
- textBox.setComb( true );
- assertTrue( textBox.shouldComb() );
- textBox.setComb( true );
- assertTrue( textBox.shouldComb() );
-
-
-
-
-
- }
- finally
- {
- if( doc != null )
- {
- doc.close();
- }
- }
- }
-
-} \ No newline at end of file
diff --git a/src/main/java/test/pdfbox/pdmodel/interactive/form/package.html b/src/main/java/test/pdfbox/pdmodel/interactive/form/package.html
deleted file mode 100644
index d6c2f8c..0000000
--- a/src/main/java/test/pdfbox/pdmodel/interactive/form/package.html
+++ /dev/null
@@ -1,9 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 3.2 Final//EN">
-<html>
-<head>
-
-</head>
-<body>
-This holds classes that will be used to test pdmodel form classes.
-</body>
-</html>
diff --git a/src/main/java/test/pdfbox/pdmodel/package.html b/src/main/java/test/pdfbox/pdmodel/package.html
deleted file mode 100644
index 7cb4cde..0000000
--- a/src/main/java/test/pdfbox/pdmodel/package.html
+++ /dev/null
@@ -1,9 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 3.2 Final//EN">
-<html>
-<head>
-
-</head>
-<body>
-This holds classes that will be used to test pdmodel classes.
-</body>
-</html>
diff --git a/src/main/java/test/pdfbox/util/TestTextStripper.java b/src/main/java/test/pdfbox/util/TestTextStripper.java
deleted file mode 100644
index c425f38..0000000
--- a/src/main/java/test/pdfbox/util/TestTextStripper.java
+++ /dev/null
@@ -1,371 +0,0 @@
-/**
- * Copyright (c) 2003-2005, www.pdfbox.org
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions are met:
- *
- * 1. Redistributions of source code must retain the above copyright notice,
- * this list of conditions and the following disclaimer.
- * 2. Redistributions in binary form must reproduce the above copyright notice,
- * this list of conditions and the following disclaimer in the documentation
- * and/or other materials provided with the distribution.
- * 3. Neither the name of pdfbox; nor the names of its
- * contributors may be used to endorse or promote products derived from this
- * software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
- * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
- * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
- * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
- * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
- * ANY THEORY OF LIABILIT, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
- * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * http://www.pdfbox.org
- */
-package test.pdfbox.util;
-
-import java.io.File;
-import java.io.FileInputStream;
-import java.io.FilenameFilter;
-import java.io.FileOutputStream;
-import java.io.IOException;
-import java.io.InputStreamReader;
-import java.io.LineNumberReader;
-import java.io.OutputStream;
-import java.io.OutputStreamWriter;
-import java.io.Writer;
-
-import junit.framework.Test;
-import junit.framework.TestCase;
-import junit.framework.TestSuite;
-
-import org.apache.log4j.Logger;
-import org.apache.log4j.Level;
-
-import org.pdfbox.pdmodel.PDDocument;
-
-import org.pdfbox.util.PDFTextStripper;
-
-/**
- * Test suite for PDFTextStripper.
- *
- * FILE SET VALIDATION
- *
- * This test suite is designed to test PDFTextStripper using a set of PDF
- * files and known good output for each. The default mode of testAll()
- * is to process each *.pdf file in "test/input". An output file is
- * created in "test/output" with the same name as the PDF file, plus an
- * additional ".txt" suffix.
- *
- * The output file is then tested against a known good result file from
- * the input directory (again, with the same name as the tested PDF file,
- * but with the additional ".txt" suffix).
- *
- * So for the file "test/input/hello.pdf", an output file will be generated
- * named "test/output/hello.pdf.txt". Then that file will be compared to
- * the known good file "test/input/hello.pdf.txt", if it exists.
- *
- * Any errors are logged, and at the end of processing all *.pdf files, if
- * there were any errors, the test fails. The logging is at INFO, as the
- * general goal is overall validation, and on failure, the indication of
- * which file or files failed.
- *
- * When processing new PDF files, you may use testAll() to generate output,
- * verify the output manually, then move the output file to the test input
- * directory to use as the basis for future validations.
- *
- * SINGLE FILE VALIDATION
- *
- * To further research individual failures, the test.pdfbox.util.TextStripper.file
- * system property may be set with the name of a single file in the "test/input"
- * directory. In this mode, testAll() will evaluate only that file, and will
- * do so with DEBUG level logging. You can set this property from ant by
- * defining "file", as in:
- *
- * ant testextract -Dfile=hello.pdf
- *
- * @author Robert Dickinson (bob@brutesquadlabs.com)
- * @author Ben Litchfield (ben@benlitchfield.com)
- * @version $Revision: 1.14 $
- */
-public class TestTextStripper extends TestCase
-{
- private static Logger log = Logger.getLogger(TestTextStripper.class);
-
- private boolean bFail = false;
- private PDFTextStripper stripper = null;
-
- /**
- * Test class constructor.
- *
- * @param name The name of the test class.
- *
- * @throws IOException If there is an error creating the test.
- */
- public TestTextStripper( String name ) throws IOException
- {
- super( name );
- stripper = new PDFTextStripper();
- stripper.setLineSeparator("\n");
- }
-
- /**
- * Test suite setup.
- */
- public void setUp()
- {
- // If you want to test a single file using DEBUG logging, from an IDE,
- // you can do something like this:
- //
- // System.setProperty("test.pdfbox.util.TextStripper.file", "FVS318Ref.pdf");
- }
-
- /**
- * Determine whether two strings are equal, where two null strings are
- * considered equal.
- *
- * @param expected Excpected string
- * @param actual Actual String
- * @return <code>true</code> is the strings are both null,
- * or if their contents are the same, otherwise <code>false</code>.
- */
- private boolean stringsEqual(String expected, String actual)
- {
- boolean equals = true;
- if( (expected == null) && (actual == null) )
- {
- return true;
- }
- else if( expected != null && actual != null )
- {
- expected = expected.trim();
- actual = actual.trim();
- char[] expectedArray = expected.toCharArray();
- char[] actualArray = actual.toCharArray();
- int expectedIndex = 0;
- int actualIndex = 0;
- while( expectedIndex<expectedArray.length && actualIndex<actualArray.length )
- {
- if( expectedArray[expectedIndex] != actualArray[actualIndex] )
- {
- equals = false;
- log.error("Lines differ at index"
- + " expected:" + expectedIndex + "-" + (int)expectedArray[expectedIndex]
- + " actual:" + actualIndex + "-" + (int)actualArray[actualIndex] );
- break;
- }
- expectedIndex = skipWhitespace( expectedArray, expectedIndex );
- actualIndex = skipWhitespace( actualArray, actualIndex );
- expectedIndex++;
- actualIndex++;
- }
- if( equals )
- {
- if( expectedIndex != expectedArray.length )
- {
- equals = false;
- log.error("Expected line is longer at:" + expectedIndex );
- }
- if( actualIndex != actualArray.length )
- {
- equals = false;
- log.error("Actual line is longer at:" + actualIndex );
- }
- }
- }
- else if( ( expected == null && actual != null && actual.trim().equals( "" ) ) ||
- ( actual == null && expected != null && expected.trim().equals( "" ) ) )
- {
- //basically there are some cases where pdfbox will put an extra line
- //at the end of the file, who cares, this is not enough to report
- // a failure
- equals = true;
- }
- else
- {
- equals = false;
- }
- return equals;
- }
-
- /**
- * If the current index is whitespace then skip any subsequent whitespace.
- */
- private int skipWhitespace( char[] array, int index )
- {
- //if we are at a space character then skip all space
- //characters, but when all done rollback 1 because stringsEqual
- //will roll forward 1
- if( array[index] == ' ' || array[index] > 256 )
- {
- while( index < array.length && (array[index] == ' ' || array[index] > 256))
- {
- index++;
- }
- index--;
- }
- return index;
- }
-
- /**
- * Validate text extraction on a single file.
- *
- * @param file The file to validate
- * @param bLogResult Whether to log the extracted text
- * @throws Exception when there is an exception
- */
- public void doTestFile(File file, boolean bLogResult)
- throws Exception
- {
- log.info("Preparing to parse " + file.getName());
-
-
- OutputStream os = null;
- Writer writer = null;
- PDDocument document = null;
- try
- {
- document = PDDocument.load(file);
-
- File outFile = new File(file.getParentFile().getParentFile(), "output/" + file.getName() + ".txt");
- os = new FileOutputStream(outFile);
- os.write( 0xFF );
- os.write( 0xFE );
- writer = new OutputStreamWriter(os,"UTF-16LE");
-
- stripper.writeText(document, writer);
-
-
-
- if (bLogResult)
- {
- log.info("Text for " + file.getName() + ":\r\n" + stripper.getText(document));
- }
-
- File expectedFile = new File(file.getParentFile().getParentFile(), "input/" + file.getName() + ".txt");
- File actualFile = new File(file.getParentFile().getParentFile(), "output/" + file.getName() + ".txt");
-
- if (!expectedFile.exists())
- {
- this.bFail = true;
- log.error("FAILURE: Input verification file: " + expectedFile.getAbsolutePath() + " did not exist");
- return;
- }
-
- LineNumberReader expectedReader =
- new LineNumberReader(new InputStreamReader(new FileInputStream(expectedFile),"UTF-16"));
- LineNumberReader actualReader =
- new LineNumberReader(new InputStreamReader(new FileInputStream(actualFile), "UTF-16"));
-
- while (true)
- {
- String expectedLine = expectedReader.readLine();
- while( expectedLine != null && expectedLine.trim().length() == 0 )
- {
- expectedLine = expectedReader.readLine();
- }
- String actualLine = actualReader.readLine();
- while( actualLine != null && actualLine.trim().length() == 0 )
- {
- actualLine = actualReader.readLine();
- }
- if (!stringsEqual(expectedLine, actualLine))
- {
- this.bFail = true;
- log.error("FAILURE: Line mismatch for file " + file.getName() +
- " at expected line: " + expectedReader.getLineNumber() +
- " at actual line: " + actualReader.getLineNumber() +
- "\r\n expected line was: \"" + expectedLine + "\"" +
- "\r\n actual line was: \"" + actualLine + "\"");
- //lets report all lines, even though this might produce some verbose logging
- //break;
- }
-
- if( expectedLine == null || actualLine==null)
- {
- break;
- }
- }
- }
- finally
- {
- if( writer != null )
- {
- writer.close();
- }
- if( os != null )
- {
- os.close();
- }
- if( document != null )
- {
- document.close();
- }
- }
- }
-
- /**
- * Test to validate text extraction of file set.
- *
- * @throws Exception when there is an exception
- */
- public void testExtract()
- throws Exception
- {
- String filename = System.getProperty("test.pdfbox.util.TextStripper.file");
- File testDir = new File("test/input");
-
- if ((filename == null) || (filename.length() == 0))
- {
- Logger.getRootLogger().setLevel( Level.INFO );
-
- File[] testFiles = testDir.listFiles(new FilenameFilter()
- {
- public boolean accept(File dir, String name)
- {
- return (name.endsWith(".pdf"));
- }
- });
-
- for (int n = 0; n < testFiles.length; n++)
- {
- doTestFile(testFiles[n], false);
- }
- }
- else
- {
- doTestFile(new File(testDir, filename), true);
- }
-
- if (this.bFail)
- {
- fail("One or more failures, see test log for details");
- }
- }
-
- /**
- * Set the tests in the suite for this test class.
- *
- * @return the Suite.
- */
- public static Test suite()
- {
- return new TestSuite( TestTextStripper.class );
- }
-
- /**
- * Command line execution.
- *
- * @param args Command line arguments.
- */
- public static void main( String[] args )
- {
- String[] arg = {TestTextStripper.class.getName() };
- junit.textui.TestRunner.main( arg );
- }
-} \ No newline at end of file
diff --git a/src/main/java/test/pdfbox/util/TestTextStripperPerformance.java b/src/main/java/test/pdfbox/util/TestTextStripperPerformance.java
deleted file mode 100644
index 0aadb30..0000000
--- a/src/main/java/test/pdfbox/util/TestTextStripperPerformance.java
+++ /dev/null
@@ -1,173 +0,0 @@
-/**
- * Copyright (c) 2003-2004, www.pdfbox.org
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions are met:
- *
- * 1. Redistributions of source code must retain the above copyright notice,
- * this list of conditions and the following disclaimer.
- * 2. Redistributions in binary form must reproduce the above copyright notice,
- * this list of conditions and the following disclaimer in the documentation
- * and/or other materials provided with the distribution.
- * 3. Neither the name of pdfbox; nor the names of its
- * contributors may be used to endorse or promote products derived from this
- * software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
- * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
- * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
- * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
- * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
- * ANY THEORY OF LIABILIT, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
- * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * http://www.pdfbox.org
- */
-package test.pdfbox.util;
-
-import java.io.File;
-import java.io.FilenameFilter;
-import java.io.FileOutputStream;
-import java.io.OutputStream;
-import java.io.OutputStreamWriter;
-import java.io.Writer;
-
-import junit.framework.Test;
-import junit.framework.TestCase;
-import junit.framework.TestSuite;
-
-import org.apache.log4j.Logger;
-
-import org.pdfbox.pdmodel.PDDocument;
-
-import org.pdfbox.util.PDFTextStripper;
-
-/**
- * Test the performance of the PDF text stripper utility.
- *
- * @author Ben Litchfield (ben@csh.rit.edu)
- * @version $Revision: 1.2 $
- */
-public class TestTextStripperPerformance extends TestCase
-{
- private static Logger log = Logger.getLogger(TestTextStripperPerformance.class);
-
- private boolean bFail = false;
-
- /**
- * Test class constructor.
- *
- * @param name The name of the test class.
- */
- public TestTextStripperPerformance( String name )
- {
- super( name );
- }
-
- /**
- * Test suite setup.
- */
- public void setUp()
- {
- }
-
-
- /**
- * Validate text extraction on a single file.
- *
- * @param file The file to validate
- * @param bLogResult Whether to log the extracted text
- * @throws Exception when there is an exception
- */
- public void doTestFile(File file, boolean bLogResult)
- throws Exception
- {
-
- PDFTextStripper stripper = new PDFTextStripper();
- OutputStream os = null;
- Writer writer = null;
- PDDocument document = null;
- try
- {
- document = PDDocument.load(file);
-
- File outFile = new File(file.getParentFile().getParentFile(), "output/" + file.getName() + ".txt");
- os = new FileOutputStream(outFile);
- writer = new OutputStreamWriter(os);
-
- stripper.writeText(document, writer);
- }
- finally
- {
- if( writer != null )
- {
- writer.close();
- }
- if( os != null )
- {
- os.close();
- }
- if( document != null )
- {
- document.close();
- }
- }
- }
-
- /**
- * Test to validate text extraction of file set.
- *
- * @throws Exception when there is an exception
- */
- public void testExtract()
- throws Exception
- {
- String filename = System.getProperty("test.pdfbox.util.TextStripper.file");
- File testDir = new File("test/input");
-
- if ((filename == null) || (filename.length() == 0))
- {
- File[] testFiles = testDir.listFiles(new FilenameFilter()
- {
- public boolean accept(File dir, String name)
- {
- return (name.endsWith(".pdf"));
- }
- });
-
- for (int n = 0; n < testFiles.length; n++)
- {
- doTestFile(testFiles[n], false);
- }
- }
- else
- {
- //doTestFile(new File(testDir, filename), true);
- }
- }
-
- /**
- * Set the tests in the suite for this test class.
- *
- * @return the Suite.
- */
- public static Test suite()
- {
- return new TestSuite( TestTextStripperPerformance.class );
- }
-
- /**
- * Command line execution.
- *
- * @param args Command line arguments.
- */
- public static void main( String[] args )
- {
- String[] arg = {TestTextStripperPerformance.class.getName() };
- junit.textui.TestRunner.main( arg );
- }
-} \ No newline at end of file
diff --git a/src/main/java/test/pdfbox/util/package.html b/src/main/java/test/pdfbox/util/package.html
deleted file mode 100644
index 8d98577..0000000
--- a/src/main/java/test/pdfbox/util/package.html
+++ /dev/null
@@ -1,9 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 3.2 Final//EN">
-<html>
-<head>
-
-</head>
-<body>
-These classes will be used to test the text extraction capabilities that are available with PDFBox.
-</body>
-</html>