From 2226daf4acb2bd6f5a81406df91f53522245cde7 Mon Sep 17 00:00:00 2001
From: ferbas
Date: Thu, 19 Nov 2009 14:14:49 +0000
Subject: added non text oject info

git-svn-id: https://joinup.ec.europa.eu/svn/pdf-as/trunk@439 7b5415b0-85f9-ee4d-85bd-d5d0c3b42d1c
---
 src/main/java/at/knowcenter/wag/egov/egiz/PdfAS.java | 11 +++++++++++
 1 file changed, 11 insertions(+)

(limited to 'src/main/java')

diff --git a/src/main/java/at/knowcenter/wag/egov/egiz/PdfAS.java b/src/main/java/at/knowcenter/wag/egov/egiz/PdfAS.java
index 1340f4d..621b96f 100644
--- a/src/main/java/at/knowcenter/wag/egov/egiz/PdfAS.java
+++ b/src/main/java/at/knowcenter/wag/egov/egiz/PdfAS.java
@@ -32,6 +32,7 @@ import org.apache.commons.logging.Log;
 import org.apache.commons.logging.LogFactory;
 
 import at.gv.egiz.pdfas.algorithmSuite.AlgorithmSuiteUtil;
+import at.gv.egiz.pdfas.api.analyze.NonTextObjectInfo;
 import at.gv.egiz.pdfas.api.timestamp.TimeStamper;
 import at.gv.egiz.pdfas.commandline.CommandlineConnectorChooser;
 import at.gv.egiz.pdfas.exceptions.ErrorCode;
@@ -1090,6 +1091,16 @@ public abstract class PdfAS
   // return extractNormalizedTextTextual(pdf, pdf.length);
   // }
 
+  /**
+   *
+   * @param pdfDs
+   * @return List of {@link NonTextObjectInfo}
+   */
+  public static List extractNonTextualObjects(PdfDataSource pdfDs) {
+    return TextualSignature.extractNonTextInfo(pdfDs);
+  }
+
+
   public static String extractNormalizedTextTextual(PdfDataSource pdfDataSource) throws PresentableException
   {
     String raw_document_text = TextualSignature.extractTextTextual(pdfDataSource);
-- 
cgit v1.2.3