1 files changed, 204 insertions, 0 deletions
diff --git a/src/main/java/com/lowagie/text/pdf/PdfContentParser.java b/src/main/java/com/lowagie/text/pdf/PdfContentParser.java
new file mode 100644
index 0000000..af731bc
--- /dev/null
+++ b/src/main/java/com/lowagie/text/pdf/PdfContentParser.java
@@ -0,0 +1,204 @@
+/*
+ * $Id: PdfContentParser.java,v 1.4 2006/05/27 11:11:54 psoares33 Exp $
+ *
+ * Copyright 2005 by Paulo Soares.
+ *
+ * The contents of this file are subject to the Mozilla Public License Version 1.1
+ * (the "License"); you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at http://www.mozilla.org/MPL/
+ *
+ * Software distributed under the License is distributed on an "AS IS" basis,
+ * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
+ * for the specific language governing rights and limitations under the License.
+ *
+ * The Original Code is 'iText, a free JAVA-PDF library'.
+ *
+ * The Initial Developer of the Original Code is Bruno Lowagie. Portions created by
+ * the Initial Developer are Copyright (C) 1999, 2000, 2001, 2002 by Bruno Lowagie.
+ * All Rights Reserved.
+ * Co-Developer of the code is Paulo Soares. Portions created by the Co-Developer
+ * are Copyright (C) 2000, 2001, 2002 by Paulo Soares. All Rights Reserved.
+ *
+ * Contributor(s): all the names of the contributors are added in the source code
+ * where applicable.
+ *
+ * Alternatively, the contents of this file may be used under the terms of the
+ * LGPL license (the "GNU LIBRARY GENERAL PUBLIC LICENSE"), in which case the
+ * provisions of LGPL are applicable instead of those above.  If you wish to
+ * allow use of your version of this file only under the terms of the LGPL
+ * License and not to allow others to use your version of this file under
+ * the MPL, indicate your decision by deleting the provisions above and
+ * replace them with the notice and other provisions required by the LGPL.
+ * If you do not delete the provisions above, a recipient may use your version
+ * of this file under either the MPL or the GNU LIBRARY GENERAL PUBLIC LICENSE.
+ *
+ * This library is free software; you can redistribute it and/or modify it
+ * under the terms of the MPL as stated above or under the terms of the GNU
+ * Library General Public License as published by the Free Software Foundation;
+ * either version 2 of the License, or any later version.
+ *
+ * This library is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ * FOR A PARTICULAR PURPOSE. See the GNU Library general Public License for more
+ * details.
+ *
+ * If you didn't download this code from the following link, you should check if
+ * you aren't using an obsolete version:
+ * http://www.lowagie.com/iText/
+ */
+
+package com.lowagie.text.pdf;
+
+import java.io.IOException;
+import java.util.ArrayList;
+/**
+ * Parses the page or template content.
+ * @author Paulo Soares (psoares@consiste.pt)
+ */
+public class PdfContentParser {
+    
+    /**
+     * Commands have this type.
+     */    
+    public static final int COMMAND_TYPE = 200;
+    /**
+     * Holds value of property tokeniser.
+     */
+    private PRTokeniser tokeniser;    
+    
+    /**
+     * Creates a new instance of PdfContentParser
+     * @param tokeniser the tokeniser with the content
+     */
+    public PdfContentParser(PRTokeniser tokeniser) {
+        this.tokeniser = tokeniser;
+    }
+    
+    /**
+     * Parses a single command from the content. Each command is output as an array of arguments
+     * having the command itself as the last element. The returned array will be empty if the
+     * end of content was reached.
+     * @param ls an <CODE>ArrayList</CODE> to use. It will be cleared before using. If it's
+     * <CODE>null</CODE> will create a new <CODE>ArrayList</CODE>
+     * @return the same <CODE>ArrayList</CODE> given as argument or a new one
+     * @throws IOException on error
+     */    
+    public ArrayList parse(ArrayList ls) throws IOException {
+        if (ls == null)
+            ls = new ArrayList();
+        else
+            ls.clear();
+        PdfObject ob = null;
+        while ((ob = readPRObject()) != null) {
+            ls.add(ob);
+            if (ob.type() == COMMAND_TYPE)
+                break;
+        }
+        return ls;
+    }
+    
+    /**
+     * Gets the tokeniser.
+     * @return the tokeniser.
+     */
+    public PRTokeniser getTokeniser() {
+        return this.tokeniser;
+    }
+    
+    /**
+     * Sets the tokeniser.
+     * @param tokeniser the tokeniser
+     */
+    public void setTokeniser(PRTokeniser tokeniser) {
+        this.tokeniser = tokeniser;
+    }
+    
+    /**
+     * Reads a dictionary. The tokeniser must be positioned past the "&lt;&lt;" token.
+     * @return the dictionary
+     * @throws IOException on error
+     */    
+    public PdfDictionary readDictionary() throws IOException {
+        PdfDictionary dic = new PdfDictionary();
+        while (true) {
+            if (!nextValidToken())
+                throw new IOException("Unexpected end of file.");;
+                if (tokeniser.getTokenType() == PRTokeniser.TK_END_DIC)
+                    break;
+                if (tokeniser.getTokenType() != PRTokeniser.TK_NAME)
+                    throw new IOException("Dictionary key is not a name.");
+                PdfName name = new PdfName(tokeniser.getStringValue(), false);
+                PdfObject obj = readPRObject();
+                int type = obj.type();
+                if (-type == PRTokeniser.TK_END_DIC)
+                    throw new IOException("Unexpected '>>'");
+                if (-type == PRTokeniser.TK_END_ARRAY)
+                    throw new IOException("Unexpected ']'");
+                dic.put(name, obj);
+        }
+        return dic;
+    }
+    
+    /**
+     * Reads an array. The tokeniser must be positioned past the "[" token.
+     * @return an array
+     * @throws IOException on error
+     */    
+    public PdfArray readArray() throws IOException {
+        PdfArray array = new PdfArray();
+        while (true) {
+            PdfObject obj = readPRObject();
+            int type = obj.type();
+            if (-type == PRTokeniser.TK_END_ARRAY)
+                break;
+            if (-type == PRTokeniser.TK_END_DIC)
+                throw new IOException("Unexpected '>>'");
+            array.add(obj);
+        }
+        return array;
+    }
+    
+    /**
+     * Reads a pdf object.
+     * @return the pdf object
+     * @throws IOException on error
+     */    
+    public PdfObject readPRObject() throws IOException {
+        if (!nextValidToken())
+            return null;
+        int type = tokeniser.getTokenType();
+        switch (type) {
+            case PRTokeniser.TK_START_DIC: {
+                PdfDictionary dic = readDictionary();
+                return dic;
+            }
+            case PRTokeniser.TK_START_ARRAY:
+                return readArray();
+            case PRTokeniser.TK_STRING:
+                PdfString str = new PdfString(tokeniser.getStringValue(), null).setHexWriting(tokeniser.isHexString());
+                return str;
+            case PRTokeniser.TK_NAME:
+                return new PdfName(tokeniser.getStringValue(), false);
+            case PRTokeniser.TK_NUMBER:
+                return new PdfNumber(tokeniser.getStringValue());
+            case PRTokeniser.TK_OTHER:
+                return new PdfLiteral(COMMAND_TYPE, tokeniser.getStringValue());
+            default:
+                return new PdfLiteral(-type, tokeniser.getStringValue());
+        }
+    }
+    
+    /**
+     * Reads the next token skipping over the comments.
+     * @return <CODE>true</CODE> if a token was read, <CODE>false</CODE> if the end of content was reached
+     * @throws IOException on error
+     */    
+    public boolean nextValidToken() throws IOException {
+        while (tokeniser.nextToken()) {
+            if (tokeniser.getTokenType() == PRTokeniser.TK_COMMENT)
+                continue;
+            return true;
+        }
+        return false;
+    }
+}
+\ No newline at end of file