using System; using System.Collections; using System.util; using System.Text; using System.Xml; using iTextSharp.text; using iTextSharp.text.pdf; using iTextSharp.text.pdf.draw; using iTextSharp.text.xml.simpleparser; using iTextSharp.text.html; using iTextSharp.text.factories; /* * $Id: ITextHandler.cs,v 1.21 2008/05/13 11:26:11 psoares33 Exp $ * * * Copyright 2001, 2002 by Bruno Lowagie. * * The contents of this file are subject to the Mozilla Public License Version 1.1 * (the "License"); you may not use this file except in compliance with the License. * You may obtain a copy of the License at http://www.mozilla.org/MPL/ * * Software distributed under the License is distributed on an "AS IS" basis, * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License * for the specific language governing rights and limitations under the License. * * The Original Code is 'iText, a free JAVA-PDF library'. * * The Initial Developer of the Original Code is Bruno Lowagie. Portions created by * the Initial Developer are Copyright (C) 1999, 2000, 2001, 2002 by Bruno Lowagie. * All Rights Reserved. * Co-Developer of the code is Paulo Soares. Portions created by the Co-Developer * are Copyright (C) 2000, 2001, 2002 by Paulo Soares. All Rights Reserved. * * Contributor(s): all the names of the contributors are added in the source code * where applicable. * * Alternatively, the contents of this file may be used under the terms of the * LGPL license (the "GNU LIBRARY GENERAL PUBLIC LICENSE"), in which case the * provisions of LGPL are applicable instead of those above. If you wish to * allow use of your version of this file only under the terms of the LGPL * License and not to allow others to use your version of this file under * the MPL, indicate your decision by deleting the provisions above and * replace them with the notice and other provisions required by the LGPL. * If you do not delete the provisions above, a recipient may use your version * of this file under either the MPL or the GNU LIBRARY GENERAL PUBLIC LICENSE. * * This library is free software; you can redistribute it and/or modify it * under the terms of the MPL as stated above or under the terms of the GNU * Library General Public License as published by the Free Software Foundation; * either version 2 of the License, or any later version. * * This library is distributed in the hope that it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS * FOR A PARTICULAR PURPOSE. See the GNU Library general Public License for more * details. * * If you didn't download this code from the following link, you should check if * you aren't using an obsolete version: * http://www.lowagie.com/iText/ */ namespace iTextSharp.text.xml { /// /// The iTextHandler-class maps several XHTML-tags to iText-objects. /// public class ITextHandler : ParserBase { /// This is the resulting document. protected IDocListener document; /// This is a Stack of objects, waiting to be added to the document. protected Stack stack; /// Counts the number of chapters in this document. protected int chapters = 0; /// This is the current chunk to which characters can be added. protected Chunk currentChunk = null; /// This is the current chunk to which characters can be added. protected bool ignore = false; /// This is a flag that can be set, if you want to open and close the Document-object yourself. protected bool controlOpenClose = true; /** current margin of a page. */ float topMargin = 36; /** current margin of a page. */ float rightMargin = 36; /** current margin of a page. */ float leftMargin = 36; /** current margin of a page. */ float bottomMargin = 36; /// /// Constructs a new iTextHandler that will translate all the events /// triggered by the parser to actions on the Document-object. /// /// this is the document on which events must be triggered public ITextHandler(IDocListener document) : base() { this.document = document; stack = new Stack(); } protected Hashtable myTags; /** * @param document * @param myTags * @throws DocumentException * @throws IOException */ public ITextHandler(IDocListener document, HtmlTagMap myTags) : this(document) { this.myTags = myTags; } /** * @param document * @param myTags * @param bf * @throws DocumentException * @throws IOException */ public ITextHandler(IDocListener document, HtmlTagMap myTags, BaseFont bf) : this(document, myTags) { this.bf = bf; } /** * @param document * @param myTags * @throws DocumentException * @throws IOException */ public ITextHandler(IDocListener document, Hashtable myTags) : this(document) { this.myTags = myTags; } /// /// Sets the parameter that allows you to enable/disable the control over the Document.Open() and Document.Close() method. /// /// /// If you set this parameter to true (= default), the parser will open the Document object when the start-root-tag is encountered /// and close it when the end-root-tag is met. If you set it to false, you have to open and close the Document object /// yourself. /// /// set this to false if you plan to open/close the Document yourself public void SetControlOpenClose(bool controlOpenClose) { this.controlOpenClose = controlOpenClose; } /// /// This method gets called when a start tag is encountered. /// /// /// /// the name of the tag that is encountered /// the list of attributes public override void StartElement(String uri, String lname, String name, Hashtable attrs) { Properties attributes = new Properties(); if (attrs != null) { foreach (string key in attrs.Keys) { attributes.Add(key, (string)attrs[key]); } } HandleStartingTags(name, attributes); } /// /// This method deals with the starting tags. /// /// the name of the tag /// the list of attributes public void HandleStartingTags(String name, Properties attributes) { //System.err.Println("Start: " + name); if (ignore || ElementTags.IGNORE.Equals(name)) { ignore = true; return; } // maybe there is some meaningful data that wasn't between tags if (currentChunk != null) { ITextElementArray current; try { current = (ITextElementArray) stack.Pop(); } catch { if (bf == null) { current = new Paragraph("", new Font()); } else { current = new Paragraph("", new Font(this.bf)); } } current.Add(currentChunk); stack.Push(current); currentChunk = null; } // registerfont if (name.Equals("registerfont")) { FontFactory.Register(attributes); } // header if (ElementTags.HEADER.Equals(name)) { stack.Push(new HeaderFooter(attributes)); return; } // footer if (ElementTags.FOOTER.Equals(name)) { stack.Push(new HeaderFooter(attributes)); return; } // before if (name.Equals("before")) { HeaderFooter tmp = (HeaderFooter)stack.Pop(); tmp.Before = ElementFactory.GetPhrase(attributes); stack.Push(tmp); return; } // after if (name.Equals("after")) { HeaderFooter tmp = (HeaderFooter)stack.Pop(); tmp.After = ElementFactory.GetPhrase(attributes); stack.Push(tmp); return; } // chunks if (ElementTags.CHUNK.Equals(name)) { currentChunk = ElementFactory.GetChunk(attributes); if (bf != null) { currentChunk.Font = new Font(this.bf); } return; } // symbols if (ElementTags.ENTITY.Equals(name)) { Font f = new Font(); if (currentChunk != null) { HandleEndingTags(ElementTags.CHUNK); f = currentChunk.Font; } currentChunk = EntitiesToSymbol.Get(attributes[ElementTags.ID], f); return; } // phrases if (ElementTags.PHRASE.Equals(name)) { stack.Push(ElementFactory.GetPhrase(attributes)); return; } // anchors if (ElementTags.ANCHOR.Equals(name)) { stack.Push(ElementFactory.GetAnchor(attributes)); return; } // paragraphs and titles if (ElementTags.PARAGRAPH.Equals(name) || ElementTags.TITLE.Equals(name)) { stack.Push(ElementFactory.GetParagraph(attributes)); return; } // lists if (ElementTags.LIST.Equals(name)) { stack.Push(ElementFactory.GetList(attributes)); return; } // listitems if (ElementTags.LISTITEM.Equals(name)) { stack.Push(ElementFactory.GetListItem(attributes)); return; } // cells if (ElementTags.CELL.Equals(name)) { stack.Push(ElementFactory.GetCell(attributes)); return; } // tables if (ElementTags.TABLE.Equals(name)) { Table table = ElementFactory.GetTable(attributes); float[] widths = table.ProportionalWidths; for (int i = 0; i < widths.Length; i++) { if (widths[i] == 0) { widths[i] = 100.0f / (float)widths.Length; } } try { table.Widths = widths; } catch (BadElementException bee) { // this shouldn't happen throw new Exception("", bee); } stack.Push(table); return; } // sections if (ElementTags.SECTION.Equals(name)) { IElement previous = (IElement) stack.Pop(); Section section; section = ElementFactory.GetSection((Section) previous, attributes); stack.Push(previous); stack.Push(section); return; } // chapters if (ElementTags.CHAPTER.Equals(name)) { stack.Push(ElementFactory.GetChapter(attributes)); return; } // images if (ElementTags.IMAGE.Equals(name)) { try { Image img = ElementFactory.GetImage(attributes); try { AddImage(img); return; } catch { // if there is no element on the stack, the Image is added to the document try { document.Add(img); } catch (DocumentException de) { throw new Exception("", de); } return; } } catch (Exception e) { throw new Exception("", e); } } // annotations if (ElementTags.ANNOTATION.Equals(name)) { Annotation annotation = ElementFactory.GetAnnotation(attributes); ITextElementArray current; try { try { current = (ITextElementArray) stack.Pop(); try { current.Add(annotation); } catch { document.Add(annotation); } stack.Push(current); } catch { document.Add(annotation); } return; } catch (DocumentException de) { throw de; } } // newlines if (IsNewline(name)) { ITextElementArray current; try { current = (ITextElementArray) stack.Pop(); current.Add(Chunk.NEWLINE); stack.Push(current); } catch { if (currentChunk == null) { try { document.Add(Chunk.NEWLINE); } catch (DocumentException de) { throw de; } } else { currentChunk.Append("\n"); } } return; } // newpage if (IsNewpage(name)) { ITextElementArray current; try { current = (ITextElementArray) stack.Pop(); Chunk newPage = new Chunk(""); newPage.SetNewPage(); if (bf != null) { newPage.Font = new Font(this.bf); } current.Add(newPage); stack.Push(current); } catch { document.NewPage(); } return; } if (ElementTags.HORIZONTALRULE.Equals(name)) { ITextElementArray current; LineSeparator hr = new LineSeparator(1.0f, 100.0f, null, Element.ALIGN_CENTER, 0); try { current = (ITextElementArray)stack.Pop(); current.Add(hr); stack.Push(current); } catch (InvalidOperationException) { document.Add(hr); } return; } // documentroot if (IsDocumentRoot(name)) { String value; // pagesize and orientation specific code suggested by Samuel Gabriel // Updated by Ricardo Coutinho. Only use if set in html! Rectangle pageSize = null; String orientation = null; foreach (string key in attributes.Keys) { value = attributes[key]; // margin specific code suggested by Reza Nasiri if (Util.EqualsIgnoreCase(ElementTags.LEFT, key)) leftMargin = float.Parse(value, System.Globalization.NumberFormatInfo.InvariantInfo); if (Util.EqualsIgnoreCase(ElementTags.RIGHT, key)) rightMargin = float.Parse(value, System.Globalization.NumberFormatInfo.InvariantInfo); if (Util.EqualsIgnoreCase(ElementTags.TOP, key)) topMargin = float.Parse(value, System.Globalization.NumberFormatInfo.InvariantInfo); if (Util.EqualsIgnoreCase(ElementTags.BOTTOM, key)) bottomMargin = float.Parse(value, System.Globalization.NumberFormatInfo.InvariantInfo); if (ElementTags.PAGE_SIZE.Equals(key)) { pageSize = (Rectangle)typeof(PageSize).GetField(value).GetValue(null); } else if (ElementTags.ORIENTATION.Equals(key)) { if ("landscape".Equals(value)) { orientation = "landscape"; } } else { document.Add(new Meta(key, value)); } } if (pageSize != null) { if ("landscape".Equals(orientation)) { pageSize = pageSize.Rotate(); } document.SetPageSize(pageSize); } document.SetMargins(leftMargin, rightMargin, topMargin, bottomMargin); if (controlOpenClose) document.Open(); } } protected internal void AddImage(Image img) { // if there is an element on the stack... Object current = stack.Pop(); // ...and it's a Chapter or a Section, the Image can be // added directly if (current is Chapter || current is Section || current is Cell) { ((ITextElementArray) current).Add(img); stack.Push(current); return; } // ...if not, we need to to a lot of stuff else { Stack newStack = new Stack(); while (!(current is Chapter || current is Section || current is Cell)) { newStack.Push(current); if (current is Anchor) { img.Annotation = new Annotation(0, 0, 0, 0, ((Anchor) current).Reference); } current = stack.Pop(); } ((ITextElementArray) current).Add(img); stack.Push(current); while (newStack.Count != 0) { stack.Push(newStack.Pop()); } return; } } /// /// This method gets called when ignorable white space encountered. /// /// an array of characters /// the start position in the array /// the number of characters to read from the array public void IgnorableWhitespace(char[] ch, int start, int length) { // do nothing: we handle white space ourselves in the characters method } /// /// This method gets called when characters are encountered. /// /// an array of characters /// the start position in the array /// the number of characters to read from the array public override void Characters(string content, int start, int length) { if (ignore) return; if (content.Trim().Length == 0 && content.IndexOf(' ') < 0) { return; } StringBuilder buf = new StringBuilder(); int len = content.Length; char character; bool newline = false; for (int i = 0; i < len; i++) { switch (character = content[i]) { case ' ': if (!newline) { buf.Append(character); } break; case '\n': if (i > 0) { newline = true; buf.Append(' '); } break; case '\r': break; case '\t': break; default: newline = false; buf.Append(character); break; } } string tmp = buf.ToString(); string rline = new String('\r', 1); string nline = new String('\n', 1); string tline = new String('\t', 1); tmp = tmp.Replace("\\n", nline); tmp = tmp.Replace("\\t", tline); tmp = tmp.Replace("\\r", rline); if (currentChunk == null) { if (bf == null) { currentChunk = new Chunk(buf.ToString()); } else { currentChunk = new Chunk(buf.ToString(), new Font(this.bf)); } } else { currentChunk.Append(buf.ToString()); } } private BaseFont bf = null; public BaseFont DefaultFont { set { bf = value; } get { return bf; } } /// /// This method gets called when an end tag is encountered. /// /// /// /// the name of the tag that ends public override void EndElement(String uri, String lname, String name) { HandleEndingTags(name); } /// /// This method deals with the starting tags. /// /// the name of the tag public void HandleEndingTags(String name) { //System.err.Println("Stop: " + name); if (ElementTags.IGNORE.Equals(name)) { ignore = false; return; } if (ignore) return; // tags that don't have any content if (IsNewpage(name) || ElementTags.ANNOTATION.Equals(name) || ElementTags.IMAGE.Equals(name) || IsNewline(name)) { return; } try { // titles of sections and chapters if (ElementTags.TITLE.Equals(name)) { Paragraph current = (Paragraph) stack.Pop(); if (currentChunk != null) { current.Add(currentChunk); currentChunk = null; } Section previous = (Section) stack.Pop(); previous.Title = current; stack.Push(previous); return; } // all other endtags if (currentChunk != null) { ITextElementArray current; try { current = (ITextElementArray) stack.Pop(); } catch { current = new Paragraph(); } current.Add(currentChunk); stack.Push(current); currentChunk = null; } // chunks if (ElementTags.CHUNK.Equals(name)) { return; } // phrases, anchors, lists, tables if (ElementTags.PHRASE.Equals(name) || ElementTags.ANCHOR.Equals(name) || ElementTags.LIST.Equals(name) || ElementTags.PARAGRAPH.Equals(name)) { IElement current = (IElement) stack.Pop(); try { ITextElementArray previous = (ITextElementArray) stack.Pop(); previous.Add(current); stack.Push(previous); } catch { document.Add(current); } return; } // listitems if (ElementTags.LISTITEM.Equals(name)) { ListItem listItem = (ListItem) stack.Pop(); List list = (List) stack.Pop(); list.Add(listItem); stack.Push(list); } // tables if (ElementTags.TABLE.Equals(name)) { Table table = (Table) stack.Pop(); try { ITextElementArray previous = (ITextElementArray) stack.Pop(); previous.Add(table); stack.Push(previous); } catch { document.Add(table); } return; } // rows if (ElementTags.ROW.Equals(name)) { ArrayList cells = new ArrayList(); int columns = 0; Table table; Cell cell; while (true) { IElement element = (IElement) stack.Pop(); if (element.Type == Element.CELL) { cell = (Cell) element; columns += cell.Colspan; cells.Add(cell); } else { table = (Table) element; break; } } if (table.Columns < columns) { table.AddColumns(columns - table.Columns); } cells.Reverse(0, cells.Count); String width; float[] cellWidths = new float[columns]; bool[] cellNulls = new bool[columns]; for (int i = 0; i < columns; i++) { cellWidths[i] = 0; cellNulls[i] = true; } float total = 0; int j = 0; foreach (Cell c in cells) { cell = c; width = cell.GetWidthAsString(); if (cell.Width == 0) { if (cell.Colspan == 1 && cellWidths[j] == 0) { try { cellWidths[j] = 100f / columns; total += cellWidths[j]; } catch { // empty on purpose } } else if (cell.Colspan == 1) { cellNulls[j] = false; } } else if (cell.Colspan == 1 && width.EndsWith("%")) { try { cellWidths[j] = float.Parse(width.Substring(0, width.Length - 1), System.Globalization.NumberFormatInfo.InvariantInfo); total += cellWidths[j]; } catch { // empty on purpose } } j += cell.Colspan; table.AddCell(cell); } float[] widths = table.ProportionalWidths; if (widths.Length == columns) { float left = 0.0f; for (int i = 0; i < columns; i++) { if (cellNulls[i] && widths[i] != 0) { left += widths[i]; cellWidths[i] = widths[i]; } } if (100.0 >= total) { for (int i = 0; i < widths.Length; i++) { if (cellWidths[i] == 0 && widths[i] != 0) { cellWidths[i] = (widths[i] / left) * (100.0f - total); } } } table.Widths = cellWidths; } stack.Push(table); } // registerfont if (name.Equals("registerfont")) { return; } // header if (ElementTags.HEADER.Equals(name)) { document.Header = (HeaderFooter)stack.Pop(); return; } // footer if (ElementTags.FOOTER.Equals(name)) { document.Footer = (HeaderFooter)stack.Pop(); return; } // before if (name.Equals("before")) { return; } // after if (name.Equals("after")) { return; } // cells if (ElementTags.CELL.Equals(name)) { return; } // sections if (ElementTags.SECTION.Equals(name)) { stack.Pop(); return; } // chapters if (ElementTags.CHAPTER.Equals(name)) { document.Add((IElement) stack.Pop()); return; } // the documentroot if (IsDocumentRoot(name)) { try { while (true) { IElement element = (IElement) stack.Pop(); try { ITextElementArray previous = (ITextElementArray) stack.Pop(); previous.Add(element); stack.Push(previous); } catch { document.Add(element); } } } catch { // empty on purpose } if (controlOpenClose) document.Close(); return; } } catch (DocumentException de) { throw de; } } /// /// Checks if a certain tag corresponds with the newpage-tag. /// /// a presumed tagname /// true or false private bool IsNewpage(String tag) { return ElementTags.NEWPAGE.Equals(tag); } /// /// Checks if a certain tag corresponds with the newpage-tag. /// /// a presumed tagname /// true or false private bool IsNewline(String tag) { return ElementTags.NEWLINE.Equals(tag); } /// /// Checks if a certain tag corresponds with the roottag. /// /// a presumed tagname /// true if tag equals itext, false otherwise. protected bool IsDocumentRoot(String tag) { return ElementTags.ITEXT.Equals(tag); } } }