w2phtml/src/main/java/writer2latex/xhtml/content/TextParser.java

1854 lines
70 KiB
Java

/************************************************************************
*
* TextConverter.java
*
* Copyright: 2002-2015 by Henrik Just
*
* This file is part of Writer2LaTeX.
*
* Writer2LaTeX is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Writer2LaTeX is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Writer2LaTeX. If not, see <http://www.gnu.org/licenses/>.
*
* Version 1.6 (2015-07-23)
*
*/
package writer2latex.xhtml.content;
import java.util.Hashtable;
import java.util.Stack;
import org.w3c.dom.Node;
import org.w3c.dom.NodeList;
import pro.litvinovg.xml.Debug;
import org.w3c.dom.Element;
import writer2latex.util.Misc;
import writer2latex.xhtml.Converter;
import writer2latex.xhtml.ODFPageSplitter;
import writer2latex.xhtml.Parser;
import writer2latex.xhtml.StyleInfo;
import writer2latex.xhtml.XhtmlConfig;
import writer2latex.xhtml.XhtmlStyleMap;
import writer2latex.xhtml.XhtmlStyleMapItem;
import writer2latex.office.FontDeclaration;
import writer2latex.office.MasterPage;
import writer2latex.office.OfficeStyle;
import writer2latex.office.PageLayout;
import writer2latex.office.ListCounter;
import writer2latex.office.ListStyle;
import writer2latex.office.StyleWithProperties;
import writer2latex.office.OfficeReader;
import static writer2latex.office.XMLString.*;
/** This class handles text content
*/
public class TextParser extends Parser {
// Data used to handle splitting over several files
// TODO: Accessor methods for sections
// Some (Sony?) EPUB readers have a limit on the file size of individual files
// In any case very large files could be a performance problem, hence we do automatic splitting
// after this number of characters.
private int nSplitAfter = 150000;
// TODO: Collect soft page breaks between table rows
private boolean bPendingPageBreak = false; // We have encountered a page break which should be inserted asap
private int splitHeadingLevel = 0; // The outline level at which to split files (0=no split)
private int nRepeatLevels = 5; // The number of levels to repeat when splitting (0=no repeat)
private int nLastSplitLevel = 1; // The outline level at which the last split occurred
private int nDontSplitLevel = 0; // if > 0 splitting is forbidden
boolean bAfterHeading=false; // last element was a top level heading
Element[] currentHeading = new Element[7]; // Last headings (repeated when splitting)
private int nCharacterCount = 0; // The number of text characters in the current document
// Counters for generated numbers
private ListCounter outlineNumbering;
private Hashtable<String, ListCounter> listCounters = new Hashtable<String, ListCounter>();
private String sCurrentListLabel = null;
private ListStyle currentListStyle = null;
private int nCurrentListLevel = 0;
public Separator docSep = null;
// Mode used to handle floats (depends on source doc type and config)
private int nFloatMode;
// Converter helpers used to handle all sorts of indexes
private TOCParser tocParser;
private LOFParser lofCv;
private LOTParser lotCv;
private AlphabeticalIndexParser indexCv;
private BibliographyParser bibCv;
// Converter helpers used to handle footnotes and endnotes
private FootnoteParser footCv;
private EndnoteParser endCv;
// Sometimes we have to create an inlinenode in a block context
// (labels for footnotes and endnotes)
// We put it here and insert it in the first paragraph/heading to come:
private Node asapNode = null;
// When generating toc, a few things should be done differently
private boolean bInToc = false;
// Display hidden text?
private boolean displayHiddenText = false;
// Current page number
int pageNum = 1;
//Current master page name
private String currentMasterPage = null;
//Current master page name
private String nextMasterPage = null;
private boolean pagination = config.pagination();
private boolean breakBeforeNextNode = false;
private boolean inTable = false;
private boolean inList = false;
private boolean inFootnote = false;
private boolean inEndnote = false;
private boolean inHeader = false;
private boolean inFooter = false;
private String endnotesContext = null;
private String footnotesContext = null;
PageContainer pageContainer = null;
public TextParser(OfficeReader ofr, XhtmlConfig config, Converter converter) {
super(ofr,config,converter);
tocParser = new TOCParser(ofr, config, converter);
lofCv = new LOFParser(ofr, config, converter);
lotCv = new LOTParser(ofr, config, converter);
bibCv = new BibliographyParser(ofr, config, converter);
indexCv = new AlphabeticalIndexParser(ofr, config, converter);
footCv = new FootnoteParser(ofr, config, converter);
endCv = new EndnoteParser(ofr, config, converter);
nSplitAfter = 1000*config.splitAfter();
splitHeadingLevel = config.getXhtmlSplitLevel();
nRepeatLevels = converter.isOPS() ? 0 : config.getXhtmlRepeatLevels(); // never repeat headings in EPUB
nFloatMode = ofr.isText() && config.xhtmlFloatObjects() ?
DrawParser.FLOATING : DrawParser.ABSOLUTE;
outlineNumbering = new ListCounter(ofr.getOutlineStyle());
displayHiddenText = config.displayHiddenText();
pageContainer = converter.pageContainer;
docSep = new Separator(config, converter);
}
/** Converts an office node as a complete text document
*
* @param onode the Office node containing the content to convert
*/
public void convertDocumentContent(Element onode) {
Element hnode = converter.nextOutFile();
// Create form
if (splitHeadingLevel==0) {
Element form = getDrawCv().createForm();
if (form!=null) {
hnode.appendChild(form);
hnode = form;
}
}
// Add cover image
hnode = getDrawCv().insertCoverImage(hnode);
//Extract table:index-body content from TOC
if (!config.includeToc()){
extractRealTOC(onode);
}
//Split pages
if (pagination) {
onode = (Element) ODFPageSplitter.splitText(onode,ofr);
}
hnode = (Element)traverseBlockText(onode,hnode);
// Add footnotes and endnotes
insertFootnotes(hnode,true);
addFooter(hnode);
insertEndnotes(hnode, null);
hnode = (Element) docSep.endDocument(hnode);
// Generate all indexes
bInToc = true;
tocParser.generate();
bInToc = false;
bInToc = true;
tocParser.generatePanels(splitHeadingLevel);
bInToc = false;
}
private void insertEndnotes(Element hnode, String section) {
inEndnote = true;
endCv.insertEndnotes(hnode,section);
inEndnote = false;
}
private void extractRealTOC(Element onode) {
NodeList tocs = onode.getElementsByTagName(TEXT_TABLE_OF_CONTENT);
int i = 0;
if (tocs == null){
return;
}
while (i < tocs.getLength()){
Node toc = tocs.item(i);
NodeList indexBody = ((Element)toc).getElementsByTagName(TEXT_INDEX_BODY);
if (indexBody == null || indexBody.item(0) == null){
i++;
continue;
}
while (indexBody.item(0).hasChildNodes()){
Node child = indexBody.item(0).getFirstChild();
if (child.getNodeType() == Node.ELEMENT_NODE
&&
((Element) child).getTagName().equals(TEXT_INDEX_TITLE)
){
while(child.hasChildNodes()){
toc.getParentNode().insertBefore(child.getFirstChild(),toc);
}
//kamikadze
child.getParentNode().removeChild(child);
continue;
}
//Move childnodes before text:table-of-content
toc.getParentNode().insertBefore(child, toc);
}
i++;
}
return;
}
public int getTocIndex() { return tocParser.getFileIndex(); }
public int getAlphabeticalIndex() { return indexCv.getFileIndex(); }
protected void setAsapNode(Element node) {
asapNode = node;
}
////////////////////////////////////////////////////////////////////////
// NAVIGATION (fill header, footer and panel with navigation links)
////////////////////////////////////////////////////////////////////////
////////////////////////////////////////////////////////////////////////
// BLOCK TEXT (returns current html node at end of block)
////////////////////////////////////////////////////////////////////////
public Node traverseBlockText(Node onode, Node hnode) {
return parseText(onode,0,null,hnode);
}
private Node parseText(Node onode, int nLevel, String styleName, Node hnode) {
if (!onode.hasChildNodes()) { return hnode; }
bAfterHeading = false;
NodeList nList = onode.getChildNodes();
int nLen = nList.getLength();
int i = 0;
//hard Break after marker
breakBeforeNextNode = false;
while (i < nLen) {
Node child = nList.item(i);
if (child.getNodeType() == Node.ELEMENT_NODE) {
String nodeName = child.getNodeName();
// Block splitting
nDontSplitLevel++;
if (OfficeReader.isDrawElement(child)) {
getDrawCv().handleDrawElement((Element)child,(Element)hnode,null,nFloatMode);
}
else if (nodeName.equals(TEXT_P)) {
StyleWithProperties style = ofr.getParStyle(Misc.getAttribute(child,TEXT_STYLE_NAME));
hnode = processPageBreaks(child, hnode,style);
nCharacterCount+=OfficeReader.getCharacterCount(child);
// is there a block element, we should use?
XhtmlStyleMap xpar = config.getXParStyleMap();
String sDisplayName = style!=null ? style.getDisplayName() : null;
if (sDisplayName!=null && xpar.contains(sDisplayName)) {
Node curHnode = hnode;
XhtmlStyleMapItem map = xpar.get(sDisplayName);
String sBlockElement = map.sBlockElement;
String sBlockCss = map.sBlockCss;
if (map.sBlockElement.length()>0) {
Element block = converter.createElement(map.sBlockElement);
if (!"(none)".equals(map.sBlockCss)) {
block.setAttribute("class",map.sBlockCss);
}
hnode.appendChild(block);
curHnode = block;
}
boolean bMoreParagraphs = true;
do {
handleParagraph(child,curHnode);
bMoreParagraphs = false;
if (++i<nLen) {
child = nList.item(i);
String cnodeName = child.getNodeName();
if (cnodeName.equals(TEXT_P)) {
String sCurDisplayName = ofr.getParStyles().getDisplayName(Misc.getAttribute(child,TEXT_STYLE_NAME));
if (sCurDisplayName!=null && xpar.contains(sCurDisplayName)) {
XhtmlStyleMapItem newmap = xpar.get(sCurDisplayName);
if (sBlockElement.equals(newmap.sBlockElement) &&
sBlockCss.equals(newmap.sBlockCss)) {
bMoreParagraphs = true;
}
}
}
}
} while (bMoreParagraphs);
i--;
}
else {
handleParagraph(child,hnode);
}
}
else if(nodeName.equals(TEXT_H)) {
StyleWithProperties style = ofr.getParStyle(Misc.getAttribute(child,TEXT_STYLE_NAME));
Node rememberNode = hnode;
hnode = processPageBreaks(child, hnode, style);
nCharacterCount+=OfficeReader.getCharacterCount(child);
handleHeading((Element)child,(Element)hnode,rememberNode!=hnode);
}
else if (nodeName.equals(TEXT_LIST) || // oasis
nodeName.equals(TEXT_UNORDERED_LIST) || // old
nodeName.equals(TEXT_ORDERED_LIST)) // old
{
StyleWithProperties style = null;
String newPageNumberProperty = null;
Element para = null;
Element head = null;
Element item = Misc.getChildByTagName(child, TEXT_LIST_ITEM);
if (item != null){
NodeList paras = item.getElementsByTagName(TEXT_P);
if (paras != null && paras.getLength() > 0){
para = (Element) paras.item(0);
}
NodeList heads = item.getElementsByTagName(TEXT_H);
if (heads != null && heads.getLength() > 0){
head = (Element) heads.item(0);
}
if (para != null ){
StyleWithProperties paraStyle = ofr.getParStyle(Misc.getAttribute(para,TEXT_STYLE_NAME));
if (paraStyle != null) {
newPageNumberProperty = paraStyle.getParProperty(STYLE_PAGE_NUMBER, true);
}
newPageNumberProperty = paraStyle.getParProperty(STYLE_PAGE_NUMBER, true);
if (hasMasterPage(paraStyle) || newPageNumberProperty != null){
style = paraStyle;
}
}
if (head != null && style == null){
StyleWithProperties headStyle = ofr.getParStyle(Misc.getAttribute(head,TEXT_STYLE_NAME));
if (headStyle != null) {
newPageNumberProperty = headStyle.getParProperty(STYLE_PAGE_NUMBER, true);
}
if (hasMasterPage(headStyle) || newPageNumberProperty != null){
style = headStyle;
}
}
}
hnode = processPageBreaks(child, hnode,style);
inList = true;
if (listIsOnlyHeadings(child)) {
nDontSplitLevel--;
hnode = handleFakeList(child,nLevel+1,styleName,hnode);
nDontSplitLevel++;
}
else {
handleList(child,nLevel+1,styleName,hnode);
}
inList = false;
}
else if (nodeName.equals(TABLE_TABLE)) {
StyleWithProperties style = ofr.getTableStyle(Misc.getAttribute(child, TABLE_STYLE_NAME));
hnode = processPageBreaks(child, hnode,style);
inTable = true;
getTableCv().handleTable(child,hnode);
inTable = false;
}
else if (nodeName.equals(TABLE_SUB_TABLE)) {
getTableCv().handleTable(child,hnode);
}
else if (nodeName.equals(TEXT_SECTION)) {
hnode = processPageBreaks(child, hnode,null);
nDontSplitLevel--;
hnode = handleSection(child,hnode);
nDontSplitLevel++;
}
else if (nodeName.equals(TEXT_TABLE_OF_CONTENT)) {
if (!ofr.getTocReader((Element)child).isByChapter()) {
}
tocParser.handleIndex((Element)child,(Element)hnode);
}
else if (nodeName.equals(TEXT_ILLUSTRATION_INDEX)) {
lofCv.handleLOF(child,hnode);
}
else if (nodeName.equals(TEXT_TABLE_INDEX)) {
lotCv.handleLOT(child,hnode);
}
else if (nodeName.equals(TEXT_OBJECT_INDEX)) {
// TODO
}
else if (nodeName.equals(TEXT_USER_INDEX)) {
// TODO
}
else if (nodeName.equals(TEXT_ALPHABETICAL_INDEX)) {
indexCv.handleIndex((Element)child,(Element)hnode);
}
else if (nodeName.equals(TEXT_BIBLIOGRAPHY)) {
bibCv.handleIndex((Element)child,(Element)hnode);
}
else if (nodeName.equals(TEXT_SOFT_PAGE_BREAK)) {
breakBeforeNextNode = true;
}
else if (nodeName.equals(OFFICE_ANNOTATION)) {
converter.handleOfficeAnnotation(child,hnode);
}
else if (nodeName.equals(TEXT_SEQUENCE_DECLS)) {
//handleSeqeuenceDecls(child);
}
// Reenable splitting
nDontSplitLevel--;
// Remember if this was a heading
if (nDontSplitLevel==0) {
bAfterHeading = nodeName.equals(TEXT_H);
hnode = getDrawCv().flushFullscreenFrames((Element)hnode);
}
}
i++;
}
return hnode;
}
/* Process a text:section tag (returns current html node) */
private Node handleSection(Node onode, Node hnode) {
// Unlike headings, paragraphs and spans, text:display is not attached to the style:
String lastEndnotesContext = endnotesContext;
String lastFootnotesContext = footnotesContext;
boolean pageWasOpened = docSep.isPageOpened();
String sectionName = Misc.getAttribute(onode,TEXT_NAME);
String last = Misc.getAttribute(onode,"last");
boolean isLast = false;
if (last != null && last.equals("true")) { isLast = true;}
if (!displayHiddenText && "none".equals(Misc.getAttribute(onode,TEXT_DISPLAY))) { return hnode; }
if (pageWasOpened) {hnode = docSep.closePage(hnode);}
boolean removeStyleAtExit = setSectionStyle(onode);
if (pageWasOpened) {hnode = docSep.openPage(hnode, pageNum);}
hnode = traverseBlockText(onode, hnode);
if (isLast) {
insertEndnotes((Element) hnode, sectionName);
}
endnotesContext = lastEndnotesContext;
footnotesContext = lastFootnotesContext;
if (removeStyleAtExit) {
pageContainer.removeStyle();
}
return hnode;
}
private boolean setSectionStyle(Node onode) {
boolean result = false;
StyleWithProperties sectionStyle;
String styleName = Misc.getAttribute(onode,TEXT_STYLE_NAME);
String sectionName = Misc.getAttribute(onode,TEXT_NAME);
OfficeStyle ofStyle = getSectionSc().getStyles().getStyle(styleName);
if (ofStyle != null) {
sectionStyle = (StyleWithProperties) ofStyle;
int colCount = sectionStyle.getColCount();
if (colCount > 1 ) {
String styleValue = "column-count: " + colCount + ";";
pageContainer.addStyle(styleValue);
result = true;
}
String collectEndnotes = sectionStyle.getSectionProperty("endnote", false);
if (collectEndnotes != null && collectEndnotes.equals("true")) {
endnotesContext = sectionName;
}
String collectFootnotes = sectionStyle.getSectionProperty("footnote", false);
if (collectFootnotes != null && collectFootnotes.equals("true")) {
footnotesContext = sectionName;
}
}
return result;
}
private void handleHeading(Element onode, Element hnode, boolean bAfterSplit) {
int nListLevel = getOutlineLevel((Element)onode);
boolean bUnNumbered = "true".equals(Misc.getAttribute(onode,TEXT_IS_LIST_HEADER));
boolean bRestart = "true".equals(Misc.getAttribute(onode,TEXT_RESTART_NUMBERING));
int nStartValue = Misc.getPosInteger(Misc.getAttribute(onode,TEXT_START_VALUE),1)-1;
handleHeading(onode, hnode, bAfterSplit, ofr.getOutlineStyle(),
nListLevel, bUnNumbered, bRestart, nStartValue);
}
/*
* Process a text:h tag
*/
private void handleHeading(Element onode, Element hnode, boolean bAfterSplit, ListStyle listStyle, int nListLevel, boolean bUnNumbered, boolean bRestart, int nStartValue) {
// Note: nListLevel may in theory be different from the outline level,
// though the ui in OOo does not allow this
// Numbering: It is possible to define outline numbering in CSS2
// using counters; but this is not supported in all browsers
// TODO: Offer CSS2 solution as an alternative later.
// Note: Conditional styles are not supported
int nLevel = getOutlineLevel(onode);
if (nLevel <= 6) { // Export as heading
String sStyleName = onode.getAttribute(TEXT_STYLE_NAME);
StyleWithProperties style = ofr.getParStyle(sStyleName);
// Check for hidden text
if (!displayHiddenText && style != null && "none".equals(style.getProperty(TEXT_DISPLAY))) {
return;
}
// Numbering
if (!bUnNumbered) {
// If the heading uses a paragraph style which sets an explicit empty
// list style name, it's unnumbered
if (style != null) {
String sListStyleName = style.getListStyleName();
if (sListStyleName != null && sListStyleName.length() == 0) {
bUnNumbered = true;
}
}
}
ListCounter counter = null;
String sLabel = "";
if (!bUnNumbered) {
counter = getListCounter(listStyle);
if (bRestart) {
counter.restart(nListLevel, nStartValue);
}
sLabel = counter.step(nListLevel).getLabel();
}
// In EPUB export, a striked out heading will only appear in the external
// toc
boolean bTocOnly = false;
if (converter.isOPS() && style != null) {
String sStrikeOut = style.getProperty(STYLE_TEXT_LINE_THROUGH_STYLE, true);
if (sStrikeOut != null && !"none".equals(sStrikeOut)) {
bTocOnly = true;
}
}
// Export the heading
if (!bTocOnly) {
// If split output, add headings of higher levels
if (bAfterSplit && splitHeadingLevel > 0) {
int nFirst = nLevel - nRepeatLevels;
if (nFirst < 0) {
nFirst = 0;
}
for (int i = nFirst; i < nLevel; i++) {
if (currentHeading[i] != null) {
hnode.appendChild(converter.importNode(currentHeading[i], true));
}
}
}
// Apply style
StyleInfo info = new StyleInfo();
info.sTagName = "h" + nLevel;
getHeadingSc().readParentStyle(nLevel, sStyleName, info);
getHeadingSc().applyStyle(nLevel, sStyleName, info);
// add root element
Element heading = converter.createElement(info.sTagName);
hnode.appendChild(heading);
writeStyle(info, heading);
traverseFloats(onode, hnode, heading);
// Apply writing direction
/*
* String sStyleName = Misc.getAttribute(onode,TEXT_STYLE_NAME);
* StyleWithProperties style = ofr.getParStyle(sStyleName); if
* (style!=null) { StyleInfo headInfo = new StyleInfo();
* StyleConverterHelper.applyDirection(style,headInfo);
* getParSc().applyStyle(headInfo,heading); }
*/
// Prepend asapNode
prependAsapNode(heading);
// Prepend numbering
if (!bUnNumbered) {
insertListLabel(listStyle, nListLevel, "SectionNumber", null, sLabel, heading);
}
// Add to toc
if (!bInToc) {
tocParser.handleHeading(onode, heading, sLabel);
}
// Convert content
StyleInfo innerInfo = new StyleInfo();
getHeadingSc().applyInnerStyle(nLevel, sStyleName, innerInfo);
Element content = heading;
if (innerInfo.sTagName != null && innerInfo.sTagName.length() > 0) {
content = converter.createElement(innerInfo.sTagName);
heading.appendChild(content);
writeStyle(innerInfo, content);
}
traverseInlineText(onode, content);
// Add before/after text if required
addBeforeAfter(heading, ofr.getParStyle(getParSP().getRealParStyleName(sStyleName)), config.getXHeadingStyleMap());
// Keep track of current headings for split output
currentHeading[nLevel] = heading;
for (int i = nLevel + 1; i <= 6; i++) {
currentHeading[i] = null;
}
} else {
if (!bInToc) {
tocParser.handleHeadingExternal(onode, hnode, sLabel);
}
// Keep track of current headings for split output
currentHeading[nLevel] = null;
for (int i = nLevel + 1; i <= 6; i++) {
currentHeading[i] = null;
}
}
} else { // beyond h6 - export as ordinary paragraph
handleParagraph(onode, hnode);
}
}
/*
* Process a text:p tag
*/
private void handleParagraph(Node onode, Node hnode) {
boolean bIsEmpty = OfficeReader.isWhitespaceContent(onode);
if (config.ignoreEmptyParagraphs() && bIsEmpty) { return; }
String styleName = Misc.getAttribute(onode,TEXT_STYLE_NAME);
StyleWithProperties style = ofr.getParStyle(styleName);
if (!displayHiddenText && style!=null && "none".equals(style.getProperty(TEXT_DISPLAY))) { return; }
Element par;
if (ofr.isSpreadsheet()) { // attach inline text directly to parent (always a table cell)
par = (Element) hnode;
}
else {
// Hack because createParagraph doesn't work the way we need here :-(
Element temp = converter.createElement("temp");
par = createParagraph(temp, styleName);
prependAsapNode(par);
traverseFloats(onode,hnode,par);
hnode.appendChild(temp.getFirstChild());
}
// Maybe add to toc
tocParser.handleParagraph((Element)onode, par, sCurrentListLabel);
if (!bIsEmpty) {
par = createTextBackground(par, styleName);
if (config.listFormatting()==XhtmlConfig.HARD_LABELS) {
insertListLabel(currentListStyle, nCurrentListLevel, "ItemNumber", null, sCurrentListLabel, par);
}
sCurrentListLabel = null;
traverseInlineText(onode,par);
}
else {
// An empty paragraph (this includes paragraphs that only contains
// whitespace) is ignored by the browser, hence we add &nbsp;
par.appendChild( converter.createTextNode("\u00A0") );
sCurrentListLabel = null;
}
if (converter.isOPS() && !par.hasChildNodes()) {
// Finally, in EPUB export, if the exported paragraph turns out to be empty, remove it
hnode.removeChild(par);
}
else {
// Otherwise, add before/after text if required
addBeforeAfter(par,ofr.getParStyle(getParSP().getRealParStyleName(styleName)),config.getXParStyleMap());
}
}
private void prependAsapNode(Node node) {
if (asapNode!=null) {
// May float past a split; check this first
if (asapNode.getOwnerDocument()!=node.getOwnerDocument()) {
asapNode = converter.importNode(asapNode,true);
}
node.appendChild(asapNode); asapNode = null;
}
}
///////////////////////////////////////////////////////////////////////////
// LISTS
///////////////////////////////////////////////////////////////////////////
// Helper: Get a list counter for a list style
private ListCounter getListCounter(ListStyle style) {
if (style==ofr.getOutlineStyle()) {
// Outline numbering has a special counter
return outlineNumbering;
}
else if (style!=null) {
// Get existing or create new counter
if (listCounters.containsKey(style.getName())) {
return listCounters.get(style.getName());
}
else {
ListCounter counter = new ListCounter(style);
listCounters.put(style.getName(),counter);
return counter;
}
}
else {
// No style, return a dummy
return new ListCounter();
}
}
// Helper: Insert a list label formatted with a list style
private void insertListLabel(ListStyle style, int nLevel, String sDefaultStyle, String sPrefix, String sLabel, Element hnode) {
if (sLabel!=null && sLabel.length()>0) {
if (sPrefix!=null) {
Element prefix = converter.createElement("span");
prefix.setAttribute("class", "chapter-name");
hnode.appendChild(prefix);
prefix.appendChild( converter.createTextNode(sPrefix));
}
StyleInfo info = new StyleInfo();
if (style!=null) {
String sTextStyleName = style.getLevelProperty(nLevel,TEXT_STYLE_NAME);
getTextSP().readStyle(sTextStyleName, info);
}
if (info.sTagName==null) { info.sTagName = "span"; }
if (info.sClass==null) { info.sClass = sDefaultStyle; }
Element content = converter.createElement(info.sTagName);
getTextSP().writeStyle(info, content);
hnode.appendChild(content);
content.appendChild( converter.createTextNode(sLabel) );
}
}
// Helper: Check if a list contains any items
private boolean hasItems(Node onode) {
Node child = onode.getFirstChild();
while (child!=null) {
if (Misc.isElement(child,TEXT_LIST_ITEM) ||
Misc.isElement(child,TEXT_LIST_HEADER)) {
return true;
}
child = child.getNextSibling();
}
return false;
}
// TODO: Merge these three methods
/*
* Process a text:ordered-list tag.
*/
private void handleOL (Node onode, int nLevel, String sStyleName, Node hnode) {
if (hasItems(onode)) {
// add an OL element
Element list = converter.createElement("ol");
StyleInfo listInfo = new StyleInfo();
getListSc().applyStyle(nLevel,sStyleName,listInfo);
getListSc().readParentStyle(nLevel, sStyleName, listInfo);
writeStyle(listInfo,list);
hnode.appendChild(list);
traverseList(onode,nLevel,sStyleName,list);
}
}
/*
* Process a text:unordered-list tag.
*/
private void handleUL (Node onode, int nLevel, String sStyleName, Node hnode) {
if (hasItems(onode)) {
// add an UL element
Element list = converter.createElement("ul");
StyleInfo listInfo = new StyleInfo();
getListSc().applyStyle(nLevel,sStyleName,listInfo);
writeStyle(listInfo,list);
hnode.appendChild(list);
traverseList(onode,nLevel,sStyleName,list);
}
}
private void handleList(Node onode, int nLevel, String sStyleName, Node hnode) {
// In OpenDocument, we should use the style to determine the type of list
String sStyleName1 = Misc.getAttribute(onode,TEXT_STYLE_NAME);
if (sStyleName1!=null) { sStyleName = sStyleName1; }
ListStyle style = ofr.getListStyle(sStyleName);
if (style!=null && style.isNumber(nLevel)) {
handleOL(onode,nLevel,sStyleName,hnode);
}
else {
handleUL(onode,nLevel,sStyleName,hnode);
}
}
/*
* Process the contents of a list (Changed as suggested by Nick Bower)
* The option xhtml_use_list_hack triggers some *invalid* code:
* - the attribute start on ol (is valid in html 4 transitional)
* - the attribute value on li (is valid in html 4 transitional)
* (these attributes are supposed to be replaced by css, but browsers
* generally don't support that)
* - generates <ol><ol><li>...</li></ol></ol> instead of
* <ol><li><ol><li>...</li></ol></li></ol> in case the first child of
* a list item is a new list. This occurs when a list is *continued* at
* level 2 or higher. This hack seems to be the only solution that
* actually produces correct results in browsers :-(
*/
private void traverseList (Node onode, int nLevel, String styleName, Element hnode) {
ListCounter counter = getListCounter(ofr.getListStyle(styleName));
// Restart numbering, if required
//if (counter!=null) {
boolean bContinueNumbering = "true".equals(Misc.getAttribute(onode,TEXT_CONTINUE_NUMBERING));
if (!bContinueNumbering && counter!=null) {
counter.restart(nLevel);
}
if (config.listFormatting()==XhtmlConfig.CSS1_HACK && counter.getValue(nLevel)>0) {
hnode.setAttribute("start",Integer.toString(counter.getValue(nLevel)+1));
}
//}
if (onode.hasChildNodes()) {
NodeList nList = onode.getChildNodes();
int len = nList.getLength();
for (int i = 0; i < len; i++) {
Node child = nList.item(i);
if (child.getNodeType() == Node.ELEMENT_NODE) {
String nodeName = child.getNodeName();
if (nodeName.equals(TEXT_LIST_ITEM)) {
// Check to see if first child is a new list
boolean bIsImmediateNestedList = false;
Element child1 = Misc.getFirstChildElement(child);
if (child1.getTagName().equals(TEXT_ORDERED_LIST) || // old
child1.getTagName().equals(TEXT_UNORDERED_LIST) || // old
child1.getTagName().equals(TEXT_LIST)) { // oasis
bIsImmediateNestedList = true;
}
if (config.listFormatting()==XhtmlConfig.CSS1_HACK && bIsImmediateNestedList) {
traverseListItem(child,nLevel,styleName,hnode);
}
else {
// add an li element
//if (counter!=null) {
sCurrentListLabel = counter.step(nLevel).getLabel();
//}
currentListStyle = ofr.getListStyle(styleName);
nCurrentListLevel = nLevel;
Element item = converter.createElement("li");
StyleInfo info = new StyleInfo();
getPresentationSc().applyOutlineStyle(nLevel,info);
writeStyle(info,item);
hnode.appendChild(item);
if (config.listFormatting()==XhtmlConfig.CSS1_HACK) {
boolean bRestart = "true".equals(Misc.getAttribute(child,
TEXT_RESTART_NUMBERING));
int nStartValue = Misc.getPosInteger(Misc.getAttribute(child,
TEXT_START_VALUE),1);
if (bRestart) {
item.setAttribute("value",Integer.toString(nStartValue));
//if (counter!=null) {
sCurrentListLabel = counter.restart(nLevel,nStartValue).getLabel();
//}
}
}
traverseListItem(child,nLevel,styleName,item);
}
}
if (nodeName.equals(TEXT_LIST_HEADER)) {
// add an li element
Element item = converter.createElement("li");
hnode.appendChild(item);
item.setAttribute("style","list-style-type:none");
traverseListItem(child,nLevel,styleName,item);
}
}
}
}
}
/*
* Process the contents of a list item
* (a list header should only contain paragraphs, but we don't care)
*/
private void traverseListItem (Node onode, int nLevel, String styleName, Node hnode) {
// First check if we have a single paragraph to be omitted
// This should happen if we ignore styles and have no style-map
// for the paragraph style used
if (config.xhtmlFormatting()!=XhtmlConfig.CONVERT_ALL && onode.hasChildNodes()) {
NodeList list = onode.getChildNodes();
int nLen = list.getLength();
int nParCount = 0;
boolean bNoPTag = true;
for (int i=0; i<nLen; i++) {
if (list.item(i).getNodeType()==Node.ELEMENT_NODE) {
if (list.item(i).getNodeName().equals(TEXT_P)) {
nParCount++;
if (bNoPTag) {
String sDisplayName = ofr.getParStyles().getDisplayName(Misc.getAttribute(list.item(0),TEXT_STYLE_NAME));
if (config.getXParStyleMap().contains(sDisplayName)) {
bNoPTag = false;
}
}
}
else { // found non-text:p element
bNoPTag=false;
}
}
}
if (bNoPTag && nParCount<=1) {
// traverse the list
for (int i = 0; i < nLen; i++) {
Node child = list.item(i);
if (child.getNodeType() == Node.ELEMENT_NODE) {
String nodeName = child.getNodeName();
if (nodeName.equals(TEXT_P)) {
traverseInlineText(child,hnode);
}
if (nodeName.equals(TEXT_LIST)) { // oasis
handleList(child,nLevel+1,styleName,hnode);
}
if (nodeName.equals(TEXT_ORDERED_LIST)) { // old
handleOL(child,nLevel+1,styleName,hnode);
}
if (nodeName.equals(TEXT_UNORDERED_LIST)) { // old
handleUL(child,nLevel+1,styleName,hnode);
}
}
}
return;
}
}
// Still here? - traverse block text as usual!
parseText(onode,nLevel,styleName,hnode);
}
///////////////////////////////////////////////////////////////////////////
// FAKE LISTS
///////////////////////////////////////////////////////////////////////////
// A fake list is a list which is converted into a sequence of numbered
// paragraphs rather than into a list.
// Currently this is done for list which only contains headings
// Helper: Check to see, if this list contains only headings
// (If so, we will ignore the list and apply the numbering to the headings)
private boolean listIsOnlyHeadings(Node node) {
Node child = node.getFirstChild();
while (child!=null) {
if (child.getNodeType() == Node.ELEMENT_NODE) {
String nodeName = child.getNodeName();
if (nodeName.equals(TEXT_LIST_ITEM)) {
if (!itemIsOnlyHeadings(child)) return false;
}
else if (nodeName.equals(TEXT_LIST_HEADER)) {
if (!itemIsOnlyHeadings(child)) return false;
}
}
child = child.getNextSibling();
}
return true;
}
private boolean itemIsOnlyHeadings(Node node) {
Node child = node.getFirstChild();
while (child!=null) {
if (child.getNodeType() == Node.ELEMENT_NODE) {
String nodeName = child.getNodeName();
if (nodeName.equals(TEXT_LIST)) {
if (!listIsOnlyHeadings(child)) return false;
}
else if (nodeName.equals(TEXT_ORDERED_LIST)) {
if (!listIsOnlyHeadings(child)) return false;
}
else if (nodeName.equals(TEXT_UNORDERED_LIST)) {
if (!listIsOnlyHeadings(child)) return false;
}
else if(!nodeName.equals(TEXT_H)) {
return false;
}
}
child = child.getNextSibling();
}
return true;
}
// Splitting may occur inside a fake list, so we return the (new) hnode
private Node handleFakeList(Node onode, int nLevel, String sStyleName, Node hnode) {
String sStyleName1 = Misc.getAttribute(onode,TEXT_STYLE_NAME);
if (sStyleName1!=null) { sStyleName = sStyleName1; }
return traverseFakeList(onode,hnode,nLevel,sStyleName);
}
// Traverse a list which is not exported as a list but as a sequence of
// numbered headings/paragraphs
private Node traverseFakeList (Node onode, Node hnode, int nLevel, String sStyleName) {
// Restart numbering?
boolean bContinueNumbering ="true".equals(
Misc.getAttribute(onode,TEXT_CONTINUE_NUMBERING));
if (!bContinueNumbering) {
getListCounter(ofr.getListStyle(sStyleName)).restart(nLevel);
}
Node child = onode.getFirstChild();
while (child!=null) {
if (child.getNodeType() == Node.ELEMENT_NODE) {
String sNodeName = child.getNodeName();
if (sNodeName.equals(TEXT_LIST_ITEM)) {
boolean bRestart = "true".equals(Misc.getAttribute(child,
TEXT_RESTART_NUMBERING));
int nStartValue = Misc.getPosInteger(Misc.getAttribute(child,
TEXT_START_VALUE),1);
hnode = traverseFakeListItem(child, hnode, nLevel, sStyleName, false, bRestart, nStartValue);
}
else if (sNodeName.equals(TEXT_LIST_HEADER)) {
hnode = traverseFakeListItem(child, hnode, nLevel, sStyleName, true, false, 0);
}
}
child = child.getNextSibling();
}
return hnode;
}
// Process the contents of a fake list item
private Node traverseFakeListItem(Node onode, Node hnode, int nLevel, String sStyleName, boolean bUnNumbered, boolean bRestart, int nStartValue) {
Node child = onode.getFirstChild();
while (child != null) {
if (child.getNodeType() == Node.ELEMENT_NODE) {
String sNodeName = child.getNodeName();
if (sNodeName.equals(TEXT_H)) {
nDontSplitLevel++;
Node rememberNode = hnode;
handleHeading((Element) child, (Element) hnode, rememberNode != hnode, ofr.getListStyle(sStyleName), nLevel, bUnNumbered, bRestart, nStartValue);
nDontSplitLevel--;
if (nDontSplitLevel == 0) {
bAfterHeading = true;
}
} else if (sNodeName.equals(TEXT_P)) {
// Currently we only handle fakes lists containing headings
} else if (sNodeName.equals(TEXT_LIST)) { // oasis
return traverseFakeList(child, hnode, nLevel + 1, sStyleName);
} else if (sNodeName.equals(TEXT_ORDERED_LIST)) { // old
return traverseFakeList(child, hnode, nLevel + 1, sStyleName);
} else if (sNodeName.equals(TEXT_UNORDERED_LIST)) { // old
return traverseFakeList(child, hnode, nLevel + 1, sStyleName);
}
}
child = child.getNextSibling();
}
return hnode;
}
////////////////////////////////////////////////////////////////////////
// INLINE TEXT
////////////////////////////////////////////////////////////////////////
/* Process floating frames bound to this inline text (ie. paragraph) */
private void traverseFloats(Node onode, Node hnodeBlock, Node hnodeInline) {
Node child = onode.getFirstChild();
while (child!=null) {
if (child.getNodeType()==Node.ELEMENT_NODE) {
Element elm = (Element) child;
if (OfficeReader.isDrawElement(elm)) {
elm = getDrawCv().getRealDrawElement(elm);
String sAnchor = elm.getAttribute(TEXT_ANCHOR_TYPE);
if (Misc.isElement(elm, DRAW_FRAME)) {
elm = Misc.getFirstChildElement(elm);
}
if (elm!=null) {
String sTag = elm.getTagName();
// Convert only floating frames; text-boxes must always float
if (!"as-char".equals(sAnchor)) {
getDrawCv().handleDrawElement(elm,(Element)hnodeBlock,
(Element)hnodeInline,nFloatMode);
}
else if (DRAW_TEXT_BOX.equals(sTag)) {
getDrawCv().handleDrawElement(elm,(Element)hnodeBlock,
(Element)hnodeInline,DrawParser.INLINE);
}
}
}
else if (OfficeReader.isTextElement(elm)) {
// Do not descend into {foot|end}notes
if (!OfficeReader.isNoteElement(elm)) {
traverseFloats(elm,hnodeBlock,hnodeInline);
}
}
}
child = child.getNextSibling();
}
}
/*
* Process inline text
*/
protected void traverseInlineText(Node onode, Node hnode) {
// String styleName = Misc.getAttribute(onode, TEXT_STYLE_NAME);
if (onode.hasChildNodes()) {
NodeList nList = onode.getChildNodes();
int nLen = nList.getLength();
for (int i = 0; i < nLen; i++) {
Node child = nList.item(i);
short nodeType = child.getNodeType();
switch (nodeType) {
case Node.TEXT_NODE:
String s = child.getNodeValue();
if (s.length() > 0) {
hnode.appendChild(converter.createTextNode(s));
}
break;
case Node.ELEMENT_NODE:
String sName = child.getNodeName();
if (OfficeReader.isDrawElement(child)) {
Element elm = getDrawCv().getRealDrawElement((Element) child);
if (elm != null) {
String sAnchor = (elm.getAttribute(TEXT_ANCHOR_TYPE));
if ("as-char".equals(sAnchor)) {
getDrawCv().handleDrawElement(elm, null, (Element) hnode, DrawParser.INLINE);
}
}
} else if (child.getNodeName().equals(TEXT_S)) {
if (config.ignoreDoubleSpaces()) {
hnode.appendChild(converter.createTextNode(" "));
} else {
int count = Misc.getPosInteger(Misc.getAttribute(child, TEXT_C), 1);
for (; count > 0; count--) {
hnode.appendChild(converter.createTextNode("\u00A0"));
}
}
} else if (sName.equals(TEXT_TAB_STOP)) {
handleTabStop(child, hnode);
} else if (sName.equals(TEXT_TAB)) { // oasis
handleTabStop(child, hnode);
} else if (sName.equals(TEXT_LINE_BREAK)) {
if (!config.ignoreHardLineBreaks()) {
hnode.appendChild(converter.createElement("br"));
}
} else if (sName.equals(TEXT_SPAN)) {
handleSpan(child, hnode);
} else if (sName.equals(TEXT_A)) {
handleAnchor(child, hnode);
} else if (sName.equals(TEXT_FOOTNOTE)) {
footCv.handleNote(child, hnode, footnotesContext);
} else if (sName.equals(TEXT_ENDNOTE)) {
endCv.handleNote(child, hnode, endnotesContext);
} else if (sName.equals(TEXT_NOTE)) { // oasis
if ("endnote".equals(Misc.getAttribute(child, TEXT_NOTE_CLASS))) {
endCv.handleNote(child, hnode, endnotesContext);
} else {
footCv.handleNote(child, hnode, footnotesContext);
}
} else if (sName.equals(TEXT_SEQUENCE)) {
handleSequence(child, hnode);
} else if (sName.equals(TEXT_PAGE_NUMBER)) {
handlePageNumber(child, hnode);
} else if (sName.equals(TEXT_PAGE_COUNT)) {
handlePageCount(child, hnode);
} else if (sName.equals(TEXT_SEQUENCE_REF)) {
handleSequenceRef(child, hnode);
} else if (sName.equals(TEXT_FOOTNOTE_REF)) {
handleNoteRef(child, hnode);
} else if (sName.equals(TEXT_ENDNOTE_REF)) {
handleNoteRef(child, hnode);
} else if (sName.equals(TEXT_NOTE_REF)) { // oasis
handleNoteRef(child, hnode);
} else if (sName.equals(TEXT_REFERENCE_MARK)) {
handleReferenceMark(child, hnode);
} else if (sName.equals(TEXT_REFERENCE_MARK_START)) {
handleReferenceMark(child, hnode);
} else if (sName.equals(TEXT_REFERENCE_REF)) {
handleReferenceRef(child, hnode);
} else if (sName.equals(TEXT_BOOKMARK)) {
handleBookmark(child, hnode);
} else if (sName.equals(TEXT_BOOKMARK_START)) {
handleBookmark(child, hnode);
} else if (sName.equals(TEXT_BOOKMARK_REF)) {
handleBookmarkRef(child, hnode);
} else if (sName.equals(TEXT_ALPHABETICAL_INDEX_MARK)) {
if (!bInToc) {
indexCv.handleIndexMark(child, hnode);
}
} else if (sName.equals(TEXT_ALPHABETICAL_INDEX_MARK_START)) {
if (!bInToc) {
indexCv.handleIndexMarkStart(child, hnode);
}
} else if (sName.equals(TEXT_TOC_MARK)) {
tocParser.handleTocMark(child, hnode);
} else if (sName.equals(TEXT_TOC_MARK_START)) {
tocParser.handleTocMark(child, hnode);
} else if (sName.equals(TEXT_BIBLIOGRAPHY_MARK)) {
handleBibliographyMark(child, hnode);
} else if (sName.equals(OFFICE_ANNOTATION)) {
converter.handleOfficeAnnotation(child, hnode);
} else if (sName.startsWith("text:")) {
traverseInlineText(child, hnode);
}
// other tags are ignored;
break;
default:
// Do nothing
}
}
}
}
private void handleTabStop(Node onode, Node hnode) {
// xhtml does not have tab stops, but we export and ASCII TAB character, which the
// user may choose to format
if (config.getXhtmlTabstopStyle().length()>0) {
Element span = converter.createElement("span");
hnode.appendChild(span);
span.setAttribute("class",config.getXhtmlTabstopStyle());
span.appendChild(converter.createTextNode("\t"));
}
else {
hnode.appendChild(converter.createTextNode("\t"));
}
}
private void handleSpan(Node onode, Node hnode) {
StyleWithProperties style = ofr.getTextStyle(Misc.getAttribute(onode, TEXT_STYLE_NAME));
if (!displayHiddenText && style != null && "none".equals(style.getProperty(TEXT_DISPLAY))) {
return;
}
if (!bInToc) {
String sStyleName = Misc.getAttribute(onode, TEXT_STYLE_NAME);
Element span = createInline((Element) hnode, sStyleName);
traverseInlineText(onode, span);
} else {
traverseInlineText(onode, hnode);
}
}
protected void traversePCDATA(Node onode, Node hnode) {
if (onode.hasChildNodes()) {
NodeList nl = onode.getChildNodes();
int nLen = nl.getLength();
for (int i=0; i<nLen; i++) {
if (nl.item(i).getNodeType()==Node.TEXT_NODE) {
hnode.appendChild( converter.createTextNode(nl.item(i).getNodeValue()) );
}
}
}
}
protected void handleAnchor(Node onode, Node hnode) {
Element anchor = converter.createLink((Element)onode);
hnode.appendChild(anchor);
traverseInlineText(onode,anchor);
}
private void handlePageNumber(Node onode, Node hnode) {
String adjust = Misc.getAttribute(onode, TEXT_PAGE_ADJUST);
//Set current page number
Integer pageNumber = pageNum;
//If there is adjustment apply it
if (adjust != null) {
int pageNumberAdjust = Integer.parseInt(adjust);
pageNumber += pageNumberAdjust;
}
hnode.appendChild(converter.createTextNode(pageNumber.toString()));
}
private void handlePageCount(Node onode, Node hnode) {
// also no sense
hnode.appendChild( converter.createTextNode("(Page count)") );
}
private void handleSequence(Node onode, Node hnode) {
// Use current value, but turn references into hyperlinks
String sName = Misc.getAttribute(onode,TEXT_REF_NAME);
if (sName!=null && !bInToc && ofr.hasSequenceRefTo(sName)) {
Element anchor = converter.createTarget("seq"+sName);
hnode.appendChild(anchor);
traversePCDATA(onode,anchor);
}
else {
traversePCDATA(onode,hnode);
}
}
private void createReference(Node onode, Node hnode, String sPrefix) {
// Turn reference into hyperlink
String sFormat = Misc.getAttribute(onode,TEXT_REFERENCE_FORMAT);
String sName = Misc.getAttribute(onode,TEXT_REF_NAME);
Element anchor = converter.createLink(sPrefix+sName);
hnode.appendChild(anchor);
if ("page".equals(sFormat)) { // all page numbers are 1 :-)
anchor.appendChild( converter.createTextNode("1") );
}
else { // in other cases use current value
traversePCDATA(onode,anchor);
}
}
private void handleSequenceRef(Node onode, Node hnode) {
createReference(onode,hnode,"seq");
}
private void handleNoteRef(Node onode, Node hnode) {
createReference(onode,hnode,"");
}
private void handleReferenceMark(Node onode, Node hnode) {
String sName = Misc.getAttribute(onode,TEXT_NAME);
if (sName!=null && !bInToc && ofr.hasReferenceRefTo(sName)) {
hnode.appendChild(converter.createTarget("ref"+sName));
}
}
private void handleReferenceRef(Node onode, Node hnode) {
createReference(onode,hnode,"ref");
}
private void handleBookmark(Node onode, Node hnode) {
// Note: Two targets (may be the target of a hyperlink or a reference)
String sName = Misc.getAttribute(onode,TEXT_NAME);
if (sName!=null && !bInToc) {
hnode.appendChild(converter.createTarget(sName));
if (ofr.hasBookmarkRefTo(sName)) {
hnode.appendChild(converter.createTarget("bkm"+sName));
}
}
}
private void handleBookmarkRef(Node onode, Node hnode) {
createReference(onode,hnode,"bkm");
}
private void handleBibliographyMark(Node onode, Node hnode) {
if (bInToc) {
traversePCDATA(onode,hnode);
}
else {
bibCv.handleBibliographyMark(onode, hnode);
}
}
///////////////////////////////////////////////////////////////////////////
// UTILITY METHODS
///////////////////////////////////////////////////////////////////////////
// Insert text before/after in an element
private void addBeforeAfter(Element elm, StyleWithProperties style, XhtmlStyleMap styleMap) {
if (style!=null && styleMap.contains(style.getDisplayName())) {
XhtmlStyleMapItem mapItem = styleMap.get(style.getDisplayName());
if (mapItem.sBefore!=null && mapItem.sBefore.length()>0) {
Node child = elm.getFirstChild();
if (child!=null) {
elm.insertBefore(converter.createTextNode(mapItem.sBefore),child);
}
else {
elm.appendChild(converter.createTextNode(mapItem.sBefore));
}
}
if (mapItem.sAfter!=null && mapItem.sAfter.length()>0) {
elm.appendChild(converter.createTextNode(mapItem.sAfter));
}
}
}
// Methods to query individual formatting properties (no inheritance)
// Does this style contain the bold attribute?
private boolean isBold(StyleWithProperties style) {
String s = style.getProperty(FO_FONT_WEIGHT,false);
return s!=null && "bold".equals(s);
}
// Does this style contain the italics/oblique attribute?
private boolean isItalics(StyleWithProperties style) {
String s = style.getProperty(FO_FONT_STYLE,false);
return s!=null && !"normal".equals(s);
}
// Does this style contain a fixed pitch font?
private boolean isFixed(StyleWithProperties style) {
String s = style.getProperty(STYLE_FONT_NAME,false);
String s2 = null;
String s3 = null;
if (s!=null) {
FontDeclaration fd = (FontDeclaration) ofr.getFontDeclarations().getStyle(s);
if (fd!=null) {
s2 = fd.getFontFamilyGeneric();
s3 = fd.getFontPitch();
}
}
else {
s = style.getProperty(FO_FONT_FAMILY,false);
s2 = style.getProperty(STYLE_FONT_FAMILY_GENERIC,false);
s3 = style.getProperty(STYLE_FONT_PITCH,false);
}
if ("fixed".equals(s3)) { return true; }
if ("modern".equals(s2)) { return true; }
return false;
}
// Does this style specify superscript?
private boolean isSuperscript(StyleWithProperties style) {
String sPos = style.getProperty(STYLE_TEXT_POSITION,false);
if (sPos==null) return false;
if (sPos.startsWith("sub")) return false;
if (sPos.startsWith("-")) return false;
if (sPos.startsWith("0%")) return false;
return true;
}
// Does this style specify subscript?
private boolean isSubscript(StyleWithProperties style) {
String sPos = style.getProperty(STYLE_TEXT_POSITION,false);
if (sPos==null) return false;
if (sPos.startsWith("sub")) return true;
if (sPos.startsWith("-")) return true;
return false;
}
// Does this style specify underline?
private boolean isUnderline(StyleWithProperties style) {
String s;
if (ofr.isOpenDocument()) {
s = style.getProperty(STYLE_TEXT_UNDERLINE_STYLE,false);
}
else {
s = style.getProperty(STYLE_TEXT_UNDERLINE,false);
}
return s!=null && !"none".equals(s);
}
// Does this style specify overstrike?
private boolean isOverstrike(StyleWithProperties style) {
String s;
if (ofr.isOpenDocument()) {
s = style.getProperty(STYLE_TEXT_LINE_THROUGH_STYLE,false);
}
else {
s = style.getProperty(STYLE_TEXT_CROSSING_OUT,false);
}
return s!=null && !"none".equals(s);
}
/* apply hard formatting attribute style maps */
private Element applyAttributes(Element node, StyleWithProperties style) {
// Do nothing if we convert hard formatting
if (config.xhtmlFormatting()==XhtmlConfig.CONVERT_ALL || config.xhtmlFormatting()==XhtmlConfig.IGNORE_STYLES) { return node; }
// Do nothing if this is not an automatic style
if (style==null) { return node; }
if (!style.isAutomatic()) { return node; }
node = applyAttribute(node,"bold",isBold(style));
node = applyAttribute(node,"italics",isItalics(style));
node = applyAttribute(node,"fixed",isFixed(style));
node = applyAttribute(node,"superscript",isSuperscript(style));
node = applyAttribute(node,"subscript",isSubscript(style));
node = applyAttribute(node,"underline",isUnderline(style));
node = applyAttribute(node,"overstrike",isOverstrike(style));
return node;
}
/* apply hard formatting attribute style maps */
private Element applyAttribute(Element node, String sAttr, boolean bApply) {
if (bApply) {
XhtmlStyleMap xattr = config.getXAttrStyleMap();
if (xattr.contains(sAttr) && xattr.get(sAttr).sElement.length()>0) {
XhtmlStyleMapItem map = xattr.get(sAttr);
Element attr = converter.createElement(map.sElement);
if (!"(none)".equals(map.sCss)) {
attr.setAttribute("class",map.sCss);
}
node.appendChild(attr);
return attr;
}
}
return node;
}
/* Create a styled paragraph node */
protected Element createParagraph(Element node, String styleName) {
StyleInfo info = new StyleInfo();
StyleWithProperties style = ofr.getParStyle(styleName);
getParSP().readStyle(styleName,info);
getParSP().readParentStyle(styleName,info);
Element para = converter.createElement(info.sTagName);
node.appendChild(para);
writeStyle(info,para);
if (style!=null && style.isAutomatic()) {
return applyAttributes(para,style);
}
else {
return para;
}
}
/* Create an inline node with background style from paragraph style */
private Element createTextBackground(Element node, String sStyleName) {
if (config.xhtmlFormatting()==XhtmlConfig.IGNORE_ALL || config.xhtmlFormatting()==XhtmlConfig.IGNORE_HARD) {
return node;
}
String sBack = getParSP().getTextBackground(sStyleName);
if (sBack.length()>0) {
Element span = converter.createElement("span");
span.setAttribute("style",sBack);
node.appendChild(span);
return span;
}
else {
return node;
}
}
/* Create a styled inline node */
protected Element createInline(Element node, String sStyleName) {
StyleInfo info = new StyleInfo();
getTextSP().readStyle(sStyleName,info);
getTextSP().readParentStyle(sStyleName,info);
Element newNode = node;
if (info.hasAttributes() || !"span".equals(info.sTagName)) {
// We (probably) need to create a new element
newNode = converter.createElement(info.sTagName);
writeStyle(info,newNode);
// But we may want to merge it with the previous element
Node prev = node.getLastChild();
if (prev!=null && Misc.isElement(prev, info.sTagName)) {
// The previous node is of the same type, compare attributes
Element prevNode = (Element) prev;
if (newNode.getAttribute("class").equals(prevNode.getAttribute("class")) &&
newNode.getAttribute("style").equals(prevNode.getAttribute("style")) &&
newNode.getAttribute("xml:lang").equals(prevNode.getAttribute("xml:lang")) &&
newNode.getAttribute("dir").equals(prevNode.getAttribute("dir"))) {
// Attribute style mapped elements are *not* merged, we will live with that
return applyAttributes(prevNode,ofr.getTextStyle(sStyleName));
}
}
node.appendChild(newNode);
}
return applyAttributes(newNode,ofr.getTextStyle(sStyleName));
}
protected int getOutlineLevel(Element node) {
return ofr.isOpenDocument() ?
Misc.getPosInteger(node.getAttribute(TEXT_OUTLINE_LEVEL),0):
Misc.getPosInteger(node.getAttribute(TEXT_LEVEL),0);
}
private Node processPageBreaks(Node currentNode, Node hnode, StyleWithProperties style){
//Check for paragraph in current node in case currentNode is table
// If currentNode is table
//check for first para inside
// Check it's master page, pageNumber, Page break before - if we already set MP - throw it away
// And make a note to pass this paragraph next time you'll meet it.
if (inUnreakableElement() ) {
return hnode;
}
Integer newPageNumber = null;
newPageNumber = getPageNumber(style, newPageNumber);
if (currentMasterPage == null && style != null) {
hnode = startDocument(hnode, style, newPageNumber);
hnode = docSep.processOutlineLevel(currentNode, hnode, pageNum);
} else if (hasMasterPage(style) || hasBreakBefore(style) || breakBeforeNextNode) {
// Insert footnotes
insertFootnotes(hnode,false);
// Add previous MP footer
//hnode = exitPageContainer((Element) hnode);
addFooter(hnode);
// Update MP
updateMasterPageWith(style);
setPageContainerStyle();
// Set new page number if defined or increment if not
if (newPageNumber != null) {
pageNum = newPageNumber;
} else {
pageNum++;
fitPageNumberToMasterPageStyle();
}
if (hasOutlineLevel(currentNode)) {
hnode = docSep.processOutlineLevel(currentNode, hnode, pageNum);
} else {
hnode = docSep.processPageBreak(currentNode, hnode, pageNum);
}
// Print new header
addHeader(hnode);
//hnode = enterPageContainer(hnode);
breakBeforeNextNode = false;
return hnode;
} else {
hnode = docSep.processOutlineLevel(currentNode, hnode, pageNum);
}
if (checkHardBreakAfter(style)) {
breakBeforeNextNode = true;
} else {
breakBeforeNextNode = false;
}
return hnode;
}
private boolean inUnreakableElement() {
return inHeader || inFooter || inTable || inList || inFootnote || inEndnote;
}
private void insertFootnotes(Node hnode, boolean lastCall) {
inFootnote = true;
footCv.insertFootnotes(hnode, lastCall);
inFootnote = false;
}
private Integer getPageNumber(StyleWithProperties style, Integer newPageNumber) {
if (style != null) {
// If style:paragraph-properties extists and contain
// style:page-number
String newPageNumberProperty = style.getParProperty(STYLE_PAGE_NUMBER, true);
if (newPageNumberProperty != null) {
// Truncate auto and other string values
newPageNumberProperty = newPageNumberProperty.replaceAll("[^0-9]", "");
if (!newPageNumberProperty.isEmpty()) {
// Save new page number
newPageNumber = Integer.parseInt(newPageNumberProperty);
}
}
}
return newPageNumber;
}
private Node startDocument(Node hnode, StyleWithProperties style, Integer newPageNumber) {
setFirstMasterPage(style);
if (newPageNumber != null) {
pageNum = newPageNumber;
} else {
}
//Start tagging
String sTitle = converter.getTitle();
hnode = docSep.startDocument(hnode, sTitle,pageNum);
//Print header
addHeader(hnode);
//hnode = enterPageContainer(hnode);
return hnode;
}
private void setFirstMasterPage(StyleWithProperties style) {
updateMasterPageWith(style);
if (currentMasterPage == null) {
currentMasterPage = "Standard";
}
setPageContainerStyle();
}
private void setPageContainerStyle() {
MasterPage mp = ofr.getFullMasterPage(currentMasterPage);
PageLayout layout = ofr.getPageLayout(mp.getPageLayoutName());
String containerStyle = "column-count: " + layout.getColCount() + ";";
pageContainer.setRootStyle(containerStyle);
}
private void fitPageNumberToMasterPageStyle() {
// TODO: READ master-page style
MasterPage masterPage = ofr.getFullMasterPage(currentMasterPage);
if (masterPage != null) {
String pageLayoutName = masterPage.getPageLayoutName();
if (pageLayoutName != null) {
PageLayout pageLayout = ofr.getPageLayout(pageLayoutName);
if (pageLayout != null) {
String pageUsage = pageLayout.getPageUsage();
if (pageUsage != null) {
int parity = pageNum % 2;
if (parity == 1 && pageUsage.equals("left")){
pageNum++;
}
if (parity == 0 && pageUsage.equals("right")){
pageNum++;
}
} else {
}
} else {
}
} else {
}
} else {
}
}
private boolean hasMasterPage(StyleWithProperties style) {
// Page break was found before
if (style != null) {
String sMasterPage = style.getMasterPageName();
if (sMasterPage != null && sMasterPage.length() > 0) {
return true;
}
}
return false;
}
private void updateMasterPageWith(StyleWithProperties style) {
if (!hasMasterPage(style) && nextMasterPage == null) {
return;
}
if (hasMasterPage(style)) {
String sMasterPage = style.getMasterPageName();
currentMasterPage = sMasterPage;
} else {
currentMasterPage = nextMasterPage;
}
MasterPage masterPage = ofr.getFullMasterPage(currentMasterPage);
nextMasterPage = masterPage.getProperty(STYLE_NEXT_STYLE_NAME);
}
private boolean hasBreakBefore(StyleWithProperties style) {
if (style != null && "page".equals(style.getProperty(FO_BREAK_BEFORE))) {
return true;
}
return false;
}
private boolean checkHardBreakAfter(StyleWithProperties style) {
if (style != null && "page".equals(style.getProperty(FO_BREAK_AFTER))) {
return true;
}
return false;
}
private Node addHeader(Node node) {
if (!pagination) {
return node;
}
Node headerNode = null;
inHeader = true;
MasterPage masterPage = ofr.getFullMasterPage(currentMasterPage);
if (currentMasterPage != null) {
String pageLayoutName = masterPage.getPageLayoutName();
PageLayout pageLayout = ofr.getPageLayout(pageLayoutName);
String marginBottom = pageLayout.getFooterProperty(FO_MARGIN_BOTTOM);
if (pageNum % 2 == 0) {
headerNode = masterPage.getHeaderLeft();
}
if (headerNode == null) {
headerNode = masterPage.getHeader();
}
if (headerNode != null) {
//Create header element
Element headerElement = converter.createElement("header");
if (marginBottom != null) {
headerElement.setAttribute("style", "margin-bottom:"+getPageSc().scale(marginBottom)+";");
}
Node pageNode = node.getParentNode();
pageNode.insertBefore(headerElement, node);
traverseBlockText(headerNode, headerElement);
}
} else {
System.out.println("ERROR MP is null");
}
inHeader = false;
return node;
}
private Node addFooter(Node node) {
if (!pagination) {
return node;
}
Node footerNode = null;
inFooter = true;
MasterPage masterPage = ofr.getFullMasterPage(currentMasterPage);
if (currentMasterPage != null) {
String pageLayoutName = masterPage.getPageLayoutName();
PageLayout pageLayout = ofr.getPageLayout(pageLayoutName);
String marginTop = pageLayout.getFooterProperty(FO_MARGIN_TOP);
if (pageNum % 2 == 0) {
footerNode = masterPage.getFooterLeft();
}
if (footerNode == null) {
footerNode = masterPage.getFooter();
}
if (footerNode != null) {
//Create footer element
Element footerElement = converter.createElement("footer");
if (marginTop != null) {
footerElement.setAttribute("style", "margin-top:"+getPageSc().scale(marginTop)+";");
}
Node pageNode = node.getParentNode();
pageNode.appendChild(footerElement);
traverseBlockText(footerNode, footerElement);
}
} else {
System.out.println("ERROR MP is null");
}
inFooter = false;
return node;
}
private boolean hasOutlineLevel(Node node) {
if (Misc.isElement(node)
&& Misc.getAttribute(node, TEXT_OUTLINE_LEVEL) != null
&& !Misc.getAttribute(node, TEXT_OUTLINE_LEVEL).isEmpty()) {
String title = docSep.getTitle(node).trim();
if (title == null || title.isEmpty()) {
return false;
}
return true;
}
return false;
}
}