Fixed title extraction method

This commit is contained in:
Georgy Litvinov 2020-02-19 18:31:44 +01:00
parent 3226257348
commit b006fc0471

View file

@ -47,6 +47,7 @@ public class Separator {
alignSplitToPages = config.getAlignSplitsToPages(); alignSplitToPages = config.getAlignSplitsToPages();
breakStyle = config.getPageBreakStyle(); breakStyle = config.getPageBreakStyle();
pageContainer = converter.pageContainer; pageContainer = converter.pageContainer;
rdfSeparation = converter.isRDF;
headingPath = new int[10]; headingPath = new int[10];
} }
@ -55,10 +56,10 @@ public class Separator {
// Get outline level // Get outline level
String sLevel = getAttribute(currentNode, XMLString.TEXT_OUTLINE_LEVEL); String sLevel = getAttribute(currentNode, XMLString.TEXT_OUTLINE_LEVEL);
// System.out.println(sLevel); // System.out.println(sLevel);
String title = getTitle(currentNode).trim();
if (sLevel == null || sLevel.isEmpty()) { if (sLevel == null || sLevel.isEmpty()) {
return hnode; return hnode;
} }
String title = getTitle(currentNode).trim();
if (title == null || title.isEmpty()) { if (title == null || title.isEmpty()) {
return hnode; return hnode;
} }
@ -273,30 +274,36 @@ public class Separator {
public static String getTitle(Node currentNode) { public static String getTitle(Node currentNode) {
Node content = currentNode.cloneNode(true); Node content = currentNode.cloneNode(true);
NodeList contentNodes = content.getChildNodes();
String title = null; String title = null;
NodeList lineBreaks = ((Element) content).getElementsByTagName(XMLString.TEXT_LINE_BREAK);
NodeList textTabs = ((Element) content).getElementsByTagName(XMLString.TEXT_TAB);
int i = 0; replaceWithSpaces(lineBreaks);
while (i < contentNodes.getLength()) { replaceWithSpaces(textTabs);
Node child = contentNodes.item(i); deleteNotesIn(content);
if (isElement(child)) { title = content.getTextContent();
if (child.getNodeName().equals(XMLString.TEXT_TAB) || child.getNodeName().equals(XMLString.TEXT_LINE_BREAK)) { return title;
Document doc = child.getOwnerDocument(); }
Node testSpace = doc.createTextNode(" ");
content.insertBefore(testSpace, child); private static void deleteNotesIn(Node content) {
content.removeChild(child);
}
}
i++;
}
NodeList notes = ((Element) content).getElementsByTagName(XMLString.TEXT_NOTE); NodeList notes = ((Element) content).getElementsByTagName(XMLString.TEXT_NOTE);
int j = 0; int j = 0;
while (j < notes.getLength()) { while (j < notes.getLength()) {
Node note = notes.item(j); Node note = notes.item(j);
note.getParentNode().removeChild(note); note.getParentNode().removeChild(note);
} }
title = content.getTextContent(); }
return title;
private static void replaceWithSpaces(NodeList contentNodes) {
int i = 0;
while (i < contentNodes.getLength()) {
Node node = contentNodes.item(i);
Document doc = node.getOwnerDocument();
Node testSpace = doc.createTextNode(" ");
node.getParentNode().insertBefore(testSpace, node);
node.getParentNode().removeChild(node);
i++;
}
} }
private static void openCommentHeading(Node hnode, String title) { private static void openCommentHeading(Node hnode, String title) {