/************************************************************************ * * UnicodeStringParser.java * * Copyright: 2002-2007 by Henrik Just * * This file is part of Writer2LaTeX. * * Writer2LaTeX is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * Writer2LaTeX is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with Writer2LaTeX. If not, see . * * Version 0.5 (2007-07-24) * */ package writer2latex.latex.i18n; // Helper class: Parse a unicode string. // Note: Some 8-bit fonts have additional "spacer" characters that are used // for manual placement of accents. These are ignored between the base character // and the combining character, thus we are parsing according to the rule // * ? class UnicodeStringParser { private UnicodeTable table; // the table to use private String s; // the string private int i; // the current index private int nEnd; // the maximal index private char c; // the current character private char cc; // the current combining character protected void reset(UnicodeTable table, String s, int i, int nEnd) { this.table=table; this.s=s; this.i=i; this.nEnd=nEnd; } protected boolean next() { if (i>=nEnd) { return false; } // Pick up base character c = s.charAt(i++); if (table.getCharType(c)==UnicodeCharacter.COMBINING) { // Lonely combining character - combine with space cc = c; c = ' '; return true; } // Skip characters that should be ignored while (i