Java tutorial
/* Copyright (C) 2003-2011 JabRef contributors. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. */ package net.sf.jabref.logic.layout.format; import net.sf.jabref.Globals; import net.sf.jabref.logic.layout.LayoutFormatter; import net.sf.jabref.logic.layout.StringInt; import net.sf.jabref.logic.util.strings.RtfCharMap; import org.apache.commons.logging.Log; import org.apache.commons.logging.LogFactory; /** * Transform a LaTeX-String to RTF. * * This method will: * * 1.) Remove LaTeX-Command sequences. * * 2.) Replace LaTeX-Special chars with RTF aquivalents. * * 3.) Replace emph and textit and textbf with their RTF replacements. * * 4.) Take special care to save all unicode characters correctly. * * 5.) Replace --- by \emdash and -- by \endash. */ public class RTFChars implements LayoutFormatter { private static final Log LOGGER = LogFactory.getLog(LayoutFormatter.class); private static final RtfCharMap RTF_CHARS = new RtfCharMap(); @Override public String format(String field) { StringBuilder sb = new StringBuilder(""); StringBuilder currentCommand = null; boolean escaped = false; boolean incommand = false; for (int i = 0; i < field.length(); i++) { char c = field.charAt(i); if (escaped && (c == '\\')) { sb.append('\\'); escaped = false; } else if (c == '\\') { escaped = true; incommand = true; currentCommand = new StringBuilder(); } else if (!incommand && ((c == '{') || (c == '}'))) { // Swallow the brace. } else if (Character.isLetter(c) || Globals.SPECIAL_COMMAND_CHARS.contains(String.valueOf(c))) { escaped = false; if (incommand) { // Else we are in a command, and should not keep the letter. currentCommand.append(c); testCharCom: if ((currentCommand.length() == 1) && Globals.SPECIAL_COMMAND_CHARS.contains(currentCommand.toString())) { // This indicates that we are in a command of the type // \^o or \~{n} if (i >= (field.length() - 1)) { break testCharCom; } String command = currentCommand.toString(); i++; c = field.charAt(i); String combody; if (c == '{') { StringInt part = getPart(field, i, true); i += part.i; combody = part.s; } else { combody = field.substring(i, i + 1); } String result = RTF_CHARS.get(command + combody); if (result != null) { sb.append(result); } incommand = false; escaped = false; } } else { sb.append(c); } } else { testContent: if (!incommand || (!Character.isWhitespace(c) && (c != '{') && (c != '}'))) { sb.append(c); } else { assert incommand; // First test for braces that may be part of a LaTeX command: if ((c == '{') && (currentCommand.length() == 0)) { // We have seen something like \{, which is probably the start // of a command like \{aa}. Swallow the brace. continue; } else if ((c == '}') && (currentCommand.length() > 0)) { // Seems to be the end of a command like \{aa}. Look it up: String command = currentCommand.toString(); String result = RTF_CHARS.get(command); if (result != null) { sb.append(result); } incommand = false; escaped = false; continue; } // Then look for italics etc., // but first check if we are already at the end of the string. if (i >= field.length() - 1) { break testContent; } if (((c == '{') || (c == ' ')) && (currentCommand.length() > 0)) { String command = currentCommand.toString(); // Then test if we are dealing with a italics or bold // command. If so, handle. if ("em".equals(command) || "emph".equals(command) || "textit".equals(command) || "it".equals(command)) { StringInt part = getPart(field, i, c == '{'); i += part.i; sb.append("{\\i ").append(part.s).append('}'); } else if ("textbf".equals(command) || "bf".equals(command)) { StringInt part = getPart(field, i, c == '{'); i += part.i; sb.append("{\\b ").append(part.s).append('}'); } else { LOGGER.info("Unknown command " + command); } if (c == ' ') { // command was separated with the content by ' ' // We have to add the space a } } else { sb.append(c); } } incommand = false; escaped = false; } } char[] chars = sb.toString().toCharArray(); sb = new StringBuilder(); for (char c : chars) { if (c < 128) { sb.append(c); } else { sb.append("\\u").append((long) c).append('?'); } } return sb.toString().replace("---", "{\\emdash}").replace("--", "{\\endash}").replace("``", "{\\ldblquote}") .replace("''", "{\\rdblquote}"); } /** * @param text the text to extract the part from * @param i the position to start * @param commandNestedInBraces true if the command is nested in braces (\emph{xy}), false if spaces are sued (\emph xy) * @return a tuple of number of added characters and the extracted part */ private StringInt getPart(String text, int i, boolean commandNestedInBraces) { char c; int count = 0; int icount = i; StringBuilder part = new StringBuilder(); loop: while ((count >= 0) && (icount < text.length())) { icount++; c = text.charAt(icount); switch (c) { case '}': count--; break; case '{': count++; break; case ' ': if (!commandNestedInBraces) { // in any case, a space terminates the loop break loop; } break; default: break; } part.append(c); } String res = part.toString(); // the wrong "}" at the end is removed by "format(res)" return new StringInt(format(res), part.length()); } }