/src/de/uni_koblenz/jgralab/utilities/gui/xdot/XDotLexer.java

http://github.com/jgralab/jgralab · Java · 256 lines · 197 code · 14 blank · 45 comment · 71 complexity · dedea67ad9431475db4ac6bc8376eab8 MD5 · raw file

  1. /*
  2. * JGraLab - The Java Graph Laboratory
  3. *
  4. * Copyright (C) 2006-2014 Institute for Software Technology
  5. * University of Koblenz-Landau, Germany
  6. * ist@uni-koblenz.de
  7. *
  8. * For bug reports, documentation and further information, visit
  9. *
  10. * https://github.com/jgralab/jgralab
  11. *
  12. * This program is free software; you can redistribute it and/or modify it
  13. * under the terms of the GNU General Public License as published by the
  14. * Free Software Foundation; either version 3 of the License, or (at your
  15. * option) any later version.
  16. *
  17. * This program is distributed in the hope that it will be useful, but
  18. * WITHOUT ANY WARRANTY; without even the implied warranty of
  19. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
  20. * Public License for more details.
  21. *
  22. * You should have received a copy of the GNU General Public License along
  23. * with this program; if not, see <http://www.gnu.org/licenses>.
  24. *
  25. * Additional permission under GNU GPL version 3 section 7
  26. *
  27. * If you modify this Program, or any covered work, by linking or combining
  28. * it with Eclipse (or a modified version of that program or an Eclipse
  29. * plugin), containing parts covered by the terms of the Eclipse Public
  30. * License (EPL), the licensors of this Program grant you additional
  31. * permission to convey the resulting work. Corresponding Source for a
  32. * non-source form of such a combination shall include the source code for
  33. * the parts of JGraLab used as well as that of the covered work.
  34. */
  35. package de.uni_koblenz.jgralab.utilities.gui.xdot;
  36. import java.io.BufferedReader;
  37. import java.io.IOException;
  38. import java.io.InputStream;
  39. import java.io.InputStreamReader;
  40. /**
  41. * @author ist@uni-koblenz.de
  42. */
  43. public class XDotLexer {
  44. private int line;
  45. private int col;
  46. private int la;
  47. private int putBackChar;
  48. private BufferedReader in;
  49. public enum Type {
  50. TEXT, SEPARATOR, STRING, EOF
  51. }
  52. public static final class Token {
  53. public Type type;
  54. public String text;
  55. private Token(Type t, String s) {
  56. type = t;
  57. text = s;
  58. }
  59. }
  60. public XDotLexer(InputStream is) throws IOException {
  61. in = new BufferedReader(new InputStreamReader(is, "UTF-8"));
  62. putBackChar = -1;
  63. line = 1;
  64. col = 0;
  65. la = read();
  66. }
  67. public final int getLine() {
  68. return line;
  69. }
  70. public final Token nextToken() throws IOException {
  71. skipWs();
  72. Type type = null;
  73. StringBuilder out = new StringBuilder();
  74. if (la < 0) {
  75. type = Type.EOF;
  76. } else if (la == '"') {
  77. readQuotedString(out);
  78. type = Type.STRING;
  79. } else if (la == '<') {
  80. readHtmlString(out);
  81. type = Type.STRING;
  82. } else if (isSeparator(la)) {
  83. out.append((char) la);
  84. type = Type.SEPARATOR;
  85. la = read();
  86. } else {
  87. if (la >= 0) {
  88. do {
  89. out.append((char) la);
  90. la = read();
  91. } while (!isWs(la) && !isSeparator(la) && (la >= 0));
  92. }
  93. type = Type.TEXT;
  94. }
  95. Token t = new Token(type, out.toString());
  96. // if (t.text.equals("{") || t.text.equalsIgnoreCase("}")
  97. // || t.text.equals(";")) {
  98. // System.out.println("'" + t.text + "'");
  99. // } else {
  100. // System.out.print("'" + t.text + "' ");
  101. // }
  102. return t;
  103. }
  104. private final int read() throws IOException {
  105. int ch;
  106. if (putBackChar >= 0) {
  107. ch = putBackChar;
  108. putBackChar = -1;
  109. } else {
  110. ch = in.read();
  111. }
  112. if (ch == '\n') {
  113. ++line;
  114. col = 0;
  115. return ch;
  116. }
  117. // check for (possible repeated) escaped line ends
  118. while (ch == '\\') {
  119. ch = in.read();
  120. if (ch == '\r') {
  121. // check for windows line end (CR-LF)
  122. ch = in.read();
  123. if (ch == '\n') {
  124. ++line;
  125. ch = in.read();
  126. } else if (ch != -1) {
  127. throw new IOException(
  128. "Expected line end CR/LF but found CR/ASCII " + ch);
  129. }
  130. } else if (ch == '\n') {
  131. // unix line end
  132. ++line;
  133. ch = in.read();
  134. } else {
  135. putBackChar = ch;
  136. ch = '\\';
  137. return ch;
  138. }
  139. }
  140. ++col;
  141. return ch;
  142. }
  143. private final void readQuotedString(StringBuilder out) throws IOException {
  144. int startLine = line;
  145. la = read();
  146. LOOP: while ((la >= 0) && (la != '"')) {
  147. if (la == '\\') {
  148. la = read();
  149. if (la < 0) {
  150. break LOOP;
  151. }
  152. if (la != '"') {
  153. out.append("\\");
  154. }
  155. }
  156. out.append((char) la);
  157. la = read();
  158. }
  159. if (la < 0) {
  160. throw new IOException(
  161. "Unterminated quoted string starting in line " + startLine);
  162. }
  163. la = read();
  164. }
  165. private final void readHtmlString(StringBuilder out) throws IOException {
  166. int startLine = line;
  167. la = read();
  168. while ((la >= 0) && (la != '>')) {
  169. out.append((char) la);
  170. la = read();
  171. }
  172. if (la < 0) {
  173. throw new IOException("Unterminated HTML string starting in line "
  174. + startLine);
  175. }
  176. la = read();
  177. }
  178. private final static boolean isWs(int c) {
  179. return (c == ' ') || (c == '\n') || (c == '\t') || (c == '\r');
  180. }
  181. private final static boolean isSeparator(int c) {
  182. return (c == ';') || (c == '{') || (c == '}') || (c == '[')
  183. || (c == ']') || (c == '=') || (c == ',');
  184. }
  185. private final void skipWs() throws IOException {
  186. // skip whitespace and consecutive single line comments
  187. do {
  188. // skip whitespace
  189. while (isWs(la)) {
  190. la = read();
  191. }
  192. // skip comments
  193. while (la == '/' || (la == '#' && col == 1)) {
  194. if (la == '#' && col == 1) {
  195. // single line CPP comment, skip to the end of the current
  196. // line
  197. while ((la >= 0) && (la != '\n')) {
  198. la = read();
  199. }
  200. } else {
  201. la = read();
  202. if ((la >= 0) && (la == '/')) {
  203. // single line comment, skip to the end of the current
  204. // line
  205. while ((la >= 0) && (la != '\n')) {
  206. la = read();
  207. }
  208. } else if ((la >= 0) && (la == '*')) {
  209. // multi line comment
  210. int startLine = line;
  211. do {
  212. while ((la >= 0) && (la != '*')) {
  213. la = read();
  214. }
  215. if (la >= 0) {
  216. la = read();
  217. }
  218. } while (la >= 0 && la != '/');
  219. if (la < 0) {
  220. throw new IOException(
  221. "Unterminated multi line comment starting in line "
  222. + startLine);
  223. }
  224. la = read();
  225. } else {
  226. putback(la);
  227. la = '/';
  228. return;
  229. }
  230. }
  231. }
  232. } while (isWs(la));
  233. }
  234. private final void putback(int ch) {
  235. putBackChar = ch;
  236. if (ch == '\n') {
  237. --line;
  238. }
  239. }
  240. }