--- a/src/c2html.c	Fri Aug 30 11:23:44 2013 +0200
+++ b/src/c2html.c	Thu Jan 23 09:19:37 2014 +0100
@@ -1,7 +1,7 @@
 /*
  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
  *
- * Copyright 2013 Mike Becker. All rights reserved.
+ * Copyright 2014 Mike Becker. All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions are met:
@@ -34,56 +34,10 @@
 #include <unistd.h>
 #include <ctype.h>
 
-#define INPUTBUF_SIZE 2048
-#define WORDBUF_SIZE 64
-
-const char* ckeywords[] = {
-    "auto", "break", "case", "char", "const", "continue", "default", "do",
-    "double", "else", "enum", "extern", "float", "for", "goto", "if", "int",
-    "long", "register", "return", "short", "signed", "sizeof", "static",
-    "struct", "switch", "typedef", "union", "unsigned", "void", "volatile",
-    "while", NULL
-};
-
-const char* jkeywords[] = {
-    "abstract", "continue", "for", "new", "switch", "assert", "default", "goto",
-    "package", "synchronized", "boolean", "do", "if", "private", "this",
-    "break", "double", "implements", "protected", "throw", "byte", "else",
-    "import", "public", "throws", "case", "enum", "instanceof", "return",
-    "transient", "catch", "extends", "int", "short", "try", "char", "final",
-    "interface", "static", "void", "class", "finally", "long", "strictfp",
-    "volatile", "const", "float", "native", "super", "while", NULL
-};
-
-#define iswordcharacter(c) (isalnum(c) || c=='_' || c=='#' || c=='@')
+#include "javacodegen.h"
+#include "ccodegen.h"
 
-int isctype(char *word, size_t len) {
-    return (word[len-2] == '_' && word[len-1] == 't');
-}
-
-int iscdirective(char *word) {
-    return (word[0] == '#');
-}
-
-int isjtype(char *word, size_t len) {
-    return isupper(word[0]);
-}
-
-int isjdirective(char *word) {
-    return word[0] == '@';
-}
-
-typedef struct _highlighter_t highlighter_t;
-
-struct _highlighter_t {
-    const char** keywords;
-    int(*istype)(char*,size_t);
-    int(*isdirective)(char*);
-    void(*parser)(char*,char*,highlighter_t*);
-    int iscommentml;
-    char word[WORDBUF_SIZE];
-    char includefile[FILENAME_MAX];
-};
+#define INPUTBUF_SIZE 2048
 
 typedef struct {
     char* outfilename;
@@ -169,190 +123,6 @@
     return inputfile;
 }
 
-size_t writeescapedchar(char *dest, size_t dp, char c) {
-    if (c == '>') {
-        dest[dp++] = '&'; dest[dp++] = 'g'; dest[dp++] = 't'; dest[dp++] = ';';
-    } else if (c == '<') {
-        dest[dp++] = '&'; dest[dp++] = 'l'; dest[dp++] = 't'; dest[dp++] = ';';
-    } else {
-        dest[dp++] = c;
-    }
-
-    return dp;
-}
-
-int iskeyword(char *word, const char** keywords) {
-    for (int i = 0 ; keywords[i] ; i++) {
-        if (strncmp(keywords[i], word, WORDBUF_SIZE) == 0) {
-            return 1;
-        }
-    }
-    return 0;
-}
-
-int iscapsonly(char *word, size_t wp) {
-    for (size_t i = 0 ; i < wp ; i++) {
-        if (!isupper(word[i]) && word[i] != '_') {
-            return 0;
-        }
-    }
-    return 1;
-}
-
-void parseline(char *src, char *dest, highlighter_t *hltr) {
-    hltr->parser(src, dest, hltr);
-}
-
-void cjparseline(char *src, char *dest, highlighter_t *hltr) {
-    size_t sp = 0, dp = 0;
-    /* indent */
-    while (isspace(src[sp])) {
-        dest[dp++] = src[sp++];
-    }
-
-    memset(hltr->word, 0, WORDBUF_SIZE);
-    size_t wp = 0, ifp = 0;
-    int isstring = 0, iscomment = 0, isinclude = 0, parseinclude = 0;
-    int isescaping = 0;
-
-    if (hltr->iscommentml) {
-        iscomment = 1;
-        memcpy(&(dest[dp]), "<span class=\"c2html-comment\">", 29);
-        dp += 29;
-    }
-
-    for (char c = src[sp] ; c ; c=src[++sp]) {
-        /* comments */
-        if (c == '/') {
-            if (hltr->iscommentml && sp > 0 && src[sp-1] == '*') {
-                iscomment = 0;
-                hltr->iscommentml = 0;
-                memcpy(&(dest[dp]), "/</span>", 8);
-                dp += 8;
-                continue;
-            } else if (!iscomment && (src[sp+1] == '/' || src[sp+1] == '*')) {
-                iscomment = 1;
-                hltr->iscommentml = (src[sp+1] == '*');
-                memcpy(&(dest[dp]), "<span class=\"c2html-comment\">", 29);
-                dp += 29;
-            }
-        }
-
-        if (iscomment) {
-            if (c == '\n') {
-                memcpy(&(dest[dp]), "</span>", 7);
-                dp += 7;
-            }
-            dp = writeescapedchar(dest, dp, c);
-        } else if (isinclude) {
-            if (c == '<') {
-                memcpy(&(dest[dp]), "<span class=\"c2html-stdinclude\">", 32);
-                dp += 32;
-                dp = writeescapedchar(dest, dp, c);
-            } else if (c == '\"') {
-                if (parseinclude) {
-                    dest[dp++] = '\"';
-                    dest[dp++] = '>';
-                    memcpy(&(dest[dp]), hltr->includefile, ifp);
-                    dp += ifp;
-
-                    dp = writeescapedchar(dest, dp, c);
-                    memcpy(&(dest[dp]), "</a>", 4);
-                    dp += 4;
-                    parseinclude = 0;
-                } else {
-                    memcpy(&(dest[dp]),
-                        "<a class=\"c2html-userinclude\" href=", 35);
-                    dp += 35;
-                    dp = writeescapedchar(dest, dp, c);
-                    ifp = 0;
-                    hltr->includefile[ifp++] = '\"';
-                    parseinclude = 1;
-                }
-            } else if (c == '>') {
-                dp = writeescapedchar(dest, dp, c);
-                memcpy(&(dest[dp]), "</span>", 7);
-                dp += 7;
-            } else {
-                if (parseinclude) {
-                    hltr->includefile[ifp++] = c;
-                }
-                dp = writeescapedchar(dest, dp, c);
-            }
-        } else {
-            /* strings */
-            if (!isescaping && (c == '\'' || c == '\"')) {
-                isstring ^= 1;
-                if (isstring) {
-                    memcpy(&(dest[dp]), "<span class=\"c2html-string\">", 28);
-                    dp += 28;
-                    dp = writeescapedchar(dest, dp, c);
-                } else {
-                    dp = writeescapedchar(dest, dp, c);
-                    memcpy(&(dest[dp]), "</span>", 7);
-                    dp += 7;
-                }
-            } else {
-                if (isstring) {
-                    dp = writeescapedchar(dest, dp, c);
-                } else if (!iswordcharacter(c)) {
-                    /* interpret word int_t */
-                    if (wp > 0 && wp < WORDBUF_SIZE) {
-                        int closespan = 1;
-                        if (iskeyword(hltr->word, hltr->keywords)) {
-                            memcpy(&(dest[dp]),
-                                "<span class=\"c2html-keyword\">", 29);
-                            dp += 29;
-                        } else if (hltr->istype(hltr->word, wp)) {
-                            memcpy(&(dest[dp]),
-                                "<span class=\"c2html-type\">", 26);
-                            dp += 26;
-                        } else if (hltr->isdirective(hltr->word)) {
-                            isinclude = !strncmp(
-                                "#include", hltr->word, WORDBUF_SIZE);
-                            memcpy(&(dest[dp]),
-                                "<span class=\"c2html-directive\">", 31);
-                            dp += 31;
-                        } else if (iscapsonly(hltr->word, wp)) {
-                            memcpy(&(dest[dp]),
-                                "<span class=\"c2html-macroconst\">", 32);
-                            dp += 32;
-                        } else {
-                            closespan = 0;
-                        }
-                        for (int i = 0 ; i < wp ; i++) {
-                            dp = writeescapedchar(dest, dp, hltr->word[i]);
-                        }
-                        if (closespan) {
-                            memcpy(&(dest[dp]), "</span>", 7);
-                            dp += 7;
-                        }
-                    }
-                    memset(hltr->word, 0, WORDBUF_SIZE);
-                    wp = 0;
-                    dp = writeescapedchar(dest, dp, c);
-                } else {
-                    /* read word */
-                    if (wp < WORDBUF_SIZE) {
-                        hltr->word[wp++] = c;
-                    } else if (wp == WORDBUF_SIZE) {
-                        for (int i = 0 ; i < WORDBUF_SIZE ; i++) {
-                            dp = writeescapedchar(dest, dp, hltr->word[i]);
-                        }
-                        wp++;
-                        dp = writeescapedchar(dest, dp, c);
-                    } else {
-                        dp = writeescapedchar(dest, dp, c);
-                    }
-                }
-            }
-
-            isescaping = !isescaping & (c == '\\');
-        }
-    }
-    dest[dp] = 0;
-}
-
 void printhelp() {
     printf("Formats source code using HTML.\n\nUsage:\n"
         "  c2html [Options] FILE\n\n"
@@ -382,7 +152,7 @@
     highlighter.isdirective = iscdirective;
     highlighter.istype = isctype;
     highlighter.keywords = ckeywords;
-    highlighter.parser = cjparseline;
+    highlighter.parser = cparseline;
 
     char optc;
     while ((optc = getopt(argc, argv, "hjo:p")) != -1) {
@@ -396,6 +166,7 @@
                 highlighter.isdirective = isjdirective;
                 highlighter.istype = isjtype;
                 highlighter.keywords = jkeywords;
+                highlighter.parser = jparseline;
                 break;
             case 'p':
                 settings.highlight = 0;
@@ -432,7 +203,7 @@
             int lnw = lnint(inputfile->count);
             for (int i = 0 ; i < inputfile->count ; i++) {
                 if (settings.highlight) {
-                    parseline(inputfile->lines[i], line, &highlighter);
+                    highlighter.parser(inputfile->lines[i], line, &highlighter);
                 } else {
                     line = inputfile->lines[i];
                 }