src/c2html.c

Wed, 10 Jul 2013 14:38:56 +0200

author
Mike Becker <universe@uap-core.de>
date
Wed, 10 Jul 2013 14:38:56 +0200
changeset 15
398a7589297f
parent 14
b33629bf4b58
child 16
fa0bcd0444eb
permissions
-rw-r--r--

double free fix

     1 /*
     2  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
     3  *
     4  * Copyright 2013 Mike Becker. All rights reserved.
     5  *
     6  * Redistribution and use in source and binary forms, with or without
     7  * modification, are permitted provided that the following conditions are met:
     8  *
     9  *   1. Redistributions of source code must retain the above copyright
    10  *      notice, this list of conditions and the following disclaimer.
    11  *
    12  *   2. Redistributions in binary form must reproduce the above copyright
    13  *      notice, this list of conditions and the following disclaimer in the
    14  *      documentation and/or other materials provided with the distribution.
    15  *
    16  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
    17  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
    18  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
    19  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
    20  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
    21  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
    22  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
    23  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
    24  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
    25  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
    26  * POSSIBILITY OF SUCH DAMAGE.
    27  *
    28  */
    30 #include <stdio.h>
    31 #include <stdlib.h>
    32 #include <string.h>
    33 #include <fcntl.h>
    34 #include <unistd.h>
    35 #include <ctype.h>
    37 #define INPUTBUF_SIZE 2048
    38 #define WORDBUF_SIZE 16
    40 #define istype(word, len) (word[len-2] == '_' && word[len-1] == 't')
    41 #define isdirective(word) (word[0] == '#')
    43 const char* keywords[] = {
    44   "auto", "break", "case", "char", "const", "continue", "default", "do", 
    45   "double", "else", "enum", "extern", "float", "for", "goto", "if", "int", 
    46   "long", "register", "return", "short", "signed", "sizeof", "static", "struct", 
    47   "switch", "typedef", "union", "unsigned", "void", "volatile", "while", NULL
    48 };
    50 typedef struct {
    51   char* outfilename;
    52   char* infilename;
    53   int highlight;
    54 } settings_t;
    56 typedef struct {
    57   size_t count;
    58   size_t capacity;
    59   size_t maxlinewidth;
    60   char** lines;
    61 } inputfile_t;
    63 inputfile_t *inputfilebuffer(size_t capacity) {
    64   inputfile_t *inputfile = (inputfile_t*) malloc(sizeof(inputfile_t));
    65   inputfile->lines = (char**) malloc(capacity * sizeof(char*));
    66   inputfile->capacity = capacity;
    67   inputfile->count = 0;
    68   inputfile->maxlinewidth = 0;
    70   return inputfile;
    71 }
    73 void addline(inputfile_t *inputfile, char* line, size_t width) {
    74   char *l = (char*) malloc(width+1);
    75   memcpy(l, line, width);
    76   l[width] = 0;
    77   if (inputfile->count >= inputfile->capacity) {
    78     inputfile->capacity <<= 1;
    79     inputfile->lines = realloc(inputfile->lines, inputfile->capacity);
    80   }
    81   inputfile->lines[inputfile->count] = l;
    82   inputfile->maxlinewidth =
    83           width > inputfile->maxlinewidth ? width : inputfile->maxlinewidth;
    84   inputfile->count++;
    85 }
    87 void freeinputfilebuffer(inputfile_t *inputfile) {
    88   for (int i = 0 ; i < inputfile->count ; i++) {
    89     free(inputfile->lines[i]);
    90   }
    91   free(inputfile->lines);
    92   free(inputfile);
    93 }
    95 inputfile_t *readinput(char *filename) {
    97   int fd = open(filename, O_RDONLY);
    98   if (fd == -1) return NULL;
   100   inputfile_t *inputfile = inputfilebuffer(512);
   102   char buf[INPUTBUF_SIZE];
   103   ssize_t r;
   105   size_t maxlinewidth = 256;
   106   char *line = (char*) malloc(maxlinewidth);
   107   size_t col = 0;
   109   while ((r = read(fd, buf, INPUTBUF_SIZE)) > 0) {
   110     for (size_t i = 0 ; i < r ; i++) {
   111       if (col >= maxlinewidth-4) {
   112         maxlinewidth <<= 1;
   113         line = realloc(line, maxlinewidth);
   114       }
   116       if (buf[i] == '\n') {
   117         line[col++] = '\n';
   118         line[col] = 0;
   119         addline(inputfile, line, col);        
   120         col = 0;
   121       } else {
   122         line[col++] = buf[i];
   123       }
   124     }
   125   }
   127   free(line);
   129   close(fd);
   131   return inputfile;
   132 }
   134 size_t writeescapedchar(char *dest, size_t dp, char c) {
   135   if (c == '>') {
   136     dest[dp++] = '&'; dest[dp++] = 'g';
   137     dest[dp++] = 't'; dest[dp++] = ';';
   138   } else if (c == '<') {
   139     dest[dp++] = '&'; dest[dp++] = 'l';
   140     dest[dp++] = 't'; dest[dp++] = ';';
   141   } else {
   142     dest[dp++] = c;
   143   }
   145   return dp;
   146 }
   148 int iskeyword(char *word) {
   149   for (int i = 0 ; keywords[i] ; i++) {
   150     if (strncmp(keywords[i], word, WORDBUF_SIZE) == 0) {
   151       return 1;
   152     }
   153   }
   154   return 0;
   155 }
   157 int iscapsonly(char *word, size_t wp) {
   158   for (size_t i = 0 ; i < wp ; i++) {
   159     if (!isupper(word[i]) && word[i] != '_') {
   160       return 0;
   161     }
   162   }
   163   return 1;
   164 }
   166 void parseline(char *src, char *dest) {
   167   size_t sp = 0, dp = 0;
   168   /* indent */
   169   while (isspace(src[sp])) {
   170     dest[dp++] = src[sp++];
   171   }
   173   static char word[WORDBUF_SIZE];
   174   static char includefile[FILENAME_MAX];
   176   memset(word, 0, WORDBUF_SIZE);
   177   size_t wp = 0, ifp = 0;
   178   int isstring = 0, iscomment = 0, isinclude = 0, parseinclude = 0;
   179   static int iscommentml;
   180   int isescaping = 0;
   182   if (iscommentml) {
   183     iscomment = 1;
   184     memcpy(&(dest[dp]), "<span class=\"c2html-comment\">", 29);
   185     dp += 29;
   186   }
   188   for (char c = src[sp] ; c ; c=src[++sp]) {
   189     /* comments */
   190     if (c == '/') {
   191       if (iscommentml && sp > 0 && src[sp-1] == '*') {
   192         iscomment = 0;
   193         iscommentml = 0;
   194         memcpy(&(dest[dp]), "/</span>", 8);
   195         dp += 8;
   196         continue;
   197       } else if (!iscomment && (src[sp+1] == '/' || src[sp+1] == '*')) {
   198         iscomment = 1;
   199         iscommentml = (src[sp+1] == '*');
   200         memcpy(&(dest[dp]), "<span class=\"c2html-comment\">", 29);
   201         dp += 29;
   202       }
   203     }
   205     if (iscomment) {
   206       if (c == '\n') {
   207         memcpy(&(dest[dp]), "</span>", 7);
   208         dp += 7;
   209       }
   210       dp = writeescapedchar(dest, dp, c);
   211     } else if (isinclude) {
   212       if (c == '<') {
   213         memcpy(&(dest[dp]), "<span class=\"c2html-stdinclude\">", 32);
   214         dp += 32;
   215         dp = writeescapedchar(dest, dp, c);
   216       } else if (c == '\"') {
   217         if (parseinclude) {
   218           dest[dp++] = '\"';
   219           dest[dp++] = '>';
   220           memcpy(&(dest[dp]), includefile, ifp);
   221           dp += ifp;
   223           dp = writeescapedchar(dest, dp, c);
   224           memcpy(&(dest[dp]), "</a>", 4);
   225           dp += 4;
   226           parseinclude = 0;
   227         } else {
   228           memcpy(&(dest[dp]), "<a class=\"c2html-userinclude\" href=", 35);
   229           dp += 35;
   230           dp = writeescapedchar(dest, dp, c);
   231           ifp = 0;
   232           includefile[ifp++] = '\"';
   233           parseinclude = 1;
   234         }
   235       } else if (c == '>') {
   236         dp = writeescapedchar(dest, dp, c);
   237         memcpy(&(dest[dp]), "</span>", 7);
   238         dp += 7;
   239       } else {
   240         if (parseinclude) {
   241           includefile[ifp++] = c;
   242         }
   243         dp = writeescapedchar(dest, dp, c);
   244       }
   245     } else {
   246       /* strings */
   247       if (!isescaping && (c == '\'' || c == '\"')) {
   248         isstring ^= 1;
   249         if (isstring) {
   250           memcpy(&(dest[dp]), "<span class=\"c2html-string\">", 28);
   251           dp += 28;
   252           dp = writeescapedchar(dest, dp, c);
   253         } else {
   254           dp = writeescapedchar(dest, dp, c);
   255           memcpy(&(dest[dp]), "</span>", 7);
   256           dp += 7;
   257         }
   258       } else {
   259         if (isstring) {
   260           dp = writeescapedchar(dest, dp, c);
   261         } else if (!isalnum(c) && c != '_' && c != '#' && c != '.') {
   262           /* interpret word int_t */
   263           if (wp > 0 && wp < WORDBUF_SIZE) {
   264             int closespan = 1;
   265             if (iskeyword(word)) {
   266               memcpy(&(dest[dp]), "<span class=\"c2html-keyword\">", 29);
   267               dp += 29;
   268             } else if (istype(word, wp)) {
   269               memcpy(&(dest[dp]), "<span class=\"c2html-type\">", 26);
   270               dp += 26;
   271             } else if (isdirective(word)) {
   272               isinclude = !strncmp("#include", word, WORDBUF_SIZE);
   273               memcpy(&(dest[dp]), "<span class=\"c2html-directive\">", 31);
   274               dp += 31;
   275             } else if (iscapsonly(word, wp)) {
   276               memcpy(&(dest[dp]), "<span class=\"c2html-macroconst\">", 32);
   277               dp += 32;
   278             } else {
   279               closespan = 0;
   280             }
   281             for (int i = 0 ; i < wp ; i++) {
   282               dp = writeescapedchar(dest, dp, word[i]);
   283             }
   284             if (closespan) {
   285               memcpy(&(dest[dp]), "</span>", 7);
   286               dp += 7;
   287             }
   288           }
   289           memset(word, 0, WORDBUF_SIZE);
   290           wp = 0;
   291           dp = writeescapedchar(dest, dp, c);
   292         } else {
   293           /* read word */
   294           if (wp < WORDBUF_SIZE) {
   295             word[wp++] = c;
   296           } else if (wp == WORDBUF_SIZE) {
   297             for (int i = 0 ; i < WORDBUF_SIZE ; i++) {
   298               dp = writeescapedchar(dest, dp, word[i]);
   299             }
   300             wp++;
   301             dp = writeescapedchar(dest, dp, c);
   302           } else {
   303             dp = writeescapedchar(dest, dp, c);
   304           }
   305         }
   306       }
   308       isescaping = !isescaping & (c == '\\');
   309     }
   310   }
   311   dest[dp] = 0;
   312 }
   314 void printhelp() {
   315   printf("Formats source code using HTML.\n\nUsage:\n"
   316       "  c2html [Options] FILE\n\n"
   317       " Options:\n"
   318       "  -h                    Prints this help message\n"
   319       "  -o <output>           Output file (if not specified, stdout is used)\n"
   320       "  -p                    Disable highlighting (plain text)\n"
   321       "\n");
   324 }
   326 int lnint(size_t lnc) {
   327   int w = 1, p = 1;
   328   while ((p*=10) < lnc) w++;
   329   return w;
   330 }
   332 int main(int argc, char** argv) {
   334   settings_t settings;
   335   settings.outfilename = NULL;
   336   settings.highlight = 1;
   338   char optc;
   339   while ((optc = getopt(argc, argv, "ho:p")) != -1) {
   340     switch (optc) {
   341       case 'o':
   342         if (!(optarg[0] == '-' && optarg[1] == 0)) {
   343           settings.outfilename = optarg;
   344         }
   345         break;
   346       case 'p':
   347         settings.highlight = 0;
   348         break;
   349       case 'h':
   350         printhelp();
   351         return 0;
   352       default:
   353         return 1;
   354     }
   355   }
   357   if (optind != argc-1) {
   358     printhelp();
   359     return 1;
   360   } else {
   361     settings.infilename = argv[optind];
   363     inputfile_t *inputfile = readinput(settings.infilename);
   364     if (inputfile) {
   365       FILE *fout;
   366       char *line;
   367       if (settings.highlight) {
   368         line = (char*) malloc(inputfile->maxlinewidth*64);
   369       } else {
   370         line = NULL;
   371       }
   372       if (settings.outfilename) {
   373         fout = fopen(settings.outfilename, "w");
   374       } else {
   375         fout = stdout;
   376       }
   377       fprintf(fout, "<pre>\n");
   378       int lnw = lnint(inputfile->count);
   379       for (int i = 0 ; i < inputfile->count ; i++) {
   380         if (settings.highlight) {
   381           parseline(inputfile->lines[i], line);
   382         } else {
   383           line = inputfile->lines[i];
   384         }
   385         fprintf(fout, "<span class=\"c2html-lineno\">%*d:</span> %s",
   386             lnw, i+1, line);
   387       }
   388       if (settings.highlight) {
   389         free(line);
   390       }
   391       fprintf(fout, "</pre>\n");
   393       if (fout != stdout) {
   394         fclose(fout);
   395       }
   397       freeinputfilebuffer(inputfile);
   398     }
   400     return 0;
   401   }
   402 }

mercurial