Thu, 02 Feb 2012 14:17:35 +0100
added regex parser
universe@10 | 1 | /* |
universe@10 | 2 | * cline.c |
universe@10 | 3 | * |
universe@10 | 4 | * Created on: 23.05.2011 |
universe@20 | 5 | * Author: Mike |
universe@10 | 6 | */ |
universe@10 | 7 | |
universe@3 | 8 | #include "cline.h" |
universe@10 | 9 | #include "scanner.h" |
universe@10 | 10 | #include "settings.h" |
universe@12 | 11 | #include "arguments.h" |
universe@16 | 12 | #include "stream.h" |
universe@27 | 13 | #include "regex_parser.h" |
universe@0 | 14 | |
universe@12 | 15 | void printHelpText() { |
universe@0 | 16 | const char* helpText = |
universe@1 | 17 | "\nUsage:" |
universe@27 | 18 | "\n cline [Options] [Directory]" |
universe@27 | 19 | "\n cline [Options] [Directory]" |
universe@0 | 20 | "\n\nCounts the line terminator characters (\\n) within all" |
universe@0 | 21 | " files in the specified\ndirectory." |
universe@0 | 22 | "\n\nOptions:" |
universe@21 | 23 | "\n -b <level> - binary file heuristics level (default medium)" |
universe@21 | 24 | "\n One of: ignore low medium high" |
universe@28 | 25 | "\n -E <pattern> - Excludes any line matching the <pattern>" |
universe@27 | 26 | "\n -e <start> <end> - Excludes lines between <start> and <end>" |
universe@28 | 27 | "\n You may use these options multiple times" |
universe@0 | 28 | "\n -h, --help - this help text" |
universe@1 | 29 | "\n -m - print information about matching files only" |
universe@1 | 30 | "\n -s <suffixes> - only count files with these suffixes (separated" |
universe@0 | 31 | "\n by commas)" |
universe@1 | 32 | "\n -S <suffixes> - count any file except those with these suffixes" |
universe@0 | 33 | "\n (separated by commas)" |
universe@1 | 34 | "\n -r, -R - includes subdirectories" |
universe@14 | 35 | "\n -v, --version - print out version information" |
universe@16 | 36 | "\n -V - turn verbose output off, print the result only" |
universe@0 | 37 | "\n\n" |
universe@1 | 38 | "The default call without any options is:" |
universe@28 | 39 | "\n cline ./\n\n" |
universe@7 | 40 | "So each file in the working directory is counted. If you want to count C" |
universe@7 | 41 | "\nsource code in your working directory and its subdirectories, type:" |
universe@27 | 42 | "\n cline -rs .c\n" |
universe@28 | 43 | "\nIf you want to exclude comment lines, you may use the -e/-E option." |
universe@27 | 44 | "\nAfter a line matches the regex pattern <start> any following line is" |
universe@28 | 45 | "\nnot counted unless a line matches the <end> pattern. A line is still " |
universe@28 | 46 | "\ncounted when it does not start or end with the respective patterns." |
universe@28 | 47 | "\nPlease note, that cline does not remove whitespace characters as this" |
universe@28 | 48 | "\nmight not be reasonable in some cases." |
universe@28 | 49 | "\n\nExample (C comments):" |
universe@28 | 50 | "\n cline -s .c,.h -E \"\\s*//\" -e \"\\s*/\\*\" \"\\*/\\s*\""; |
universe@1 | 51 | |
universe@12 | 52 | printf(helpText); |
universe@1 | 53 | } |
universe@1 | 54 | |
universe@14 | 55 | int exit_with_version(settings_t* settings) { |
universe@16 | 56 | printf("cline - Revision: %s", VERSION); |
universe@14 | 57 | destroy_settings_t(settings); |
universe@14 | 58 | return 0; |
universe@14 | 59 | } |
universe@14 | 60 | |
universe@12 | 61 | int exit_with_help(settings_t* settings, int code) { |
universe@12 | 62 | printHelpText(); |
universe@8 | 63 | destroy_settings_t(settings); |
universe@8 | 64 | return code; |
universe@8 | 65 | } |
universe@8 | 66 | |
universe@1 | 67 | int main(int argc, char** argv) { |
universe@0 | 68 | |
universe@22 | 69 | /* Settings */ |
universe@3 | 70 | settings_t *settings = new_settings_t(); |
universe@5 | 71 | if (settings == NULL) { |
universe@5 | 72 | fprintf(stderr, "Memory allocation failed.\n"); |
universe@5 | 73 | return 1; |
universe@5 | 74 | } |
universe@3 | 75 | |
universe@22 | 76 | /* Get arguments */ |
universe@7 | 77 | char* directory = "./"; |
universe@7 | 78 | char* suffix = " "; |
universe@8 | 79 | int checked = 0; |
universe@0 | 80 | |
universe@1 | 81 | for (int t = 1 ; t < argc ; t++) { |
universe@1 | 82 | |
universe@28 | 83 | int argflags = checkArgument(argv[t], "hsSrRmvVbeE"); |
universe@1 | 84 | |
universe@22 | 85 | /* s, S */ |
universe@14 | 86 | if ((argflags & 6) > 0) { |
universe@8 | 87 | if (registerArgument(&checked, 6)) { |
universe@12 | 88 | return exit_with_help(settings, 1); |
universe@0 | 89 | } |
universe@14 | 90 | settings->includeSuffixes = (argflags & 2) > 0; |
universe@1 | 91 | t++; |
universe@1 | 92 | if (t >= argc) { |
universe@12 | 93 | return exit_with_help(settings, 1); |
universe@1 | 94 | } |
universe@1 | 95 | suffix = argv[t]; |
universe@0 | 96 | } |
universe@22 | 97 | /* h */ |
universe@1 | 98 | if ((argflags & 1) > 0 || strcmp(argv[t], "--help") == 0) { |
universe@14 | 99 | return exit_with_help(settings, 0); |
universe@0 | 100 | } |
universe@22 | 101 | /* r, R */ |
universe@1 | 102 | if ((argflags & 24) > 0) { |
universe@8 | 103 | if (registerArgument(&checked, 24)) { |
universe@12 | 104 | return exit_with_help(settings, 1); |
universe@0 | 105 | } |
universe@3 | 106 | settings->recursive = true; |
universe@0 | 107 | } |
universe@22 | 108 | /* m */ |
universe@1 | 109 | if ((argflags & 32) > 0) { |
universe@8 | 110 | if (registerArgument(&checked, 32)) { |
universe@12 | 111 | return exit_with_help(settings, 1); |
universe@0 | 112 | } |
universe@3 | 113 | settings->matchesOnly = true; |
universe@0 | 114 | } |
universe@22 | 115 | /* v */ |
universe@14 | 116 | if ((argflags & 64) > 0 || strcmp(argv[t], "--version") == 0) { |
universe@14 | 117 | return exit_with_version(settings); |
universe@14 | 118 | } |
universe@22 | 119 | /* V */ |
universe@16 | 120 | if ((argflags & 128) > 0) { |
universe@16 | 121 | if (registerArgument(&checked, 128)) { |
universe@16 | 122 | return exit_with_help(settings, 1); |
universe@16 | 123 | } |
universe@16 | 124 | settings->verbose = false; |
universe@16 | 125 | } |
universe@22 | 126 | /* b */ |
universe@21 | 127 | if ((argflags & 256) > 0) { |
universe@21 | 128 | if (registerArgument(&checked, 256)) { |
universe@21 | 129 | return exit_with_help(settings, 1); |
universe@21 | 130 | } |
universe@21 | 131 | t++; |
universe@21 | 132 | if (t >= argc) { |
universe@21 | 133 | return exit_with_help(settings, 1); |
universe@21 | 134 | } |
universe@24 | 135 | if (strcasecmp(argv[t], "ignore") == 0) { |
universe@21 | 136 | settings->bfileHeuristics->level = BFILE_IGNORE; |
universe@24 | 137 | } else if (strcasecmp(argv[t], "low") == 0) { |
universe@21 | 138 | settings->bfileHeuristics->level = BFILE_LOW_ACCURACY; |
universe@24 | 139 | } else if (strcasecmp(argv[t], "medium") == 0) { |
universe@21 | 140 | settings->bfileHeuristics->level = BFILE_MEDIUM_ACCURACY; |
universe@24 | 141 | } else if (strcasecmp(argv[t], "high") == 0) { |
universe@21 | 142 | settings->bfileHeuristics->level = BFILE_HIGH_ACCURACY; |
universe@21 | 143 | } else { |
universe@21 | 144 | return exit_with_help(settings, 1); |
universe@21 | 145 | } |
universe@21 | 146 | } |
universe@28 | 147 | /* e */ |
universe@27 | 148 | if ((argflags & 512) > 0) { |
universe@27 | 149 | if (t + 2 >= argc) { |
universe@27 | 150 | return exit_with_help(settings, 1); |
universe@27 | 151 | } |
universe@27 | 152 | t++; add_string(settings->regex->pattern_list, argv[t]); |
universe@27 | 153 | t++; add_string(settings->regex->pattern_list, argv[t]); |
universe@27 | 154 | } |
universe@28 | 155 | /* E */ |
universe@28 | 156 | if ((argflags & 1024) > 0) { |
universe@28 | 157 | t++; |
universe@28 | 158 | if (t >= argc) { |
universe@28 | 159 | return exit_with_help(settings, 1); |
universe@28 | 160 | } |
universe@28 | 161 | add_string(settings->regex->pattern_list, argv[t]); |
universe@28 | 162 | add_string(settings->regex->pattern_list, "$"); |
universe@28 | 163 | } |
universe@22 | 164 | /* Path */ |
universe@1 | 165 | if (argflags == 0) { |
universe@8 | 166 | if (registerArgument(&checked, 1024)) { |
universe@12 | 167 | return exit_with_help(settings, 1); |
universe@0 | 168 | } |
universe@0 | 169 | directory = argv[t]; |
universe@0 | 170 | } |
universe@0 | 171 | } |
universe@0 | 172 | |
universe@22 | 173 | /* Configure output */ |
universe@16 | 174 | if (!settings->verbose) { |
universe@16 | 175 | close_stdout(); |
universe@16 | 176 | } |
universe@16 | 177 | |
universe@22 | 178 | /* Find tokens */ |
universe@6 | 179 | char* finder = strtok(suffix, ","); |
universe@1 | 180 | while (finder != NULL) { |
universe@19 | 181 | add_string(settings->suffixList, finder); |
universe@0 | 182 | finder = strtok(NULL, ","); |
universe@0 | 183 | } |
universe@0 | 184 | |
universe@22 | 185 | /* Scan directory */ |
universe@28 | 186 | if (regex_compile_all(settings->regex)) { |
universe@28 | 187 | int lines = scanDirectory((scanner_t){directory, 0}, settings); |
universe@28 | 188 | destroy_settings_t(settings); |
universe@0 | 189 | |
universe@28 | 190 | /* Print double line and line count */ |
universe@28 | 191 | for (int t = 0 ; t < 79 ; t++) { |
universe@28 | 192 | printf("="); |
universe@28 | 193 | } |
universe@28 | 194 | printf("\n%73d lines\n", lines); |
universe@0 | 195 | |
universe@28 | 196 | if (settings->confusing_lnlen && settings->regex->pattern_list->count > 0) { |
universe@28 | 197 | printf("\nSome files contain too long lines.\n" |
universe@28 | 198 | "The regex parser currently supports a maximum line length of %d." |
universe@28 | 199 | "\nThe result might be wrong.\n", REGEX_MAX_LINELENGTH); |
universe@28 | 200 | } |
universe@25 | 201 | |
universe@28 | 202 | if (!settings->verbose) { |
universe@28 | 203 | reopen_stdout(); |
universe@28 | 204 | printf("%d", lines); |
universe@28 | 205 | } |
universe@16 | 206 | } |
universe@16 | 207 | |
universe@16 | 208 | fflush(stdout); |
universe@28 | 209 | fflush(stderr); |
universe@0 | 210 | return 0; |
universe@0 | 211 | } |