Tue, 23 Aug 2016 16:34:02 +0200
words (token) are now stored as sstr_t
21 | 1 | /* |
2 | * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER. | |
3 | * | |
35 | 4 | * Copyright 2016 Mike Becker. All rights reserved. |
21 | 5 | * |
6 | * Redistribution and use in source and binary forms, with or without | |
7 | * modification, are permitted provided that the following conditions are met: | |
8 | * | |
9 | * 1. Redistributions of source code must retain the above copyright | |
10 | * notice, this list of conditions and the following disclaimer. | |
11 | * | |
12 | * 2. Redistributions in binary form must reproduce the above copyright | |
13 | * notice, this list of conditions and the following disclaimer in the | |
14 | * documentation and/or other materials provided with the distribution. | |
15 | * | |
16 | * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | |
17 | * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | |
18 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | |
19 | * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | |
20 | * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | |
21 | * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | |
22 | * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | |
23 | * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | |
24 | * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | |
25 | * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | |
26 | * POSSIBILITY OF SUCH DAMAGE. | |
27 | * | |
28 | */ | |
29 | ||
30 | #include "javacodegen.h" | |
31 | #include <string.h> | |
32 | #include <ctype.h> | |
33 | ||
/*
 * NULL-terminated table of the Java keywords that jparseline() passes to
 * check_keyword() in order to decide whether a word is wrapped in a
 * "c2html-keyword" span.
 */
const char* jkeywords[] = {
    "abstract", "continue", "for", "new", "switch", "assert", "default", "goto",
    "package", "synchronized", "boolean", "do", "if", "private", "this",
    "break", "double", "implements", "protected", "throw", "byte", "else",
    "import", "public", "throws", "case", "enum", "instanceof", "return",
    "transient", "catch", "extends", "int", "short", "try", "char", "final",
    "interface", "static", "void", "class", "finally", "long", "strictfp",
    "volatile", "const", "float", "native", "super", "while", NULL
};
43 | ||
29
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
/*
 * Copies the string literal (or char array) str, without its terminating NUL,
 * to darr at offset doff and advances doff by the number of bytes copied.
 *
 * str must be an array expression, because its length is taken with sizeof.
 * doff must be a modifiable lvalue; it is evaluated more than once.
 * The expansion is a single statement, so the macro is safe to use as the
 * body of an unbraced if/else or loop.
 */
#define memcpy_const(darr,doff,str) do { \
        memcpy(&((darr)[(doff)]), (str), sizeof(str)-1); \
        (doff) += sizeof(str)-1; \
    } while (0)
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
46 | |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
47 | void jparseline(char *src, UcxBuffer *destbuf, int *multiline_comment) { |
45
1f3835182aeb
changes signature of parser functions to use a UcxBuffer - the functions itself don't use the API yet
Mike Becker <universe@uap-core.de>
parents:
39
diff
changeset
|
48 | /* TODO: workaround for using old code with UcxBuffer */ |
1f3835182aeb
changes signature of parser functions to use a UcxBuffer - the functions itself don't use the API yet
Mike Becker <universe@uap-core.de>
parents:
39
diff
changeset
|
49 | char *dest = destbuf->space + destbuf->pos; |
1f3835182aeb
changes signature of parser functions to use a UcxBuffer - the functions itself don't use the API yet
Mike Becker <universe@uap-core.de>
parents:
39
diff
changeset
|
50 | |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
51 | /* TODO: try to replace this buffer */ |
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
52 | char wordbuf[WORDBUF_SIZE]; |
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
53 | sstr_t word; |
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
54 | word.ptr = wordbuf; word.length = 0; |
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
55 | |
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
56 | size_t sp = (size_t)-1, dp = 0; |
21 | 57 | int isstring = 0, iscomment = 0, isimport = 0; |
28
1be8ea902ef4
fixed string highlighting when different quote symbol is in string
Mike Becker <universe@uap-core.de>
parents:
26
diff
changeset
|
58 | char quote = '\0'; |
21 | 59 | int isescaping = 0; |
60 | ||
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
61 | if (*multiline_comment) { |
21 | 62 | iscomment = 1; |
29
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
63 | memcpy_const(dest, dp, "<span class=\"c2html-comment\">"); |
21 | 64 | } |
65 | ||
39
ac35daceb24c
adds UCX + changes how the input file is read (uses an consecutive memory area now)
Mike Becker <universe@uap-core.de>
parents:
36
diff
changeset
|
66 | char c; |
ac35daceb24c
adds UCX + changes how the input file is read (uses an consecutive memory area now)
Mike Becker <universe@uap-core.de>
parents:
36
diff
changeset
|
67 | do { |
ac35daceb24c
adds UCX + changes how the input file is read (uses an consecutive memory area now)
Mike Becker <universe@uap-core.de>
parents:
36
diff
changeset
|
68 | c = src[++sp]; |
ac35daceb24c
adds UCX + changes how the input file is read (uses an consecutive memory area now)
Mike Becker <universe@uap-core.de>
parents:
36
diff
changeset
|
69 | if (!c) break; |
ac35daceb24c
adds UCX + changes how the input file is read (uses an consecutive memory area now)
Mike Becker <universe@uap-core.de>
parents:
36
diff
changeset
|
70 | |
21 | 71 | /* comments */ |
26
05c3c6842aef
fixed wrong comment formatting in strings
Mike Becker <universe@uap-core.de>
parents:
24
diff
changeset
|
72 | if (!isstring && c == '/') { |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
73 | if (*multiline_comment && sp > 0 && src[sp-1] == '*') { |
21 | 74 | iscomment = 0; |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
75 | *multiline_comment = 0; |
29
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
76 | memcpy_const(dest, dp, "/</span>"); |
21 | 77 | continue; |
78 | } else if (!iscomment && (src[sp+1] == '/' || src[sp+1] == '*')) { | |
79 | iscomment = 1; | |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
80 | *multiline_comment = (src[sp+1] == '*'); |
29
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
81 | memcpy_const(dest, dp, "<span class=\"c2html-comment\">"); |
21 | 82 | } |
83 | } | |
84 | ||
85 | if (iscomment) { | |
86 | if (c == '\n') { | |
87 | memcpy(&(dest[dp]), "</span>", 7); | |
88 | dp += 7; | |
89 | } | |
90 | dp = writeescapedchar(dest, dp, c); | |
91 | } else if (isimport) { | |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
92 | /* TODO: local imports */ |
21 | 93 | } else { |
94 | /* strings */ | |
95 | if (!isescaping && (c == '\'' || c == '\"')) { | |
96 | if (isstring) { | |
29
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
97 | dp = writeescapedchar(dest, dp, c); |
28
1be8ea902ef4
fixed string highlighting when different quote symbol is in string
Mike Becker <universe@uap-core.de>
parents:
26
diff
changeset
|
98 | if (c == quote) { |
1be8ea902ef4
fixed string highlighting when different quote symbol is in string
Mike Becker <universe@uap-core.de>
parents:
26
diff
changeset
|
99 | isstring = 0; |
29
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
100 | memcpy_const(dest, dp, "</span>"); |
28
1be8ea902ef4
fixed string highlighting when different quote symbol is in string
Mike Becker <universe@uap-core.de>
parents:
26
diff
changeset
|
101 | } else { |
1be8ea902ef4
fixed string highlighting when different quote symbol is in string
Mike Becker <universe@uap-core.de>
parents:
26
diff
changeset
|
102 | dp = writeescapedchar(dest, dp, c); |
1be8ea902ef4
fixed string highlighting when different quote symbol is in string
Mike Becker <universe@uap-core.de>
parents:
26
diff
changeset
|
103 | } |
21 | 104 | } else { |
28
1be8ea902ef4
fixed string highlighting when different quote symbol is in string
Mike Becker <universe@uap-core.de>
parents:
26
diff
changeset
|
105 | isstring = 1; |
1be8ea902ef4
fixed string highlighting when different quote symbol is in string
Mike Becker <universe@uap-core.de>
parents:
26
diff
changeset
|
106 | quote = c; |
29
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
107 | memcpy_const(dest, dp, |
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
108 | "<span class=\"c2html-string\">"); |
21 | 109 | dp = writeescapedchar(dest, dp, c); |
110 | } | |
111 | } else { | |
112 | if (isstring) { | |
113 | dp = writeescapedchar(dest, dp, c); | |
114 | } else if (!iswordcharacter(c)) { | |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
115 | if (word.length > 0 && word.length < WORDBUF_SIZE) { |
21 | 116 | int closespan = 1; |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
117 | if (check_keyword(word, jkeywords)) { |
29
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
118 | memcpy_const(dest, dp, |
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
119 | "<span class=\"c2html-keyword\">"); |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
120 | } else if (isupper(word.ptr[0])) { |
29
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
121 | memcpy_const(dest, dp, |
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
122 | "<span class=\"c2html-type\">"); |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
123 | } else if (word.ptr[0] == '@') { |
29
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
124 | memcpy_const(dest, dp, |
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
125 | "<span class=\"c2html-directive\">"); |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
126 | } else if (check_capsonly(word)) { |
29
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
127 | memcpy_const(dest, dp, |
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
128 | "<span class=\"c2html-macroconst\">"); |
21 | 129 | } else { |
130 | closespan = 0; | |
131 | } | |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
132 | for (int i = 0 ; i < word.length ; i++) { |
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
133 | dp = writeescapedchar(dest, dp, word.ptr[i]); |
21 | 134 | } |
135 | if (closespan) { | |
29
ec6e97454e64
introduced macro for constant string memcpy + fixed string highlight fix
Mike Becker <universe@uap-core.de>
parents:
28
diff
changeset
|
136 | memcpy_const(dest, dp, "</span>"); |
21 | 137 | } |
138 | } | |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
139 | word.length = 0; |
21 | 140 | dp = writeescapedchar(dest, dp, c); |
141 | } else { | |
142 | /* read word */ | |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
143 | if (word.length < WORDBUF_SIZE) { |
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
144 | word.ptr[word.length++] = c; |
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
145 | } else if (word.length == WORDBUF_SIZE) { |
21 | 146 | for (int i = 0 ; i < WORDBUF_SIZE ; i++) { |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
147 | dp = writeescapedchar(dest, dp, word.ptr[i]); |
21 | 148 | } |
47
c39ecbbca7c0
words (token) are now stored as sstr_t
Mike Becker <universe@uap-core.de>
parents:
46
diff
changeset
|
149 | word.length++; |
21 | 150 | dp = writeescapedchar(dest, dp, c); |
151 | } else { | |
152 | dp = writeescapedchar(dest, dp, c); | |
153 | } | |
154 | } | |
155 | } | |
156 | ||
157 | isescaping = !isescaping & (c == '\\'); | |
158 | } | |
39
ac35daceb24c
adds UCX + changes how the input file is read (uses an consecutive memory area now)
Mike Becker <universe@uap-core.de>
parents:
36
diff
changeset
|
159 | } while (c != '\n'); |
21 | 160 | dest[dp] = 0; |
45
1f3835182aeb
changes signature of parser functions to use a UcxBuffer - the functions itself don't use the API yet
Mike Becker <universe@uap-core.de>
parents:
39
diff
changeset
|
161 | |
1f3835182aeb
changes signature of parser functions to use a UcxBuffer - the functions itself don't use the API yet
Mike Becker <universe@uap-core.de>
parents:
39
diff
changeset
|
162 | /* TODO: workaround */ |
1f3835182aeb
changes signature of parser functions to use a UcxBuffer - the functions itself don't use the API yet
Mike Becker <universe@uap-core.de>
parents:
39
diff
changeset
|
163 | destbuf->pos += dp; |
1f3835182aeb
changes signature of parser functions to use a UcxBuffer - the functions itself don't use the API yet
Mike Becker <universe@uap-core.de>
parents:
39
diff
changeset
|
164 | destbuf->size += dp; |
21 | 165 | } |