2 * Copyright (C) 2012, 2013
5 * Permission is hereby granted, free of charge, to any person obtaining a copy of
6 * this software and associated documentation files (the "Software"), to deal in
7 * the Software without restriction, including without limitation the rights to
8 * use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is furnished to do
10 * so, subject to the following conditions:
12 * The above copyright notice and this permission notice shall be included in all
13 * copies or substantial portions of the Software.
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
23 #ifndef GMQCC_LEXER_HDR
24 #define GMQCC_LEXER_HDR
/* Opaque token type; only the struct tag is needed by the prototypes below. */
typedef struct token_s token;

/*
 * Token helpers (declarations only; the definitions are not in this header).
 * NOTE(review): judging by the names, the *_all variants presumably operate
 * on a whole chain of tokens rather than a single one - confirm against the
 * implementation before relying on that.
 */
void   token_delete(token *t);
token *token_copy(const token *cp);
void   token_delete_all(token *t);
token *token_copy_all(const token *cp);
60 /* Other tokens which we can return: */
70 TOKEN_KEYWORD, /* loop */
72 TOKEN_DOTS, /* 3 dots, ... */
74 TOKEN_ATTRIBUTE_OPEN, /* [[ */
75 TOKEN_ATTRIBUTE_CLOSE, /* ]] */
77 TOKEN_VA_ARGS, /* for the ftepp only */
78 TOKEN_VA_ARGS_ARRAY, /* for the ftepp only */
79 TOKEN_VA_COUNT, /* to get the count of vaargs */
81 TOKEN_STRINGCONST, /* not the typename but an actual "string" */
92 /* We use '< TOKEN_ERROR', so TOKEN_FATAL must come after it and any
93 * other error related tokens as well
96 TOKEN_FATAL /* internal error, eg out of memory */
104 typedef struct lex_file_s {
106 const char *open_string;
107 size_t open_string_length;
108 size_t open_string_pos;
112 size_t sline; /* line at the start of a token */
119 token tok; /* not a pointer anymore */
123 bool nodigraphs; /* used when lexing string constants */
124 bool preprocessing; /* whitespace and EOLs become actual tokens */
125 bool mergelines; /* backslash at the end of a line escapes the newline */
135 lex_file* lex_open (const char *file);
136 lex_file* lex_open_string(const char *str, size_t len, const char *name);
137 void lex_close(lex_file *lex);
138 int lex_do (lex_file *lex);
139 void lex_cleanup(void);
155 unsigned int operands;
/*
 * Pack two or three small integer values (the operator tables pass character
 * constants) into a single integer id:
 *
 *   opid2(a, b)    -> a in bits 8 and up, b in the low 8 bits
 *   opid3(a, b, c) -> a in bits 16 and up, b in bits 8..15, c in the low 8 bits
 *
 * Every parameter is parenthesized so that an expression argument such as
 * `x | y` or `cond ? p : q` is shifted and OR-ed as a unit instead of being
 * re-associated by operator precedence. Each argument is evaluated exactly
 * once.
 */
#define opid2(a,b)   (((a)<<8)|(b))
#define opid3(a,b,c) (((a)<<16)|((b)<<8)|(c))
166 static const oper_info c_operators[] = {
167 { "(", 0, opid1('('), ASSOC_LEFT, 99, OP_PREFIX}, /* paren expression - non function call */
169 { "++", 1, opid3('S','+','+'), ASSOC_LEFT, 15, OP_SUFFIX},
170 { "--", 1, opid3('S','-','-'), ASSOC_LEFT, 15, OP_SUFFIX},
171 { ".", 2, opid1('.'), ASSOC_LEFT, 15, 0 },
172 { "(", 0, opid1('('), ASSOC_LEFT, 15, 0 }, /* function call */
173 { "[", 2, opid1('['), ASSOC_LEFT, 15, 0 }, /* array subscript */
175 { "!", 1, opid2('!', 'P'), ASSOC_RIGHT, 14, OP_PREFIX },
176 { "~", 1, opid2('~', 'P'), ASSOC_RIGHT, 14, OP_PREFIX },
177 { "+", 1, opid2('+','P'), ASSOC_RIGHT, 14, OP_PREFIX },
178 { "-", 1, opid2('-','P'), ASSOC_RIGHT, 14, OP_PREFIX },
179 { "++", 1, opid3('+','+','P'), ASSOC_RIGHT, 14, OP_PREFIX },
180 { "--", 1, opid3('-','-','P'), ASSOC_RIGHT, 14, OP_PREFIX },
181 /* { "&", 1, opid2('&','P'), ASSOC_RIGHT, 14, OP_PREFIX }, */
183 { "*", 2, opid1('*'), ASSOC_LEFT, 13, 0 },
184 { "/", 2, opid1('/'), ASSOC_LEFT, 13, 0 },
185 { "%", 2, opid1('%'), ASSOC_LEFT, 13, 0 },
187 { "+", 2, opid1('+'), ASSOC_LEFT, 12, 0 },
188 { "-", 2, opid1('-'), ASSOC_LEFT, 12, 0 },
190 { "<<", 2, opid2('<','<'), ASSOC_LEFT, 11, 0 },
191 { ">>", 2, opid2('>','>'), ASSOC_LEFT, 11, 0 },
193 { "<", 2, opid1('<'), ASSOC_LEFT, 10, 0 },
194 { ">", 2, opid1('>'), ASSOC_LEFT, 10, 0 },
195 { "<=>", 2, opid3('<','=','>'), ASSOC_LEFT, 10, 0 },
196 { "<=", 2, opid2('<','='), ASSOC_LEFT, 10, 0 },
197 { ">=", 2, opid2('>','='), ASSOC_LEFT, 10, 0 },
199 { "==", 2, opid2('=','='), ASSOC_LEFT, 9, 0 },
200 { "!=", 2, opid2('!','='), ASSOC_LEFT, 9, 0 },
202 { "&", 2, opid1('&'), ASSOC_LEFT, 8, 0 },
204 { "^", 2, opid1('^'), ASSOC_LEFT, 7, 0 },
206 { "|", 2, opid1('|'), ASSOC_LEFT, 6, 0 },
208 { "&&", 2, opid2('&','&'), ASSOC_LEFT, 5, 0 },
210 { "||", 2, opid2('|','|'), ASSOC_LEFT, 4, 0 },
212 { "?", 3, opid2('?',':'), ASSOC_RIGHT, 3, 0 },
214 { "=", 2, opid1('='), ASSOC_RIGHT, 2, 0 },
215 { "+=", 2, opid2('+','='), ASSOC_RIGHT, 2, 0 },
216 { "-=", 2, opid2('-','='), ASSOC_RIGHT, 2, 0 },
217 { "*=", 2, opid2('*','='), ASSOC_RIGHT, 2, 0 },
218 { "/=", 2, opid2('/','='), ASSOC_RIGHT, 2, 0 },
219 { "%=", 2, opid2('%','='), ASSOC_RIGHT, 2, 0 },
220 { ">>=", 2, opid3('>','>','='), ASSOC_RIGHT, 2, 0 },
221 { "<<=", 2, opid3('<','<','='), ASSOC_RIGHT, 2, 0 },
222 { "&=", 2, opid2('&','='), ASSOC_RIGHT, 2, 0 },
223 { "^=", 2, opid2('^','='), ASSOC_RIGHT, 2, 0 },
224 { "|=", 2, opid2('|','='), ASSOC_RIGHT, 2, 0 },
225 { "&~=", 2, opid3('&','~','='), ASSOC_RIGHT, 2, 0 },
227 { ":", 0, opid2(':','?'), ASSOC_RIGHT, 1, 0 },
229 { ",", 2, opid1(','), ASSOC_LEFT, 0, 0 }
231 static const size_t c_operator_count = (sizeof(c_operators) / sizeof(c_operators[0]));
233 static const oper_info fte_operators[] = {
234 { "(", 0, opid1('('), ASSOC_LEFT, 99, OP_PREFIX}, /* paren expression - non function call */
236 { "++", 1, opid3('S','+','+'), ASSOC_LEFT, 15, OP_SUFFIX},
237 { "--", 1, opid3('S','-','-'), ASSOC_LEFT, 15, OP_SUFFIX},
238 { ".", 2, opid1('.'), ASSOC_LEFT, 15, 0 },
239 { "(", 0, opid1('('), ASSOC_LEFT, 15, 0 }, /* function call */
240 { "[", 2, opid1('['), ASSOC_LEFT, 15, 0 }, /* array subscript */
242 { "!", 1, opid2('!', 'P'), ASSOC_RIGHT, 14, OP_PREFIX },
243 { "+", 1, opid2('+','P'), ASSOC_RIGHT, 14, OP_PREFIX },
244 { "-", 1, opid2('-','P'), ASSOC_RIGHT, 14, OP_PREFIX },
245 { "++", 1, opid3('+','+','P'), ASSOC_RIGHT, 14, OP_PREFIX },
246 { "--", 1, opid3('-','-','P'), ASSOC_RIGHT, 14, OP_PREFIX },
248 { "*", 2, opid1('*'), ASSOC_LEFT, 13, 0 },
249 { "/", 2, opid1('/'), ASSOC_LEFT, 13, 0 },
250 { "&", 2, opid1('&'), ASSOC_LEFT, 13, 0 },
251 { "|", 2, opid1('|'), ASSOC_LEFT, 13, 0 },
253 { "+", 2, opid1('+'), ASSOC_LEFT, 12, 0 },
254 { "-", 2, opid1('-'), ASSOC_LEFT, 12, 0 },
256 { "<<", 2, opid2('<','<'), ASSOC_LEFT, 11, 0 },
257 { ">>", 2, opid2('>','>'), ASSOC_LEFT, 11, 0 },
259 { "<", 2, opid1('<'), ASSOC_LEFT, 10, 0 },
260 { ">", 2, opid1('>'), ASSOC_LEFT, 10, 0 },
261 { "<=", 2, opid2('<','='), ASSOC_LEFT, 10, 0 },
262 { ">=", 2, opid2('>','='), ASSOC_LEFT, 10, 0 },
263 { "==", 2, opid2('=','='), ASSOC_LEFT, 10, 0 },
264 { "!=", 2, opid2('!','='), ASSOC_LEFT, 10, 0 },
266 { "?", 3, opid2('?',':'), ASSOC_RIGHT, 9, 0 },
268 { "=", 2, opid1('='), ASSOC_RIGHT, 8, 0 },
269 { "+=", 2, opid2('+','='), ASSOC_RIGHT, 8, 0 },
270 { "-=", 2, opid2('-','='), ASSOC_RIGHT, 8, 0 },
271 { "*=", 2, opid2('*','='), ASSOC_RIGHT, 8, 0 },
272 { "/=", 2, opid2('/','='), ASSOC_RIGHT, 8, 0 },
273 { "%=", 2, opid2('%','='), ASSOC_RIGHT, 8, 0 },
274 { "&=", 2, opid2('&','='), ASSOC_RIGHT, 8, 0 },
275 { "|=", 2, opid2('|','='), ASSOC_RIGHT, 8, 0 },
276 { "&~=", 2, opid3('&','~','='), ASSOC_RIGHT, 8, 0 },
278 { "&&", 2, opid2('&','&'), ASSOC_LEFT, 5, 0 },
279 { "||", 2, opid2('|','|'), ASSOC_LEFT, 5, 0 },
281 /* Leave precedence 3 for : with -fcorrect-ternary */
282 { ",", 2, opid1(','), ASSOC_LEFT, 2, 0 },
283 { ":", 0, opid2(':','?'), ASSOC_RIGHT, 1, 0 }
285 static const size_t fte_operator_count = (sizeof(fte_operators) / sizeof(fte_operators[0]));
287 static const oper_info qcc_operators[] = {
288 { "(", 0, opid1('('), ASSOC_LEFT, 99, OP_PREFIX}, /* paren expression - non function call */
290 { ".", 2, opid1('.'), ASSOC_LEFT, 15, 0 },
291 { "(", 0, opid1('('), ASSOC_LEFT, 15, 0 }, /* function call */
292 { "[", 2, opid1('['), ASSOC_LEFT, 15, 0 }, /* array subscript */
294 { "!", 1, opid2('!', 'P'), ASSOC_RIGHT, 14, OP_PREFIX },
295 { "+", 1, opid2('+','P'), ASSOC_RIGHT, 14, OP_PREFIX },
296 { "-", 1, opid2('-','P'), ASSOC_RIGHT, 14, OP_PREFIX },
298 { "*", 2, opid1('*'), ASSOC_LEFT, 13, 0 },
299 { "/", 2, opid1('/'), ASSOC_LEFT, 13, 0 },
300 { "&", 2, opid1('&'), ASSOC_LEFT, 13, 0 },
301 { "|", 2, opid1('|'), ASSOC_LEFT, 13, 0 },
303 { "+", 2, opid1('+'), ASSOC_LEFT, 12, 0 },
304 { "-", 2, opid1('-'), ASSOC_LEFT, 12, 0 },
306 { "<", 2, opid1('<'), ASSOC_LEFT, 10, 0 },
307 { ">", 2, opid1('>'), ASSOC_LEFT, 10, 0 },
308 { "<=", 2, opid2('<','='), ASSOC_LEFT, 10, 0 },
309 { ">=", 2, opid2('>','='), ASSOC_LEFT, 10, 0 },
310 { "==", 2, opid2('=','='), ASSOC_LEFT, 10, 0 },
311 { "!=", 2, opid2('!','='), ASSOC_LEFT, 10, 0 },
313 { "=", 2, opid1('='), ASSOC_RIGHT, 8, 0 },
314 { "+=", 2, opid2('+','='), ASSOC_RIGHT, 8, 0 },
315 { "-=", 2, opid2('-','='), ASSOC_RIGHT, 8, 0 },
316 { "*=", 2, opid2('*','='), ASSOC_RIGHT, 8, 0 },
317 { "/=", 2, opid2('/','='), ASSOC_RIGHT, 8, 0 },
318 { "%=", 2, opid2('%','='), ASSOC_RIGHT, 8, 0 },
319 { "&=", 2, opid2('&','='), ASSOC_RIGHT, 8, 0 },
320 { "|=", 2, opid2('|','='), ASSOC_RIGHT, 8, 0 },
322 { "&&", 2, opid2('&','&'), ASSOC_LEFT, 5, 0 },
323 { "||", 2, opid2('|','|'), ASSOC_LEFT, 5, 0 },
325 { ",", 2, opid1(','), ASSOC_LEFT, 2, 0 },
327 static const size_t qcc_operator_count = (sizeof(qcc_operators) / sizeof(qcc_operators[0]));
329 extern const oper_info *operators;
330 extern size_t operator_count;
331 void lexerror(lex_file*, const char *fmt, ...);