X-Git-Url: https://git.xonotic.org/?p=xonotic%2Fgmqcc.git;a=blobdiff_plain;f=lexer.h;h=8ed85a97ab39607494378f048cd1ad4429d29d91;hp=561148ca0a18db5a590b6aefcc9297194dba0bd6;hb=f84c8ea62922f20b13e54916fac849ade0886b66;hpb=79619fbf50c473672f268b27b8c667f0a2e83271 diff --git a/lexer.h b/lexer.h index 561148c..8ed85a9 100644 --- a/lexer.h +++ b/lexer.h @@ -1,38 +1,19 @@ -#ifndef GMQCC_LEXER_HDR_ -#define GMQCC_LEXER_HDR_ - -typedef struct token_s token; - -#include "ast.h" - -struct token_s { - int ttype; - - char *value; - - union { - vector v; - int i; - double f; - int t; /* type */ - } constval; - -#if 0 - struct token_s *next; - struct token_s *prev; -#endif - - lex_ctx ctx; +#ifndef GMQCC_LEXER_HDR +#define GMQCC_LEXER_HDR +#include "gmqcc.h" + +struct token { + int ttype; + char *value; + union { + vec3_t v; + int i; + qcfloat_t f; + qc_type t; /* type */ + } constval; + lex_ctx_t ctx; }; -#if 0 -token* token_new(); -void token_delete(token*); -token* token_copy(const token *cp); -void token_delete_all(token *t); -token* token_copy_all(const token *cp); -#endif - /* Lexer * */ @@ -51,6 +32,13 @@ enum { TOKEN_DOTS, /* 3 dots, ... */ + TOKEN_ATTRIBUTE_OPEN, /* [[ */ + TOKEN_ATTRIBUTE_CLOSE, /* ]] */ + + TOKEN_VA_ARGS, /* for the ftepp only */ + TOKEN_VA_ARGS_ARRAY, /* for the ftepp only */ + TOKEN_VA_COUNT, /* to get the count of vaargs */ + TOKEN_STRINGCONST, /* not the typename but an actual "string" */ TOKEN_CHARCONST, TOKEN_VECTORCONST, @@ -60,7 +48,11 @@ enum { TOKEN_WHITE, TOKEN_EOL, - TOKEN_EOF, + /* if we add additional tokens before this, the exposed API + * should not be broken anyway, but EOF/ERROR/... should + * still be at the bottom + */ + TOKEN_EOF = 1024, /* We use '< TOKEN_ERROR', so TOKEN_FATAL must come after it and any * other error related tokens as well @@ -69,65 +61,42 @@ enum { TOKEN_FATAL /* internal error, eg out of memory */ }; -static const char *_tokennames[] = { - "TOKEN_START", - "TOKEN_IDENT", - "TOKEN_TYPENAME", - "TOKEN_OPERATOR", - "TOKEN_KEYWORD", - "TOKEN_DOTS", - "TOKEN_STRINGCONST", - "TOKEN_CHARCONST", - "TOKEN_VECTORCONST", - "TOKEN_INTCONST", - "TOKEN_FLOATCONST", - "TOKEN_WHITE", - "TOKEN_EOL", - "TOKEN_EOF", - "TOKEN_ERROR", - "TOKEN_FATAL", -}; -typedef int -_all_tokennames_added_[ - ((TOKEN_FATAL - TOKEN_START + 1) == - (sizeof(_tokennames)/sizeof(_tokennames[0]))) - ? 1 : -1]; - -typedef struct { +struct frame_macro { char *name; - int value; -} frame_macro; + int value; +}; -typedef struct { - FILE *file; - const char *open_string; - size_t open_string_length; - size_t open_string_pos; +struct lex_file { + FILE *file; + const char *open_string; + size_t open_string_length; + size_t open_string_pos; - char *name; - size_t line; - size_t sline; /* line at the start of a token */ + char *name; + size_t line; + size_t sline; /* line at the start of a token */ + size_t column; - char peek[256]; - size_t peekpos; + int peek[256]; + size_t peekpos; - bool eof; + bool eof; - token tok; /* not a pointer anymore */ + token tok; /* not a pointer anymore */ - struct { - bool noops; - bool nodigraphs; /* used when lexing string constants */ - bool preprocessing; /* whitespace and EOLs become actual tokens */ - bool mergelines; /* backslash at the end of a line escapes the newline */ - } flags; + struct { + unsigned noops:1; + unsigned nodigraphs:1; /* used when lexing string constants */ + unsigned preprocessing:1; /* whitespace and EOLs become actual tokens */ + unsigned mergelines:1; /* backslash at the end of a line escapes the newline */ + } flags; /* sizeof == 1 */ int framevalue; - frame_macro *frames; - char *modelname; + frame_macro *frames; + char *modelname; - size_t push_line; -} lex_file; + size_t push_line; +}; lex_file* lex_open (const char *file); lex_file* lex_open_string(const char *str, size_t len, const char *name); @@ -147,127 +116,188 @@ enum { #define OP_SUFFIX 1 #define OP_PREFIX 2 -typedef struct { +struct oper_info { const char *op; unsigned int operands; unsigned int id; unsigned int assoc; - unsigned int prec; + signed int prec; unsigned int flags; -} oper_info; + bool folds; +}; -#define opid1(a) (a) -#define opid2(a,b) ((a<<8)|b) -#define opid3(a,b,c) ((a<<16)|(b<<8)|c) +/* + * Explicit uint8_t casts since the left operand of shift operator cannot + * be negative, even though it won't happen, this supresses the future + * possibility. + */ +#define opid1(a) ((uint8_t)a) +#define opid2(a,b) (((uint8_t)a<<8) |(uint8_t)b) +#define opid3(a,b,c) (((uint8_t)a<<16)|((uint8_t)b<<8)|(uint8_t)c) static const oper_info c_operators[] = { - { "(", 0, opid1('('), ASSOC_LEFT, 99, OP_PREFIX}, /* paren expression - non function call */ + { "(", 0, opid1('('), ASSOC_LEFT, 99, OP_PREFIX, false}, /* paren expression - non function call */ + { "_length", 1, opid3('l','e','n'), ASSOC_RIGHT, 98, OP_PREFIX, true}, + + { "++", 1, opid3('S','+','+'), ASSOC_LEFT, 17, OP_SUFFIX, false}, + { "--", 1, opid3('S','-','-'), ASSOC_LEFT, 17, OP_SUFFIX, false}, + { ".", 2, opid1('.'), ASSOC_LEFT, 17, 0, false}, + { "(", 0, opid1('('), ASSOC_LEFT, 17, 0, false}, /* function call */ + { "[", 2, opid1('['), ASSOC_LEFT, 17, 0, false}, /* array subscript */ - { "++", 1, opid3('S','+','+'), ASSOC_LEFT, 16, OP_SUFFIX}, - { "--", 1, opid3('S','-','-'), ASSOC_LEFT, 16, OP_SUFFIX}, + { "++", 1, opid3('+','+','P'), ASSOC_RIGHT, 16, OP_PREFIX, false}, + { "--", 1, opid3('-','-','P'), ASSOC_RIGHT, 16, OP_PREFIX, false}, - { ".", 2, opid1('.'), ASSOC_LEFT, 15, 0 }, - { "(", 0, opid1('('), ASSOC_LEFT, 15, 0 }, /* function call */ - { "[", 2, opid1('['), ASSOC_LEFT, 15, 0 }, /* array subscript */ + { "**", 2, opid2('*','*'), ASSOC_RIGHT, 14, 0, true}, + { "!", 1, opid2('!','P'), ASSOC_RIGHT, 14, OP_PREFIX, true}, + { "~", 1, opid2('~','P'), ASSOC_RIGHT, 14, OP_PREFIX, true}, + { "+", 1, opid2('+','P'), ASSOC_RIGHT, 14, OP_PREFIX, false}, + { "-", 1, opid2('-','P'), ASSOC_RIGHT, 14, OP_PREFIX, true}, +/* { "&", 1, opid2('&','P'), ASSOC_RIGHT, 14, OP_PREFIX, false}, */ - { "!", 1, opid2('!', 'P'), ASSOC_RIGHT, 14, OP_PREFIX }, - { "~", 1, opid2('~', 'P'), ASSOC_RIGHT, 14, OP_PREFIX }, - { "+", 1, opid2('+','P'), ASSOC_RIGHT, 14, OP_PREFIX }, - { "-", 1, opid2('-','P'), ASSOC_RIGHT, 14, OP_PREFIX }, - { "++", 1, opid3('+','+','P'), ASSOC_RIGHT, 14, OP_PREFIX }, - { "--", 1, opid3('-','-','P'), ASSOC_RIGHT, 14, OP_PREFIX }, -/* { "&", 1, opid2('&','P'), ASSOC_RIGHT, 14, OP_PREFIX }, */ + { "*", 2, opid1('*'), ASSOC_LEFT, 13, 0, true}, + { "/", 2, opid1('/'), ASSOC_LEFT, 13, 0, true}, + { "%", 2, opid1('%'), ASSOC_LEFT, 13, 0, true}, + { "><", 2, opid2('>','<'), ASSOC_LEFT, 13, 0, true}, - { "*", 2, opid1('*'), ASSOC_LEFT, 13, 0 }, - { "/", 2, opid1('/'), ASSOC_LEFT, 13, 0 }, - { "%", 2, opid1('%'), ASSOC_LEFT, 13, 0 }, + { "+", 2, opid1('+'), ASSOC_LEFT, 12, 0, true}, + { "-", 2, opid1('-'), ASSOC_LEFT, 12, 0, true}, - { "+", 2, opid1('+'), ASSOC_LEFT, 12, 0 }, - { "-", 2, opid1('-'), ASSOC_LEFT, 12, 0 }, + { "<<", 2, opid2('<','<'), ASSOC_LEFT, 11, 0, true}, + { ">>", 2, opid2('>','>'), ASSOC_LEFT, 11, 0, true}, - { "<<", 2, opid2('<','<'), ASSOC_LEFT, 11, 0 }, - { ">>", 2, opid2('>','>'), ASSOC_LEFT, 11, 0 }, + { "<", 2, opid1('<'), ASSOC_LEFT, 10, 0, false}, + { ">", 2, opid1('>'), ASSOC_LEFT, 10, 0, false}, + { "<=>", 2, opid3('<','=','>'), ASSOC_LEFT, 10, 0, true}, + { "<=", 2, opid2('<','='), ASSOC_LEFT, 10, 0, false}, + { ">=", 2, opid2('>','='), ASSOC_LEFT, 10, 0, false}, - { "<", 2, opid1('<'), ASSOC_LEFT, 10, 0 }, - { ">", 2, opid1('>'), ASSOC_LEFT, 10, 0 }, - { "<=", 2, opid2('<','='), ASSOC_LEFT, 10, 0 }, - { ">=", 2, opid2('>','='), ASSOC_LEFT, 10, 0 }, + { "==", 2, opid2('=','='), ASSOC_LEFT, 9, 0, true}, + { "!=", 2, opid2('!','='), ASSOC_LEFT, 9, 0, true}, - { "==", 2, opid2('=','='), ASSOC_LEFT, 9, 0 }, - { "!=", 2, opid2('!','='), ASSOC_LEFT, 9, 0 }, + { "&", 2, opid1('&'), ASSOC_LEFT, 8, 0, true}, - { "&", 2, opid1('&'), ASSOC_LEFT, 8, 0 }, + { "^", 2, opid1('^'), ASSOC_LEFT, 7, 0, true}, - { "^", 2, opid1('^'), ASSOC_LEFT, 7, 0 }, + { "|", 2, opid1('|'), ASSOC_LEFT, 6, 0, true}, - { "|", 2, opid1('|'), ASSOC_LEFT, 6, 0 }, + { "&&", 2, opid2('&','&'), ASSOC_LEFT, 5, 0, true}, - { "&&", 2, opid2('&','&'), ASSOC_LEFT, 5, 0 }, + { "||", 2, opid2('|','|'), ASSOC_LEFT, 4, 0, true}, - { "||", 2, opid2('|','|'), ASSOC_LEFT, 4, 0 }, + { "?", 3, opid2('?',':'), ASSOC_RIGHT, 3, 0, true}, - { "?", 3, opid2('?',':'), ASSOC_RIGHT, 3, 0 }, + { "=", 2, opid1('='), ASSOC_RIGHT, 2, 0, false}, + { "+=", 2, opid2('+','='), ASSOC_RIGHT, 2, 0, false}, + { "-=", 2, opid2('-','='), ASSOC_RIGHT, 2, 0, false}, + { "*=", 2, opid2('*','='), ASSOC_RIGHT, 2, 0, false}, + { "/=", 2, opid2('/','='), ASSOC_RIGHT, 2, 0, false}, + { "%=", 2, opid2('%','='), ASSOC_RIGHT, 2, 0, false}, + { ">>=", 2, opid3('>','>','='), ASSOC_RIGHT, 2, 0, false}, + { "<<=", 2, opid3('<','<','='), ASSOC_RIGHT, 2, 0, false}, + { "&=", 2, opid2('&','='), ASSOC_RIGHT, 2, 0, false}, + { "^=", 2, opid2('^','='), ASSOC_RIGHT, 2, 0, false}, + { "|=", 2, opid2('|','='), ASSOC_RIGHT, 2, 0, false}, - { "=", 2, opid1('='), ASSOC_RIGHT, 2, 0 }, - { "+=", 2, opid2('+','='), ASSOC_RIGHT, 2, 0 }, - { "-=", 2, opid2('-','='), ASSOC_RIGHT, 2, 0 }, - { "*=", 2, opid2('*','='), ASSOC_RIGHT, 2, 0 }, - { "/=", 2, opid2('/','='), ASSOC_RIGHT, 2, 0 }, - { "%=", 2, opid2('%','='), ASSOC_RIGHT, 2, 0 }, - { ">>=", 2, opid3('>','>','='), ASSOC_RIGHT, 2, 0 }, - { "<<=", 2, opid3('<','<','='), ASSOC_RIGHT, 2, 0 }, - { "&=", 2, opid2('&','='), ASSOC_RIGHT, 2, 0 }, - { "^=", 2, opid2('^','='), ASSOC_RIGHT, 2, 0 }, - { "|=", 2, opid2('|','='), ASSOC_RIGHT, 2, 0 }, + { ":", 0, opid2(':','?'), ASSOC_RIGHT, 1, 0, false}, - { ",", 2, opid1(','), ASSOC_LEFT, 1, 0 } + { ",", 2, opid1(','), ASSOC_LEFT, 0, 0, false} }; -static const size_t c_operator_count = (sizeof(c_operators) / sizeof(c_operators[0])); -static const oper_info qcc_operators[] = { - { "(", 0, opid1('('), ASSOC_LEFT, 99, OP_PREFIX}, /* paren expression - non function call */ - - { ".", 2, opid1('.'), ASSOC_LEFT, 15, 0 }, - { "(", 0, opid1('('), ASSOC_LEFT, 15, 0 }, /* function call */ - { "[", 2, opid1('['), ASSOC_LEFT, 15, 0 }, /* array subscript */ - - { "!", 1, opid2('!', 'P'), ASSOC_RIGHT, 14, OP_PREFIX }, - { "+", 1, opid2('+','P'), ASSOC_RIGHT, 14, OP_PREFIX }, - { "-", 1, opid2('-','P'), ASSOC_RIGHT, 14, OP_PREFIX }, - - { "*", 2, opid1('*'), ASSOC_LEFT, 13, 0 }, - { "/", 2, opid1('/'), ASSOC_LEFT, 13, 0 }, - { "&", 2, opid1('&'), ASSOC_LEFT, 13, 0 }, - { "|", 2, opid1('|'), ASSOC_LEFT, 13, 0 }, - - { "+", 2, opid1('+'), ASSOC_LEFT, 12, 0 }, - { "-", 2, opid1('-'), ASSOC_LEFT, 12, 0 }, - - { "<", 2, opid1('<'), ASSOC_LEFT, 10, 0 }, - { ">", 2, opid1('>'), ASSOC_LEFT, 10, 0 }, - { "<=", 2, opid2('<','='), ASSOC_LEFT, 10, 0 }, - { ">=", 2, opid2('>','='), ASSOC_LEFT, 10, 0 }, - { "==", 2, opid2('=','='), ASSOC_LEFT, 10, 0 }, - { "!=", 2, opid2('!','='), ASSOC_LEFT, 10, 0 }, - - { "=", 2, opid1('='), ASSOC_RIGHT, 8, 0 }, - { "+=", 2, opid2('+','='), ASSOC_RIGHT, 8, 0 }, - { "-=", 2, opid2('-','='), ASSOC_RIGHT, 8, 0 }, - { "*=", 2, opid2('*','='), ASSOC_RIGHT, 8, 0 }, - { "/=", 2, opid2('/','='), ASSOC_RIGHT, 8, 0 }, - { "%=", 2, opid2('%','='), ASSOC_RIGHT, 8, 0 }, - { "&=", 2, opid2('&','='), ASSOC_RIGHT, 8, 0 }, - { "|=", 2, opid2('|','='), ASSOC_RIGHT, 8, 0 }, - - { "&&", 2, opid2('&','&'), ASSOC_LEFT, 5, 0 }, - { "||", 2, opid2('|','|'), ASSOC_LEFT, 5, 0 }, - - { ",", 2, opid1(','), ASSOC_LEFT, 1, 0 } +static const oper_info fte_operators[] = { + { "(", 0, opid1('('), ASSOC_LEFT, 99, OP_PREFIX, false}, /* paren expression - non function call */ + + { "++", 1, opid3('S','+','+'), ASSOC_LEFT, 15, OP_SUFFIX, false}, + { "--", 1, opid3('S','-','-'), ASSOC_LEFT, 15, OP_SUFFIX, false}, + { ".", 2, opid1('.'), ASSOC_LEFT, 15, 0, false}, + { "(", 0, opid1('('), ASSOC_LEFT, 15, 0, false}, /* function call */ + { "[", 2, opid1('['), ASSOC_LEFT, 15, 0, false}, /* array subscript */ + + { "!", 1, opid2('!','P'), ASSOC_RIGHT, 14, OP_PREFIX, true}, + { "+", 1, opid2('+','P'), ASSOC_RIGHT, 14, OP_PREFIX, false}, + { "-", 1, opid2('-','P'), ASSOC_RIGHT, 14, OP_PREFIX, true}, + { "++", 1, opid3('+','+','P'), ASSOC_RIGHT, 14, OP_PREFIX, false}, + { "--", 1, opid3('-','-','P'), ASSOC_RIGHT, 14, OP_PREFIX, false}, + + { "*", 2, opid1('*'), ASSOC_LEFT, 13, 0, true}, + { "/", 2, opid1('/'), ASSOC_LEFT, 13, 0, true}, + { "&", 2, opid1('&'), ASSOC_LEFT, 13, 0, true}, + { "|", 2, opid1('|'), ASSOC_LEFT, 13, 0, true}, + + { "+", 2, opid1('+'), ASSOC_LEFT, 12, 0, true}, + { "-", 2, opid1('-'), ASSOC_LEFT, 12, 0, true}, + + { "<<", 2, opid2('<','<'), ASSOC_LEFT, 11, 0, true}, + { ">>", 2, opid2('>','>'), ASSOC_LEFT, 11, 0, true}, + + { "<", 2, opid1('<'), ASSOC_LEFT, 10, 0, false}, + { ">", 2, opid1('>'), ASSOC_LEFT, 10, 0, false}, + { "<=", 2, opid2('<','='), ASSOC_LEFT, 10, 0, false}, + { ">=", 2, opid2('>','='), ASSOC_LEFT, 10, 0, false}, + { "==", 2, opid2('=','='), ASSOC_LEFT, 10, 0, true}, + { "!=", 2, opid2('!','='), ASSOC_LEFT, 10, 0, true}, + + { "?", 3, opid2('?',':'), ASSOC_RIGHT, 9, 0, true}, + + { "=", 2, opid1('='), ASSOC_RIGHT, 8, 0, false}, + { "+=", 2, opid2('+','='), ASSOC_RIGHT, 8, 0, false}, + { "-=", 2, opid2('-','='), ASSOC_RIGHT, 8, 0, false}, + { "*=", 2, opid2('*','='), ASSOC_RIGHT, 8, 0, false}, + { "/=", 2, opid2('/','='), ASSOC_RIGHT, 8, 0, false}, + { "%=", 2, opid2('%','='), ASSOC_RIGHT, 8, 0, false}, + { "&=", 2, opid2('&','='), ASSOC_RIGHT, 8, 0, false}, + { "|=", 2, opid2('|','='), ASSOC_RIGHT, 8, 0, false}, + { "&~=", 2, opid3('&','~','='), ASSOC_RIGHT, 8, 0, false}, + + { "&&", 2, opid2('&','&'), ASSOC_LEFT, 5, 0, true}, + { "||", 2, opid2('|','|'), ASSOC_LEFT, 5, 0, true}, + + /* Leave precedence 3 for : with -fcorrect-ternary */ + { ",", 2, opid1(','), ASSOC_LEFT, 2, 0, false}, + { ":", 0, opid2(':','?'), ASSOC_RIGHT, 1, 0, false} }; -static const size_t qcc_operator_count = (sizeof(qcc_operators) / sizeof(qcc_operators[0])); +static const oper_info qcc_operators[] = { + { "(", 0, opid1('('), ASSOC_LEFT, 99, OP_PREFIX, false}, /* paren expression - non function call */ + + { ".", 2, opid1('.'), ASSOC_LEFT, 15, 0, false}, + { "(", 0, opid1('('), ASSOC_LEFT, 15, 0, false}, /* function call */ + { "[", 2, opid1('['), ASSOC_LEFT, 15, 0, false}, /* array subscript */ + + { "!", 1, opid2('!','P'), ASSOC_RIGHT, 14, OP_PREFIX, true}, + { "+", 1, opid2('+','P'), ASSOC_RIGHT, 14, OP_PREFIX, false}, + { "-", 1, opid2('-','P'), ASSOC_RIGHT, 14, OP_PREFIX, true}, + + { "*", 2, opid1('*'), ASSOC_LEFT, 13, 0, true}, + { "/", 2, opid1('/'), ASSOC_LEFT, 13, 0, true}, + { "&", 2, opid1('&'), ASSOC_LEFT, 13, 0, true}, + { "|", 2, opid1('|'), ASSOC_LEFT, 13, 0, true}, + + { "+", 2, opid1('+'), ASSOC_LEFT, 12, 0, true}, + { "-", 2, opid1('-'), ASSOC_LEFT, 12, 0, true}, + + { "<", 2, opid1('<'), ASSOC_LEFT, 10, 0, false}, + { ">", 2, opid1('>'), ASSOC_LEFT, 10, 0, false}, + { "<=", 2, opid2('<','='), ASSOC_LEFT, 10, 0, false}, + { ">=", 2, opid2('>','='), ASSOC_LEFT, 10, 0, false}, + { "==", 2, opid2('=','='), ASSOC_LEFT, 10, 0, true}, + { "!=", 2, opid2('!','='), ASSOC_LEFT, 10, 0, true}, + + { "=", 2, opid1('='), ASSOC_RIGHT, 8, 0, false}, + { "+=", 2, opid2('+','='), ASSOC_RIGHT, 8, 0, false}, + { "-=", 2, opid2('-','='), ASSOC_RIGHT, 8, 0, false}, + { "*=", 2, opid2('*','='), ASSOC_RIGHT, 8, 0, false}, + { "/=", 2, opid2('/','='), ASSOC_RIGHT, 8, 0, false}, + { "%=", 2, opid2('%','='), ASSOC_RIGHT, 8, 0, false}, + { "&=", 2, opid2('&','='), ASSOC_RIGHT, 8, 0, false}, + { "|=", 2, opid2('|','='), ASSOC_RIGHT, 8, 0, false}, + + { "&&", 2, opid2('&','&'), ASSOC_LEFT, 5, 0, true}, + { "||", 2, opid2('|','|'), ASSOC_LEFT, 5, 0, true}, + + { ",", 2, opid1(','), ASSOC_LEFT, 2, 0, false}, +}; extern const oper_info *operators; extern size_t operator_count; -void lexerror(lex_file*, const char *fmt, ...); #endif