/*
* Copyright (C) 2012
- * Dale Weiler
+ * Dale Weiler
*
* Permission is hereby granted, free of charge, to any person obtaining a copy of
* this software and associated documentation files (the "Software"), to deal in
* SOFTWARE.
*/
#include "gmqcc.h"
-/*
- * This is the assembler, gmqas, this is being implemented because I'm
- * not exactly sure how codegen would work for the C compiler as of yet
- * and also I plan to allow inline assembly for the compiler.
- */
-static const struct {
- const char *m; /* menomic */
- const size_t o; /* operands */
- const size_t l; /* menomic len */
-} const asm_instr[] = {
- [INSTR_DONE] = { "DONE" , 1, 4 },
- [INSTR_MUL_F] = { "MUL_F" , 3, 5 },
- [INSTR_MUL_V] = { "MUL_V" , 3, 5 },
- [INSTR_MUL_FV] = { "MUL_FV" , 3, 6 },
- [INSTR_MUL_VF] = { "MUL_VF" , 3, 6 },
- [INSTR_DIV_F] = { "DIV" , 0, 3 },
- [INSTR_ADD_F] = { "ADD_F" , 3, 5 },
- [INSTR_ADD_V] = { "ADD_V" , 3, 5 },
- [INSTR_SUB_F] = { "SUB_F" , 3, 5 },
- [INSTR_SUB_V] = { "DUB_V" , 3, 5 },
- [INSTR_EQ_F] = { "EQ_F" , 0, 4 },
- [INSTR_EQ_V] = { "EQ_V" , 0, 4 },
- [INSTR_EQ_S] = { "EQ_S" , 0, 4 },
- [INSTR_EQ_E] = { "EQ_E" , 0, 4 },
- [INSTR_EQ_FNC] = { "ES_FNC" , 0, 6 },
- [INSTR_NE_F] = { "NE_F" , 0, 4 },
- [INSTR_NE_V] = { "NE_V" , 0, 4 },
- [INSTR_NE_S] = { "NE_S" , 0, 4 },
- [INSTR_NE_E] = { "NE_E" , 0, 4 },
- [INSTR_NE_FNC] = { "NE_FNC" , 0, 6 },
- [INSTR_LE] = { "LE" , 0, 2 },
- [INSTR_GE] = { "GE" , 0, 2 },
- [INSTR_LT] = { "LT" , 0, 2 },
- [INSTR_GT] = { "GT" , 0, 2 },
- [INSTR_LOAD_F] = { "FIELD_F" , 0, 7 },
- [INSTR_LOAD_V] = { "FIELD_V" , 0, 7 },
- [INSTR_LOAD_S] = { "FIELD_S" , 0, 7 },
- [INSTR_LOAD_ENT] = { "FIELD_ENT" , 0, 9 },
- [INSTR_LOAD_FLD] = { "FIELD_FLD" , 0, 9 },
- [INSTR_LOAD_FNC] = { "FIELD_FNC" , 0, 9 },
- [INSTR_ADDRESS] = { "ADDRESS" , 0, 7 },
- [INSTR_STORE_F] = { "STORE_F" , 0, 7 },
- [INSTR_STORE_V] = { "STORE_V" , 0, 7 },
- [INSTR_STORE_S] = { "STORE_S" , 0, 7 },
- [INSTR_STORE_ENT] = { "STORE_ENT" , 0, 9 },
- [INSTR_STORE_FLD] = { "STORE_FLD" , 0, 9 },
- [INSTR_STORE_FNC] = { "STORE_FNC" , 0, 9 },
- [INSTR_STOREP_F] = { "STOREP_F" , 0, 8 },
- [INSTR_STOREP_V] = { "STOREP_V" , 0, 8 },
- [INSTR_STOREP_S] = { "STOREP_S" , 0, 8 },
- [INSTR_STOREP_ENT] = { "STOREP_ENT", 0, 10},
- [INSTR_STOREP_FLD] = { "STOREP_FLD", 0, 10},
- [INSTR_STOREP_FNC] = { "STOREP_FNC", 0, 10},
- [INSTR_RETURN] = { "RETURN" , 0, 6 },
- [INSTR_NOT_F] = { "NOT_F" , 0, 5 },
- [INSTR_NOT_V] = { "NOT_V" , 0, 5 },
- [INSTR_NOT_S] = { "NOT_S" , 0, 5 },
- [INSTR_NOT_ENT] = { "NOT_ENT" , 0, 7 },
- [INSTR_NOT_FNC] = { "NOT_FNC" , 0, 7 },
- [INSTR_IF] = { "IF" , 0, 2 },
- [INSTR_IFNOT] = { "IFNOT" , 0, 5 },
- [INSTR_CALL0] = { "CALL0" , 0, 5 },
- [INSTR_CALL1] = { "CALL1" , 0, 5 },
- [INSTR_CALL2] = { "CALL2" , 0, 5 },
- [INSTR_CALL3] = { "CALL3" , 0, 5 },
- [INSTR_CALL4] = { "CALL4" , 0, 5 },
- [INSTR_CALL5] = { "CALL5" , 0, 5 },
- [INSTR_CALL6] = { "CALL6" , 0, 5 },
- [INSTR_CALL7] = { "CALL7" , 0, 5 },
- [INSTR_CALL8] = { "CALL8" , 0, 5 },
- [INSTR_STATE] = { "STATE" , 0, 5 },
- [INSTR_GOTO] = { "GOTO" , 0, 4 },
- [INSTR_AND] = { "AND" , 0, 3 },
- [INSTR_OR] = { "OR" , 0, 2 },
- [INSTR_BITAND] = { "BITAND" , 0, 6 },
- [INSTR_BITOR] = { "BITOR" , 0, 5 }
-};
-
/*
* Some assembler keywords not part of the opcodes above: these are
* for creating functions, or constants.
*/
const char *const asm_keys[] = {
- "FLOAT" , /* define float */
- "VECTOR" , /* define vector */
- "ENTITY" , /* define ent */
- "FIELD" , /* define field */
- "STRING" , /* define string */
- "FUNCTION"
+ "FLOAT" , /* define float */
+ "VECTOR" , /* define vector */
+ "ENTITY" , /* define ent */
+ "FIELD" , /* define field */
+ "STRING" , /* define string */
+ "FUNCTION"
};
static char *const asm_getline(size_t *byte, FILE *fp) {
- char *line = NULL;
- ssize_t read = util_getline(&line, byte, fp);
- *byte = read;
- if (read == -1) {
- mem_d (line);
- return NULL;
- }
- return line;
+ char *line = NULL;
+ ssize_t read = util_getline(&line, byte, fp);
+ *byte = read;
+ if (read == -1) {
+ mem_d (line);
+ return NULL;
+ }
+ return line;
}
-#define asm_rmnewline(L,S) *((L)+*(S)-1) = '\0'
-#define asm_skipwhite(L) \
- while((*(L)==' '||*(L)=='\t')) { \
- (L)++; \
- }
-
void asm_init(const char *file, FILE **fp) {
- *fp = fopen(file, "r");
- code_init();
+ *fp = fopen(file, "r");
+ code_init();
}
void asm_close(FILE *fp) {
- fclose(fp);
- code_write();
+ fclose(fp);
+ code_write();
}
/*
* Following parse states:
- * ASM_FUNCTION -- in a function accepting input statements
- * ....
+ * ASM_FUNCTION -- in a function accepting input statements
+ * ....
*/
typedef enum {
- ASM_NULL,
- ASM_FUNCTION
+ ASM_NULL,
+ ASM_FUNCTION
} asm_state;
typedef struct {
- char *name; /* name of constant */
- int offset; /* location in globals */
+ char *name; /* name of constant */
+ int offset; /* location in globals */
} globals;
VECTOR_MAKE(globals, assembly_constants);
-
+
+void asm_clear() {
+ size_t i = 0;
+ for (; i < assembly_constants_elements; i++)
+ mem_d(assembly_constants_data[i].name);
+ mem_d(assembly_constants_data);
+}
+
+int asm_parsetype(const char *key, char **skip, long line) {
+ size_t keylen = strlen(key);
+ if (!strncmp(key, *skip, keylen)) {
+ if ((*skip)[keylen] != ':'){
+ printf("%li: Missing `:` after decltype\n", line);
+ exit(1);
+ }
+ *skip += keylen+1;
+ while (**skip == ' ' || **skip == '\t')
+ (*skip)++;
+
+ if (!isalpha(**skip)) {
+ printf("%li: Invalid identififer: %s\n", line, *skip);
+ exit(1);
+ } else {
+ assembly_constants_add((globals) {
+ .name = util_strdup("empty"),
+ .offset = code_globals_elements
+ });
+ return 1;
+ }
+ }
+ return 0;
+}
+
void asm_parse(FILE *fp) {
- char *data = NULL;
- char *skip = NULL;
- long line = 1; /* current line */
- size_t size = 0; /* size of line */
- asm_state state = ASM_NULL;
-
- while ((data = asm_getline(&size, fp)) != NULL) {
- skip = data;
- asm_skipwhite(skip);
- asm_rmnewline(skip, &size);
-
- #define DECLTYPE(X, CODE) \
- if (!strncmp(X, skip, strlen(X))) { \
- if (skip[strlen(X)] != ':') { \
- printf("%li: Missing `:` after decltype\n",line); \
- exit (1); \
- } \
- skip += strlen(X)+1; \
- asm_skipwhite(skip); \
- if(!isalpha(*skip)) { \
- printf("%li: Invalid identififer: %s\n", line, skip); \
- exit (1); \
- } else { \
- size_t offset_code = code_statements_elements+1; \
- size_t offset_chars = code_strings_elements +1; \
- size_t offset_globals = code_globals_elements +1; \
- size_t offset_functions = code_functions_elements +1; \
- size_t offset_fields = code_fields_elements +1; \
- size_t offset_defs = code_defs_elements +1; \
- CODE \
- /* silent unused warnings */ \
- (void)offset_code; \
- (void)offset_chars; \
- (void)offset_globals; \
- (void)offset_functions; \
- (void)offset_fields; \
- (void)offset_defs; \
- assembly_constants_add((globals){ \
- .name = util_strdup(skip), \
- .offset = offset_globals \
- }); \
- } \
- goto end; \
- }
-
- /* FLOAT */
- DECLTYPE(asm_keys[0], {
- code_defs_add((prog_section_def){
- .type = TYPE_FLOAT,
- .offset = offset_globals, /* global table */
- .name = offset_chars /* string table TODO */
- });
- float f = 0; /*TODO*/
- code_globals_add(*(int*)&f);
-
- });
- DECLTYPE(asm_keys[1], {
- code_defs_add((prog_section_def){
- .type = TYPE_FLOAT,
- .offset = offset_globals, /* global table */
- .name = offset_chars /* string table TODO */
- });
- float f1 = 0;
- float f2 = 0;
- float f3 = 0;
- code_globals_add(*(int*)&f1);
- code_globals_add(*(int*)&f2);
- code_globals_add(*(int*)&f3);
- });
- /* ENTITY */ DECLTYPE(asm_keys[2], {});
- /* FIELD */ DECLTYPE(asm_keys[3], {});
- /* STRING */
- DECLTYPE(asm_keys[4], {
- code_defs_add((prog_section_def){
- .type = TYPE_STRING,
- .offset = offset_globals, /* offset to offset in string table (for data)*/
- .name = offset_chars /* location of name in string table (for name)*/
- });
- code_strings_add('h');
- });
- /* FUNCTION */
- DECLTYPE(asm_keys[5], {
- /* TODO: parse */
- if (state != ASM_NULL) {
- printf("%li: Error unfinished function block, expected DONE or RETURN\n", line);
- goto end;
- }
-
- state = ASM_FUNCTION;
- code_defs_add((prog_section_def){
- .type = TYPE_VOID,
- .offset = offset_globals,
- .name = offset_chars
- });
- code_globals_add(offset_functions);
- code_functions_add((prog_section_function){
- .entry = offset_code,
- .firstlocal = 0,
- .locals = 0,
- .profile = 0,
- .name = offset_chars,
- .file = 0,
- .nargs = 0,
- .argsize = {0}
- });
- });
-
- /* if we make it this far then we have statements */
- {
- size_t i = 0; /* counter */
- size_t o = 0; /* operands */
- char *t = NULL; /* token */
-
- /*
- * Most ops a single statement can have is three.
- * lets allocate some space for all of those here.
- */
- char op[3][32768] = {{0},{0},{0}};
- for (; i < sizeof(asm_instr)/sizeof(*asm_instr); i++) {
- if (!strncmp(skip, asm_instr[i].m, asm_instr[i].l)) {
- if (state != ASM_FUNCTION) {
- printf("%li: Statement not inside function block\n", line);
- goto end;
- }
-
- /* update parser state */
- if (i == INSTR_DONE || i == INSTR_RETURN) {
- goto end;
- state = ASM_NULL;
- }
-
- /* parse the statement */
- o = asm_instr[i].o; /* operands */
- skip += asm_instr[i].l; /* skip instruction */
- t = strtok(skip, " ,");
- i = 0;
- while (t != NULL && i < 3) {
- strcpy(op[i], t);
- t = strtok(NULL, " ,");
- i ++;
- }
-
- util_debug("ASM", "Operand 1: %s\n", util_strrnl(op[0]));
- util_debug("ASM", "Operand 2: %s\n", util_strrnl(op[1]));
- util_debug("ASM", "Operand 3: %s\n", util_strrnl(op[2]));
-
- /* check */
- if (i != o) {
- printf("not enough operands, expected: %li, got %li\n", o, i);
- }
-
- /* TODO: hashtable value LOAD .... etc */
- code_statements_add((prog_section_statement){
- i, {0}, {0}, {0}
- });
- goto end;
- }
- }
- }
-
- /* if we made it this far something is wrong */
- if (*skip != '\0')
- printf("%li: Invalid statement, expression, or decleration\n", line);
-
- end:
- //free(data);
- mem_d(data);
- line ++;
- }
+ char *data = NULL;
+ char *skip = NULL;
+ long line = 1; /* current line */
+ size_t size = 0; /* size of line */
+ asm_state state = ASM_NULL;
+
+ while ((data = skip = asm_getline(&size, fp)) != NULL) {
+ /* remove any whitespace at start */
+ while (*skip == ' ' || *skip == '\t')
+ skip++;
+ /* remove newline at end of string */
+ *(skip+*(&size)-1) = '\0';
+
+ if (asm_parsetype(asm_keys[5], &skip, line)) {
+ if (state != ASM_NULL) {
+ printf("%li: Error unfinished function block, expected DONE or RETURN\n", line);
+ goto end;
+ }
+ state = ASM_FUNCTION;
+ code_defs_add((prog_section_def){
+ .type = TYPE_VOID,
+ .offset = code_globals_elements,
+ .name = code_chars_elements
+ });
+ code_globals_add(code_functions_elements);
+ code_functions_add((prog_section_function) {
+ .entry = code_statements_elements,
+ .firstlocal = 0,
+ .locals = 0,
+ .profile = 0,
+ .name = code_chars_elements,
+ .file = 0,
+ .nargs = 0,
+ .argsize = {0}
+ });
+ code_strings_add(skip);
+ };
+
+ #if 0
+ /* if we make it this far then we have statements */
+ {
+ size_t i = 0; /* counter */
+ size_t o = 0; /* operands */
+ size_t c = 0; /* copy */
+ char *t = NULL; /* token */
+
+ /*
+ * Most ops a single statement can have is three.
+ * lets allocate some space for all of those here.
+ */
+ char op[3][32768] = {{0},{0},{0}};
+ for (; i < sizeof(asm_instr)/sizeof(*asm_instr); i++) {
+ if (!strncmp(skip, asm_instr[i].m, asm_instr[i].l)) {
+ if (state != ASM_FUNCTION) {
+ printf("%li: Statement not inside function block\n", line);
+ goto end;
+ }
+
+ /* update parser state */
+ if (i == INSTR_DONE || i == INSTR_RETURN) {
+ goto end;
+ state = ASM_NULL;
+ }
+
+ /* parse the statement */
+ c = i;
+ o = asm_instr[i].o; /* operands */
+ skip += asm_instr[i].l; /* skip instruction */
+ t = strtok(skip, " ,");
+ i = 0;
+ while (t != NULL && i < 3) {
+ strcpy(op[i], t);
+ t = strtok(NULL, " ,");
+ i ++;
+ }
+
+ /* check */
+ if (i != o) {
+ printf("not enough operands, expected: %li, got %li\n", o, i);
+ }
+
+ /* TODO: hashtable value LOAD .... etc */
+ code_statements_add((prog_section_statement){
+ c,
+ { atof(op[0]) },
+ { atof(op[1]) },
+ { atof(op[2]) }
+ });
+ goto end;
+ }
+ }
+ }
+ #endif
+
+ /* if we made it this far something is wrong */
+ if (*skip != '\0')
+ printf("%li: Invalid statement %s, expression, or decleration\n", line, skip);
+
+ end:
+ mem_d(data);
+ line ++;
+ }
+ asm_clear();
}