2 * Copyright (C) 2012, 2013
6 * Permission is hereby granted, free of charge, to any person obtaining a copy of
7 * this software and associated documentation files (the "Software"), to deal in
8 * the Software without restriction, including without limitation the rights to
9 * use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
10 * of the Software, and to permit persons to whom the Software is furnished to do
11 * so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
31 * GMQCC performs tons of allocations, constructions, and crazyness
32 * all around. When trying to optimizes systems, or just get fancy
33 * statistics out of the compiler, it's often printf mess. This file
34 * implements the statistics system of the compiler. I.E the allocator
35 * we use to track allocations, and other systems of interest.
39 typedef struct stat_mem_block_s {
43 struct stat_mem_block_s *next;
44 struct stat_mem_block_s *prev;
50 } stat_size_entry_t, **stat_size_table_t;
52 static uint64_t stat_mem_allocated = 0;
53 static uint64_t stat_mem_deallocated = 0;
54 static uint64_t stat_mem_allocated_total = 0;
55 static uint64_t stat_mem_deallocated_total = 0;
56 static uint64_t stat_mem_high = 0;
57 static uint64_t stat_mem_peak = 0;
58 static uint64_t stat_mem_strdups = 0;
59 static uint64_t stat_used_strdups = 0;
60 static uint64_t stat_used_vectors = 0;
61 static uint64_t stat_used_hashtables = 0;
62 static uint64_t stat_type_vectors = 0;
63 static uint64_t stat_type_hashtables = 0;
64 static stat_size_table_t stat_size_vectors = NULL;
65 static stat_size_table_t stat_size_hashtables = NULL;
66 static stat_mem_block_t *stat_mem_block_root = NULL;
69 * A tiny size_t key-value hashtbale for tracking vector and hashtable
70 * sizes. We can use it for other things too, if we need to. This is
71 * very TIGHT, and efficent in terms of space though.
73 static stat_size_table_t stat_size_new(void) {
74 return (stat_size_table_t)memset(
75 mem_a(sizeof(stat_size_entry_t*) * ST_SIZE),
76 0, ST_SIZE * sizeof(stat_size_entry_t*)
80 static void stat_size_del(stat_size_table_t table) {
82 for (; i < ST_SIZE; i++) if(table[i]) mem_d(table[i]);
86 static stat_size_entry_t *stat_size_get(stat_size_table_t table, size_t key) {
87 size_t hash = (key % ST_SIZE);
88 while (table[hash] && table[hash]->key != key)
89 hash = (hash + 1) % ST_SIZE;
92 static void stat_size_put(stat_size_table_t table, size_t key, size_t value) {
93 size_t hash = (key % ST_SIZE);
94 while (table[hash] && table[hash]->key != key)
95 hash = (hash + 1) % ST_SIZE;
96 table[hash] = (stat_size_entry_t*)mem_a(sizeof(stat_size_entry_t));
97 table[hash]->key = key;
98 table[hash]->value = value;
102 * A basic header of information wrapper allocator. Simply stores
103 * information as a header, returns the memory + 1 past it, can be
104 * retrieved again with - 1. Where type is stat_mem_block_t*.
106 void *stat_mem_allocate(size_t size, size_t line, const char *file) {
107 stat_mem_block_t *info = (stat_mem_block_t*)malloc(sizeof(stat_mem_block_t) + size);
108 void *data = (void*)(info + 1);
117 info->next = stat_mem_block_root;
119 if (stat_mem_block_root)
120 stat_mem_block_root->prev = info;
122 stat_mem_block_root = info;
123 stat_mem_allocated += size;
124 stat_mem_high += size;
125 stat_mem_allocated_total ++;
127 if (stat_mem_high > stat_mem_peak)
128 stat_mem_peak = stat_mem_high;
133 void stat_mem_deallocate(void *ptr) {
134 stat_mem_block_t *info = NULL;
139 info = ((stat_mem_block_t*)ptr - 1);
141 stat_mem_deallocated += info->size;
142 stat_mem_high -= info->size;
143 stat_mem_deallocated_total ++;
145 if (info->prev) info->prev->next = info->next;
146 if (info->next) info->next->prev = info->prev;
149 if (info == stat_mem_block_root)
150 stat_mem_block_root = info->next;
155 void *stat_mem_reallocate(void *ptr, size_t size, size_t line, const char *file) {
156 stat_mem_block_t *oldinfo = NULL;
157 stat_mem_block_t *newinfo;
160 return stat_mem_allocate(size, line, file);
162 /* stay consistent with glic */
164 stat_mem_deallocate(ptr);
168 oldinfo = ((stat_mem_block_t*)ptr - 1);
169 newinfo = ((stat_mem_block_t*)malloc(sizeof(stat_mem_block_t) + size));
172 stat_mem_deallocate(ptr);
176 memcpy(newinfo+1, oldinfo+1, oldinfo->size);
178 if (oldinfo->prev) oldinfo->prev->next = oldinfo->next;
179 if (oldinfo->next) oldinfo->next->prev = oldinfo->prev;
182 if (oldinfo == stat_mem_block_root)
183 stat_mem_block_root = oldinfo->next;
185 newinfo->line = line;
186 newinfo->size = size;
187 newinfo->file = file;
188 newinfo->prev = NULL;
189 newinfo->next = stat_mem_block_root;
191 if (stat_mem_block_root)
192 stat_mem_block_root->prev = newinfo;
194 stat_mem_block_root = newinfo;
195 stat_mem_allocated -= oldinfo->size;
196 stat_mem_high -= oldinfo->size;
197 stat_mem_allocated += newinfo->size;
198 stat_mem_high += newinfo->size;
200 if (stat_mem_high > stat_mem_peak)
201 stat_mem_peak = stat_mem_high;
209 * strdup does it's own malloc, we need to track malloc. We don't want
210 * to overwrite malloc though, infact, we can't really hook it at all
211 * without library specific assumptions. So we re implement strdup.
213 char *stat_mem_strdup(const char *src, size_t line, const char *file, bool empty) {
221 if (((!empty) ? len : true) && (ptr = (char*)stat_mem_allocate(len + 1, line, file))) {
222 memcpy(ptr, src, len);
226 stat_used_strdups ++;
227 stat_mem_strdups += len;
232 * The reallocate function for resizing vectors.
234 void _util_vec_grow(void **a, size_t i, size_t s) {
235 vector_t *d = vec_meta(*a);
237 stat_size_entry_t *e = NULL;
241 m = 2 * d->allocated + i;
242 p = mem_r(d, s * m + sizeof(vector_t));
245 p = mem_a(s * m + sizeof(vector_t));
246 ((vector_t*)p)->used = 0;
250 if (!stat_size_vectors)
251 stat_size_vectors = stat_size_new();
253 if ((e = stat_size_get(stat_size_vectors, s))) {
256 stat_size_put(stat_size_vectors, s, 1); /* start off with 1 */
260 *a = (vector_t*)p + 1;
261 vec_meta(*a)->allocated = m;
265 * Hash table for generic data, based on dynamic memory allocations
266 * all around. This is the internal interface, please look for
267 * EXPOSED INTERFACE comment below
269 typedef struct hash_node_t {
270 char *key; /* the key for this node in table */
271 void *value; /* pointer to the data as void* */
272 struct hash_node_t *next; /* next node (linked list) */
276 * This is a patched version of the Murmur2 hashing function to use
277 * a proper pre-mix and post-mix setup. Infact this is Murmur3 for
278 * the most part just reinvented.
280 * Murmur 2 contains an inner loop such as:
293 * The two u32s that form the key are the same value x (pulled from data)
294 * this premix stage will perform the same results for both values. Unrolled
295 * this produces just:
305 * This appears to be fine, except what happens when m == 1? well x
306 * cancels out entierly, leaving just:
311 * So all keys hash to the same value, but how often does m == 1?
312 * well, it turns out testing x for all possible values yeilds only
313 * 172,013,942 unique results instead of 2^32. So nearly ~4.6 bits
314 * are cancelled out on average!
316 * This means we have a 14.5% (rounded) chance of colliding more, which
317 * results in another bucket/chain for the hashtable.
319 * We fix it buy upgrading the pre and post mix ssystems to align with murmur
323 #define GMQCC_ROTL32(X, R) (((X) << (R)) | ((X) >> (32 - (R))))
324 GMQCC_INLINE size_t util_hthash(hash_table_t *ht, const char *key) {
325 const unsigned char *data = (const unsigned char *)key;
326 const size_t len = strlen(key);
327 const size_t block = len / 4;
328 const uint32_t mask1 = 0xCC9E2D51;
329 const uint32_t mask2 = 0x1B873593;
330 const uint32_t *blocks = (const uint32_t*)(data + block * 4);
331 const unsigned char *tail = (const unsigned char *)(data + block * 4);
335 uint32_t h = 0x1EF0 ^ len;
337 for (i = -block; i; i++) {
340 k = GMQCC_ROTL32(k, 15);
343 h = GMQCC_ROTL32(h, 13);
344 h = h * 5 + 0xE6546B64;
356 k = GMQCC_ROTL32(k, 15);
368 return (size_t) (h % ht->size);
372 /* We keep the old for reference */
373 GMQCC_INLINE size_t util_hthash(hash_table_t *ht, const char *key) {
374 const uint32_t mix = 0x5BD1E995;
375 const uint32_t rot = 24;
376 size_t size = strlen(key);
377 uint32_t hash = 0x1EF0 /* LICRC TAB */ ^ size;
379 const unsigned char *data = (const unsigned char*)key;
382 alias = (data[0] | (data[1] << 8) | (data[2] << 16) | (data[3] << 24));
384 alias ^= alias >> rot;
395 case 3: hash ^= data[2] << 16;
396 case 2: hash ^= data[1] << 8;
397 case 1: hash ^= data[0];
405 return (size_t) (hash % ht->size);
409 static hash_node_t *_util_htnewpair(const char *key, void *value) {
411 if (!(node = (hash_node_t*)mem_a(sizeof(hash_node_t))))
414 if (!(node->key = util_strdupe(key))) {
426 * EXPOSED INTERFACE for the hashtable implementation
427 * util_htnew(size) -- to make a new hashtable
428 * util_htset(table, key, value, sizeof(value)) -- to set something in the table
429 * util_htget(table, key) -- to get something from the table
430 * util_htdel(table) -- to delete the table
432 hash_table_t *util_htnew(size_t size) {
433 hash_table_t *hashtable = NULL;
434 stat_size_entry_t *find = NULL;
439 if (!stat_size_hashtables)
440 stat_size_hashtables = stat_size_new();
442 if (!(hashtable = (hash_table_t*)mem_a(sizeof(hash_table_t))))
445 if (!(hashtable->table = (hash_node_t**)mem_a(sizeof(hash_node_t*) * size))) {
450 if ((find = stat_size_get(stat_size_hashtables, size)))
453 stat_type_hashtables++;
454 stat_size_put(stat_size_hashtables, size, 1);
457 hashtable->size = size;
458 memset(hashtable->table, 0, sizeof(hash_node_t*) * size);
460 stat_used_hashtables++;
464 void util_htseth(hash_table_t *ht, const char *key, size_t bin, void *value) {
465 hash_node_t *newnode = NULL;
466 hash_node_t *next = NULL;
467 hash_node_t *last = NULL;
469 next = ht->table[bin];
471 while (next && next->key && strcmp(key, next->key) > 0)
472 last = next, next = next->next;
474 /* already in table, do a replace */
475 if (next && next->key && strcmp(key, next->key) == 0) {
478 /* not found, grow a pair man :P */
479 newnode = _util_htnewpair(key, value);
480 if (next == ht->table[bin]) {
481 newnode->next = next;
482 ht->table[bin] = newnode;
484 last->next = newnode;
486 newnode->next = next;
487 last->next = newnode;
492 void util_htset(hash_table_t *ht, const char *key, void *value) {
493 util_htseth(ht, key, util_hthash(ht, key), value);
496 void *util_htgeth(hash_table_t *ht, const char *key, size_t bin) {
497 hash_node_t *pair = ht->table[bin];
499 while (pair && pair->key && strcmp(key, pair->key) > 0)
502 if (!pair || !pair->key || strcmp(key, pair->key) != 0)
508 void *util_htget(hash_table_t *ht, const char *key) {
509 return util_htgeth(ht, key, util_hthash(ht, key));
512 void *code_util_str_htgeth(hash_table_t *ht, const char *key, size_t bin) {
517 keylen = strlen(key);
519 pair = ht->table[bin];
520 while (pair && pair->key) {
521 len = strlen(pair->key);
527 cmp = strcmp(key, pair->key);
535 cmp = strcmp(key, pair->key + len - keylen);
537 uintptr_t up = (uintptr_t)pair->value;
547 * Free all allocated data in a hashtable, this is quite the amount
550 void util_htrem(hash_table_t *ht, void (*callback)(void *data)) {
553 for (; i < ht->size; ++i) {
554 hash_node_t *n = ht->table[i];
574 void util_htrmh(hash_table_t *ht, const char *key, size_t bin, void (*cb)(void*)) {
575 hash_node_t **pair = &ht->table[bin];
578 while (*pair && (*pair)->key && strcmp(key, (*pair)->key) > 0)
579 pair = &(*pair)->next;
582 if (!tmp || !tmp->key || strcmp(key, tmp->key) != 0)
593 void util_htrm(hash_table_t *ht, const char *key, void (*cb)(void*)) {
594 util_htrmh(ht, key, util_hthash(ht, key), cb);
597 void util_htdel(hash_table_t *ht) {
598 util_htrem(ht, NULL);
602 * The following functions below implement printing / dumping of statistical
605 static void stat_dump_mem_contents(stat_mem_block_t *memory, uint16_t cols) {
607 for (i = 0; i < memory->size + ((memory->size % cols) ? (cols - memory->size % cols) : 0); i++) {
608 if (i % cols == 0) con_out(" 0x%06X: ", i);
609 if (i < memory->size) con_out("%02X " , 0xFF & ((unsigned char*)(memory + 1))[i]);
612 if ((uint16_t)(i % cols) == (cols - 1)) {
613 for (j = i - (cols - 1); j <= i; j++) {
617 : (util_isprint(((unsigned char*)(memory + 1))[j]))
618 ? 0xFF & ((unsigned char*)(memory + 1)) [j]
627 static void stat_dump_mem_leaks(void) {
628 stat_mem_block_t *info;
629 for (info = stat_mem_block_root; info; info = info->next) {
630 con_out("lost: %u (bytes) at %s:%u\n",
636 stat_dump_mem_contents(info, OPTS_OPTION_U16(OPTION_MEMDUMPCOLS));
640 static void stat_dump_mem_info(void) {
641 con_out("Memory Information:\n\
642 Total allocations: %llu\n\
643 Total deallocations: %llu\n\
644 Total allocated: %f (MB)\n\
645 Total deallocated: %f (MB)\n\
646 Total peak memory: %f (MB)\n\
647 Total leaked memory: %f (MB) in %llu allocations\n",
648 stat_mem_allocated_total,
649 stat_mem_deallocated_total,
650 (float)(stat_mem_allocated) / 1048576.0f,
651 (float)(stat_mem_deallocated) / 1048576.0f,
652 (float)(stat_mem_peak) / 1048576.0f,
653 (float)(stat_mem_allocated - stat_mem_deallocated) / 1048576.0f,
654 stat_mem_allocated_total - stat_mem_deallocated_total
658 static void stat_dump_stats_table(stat_size_table_t table, const char *string, uint64_t *size) {
664 for (i = 0, j = 1; i < ST_SIZE; i++) {
665 stat_size_entry_t *entry;
667 if (!(entry = table[i]))
670 con_out(string, (unsigned)j, (unsigned)entry->key, (unsigned)entry->value);
674 *size += entry->key * entry->value;
679 if (OPTS_OPTION_BOOL(OPTION_MEMCHK) ||
680 OPTS_OPTION_BOOL(OPTION_STATISTICS)) {
683 con_out("Memory Statistics:\n\
684 Total vectors allocated: %llu\n\
685 Total string duplicates: %llu\n\
686 Total string duplicate memory: %f (MB)\n\
687 Total hashtables allocated: %llu\n\
688 Total unique vector sizes: %llu\n",
691 (float)(stat_mem_strdups) / 1048576.0f,
692 stat_used_hashtables,
696 stat_dump_stats_table (
698 " %2u| # of %5u byte vectors: %u\n",
703 " Total unique hashtable sizes: %llu\n",
707 stat_dump_stats_table (
708 stat_size_hashtables,
709 " %2u| # of %5u element hashtables: %u\n",
714 " Total vector memory: %f (MB)\n\n",
715 (float)(mem) / 1048576.0f
719 if (stat_size_vectors)
720 stat_size_del(stat_size_vectors);
721 if (stat_size_hashtables)
722 stat_size_del(stat_size_hashtables);
724 if (OPTS_OPTION_BOOL(OPTION_DEBUG) ||
725 OPTS_OPTION_BOOL(OPTION_MEMCHK))
726 stat_dump_mem_info();
728 if (OPTS_OPTION_BOOL(OPTION_DEBUG))
729 stat_dump_mem_leaks();