Cthulhu  0.2.10
Cthulhu compiler collection
ssa.c
Go to the documentation of this file.
1 // SPDX-License-Identifier: LGPL-3.0-only
2 
3 #include "common/common.h"
4 
5 #include "cthulhu/tree/query.h"
6 
7 #include "arena/arena.h"
8 #include "std/str.h"
9 #include "std/map.h"
10 #include "std/set.h"
11 #include "std/vector.h"
12 
13 #include "std/typed/vector.h"
14 
15 #include "base/panic.h"
16 #include <stdio.h>
17 
19 typedef struct ssa_compile_t
20 {
22 
26 
31 
33 
35 
38  size_t string_count;
40 
44 
48 
52 
56 
60 
63 
67 
70 
76 
78 typedef struct ssa_loop_t
79 {
82 
85 } ssa_loop_t;
86 
87 static void add_dep(ssa_compile_t *ssa, const ssa_symbol_t *symbol, const ssa_symbol_t *dep)
88 {
89  set_t *set = map_get(ssa->symbol_deps, symbol);
90  if (set == NULL)
91  {
92  set = set_new(8, kTypeInfoPtr, ssa->arena);
93  map_set(ssa->symbol_deps, symbol, set);
94  }
95 
96  set_add(set, dep);
97 }
98 
99 static ssa_symbol_t *symbol_new(ssa_compile_t *ssa, const char *name, const tree_t *type, tree_attribs_t attribs, ssa_storage_t storage)
100 {
101  const ssa_type_t *ssa_type = ssa_type_create_cached(ssa->types, type);
102 
103  ssa_symbol_t *symbol = ARENA_MALLOC(sizeof(ssa_symbol_t), name, ssa, ssa->arena);
104  symbol->linkage = attribs.link;
105  symbol->visibility = attribs.visibility;
106  symbol->linkage_string = attribs.mangle;
107  symbol->storage = storage;
108 
109  symbol->locals = NULL;
110  symbol->params = NULL;
111 
112  symbol->name = name;
113  symbol->type = ssa_type;
114  symbol->value = NULL;
115  symbol->entry = NULL;
116 
117  symbol->blocks = vector_new(4, ssa->arena);
118 
119  return symbol;
120 }
121 
122 static ssa_symbol_t *symbol_create_decl(ssa_compile_t *ssa, const tree_t *tree, ssa_storage_t storage)
123 {
124  const char *name = tree_get_name(tree);
125  const tree_attribs_t *attrib = tree_get_attrib(tree);
126 
127  return symbol_new(ssa, name, tree_get_type(tree), *attrib, storage);
128 }
129 
130 static ssa_storage_t create_new_storage(map_t *types, const tree_t *type, size_t size, tree_quals_t quals)
131 {
132  ssa_storage_t storage = {
133  .type = ssa_type_create_cached(types, type),
134  .size = size,
135  .quals = quals
136  };
137 
138  return storage;
139 }
140 
141 static ssa_storage_t create_storage_for_decl(map_t *types, const tree_t *decl)
142 {
143  const tree_t *type = tree_get_storage_type(decl);
144  size_t size = tree_get_storage_size(decl);
145  tree_quals_t quals = tree_get_storage_quals(decl);
146  return create_new_storage(types, type, size, quals);
147 }
148 
149 static ssa_symbol_t *function_create(ssa_compile_t *ssa, const tree_t *tree)
150 {
151  CTASSERTF(tree_is(tree, eTreeDeclFunction), "expected function, got %s", tree_to_string(tree));
152  ssa_storage_t storage = { .type = NULL, .size = 0, .quals = eQualNone };
153  ssa_symbol_t *self = symbol_create_decl(ssa, tree, storage);
154 
155  size_t locals = vector_len(tree->locals);
156  self->locals = typevec_of(sizeof(ssa_local_t), locals, ssa->arena);
157  for (size_t i = 0; i < locals; i++)
158  {
159  const tree_t *local = vector_get(tree->locals, i);
160  ssa_storage_t type_storage = create_storage_for_decl(ssa->types, local);
161  const ssa_type_t *type = ssa_type_create_cached(ssa->types, tree_get_type(local));
162  const char *name = tree_get_name(local);
163 
164  ssa_local_t it = {
165  .storage = type_storage,
166  .name = name,
167  .type = type,
168  };
169 
170  typevec_set(self->locals, i, &it);
171  map_set(ssa->symbol_locals, local, (void*)(uintptr_t)i);
172  }
173 
174  size_t params = vector_len(tree->params);
175  self->params = typevec_of(sizeof(ssa_param_t), params, ssa->arena);
176  for (size_t i = 0; i < params; i++)
177  {
178  const tree_t *param = vector_get(tree->params, i);
180  const char *name = tree_get_name(param);
181 
182  ssa_param_t it = {
183  .name = name,
184  .type = ty,
185  };
186 
187  typevec_set(self->params, i, &it);
188  map_set(ssa->symbol_locals, param, (void*)(uintptr_t)i);
189  }
190 
191  return self;
192 }
193 
194 static ssa_symbol_t *intern_string(ssa_compile_t *ssa, const tree_t *tree)
195 {
196  CTASSERT(ssa != NULL);
197 
198  text_view_t view = tree->string_value;
199  CTASSERT(view.text != NULL);
200 
201  // see if we already have this string
202  ssa_symbol_t *symbol = map_get(ssa->strings, &view);
203  if (symbol != NULL)
204  {
205  return symbol;
206  }
207 
208  // otherwise create all the data we need
209  tree_attribs_t attribs = {
210  .link = eLinkModule,
211  .visibility = eVisiblePrivate,
212  };
213  const tree_t *type = tree_get_type(tree);
214 
215  // we need the load type here because we're creating storage for this string
216  const tree_t *inner = tree_ty_load_type(type);
217  ssa_storage_t storage = create_new_storage(ssa->types, inner, view.length + 1, eQualConst);
218  ssa_symbol_t *it = symbol_new(ssa, NULL, type, attribs, storage);
219  it->value = ssa_value_string(it->type, view);
220  text_view_t *ptr = arena_memdup(&view, sizeof(text_view_t), ssa->arena);
221  map_set(ssa->strings, ptr, it);
222 
223  vector_push(&ssa->current_module->globals, it);
224 
225  return it;
226 }
227 
228 static ssa_module_t *module_create(ssa_compile_t *ssa, const char *name)
229 {
230  ssa_module_t *mod = ARENA_MALLOC(sizeof(ssa_module_t), name, ssa, ssa->arena);
231  mod->name = name;
232 
233  mod->globals = vector_new(32, ssa->arena);
234  mod->functions = vector_new(32, ssa->arena);
235  mod->types = vector_new(32, ssa->arena);
236 
237  return mod;
238 }
239 
240 static ssa_operand_t bb_add_step(ssa_block_t *bb, ssa_step_t step)
241 {
242  size_t index = typevec_len(bb->steps);
243 
244  typevec_push(bb->steps, &step);
245 
246  ssa_operand_t operand = {
247  .kind = eOperandReg,
248  .vreg_context = bb,
249  .vreg_index = index
250  };
251 
252  return operand;
253 }
254 
255 static ssa_operand_t operand_empty(void)
256 {
257  ssa_operand_t operand = {
258  .kind = eOperandEmpty
259  };
260  return operand;
261 }
262 
263 static ssa_operand_t operand_bb(ssa_block_t *bb)
264 {
265  ssa_operand_t operand = {
266  .kind = eOperandBlock,
267  .bb = bb
268  };
269  return operand;
270 }
271 
272 static ssa_operand_t add_step(ssa_compile_t *ssa, ssa_step_t step)
273 {
274  return bb_add_step(ssa->current_block, step);
275 }
276 
277 static ssa_block_t *ssa_block_create(ssa_symbol_t *symbol, const char *name, size_t size, arena_t *arena)
278 {
279  ssa_block_t *bb = ARENA_MALLOC(sizeof(ssa_block_t), name, symbol, arena);
280  bb->name = name;
281  bb->steps = typevec_new(sizeof(ssa_step_t), size, arena);
282  vector_push(&symbol->blocks, bb);
283 
284  ARENA_IDENTIFY(bb->steps, "steps", bb, arena);
285 
286  return bb;
287 }
288 
289 static ssa_operand_t compile_tree(ssa_compile_t *ssa, const tree_t *tree);
290 
291 static ssa_operand_t compile_branch(ssa_compile_t *ssa, const tree_t *branch)
292 {
293  ssa_operand_t cond = compile_tree(ssa, branch->cond);
294  ssa_block_t *current = ssa->current_block;
295 
296  ssa_block_t *tail_block = ssa_block_create(ssa->current_symbol, "tail", 0, ssa->arena);
297  ssa_block_t *then_block = ssa_block_create(ssa->current_symbol, "then", 0, ssa->arena);
298  ssa_block_t *else_block = branch->other != NULL ? ssa_block_create(ssa->current_symbol, "other", 0, ssa->arena) : NULL;
299 
300  ssa_step_t step = {
301  .opcode = eOpBranch,
302  .branch = {
303  .cond = cond,
304  .then = operand_bb(then_block),
305  .other = else_block ? operand_bb(else_block) : operand_bb(tail_block)
306  }
307  };
308 
309  ssa_operand_t tail = {
310  .kind = eOperandBlock,
311  .bb = tail_block
312  };
313  ssa_step_t jump_to_tail = {
314  .opcode = eOpJump,
315  .jump = {
316  .target = tail
317  }
318  };
319 
320  ssa->current_block = then_block;
321  compile_tree(ssa, branch->then);
322  bb_add_step(then_block, jump_to_tail);
323 
324  if (branch->other != NULL)
325  {
326  ssa->current_block = else_block;
327  compile_tree(ssa, branch->other);
328  bb_add_step(else_block, jump_to_tail);
329  }
330 
331  ssa->current_block = current;
332  add_step(ssa, step);
333 
334  ssa->current_block = tail_block;
335 
336  return tail;
337 }
338 
339 static ssa_operand_t compile_loop(ssa_compile_t *ssa, const tree_t *tree)
340 {
353  ssa_block_t *loop_block = ssa_block_create(ssa->current_symbol, NULL, 0, ssa->arena);
354  ssa_block_t *body_block = ssa_block_create(ssa->current_symbol, NULL, 0, ssa->arena);
355  ssa_block_t *tail_block = ssa_block_create(ssa->current_symbol, NULL, 0, ssa->arena);
356 
357  ssa_loop_t save = {
358  .enter_loop = body_block,
359  .exit_loop = tail_block,
360  };
361  map_set(ssa->symbol_loops, tree, &save);
362 
363  ssa_operand_t loop = {
364  .kind = eOperandBlock,
365  .bb = loop_block
366  };
367 
368  ssa_operand_t tail = {
369  .kind = eOperandBlock,
370  .bb = tail_block
371  };
372 
373  ssa_step_t enter_loop = {
374  .opcode = eOpJump,
375  .jump = {
376  .target = loop
377  }
378  };
379  add_step(ssa, enter_loop);
380 
381  ssa->current_block = loop_block;
382  ssa_operand_t cond = compile_tree(ssa, tree->cond);
383  ssa_step_t cmp = {
384  .opcode = eOpBranch,
385  .branch = {
386  .cond = cond,
387  .then = operand_bb(body_block),
388  .other = tail
389  }
390  };
391  add_step(ssa, cmp);
392 
393  ssa->current_block = body_block;
394  compile_tree(ssa, tree->then);
395 
396  ssa_step_t repeat_loop = {
397  .opcode = eOpJump,
398  .jump = {
399  .target = loop
400  }
401  };
402  add_step(ssa, repeat_loop);
403 
404  map_delete(ssa->symbol_loops, tree);
405 
406  ssa->current_block = tail_block;
407  return loop;
408 }
409 
410 static ssa_operand_t add_jump(ssa_compile_t *ssa, ssa_loop_t *loop, tree_jump_t jump)
411 {
412  switch (jump)
413  {
414  case eJumpBreak: {
415  ssa_step_t step = {
416  .opcode = eOpJump,
417  .jump = {
418  .target = operand_bb(loop->exit_loop)
419  }
420  };
421  return add_step(ssa, step);
422  }
423  case eJumpContinue: {
424  ssa_step_t step = {
425  .opcode = eOpJump,
426  .jump = {
427  .target = operand_bb(loop->enter_loop)
428  }
429  };
430  return add_step(ssa, step);
431  }
432 
433  default: CT_NEVER("unhandled jump %d", jump);
434  }
435 }
436 
437 static size_t get_field_index(const tree_t *ty, const tree_t *field)
438 {
439  CTASSERTF(tree_is(ty, eTreeTypeStruct), "expected struct, got %s", tree_to_string(ty));
440 
441  size_t result = vector_find(ty->fields, field);
442  CTASSERTF(result != SIZE_MAX, "field `%s` not found in `%s`", tree_get_name(field), tree_to_string(ty));
443  return result;
444 }
445 
446 static ssa_operand_t get_field(ssa_compile_t *ssa, const tree_t *tree)
447 {
448  const tree_t *ty = tree_get_type(tree->object);
449  CTASSERTF(tree_ty_is_address(ty), "expected address, got %s", tree_to_string(ty));
450 
451  ssa_operand_t object = compile_tree(ssa, tree->object);
452  size_t index = get_field_index(ty->ptr, tree->field);
453 
454  ssa_step_t step = {
455  .opcode = eOpMember,
456  .member = {
457  .object = object,
458  .index = index
459  }
460  };
461  return add_step(ssa, step);
462 }
463 
464 static ssa_operand_t compile_tree(ssa_compile_t *ssa, const tree_t *tree)
465 {
466  CTASSERT(ssa != NULL);
467  CTASSERT(tree != NULL);
468 
469  switch (tree->kind)
470  {
471  case eTreeExprEmpty: {
472  ssa_operand_t operand = {
473  .kind = eOperandEmpty
474  };
475  return operand;
476  }
477 
478  case eTreeDeclCase: {
479  ssa_operand_t operand = {
480  .kind = eOperandImm,
481  .value = ssa_value_from(ssa->types, tree->case_value)
482  };
483 
484  return operand;
485  }
486 
487  case eTreeExprDigit:
488  case eTreeExprBool:
489  case eTreeExprUnit: {
490  ssa_operand_t operand = {
491  .kind = eOperandImm,
492  .value = ssa_value_from(ssa->types, tree)
493  };
494  return operand;
495  }
496 
497  case eTreeExprString: {
498  ssa_symbol_t *string = intern_string(ssa, tree);
499  add_dep(ssa, ssa->current_symbol, string);
500  ssa_operand_t operand = {
501  .kind = eOperandGlobal,
502  .global = string
503  };
504  return operand;
505  }
506 
507  case eTreeExprCast: {
508  ssa_operand_t expr = compile_tree(ssa, tree->expr);
509  ssa_step_t step = {
510  .opcode = eOpCast,
511  .cast = {
512  .operand = expr,
513  .type = ssa_type_create_cached(ssa->types, tree_get_type(tree))
514  }
515  };
516  return add_step(ssa, step);
517  }
518 
519  case eTreeExprOffset: {
520  ssa_operand_t expr = compile_tree(ssa, tree->expr);
521  ssa_operand_t offset = compile_tree(ssa, tree->offset);
522 
523  ssa_step_t step = {
524  .opcode = eOpOffset,
525  .offset = {
526  .array = expr,
527  .offset = offset
528  }
529  };
530  return add_step(ssa, step);
531  }
532 
533  case eTreeExprField: {
534  return get_field(ssa, tree);
535  }
536 
537  case eTreeExprUnary: {
538  ssa_operand_t expr = compile_tree(ssa, tree->operand);
539  ssa_step_t step = {
540  .opcode = eOpUnary,
541  .unary = {
542  .operand = expr,
543  .unary = tree->unary
544  }
545  };
546  return add_step(ssa, step);
547  }
548 
549  case eTreeExprBinary: {
550  ssa_operand_t lhs = compile_tree(ssa, tree->lhs);
551  ssa_operand_t rhs = compile_tree(ssa, tree->rhs);
552  ssa_step_t step = {
553  .opcode = eOpBinary,
554  .binary = {
555  .lhs = lhs,
556  .rhs = rhs,
557  .binary = tree->binary
558  }
559  };
560  return add_step(ssa, step);
561  }
562 
563  case eTreeDeclGlobal: {
564  ssa_symbol_t *symbol = map_get(ssa->globals, tree);
565  CTASSERTF(symbol != NULL, "symbol table missing `%s` (%p)", tree_to_string(tree), (void*)tree);
566 
567  add_dep(ssa, ssa->current_symbol, symbol);
568 
569  ssa_operand_t operand = {
570  .kind = eOperandGlobal,
571  .global = symbol
572  };
573 
574  return operand;
575  }
576 
577  case eTreeExprLoad: {
578  ssa_operand_t operand = compile_tree(ssa, tree->load);
579  ssa_step_t step = {
580  .opcode = eOpLoad,
581  .load = {
582  .src = operand
583  }
584  };
585  return add_step(ssa, step);
586  }
587 
588  case eTreeStmtJump: {
589  ssa_loop_t *target = map_get(ssa->symbol_loops, tree->label);
590  CTASSERTF(target != NULL, "loop not found");
591 
592  return add_jump(ssa, target, tree->jump);
593  }
594 
595  case eTreeExprAddressOf: {
596  ssa_operand_t operand = compile_tree(ssa, tree->expr);
597  ssa_step_t step = {
598  .opcode = eOpAddress,
599  .addr = {
600  .symbol = operand
601  }
602  };
603  return add_step(ssa, step);
604  }
605 
606  case eTreeStmtBlock: {
607  size_t len = vector_len(tree->stmts);
608  for (size_t i = 0; i < len; i++)
609  {
610  const tree_t *stmt = vector_get(tree->stmts, i);
611  compile_tree(ssa, stmt);
612  }
613 
614  return operand_empty();
615  }
616 
617  case eTreeStmtAssign: {
618  ssa_operand_t dst = compile_tree(ssa, tree->dst);
619  ssa_operand_t src = compile_tree(ssa, tree->src);
620 
621  ssa_step_t step = {
622  .opcode = eOpStore,
623  .store = {
624  .dst = dst,
625  .src = src
626  }
627  };
628  return add_step(ssa, step);
629  }
630 
631  case eTreeDeclLocal: {
632  size_t idx = (uintptr_t)map_get_default(ssa->symbol_locals, tree, (void*)UINTPTR_MAX);
633  CTASSERTF(idx != UINTPTR_MAX, "local `%s` not found", tree_get_name(tree));
634 
635  ssa_operand_t local = {
636  .kind = eOperandLocal,
637  .local = idx
638  };
639  return local;
640  }
641 
642  case eTreeDeclParam: {
643  size_t idx = (uintptr_t)map_get_default(ssa->symbol_locals, tree, (void*)UINTPTR_MAX);
644  CTASSERTF(idx != UINTPTR_MAX, "param `%s` not found", tree_get_name(tree));
645 
646  ssa_operand_t param = {
647  .kind = eOperandParam,
648  .param = idx
649  };
650  return param;
651  }
652 
653  case eTreeStmtReturn: {
654  ssa_operand_t value = compile_tree(ssa, tree->value);
655  ssa_step_t step = {
656  .opcode = eOpReturn,
657  .ret = {
658  .value = value
659  }
660  };
661  return add_step(ssa, step);
662  }
663 
664  case eTreeExprCall: {
665  ssa_operand_t callee = compile_tree(ssa, tree->callee);
666  size_t len = vector_len(tree->args);
667  typevec_t *args = typevec_of(sizeof(ssa_operand_t), len, ssa->arena);
668  for (size_t i = 0; i < len; i++)
669  {
670  const tree_t *arg = vector_get(tree->args, i);
671  ssa_operand_t operand = compile_tree(ssa, arg);
672  typevec_set(args, i, &operand);
673  }
674 
675  ssa_step_t step = {
676  .opcode = eOpCall,
677  .call = {
678  .function = callee,
679  .args = args
680  }
681  };
682 
683  return add_step(ssa, step);
684  }
685 
686  case eTreeDeclFunction: {
687  ssa_symbol_t *fn = map_get(ssa->functions, tree);
688  CTASSERT(fn != NULL);
689 
690  add_dep(ssa, ssa->current_symbol, fn);
691  ssa_operand_t operand = {
692  .kind = eOperandFunction,
693  .function = fn
694  };
695 
696  return operand;
697  }
698 
699  case eTreeStmtBranch:
700  return compile_branch(ssa, tree);
701 
702  case eTreeExprCompare: {
703  ssa_operand_t lhs = compile_tree(ssa, tree->lhs);
704  ssa_operand_t rhs = compile_tree(ssa, tree->rhs);
705 
706  ssa_step_t step = {
707  .opcode = eOpCompare,
708  .compare = {
709  .lhs = lhs,
710  .rhs = rhs,
711  .compare = tree->compare
712  }
713  };
714 
715  return add_step(ssa, step);
716  }
717 
718  case eTreeStmtLoop:
719  return compile_loop(ssa, tree);
720 
721  case eTreeExprAlignOf: {
722  ssa_step_t step = {
723  .opcode = eOpAlignOf,
724  .size_of = {
725  ssa_type_create_cached(ssa->types, tree->object)
726  }
727  };
728 
729  return add_step(ssa, step);
730  }
731 
732  case eTreeExprSizeOf: {
733  ssa_step_t step = {
734  .opcode = eOpSizeOf,
735  .size_of = {
736  ssa_type_create_cached(ssa->types, tree->object)
737  }
738  };
739 
740  return add_step(ssa, step);
741  }
742 
743  case eTreeExprOffsetOf: {
744  const ssa_type_t *ty = ssa_type_create_cached(ssa->types, tree->object);
745 
746  ssa_step_t step = {
747  .opcode = eOpOffsetOf,
748  .offset_of = {
749  .type = ty,
750  .index = get_field_index(tree->object, tree->field)
751  }
752  };
753 
754  return add_step(ssa, step);
755  }
756 
757  default: CT_NEVER("unhandled tree %s", tree_to_string(tree));
758  }
759 }
760 
761 static void add_module_globals(ssa_compile_t *ssa, ssa_module_t *mod, map_t *globals)
762 {
763  map_iter_t iter = map_iter(globals);
764  while (map_has_next(&iter))
765  {
766  map_entry_t entry = map_next(&iter);
767 
768  const tree_t *tree = entry.value;
769  CTASSERTF(tree_is(tree, eTreeDeclGlobal), "expected global, got %s", tree_to_string(tree));
770 
771  ssa_symbol_t *global = symbol_create_decl(ssa, tree, create_storage_for_decl(ssa->types, tree));
772 
773  vector_push(&mod->globals, global);
774  map_set(ssa->globals, tree, global);
775  map_set(ssa->module_lookup, global, mod);
776  }
777 }
778 
779 static void add_module_functions(ssa_compile_t *ssa, ssa_module_t *mod, map_t *functions)
780 {
781  map_iter_t iter = map_iter(functions);
782  while (map_has_next(&iter))
783  {
784  map_entry_t entry = map_next(&iter);
785 
786  const tree_t *tree = entry.value;
787  ssa_symbol_t *symbol = function_create(ssa, tree);
788 
789  vector_push(&mod->functions, symbol);
790  map_set(ssa->functions, tree, symbol);
791  map_set(ssa->module_lookup, symbol, mod);
792  }
793 }
794 
795 static void add_module_types(ssa_compile_t *ssa, ssa_module_t *mod, map_t *types)
796 {
797  map_iter_t iter = map_iter(types);
798  while (map_has_next(&iter))
799  {
800  map_entry_t entry = map_next(&iter);
801 
802  const tree_t *tree = entry.value;
803  ssa_type_t *type = ssa_type_create_cached(ssa->types, tree);
804 
805  vector_push(&mod->types, type);
806  map_set(ssa->types, tree, type);
807  }
808 }
809 
810 static void forward_module(ssa_compile_t *ssa, const tree_t *tree)
811 {
812  const char *id = tree_get_name(tree);
813  ssa_module_t *mod = module_create(ssa, id);
814 
815  add_module_globals(ssa, mod, tree_module_tag(tree, eSemaValues));
816  add_module_functions(ssa, mod, tree_module_tag(tree, eSemaProcs));
817  add_module_types(ssa, mod, tree_module_tag(tree, eSemaTypes));
818 
819  vector_push(&ssa->modules, mod);
820 
821  map_t *children = tree_module_tag(tree, eSemaModules);
822  map_iter_t iter = map_iter(children);
823  while (map_has_next(&iter))
824  {
825  map_entry_t entry = map_next(&iter);
826 
827  forward_module(ssa, entry.value);
828  }
829 }
830 
831 static void begin_compile(ssa_compile_t *ssa, ssa_symbol_t *symbol)
832 {
833  ssa_block_t *bb = ssa_block_create(symbol, "entry", 4, ssa->arena);
834 
835  symbol->entry = bb;
836  ssa->current_block = bb;
837  ssa->current_symbol = symbol;
838 }
839 
840 // static void reset_local_maps(ssa_compile_t *ssa)
841 // {
842 // map_reset(ssa->locals);
843 // map_reset(ssa->loops);
844 // }
845 
848 typedef struct ssa_map_sizes_t
849 {
851  size_t modules;
852 
854  size_t deps;
855 
857  size_t globals;
858 
860  size_t functions;
861 
863  size_t types;
865 
866 void count_modules(ssa_map_sizes_t *sizes, const tree_t *tree)
867 {
868  CTASSERT(tree_is(tree, eTreeDeclModule));
869 
870  sizes->modules += 1;
871 
872  sizes->globals += map_count(tree_module_tag(tree, eSemaValues));
873  sizes->functions += map_count(tree_module_tag(tree, eSemaProcs));
874  sizes->types += map_count(tree_module_tag(tree, eSemaTypes));
875 
876  // count all child modules
878  while (map_has_next(&iter))
879  {
880  map_entry_t entry = map_next(&iter);
881  count_modules(sizes, entry.value);
882  }
883 }
884 
886 {
887  // initialize will small sizes just in case something
888  // returns 0
889  ssa_map_sizes_t sizes = {
890  .modules = 4,
891  .deps = 4,
892 
893  .globals = 32,
894  .functions = 32,
895  .types = 32,
896  };
897 
898  size_t len = vector_len(mods);
899  for (size_t i = 0; i < len; i++)
900  {
901  const tree_t *mod = vector_get(mods, i);
902  count_modules(&sizes, mod);
903  }
904 
905  sizes.deps = sizes.functions + sizes.globals;
906 
907  return sizes;
908 }
909 
910 STA_DECL
912 {
913  CTASSERT(mods != NULL);
914  CTASSERT(arena != NULL);
915 
916  ssa_map_sizes_t sizes = predict_maps(mods);
917 
918  ssa_compile_t ssa = {
919  .arena = arena,
920 
921  .modules = vector_new(sizes.modules, arena),
922  .symbol_deps = map_optimal(sizes.deps, kTypeInfoPtr, arena),
923 
924  .strings = map_optimal(sizes.globals + sizes.functions, kTypeInfoText, arena),
925 
926  .globals = map_optimal(sizes.globals, kTypeInfoPtr, arena),
927  .functions = map_optimal(sizes.functions, kTypeInfoPtr, arena),
928  .types = map_optimal(sizes.types, kTypeInfoPtr, arena),
929 
930  // TODO: these should be per symbol rather than persistent global
931  .symbol_locals = map_optimal(sizes.deps * 4, kTypeInfoPtr, arena),
932  .symbol_loops = map_optimal(32, kTypeInfoPtr, arena),
933 
934  .module_lookup = map_optimal(sizes.deps, kTypeInfoPtr, arena),
935  };
936 
937  size_t len = vector_len(mods);
938  for (size_t i = 0; i < len; i++)
939  {
940  const tree_t *mod = vector_get(mods, i);
941  forward_module(&ssa, mod);
942  }
943 
944  map_iter_t globals = map_iter(ssa.globals);
945  while (map_has_next(&globals))
946  {
947  map_entry_t entry = map_next(&globals);
948 
949  const tree_t *tree = entry.key;
950  ssa_symbol_t *global = entry.value;
951 
952  ssa.current_module = map_get(ssa.module_lookup, global);
953  CTASSERTF(ssa.current_module != NULL, "global `%s` has no module", global->name);
954 
955  begin_compile(&ssa, global);
956 
957  if (tree->initial != NULL)
958  {
959  ssa_operand_t value = compile_tree(&ssa, tree->initial);
960  ssa_step_t ret = {
961  .opcode = eOpReturn,
962  .ret = {
963  .value = value
964  }
965  };
966  add_step(&ssa, ret);
967  }
968  else
969  {
970  ssa_value_t *noinit = ssa_value_noinit(global->type);
971  ssa_operand_t value = operand_value(noinit);
972  ssa_step_t ret = {
973  .opcode = eOpReturn,
974  .ret = {
975  .value = value
976  }
977  };
978  add_step(&ssa, ret);
979  }
980 
981  map_reset(ssa.symbol_loops);
982  }
983 
984  map_iter_t functions = map_iter(ssa.functions);
985  while (map_has_next(&functions))
986  {
987  map_entry_t entry = map_next(&functions);
988 
989  const tree_t *tree = entry.key;
990  ssa_symbol_t *symbol = entry.value;
991 
992  ssa.current_module = map_get(ssa.module_lookup, symbol);
993  CTASSERTF(ssa.current_module != NULL, "symbol `%s` has no module", symbol->name);
994 
995  begin_compile(&ssa, symbol);
996 
997  const tree_t *body = tree->body;
998  if (body != NULL)
999  {
1000  // TODO: should extern functions be put somewhere else
1001  compile_tree(&ssa, body);
1002  }
1003  else
1004  {
1005  CTASSERTF(symbol->linkage == eLinkImport,
1006  "function `%s` has no implementation, but is not an imported symbol (linkage=%s)",
1007  symbol->name, linkage_string(symbol->linkage)
1008  );
1009  }
1010 
1011  map_reset(ssa.symbol_loops);
1012  }
1013 
1014  ssa_result_t result = {
1015  .modules = ssa.modules,
1016  .deps = ssa.symbol_deps
1017  };
1018 
1019  return result;
1020 }
1021 
1022 static const char *const kTypeNameTable[eTypeCount] = {
1023 #define SSA_KIND(ID, NAME) [ID] = (NAME),
1024 #include "cthulhu/ssa/ssa.inc"
1025 };
1026 
1027 static const char *const kOperandNameTable[eOperandCount] = {
1028 #define SSA_OPERAND(ID, NAME) [ID] = (NAME),
1029 #include "cthulhu/ssa/ssa.inc"
1030 };
1031 
1032 static const char *const kOpCodeNameTable[eOpCount] = {
1033 #define SSA_OPCODE(ID, NAME) [ID] = (NAME),
1034 #include "cthulhu/ssa/ssa.inc"
1035 };
1036 
1037 static const char *const kValueNameTable[eValueCount] = {
1038 #define SSA_VALUE(ID, NAME) [ID] = (NAME),
1039 #include "cthulhu/ssa/ssa.inc"
1040 };
1041 
1042 STA_DECL
1043 const char *ssa_type_name(ssa_kind_t kind)
1044 {
1045  CT_ASSERT_RANGE(kind, 0, eTypeCount - 1);
1046 
1047  return kTypeNameTable[kind];
1048 }
1049 
1050 STA_DECL
1052 {
1053  CT_ASSERT_RANGE(kind, 0, eOpCount - 1);
1054 
1055  return kOperandNameTable[kind];
1056 }
1057 
1058 STA_DECL
1059 const char *ssa_opcode_name(ssa_opcode_t opcode)
1060 {
1061  CT_ASSERT_RANGE(opcode, 0, eOpCount - 1);
1062 
1063  return kOpCodeNameTable[opcode];
1064 }
1065 
1066 STA_DECL
1068 {
1069  CT_ASSERT_RANGE(value, 0, eValueCount - 1);
1070 
1071  return kValueNameTable[value];
1072 }
CT_NODISCARD size_t size
Definition: scan.h:128
CT_PUREFN CT_TREE_API const char * tree_get_name(const tree_t *tree)
Definition: context.c:102
CT_PUREFN CT_TREE_API const tree_t * tree_get_type(const tree_t *tree)
Definition: context.c:132
CT_PUREFN CT_TREE_API bool tree_is(const tree_t *self, tree_kind_t kind)
Definition: query.c:91
ssa_operand_t operand_value(ssa_value_t *value)
Definition: operand.c:5
ssa_value_t * ssa_value_string(const ssa_type_t *type, text_view_t text)
Definition: value.c:62
ssa_type_t * ssa_type_create_cached(map_t *cache, const tree_t *type)
Definition: type.c:226
ssa_value_t * ssa_value_from(map_t *types, const tree_t *expr)
Definition: value.c:87
ssa_value_t * ssa_value_noinit(const ssa_type_t *type)
Definition: value.c:101
void count_modules(ssa_map_sizes_t *sizes, const tree_t *tree)
Definition: ssa.c:866
STA_DECL const char * ssa_value_name(ssa_value_state_t value)
Definition: ssa.c:1067
STA_DECL const char * ssa_type_name(ssa_kind_t kind)
Definition: ssa.c:1043
ssa_map_sizes_t predict_maps(vector_t *mods)
Definition: ssa.c:885
STA_DECL const char * ssa_opcode_name(ssa_opcode_t opcode)
Definition: ssa.c:1059
STA_DECL const char * ssa_opkind_name(ssa_opkind_t kind)
Definition: ssa.c:1051
CT_TREE_API tree_quals_t tree_get_storage_quals(const tree_t *self)
Definition: query.c:126
CT_PUREFN CT_TREE_API bool tree_ty_is_address(const tree_t *type)
Definition: query.c:238
CT_TREE_API const char * tree_to_string(const tree_t *self)
Definition: query.c:40
CT_TREE_API const tree_t * tree_get_storage_type(const tree_t *self)
Definition: query.c:136
CT_TREE_API const tree_attribs_t * tree_get_attrib(const tree_t *self)
Definition: query.c:83
CT_PUREFN CT_TREE_API const tree_t * tree_ty_load_type(const tree_t *self)
get the type of a type after it has been loaded
Definition: query.c:267
CT_TREE_API size_t tree_get_storage_size(const tree_t *self)
Definition: query.c:144
#define STA_DECL
sal2 annotation on function implementations to copy annotations from the declaration
STA_RET_STRING colour_t idx
Definition: colour.h:98
CT_NODISCARD CT_PUREFN CT_STD_API size_t map_count(const map_t *map)
get the number of key-value pairs in a map
Definition: map.c:176
CT_NODISCARD CT_PUREFN CT_STD_API void * map_get_default(const map_t *map, const void *key, void *other)
get a value from a map or a default value
Definition: map.c:333
CT_NODISCARD CT_STD_API map_t * map_optimal(size_t size, hash_info_t info, arena_t *arena)
create a new map with an optimal size
Definition: optimal.c:85
CT_NODISCARD CT_PUREFN CT_STD_API bool map_has_next(const map_iter_t *iter)
check if a map iterator has more elements
Definition: map.c:509
CT_STD_API void map_reset(map_t *map)
clear all key-value pairs from a map
Definition: map.c:386
CT_STD_API bool map_delete(map_t *map, const void *key)
delete a key-value pair from a map
Definition: map.c:361
CT_NODISCARD CT_PUREFN CT_STD_API map_iter_t map_iter(const map_t *map)
create a new map iterator
Definition: map.c:456
CT_STD_API void map_set(map_t *map, const void *key, void *value)
set a key-value pair in a map
Definition: map.c:294
CT_NODISCARD CT_PUREFN CT_STD_API void * map_get(const map_t *map, const void *key)
get a value from a map
Definition: map.c:324
CT_NODISCARD CT_NOALIAS CT_STD_API map_entry_t map_next(map_iter_t *iter)
get the next key-value pair from a map iterator
Definition: map.c:476
CT_NODISCARD CT_STD_API set_t * set_new(size_t size, hash_info_t info, arena_t *arena)
create a new set
Definition: set.c:51
CT_STD_API const void * set_add(set_t *set, const void *key)
add a key to a set
Definition: set.c:85
CT_NODISCARD CT_ARENA_API void * arena_memdup(STA_READS(size) const void *ptr, size_t size, arena_t *arena)
duplicate a memory region from a custom allocator duplicate a region of memory and return a pointer t...
#define ARENA_IDENTIFY(ptr, name, parent, arena)
rename and reparent a pointer in a custom allocator
Definition: arena.h:409
#define ARENA_MALLOC(size, name, parent, arena)
allocate memory from a custom allocator
Definition: arena.h:392
#define CT_ASSERT_RANGE(value, min, max)
assert that a value is in a range inclusive bounds check
Definition: panic.h:148
#define CT_NEVER(...)
assert that a code path is never reached
Definition: panic.h:136
#define CTASSERT(expr)
assert a condition, prints the condition as a message
Definition: panic.h:130
#define CTASSERTF(expr,...)
assert a condition with a message and optional format arguments
Definition: panic.h:116
ssa_opcode_t
Definition: ssa.h:54
STA_DECL ssa_result_t ssa_compile(vector_t *mods, arena_t *arena)
compile a set of trees into their ssa form
Definition: ssa.c:911
ssa_kind_t
Definition: ssa.h:40
ssa_opkind_t
Definition: ssa.h:47
ssa_value_state_t
Definition: ssa.h:61
@ eOpCount
Definition: ssa.h:58
@ eTypeCount
Definition: ssa.h:44
@ eOperandCount
Definition: ssa.h:51
@ eValueCount
Definition: ssa.h:65
tree_jump_t
the type of jump
Definition: ops.h:80
CT_TREE_API const char * linkage_string(tree_linkage_t link)
get the name of a linkage
Definition: ops.c:141
tree_quals_t
all type qualifiers
Definition: ops.h:25
CT_TREE_API map_t * tree_module_tag(const tree_t *self, size_t tag)
Definition: sema.c:125
@ eSemaValues
Definition: tree.h:36
@ eSemaProcs
Definition: tree.h:42
@ eSemaModules
Definition: tree.h:45
@ eSemaTypes
Definition: tree.h:39
CT_STD_API const hash_info_t kTypeInfoPtr
type information for a generic pointer this operates on the pointer itself and not the data it points...
Definition: typeinfo.c:41
CT_STD_API const hash_info_t kTypeInfoText
type information for a text_view_t
Definition: typeinfo.c:47
CT_STD_API void typevec_set(typevec_t *vec, size_t index, const void *src)
set an element in the vector
Definition: vector.c:128
CT_NODISCARD CT_STD_API typevec_t * typevec_of(size_t width, size_t len, arena_t *arena)
create a new typed vector with an initial size and length
Definition: vector.c:83
CT_STD_API void * typevec_push(typevec_t *vec, const void *src)
push a value onto the vector
Definition: vector.c:156
CT_NODISCARD CT_PUREFN CT_STD_API size_t typevec_len(const typevec_t *vec)
get the length of a vector
Definition: vector.c:120
CT_NODISCARD CT_STD_API typevec_t * typevec_new(size_t width, size_t len, arena_t *arena)
create a new typed vector on the heap
Definition: vector.c:77
CT_NODISCARD CT_PUREFN CT_STD_API void * vector_get(const vector_t *vector, size_t index)
get a value from a vector
Definition: vector.c:134
CT_NODISCARD CT_STD_API vector_t * vector_new(size_t size, arena_t *arena)
create a new vector with an initial capacity
Definition: vector.c:63
CT_STD_API void vector_push(vector_t **vector, void *value)
push a value onto the end of a vector
Definition: vector.c:108
CT_PUREFN CT_STD_API size_t vector_find(vector_t *vector, const void *element)
find an element in a vector searches via pointer equality
Definition: vector.c:160
CT_NODISCARD CT_PUREFN CT_STD_API size_t vector_len(const vector_t *vector)
get the length of a vector
Definition: vector.c:152
an allocator object
Definition: arena.h:86
a key-value pair in a map
Definition: map.h:175
const void * key
the key of this entry
Definition: map.h:176
void * value
the value of this entry
Definition: map.h:177
a map iterator handle
Definition: map.h:183
an unordered hash map
Definition: map.h:38
an unordered hash set
Definition: set.c:19
typevec_t * steps
Definition: ssa.h:330
const char * name
Definition: ssa.h:329
the ssa compilation context
Definition: ssa.c:20
map_t * symbol_locals
all locals in the current symbol map<tree, size_t>
Definition: ssa.c:55
map_t * types
all types in the program map<tree, ssa_type>
Definition: ssa.c:51
map_t * symbol_deps
direct dependencies between symbols dependecies are a cyclic graph, this is a map of the edges map<ss...
Definition: ssa.c:30
size_t string_count
all strings in the program map_t<text_view_t*, ssa_symbol>
Definition: ssa.c:38
vector_t * modules
result data
Definition: ssa.c:25
map_t * globals
all globals in the program map<tree, ssa_symbol>
Definition: ssa.c:43
map_t * symbol_loops
all loops in the current symbol map<tree, ssa_loop>
Definition: ssa.c:59
ssa_module_t * current_module
the current module being compiled
Definition: ssa.c:69
ssa_symbol_t * current_symbol
the current symbol being compiled can be a function or a global
Definition: ssa.c:66
map_t * strings
Definition: ssa.c:39
map_t * functions
all functions in the program map<tree, ssa_symbol>
Definition: ssa.c:47
map_t * module_lookup
map of symbol to its source module map<ssa_symbol, ssa_module> TODO: this is stupid
Definition: ssa.c:74
ssa_block_t * current_block
the current block being compiled
Definition: ssa.c:62
arena_t * arena
internal data
Definition: ssa.c:34
ssa_storage_t storage
Definition: ssa.h:95
loop jump context
Definition: ssa.c:79
ssa_block_t * enter_loop
the block to jump to when continuing the loop
Definition: ssa.c:81
ssa_block_t * exit_loop
the block to jump to when exiting the loop
Definition: ssa.c:84
a prediction of how many items will be in each map this is not a hard limit, but a hint to the alloca...
Definition: ssa.c:849
size_t types
the number of types in the program
Definition: ssa.c:863
size_t deps
the number of dependencies between symbols
Definition: ssa.c:854
size_t modules
the number of modules in the program
Definition: ssa.c:851
size_t globals
the number of globals in the program
Definition: ssa.c:857
size_t functions
the number of functions in the program
Definition: ssa.c:860
vector_t * types
vector<ssa_type_t> all types used by this module
Definition: ssa.h:357
vector_t * functions
vector<ssa_symbol_t> all functions declared/imported/exported by this module
Definition: ssa.h:359
vector_t * globals
vector<ssa_symbol_t> all globals declared/imported/exported by this module
Definition: ssa.h:358
const char * name
Definition: ssa.h:355
ssa_opkind_t kind
Definition: ssa.h:192
const char * name
Definition: ssa.h:90
vector_t * modules
Definition: ssa.h:363
ssa_opcode_t opcode
Definition: ssa.h:299
ssa underlying storage type
Definition: ssa.h:78
const ssa_type_t * type
the internal storage type
Definition: ssa.h:80
ssa_block_t * entry
entry block
Definition: ssa.h:349
const ssa_type_t * type
the public facing type of this symbol
Definition: ssa.h:341
vector_t * blocks
vector_t<ssa_block_t *>
Definition: ssa.h:351
ssa_storage_t storage
the backing storage for this symbol
Definition: ssa.h:342
tree_visibility_t visibility
Definition: ssa.h:336
typevec_t * params
typevec_t<ssa_type_t>
Definition: ssa.h:347
const char * linkage_string
external name
Definition: ssa.h:338
const ssa_value_t * value
the value of this symbol, must always be set for globals
Definition: ssa.h:344
typevec_t * locals
typevec_t<ssa_type_t>
Definition: ssa.h:346
tree_linkage_t linkage
Definition: ssa.h:335
const char * name
internal name
Definition: ssa.h:340
tree_quals_t quals
Definition: ssa.h:147
a non-owning view of text
Definition: text.h:24
size_t length
the number of characters in the text
Definition: text.h:30
tree_visibility_t visibility
the visibility of the declaration
Definition: tree.h:52
const char * mangle
override the mangle of the declaration
Definition: tree.h:54
tree_linkage_t link
the link type of the declaration
Definition: tree.h:51
Definition: tree.h:67
tree_kind_t kind
Definition: tree.h:68
tree_t * operand
Definition: tree.h:97
const tree_t * value
Definition: tree.h:127
tree_t * initial
Definition: tree.h:218
compare_t compare
Definition: tree.h:104
tree_t * label
Definition: tree.h:157
const tree_t * field
Definition: tree.h:151
tree_t * other
Definition: tree.h:140
const tree_t * rhs
Definition: tree.h:108
const tree_t * lhs
Definition: tree.h:107
const tree_t * callee
Definition: tree.h:113
vector_t * locals
Definition: tree.h:202
vector_t * fields
Definition: tree.h:184
const vector_t * args
Definition: tree.h:114
tree_t * cond
Definition: tree.h:138
binary_t binary
Definition: tree.h:103
text_view_t string_value
Definition: tree.h:81
tree_t * dst
Definition: tree.h:131
const tree_t * ptr
Definition: tree.h:172
tree_t * then
Definition: tree.h:139
const tree_t * offset
Definition: tree.h:148
const vector_t * stmts
Definition: tree.h:124
const tree_t * object
Definition: tree.h:145
const vector_t * params
Definition: tree.h:197
tree_t * body
Definition: tree.h:203
tree_t * load
Definition: tree.h:84
const tree_t * src
Definition: tree.h:132
const tree_t * expr
Definition: tree.h:88
tree_jump_t jump
Definition: tree.h:158
tree_t * case_value
Definition: tree.h:194
unary_t unary
Definition: tree.h:96
A vector with a fixed type size.
Definition: vector.h:24
a generic vector of pointers
Definition: vector.c:16