Cthulhu  0.2.10
Cthulhu compiler collection
tree.c
Go to the documentation of this file.
1 // SPDX-License-Identifier: LGPL-3.0-only
2 
3 #include "base/util.h"
4 #include "cthulhu/check/check.h"
5 
7 
8 #include "cthulhu/tree/ops.h"
9 #include "cthulhu/util/util.h"
10 #include "cthulhu/util/types.h"
11 
12 #include "cthulhu/tree/tree.h"
13 #include "cthulhu/tree/query.h"
14 
15 #include "arena/arena.h"
16 #include "std/vector.h"
17 #include "std/set.h"
18 #include "std/map.h"
19 #include "std/str.h"
20 
21 #include "base/panic.h"
22 #include "core/macros.h"
23 
24 #include <stdint.h>
25 #include <stdio.h>
26 
27 typedef struct check_t
28 {
30 
31  const tree_t *cli_entry;
32  const tree_t *gui_entry;
33 
36 
39 } check_t;
40 
41 // check for a valid name and a type being set
42 static bool check_simple(check_t *check, const tree_t *decl)
43 {
44  CT_UNUSED(check);
45 
46  if (tree_is(decl, eTreeError)) { return false; } // TODO: are errors always reported?
47 
48  const char *id = tree_get_user_name(decl);
49  if (!tree_is_symbol_anonymous(decl))
50  {
51  if (str_equal(id, ""))
52  {
53  msg_notify(check->reports, &kEvent_InvalidName, tree_get_node(decl),
54  "declaration has an empty name"
55  );
56  return false;
57  }
58  }
59  else
60  {
61  const tree_attribs_t *attribs = tree_get_attrib(decl);
62  if (attribs->link != eLinkModule)
63  {
64  msg_notify(check->reports, &kEvent_InvalidName, tree_get_node(decl),
65  "externally visible declaration is anonymous"
66  );
67  return false;
68  }
69  }
70 
71  const tree_t *ty = tree_get_type(decl);
72  CTASSERTF(ty != NULL, "decl `%s` has no type", id);
73 
74  return true;
75 }
76 
77 static void check_global_attribs(check_t *check, const tree_t *global)
78 {
79  const tree_attribs_t *attribs = tree_get_attrib(global);
80  switch (attribs->link)
81  {
82  case eLinkImport:
83  if (global->initial != NULL)
84  {
85  event_builder_t id = msg_notify(check->reports, &kEvent_ImportedWithImpl, tree_get_node(global),
86  "global `%s` is marked as imported but has an implementation",
87  tree_get_name(global)
88  );
89  msg_note(id, "implementation will be ignored");
90  }
91  break;
92 
93  case eLinkModule:
94  if (attribs->mangle != NULL)
95  {
96  event_builder_t id = msg_notify(check->reports, &kEvent_IgnoredMangling, tree_get_node(global),
97  "global `%s` has internal linkage and user defined mangling",
98  tree_get_name(global)
99  );
100  msg_note(id, "attribute will be ignored");
101  }
102  break;
103 
104  case eLinkEntryGui:
105  case eLinkEntryCli:
106  msg_notify(check->reports, &kEvent_EntryNotFunction, tree_get_node(global),
107  "global `%s` is marked as an entry point but is not a function",
108  tree_get_name(global)
109  );
110  break;
111 
112  default: break;
113  }
114 }
115 
116 static void check_func_has_body(check_t *check, const tree_t *fn)
117 {
118  if (fn->body != NULL) { return; }
119 
120  msg_notify(check->reports, &kEvent_EntryMissingBody, tree_get_node(fn),
121  "function `%s` is an entry point, but has no body",
122  tree_get_name(fn)
123  );
124 }
125 
126 static void check_func_attribs(check_t *check, const tree_t *fn)
127 {
128  const tree_attribs_t *attribs = tree_get_attrib(fn);
129 
130  switch (attribs->link)
131  {
132  case eLinkImport:
133  if (fn->body != NULL)
134  {
135  msg_notify(check->reports, &kEvent_ImportedWithImpl, tree_get_node(fn),
136  "function `%s` is marked as imported but has an implementation",
138  );
139  }
140  break;
141 
142  case eLinkModule:
143  if (attribs->mangle != NULL)
144  {
145  event_builder_t id = msg_notify(check->reports, &kEvent_IgnoredMangling, tree_get_node(fn),
146  "function `%s` has internal linkage and user defined mangling",
148  );
149  msg_note(id, "attribute will be ignored");
150  }
151  break;
152 
153  case eLinkEntryCli:
154  check_func_has_body(check, fn);
155  if (check->cli_entry != NULL)
156  {
157  event_builder_t id = msg_notify(check->reports, &kEvent_MultipleEntryPoints, tree_get_node(fn),
158  "multiple CLI entry points defined"
159  );
160  msg_append(id, tree_get_node(check->cli_entry), "previous entry point defined here");
161  }
162  else
163  {
164  check->cli_entry = fn;
165  }
166  break;
167  case eLinkEntryGui:
168  check_func_has_body(check, fn);
169  if (check->gui_entry != NULL)
170  {
171  event_builder_t id = msg_notify(check->reports, &kEvent_MultipleEntryPoints, tree_get_node(fn),
172  "multiple GUI entry points defined"
173  );
174  msg_append(id, tree_get_node(check->gui_entry), "previous entry point defined here");
175  }
176  else
177  {
178  check->gui_entry = fn;
179  }
180  break;
181 
182  default: break;
183  }
184 }
185 
186 static void check_func_return_equal(check_t *check, const tree_t *return_type, const tree_t *real_type)
187 {
188  if (util_types_equal(return_type, real_type)) { return; }
189 
190  msg_notify(check->reports, &kEvent_ReturnTypeMismatch, tree_get_node(real_type),
191  "return type `%s` does not match function return type `%s`",
192  tree_to_string(real_type),
193  tree_to_string(return_type)
194  );
195 }
196 
197 static void check_deprecated_call(check_t *check, const tree_t *expr)
198 {
199  const tree_t *fn = expr->callee;
200  // cant check if the callee is an indirect call
201  if (!tree_is(fn, eTreeDeclFunction)) { return; }
202 
203  const tree_attribs_t *attribs = tree_get_attrib(fn);
204 
205  if (attribs->deprecated == NULL) { return; }
206 
207  event_builder_t id = msg_notify(check->reports, &kEvent_Deprecated, tree_get_node(expr),
208  "call to deprecated function `%s`",
209  tree_get_name(fn)
210  );
211  msg_note(id, "deprecated: %s", attribs->deprecated);
212 }
213 
214 static const char *get_fn_name(const tree_t *fn)
215 {
216  if (tree_is(fn, eTreeDeclFunction)) { return tree_get_name(fn); }
217 
218  // its an indirect call, so give the type name
219 
220  // TODO: need a pretty typename function
221  return tree_to_string(tree_get_type(fn));
222 }
223 
224 static void check_single_expr(check_t *check, const tree_t *expr);
225 
226 static void check_params(check_t *check, const vector_t *args, const vector_t *params, size_t count, const char *name)
227 {
228  for (size_t i = 0; i < count; i++)
229  {
230  // at this point the language frontend will have turned
231  // any implicit casts into explicit casts, so simple type comparison
232  // is enough
233  const tree_t *arg = vector_get(args, i);
234  const tree_t *param = vector_get(params, i);
235 
236  const tree_t *arg_type = tree_get_type(arg);
237  const tree_t *param_type = tree_get_type(param);
238 
239  check_single_expr(check, arg);
240 
241  if (!util_types_equal(arg_type, param_type))
242  {
243  event_builder_t id = msg_notify(check->reports, &kEvent_IncorrectParamType, tree_get_node(arg),
244  "incorrect type for parameter %zu of function `%s`",
245  i + 1,
246  name
247  );
248  msg_note(id, "expected `%s`, got `%s`", tree_to_string(param_type), tree_to_string(arg_type));
249  }
250  }
251 }
252 
253 static void check_call_args_fixed(check_t *check, const tree_t *expr, const vector_t *args, const vector_t *params)
254 {
255  size_t arg_count = vector_len(args);
256  size_t param_count = vector_len(params);
257 
258  const char *name = get_fn_name(expr->callee);
259 
260  if (arg_count != param_count)
261  {
262  event_builder_t id = msg_notify(check->reports, &kEvent_IncorrectParamCount, tree_get_node(expr),
263  "incorrect number of parameters to function `%s`",
264  name
265  );
266  msg_note(id, "expected %zu, got %zu", param_count, arg_count);
267  }
268 
269  size_t count = CT_MIN(arg_count, param_count);
270 
271  check_params(check, args, params, count, name);
272 }
273 
274 static void check_call_args_variadic(check_t *check, const tree_t *expr, const vector_t *args, const vector_t *params)
275 {
276  size_t arg_count = vector_len(args);
277  size_t param_count = vector_len(params);
278 
279  const char *name = get_fn_name(expr->callee);
280 
281  if (arg_count < param_count)
282  {
283  event_builder_t id = msg_notify(check->reports, &kEvent_IncorrectParamCount, tree_get_node(expr),
284  "incorrect number of parameters to variadic function `%s`",
285  name
286  );
287  msg_note(id, "expected at least %zu parameters, only got %zu", param_count, arg_count);
288  }
289 
290  size_t count = CT_MIN(arg_count, param_count);
291 
292  check_params(check, args, params, count, name);
293 }
294 
295 static void check_call_arguments(check_t *check, const tree_t *expr)
296 {
297  // if this is an indirect call, we need to get the function type
298  const tree_t *fn = expr->callee;
299  if (tree_is(fn, eTreeExprLoad))
300  {
301  fn = tree_get_type(fn);
302  }
303 
304  const vector_t *fn_args = expr->args;
305  const vector_t *fn_params = tree_fn_get_params(fn);
306  tree_arity_t arity = tree_fn_get_arity(fn);
307 
308  switch (arity)
309  {
310  case eArityFixed:
311  check_call_args_fixed(check, expr, fn_args, fn_params);
312  break;
313 
314  case eArityVariable:
315  check_call_args_variadic(check, expr, fn_args, fn_params);
316  break;
317 
318  default:
319  CT_NEVER("invalid arity %d (check-call-arguments)", arity);
320  }
321 }
322 
323 static const tree_t *get_simple_expr_type(const tree_t *expr)
324 {
325  return tree_follow_type(tree_get_type(expr));
326 }
327 
328 static bool is_valid_bitcast_type(const tree_t *type)
329 {
330  return tree_is(type, eTreeTypeDigit)
331  || tree_is(type, eTreeTypePointer)
332  || tree_is(type, eTreeTypeOpaque)
333  || tree_is(type, eTreeTypeArray)
334  || tree_is(type, eTreeTypeReference); // TODO: reference is an odd case, will need extra testing
335 }
336 
337 static void check_bitcast_expr(check_t *check, const tree_t *expr)
338 {
339  const tree_t *dst = get_simple_expr_type(expr);
340  if (!is_valid_bitcast_type(dst))
341  {
342  event_builder_t msg = msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(expr),
343  "bitcast to invalid type `%s`",
344  tree_to_string(dst)
345  );
346  msg_note(msg, "expected digit, pointer or opaque pointer");
347  }
348 
349  const tree_t *src = get_simple_expr_type(expr->expr);
350  if (!is_valid_bitcast_type(src))
351  {
352  event_builder_t msg = msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(expr),
353  "bitcast from invalid type `%s`",
354  tree_to_string(src)
355  );
356  msg_note(msg, "expected digit, pointer or opaque pointer");
357  }
358 }
359 
360 static void check_signextend_expr(check_t *check, const tree_t *expr)
361 {
362  const tree_t *dst = get_simple_expr_type(expr);
363  if (!util_type_is_digit(dst))
364  {
365  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(expr),
366  "sign extension of non-integer type `%s`",
367  tree_to_string(dst)
368  );
369  }
370 
371  const tree_t *src = get_simple_expr_type(expr->expr);
372  if (!util_type_is_digit(src))
373  {
374  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(expr),
375  "sign extension from non-integer type `%s`",
376  tree_to_string(src)
377  );
378  }
379 }
380 
381 static void check_zeroextend_expr(check_t *check, const tree_t *expr)
382 {
383  const tree_t *dst = get_simple_expr_type(expr);
384  if (!util_type_is_digit(dst))
385  {
386  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(expr),
387  "zero extension into non-integer type `%s`",
388  tree_to_string(dst)
389  );
390  }
391 
392  const tree_t *src = get_simple_expr_type(expr->expr);
393  if (!util_type_is_digit(src))
394  {
395  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(expr),
396  "zero extension of non-integer type `%s`",
397  tree_to_string(src)
398  );
399  }
400 }
401 
402 static bool is_invalid_cast_type(const tree_t *type)
403 {
404  return tree_is(type, eTreeTypeUnit)
405  || tree_is(type, eTreeTypeEmpty);
406 }
407 
408 static void check_cast_expr(check_t *check, const tree_t *expr)
409 {
410  const tree_t *dst = get_simple_expr_type(expr);
411  const tree_t *src = get_simple_expr_type(expr->expr);
412  if (is_invalid_cast_type(src))
413  {
414  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(expr),
415  "invalid cast from type `%s`",
416  tree_to_string(src)
417  );
418 
419  return;
420  }
421 
422  if (is_invalid_cast_type(dst))
423  {
424  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(expr),
425  "invalid cast to type `%s`",
426  tree_to_string(dst)
427  );
428 
429  return;
430  }
431 
432  switch (expr->cast)
433  {
434  case eCastBit:
435  check_bitcast_expr(check, expr);
436  break;
437  case eCastSignExtend:
438  check_signextend_expr(check, expr);
439  break;
440  case eCastZeroExtend:
441  check_zeroextend_expr(check, expr);
442  break;
443  default:
444  CT_NEVER("invalid cast kind %s (check-cast-expr)", tree_to_string(expr));
445  }
446 }
447 
448 static bool is_pointer_arithmetic(const tree_t *lhs, const tree_t *rhs)
449 {
450  return tree_is(lhs, eTreeTypeDigit) && tree_is(rhs, eTreeTypePointer);
451 }
452 
453 static void check_binary_expr(check_t *check, const tree_t *expr)
454 {
455  check_single_expr(check, expr->lhs);
456  check_single_expr(check, expr->rhs);
457 
458  const tree_t *lhs = get_simple_expr_type(expr->lhs);
459  const tree_t *rhs = get_simple_expr_type(expr->rhs);
460 
461  if (!tree_is(lhs, eTreeTypeDigit) && !tree_is(rhs, eTreeTypeDigit))
462  {
463  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(expr),
464  "binary operation with non-digit types `%s` and `%s`",
465  tree_to_string(lhs),
466  tree_to_string(rhs)
467  );
468  }
469 
470  if (is_pointer_arithmetic(lhs, rhs) || is_pointer_arithmetic(rhs, lhs))
471  {
472  return;
473  }
474 
475 
476 
477  if (!util_types_equal(lhs, rhs))
478  {
479  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(expr),
480  "binary operation with different types `%s` and `%s`",
481  tree_to_string(lhs),
482  tree_to_string(rhs)
483  );
484  }
485 }
486 
487 static void check_single_expr(check_t *check, const tree_t *expr)
488 {
489  switch (tree_get_kind(expr))
490  {
491  case eTreeExprCall:
492  check_deprecated_call(check, expr);
493  check_call_arguments(check, expr);
494  break;
495 
496  case eTreeExprBinary: // TODO: check for correct types
497  check_binary_expr(check, expr);
498  break;
499 
500  case eTreeExprCompare:
501  check_single_expr(check, expr->lhs);
502  check_single_expr(check, expr->rhs);
503  break;
504 
505  case eTreeExprCast:
506  check_cast_expr(check, expr);
507  break;
508 
509  case eTreeExprUnary:
510  check_single_expr(check, expr->operand);
511  break;
512  case eTreeExprLoad:
513  check_single_expr(check, expr->load);
514  break;
515 
516  case eTreeExprOffset:
517  check_single_expr(check, expr->object);
518  check_single_expr(check, expr->offset);
519  break;
520 
521  case eTreeDeclLocal:
522  case eTreeDeclParam:
523  case eTreeDeclCase:
524  case eTreeDeclGlobal:
525  case eTreeDeclFunction:
526  break;
527 
528  case eTreeExprString:
529  case eTreeExprDigit:
530  case eTreeExprBool:
531  case eTreeExprUnit:
532  break;
533 
534  case eTreeExprField:
535  check_single_expr(check, expr->object);
536  break;
537 
538  case eTreeExprSizeOf:
539  case eTreeExprAlignOf:
540  case eTreeExprAddressOf:
541  break;
542 
543  case eTreeExprOffsetOf:
544  check_single_expr(check, expr->object);
545  break;
546 
547  default:
548  CT_NEVER("invalid node kind %s", tree_to_string(expr));
549  }
550 }
551 
552 static void check_assign(check_t *check, const tree_t *stmt)
553 {
554  CTASSERT(stmt != NULL);
555 
556  if (tree_has_storage(stmt->dst))
557  {
558  tree_quals_t quals = tree_get_storage_quals(stmt->dst);
559  if ((quals & eQualConst) && !stmt->init)
560  {
561  msg_notify(check->reports, &kEvent_AssignToConst, tree_get_node(stmt),
562  "assignment to constant `%s`",
563  tree_get_name(stmt->dst)
564  );
565  }
566  }
567 
568  if (tree_is(stmt->dst, eTreeDeclParam))
569  {
570  msg_notify(check->reports, &kEvent_AssignToParam, tree_get_node(stmt),
571  "assignment to parameter `%s`",
572  tree_get_name(stmt->dst)
573  );
574  }
575 
576 #if 0
577  const tree_t *src_type = tree_follow_type(tree_get_type(stmt->src));
578  const tree_t *dst_type = tree_follow_type(tree_get_type(stmt->dst));
579 
580  if (tree_is(src_type, eTreeTypeReference))
581  src_type = src_type->ptr;
582 
583  if (tree_is(dst_type, eTreeTypeReference))
584  dst_type = dst_type->ptr;
585 
586  if (!util_types_equal(src_type, dst_type))
587  {
588  msg_notify(check->reports, &kEvent_InvalidAssignment, tree_get_node(stmt),
589  "assignment of type `%s` to `%s`",
590  tree_to_string(src_type),
591  tree_to_string(dst_type)
592  );
593  }
594 #endif
595 
596  check_single_expr(check, stmt->src);
597 }
598 
599 static void check_func_body(check_t *check, const tree_t *return_type, const tree_t *stmt)
600 {
601  CTASSERT(stmt != NULL);
602 
603  switch (stmt->kind)
604  {
605  case eTreeStmtJump:
606  break;
607 
608  case eTreeStmtBlock:
609  for (size_t i = 0; i < vector_len(stmt->stmts); i++)
610  {
611  check_func_body(check, return_type, vector_get(stmt->stmts, i));
612  }
613  break;
614 
615  case eTreeStmtLoop:
616  case eTreeStmtBranch: {
617  check_func_body(check, return_type, stmt->then);
618 
619  if (stmt->other != NULL)
620  check_func_body(check, return_type, stmt->other);
621 
622  break;
623  }
624 
625  case eTreeStmtAssign:
626  check_assign(check, stmt);
627  break;
628 
629  case eTreeStmtReturn:
630  check_func_return_equal(check, return_type, tree_get_type(stmt->value));
631  break;
632 
633  case eTreeExprCast:
634  case eTreeExprLoad:
635  case eTreeExprAddressOf:
636  case eTreeExprUnary:
637  case eTreeExprBinary:
638  case eTreeExprCompare:
639  case eTreeExprField:
640  case eTreeExprOffset:
641  case eTreeExprCall:
642  check_single_expr(check, stmt);
643  break;
644 
645  default:
646  CT_NEVER("invalid statement kind %s", tree_to_string(stmt));
647  }
648 }
649 
650 static bool will_always_return(const tree_t *stmt)
651 {
652  CTASSERT(stmt != NULL);
653 
654  switch (stmt->kind)
655  {
656  case eTreeStmtReturn:
657  return true;
658 
659  case eTreeStmtBranch: {
660  // if the other branch is null then this branch may not always return
661  bool other_returns = stmt->other != NULL && will_always_return(stmt->other);
662  return will_always_return(stmt->then) && other_returns;
663  }
664 
665  case eTreeStmtLoop:
666  return will_always_return(stmt->then);
667 
668  case eTreeStmtBlock:
669  for (size_t i = 0; i < vector_len(stmt->stmts); i++)
670  {
671  if (will_always_return(vector_get(stmt->stmts, i)))
672  {
673  return true;
674  }
675  }
676  return false;
677 
678  default:
679  return false;
680  }
681 }
682 
683 static void check_func_locals(check_t *check, const vector_t *locals)
684 {
685  size_t len = vector_len(locals);
686  for (size_t i = 0; i < len; i++)
687  {
688  const tree_t *local = vector_get(locals, i);
689  check_simple(check, local);
690 
691  const tree_t *type = tree_get_type(local);
692  if (tree_is(type, eTreeTypeUnit))
693  {
694  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(local),
695  "local `%s` has type `unit`",
696  tree_get_name(local)
697  );
698  }
699  else if (tree_is(type, eTreeTypeEmpty))
700  {
701  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(local),
702  "local `%s` has type `empty`",
703  tree_get_name(local)
704  );
705  }
706  }
707 }
708 
709 static void check_function_definition(check_t *check, const tree_t *fn)
710 {
711  if (fn->body == NULL) { return; }
712 
713  check_func_locals(check, fn->locals);
714  const tree_t *return_type = tree_fn_get_return(fn);
715 
716  check_func_body(check, return_type, fn->body);
717 
718  if (!will_always_return(fn->body))
719  {
720  if (tree_is(return_type, eTreeTypeUnit)) { return; }
721 
722  msg_notify(check->reports, &kEvent_MayNotReturn, tree_get_node(fn),
723  "function `%s` may not return a value",
724  tree_get_name(fn)
725  );
726  }
727 }
728 
729 static void check_global_recursion(check_t *check, const tree_t *global);
730 
731 static void check_expr_recursion(check_t *check, const tree_t *tree)
732 {
733  switch (tree_get_kind(tree))
734  {
735  case eTreeExprEmpty:
736  case eTreeExprUnit:
737  case eTreeExprBool:
738  case eTreeExprDigit:
739  case eTreeExprString:
740  break;
741 
742  case eTreeExprLoad:
743  check_expr_recursion(check, tree->load);
744  break;
745 
746  case eTreeExprCall: {
747  check_expr_recursion(check, tree->callee);
748  size_t len = vector_len(tree->args);
749  for (size_t i = 0; i < len; ++i)
750  {
751  const tree_t *arg = vector_get(tree->args, i);
752  check_expr_recursion(check, arg);
753  }
754  break;
755  }
756 
757  case eTreeExprBinary:
758  check_expr_recursion(check, tree->lhs);
759  check_expr_recursion(check, tree->rhs);
760  break;
761 
762  case eTreeExprUnary:
763  check_expr_recursion(check, tree->operand);
764  break;
765 
766  case eTreeExprCast:
767  check_expr_recursion(check, tree->expr);
768  break;
769 
770  case eTreeExprCompare:
771  check_expr_recursion(check, tree->lhs);
772  check_expr_recursion(check, tree->rhs);
773  break;
774 
775  case eTreeDeclGlobal:
776  check_global_recursion(check, tree);
777  break;
778  default: CT_NEVER("invalid node kind %s (check-tree-recursion)", tree_to_string(tree));
779  }
780 }
781 
782 static void check_global_recursion(check_t *check, const tree_t *global)
783 {
784  if (set_contains(check->checked_exprs, global))
785  {
786  return;
787  }
788 
789  size_t idx = vector_find(check->expr_stack, global);
790  if (idx == SIZE_MAX)
791  {
792  if (global->initial != NULL)
793  {
794  vector_push(&check->expr_stack, (tree_t*)global);
795  check_expr_recursion(check, global->initial);
796  vector_drop(check->expr_stack);
797  }
798  }
799  else
800  {
801  event_builder_t id = msg_notify(check->reports, &kEvent_RecursiveEval, tree_get_node(global),
802  "evaluation of `%s` may be infinite",
803  tree_get_name(global)
804  );
805  size_t len = vector_len(check->expr_stack);
806  for (size_t i = 0; i < len; i++)
807  {
808  const tree_t *decl = vector_get(check->expr_stack, i);
809  msg_append(id, tree_get_node(decl), "call to `%s`", tree_get_name(decl));
810  }
811  }
812 
813  set_add(check->checked_exprs, global);
814 }
815 
816 static void check_global_type(check_t *check, const tree_t *global)
817 {
818  const tree_t *ty = tree_get_type(global);
819  CTASSERTF(ty != NULL, "global `%s` has no type", tree_get_name(global));
820 
821  if (tree_is(ty, eTreeTypeUnit))
822  {
823  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(global),
824  "global `%s` is of unit type `%s`",
825  tree_get_name(global),
826  tree_to_string(ty)
827  );
828  }
829  else if (tree_is(ty, eTreeTypeEmpty))
830  {
831  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(global),
832  "global `%s` is of empty type `%s`",
833  tree_get_name(global),
834  tree_to_string(ty)
835  );
836  }
837 
838  tree_storage_t storage = tree_get_storage(global);
839 
840  if (tree_is(storage.storage, eTreeTypeReference))
841  {
842  msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(global),
843  "global value `%s` has invalid storage `%s`",
844  tree_get_name(global),
845  tree_to_string(ty)
846  );
847  }
848 }
849 
853 
854 static void check_aggregate_recursion(check_t *check, const tree_t *type);
855 
856 static void check_struct_type_recursion(check_t *check, const tree_t *type)
857 {
858  CTASSERT(type != NULL);
859 
860  switch (type->kind)
861  {
862  case eTreeTypeBool:
863  case eTreeTypeDigit:
864  case eTreeTypeUnit:
865  case eTreeTypeEmpty:
866  case eTreeTypePointer:
867  case eTreeTypeOpaque:
868  case eTreeTypeClosure:
869  case eTreeTypeEnum:
870  case eTreeTypeAlias:
871  break;
872 
873  case eTreeTypeStruct:
874  case eTreeTypeUnion:
875  check_aggregate_recursion(check, type);
876  break;
877 
878  default: CT_NEVER("invalid type kind %s (check-type-size)", tree_to_string(type));
879  }
880 }
881 
882 static void check_aggregate_recursion(check_t *check, const tree_t *type)
883 {
884  if (set_contains(check->checked_types, type))
885  {
886  return;
887  }
888 
889  size_t idx = vector_find(check->type_stack, type);
890  if (idx == SIZE_MAX)
891  {
892  vector_push(&check->type_stack, (tree_t*)type);
893  size_t len = vector_len(type->fields);
894  for (size_t i = 0; i < len; i++)
895  {
896  const tree_t *field = vector_get(type->fields, i);
897  const tree_t *ty = tree_get_type(field);
898  check_struct_type_recursion(check, ty);
899  }
900  vector_drop(check->type_stack);
901  }
902  else
903  {
904  event_builder_t id = msg_notify(check->reports, &kEvent_InfiniteSizedType, tree_get_node(type),
905  "size of type `%s` may be infinite",
906  tree_get_name(type)
907  );
908  size_t len = vector_len(check->type_stack);
909  for (size_t i = 0; i < len; i++)
910  {
911  const tree_t *decl = vector_get(check->type_stack, i);
912  msg_append(id, tree_get_node(decl), "call to `%s`", tree_get_name(decl));
913  }
914  }
915 
916  set_add(check->checked_types, type);
917 }
918 
922 
923 static void check_type_recursion(check_t *check, const tree_t *type);
924 
925 static void check_inner_type_recursion(check_t *check, const tree_t *type)
926 {
927  CTASSERT(type != NULL);
928 
929  switch (type->kind)
930  {
931  case eTreeTypeBool:
932  case eTreeTypeDigit:
933  case eTreeTypeUnit:
934  case eTreeTypeEmpty:
935  case eTreeTypeStruct:
936  case eTreeTypeUnion:
937  case eTreeTypeEnum:
938  case eTreeTypeOpaque:
939  break;
940 
941  case eTreeTypeAlias:
942  check_type_recursion(check, tree_get_type(type));
943  break;
944 
945  case eTreeTypeClosure:
946  check_type_recursion(check, tree_fn_get_return(type));
947  const vector_t *params = tree_fn_get_params(type);
948  size_t len = vector_len(params);
949  for (size_t i = 0; i < len; i++)
950  {
951  const tree_t *param = vector_get(params, i);
952  const tree_t *ty = tree_get_type(param);
953  check_type_recursion(check, ty);
954  }
955  break;
956 
957  case eTreeTypePointer:
958  case eTreeTypeReference:
959  case eTreeTypeArray:
960  check_type_recursion(check, type->ptr);
961  break;
962 
963  default: CT_NEVER("invalid type kind `%s` (check-type-size)", tree_to_string(type));
964  }
965 }
966 
967 static void check_type_recursion(check_t *check, const tree_t *type)
968 {
969  if (set_contains(check->checked_types, type))
970  {
971  return;
972  }
973 
974  size_t idx = vector_find(check->type_stack, type);
975  if (idx == SIZE_MAX)
976  {
977  vector_push(&check->type_stack, (tree_t*)type);
978  check_inner_type_recursion(check, type);
979  vector_drop(check->type_stack);
980  }
981  else
982  {
983  event_builder_t id = msg_notify(check->reports, &kEvent_InvalidType, tree_get_node(type),
984  "type `%s` contains an impossible type",
985  tree_get_name(type)
986  );
987  size_t len = vector_len(check->type_stack);
988  for (size_t i = 0; i < len; i++)
989  {
990  const tree_t *decl = vector_get(check->type_stack, i);
991  msg_append(id, tree_get_node(decl), "call to `%s`", tree_get_name(decl));
992  }
993  }
994 
995  set_add(check->checked_types, type);
996 }
997 
998 static void check_any_type_recursion(check_t *check, const tree_t *type)
999 {
1000  switch (type->kind)
1001  {
1002  case eTreeTypeUnion:
1003  case eTreeTypeStruct:
1004  check_aggregate_recursion(check, type);
1005  break;
1006 
1007  default: check_type_recursion(check, type); break;
1008  }
1009 }
1010 
1011 static void check_global_init(check_t *check, const tree_t *global)
1012 {
1013  if (global->initial != NULL)
1014  {
1015  check_single_expr(check, global->initial);
1016  }
1017 }
1018 
1019 static void check_module_valid(check_t *check, const tree_t *mod)
1020 {
1021  CTASSERT(check != NULL);
1022  CTASSERTF(tree_is(mod, eTreeDeclModule), "invalid module `%s`", tree_to_string(mod));
1023 
1024  vector_t *modules = map_values(tree_module_tag(mod, eSemaModules));
1025  size_t total_modules = vector_len(modules);
1026  for (size_t i = 0; i < total_modules; i++)
1027  {
1028  const tree_t *child = vector_get(modules, i);
1029  check_module_valid(check, child);
1030  }
1031 
1032  vector_t *globals = map_values(tree_module_tag(mod, eSemaValues));
1033  size_t total_globals = vector_len(globals);
1034  for (size_t i = 0; i < total_globals; i++)
1035  {
1036  const tree_t *global = vector_get(globals, i);
1037  CTASSERTF(tree_is(global, eTreeDeclGlobal), "invalid global `%s`", tree_to_string(global));
1038  check_simple(check, global);
1039 
1040  check_global_attribs(check, global);
1041  check_global_recursion(check, global);
1042  check_global_type(check, global);
1043  check_global_init(check, global);
1044  }
1045 
1046  vector_t *functions = map_values(tree_module_tag(mod, eSemaProcs));
1047  size_t total_functions = vector_len(functions);
1048  for (size_t i = 0; i < total_functions; i++)
1049  {
1050  const tree_t *function = vector_get(functions, i);
1051  CTASSERTF(tree_is(function, eTreeDeclFunction), "invalid function `%s`", tree_to_string(function));
1052  check_simple(check, function);
1053 
1054  check_func_attribs(check, function);
1055  check_function_definition(check, function);
1056  }
1057 
1059  size_t total_types = vector_len(types);
1060  for (size_t i = 0; i < total_types; i++)
1061  {
1062  const tree_t *type = vector_get(types, i);
1063  // check_ident(check, type); TODO: check these properly
1064 
1065  // nothing else can be recursive (TODO: for now)
1066  check_any_type_recursion(check, type);
1067  }
1068 }
1069 
1070 STA_DECL
1071 void check_tree(logger_t *reports, vector_t *mods, arena_t *arena)
1072 {
1073  CTASSERT(arena != NULL);
1074  CTASSERT(reports != NULL);
1075  CTASSERT(mods != NULL);
1076 
1077  check_t check = {
1078  .reports = reports,
1079 
1080  .expr_stack = vector_new(64, arena),
1081  .type_stack = vector_new(64, arena),
1082 
1083  .checked_exprs = set_new(64, kTypeInfoPtr, arena),
1084  .checked_types = set_new(64, kTypeInfoPtr, arena),
1085  };
1086 
1087  size_t len = vector_len(mods);
1088  for (size_t i = 0; i < len; i++)
1089  {
1090  const tree_t *tree = vector_get(mods, i);
1091  check_module_valid(&check, tree);
1092  }
1093 }
CT_PUREFN CT_TREE_API const node_t * tree_get_node(const tree_t *tree)
Definition: context.c:94
CT_PUREFN CT_TREE_API tree_kind_t tree_get_kind(const tree_t *tree)
Definition: context.c:143
CT_PUREFN CT_TREE_API const char * tree_get_name(const tree_t *tree)
Definition: context.c:102
CT_PUREFN CT_TREE_API const char * tree_get_user_name(const tree_t *tree)
Definition: context.c:112
CT_PUREFN CT_TREE_API const tree_t * tree_get_type(const tree_t *tree)
Definition: context.c:132
CT_PUREFN CT_TREE_API bool tree_is(const tree_t *self, tree_kind_t kind)
Definition: query.c:91
CT_TREE_API tree_storage_t tree_get_storage(const tree_t *tree)
Definition: context.c:70
CT_PUREFN CT_TREE_API bool tree_is_symbol_anonymous(const tree_t *tree)
Definition: context.c:122
CT_TREE_API tree_quals_t tree_get_storage_quals(const tree_t *self)
Definition: query.c:126
CT_PUREFN CT_TREE_API tree_arity_t tree_fn_get_arity(const tree_t *self)
Definition: query.c:191
CT_TREE_API const char * tree_to_string(const tree_t *self)
Definition: query.c:40
CT_PUREFN CT_TREE_API const tree_t * tree_fn_get_return(const tree_t *self)
Definition: query.c:167
CT_TREE_API bool tree_has_storage(const tree_t *self)
Definition: query.c:114
CT_TREE_API const tree_attribs_t * tree_get_attrib(const tree_t *self)
Definition: query.c:83
CT_PUREFN CT_TREE_API const vector_t * tree_fn_get_params(const tree_t *self)
Definition: query.c:179
#define STA_DECL
sal2 annotation on function implementations to copy annotations from the declaration
CT_NODISCARD CT_PUREFN CT_BASE_API bool str_equal(const char *lhs, const char *rhs)
compare strings equality
Definition: util.c:76
STA_DECL void check_tree(logger_t *reports, vector_t *mods, arena_t *arena)
check the tree form IR all found errors are reported to the reports object
Definition: tree.c:1071
STA_RET_STRING colour_t idx
Definition: colour.h:98
CT_NODISCARD CT_STD_API vector_t * map_values(map_t *map)
collect all the values from a map into a vector
Definition: map.c:137
CT_NODISCARD CT_STD_API set_t * set_new(size_t size, hash_info_t info, arena_t *arena)
create a new set
Definition: set.c:51
CT_STD_API const void * set_add(set_t *set, const void *key)
add a key to a set
Definition: set.c:85
CT_NODISCARD CT_PUREFN CT_STD_API bool set_contains(const set_t *set, const void *key)
check if a set contains a key
Definition: set.c:118
#define CT_MIN(L, R)
Definition: macros.h:38
#define CT_UNUSED(x)
mark a variable as unused
Definition: macros.h:46
CT_NOTIFY_API event_builder_t msg_notify(INOUT_NOTNULL logger_t *logs, const diagnostic_t *diagnostic, const node_t *node, STA_FORMAT_STRING const char *fmt,...)
notify the logger of a new message
CT_NOTIFY_API void msg_append(event_builder_t builder, const node_t *node, STA_FORMAT_STRING const char *fmt,...)
append additional information to a message
CT_NOTIFY_API void msg_note(event_builder_t builder, STA_FORMAT_STRING const char *fmt,...)
add a note to an existing message
#define CT_NEVER(...)
assert that a code path is never reached
Definition: panic.h:136
#define CTASSERT(expr)
assert a condition, prints the condition as a message
Definition: panic.h:130
#define CTASSERTF(expr,...)
assert a condition with a message and optional format arguments
Definition: panic.h:116
CT_BEGIN_API CT_UTIL_API bool util_types_equal(const tree_t *lhs, const tree_t *rhs)
compare two types for strict equality compares two types for exact equality, does not follow typedefs
Definition: util.c:33
CT_UTIL_API bool util_type_is_digit(const tree_t *type)
Definition: util.c:353
tree_arity_t
all arities
Definition: ops.h:64
tree_quals_t
all type qualifiers
Definition: ops.h:25
CT_TREE_API map_t * tree_module_tag(const tree_t *self, size_t tag)
Definition: sema.c:125
CT_TREE_API const tree_t * tree_follow_type(const tree_t *type)
Definition: decl.c:274
@ eSemaValues
Definition: tree.h:36
@ eSemaProcs
Definition: tree.h:42
@ eSemaModules
Definition: tree.h:45
@ eSemaTypes
Definition: tree.h:39
CT_STD_API const hash_info_t kTypeInfoPtr
type information for a generic pointer this operates on the pointer itself and not the data it points...
Definition: typeinfo.c:41
CT_NODISCARD CT_PUREFN CT_STD_API void * vector_get(const vector_t *vector, size_t index)
get a value from a vector
Definition: vector.c:134
CT_NODISCARD CT_STD_API vector_t * vector_new(size_t size, arena_t *arena)
create a new vector with an initial capacity
Definition: vector.c:63
CT_STD_API void vector_push(vector_t **vector, void *value)
push a value onto the end of a vector
Definition: vector.c:108
CT_STD_API void vector_drop(vector_t *vector)
pop a value from the end of a vector
Definition: vector.c:117
CT_PUREFN CT_STD_API size_t vector_find(vector_t *vector, const void *element)
find an element in a vector searches via pointer equality
Definition: vector.c:160
CT_NODISCARD CT_PUREFN CT_STD_API size_t vector_len(const vector_t *vector)
get the length of a vector
Definition: vector.c:152
an allocator object
Definition: arena.h:86
Definition: tree.c:28
set_t * checked_types
Definition: tree.c:38
const tree_t * cli_entry
Definition: tree.c:31
const tree_t * gui_entry
Definition: tree.c:32
logger_t * reports
Definition: tree.c:29
vector_t * type_stack
Definition: tree.c:35
vector_t * expr_stack
Definition: tree.c:34
set_t * checked_exprs
Definition: tree.c:37
an event builder handles adding additional information to an event
Definition: notify.h:68
a logging sink
Definition: notify.c:14
an unordered hash set
Definition: set.c:19
const char * mangle
override the mangle of the declaration
Definition: tree.h:54
const char * deprecated
the reason for deprecation, or NULL if not deprecated
Definition: tree.h:56
tree_linkage_t link
the link type of the declaration
Definition: tree.h:51
storage for a value
Definition: context.h:23
const tree_t * storage
the underlying storage type
Definition: context.h:25
Definition: tree.h:67
tree_kind_t kind
Definition: tree.h:68
tree_t * operand
Definition: tree.h:97
const tree_t * value
Definition: tree.h:127
tree_t * initial
Definition: tree.h:218
tree_t * other
Definition: tree.h:140
const tree_t * rhs
Definition: tree.h:108
const tree_t * lhs
Definition: tree.h:107
const tree_t * callee
Definition: tree.h:113
vector_t * locals
Definition: tree.h:202
vector_t * fields
Definition: tree.h:184
const vector_t * args
Definition: tree.h:114
tree_t * dst
Definition: tree.h:131
tree_cast_t cast
Definition: tree.h:91
const tree_t * ptr
Definition: tree.h:172
tree_t * then
Definition: tree.h:139
const tree_t * offset
Definition: tree.h:148
const vector_t * stmts
Definition: tree.h:124
const tree_t * object
Definition: tree.h:145
bool init
Definition: tree.h:133
tree_t * body
Definition: tree.h:203
tree_t * load
Definition: tree.h:84
const tree_t * src
Definition: tree.h:132
const tree_t * expr
Definition: tree.h:88
a generic vector of pointers
Definition: vector.c:16