buf_size: fix handling of unknown flexible array sizes
[smatch.git] / smatch_extra.c
blob0e461a0a11a99124c71dbdae7640b37deb64cf16
1 /*
2 * Copyright (C) 2008 Dan Carpenter.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version 2
7 * of the License, or (at your option) any later version.
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, see http://www.gnu.org/copyleft/gpl.txt
19 * smatch_extra.c is supposed to track the value of every variable.
23 #define _GNU_SOURCE
24 #include <string.h>
26 #include <stdlib.h>
27 #include <errno.h>
28 #ifndef __USE_ISOC99
29 #define __USE_ISOC99
30 #endif
31 #include <limits.h>
32 #include "parse.h"
33 #include "smatch.h"
34 #include "smatch_slist.h"
35 #include "smatch_extra.h"
37 static int my_id;
38 static int link_id;
40 static void match_link_modify(struct sm_state *sm, struct expression *mod_expr);
42 struct string_list *__ignored_macros = NULL;
43 int in_warn_on_macro(void)
45 struct statement *stmt;
46 char *tmp;
47 char *macro;
49 stmt = get_current_statement();
50 if (!stmt)
51 return 0;
52 macro = get_macro_name(stmt->pos);
53 if (!macro)
54 return 0;
56 FOR_EACH_PTR(__ignored_macros, tmp) {
57 if (!strcmp(tmp, macro))
58 return 1;
59 } END_FOR_EACH_PTR(tmp);
60 return 0;
63 typedef void (mod_hook)(const char *name, struct symbol *sym, struct expression *expr, struct smatch_state *state);
64 DECLARE_PTR_LIST(void_fn_list, mod_hook *);
65 static struct void_fn_list *extra_mod_hooks;
66 static struct void_fn_list *extra_nomod_hooks;
68 void add_extra_mod_hook(mod_hook *fn)
70 mod_hook **p = malloc(sizeof(mod_hook *));
71 *p = fn;
72 add_ptr_list(&extra_mod_hooks, p);
75 void add_extra_nomod_hook(mod_hook *fn)
77 mod_hook **p = malloc(sizeof(mod_hook *));
78 *p = fn;
79 add_ptr_list(&extra_nomod_hooks, p);
82 void call_extra_hooks(struct void_fn_list *hooks, const char *name, struct symbol *sym, struct expression *expr, struct smatch_state *state)
84 mod_hook **fn;
86 FOR_EACH_PTR(hooks, fn) {
87 (*fn)(name, sym, expr, state);
88 } END_FOR_EACH_PTR(fn);
91 void call_extra_mod_hooks(const char *name, struct symbol *sym, struct expression *expr, struct smatch_state *state)
93 call_extra_hooks(extra_mod_hooks, name, sym, expr, state);
96 void call_extra_nomod_hooks(const char *name, struct symbol *sym, struct expression *expr, struct smatch_state *state)
98 call_extra_hooks(extra_nomod_hooks, name, sym, expr, state);
101 static void set_union_info(const char *name, struct symbol *sym, struct expression *expr, struct smatch_state *state)
103 struct symbol *type, *tmp, *inner_type, *inner, *new_type;
104 struct expression *deref, *member_expr;
105 struct smatch_state *new;
106 int offset, inner_offset;
107 static bool in_recurse;
108 char *member_name;
110 if (__in_fake_assign)
111 return;
113 if (in_recurse)
114 return;
115 in_recurse = true;
117 if (!expr || expr->type != EXPR_DEREF || !expr->member)
118 goto done;
119 offset = get_member_offset_from_deref(expr);
120 if (offset < 0)
121 goto done;
123 deref = strip_expr(expr->deref);
124 type = get_type(deref);
125 if (type_is_ptr(type))
126 type = get_real_base_type(type);
127 if (!type || type->type != SYM_STRUCT)
128 goto done;
130 FOR_EACH_PTR(type->symbol_list, tmp) {
131 inner_type = get_real_base_type(tmp);
132 if (!inner_type || inner_type->type != SYM_UNION)
133 continue;
135 inner = first_ptr_list((struct ptr_list *)inner_type->symbol_list);
136 if (!inner || !inner->ident)
137 continue;
139 inner_offset = get_member_offset(type, inner->ident->name);
140 if (inner_offset < offset)
141 continue;
142 if (inner_offset > offset)
143 goto done;
145 FOR_EACH_PTR(inner_type->symbol_list, inner) {
146 struct symbol *tmp_type;
148 if (!inner->ident || inner->ident == expr->member)
149 continue;
150 tmp_type = get_real_base_type(inner);
151 if (tmp_type && tmp_type->type == SYM_STRUCT)
152 continue;
153 member_expr = deref;
154 if (tmp->ident)
155 member_expr = member_expression(member_expr, '.', tmp->ident);
156 member_expr = member_expression(member_expr, expr->op, inner->ident);
157 member_name = expr_to_var(member_expr);
158 if (!member_name)
159 continue;
160 new_type = get_real_base_type(inner);
161 new = alloc_estate_rl(cast_rl(new_type, estate_rl(state)));
162 set_extra_mod_helper(member_name, sym, member_expr, new);
163 free_string(member_name);
164 } END_FOR_EACH_PTR(inner);
165 } END_FOR_EACH_PTR(tmp);
167 done:
168 in_recurse = false;
171 static bool in_param_set;
172 void set_extra_mod_helper(const char *name, struct symbol *sym, struct expression *expr, struct smatch_state *state)
174 struct expression *faked;
176 if (!expr)
177 expr = gen_expression_from_name_sym(name, sym);
178 remove_from_equiv(name, sym);
179 set_union_info(name, sym, expr, state);
180 call_extra_mod_hooks(name, sym, expr, state);
181 faked = get_faked_expression();
182 if (!faked ||
183 (faked->type == EXPR_ASSIGNMENT && is_fresh_alloc(faked->right)))
184 update_mtag_data(expr, state);
185 if (in_param_set &&
186 estate_is_unknown(state) && !get_state(SMATCH_EXTRA, name, sym))
187 return;
188 set_state(SMATCH_EXTRA, name, sym, state);
191 static void set_extra_nomod_helper(const char *name, struct symbol *sym, struct expression *expr, struct smatch_state *state)
193 call_extra_nomod_hooks(name, sym, expr, state);
194 set_state(SMATCH_EXTRA, name, sym, state);
197 static char *get_pointed_at(const char *name, struct symbol *sym, struct symbol **new_sym)
199 struct expression *assigned;
202 * Imagine we have an assignment: "foo = &addr;" then the other name
203 * of "*foo" is addr.
206 if (name[0] != '*')
207 return NULL;
208 if (strcmp(name + 1, sym->ident->name) != 0)
209 return NULL;
211 assigned = get_assigned_expr_name_sym(sym->ident->name, sym);
212 if (!assigned)
213 return NULL;
214 assigned = strip_parens(assigned);
215 if (assigned->type != EXPR_PREOP || assigned->op != '&')
216 return NULL;
218 return expr_to_var_sym(assigned->unop, new_sym);
221 char *get_other_name_sym_from_chunk(const char *name, const char *chunk, int len, struct symbol *sym, struct symbol **new_sym)
223 struct expression *assigned;
224 char *orig_name = NULL;
225 char buf[256];
226 char *ret;
228 assigned = get_assigned_expr_name_sym(chunk, sym);
229 if (!assigned)
230 return NULL;
231 if (assigned->type == EXPR_CALL)
232 return map_call_to_other_name_sym(name, sym, new_sym);
233 if (assigned->type == EXPR_PREOP && assigned->op == '&') {
235 orig_name = expr_to_var_sym(assigned, new_sym);
236 if (!orig_name || !*new_sym)
237 goto free;
239 snprintf(buf, sizeof(buf), "%s.%s", orig_name + 1, name + len);
240 ret = alloc_string(buf);
241 free_string(orig_name);
242 return ret;
245 orig_name = expr_to_var_sym(assigned, new_sym);
246 if (!orig_name || !*new_sym)
247 goto free;
249 snprintf(buf, sizeof(buf), "%s->%s", orig_name, name + len);
250 ret = alloc_string(buf);
251 free_string(orig_name);
252 return ret;
253 free:
254 free_string(orig_name);
255 return NULL;
258 static char *get_long_name_sym(const char *name, struct symbol *sym, struct symbol **new_sym, bool use_stack)
260 struct expression *tmp;
261 struct sm_state *sm;
262 char buf[256];
265 * Just prepend the name with a different name/sym and return that.
266 * For example, if we set "foo->bar = bar;" then the other name
267 * for "bar->baz" is "foo->bar->baz". Or if we have "foo = bar;" then
268 * the other name for "bar" is "foo". A third option is if we have
269 * "foo = bar;" then another name for "*bar" is "*foo".
272 FOR_EACH_MY_SM(check_assigned_expr_id, __get_cur_stree(), sm) {
273 tmp = sm->state->data;
274 if (!tmp || tmp->type != EXPR_SYMBOL)
275 continue;
276 if (tmp->symbol == sym)
277 goto found;
278 } END_FOR_EACH_SM(sm);
280 return NULL;
282 found:
283 if (!use_stack && name[tmp->symbol->ident->len] != '-')
284 return NULL;
286 if (name[0] == '*' && strcmp(name + 1, tmp->symbol_name->name) == 0)
287 snprintf(buf, sizeof(buf), "*%s", sm->name);
288 else if (name[tmp->symbol->ident->len] == '-' ||
289 name[tmp->symbol->ident->len] == '.')
290 snprintf(buf, sizeof(buf), "%s%s", sm->name, name + tmp->symbol->ident->len);
291 else if (strcmp(name, tmp->symbol_name->name) == 0)
292 snprintf(buf, sizeof(buf), "%s", sm->name);
293 else
294 return NULL;
296 *new_sym = sm->sym;
297 return alloc_string(buf);
300 char *get_other_name_sym_helper(const char *name, struct symbol *sym, struct symbol **new_sym, bool use_stack)
302 char buf[256];
303 char *ret;
304 int len;
306 *new_sym = NULL;
308 if (!sym || !sym->ident)
309 return NULL;
311 ret = get_pointed_at(name, sym, new_sym);
312 if (ret)
313 return ret;
315 ret = map_long_to_short_name_sym(name, sym, new_sym, use_stack);
316 if (ret)
317 return ret;
319 len = snprintf(buf, sizeof(buf), "%s", name);
320 if (len >= sizeof(buf) - 2)
321 return NULL;
323 while (use_stack && len >= 1) {
324 if (buf[len] == '>' && buf[len - 1] == '-') {
325 len--;
326 buf[len] = '\0';
327 ret = get_other_name_sym_from_chunk(name, buf, len + 2, sym, new_sym);
328 if (ret)
329 return ret;
331 len--;
334 ret = get_long_name_sym(name, sym, new_sym, use_stack);
335 if (ret)
336 return ret;
338 return NULL;
/* Look up another name for name/sym with the use_stack lookups enabled. */
char *get_other_name_sym(const char *name, struct symbol *sym, struct symbol **new_sym)
{
	const bool use_stack = true;

	return get_other_name_sym_helper(name, sym, new_sym, use_stack);
}
/* Look up another name for name/sym with the use_stack lookups disabled. */
char *get_other_name_sym_nostack(const char *name, struct symbol *sym, struct symbol **new_sym)
{
	const bool use_stack = false;

	return get_other_name_sym_helper(name, sym, new_sym, use_stack);
}
/*
 * Record a modification of name/sym, and mirror the same state onto its
 * other name (as found by get_other_name_sym_nostack()) when one exists.
 */
void set_extra_mod(const char *name, struct symbol *sym, struct expression *expr, struct smatch_state *state)
{
	struct symbol *alias_sym;
	char *alias;

	set_extra_mod_helper(name, sym, expr, state);

	alias = get_other_name_sym_nostack(name, sym, &alias_sym);
	if (alias && alias_sym)
		set_extra_mod_helper(alias, alias_sym, NULL, state);
	free_string(alias);
}
363 static struct expression *chunk_get_array_base(struct expression *expr)
366 * The problem with is_array() is that it only returns true for things
367 * like foo[1] but not for foo[1].bar.
370 expr = strip_expr(expr);
371 while (expr && expr->type == EXPR_DEREF)
372 expr = strip_expr(expr->deref);
373 return get_array_base(expr);
/* Returns 1 when chunk_get_array_base() finds an array base in @expr, else 0. */
static int chunk_has_array(struct expression *expr)
{
	return chunk_get_array_base(expr) != NULL;
}
381 static void clear_array_states(struct expression *array)
383 struct sm_state *sm;
385 sm = get_sm_state_expr(link_id, array);
386 if (sm)
387 match_link_modify(sm, NULL);
390 static void set_extra_array_mod(struct expression *expr, struct smatch_state *state)
392 struct expression *array;
393 struct var_sym_list *vsl;
394 struct var_sym *vs;
395 char *name;
396 struct symbol *sym;
398 array = chunk_get_array_base(expr);
400 name = expr_to_chunk_sym_vsl(expr, &sym, &vsl);
401 if (!name || !vsl) {
402 clear_array_states(array);
403 goto free;
406 FOR_EACH_PTR(vsl, vs) {
407 store_link(link_id, vs->var, vs->sym, name, sym);
408 } END_FOR_EACH_PTR(vs);
410 call_extra_mod_hooks(name, sym, expr, state);
411 set_state(SMATCH_EXTRA, name, sym, state);
412 free:
413 free_string(name);
/*
 * Record that @expr was modified and now has @state.
 *
 * Expressions containing an array access go through set_extra_array_mod();
 * everything else must resolve to a name and symbol or it is ignored.
 */
void set_extra_expr_mod(struct expression *expr, struct smatch_state *state)
{
	struct symbol *sym;
	char *var;

	if (chunk_has_array(expr)) {
		set_extra_array_mod(expr, state);
		return;
	}

	expr = strip_expr(expr);
	var = expr_to_var_sym(expr, &sym);
	if (var && sym)
		set_extra_mod(var, sym, expr, state);
	free_string(var);
}
435 void set_extra_nomod(const char *name, struct symbol *sym, struct expression *expr, struct smatch_state *state)
437 char *new_name;
438 struct symbol *new_sym;
439 struct relation *rel;
440 struct smatch_state *orig_state;
442 orig_state = get_state(SMATCH_EXTRA, name, sym);
444 /* don't save unknown states if leaving it blank is the same */
445 if (!orig_state && estate_is_unknown(state))
446 return;
448 new_name = get_other_name_sym(name, sym, &new_sym);
449 if (new_name && new_sym)
450 set_extra_nomod_helper(new_name, new_sym, expr, state);
451 free_string(new_name);
453 if (!estate_related(orig_state)) {
454 set_extra_nomod_helper(name, sym, expr, state);
455 return;
458 set_related(state, estate_related(orig_state));
459 FOR_EACH_PTR(estate_related(orig_state), rel) {
460 struct smatch_state *estate;
462 estate = get_state(SMATCH_EXTRA, rel->name, rel->sym);
463 if (!estate)
464 continue;
465 set_extra_nomod_helper(rel->name, rel->sym, expr, clone_estate_cast(estate_type(estate), state));
466 } END_FOR_EACH_PTR(rel);
469 void set_extra_nomod_vsl(const char *name, struct symbol *sym, struct var_sym_list *vsl, struct expression *expr, struct smatch_state *state)
471 struct var_sym *vs;
473 FOR_EACH_PTR(vsl, vs) {
474 store_link(link_id, vs->var, vs->sym, name, sym);
475 } END_FOR_EACH_PTR(vs);
477 set_extra_nomod(name, sym, expr, state);
481 * This is for return_implies_state() hooks which modify a SMATCH_EXTRA state
483 void set_extra_expr_nomod(struct expression *expr, struct smatch_state *state)
485 struct var_sym_list *vsl;
486 struct var_sym *vs;
487 char *name;
488 struct symbol *sym;
490 name = expr_to_chunk_sym_vsl(expr, &sym, &vsl);
491 if (!name || !vsl)
492 goto free;
493 FOR_EACH_PTR(vsl, vs) {
494 store_link(link_id, vs->var, vs->sym, name, sym);
495 } END_FOR_EACH_PTR(vs);
497 set_extra_nomod(name, sym, expr, state);
498 free:
499 free_string(name);
502 static void set_extra_true_false(const char *name, struct symbol *sym,
503 struct smatch_state *true_state,
504 struct smatch_state *false_state)
506 char *new_name;
507 struct symbol *new_sym;
508 struct relation *rel;
509 struct smatch_state *orig_state;
511 if (!true_state && !false_state)
512 return;
514 if (in_warn_on_macro())
515 return;
517 new_name = get_other_name_sym(name, sym, &new_sym);
518 if (new_name && new_sym)
519 set_true_false_states(SMATCH_EXTRA, new_name, new_sym, true_state, false_state);
520 free_string(new_name);
522 orig_state = get_state(SMATCH_EXTRA, name, sym);
524 if (!estate_related(orig_state)) {
525 set_true_false_states(SMATCH_EXTRA, name, sym, true_state, false_state);
526 return;
529 if (true_state)
530 set_related(true_state, estate_related(orig_state));
531 if (false_state)
532 set_related(false_state, estate_related(orig_state));
534 FOR_EACH_PTR(estate_related(orig_state), rel) {
535 set_true_false_states(SMATCH_EXTRA, rel->name, rel->sym,
536 true_state, false_state);
537 } END_FOR_EACH_PTR(rel);
540 static void set_extra_chunk_true_false(struct expression *expr,
541 struct smatch_state *true_state,
542 struct smatch_state *false_state)
544 struct var_sym_list *vsl;
545 struct var_sym *vs;
546 struct symbol *type;
547 char *name;
548 struct symbol *sym;
550 if (in_warn_on_macro())
551 return;
553 type = get_type(expr);
554 if (!type)
555 return;
557 name = expr_to_chunk_sym_vsl(expr, &sym, &vsl);
558 if (!name || !vsl)
559 goto free;
560 FOR_EACH_PTR(vsl, vs) {
561 store_link(link_id, vs->var, vs->sym, name, sym);
562 } END_FOR_EACH_PTR(vs);
564 set_true_false_states(SMATCH_EXTRA, name, sym,
565 clone_estate(true_state),
566 clone_estate(false_state));
567 free:
568 free_string(name);
571 static void set_extra_expr_true_false(struct expression *expr,
572 struct smatch_state *true_state,
573 struct smatch_state *false_state)
575 char *name;
576 struct symbol *sym;
577 sval_t sval;
579 if (!true_state && !false_state)
580 return;
582 if (get_value(expr, &sval))
583 return;
585 expr = strip_expr(expr);
586 name = expr_to_var_sym(expr, &sym);
587 if (!name || !sym) {
588 free_string(name);
589 set_extra_chunk_true_false(expr, true_state, false_state);
590 return;
592 set_extra_true_false(name, sym, true_state, false_state);
593 free_string(name);
596 static int get_countdown_info(struct expression *condition, struct expression **unop, int *op, sval_t *right)
598 struct expression *unop_expr;
599 int comparison;
600 sval_t limit;
602 right->type = &int_ctype;
603 right->value = 0;
605 condition = strip_expr(condition);
607 if (condition->type == EXPR_COMPARE) {
608 comparison = remove_unsigned_from_comparison(condition->op);
610 if (comparison != SPECIAL_GTE && comparison != '>')
611 return 0;
612 if (!get_value(condition->right, &limit))
613 return 0;
615 unop_expr = condition->left;
616 if (unop_expr->type != EXPR_PREOP && unop_expr->type != EXPR_POSTOP)
617 return 0;
618 if (unop_expr->op != SPECIAL_DECREMENT)
619 return 0;
621 *unop = unop_expr;
622 *op = comparison;
623 *right = limit;
625 return 1;
628 if (condition->type != EXPR_PREOP && condition->type != EXPR_POSTOP)
629 return 0;
630 if (condition->op != SPECIAL_DECREMENT)
631 return 0;
633 *unop = condition;
634 *op = '>';
636 return 1;
639 static struct sm_state *handle_canonical_while_count_down(struct statement *loop)
641 struct expression *iter_var;
642 struct expression *condition, *unop;
643 struct symbol *type;
644 struct sm_state *sm;
645 struct smatch_state *estate;
646 int op;
647 sval_t start, right;
649 right.type = &int_ctype;
650 right.value = 0;
652 condition = strip_expr(loop->iterator_pre_condition);
653 if (!condition)
654 return NULL;
656 if (!get_countdown_info(condition, &unop, &op, &right))
657 return NULL;
659 iter_var = unop->unop;
661 sm = get_sm_state_expr(SMATCH_EXTRA, iter_var);
662 if (!sm)
663 return NULL;
664 if (sval_cmp(estate_min(sm->state), right) < 0)
665 return NULL;
666 start = estate_max(sm->state);
668 type = get_type(iter_var);
669 right = sval_cast(type, right);
670 start = sval_cast(type, start);
672 if (sval_cmp(start, right) <= 0)
673 return NULL;
674 if (!sval_is_max(start))
675 start.value--;
677 if (op == SPECIAL_GTE)
678 right.value--;
680 if (unop->type == EXPR_PREOP) {
681 right.value++;
682 estate = alloc_estate_range(right, start);
683 if (estate_has_hard_max(sm->state))
684 estate_set_hard_max(estate);
685 estate_copy_fuzzy_max(estate, sm->state);
686 set_extra_expr_mod(iter_var, estate);
688 if (unop->type == EXPR_POSTOP) {
689 estate = alloc_estate_range(right, start);
690 if (estate_has_hard_max(sm->state))
691 estate_set_hard_max(estate);
692 estate_copy_fuzzy_max(estate, sm->state);
693 set_extra_expr_mod(iter_var, estate);
695 return get_sm_state_expr(SMATCH_EXTRA, iter_var);
698 static struct sm_state *handle_canonical_for_inc(struct expression *iter_expr,
699 struct expression *condition)
701 struct expression *iter_var;
702 struct sm_state *sm;
703 struct smatch_state *estate;
704 sval_t start, end, max;
705 struct symbol *type;
707 iter_var = iter_expr->unop;
708 sm = get_sm_state_expr(SMATCH_EXTRA, iter_var);
709 if (!sm)
710 return NULL;
711 if (!estate_get_single_value(sm->state, &start))
712 return NULL;
713 if (!get_implied_value(condition->right, &end))
714 return NULL;
716 if (get_sm_state_expr(SMATCH_EXTRA, condition->left) != sm)
717 return NULL;
719 switch (condition->op) {
720 case SPECIAL_UNSIGNED_LT:
721 case SPECIAL_NOTEQUAL:
722 case '<':
723 if (!sval_is_min(end))
724 end.value--;
725 break;
726 case SPECIAL_UNSIGNED_LTE:
727 case SPECIAL_LTE:
728 break;
729 default:
730 return NULL;
732 if (sval_cmp(end, start) < 0)
733 return NULL;
734 type = get_type(iter_var);
735 start = sval_cast(type, start);
736 end = sval_cast(type, end);
737 estate = alloc_estate_range(start, end);
738 if (get_hard_max(condition->right, &max)) {
739 if (!get_macro_name(condition->pos))
740 estate_set_hard_max(estate);
741 if (condition->op == '<' ||
742 condition->op == SPECIAL_UNSIGNED_LT ||
743 condition->op == SPECIAL_NOTEQUAL)
744 max.value--;
745 max = sval_cast(type, max);
746 estate_set_fuzzy_max(estate, max);
748 set_extra_expr_mod(iter_var, estate);
749 return get_sm_state_expr(SMATCH_EXTRA, iter_var);
752 static struct sm_state *handle_canonical_for_dec(struct expression *iter_expr,
753 struct expression *condition)
755 struct expression *iter_var;
756 struct sm_state *sm;
757 struct smatch_state *estate;
758 sval_t start, end;
760 iter_var = iter_expr->unop;
761 sm = get_sm_state_expr(SMATCH_EXTRA, iter_var);
762 if (!sm)
763 return NULL;
764 if (!estate_get_single_value(sm->state, &start))
765 return NULL;
766 if (!get_implied_min(condition->right, &end))
767 end = sval_type_min(get_type(iter_var));
768 end = sval_cast(estate_type(sm->state), end);
769 if (get_sm_state_expr(SMATCH_EXTRA, condition->left) != sm)
770 return NULL;
772 switch (condition->op) {
773 case SPECIAL_NOTEQUAL:
774 case '>':
775 if (!sval_is_max(end))
776 end.value++;
777 break;
778 case SPECIAL_GTE:
779 break;
780 default:
781 return NULL;
783 if (sval_cmp(end, start) > 0)
784 return NULL;
785 estate = alloc_estate_range(end, start);
786 estate_set_hard_max(estate);
787 estate_set_fuzzy_max(estate, estate_get_fuzzy_max(estate));
788 set_extra_expr_mod(iter_var, estate);
789 return get_sm_state_expr(SMATCH_EXTRA, iter_var);
792 static struct sm_state *handle_canonical_for_loops(struct statement *loop)
794 struct expression *iter_expr;
795 struct expression *condition;
797 if (!loop->iterator_post_statement)
798 return NULL;
799 if (loop->iterator_post_statement->type != STMT_EXPRESSION)
800 return NULL;
801 iter_expr = loop->iterator_post_statement->expression;
802 if (!loop->iterator_pre_condition)
803 return NULL;
804 if (loop->iterator_pre_condition->type != EXPR_COMPARE)
805 return NULL;
806 condition = loop->iterator_pre_condition;
808 if (iter_expr->op == SPECIAL_INCREMENT)
809 return handle_canonical_for_inc(iter_expr, condition);
810 if (iter_expr->op == SPECIAL_DECREMENT)
811 return handle_canonical_for_dec(iter_expr, condition);
812 return NULL;
815 struct sm_state *__extra_handle_canonical_loops(struct statement *loop, struct stree **stree)
817 struct sm_state *ret;
820 * Canonical loops are a hack. The proper way to handle this is to
821 * use two passes, but unfortunately, doing two passes makes parsing
822 * code twice as slow.
824 * What we do is we set the inside state here, which overwrites whatever
825 * __extra_match_condition() does. Then we set the outside state in
826 * __extra_pre_loop_hook_after().
829 __push_fake_cur_stree();
830 if (!loop->iterator_post_statement)
831 ret = handle_canonical_while_count_down(loop);
832 else
833 ret = handle_canonical_for_loops(loop);
834 *stree = __pop_fake_cur_stree();
835 return ret;
838 int __iterator_unchanged(struct sm_state *sm)
840 if (!sm)
841 return 0;
842 if (get_sm_state(my_id, sm->name, sm->sym) == sm)
843 return 1;
844 return 0;
847 static void while_count_down_after(struct sm_state *sm, struct expression *condition)
849 struct expression *unop;
850 int op;
851 sval_t limit, after_value;
853 if (!get_countdown_info(condition, &unop, &op, &limit))
854 return;
855 after_value = estate_min(sm->state);
856 after_value.value--;
857 set_extra_mod(sm->name, sm->sym, condition->unop, alloc_estate_sval(after_value));
860 void __extra_pre_loop_hook_after(struct sm_state *sm,
861 struct statement *iterator,
862 struct expression *condition)
864 struct expression *iter_expr;
865 sval_t limit;
866 struct smatch_state *state;
868 if (!iterator) {
869 while_count_down_after(sm, condition);
870 return;
873 iter_expr = iterator->expression;
875 if (condition->type != EXPR_COMPARE)
876 return;
877 if (iter_expr->op == SPECIAL_INCREMENT) {
878 limit = sval_binop(estate_max(sm->state), '+',
879 sval_type_val(estate_type(sm->state), 1));
880 } else {
881 limit = sval_binop(estate_min(sm->state), '-',
882 sval_type_val(estate_type(sm->state), 1));
884 limit = sval_cast(estate_type(sm->state), limit);
885 if (!estate_has_hard_max(sm->state) && !__has_breaks()) {
886 if (iter_expr->op == SPECIAL_INCREMENT)
887 state = alloc_estate_range(estate_min(sm->state), limit);
888 else
889 state = alloc_estate_range(limit, estate_max(sm->state));
890 } else {
891 state = alloc_estate_sval(limit);
893 if (!estate_has_hard_max(sm->state)) {
894 estate_clear_hard_max(state);
896 if (estate_has_fuzzy_max(sm->state)) {
897 sval_t hmax = estate_get_fuzzy_max(sm->state);
898 sval_t max = estate_max(sm->state);
900 if (sval_cmp(hmax, max) != 0)
901 estate_clear_fuzzy_max(state);
902 } else if (!estate_has_fuzzy_max(sm->state)) {
903 estate_clear_fuzzy_max(state);
906 set_extra_mod(sm->name, sm->sym, iter_expr, state);
909 static bool get_global_rl(const char *name, struct symbol *sym, struct range_list **rl)
911 struct expression *expr;
913 if (!sym || !(sym->ctype.modifiers & MOD_TOPLEVEL) || !sym->ident)
914 return false;
915 if (strcmp(sym->ident->name, name) != 0)
916 return false;
918 expr = symbol_expression(sym);
919 return get_implied_rl(expr, rl);
922 static struct stree *unmatched_stree;
923 static struct smatch_state *unmatched_state(struct sm_state *sm)
925 struct smatch_state *state;
926 struct range_list *rl;
928 if (unmatched_stree) {
929 state = get_state_stree(unmatched_stree, SMATCH_EXTRA, sm->name, sm->sym);
930 if (state)
931 return state;
933 if (parent_is_gone_var_sym(sm->name, sm->sym))
934 return alloc_estate_empty();
935 if (get_global_rl(sm->name, sm->sym, &rl))
936 return alloc_estate_rl(rl);
937 return alloc_estate_whole(estate_type(sm->state));
940 static void clear_the_pointed_at(struct expression *expr)
942 struct stree *stree;
943 char *name;
944 struct symbol *sym;
945 struct sm_state *tmp;
947 name = expr_to_var_sym(expr, &sym);
948 if (!name || !sym)
949 goto free;
951 stree = __get_cur_stree();
952 FOR_EACH_MY_SM(SMATCH_EXTRA, stree, tmp) {
953 if (tmp->name[0] != '*')
954 continue;
955 if (tmp->sym != sym)
956 continue;
957 if (strcmp(tmp->name + 1, name) != 0)
958 continue;
959 set_extra_mod(tmp->name, tmp->sym, expr, alloc_estate_whole(estate_type(tmp->state)));
960 } END_FOR_EACH_SM(tmp);
962 free:
963 free_string(name);
966 static int is_const_param(struct expression *expr, int param)
968 struct symbol *type;
970 type = get_arg_type(expr, param);
971 if (!type)
972 return 0;
973 if (type->ctype.modifiers & MOD_CONST)
974 return 1;
975 return 0;
978 static void match_function_call(struct expression *expr)
980 struct expression *arg;
981 struct expression *tmp;
982 int param = -1;
984 /* if we have the db this is handled in smatch_function_hooks.c */
985 if (!option_no_db)
986 return;
987 if (inlinable(expr->fn))
988 return;
990 FOR_EACH_PTR(expr->args, arg) {
991 param++;
992 if (is_const_param(expr->fn, param))
993 continue;
994 tmp = strip_expr(arg);
995 if (tmp->type == EXPR_PREOP && tmp->op == '&')
996 set_extra_expr_mod(tmp->unop, alloc_estate_whole(get_type(tmp->unop)));
997 else
998 clear_the_pointed_at(tmp);
999 } END_FOR_EACH_PTR(arg);
/*
 * Returns 1 when every value @right may hold (its absolute range) is
 * representable in the type of @left, 0 otherwise or when @left has no
 * type.  Identical types always fit.
 */
int values_fit_type(struct expression *left, struct expression *right)
{
	struct symbol *dest_type = get_type(left);
	struct range_list *rl;

	if (!dest_type)
		return 0;

	get_absolute_rl(right, &rl);
	if (dest_type == rl_type(rl))
		return 1;

	if (type_unsigned(dest_type) && sval_is_negative(rl_min(rl)))
		return 0;
	if (sval_cmp(sval_type_min(dest_type), rl_min(rl)) > 0 ||
	    sval_cmp(sval_type_max(dest_type), rl_max(rl)) < 0)
		return 0;

	return 1;
}
1022 static void save_chunk_info(struct expression *left, struct expression *right)
1024 struct var_sym_list *vsl;
1025 struct var_sym *vs;
1026 struct expression *add_expr;
1027 struct symbol *type;
1028 sval_t sval;
1029 char *name;
1030 struct symbol *sym;
1032 if (right->type != EXPR_BINOP || right->op != '-')
1033 return;
1034 if (!get_value(right->left, &sval))
1035 return;
1036 if (!expr_to_sym(right->right))
1037 return;
1039 add_expr = binop_expression(left, '+', right->right);
1040 type = get_type(add_expr);
1041 if (!type)
1042 return;
1043 name = expr_to_chunk_sym_vsl(add_expr, &sym, &vsl);
1044 if (!name || !vsl)
1045 goto free;
1046 FOR_EACH_PTR(vsl, vs) {
1047 store_link(link_id, vs->var, vs->sym, name, sym);
1048 } END_FOR_EACH_PTR(vs);
1050 set_state(SMATCH_EXTRA, name, sym, alloc_estate_sval(sval_cast(type, sval)));
1051 free:
1052 free_string(name);
/*
 * Record an assignment to an array-element expression.
 *
 * For a plain '=' the new range is the absolute range of @right cast to the
 * type of @left; for any other operator it is the whole range of that type.
 */
static void do_array_assign(struct expression *left, int op, struct expression *right)
{
	struct range_list *rl;

	if (op != '=') {
		rl = alloc_whole_rl(get_type(left));
	} else {
		get_absolute_rl(right, &rl);
		rl = cast_rl(get_type(left), rl);
	}

	set_extra_array_mod(left, alloc_estate_rl(rl));
}
1069 static void match_vanilla_assign(struct expression *left, struct expression *right)
1071 struct range_list *orig_rl = NULL;
1072 struct range_list *rl = NULL;
1073 struct symbol *right_sym;
1074 struct symbol *left_type;
1075 struct symbol *right_type;
1076 char *right_name = NULL;
1077 struct symbol *sym;
1078 char *name;
1079 sval_t sval, max;
1080 struct smatch_state *state;
1081 int comparison;
1083 if (is_struct(left))
1084 return;
1086 save_chunk_info(left, right);
1088 name = expr_to_var_sym(left, &sym);
1089 if (!name) {
1090 if (chunk_has_array(left))
1091 do_array_assign(left, '=', right);
1092 return;
1095 left_type = get_type(left);
1096 right_type = get_type(right);
1098 right_name = expr_to_var_sym(right, &right_sym);
1100 if (!__in_fake_assign &&
1101 !(right->type == EXPR_PREOP && right->op == '&') &&
1102 right_name && right_sym &&
1103 values_fit_type(left, strip_expr(right)) &&
1104 !has_symbol(right, sym)) {
1105 set_equiv(left, right);
1106 goto free;
1109 if (get_implied_value(right, &sval)) {
1110 state = alloc_estate_sval(sval_cast(left_type, sval));
1111 goto done;
1114 if (__in_fake_assign) {
1115 struct smatch_state *right_state;
1116 sval_t sval;
1118 if (get_value(right, &sval)) {
1119 sval = sval_cast(left_type, sval);
1120 state = alloc_estate_sval(sval);
1121 goto done;
1124 right_state = get_state(SMATCH_EXTRA, right_name, right_sym);
1125 if (right_state) {
1126 /* simple assignment */
1127 state = clone_estate(right_state);
1128 goto done;
1131 state = alloc_estate_rl(alloc_whole_rl(left_type));
1132 goto done;
1135 comparison = get_comparison_no_extra(left, right);
1136 if (comparison) {
1137 comparison = flip_comparison(comparison);
1138 get_implied_rl(left, &orig_rl);
1141 if (get_implied_rl(right, &rl)) {
1142 rl = cast_rl(left_type, rl);
1143 if (orig_rl)
1144 filter_by_comparison(&rl, comparison, orig_rl);
1145 state = alloc_estate_rl(rl);
1146 if (get_hard_max(right, &max)) {
1147 estate_set_hard_max(state);
1148 estate_set_fuzzy_max(state, max);
1150 } else {
1151 rl = alloc_whole_rl(right_type);
1152 rl = cast_rl(left_type, rl);
1153 if (orig_rl)
1154 filter_by_comparison(&rl, comparison, orig_rl);
1155 state = alloc_estate_rl(rl);
1158 done:
1159 set_extra_mod(name, sym, left, state);
1160 free:
1161 free_string(right_name);
1164 static void match_assign(struct expression *expr)
1166 struct range_list *rl = NULL;
1167 struct expression *left;
1168 struct expression *right;
1169 struct expression *binop_expr;
1170 struct symbol *left_type;
1171 struct symbol *sym;
1172 char *name;
1174 left = strip_expr(expr->left);
1176 right = strip_parens(expr->right);
1177 if (right->type == EXPR_CALL && sym_name_is("__builtin_expect", right->fn))
1178 right = get_argument_from_call_expr(right->args, 0);
1179 while (right->type == EXPR_ASSIGNMENT && right->op == '=')
1180 right = strip_parens(right->left);
1182 if (expr->op == '=' && is_condition(expr->right))
1183 return; /* handled in smatch_condition.c */
1184 if (expr->op == '=' && right->type == EXPR_CALL)
1185 return; /* handled in smatch_function_hooks.c */
1186 if (expr->op == '=') {
1187 match_vanilla_assign(left, right);
1188 return;
1191 name = expr_to_var_sym(left, &sym);
1192 if (!name)
1193 return;
1195 left_type = get_type(left);
1197 switch (expr->op) {
1198 case SPECIAL_ADD_ASSIGN:
1199 case SPECIAL_SUB_ASSIGN:
1200 case SPECIAL_AND_ASSIGN:
1201 case SPECIAL_MOD_ASSIGN:
1202 case SPECIAL_SHL_ASSIGN:
1203 case SPECIAL_SHR_ASSIGN:
1204 case SPECIAL_OR_ASSIGN:
1205 case SPECIAL_XOR_ASSIGN:
1206 case SPECIAL_MUL_ASSIGN:
1207 case SPECIAL_DIV_ASSIGN:
1208 binop_expr = binop_expression(expr->left,
1209 op_remove_assign(expr->op),
1210 expr->right);
1211 get_absolute_rl(binop_expr, &rl);
1212 rl = cast_rl(left_type, rl);
1213 if (inside_loop()) {
1214 if (expr->op == SPECIAL_ADD_ASSIGN)
1215 add_range(&rl, rl_max(rl), sval_type_max(rl_type(rl)));
1217 if (expr->op == SPECIAL_SUB_ASSIGN &&
1218 !sval_is_negative(rl_min(rl))) {
1219 sval_t zero = { .type = rl_type(rl) };
1221 add_range(&rl, rl_min(rl), zero);
1224 set_extra_mod(name, sym, left, alloc_estate_rl(rl));
1225 goto free;
1227 set_extra_mod(name, sym, left, alloc_estate_whole(left_type));
1228 free:
1229 free_string(name);
1232 static struct smatch_state *increment_state(struct smatch_state *state)
1234 sval_t min = estate_min(state);
1235 sval_t max = estate_max(state);
1237 if (!estate_rl(state))
1238 return NULL;
1240 if (inside_loop())
1241 max = sval_type_max(max.type);
1243 if (!sval_is_min(min) && !sval_is_max(min))
1244 min.value++;
1245 if (!sval_is_min(max) && !sval_is_max(max))
1246 max.value++;
1247 return alloc_estate_range(min, max);
1250 static struct smatch_state *decrement_state(struct smatch_state *state)
1252 sval_t min = estate_min(state);
1253 sval_t max = estate_max(state);
1255 if (!estate_rl(state))
1256 return NULL;
1258 if (inside_loop())
1259 min = sval_type_min(min.type);
1261 if (!sval_is_min(min) && !sval_is_max(min))
1262 min.value--;
1263 if (!sval_is_min(max) && !sval_is_max(max))
1264 max.value--;
1265 return alloc_estate_range(min, max);
1268 static void clear_pointed_at_state(struct expression *expr)
1270 struct symbol *type;
1273 * ALERT: This is sort of a mess. If it's is a struct assigment like
1274 * "foo = bar;", then that's handled by smatch_struct_assignment.c.
1275 * the same thing for p++ where "p" is a struct. Most modifications
1276 * are handled by the assignment hook or the db. Smatch_extra.c doesn't
1277 * use smatch_modification.c because we have to get the ordering right
1278 * or something. So if you have p++ where p is a pointer to a standard
1279 * c type then we handle that here. What a mess.
1281 expr = strip_expr(expr);
1282 type = get_type(expr);
1283 if (!type || type->type != SYM_PTR)
1284 return;
1285 type = get_real_base_type(type);
1286 if (!type || type->type != SYM_BASETYPE)
1287 return;
1288 set_extra_expr_nomod(deref_expression(expr), alloc_estate_whole(type));
1291 static void unop_expr(struct expression *expr)
1293 struct smatch_state *state;
1295 if (expr->smatch_flags & Handled)
1296 return;
1298 switch (expr->op) {
1299 case SPECIAL_INCREMENT:
1300 state = get_state_expr(SMATCH_EXTRA, expr->unop);
1301 state = increment_state(state);
1302 if (!state)
1303 state = alloc_estate_whole(get_type(expr));
1304 set_extra_expr_mod(expr->unop, state);
1305 clear_pointed_at_state(expr->unop);
1306 break;
1307 case SPECIAL_DECREMENT:
1308 state = get_state_expr(SMATCH_EXTRA, expr->unop);
1309 state = decrement_state(state);
1310 if (!state)
1311 state = alloc_estate_whole(get_type(expr));
1312 set_extra_expr_mod(expr->unop, state);
1313 clear_pointed_at_state(expr->unop);
1314 break;
1315 default:
1316 return;
1320 static void asm_expr(struct statement *stmt)
1323 struct expression *expr;
1324 struct symbol *type;
1326 FOR_EACH_PTR(stmt->asm_outputs, expr) {
1327 if (expr->type != EXPR_ASM_OPERAND) {
1328 sm_perror("unexpected asm param type %d", expr->type);
1329 continue;
1331 type = get_type(strip_expr(expr->expr));
1332 set_extra_expr_mod(expr->expr, alloc_estate_whole(type));
1333 } END_FOR_EACH_PTR(expr);
1336 static void check_dereference(struct expression *expr)
1338 struct smatch_state *state;
1340 if (__in_fake_assign)
1341 return;
1342 if (outside_of_function())
1343 return;
1344 state = get_extra_state(expr);
1345 if (state) {
1346 struct range_list *rl;
1348 rl = rl_intersection(estate_rl(state), valid_ptr_rl);
1349 if (rl_equiv(rl, estate_rl(state)))
1350 return;
1351 set_extra_expr_nomod(expr, alloc_estate_rl(rl));
1352 } else {
1353 struct range_list *rl;
1355 if (get_mtag_rl(expr, &rl))
1356 rl = rl_intersection(rl, valid_ptr_rl);
1357 else
1358 rl = clone_rl(valid_ptr_rl);
1360 set_extra_expr_nomod(expr, alloc_estate_rl(rl));
1364 static void match_dereferences(struct expression *expr)
1366 if (expr->type != EXPR_PREOP)
1367 return;
1368 if (getting_address(expr))
1369 return;
1370 /* it's saying that foo[1] = bar dereferences foo[1] */
1371 if (is_array(expr))
1372 return;
1373 check_dereference(expr->unop);
/* An array access dereferences the array's base expression. */
static void match_pointer_as_array(struct expression *expr)
{
	if (is_array(expr))
		check_dereference(get_array_base(expr));
}
1383 static void find_dereferences(struct expression *expr)
1385 while (expr->type == EXPR_PREOP) {
1386 if (expr->op == '*')
1387 check_dereference(expr->unop);
1388 expr = strip_expr(expr->unop);
1392 static void set_param_dereferenced(struct expression *call, struct expression *arg, char *key, char *unused)
1394 struct symbol *sym;
1395 char *name;
1397 name = get_variable_from_key(arg, key, &sym);
1398 if (name && sym) {
1399 struct smatch_state *orig, *new;
1400 struct range_list *rl;
1402 orig = get_state(SMATCH_EXTRA, name, sym);
1403 if (orig) {
1404 rl = rl_intersection(estate_rl(orig),
1405 alloc_rl(valid_ptr_min_sval,
1406 valid_ptr_max_sval));
1407 new = alloc_estate_rl(rl);
1408 } else {
1409 new = alloc_estate_range(valid_ptr_min_sval, valid_ptr_max_sval);
1412 set_extra_nomod(name, sym, NULL, new);
1414 free_string(name);
1416 find_dereferences(arg);
1419 static sval_t add_one(sval_t sval)
1421 sval.value++;
1422 return sval;
1425 static int handle_postop_inc(struct expression *left, int op, struct expression *right)
1427 struct statement *stmt;
1428 struct expression *cond;
1429 struct smatch_state *true_state, *false_state;
1430 struct symbol *type;
1431 sval_t start;
1432 sval_t limit;
1435 * If we're decrementing here then that's a canonical while count down
1436 * so it's handled already. We're only handling loops like:
1437 * i = 0;
1438 * do { ... } while (i++ < 3);
1441 if (left->type != EXPR_POSTOP || left->op != SPECIAL_INCREMENT)
1442 return 0;
1444 stmt = __cur_stmt->parent;
1445 if (!stmt)
1446 return 0;
1447 if (stmt->type == STMT_COMPOUND)
1448 stmt = stmt->parent;
1449 if (!stmt || stmt->type != STMT_ITERATOR || !stmt->iterator_post_condition)
1450 return 0;
1452 cond = strip_expr(stmt->iterator_post_condition);
1453 if (cond->type != EXPR_COMPARE || cond->op != op)
1454 return 0;
1455 if (left != strip_expr(cond->left) || right != strip_expr(cond->right))
1456 return 0;
1458 if (!get_implied_value(left->unop, &start))
1459 return 0;
1460 if (!get_implied_value(right, &limit))
1461 return 0;
1462 type = get_type(left->unop);
1463 limit = sval_cast(type, limit);
1464 if (sval_cmp(start, limit) > 0)
1465 return 0;
1467 switch (op) {
1468 case '<':
1469 case SPECIAL_UNSIGNED_LT:
1470 break;
1471 case SPECIAL_LTE:
1472 case SPECIAL_UNSIGNED_LTE:
1473 limit = add_one(limit);
1474 default:
1475 return 0;
1479 true_state = alloc_estate_range(add_one(start), limit);
1480 false_state = alloc_estate_range(add_one(limit), add_one(limit));
1482 /* Currently we just discard the false state but when two passes is
1483 * implimented correctly then it will use it.
1486 set_extra_expr_true_false(left->unop, true_state, false_state);
1488 return 1;
/*
 * True when @expr has a tracked state whose range list is empty.
 * An expression with no state at all is not considered impossible.
 */
bool is_impossible_variable(struct expression *expr)
{
	struct smatch_state *cur = get_extra_state(expr);

	return cur && !estate_rl(cur);
}
1501 static bool in_macro(struct expression *left, struct expression *right)
1503 if (!left || !right)
1504 return 0;
1505 if (left->pos.line != right->pos.line || left->pos.pos != right->pos.pos)
1506 return 0;
1507 if (get_macro_name(left->pos))
1508 return 1;
1509 return 0;
1512 static void handle_comparison(struct symbol *type, struct expression *left, int op, struct expression *right)
1514 struct range_list *left_orig;
1515 struct range_list *left_true;
1516 struct range_list *left_false;
1517 struct range_list *right_orig;
1518 struct range_list *right_true;
1519 struct range_list *right_false;
1520 struct smatch_state *left_true_state;
1521 struct smatch_state *left_false_state;
1522 struct smatch_state *right_true_state;
1523 struct smatch_state *right_false_state;
1524 sval_t dummy, hard_max;
1525 int left_postop = 0;
1526 int right_postop = 0;
1528 if (left->op == SPECIAL_INCREMENT || left->op == SPECIAL_DECREMENT) {
1529 if (left->type == EXPR_POSTOP) {
1530 left->smatch_flags |= Handled;
1531 left_postop = left->op;
1532 if (handle_postop_inc(left, op, right))
1533 return;
1535 left = strip_parens(left->unop);
1537 while (left->type == EXPR_ASSIGNMENT)
1538 left = strip_parens(left->left);
1540 if (right->op == SPECIAL_INCREMENT || right->op == SPECIAL_DECREMENT) {
1541 if (right->type == EXPR_POSTOP) {
1542 right->smatch_flags |= Handled;
1543 right_postop = right->op;
1545 right = strip_parens(right->unop);
1548 if (is_impossible_variable(left) || is_impossible_variable(right))
1549 return;
1551 get_real_absolute_rl(left, &left_orig);
1552 left_orig = cast_rl(type, left_orig);
1554 get_real_absolute_rl(right, &right_orig);
1555 right_orig = cast_rl(type, right_orig);
1557 split_comparison_rl(left_orig, op, right_orig, &left_true, &left_false, &right_true, &right_false);
1559 left_true = rl_truncate_cast(get_type(strip_expr(left)), left_true);
1560 left_false = rl_truncate_cast(get_type(strip_expr(left)), left_false);
1561 right_true = rl_truncate_cast(get_type(strip_expr(right)), right_true);
1562 right_false = rl_truncate_cast(get_type(strip_expr(right)), right_false);
1564 if (!left_true || !left_false) {
1565 struct range_list *tmp_true, *tmp_false;
1567 split_comparison_rl(alloc_whole_rl(type), op, right_orig, &tmp_true, &tmp_false, NULL, NULL);
1568 tmp_true = rl_truncate_cast(get_type(strip_expr(left)), tmp_true);
1569 tmp_false = rl_truncate_cast(get_type(strip_expr(left)), tmp_false);
1570 if (tmp_true && tmp_false)
1571 __save_imaginary_state(left, tmp_true, tmp_false);
1574 if (!right_true || !right_false) {
1575 struct range_list *tmp_true, *tmp_false;
1577 split_comparison_rl(alloc_whole_rl(type), op, right_orig, NULL, NULL, &tmp_true, &tmp_false);
1578 tmp_true = rl_truncate_cast(get_type(strip_expr(right)), tmp_true);
1579 tmp_false = rl_truncate_cast(get_type(strip_expr(right)), tmp_false);
1580 if (tmp_true && tmp_false)
1581 __save_imaginary_state(right, tmp_true, tmp_false);
1584 left_true_state = alloc_estate_rl(left_true);
1585 left_false_state = alloc_estate_rl(left_false);
1586 right_true_state = alloc_estate_rl(right_true);
1587 right_false_state = alloc_estate_rl(right_false);
1589 switch (op) {
1590 case '<':
1591 case SPECIAL_UNSIGNED_LT:
1592 case SPECIAL_UNSIGNED_LTE:
1593 case SPECIAL_LTE:
1594 if (get_implied_value(right, &dummy) && !in_macro(left, right))
1595 estate_set_hard_max(left_true_state);
1596 if (get_implied_value(left, &dummy) && !in_macro(left, right))
1597 estate_set_hard_max(right_false_state);
1598 break;
1599 case '>':
1600 case SPECIAL_UNSIGNED_GT:
1601 case SPECIAL_UNSIGNED_GTE:
1602 case SPECIAL_GTE:
1603 if (get_implied_value(left, &dummy) && !in_macro(left, right))
1604 estate_set_hard_max(right_true_state);
1605 if (get_implied_value(right, &dummy) && !in_macro(left, right))
1606 estate_set_hard_max(left_false_state);
1607 break;
1610 switch (op) {
1611 case '<':
1612 case SPECIAL_UNSIGNED_LT:
1613 case SPECIAL_UNSIGNED_LTE:
1614 case SPECIAL_LTE:
1615 if (get_hard_max(right, &hard_max)) {
1616 if (op == '<' || op == SPECIAL_UNSIGNED_LT)
1617 hard_max.value--;
1618 estate_set_fuzzy_max(left_true_state, hard_max);
1620 if (get_implied_value(right, &hard_max)) {
1621 if (op == SPECIAL_UNSIGNED_LTE ||
1622 op == SPECIAL_LTE)
1623 hard_max.value++;
1624 estate_set_fuzzy_max(left_false_state, hard_max);
1626 if (get_hard_max(left, &hard_max)) {
1627 if (op == SPECIAL_UNSIGNED_LTE ||
1628 op == SPECIAL_LTE)
1629 hard_max.value--;
1630 estate_set_fuzzy_max(right_false_state, hard_max);
1632 if (get_implied_value(left, &hard_max)) {
1633 if (op == '<' || op == SPECIAL_UNSIGNED_LT)
1634 hard_max.value++;
1635 estate_set_fuzzy_max(right_true_state, hard_max);
1637 break;
1638 case '>':
1639 case SPECIAL_UNSIGNED_GT:
1640 case SPECIAL_UNSIGNED_GTE:
1641 case SPECIAL_GTE:
1642 if (get_hard_max(left, &hard_max)) {
1643 if (op == '>' || op == SPECIAL_UNSIGNED_GT)
1644 hard_max.value--;
1645 estate_set_fuzzy_max(right_true_state, hard_max);
1647 if (get_implied_value(left, &hard_max)) {
1648 if (op == SPECIAL_UNSIGNED_GTE ||
1649 op == SPECIAL_GTE)
1650 hard_max.value++;
1651 estate_set_fuzzy_max(right_false_state, hard_max);
1653 if (get_hard_max(right, &hard_max)) {
1654 if (op == SPECIAL_UNSIGNED_LTE ||
1655 op == SPECIAL_LTE)
1656 hard_max.value--;
1657 estate_set_fuzzy_max(left_false_state, hard_max);
1659 if (get_implied_value(right, &hard_max)) {
1660 if (op == '>' ||
1661 op == SPECIAL_UNSIGNED_GT)
1662 hard_max.value++;
1663 estate_set_fuzzy_max(left_true_state, hard_max);
1665 break;
1666 case SPECIAL_EQUAL:
1667 if (get_hard_max(left, &hard_max))
1668 estate_set_fuzzy_max(right_true_state, hard_max);
1669 if (get_hard_max(right, &hard_max))
1670 estate_set_fuzzy_max(left_true_state, hard_max);
1671 break;
1674 if (get_hard_max(left, &hard_max)) {
1675 estate_set_hard_max(left_true_state);
1676 estate_set_hard_max(left_false_state);
1678 if (get_hard_max(right, &hard_max)) {
1679 estate_set_hard_max(right_true_state);
1680 estate_set_hard_max(right_false_state);
1683 if (left_postop == SPECIAL_INCREMENT) {
1684 left_true_state = increment_state(left_true_state);
1685 left_false_state = increment_state(left_false_state);
1687 if (left_postop == SPECIAL_DECREMENT) {
1688 left_true_state = decrement_state(left_true_state);
1689 left_false_state = decrement_state(left_false_state);
1691 if (right_postop == SPECIAL_INCREMENT) {
1692 right_true_state = increment_state(right_true_state);
1693 right_false_state = increment_state(right_false_state);
1695 if (right_postop == SPECIAL_DECREMENT) {
1696 right_true_state = decrement_state(right_true_state);
1697 right_false_state = decrement_state(right_false_state);
1700 if (estate_rl(left_true_state) && estates_equiv(left_true_state, left_false_state)) {
1701 left_true_state = NULL;
1702 left_false_state = NULL;
1705 if (estate_rl(right_true_state) && estates_equiv(right_true_state, right_false_state)) {
1706 right_true_state = NULL;
1707 right_false_state = NULL;
1710 /* Don't introduce new states for known true/false conditions */
1711 if (rl_equiv(left_orig, estate_rl(left_true_state)))
1712 left_true_state = NULL;
1713 if (rl_equiv(left_orig, estate_rl(left_false_state)))
1714 left_false_state = NULL;
1715 if (rl_equiv(right_orig, estate_rl(right_true_state)))
1716 right_true_state = NULL;
1717 if (rl_equiv(right_orig, estate_rl(right_false_state)))
1718 right_false_state = NULL;
1720 set_extra_expr_true_false(left, left_true_state, left_false_state);
1721 set_extra_expr_true_false(right, right_true_state, right_false_state);
1724 static int is_simple_math(struct expression *expr)
1726 if (!expr)
1727 return 0;
1728 if (expr->type != EXPR_BINOP)
1729 return 0;
1730 switch (expr->op) {
1731 case '+':
1732 case '-':
1733 case '*':
1734 return 1;
1736 return 0;
/*
 * Map a simple math operator to its inverse: '+' <-> '-' and '*' -> '/'.
 * Only simple math is of interest here; every other operator yields 0.
 */
static int flip_op(int op)
{
	if (op == '+')
		return '-';
	if (op == '-')
		return '+';
	if (op == '*')
		return '/';
	return 0;
}
1753 static void move_known_to_rl(struct expression **expr_p, struct range_list **rl_p)
1755 struct expression *expr = *expr_p;
1756 struct range_list *rl = *rl_p;
1757 sval_t sval;
1759 if (!is_simple_math(expr))
1760 return;
1762 if (get_implied_value(expr->right, &sval)) {
1763 *expr_p = expr->left;
1764 *rl_p = rl_binop(rl, flip_op(expr->op), alloc_rl(sval, sval));
1765 move_known_to_rl(expr_p, rl_p);
1766 return;
1768 if (expr->op == '-')
1769 return;
1770 if (get_implied_value(expr->left, &sval)) {
1771 *expr_p = expr->right;
1772 *rl_p = rl_binop(rl, flip_op(expr->op), alloc_rl(sval, sval));
1773 move_known_to_rl(expr_p, rl_p);
1774 return;
1778 static void move_known_values(struct expression **left_p, struct expression **right_p)
1780 struct expression *left = *left_p;
1781 struct expression *right = *right_p;
1782 sval_t sval, dummy;
1784 if (get_implied_value(left, &sval)) {
1785 if (!is_simple_math(right))
1786 return;
1787 if (get_implied_value(right, &dummy))
1788 return;
1789 if (right->op == '*') {
1790 sval_t divisor;
1792 if (!get_value(right->right, &divisor))
1793 return;
1794 if (divisor.value == 0)
1795 return;
1796 *left_p = binop_expression(left, invert_op(right->op), right->right);
1797 *right_p = right->left;
1798 return;
1800 if (right->op == '+' && get_value(right->left, &sval)) {
1801 *left_p = binop_expression(left, invert_op(right->op), right->left);
1802 *right_p = right->right;
1803 return;
1805 if (get_value(right->right, &sval)) {
1806 *left_p = binop_expression(left, invert_op(right->op), right->right);
1807 *right_p = right->left;
1808 return;
1810 return;
1812 if (get_implied_value(right, &sval)) {
1813 if (!is_simple_math(left))
1814 return;
1815 if (get_implied_value(left, &dummy))
1816 return;
1817 if (left->op == '*') {
1818 sval_t divisor;
1820 if (!get_value(left->right, &divisor))
1821 return;
1822 if (divisor.value == 0)
1823 return;
1824 *right_p = binop_expression(right, invert_op(left->op), left->right);
1825 *left_p = left->left;
1826 return;
1828 if (left->op == '+' && get_value(left->left, &sval)) {
1829 *right_p = binop_expression(right, invert_op(left->op), left->left);
1830 *left_p = left->right;
1831 return;
1834 if (get_value(left->right, &sval)) {
1835 *right_p = binop_expression(right, invert_op(left->op), left->right);
1836 *left_p = left->left;
1837 return;
1839 return;
1844 * The reason for do_simple_algebra() is to solve things like:
1845 * if (foo > 66 || foo + bar > 64) {
1846 * "foo" is not really a known variable so it won't be handled by
1847 * move_known_variables() but it's a super common idiom.
1850 static int do_simple_algebra(struct expression **left_p, struct expression **right_p)
1852 struct expression *left = *left_p;
1853 struct expression *right = *right_p;
1854 struct range_list *rl;
1855 sval_t tmp;
1857 if (left->type != EXPR_BINOP || left->op != '+')
1858 return 0;
1859 if (can_integer_overflow(get_type(left), left))
1860 return 0;
1861 if (!get_implied_value(right, &tmp))
1862 return 0;
1864 if (!get_implied_value(left->left, &tmp) &&
1865 get_implied_rl(left->left, &rl) &&
1866 !is_whole_rl(rl)) {
1867 *right_p = binop_expression(right, '-', left->left);
1868 *left_p = left->right;
1869 return 1;
1871 if (!get_implied_value(left->right, &tmp) &&
1872 get_implied_rl(left->right, &rl) &&
1873 !is_whole_rl(rl)) {
1874 *right_p = binop_expression(right, '-', left->right);
1875 *left_p = left->left;
1876 return 1;
1879 return 0;
1882 static int match_func_comparison(struct expression *expr)
1884 struct expression *left = strip_expr(expr->left);
1885 struct expression *right = strip_expr(expr->right);
1887 if (left->type == EXPR_CALL || right->type == EXPR_CALL) {
1888 function_comparison(left, expr->op, right);
1889 return 1;
1892 return 0;
1895 /* Handle conditions like "if (foo + bar < foo) {" */
1896 static int handle_integer_overflow_test(struct expression *expr)
1898 struct expression *left, *right;
1899 struct symbol *type;
1900 sval_t left_min, right_min, min, max;
1902 if (expr->op != '<' && expr->op != SPECIAL_UNSIGNED_LT)
1903 return 0;
1905 left = strip_parens(expr->left);
1906 right = strip_parens(expr->right);
1908 if (left->op != '+')
1909 return 0;
1911 type = get_type(expr);
1912 if (!type)
1913 return 0;
1914 if (type_positive_bits(type) == 32) {
1915 max.type = &uint_ctype;
1916 max.uvalue = (unsigned int)-1;
1917 } else if (type_positive_bits(type) == 64) {
1918 max.type = &ulong_ctype;
1919 max.value = (unsigned long long)-1;
1920 } else {
1921 return 0;
1924 if (!expr_equiv(left->left, right) && !expr_equiv(left->right, right))
1925 return 0;
1927 get_absolute_min(left->left, &left_min);
1928 get_absolute_min(left->right, &right_min);
1929 min = sval_binop(left_min, '+', right_min);
1931 type = get_type(left);
1932 min = sval_cast(type, min);
1933 max = sval_cast(type, max);
1935 set_extra_chunk_true_false(left, NULL, alloc_estate_range(min, max));
1936 return 1;
1939 static void match_comparison(struct expression *expr)
1941 struct expression *left_orig = strip_parens(expr->left);
1942 struct expression *right_orig = strip_parens(expr->right);
1943 struct expression *left, *right, *tmp;
1944 struct expression *prev;
1945 struct symbol *type;
1946 int redo, count;
1948 if (match_func_comparison(expr))
1949 return;
1951 type = get_type(expr);
1952 if (!type)
1953 type = &llong_ctype;
1955 if (handle_integer_overflow_test(expr))
1956 return;
1958 left = left_orig;
1959 right = right_orig;
1960 move_known_values(&left, &right);
1961 handle_comparison(type, left, expr->op, right);
1963 left = left_orig;
1964 right = right_orig;
1965 if (do_simple_algebra(&left, &right))
1966 handle_comparison(type, left, expr->op, right);
1968 prev = get_assigned_expr(left_orig);
1969 if (is_simple_math(prev) && has_variable(prev, left_orig) == 0) {
1970 left = prev;
1971 right = right_orig;
1972 move_known_values(&left, &right);
1973 handle_comparison(type, left, expr->op, right);
1976 prev = get_assigned_expr(right_orig);
1977 if (is_simple_math(prev) && has_variable(prev, right_orig) == 0) {
1978 left = left_orig;
1979 right = prev;
1980 move_known_values(&left, &right);
1981 handle_comparison(type, left, expr->op, right);
1984 redo = 0;
1985 left = left_orig;
1986 right = right_orig;
1987 if (get_last_expr_from_expression_stmt(left_orig)) {
1988 left = get_last_expr_from_expression_stmt(left_orig);
1989 redo = 1;
1991 if (get_last_expr_from_expression_stmt(right_orig)) {
1992 right = get_last_expr_from_expression_stmt(right_orig);
1993 redo = 1;
1996 if (!redo)
1997 return;
1999 count = 0;
2000 while ((tmp = get_assigned_expr(left))) {
2001 if (count++ > 3)
2002 break;
2003 left = strip_expr(tmp);
2005 count = 0;
2006 while ((tmp = get_assigned_expr(right))) {
2007 if (count++ > 3)
2008 break;
2009 right = strip_expr(tmp);
2012 handle_comparison(type, left, expr->op, right);
2015 static sval_t get_high_mask(sval_t known)
2017 sval_t ret;
2018 int i;
2020 ret = known;
2021 ret.value = 0;
2023 for (i = type_bits(known.type) - 1; i >= 0; i--) {
2024 if (known.uvalue & (1ULL << i))
2025 ret.uvalue |= (1ULL << i);
2026 else
2027 return ret;
2030 return ret;
2033 static bool handle_bit_test(struct expression *expr)
2035 struct range_list *orig_rl, *rl;
2036 struct expression *shift, *mask, *var;
2037 struct bit_info *bit_info;
2038 sval_t sval;
2039 sval_t high = { .type = &int_ctype };
2040 sval_t low = { .type = &int_ctype };
2042 shift = strip_expr(expr->right);
2043 mask = strip_expr(expr->left);
2044 if (shift->type != EXPR_BINOP || shift->op != SPECIAL_LEFTSHIFT) {
2045 shift = strip_expr(expr->left);
2046 mask = strip_expr(expr->right);
2047 if (shift->type != EXPR_BINOP || shift->op != SPECIAL_LEFTSHIFT)
2048 return false;
2050 if (!get_implied_value(shift->left, &sval) || sval.value != 1)
2051 return false;
2052 var = strip_expr(shift->right);
2054 bit_info = get_bit_info(mask);
2055 if (!bit_info)
2056 return false;
2057 if (!bit_info->possible)
2058 return false;
2060 get_absolute_rl(var, &orig_rl);
2061 if (sval_is_negative(rl_min(orig_rl)) ||
2062 rl_max(orig_rl).uvalue > type_bits(get_type(shift->left)))
2063 return false;
2065 low.value = ffsll(bit_info->possible);
2066 high.value = sm_fls64(bit_info->possible);
2067 rl = alloc_rl(low, high);
2068 rl = cast_rl(get_type(var), rl);
2069 rl = rl_intersection(orig_rl, rl);
2070 if (!rl)
2071 return false;
2073 set_extra_expr_true_false(shift->right, alloc_estate_rl(rl), NULL);
2075 return true;
2078 static void handle_AND_op(struct expression *var, sval_t known)
2080 struct range_list *orig_rl;
2081 struct range_list *true_rl = NULL;
2082 struct range_list *false_rl = NULL;
2083 int bit;
2084 sval_t low_mask = known;
2085 sval_t high_mask;
2086 sval_t max;
2088 get_absolute_rl(var, &orig_rl);
2090 if (known.value > 0) {
2091 bit = ffsll(known.value) - 1;
2092 low_mask.uvalue = (1ULL << bit) - 1;
2093 true_rl = remove_range(orig_rl, sval_type_val(known.type, 0), low_mask);
2095 high_mask = get_high_mask(known);
2096 if (high_mask.value) {
2097 bit = ffsll(high_mask.value) - 1;
2098 low_mask.uvalue = (1ULL << bit) - 1;
2100 false_rl = orig_rl;
2101 if (sval_is_negative(rl_min(orig_rl)))
2102 false_rl = remove_range(false_rl, sval_type_min(known.type), sval_type_val(known.type, -1));
2103 false_rl = remove_range(false_rl, low_mask, sval_type_max(known.type));
2104 if (type_signed(high_mask.type) && type_unsigned(rl_type(false_rl))) {
2105 false_rl = remove_range(false_rl,
2106 sval_type_val(rl_type(false_rl), sval_type_max(known.type).uvalue),
2107 sval_type_val(rl_type(false_rl), -1));
2109 } else if (known.value == 1 &&
2110 get_hard_max(var, &max) &&
2111 sval_cmp(max, rl_max(orig_rl)) == 0 &&
2112 max.value & 1) {
2113 false_rl = remove_range(orig_rl, max, max);
2115 set_extra_expr_true_false(var,
2116 true_rl ? alloc_estate_rl(true_rl) : NULL,
2117 false_rl ? alloc_estate_rl(false_rl) : NULL);
2120 static void handle_AND_condition(struct expression *expr)
2122 sval_t known;
2124 if (handle_bit_test(expr))
2125 return;
2127 if (get_implied_value(expr->left, &known))
2128 handle_AND_op(expr->right, known);
2129 else if (get_implied_value(expr->right, &known))
2130 handle_AND_op(expr->left, known);
2133 static void handle_MOD_condition(struct expression *expr)
2135 struct range_list *orig_rl;
2136 struct range_list *true_rl;
2137 struct range_list *false_rl = NULL;
2138 sval_t right;
2139 sval_t zero = {
2140 .value = 0,
2143 if (!get_implied_value(expr->right, &right) || right.value == 0)
2144 return;
2145 get_absolute_rl(expr->left, &orig_rl);
2147 zero.type = rl_type(orig_rl);
2149 /* We're basically dorking around the min and max here */
2150 true_rl = remove_range(orig_rl, zero, zero);
2151 if (!sval_is_max(rl_max(true_rl)) &&
2152 !(rl_max(true_rl).value % right.value))
2153 true_rl = remove_range(true_rl, rl_max(true_rl), rl_max(true_rl));
2155 if (rl_equiv(true_rl, orig_rl))
2156 true_rl = NULL;
2158 if (sval_is_positive(rl_min(orig_rl)) &&
2159 (rl_max(orig_rl).value - rl_min(orig_rl).value) / right.value < 5) {
2160 sval_t add;
2161 int i;
2163 add = rl_min(orig_rl);
2164 add.value += right.value - (add.value % right.value);
2165 add.value -= right.value;
2167 for (i = 0; i < 5; i++) {
2168 add.value += right.value;
2169 if (add.value > rl_max(orig_rl).value)
2170 break;
2171 add_range(&false_rl, add, add);
2173 } else {
2174 if (rl_min(orig_rl).uvalue != 0 &&
2175 rl_min(orig_rl).uvalue < right.uvalue) {
2176 sval_t chop = right;
2177 chop.value--;
2178 false_rl = remove_range(orig_rl, zero, chop);
2181 if (!sval_is_max(rl_max(orig_rl)) &&
2182 (rl_max(orig_rl).value % right.value)) {
2183 sval_t chop = rl_max(orig_rl);
2184 chop.value -= chop.value % right.value;
2185 chop.value++;
2186 if (!false_rl)
2187 false_rl = clone_rl(orig_rl);
2188 false_rl = remove_range(false_rl, chop, rl_max(orig_rl));
2192 set_extra_expr_true_false(expr->left,
2193 true_rl ? alloc_estate_rl(true_rl) : NULL,
2194 false_rl ? alloc_estate_rl(false_rl) : NULL);
2197 /* this is actually hooked from smatch_implied.c... it's hacky, yes */
2198 void __extra_match_condition(struct expression *expr)
2200 expr = strip_expr(expr);
2201 switch (expr->type) {
2202 case EXPR_CALL:
2203 function_comparison(expr, SPECIAL_NOTEQUAL, zero_expr());
2204 return;
2205 case EXPR_PREOP:
2206 case EXPR_SYMBOL:
2207 case EXPR_DEREF:
2208 handle_comparison(get_type(expr), expr, SPECIAL_NOTEQUAL, zero_expr());
2209 return;
2210 case EXPR_COMPARE:
2211 match_comparison(expr);
2212 return;
2213 case EXPR_ASSIGNMENT:
2214 __extra_match_condition(expr->left);
2215 return;
2216 case EXPR_BINOP:
2217 if (expr->op == '&')
2218 handle_AND_condition(expr);
2219 if (expr->op == '%')
2220 handle_MOD_condition(expr);
2221 return;
2225 static void assume_indexes_are_valid(struct expression *expr)
2227 struct expression *array_expr;
2228 int array_size;
2229 struct expression *offset;
2230 struct symbol *offset_type;
2231 struct range_list *rl_before;
2232 struct range_list *rl_after;
2233 struct range_list *filter = NULL;
2234 sval_t size;
2236 expr = strip_expr(expr);
2237 if (!is_array(expr))
2238 return;
2240 offset = get_array_offset(expr);
2241 offset_type = get_type(offset);
2242 if (offset_type && type_signed(offset_type)) {
2243 filter = alloc_rl(sval_type_min(offset_type),
2244 sval_type_val(offset_type, -1));
2247 array_expr = get_array_base(expr);
2248 array_size = get_real_array_size(array_expr);
2249 if (array_size > 1) {
2250 size = sval_type_val(offset_type, array_size);
2251 add_range(&filter, size, sval_type_max(offset_type));
2254 if (!filter)
2255 return;
2256 get_absolute_rl(offset, &rl_before);
2257 rl_after = rl_filter(rl_before, filter);
2258 if (rl_equiv(rl_before, rl_after))
2259 return;
2260 set_extra_expr_nomod(offset, alloc_estate_rl(rl_after));
2263 /* returns 1 if it is not possible for expr to be value, otherwise returns 0 */
2264 int implied_not_equal(struct expression *expr, long long val)
2266 return !possibly_false(expr, SPECIAL_NOTEQUAL, value_expr(val));
2269 int implied_not_equal_name_sym(char *name, struct symbol *sym, long long val)
2271 struct smatch_state *estate;
2273 estate = get_state(SMATCH_EXTRA, name, sym);
2274 if (!estate)
2275 return 0;
2276 if (!rl_has_sval(estate_rl(estate), sval_type_val(estate_type(estate), 0)))
2277 return 1;
2278 return 0;
2281 int parent_is_null_var_sym(const char *name, struct symbol *sym)
2283 char buf[256];
2284 char *start;
2285 char *end;
2286 struct smatch_state *state;
2288 strncpy(buf, name, sizeof(buf) - 1);
2289 buf[sizeof(buf) - 1] = '\0';
2291 start = &buf[0];
2292 while (*start == '*') {
2293 start++;
2294 state = __get_state(SMATCH_EXTRA, start, sym);
2295 if (!state)
2296 continue;
2297 if (!estate_rl(state))
2298 return 1;
2299 if (estate_min(state).value == 0 &&
2300 estate_max(state).value == 0)
2301 return 1;
2304 start = &buf[0];
2305 while (*start == '&')
2306 start++;
2308 while ((end = strrchr(start, '-'))) {
2309 *end = '\0';
2310 state = __get_state(SMATCH_EXTRA, start, sym);
2311 if (!state)
2312 continue;
2313 if (estate_min(state).value == 0 &&
2314 estate_max(state).value == 0)
2315 return 1;
2317 return 0;
/*
 * Expression flavour of parent_is_null_var_sym().  Returns 0 when @expr
 * cannot be turned into a variable name and symbol.
 */
int parent_is_null(struct expression *expr)
{
	struct symbol *sym;
	char *name;
	int is_null = 0;

	expr = strip_expr(expr);
	name = expr_to_var_sym(expr, &sym);
	if (name && sym)
		is_null = parent_is_null_var_sym(name, sym);

	free_string(name);
	return is_null;
}
/*
 * Row callback: set the int that @found points to to 1 and return 0.
 * The row contents (@argc, @argv, @azColName) are ignored.
 */
static int param_used_callback(void *found, int argc, char **argv, char **azColName)
{
	int *flag = found;

	*flag = 1;
	return 0;
}
2342 static int is_kzalloc_info(struct sm_state *sm)
2344 sval_t sval;
2347 * kzalloc() information is treated as special because so there is just
2348 * a lot of stuff initialized to zero and it makes building the database
2349 * take hours and hours.
2351 * In theory, we should just remove this line and not pass any unused
2352 * information, but I'm not sure enough that this code works so I want
2353 * to hold off on that for now.
2355 if (!estate_get_single_value(sm->state, &sval))
2356 return 0;
2357 if (sval.value != 0)
2358 return 0;
2359 return 1;
2362 static int is_really_long(struct sm_state *sm)
2364 const char *p;
2365 int cnt = 0;
2367 p = sm->name;
2368 while ((p = strstr(p, "->"))) {
2369 p += 2;
2370 cnt++;
2373 if (cnt < 3 ||
2374 strlen(sm->name) < 40)
2375 return 0;
2376 return 1;
2379 static int filter_unused_param_value_info(struct expression *call, int param, char *printed_name, struct sm_state *sm)
2381 int found = 0;
2383 /* for function pointers assume everything is used */
2384 if (call->fn->type != EXPR_SYMBOL)
2385 return 0;
2388 * This is to handle __builtin_mul_overflow(). In an ideal world we
2389 * would only need this for invalid code.
2392 if (!call->fn->symbol)
2393 return 0;
2395 if (!is_kzalloc_info(sm) && !is_really_long(sm))
2396 return 0;
2398 run_sql(&param_used_callback, &found,
2399 "select * from return_implies where %s and type = %d and parameter = %d and key = '%s';",
2400 get_static_filter(call->fn->symbol), PARAM_USED, param, printed_name);
2401 if (found)
2402 return 0;
2404 /* If the database is not built yet, then assume everything is used */
2405 run_sql(&param_used_callback, &found,
2406 "select * from return_implies where %s and type = %d;",
2407 get_static_filter(call->fn->symbol), PARAM_USED);
2408 if (!found)
2409 return 0;
2411 return 1;
/*
 * Narrow "start" by the real absolute range recorded for name/sym.
 * When there is no real absolute state, or it has no range list, "start"
 * is returned unchanged.
 */
struct range_list *intersect_with_real_abs_var_sym(const char *name, struct symbol *sym, struct range_list *start)
{
	struct smatch_state *abs_state;

	/*
	 * Here is the difference between implied value and real absolute, say
	 * you have:
	 *
	 *	int a = (u8)x;
	 *
	 * Then you know that a is 0-255.  That's real absolute.  But you don't
	 * know for sure that it actually goes up to 255.  So it's not implied.
	 * Implied indicates a degree of certainty.
	 *
	 * But then say you cap "a" at 8.  That means you know it goes up to
	 * 8.  So now the implied value is s32min-8.  But you can combine it
	 * with the real absolute to say that actually it's 0-8.
	 *
	 * We are combining it here.  But now that I think about it, this is
	 * probably not the ideal place to combine it because it should
	 * probably be done earlier.  Oh well, this is an improvement on what
	 * was there before so I'm going to commit this code.
	 */
	abs_state = get_real_absolute_state_var_sym(name, sym);
	if (abs_state && estate_rl(abs_state))
		return rl_intersection(estate_rl(abs_state), start);

	return start;
}
/*
 * Narrow "start" by the real absolute range recorded for "expr".  The real
 * absolute range is first cast to the type of "start".  When no usable real
 * absolute state exists, "start" is returned unchanged.
 */
struct range_list *intersect_with_real_abs_expr(struct expression *expr, struct range_list *start)
{
	struct smatch_state *abs_state = get_real_absolute_state(expr);
	struct range_list *casted;

	if (abs_state && estate_rl(abs_state)) {
		casted = cast_rl(rl_type(start), estate_rl(abs_state));
		return rl_intersection(casted, start);
	}

	return start;
}
2459 static void struct_member_callback(struct expression *call, int param, char *printed_name, struct sm_state *sm)
2461 struct range_list *rl;
2462 sval_t dummy;
2464 if (estate_is_whole(sm->state) || !estate_rl(sm->state))
2465 return;
2466 if (filter_unused_param_value_info(call, param, printed_name, sm))
2467 return;
2468 rl = estate_rl(sm->state);
2469 rl = intersect_with_real_abs_var_sym(sm->name, sm->sym, rl);
2470 if (!rl)
2471 return;
2472 sql_insert_caller_info(call, PARAM_VALUE, param, printed_name, show_rl(rl));
2473 if (!estate_get_single_value(sm->state, &dummy)) {
2474 if (estate_has_hard_max(sm->state))
2475 sql_insert_caller_info(call, HARD_MAX, param, printed_name,
2476 sval_to_str(estate_max(sm->state)));
2477 if (estate_has_fuzzy_max(sm->state))
2478 sql_insert_caller_info(call, FUZZY_MAX, param, printed_name,
2479 sval_to_str(estate_get_fuzzy_max(sm->state)));
2483 static void returned_struct_members(int return_id, char *return_ranges, struct expression *expr)
2485 struct symbol *returned_sym;
2486 char *returned_name;
2487 struct sm_state *sm;
2488 char *compare_str;
2489 char name_buf[256];
2490 char val_buf[256];
2491 int len;
2493 // FIXME handle *$
2495 if (!is_pointer(expr))
2496 return;
2498 returned_name = expr_to_var_sym(expr, &returned_sym);
2499 if (!returned_name || !returned_sym)
2500 goto free;
2501 len = strlen(returned_name);
2503 FOR_EACH_MY_SM(my_id, __get_cur_stree(), sm) {
2504 if (!estate_rl(sm->state))
2505 continue;
2506 if (returned_sym != sm->sym)
2507 continue;
2508 if (strncmp(returned_name, sm->name, len) != 0)
2509 continue;
2510 if (sm->name[len] != '-')
2511 continue;
2513 snprintf(name_buf, sizeof(name_buf), "$%s", sm->name + len);
2515 compare_str = name_sym_to_param_comparison(sm->name, sm->sym);
2516 if (!compare_str && estate_is_whole(sm->state))
2517 continue;
2518 snprintf(val_buf, sizeof(val_buf), "%s%s", sm->state->name, compare_str ?: "");
2520 sql_insert_return_states(return_id, return_ranges, PARAM_VALUE,
2521 -1, name_buf, val_buf);
2522 } END_FOR_EACH_SM(sm);
2524 free:
2525 free_string(returned_name);
2528 static void db_limited_before(void)
2530 unmatched_stree = clone_stree(__get_cur_stree());
2533 static void db_limited_after(void)
2535 free_stree(&unmatched_stree);
2538 static int basically_the_same(struct range_list *orig, struct range_list *new)
2540 if (rl_equiv(orig, new))
2541 return 1;
2544 * The whole range is essentially the same as 0,4096-27777777777 so
2545 * don't overwrite the implications just to store that.
2548 if (rl_type(orig)->type == SYM_PTR &&
2549 is_whole_rl(orig) &&
2550 rl_min(new).value == 0 &&
2551 rl_max(new).value == valid_ptr_max)
2552 return 1;
2553 return 0;
2556 static void db_param_limit_binops(struct expression *arg, char *key, struct range_list *rl)
2558 struct range_list *left_rl;
2559 sval_t zero = { .type = rl_type(rl), };
2560 sval_t sval;
2562 if (arg->op != '*')
2563 return;
2564 if (!get_implied_value(arg->right, &sval))
2565 return;
2566 if (can_integer_overflow(get_type(arg), arg))
2567 return;
2569 left_rl = rl_binop(rl, '/', alloc_rl(sval, sval));
2570 if (!rl_has_sval(rl, zero))
2571 left_rl = remove_range(left_rl, zero, zero);
2573 set_extra_expr_nomod(arg->left, alloc_estate_rl(left_rl));
2576 static void db_param_limit_filter(struct expression *expr, int param, char *key, char *value, enum info_type op)
2578 struct expression *arg;
2579 char *name;
2580 struct symbol *sym;
2581 struct var_sym_list *vsl = NULL;
2582 struct sm_state *sm;
2583 struct symbol *compare_type, *var_type;
2584 struct range_list *rl;
2585 struct range_list *limit;
2586 struct range_list *new;
2587 char *other_name;
2588 struct symbol *other_sym;
2590 while (expr->type == EXPR_ASSIGNMENT)
2591 expr = strip_expr(expr->right);
2592 if (expr->type != EXPR_CALL)
2593 return;
2595 arg = get_argument_from_call_expr(expr->args, param);
2596 if (!arg)
2597 return;
2599 if (strcmp(key, "$") == 0)
2600 compare_type = get_arg_type(expr->fn, param);
2601 else
2602 compare_type = get_member_type_from_key(arg, key);
2604 call_results_to_rl(expr, compare_type, value, &limit);
2605 if (strcmp(key, "$") == 0)
2606 move_known_to_rl(&arg, &limit);
2607 name = get_chunk_from_key(arg, key, &sym, &vsl);
2608 if (!name)
2609 return;
2610 if (op != PARAM_LIMIT && !sym)
2611 goto free;
2613 sm = get_sm_state(SMATCH_EXTRA, name, sym);
2614 if (sm)
2615 rl = estate_rl(sm->state);
2616 else
2617 rl = alloc_whole_rl(compare_type);
2619 if (op == PARAM_LIMIT && !rl_fits_in_type(rl, compare_type))
2620 goto free;
2622 new = rl_intersection(rl, limit);
2624 var_type = get_member_type_from_key(arg, key);
2625 new = cast_rl(var_type, new);
2627 /* We want to preserve the implications here */
2628 if (sm && basically_the_same(rl, new))
2629 goto free;
2630 other_name = get_other_name_sym(name, sym, &other_sym);
2632 if (op == PARAM_LIMIT)
2633 set_extra_nomod_vsl(name, sym, vsl, NULL, alloc_estate_rl(new));
2634 else
2635 set_extra_mod(name, sym, NULL, alloc_estate_rl(new));
2637 if (other_name && other_sym) {
2638 if (op == PARAM_LIMIT)
2639 set_extra_nomod_vsl(other_name, other_sym, vsl, NULL, alloc_estate_rl(new));
2640 else
2641 set_extra_mod(other_name, other_sym, NULL, alloc_estate_rl(new));
2644 if (op == PARAM_LIMIT && arg->type == EXPR_BINOP)
2645 db_param_limit_binops(arg, key, new);
2646 free:
2647 free_string(name);
2650 static void db_param_limit(struct expression *expr, int param, char *key, char *value)
2652 db_param_limit_filter(expr, param, key, value, PARAM_LIMIT);
2655 static void db_param_filter(struct expression *expr, int param, char *key, char *value)
2657 db_param_limit_filter(expr, param, key, value, PARAM_FILTER);
2660 static void db_param_add_set(struct expression *expr, int param, char *key, char *value, enum info_type op)
2662 struct expression *arg, *gen_expr;
2663 char *name;
2664 char *other_name = NULL;
2665 struct symbol *sym, *other_sym;
2666 struct symbol *param_type, *arg_type;
2667 struct smatch_state *state;
2668 struct range_list *new = NULL;
2669 struct range_list *added = NULL;
2671 while (expr->type == EXPR_ASSIGNMENT)
2672 expr = strip_expr(expr->right);
2673 if (expr->type != EXPR_CALL)
2674 return;
2676 arg = get_argument_from_call_expr(expr->args, param);
2677 if (!arg)
2678 return;
2680 arg_type = get_arg_type_from_key(expr->fn, param, arg, key);
2681 param_type = get_member_type_from_key(arg, key);
2682 if (param_type && param_type->type == SYM_STRUCT)
2683 return;
2684 name = get_variable_from_key(arg, key, &sym);
2685 if (!name || !sym)
2686 goto free;
2687 gen_expr = gen_expression_from_key(arg, key);
2689 state = get_state(SMATCH_EXTRA, name, sym);
2690 if (state)
2691 new = estate_rl(state);
2693 call_results_to_rl(expr, arg_type, value, &added);
2694 added = cast_rl(param_type, added);
2695 if (op == PARAM_SET)
2696 new = added;
2697 else
2698 new = rl_union(new, added);
2700 other_name = get_other_name_sym_nostack(name, sym, &other_sym);
2701 set_extra_mod(name, sym, gen_expr, alloc_estate_rl(new));
2702 if (other_name && other_sym)
2703 set_extra_mod(other_name, other_sym, gen_expr, alloc_estate_rl(new));
2704 free:
2705 free_string(other_name);
2706 free_string(name);
2709 static void db_param_add(struct expression *expr, int param, char *key, char *value)
2711 in_param_set = true;
2712 db_param_add_set(expr, param, key, value, PARAM_ADD);
2713 in_param_set = false;
2716 static void db_param_set(struct expression *expr, int param, char *key, char *value)
2718 in_param_set = true;
2719 db_param_add_set(expr, param, key, value, PARAM_SET);
2720 in_param_set = false;
2723 static void match_lost_param(struct expression *call, int param)
2725 struct expression *arg;
2727 if (is_const_param(call->fn, param))
2728 return;
2730 arg = get_argument_from_call_expr(call->args, param);
2731 if (!arg)
2732 return;
2734 arg = strip_expr(arg);
2735 if (arg->type == EXPR_PREOP && arg->op == '&')
2736 set_extra_expr_mod(arg->unop, alloc_estate_whole(get_type(arg->unop)));
2737 else
2738 ; /* if pointer then set struct members, maybe?*/
2741 static void db_param_value(struct expression *expr, int param, char *key, char *value)
2743 struct expression *call;
2744 char *name;
2745 struct symbol *sym;
2746 struct symbol *type;
2747 struct range_list *rl = NULL;
2749 if (param != -1)
2750 return;
2752 call = expr;
2753 while (call->type == EXPR_ASSIGNMENT)
2754 call = strip_expr(call->right);
2755 if (call->type != EXPR_CALL)
2756 return;
2758 type = get_member_type_from_key(expr->left, key);
2759 name = get_variable_from_key(expr->left, key, &sym);
2760 if (!name || !sym)
2761 goto free;
2763 call_results_to_rl(call, type, value, &rl);
2765 set_extra_mod(name, sym, NULL, alloc_estate_rl(rl));
2766 free:
2767 free_string(name);
2770 static void match_call_info(struct expression *expr)
2772 struct smatch_state *state;
2773 struct range_list *rl = NULL;
2774 struct expression *arg;
2775 struct symbol *type;
2776 sval_t dummy;
2777 int i = 0;
2779 FOR_EACH_PTR(expr->args, arg) {
2780 type = get_arg_type(expr->fn, i);
2782 get_absolute_rl(arg, &rl);
2783 rl = cast_rl(type, rl);
2785 if (!is_whole_rl(rl)) {
2786 rl = intersect_with_real_abs_expr(arg, rl);
2787 sql_insert_caller_info(expr, PARAM_VALUE, i, "$", show_rl(rl));
2789 state = get_state_expr(SMATCH_EXTRA, arg);
2790 if (!estate_get_single_value(state, &dummy) && estate_has_hard_max(state)) {
2791 sql_insert_caller_info(expr, HARD_MAX, i, "$",
2792 sval_to_str(estate_max(state)));
2794 if (estate_has_fuzzy_max(state)) {
2795 sql_insert_caller_info(expr, FUZZY_MAX, i, "$",
2796 sval_to_str(estate_get_fuzzy_max(state)));
2798 i++;
2799 } END_FOR_EACH_PTR(arg);
2802 static void set_param_value(const char *name, struct symbol *sym, char *key, char *value)
2804 struct expression *expr;
2805 struct range_list *rl = NULL;
2806 struct smatch_state *state;
2807 struct symbol *type;
2808 char *key_orig = key;
2809 char *fullname;
2810 sval_t dummy;
2812 expr = symbol_expression(sym);
2813 fullname = get_variable_from_key(expr, key, NULL);
2814 if (!fullname)
2815 return;
2817 type = get_member_type_from_key(expr, key_orig);
2818 str_to_rl(type, value, &rl);
2819 state = alloc_estate_rl(rl);
2820 if (estate_get_single_value(state, &dummy))
2821 estate_set_hard_max(state);
2822 set_state(SMATCH_EXTRA, fullname, sym, state);
2825 static void set_param_fuzzy_max(const char *name, struct symbol *sym, char *key, char *value)
2827 struct expression *expr;
2828 struct range_list *rl = NULL;
2829 struct smatch_state *state;
2830 struct symbol *type;
2831 char *fullname;
2832 sval_t max;
2834 expr = symbol_expression(sym);
2835 fullname = get_variable_from_key(expr, key, NULL);
2836 if (!fullname)
2837 return;
2839 state = get_state(SMATCH_EXTRA, fullname, sym);
2840 if (!state)
2841 return;
2842 type = estate_type(state);
2843 str_to_rl(type, value, &rl);
2844 if (!rl_to_sval(rl, &max))
2845 return;
2846 estate_set_fuzzy_max(state, max);
2849 static void set_param_hard_max(const char *name, struct symbol *sym, char *key, char *value)
2851 struct smatch_state *state;
2852 struct expression *expr;
2853 char *fullname;
2855 expr = symbol_expression(sym);
2856 fullname = get_variable_from_key(expr, key, NULL);
2857 if (!fullname)
2858 return;
2860 state = get_state(SMATCH_EXTRA, fullname, sym);
2861 if (!state)
2862 return;
2863 estate_set_hard_max(state);
2866 struct sm_state *get_extra_sm_state(struct expression *expr)
2868 char *name;
2869 struct symbol *sym;
2870 struct sm_state *ret = NULL;
2872 name = expr_to_known_chunk_sym(expr, &sym);
2873 if (!name)
2874 goto free;
2876 ret = get_sm_state(SMATCH_EXTRA, name, sym);
2877 free:
2878 free_string(name);
2879 return ret;
2882 struct smatch_state *get_extra_state(struct expression *expr)
2884 struct sm_state *sm;
2886 sm = get_extra_sm_state(expr);
2887 if (!sm)
2888 return NULL;
2889 return sm->state;
2892 void register_smatch_extra(int id)
2894 my_id = id;
2896 set_dynamic_states(my_id);
2897 add_merge_hook(my_id, &merge_estates);
2898 add_unmatched_state_hook(my_id, &unmatched_state);
2899 select_caller_info_hook(set_param_value, PARAM_VALUE);
2900 select_caller_info_hook(set_param_fuzzy_max, FUZZY_MAX);
2901 select_caller_info_hook(set_param_hard_max, HARD_MAX);
2902 select_return_states_before(&db_limited_before);
2903 select_return_states_hook(PARAM_LIMIT, &db_param_limit);
2904 select_return_states_hook(PARAM_FILTER, &db_param_filter);
2905 select_return_states_hook(PARAM_ADD, &db_param_add);
2906 select_return_states_hook(PARAM_SET, &db_param_set);
2907 add_lost_param_hook(&match_lost_param);
2908 select_return_states_hook(PARAM_VALUE, &db_param_value);
2909 select_return_states_after(&db_limited_after);
2912 static void match_link_modify(struct sm_state *sm, struct expression *mod_expr)
2914 struct var_sym_list *links;
2915 struct var_sym *tmp;
2916 struct smatch_state *state;
2918 links = sm->state->data;
2920 FOR_EACH_PTR(links, tmp) {
2921 if (sm->sym == tmp->sym &&
2922 strcmp(sm->name, tmp->var) == 0)
2923 continue;
2924 state = get_state(SMATCH_EXTRA, tmp->var, tmp->sym);
2925 if (!state)
2926 continue;
2927 set_state(SMATCH_EXTRA, tmp->var, tmp->sym, alloc_estate_whole(estate_type(state)));
2928 } END_FOR_EACH_PTR(tmp);
2929 set_state(link_id, sm->name, sm->sym, &undefined);
2932 void register_smatch_extra_links(int id)
2934 link_id = id;
2935 set_dynamic_states(link_id);
2938 void register_smatch_extra_late(int id)
2940 add_merge_hook(link_id, &merge_link_states);
2941 add_modification_hook(link_id, &match_link_modify);
2942 add_hook(&match_dereferences, DEREF_HOOK);
2943 add_hook(&match_pointer_as_array, OP_HOOK);
2944 select_return_implies_hook(DEREFERENCE, &set_param_dereferenced);
2945 add_hook(&match_function_call, FUNCTION_CALL_HOOK);
2946 add_hook(&match_assign, ASSIGNMENT_HOOK);
2947 add_hook(&match_assign, GLOBAL_ASSIGNMENT_HOOK);
2948 add_hook(&unop_expr, OP_HOOK);
2949 add_hook(&asm_expr, ASM_HOOK);
2951 add_hook(&match_call_info, FUNCTION_CALL_HOOK);
2952 add_member_info_callback(my_id, struct_member_callback);
2953 add_split_return_callback(&returned_struct_members);
2955 // add_hook(&assume_indexes_are_valid, OP_HOOK);