math: silence hard max false positives
[smatch.git] / smatch_db.c
blobc3079448d266dda66dc14b505ed5640b3ec792c7
1 /*
2 * Copyright (C) 2010 Dan Carpenter.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version 2
7 * of the License, or (at your option) any later version.
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, see http://www.gnu.org/copyleft/gpl.txt
18 #include <string.h>
19 #include <errno.h>
20 #include <sqlite3.h>
21 #include <unistd.h>
22 #include <ctype.h>
23 #include "smatch.h"
24 #include "smatch_slist.h"
25 #include "smatch_extra.h"
27 static sqlite3 *db;
28 static sqlite3 *mem_db;
30 static int return_id;
/*
 * sql_insert_helper() - emit one "insert into <table> values (...)" statement.
 * @table:  bare table name; it is stringified by the macro
 * @ignore: non-zero to emit "insert or ignore"
 * @late:   non-zero to tag the printed line as "SQL_late" instead of "SQL"
 * @values: printf-style format string followed by its arguments
 *
 * When __inline_fn is set the statement is built in a local buffer and
 * executed against mem_db (nothing happens if mem_db is not open).
 * Otherwise, when option_info is set, the statement is printed to sql_outfd.
 *
 * The statement is dropped if it does not fit in the local buffer: a
 * truncated snprintf() would otherwise move the write pointer past the end
 * of the buffer and make the next size argument wrap around.  The error
 * string allocated by sqlite3_exec() is released with sqlite3_free().
 */
#define sql_insert_helper(table, ignore, late, values...)			\
do {										\
	if (__inline_fn) {							\
		char buf[1024];							\
		char *err = NULL, *p = buf;					\
		int rc;								\
										\
		if (!mem_db)							\
			break;							\
										\
		p += snprintf(p, buf + sizeof(buf) - p,				\
			      "insert %sinto %s values (",			\
			      ignore ? "or ignore " : "", #table);		\
		if (p < buf + sizeof(buf))					\
			p += snprintf(p, buf + sizeof(buf) - p, values);	\
		if (p < buf + sizeof(buf))					\
			p += snprintf(p, buf + sizeof(buf) - p, ");");		\
		if (p >= buf + sizeof(buf)) {					\
			sm_debug("in-mem: statement too long: %s\n", buf);	\
			break;							\
		}								\
		sm_debug("in-mem: %s\n", buf);					\
		rc = sqlite3_exec(mem_db, buf, NULL, NULL, &err);		\
		if (rc != SQLITE_OK) {						\
			fprintf(stderr, "SQL error #2: %s\n", err);		\
			fprintf(stderr, "SQL: '%s'\n", buf);			\
			parse_error = 1;					\
		}								\
		sqlite3_free(err);						\
		break;								\
	}									\
	if (option_info) {							\
		FILE *tmp_fd = sm_outfd;					\
		sm_outfd = sql_outfd;						\
		sm_prefix();							\
		sm_printf("SQL%s: insert %sinto " #table " values(",		\
			  late ? "_late" : "", ignore ? "or ignore " : "");	\
		sm_printf(values);						\
		sm_printf(");\n");						\
		sm_outfd = tmp_fd;						\
	}									\
} while (0)
/*
 * Shorthand forms of sql_insert_helper():
 *   sql_insert()           - plain insert
 *   sql_insert_or_ignore() - "insert or ignore"
 *   sql_insert_late()      - plain insert, printed with the "SQL_late" tag
 * Each expansion already carries its own trailing semicolon.
 */
#define sql_insert(table, values...)		sql_insert_helper(table, 0, 0, values);
#define sql_insert_or_ignore(table, values...)	sql_insert_helper(table, 1, 0, values);
#define sql_insert_late(table, values...)	sql_insert_helper(table, 0, 1, values);
72 struct def_callback {
73 int hook_type;
74 void (*callback)(const char *name, struct symbol *sym, char *key, char *value);
76 ALLOCATOR(def_callback, "definition db hook callbacks");
77 DECLARE_PTR_LIST(callback_list, struct def_callback);
78 static struct callback_list *select_caller_info_callbacks;
80 struct member_info_callback {
81 int owner;
82 void (*callback)(struct expression *call, int param, char *printed_name, struct sm_state *sm);
84 ALLOCATOR(member_info_callback, "caller_info callbacks");
85 DECLARE_PTR_LIST(member_info_cb_list, struct member_info_callback);
86 static struct member_info_cb_list *member_callbacks;
88 struct returned_state_callback {
89 void (*callback)(int return_id, char *return_ranges, struct expression *return_expr);
91 ALLOCATOR(returned_state_callback, "returned state callbacks");
92 DECLARE_PTR_LIST(returned_state_cb_list, struct returned_state_callback);
93 static struct returned_state_cb_list *returned_state_callbacks;
95 struct returned_member_callback {
96 int owner;
97 void (*callback)(int return_id, char *return_ranges, struct expression *expr, char *printed_name, struct smatch_state *state);
99 ALLOCATOR(returned_member_callback, "returned member callbacks");
100 DECLARE_PTR_LIST(returned_member_cb_list, struct returned_member_callback);
101 static struct returned_member_cb_list *returned_member_callbacks;
103 struct call_implies_callback {
104 int type;
105 void (*callback)(struct expression *call, struct expression *arg, char *key, char *value);
107 ALLOCATOR(call_implies_callback, "call_implies callbacks");
108 DECLARE_PTR_LIST(call_implies_cb_list, struct call_implies_callback);
109 static struct call_implies_cb_list *call_implies_cb_list;
/*
 * sqlite3_exec() row callback which prints one result row as a
 * comma-separated line.
 *
 * The separator and the values both go through sm_printf() so that they end
 * up on the same stream.  sqlite passes a NULL pointer for SQL NULL values,
 * so those are printed as the literal text "NULL".
 *
 * Always returns 0 so that the query keeps going.
 */
static int print_sql_output(void *unused, int argc, char **argv, char **azColName)
{
	int i;

	for (i = 0; i < argc; i++) {
		if (i != 0)
			sm_printf(", ");
		sm_printf("%s", argv[i] ? argv[i] : "NULL");
	}
	sm_printf("\n");
	return 0;
}
124 void debug_sql(const char *sql)
126 if (!option_debug)
127 return;
128 sm_msg("%s", sql);
129 sql_exec(print_sql_output, NULL, sql);
132 void debug_mem_sql(const char *sql)
134 if (!option_debug)
135 return;
136 sm_msg("%s", sql);
137 sql_mem_exec(print_sql_output, NULL, sql);
140 void sql_exec(int (*callback)(void*, int, char**, char**), void *data, const char *sql)
142 char *err = NULL;
143 int rc;
145 if (option_no_db || !db)
146 return;
148 rc = sqlite3_exec(db, sql, callback, data, &err);
149 if (rc != SQLITE_OK && !parse_error) {
150 fprintf(stderr, "SQL error #2: %s\n", err);
151 fprintf(stderr, "SQL: '%s'\n", sql);
152 parse_error = 1;
156 void sql_mem_exec(int (*callback)(void*, int, char**, char**), void *data, const char *sql)
158 char *err = NULL;
159 int rc;
161 if (!mem_db)
162 return;
164 rc = sqlite3_exec(mem_db, sql, callback, data, &err);
165 if (rc != SQLITE_OK) {
166 fprintf(stderr, "SQL error #2: %s\n", err);
167 fprintf(stderr, "SQL: '%s'\n", sql);
168 parse_error = 1;
/*
 * replace_table is walked as triples: function name, return range to match,
 * replacement text.  replace_count is the number of strings in the table.
 */
static int replace_count;
static char **replace_table;

/*
 * Look up a replacement for @return_ranges in the current function.
 * Returns the replacement, or @return_ranges itself when nothing matches.
 */
static const char *replace_return_ranges(const char *return_ranges)
{
	int i;

	/* I have no idea why EXPORT_SYMBOL() is here */
	if (!get_function())
		return return_ranges;

	for (i = 0; i < replace_count; i += 3) {
		if (strcmp(replace_table[i + 0], get_function()) != 0)
			continue;
		if (strcmp(replace_table[i + 1], return_ranges) == 0)
			return replace_table[i + 2];
	}
	return return_ranges;
}
191 void sql_insert_return_states(int return_id, const char *return_ranges,
192 int type, int param, const char *key, const char *value)
194 if (key && strlen(key) >= 80)
195 return;
196 return_ranges = replace_return_ranges(return_ranges);
197 sql_insert(return_states, "'%s', '%s', %lu, %d, '%s', %d, %d, %d, '%s', '%s'",
198 get_base_file(), get_function(), (unsigned long)__inline_fn,
199 return_id, return_ranges, fn_static(), type, param, key, value);
202 static struct string_list *common_funcs;
203 static int is_common_function(const char *fn)
205 char *tmp;
207 if (!fn)
208 return 0;
210 if (strncmp(fn, "__builtin_", 10) == 0)
211 return 1;
213 FOR_EACH_PTR(common_funcs, tmp) {
214 if (strcmp(tmp, fn) == 0)
215 return 1;
216 } END_FOR_EACH_PTR(tmp);
218 return 0;
221 static char *function_signature(void)
223 return type_to_str(get_real_base_type(cur_func_sym));
226 void sql_insert_caller_info(struct expression *call, int type,
227 int param, const char *key, const char *value)
229 FILE *tmp_fd = sm_outfd;
230 char *fn;
232 if (!option_info && !__inline_call)
233 return;
235 if (key && strlen(key) >= 80)
236 return;
238 fn = get_fnptr_name(call->fn);
239 if (!fn)
240 return;
242 if (__inline_call) {
243 mem_sql(NULL, NULL,
244 "insert into caller_info values ('%s', '%s', '%s', %lu, %d, %d, %d, '%s', '%s');",
245 get_base_file(), get_function(), fn, (unsigned long)call,
246 is_static(call->fn), type, param, key, value);
249 if (!option_info)
250 return;
252 if (strncmp(fn, "__builtin_", 10) == 0)
253 return;
254 if (type != INTERNAL && is_common_function(fn))
255 return;
257 sm_outfd = caller_info_fd;
258 sm_msg("SQL_caller_info: insert into caller_info values ("
259 "'%s', '%s', '%s', %%CALL_ID%%, %d, %d, %d, '%s', '%s');",
260 get_base_file(), get_function(), fn, is_static(call->fn),
261 type, param, key, value);
262 sm_outfd = tmp_fd;
264 free_string(fn);
267 void sql_insert_function_ptr(const char *fn, const char *struct_name)
269 sql_insert(function_ptr, "'%s', '%s', '%s', 0", get_base_file(), fn,
270 struct_name);
273 void sql_insert_call_implies(int type, int param, const char *key, const char *value)
275 sql_insert(call_implies, "'%s', '%s', %lu, %d, %d, %d, '%s', '%s'", get_base_file(),
276 get_function(), (unsigned long)__inline_fn, fn_static(),
277 type, param, key, value);
280 void sql_insert_function_type_size(const char *member, const char *ranges)
282 sql_insert(function_type_size, "'%s', '%s', '%s', '%s'", get_base_file(), get_function(), member, ranges);
285 void sql_insert_local_values(const char *name, const char *value)
287 sql_insert(local_values, "'%s', '%s', '%s'", get_base_file(), name, value);
290 void sql_insert_function_type_value(const char *type, const char *value)
292 sql_insert(function_type_value, "'%s', '%s', '%s', '%s'", get_base_file(), get_function(), type, value);
295 void sql_insert_function_type(int param, const char *value)
297 sql_insert(function_type, "'%s', '%s', %d, %d, '%s'",
298 get_base_file(), get_function(), fn_static(), param, value);
301 void sql_insert_parameter_name(int param, const char *value)
303 sql_insert(parameter_name, "'%s', '%s', %d, %d, '%s'",
304 get_base_file(), get_function(), fn_static(), param, value);
307 void sql_insert_data_info(struct expression *data, int type, const char *value)
309 char *data_name;
311 data_name = get_data_info_name(data);
312 if (!data_name)
313 return;
314 sql_insert(data_info, "'%s', '%s', %d, '%s'",
315 is_static(data) ? get_base_file() : "extern",
316 data_name, type, value);
319 void sql_insert_data_info_var_sym(const char *var, struct symbol *sym, int type, const char *value)
321 sql_insert(data_info, "'%s', '%s', %d, '%s'",
322 (sym->ctype.modifiers & MOD_STATIC) ? get_base_file() : "extern",
323 var, type, value);
326 void sql_save_constraint(const char *con)
328 if (!option_info)
329 return;
331 sm_msg("SQL: insert or ignore into constraints (str) values('%s');", con);
334 void sql_save_constraint_required(const char *data, int op, const char *limit)
336 sql_insert_or_ignore(constraints_required, "'%s', '%s', '%s'", data, show_special(op), limit);
339 void sql_copy_constraint_required(const char *new_limit, const char *old_limit)
341 if (!option_info)
342 return;
344 sm_msg("SQL_late: insert or ignore into constraints_required (data, op, bound) "
345 "select constraints_required.data, constraints_required.op, '%s' from "
346 "constraints_required where bound = '%s';", new_limit, old_limit);
349 void sql_insert_fn_ptr_data_link(const char *ptr, const char *data)
351 sql_insert_or_ignore(fn_ptr_data_link, "'%s', '%s'", ptr, data);
354 void sql_insert_fn_data_link(struct expression *fn, int type, int param, const char *key, const char *value)
356 if (fn->type != EXPR_SYMBOL || !fn->symbol->ident)
357 return;
359 sql_insert(fn_data_link, "'%s', '%s', %d, %d, %d, '%s', '%s'",
360 (fn->symbol->ctype.modifiers & MOD_STATIC) ? get_base_file() : "extern",
361 fn->symbol->ident->name,
362 !!(fn->symbol->ctype.modifiers & MOD_STATIC),
363 type, param, key, value);
366 void sql_insert_mtag_about(mtag_t tag, const char *left_name, const char *right_name)
368 sql_insert(mtag_about, "%lld, '%s', '%s', %d, '%s', '%s'",
369 tag, get_filename(), get_function(), get_lineno(), left_name, right_name);
372 void sql_insert_mtag_data(mtag_t tag, const char *var, int offset, int type, const char *value)
374 sql_insert(mtag_data, "%lld, '%s', %d, %d, '%s'", tag, var, offset, type, value);
377 void sql_insert_mtag_map(mtag_t tag, int offset, mtag_t container)
379 sql_insert(mtag_map, "%lld, %d, %lld", tag, offset, container);
382 static int save_mtag(void *_tag, int argc, char **argv, char **azColName)
384 mtag_t *tag = _tag;
386 if (!*tag)
387 *tag = strtoll(argv[0], NULL, 10);
388 else
389 *tag = -1ULL;
391 return 0;
394 int mtag_map_select_container(mtag_t tag, int offset, mtag_t *container)
396 mtag_t tmp = 0;
398 run_sql(save_mtag, &tmp,
399 "select container from mtag_map where tag = %lld and offset = %d;",
400 tag, offset);
402 if (tmp == 0 || tmp == -1ULL)
403 return 0;
404 *container = tmp;
405 return 1;
408 int mtag_map_select_tag(mtag_t container, int offset, mtag_t *tag)
410 mtag_t tmp = 0;
412 run_sql(save_mtag, &tmp,
413 "select tag from mtag_map where container = %lld and offset = %d;",
414 container, offset);
416 if (tmp == 0 || tmp == -1ULL)
417 return 0;
418 *tag = tmp;
419 return 1;
422 char *get_static_filter(struct symbol *sym)
424 static char sql_filter[1024];
426 /* This can only happen on buggy code. Return invalid SQL. */
427 if (!sym) {
428 sql_filter[0] = '\0';
429 return sql_filter;
432 if (sym->ctype.modifiers & MOD_STATIC) {
433 snprintf(sql_filter, sizeof(sql_filter),
434 "file = '%s' and function = '%s' and static = '1'",
435 get_base_file(), sym->ident->name);
436 } else {
437 snprintf(sql_filter, sizeof(sql_filter),
438 "function = '%s' and static = '0'", sym->ident->name);
441 return sql_filter;
/*
 * Row callback for "select count(*)" queries.  Stores the single column as
 * an int in the location @_row_count points to; stores 0 when the row does
 * not have exactly one column.
 */
static int get_row_count(void *_row_count, int argc, char **argv, char **azColName)
{
	int *count_out = _row_count;

	*count_out = (argc == 1) ? atoi(argv[0]) : 0;
	return 0;
}
455 static void mark_params_untracked(struct expression *call)
457 struct expression *arg;
458 int i = 0;
460 FOR_EACH_PTR(call->args, arg) {
461 mark_untracked(call, i++, "$", NULL);
462 } END_FOR_EACH_PTR(arg);
465 static void sql_select_return_states_pointer(const char *cols,
466 struct expression *call, int (*callback)(void*, int, char**, char**), void *info)
468 char *ptr;
469 int return_count = 0;
471 ptr = get_fnptr_name(call->fn);
472 if (!ptr)
473 return;
475 run_sql(get_row_count, &return_count,
476 "select count(*) from return_states join function_ptr "
477 "where return_states.function == function_ptr.function and "
478 "ptr = '%s' and searchable = 1 and type = %d;", ptr, INTERNAL);
479 /* The magic number 100 is just from testing on the kernel. */
480 if (return_count > 100) {
481 mark_params_untracked(call);
482 return;
485 run_sql(callback, info,
486 "select %s from return_states join function_ptr where "
487 "return_states.function == function_ptr.function and ptr = '%s' "
488 "and searchable = 1 "
489 "order by function_ptr.file, return_states.file, return_id, type;",
490 cols, ptr);
493 static int is_local_symbol(struct expression *expr)
495 if (expr->type != EXPR_SYMBOL)
496 return 0;
497 if (expr->symbol->ctype.modifiers & (MOD_NONLOCAL | MOD_STATIC | MOD_ADDRESSABLE))
498 return 0;
499 return 1;
502 void sql_select_return_states(const char *cols, struct expression *call,
503 int (*callback)(void*, int, char**, char**), void *info)
505 int row_count = 0;
507 if (is_fake_call(call))
508 return;
510 if (call->fn->type != EXPR_SYMBOL || !call->fn->symbol || is_local_symbol(call->fn)) {
511 sql_select_return_states_pointer(cols, call, callback, info);
512 return;
515 if (inlinable(call->fn)) {
516 mem_sql(callback, info,
517 "select %s from return_states where call_id = '%lu' order by return_id, type;",
518 cols, (unsigned long)call);
519 return;
522 run_sql(get_row_count, &row_count, "select count(*) from return_states where %s;",
523 get_static_filter(call->fn->symbol));
524 if (row_count > 3000)
525 return;
527 run_sql(callback, info, "select %s from return_states where %s order by file, return_id, type;",
528 cols, get_static_filter(call->fn->symbol));
531 void sql_select_call_implies(const char *cols, struct expression *call,
532 int (*callback)(void*, int, char**, char**))
534 if (call->fn->type != EXPR_SYMBOL || !call->fn->symbol)
535 return;
537 if (inlinable(call->fn)) {
538 mem_sql(callback, call,
539 "select %s from call_implies where call_id = '%lu';",
540 cols, (unsigned long)call);
541 return;
544 run_sql(callback, call, "select %s from call_implies where %s;",
545 cols, get_static_filter(call->fn->symbol));
/* State shared between match_data_from_db() and caller_info_callback(). */
struct select_caller_info_data {
	struct stree *final_states;	/* merged states of the call sites seen so far */
	struct timeval start_time;	/* when the lookup started */
	int prev_func_id;		/* call_id of the previous row, -1 before the first */
	int ignore;			/* set when the current call site's signature mismatched */
	int results;			/* set once any row has been delivered */
};

static int caller_info_callback(void *_data, int argc, char **argv, char **azColName);
558 static void sql_select_caller_info(struct select_caller_info_data *data,
559 const char *cols, struct symbol *sym)
561 if (__inline_fn) {
562 mem_sql(caller_info_callback, data,
563 "select %s from caller_info where call_id = %lu;",
564 cols, (unsigned long)__inline_fn);
565 return;
568 if (sym->ident->name && is_common_function(sym->ident->name))
569 return;
570 run_sql(caller_info_callback, data,
571 "select %s from common_caller_info where %s order by call_id;",
572 cols, get_static_filter(sym));
573 if (data->results)
574 return;
576 run_sql(caller_info_callback, data,
577 "select %s from caller_info where %s order by call_id;",
578 cols, get_static_filter(sym));
581 void select_caller_info_hook(void (*callback)(const char *name, struct symbol *sym, char *key, char *value), int type)
583 struct def_callback *def_callback = __alloc_def_callback(0);
585 def_callback->hook_type = type;
586 def_callback->callback = callback;
587 add_ptr_list(&select_caller_info_callbacks, def_callback);
591 * These call backs are used when the --info option is turned on to print struct
592 * member information. For example foo->bar could have a state in
593 * smatch_extra.c and also check_user.c.
595 void add_member_info_callback(int owner, void (*callback)(struct expression *call, int param, char *printed_name, struct sm_state *sm))
597 struct member_info_callback *member_callback = __alloc_member_info_callback(0);
599 member_callback->owner = owner;
600 member_callback->callback = callback;
601 add_ptr_list(&member_callbacks, member_callback);
604 void add_split_return_callback(void (*fn)(int return_id, char *return_ranges, struct expression *returned_expr))
606 struct returned_state_callback *callback = __alloc_returned_state_callback(0);
608 callback->callback = fn;
609 add_ptr_list(&returned_state_callbacks, callback);
612 void add_returned_member_callback(int owner, void (*callback)(int return_id, char *return_ranges, struct expression *expr, char *printed_name, struct smatch_state *state))
614 struct returned_member_callback *member_callback = __alloc_returned_member_callback(0);
616 member_callback->owner = owner;
617 member_callback->callback = callback;
618 add_ptr_list(&returned_member_callbacks, member_callback);
621 void select_call_implies_hook(int type, void (*callback)(struct expression *call, struct expression *arg, char *key, char *value))
623 struct call_implies_callback *cb = __alloc_call_implies_callback(0);
625 cb->type = type;
626 cb->callback = callback;
627 add_ptr_list(&call_implies_cb_list, cb);
/* Accumulator handed to db_return_callback(). */
struct return_info {
	struct expression *static_returns_call;	/* the call being looked up, may be NULL */
	struct symbol *return_type;		/* type the ranges are parsed as */
	struct range_list *return_range_list;	/* union of all ranges seen so far */
};
636 static int db_return_callback(void *_ret_info, int argc, char **argv, char **azColName)
638 struct return_info *ret_info = _ret_info;
639 struct range_list *rl;
640 struct expression *call_expr = ret_info->static_returns_call;
642 if (argc != 1)
643 return 0;
644 call_results_to_rl(call_expr, ret_info->return_type, argv[0], &rl);
645 ret_info->return_range_list = rl_union(ret_info->return_range_list, rl);
646 return 0;
649 struct range_list *db_return_vals(struct expression *expr)
651 struct return_info ret_info = {};
652 char buf[64];
653 struct sm_state *sm;
655 if (is_fake_call(expr))
656 return NULL;
658 snprintf(buf, sizeof(buf), "return %p", expr);
659 sm = get_sm_state(SMATCH_EXTRA, buf, NULL);
660 if (sm)
661 return clone_rl(estate_rl(sm->state));
662 ret_info.static_returns_call = expr;
663 ret_info.return_type = get_type(expr);
664 if (!ret_info.return_type)
665 return NULL;
667 if (expr->fn->type != EXPR_SYMBOL || !expr->fn->symbol)
668 return NULL;
670 ret_info.return_range_list = NULL;
671 if (inlinable(expr->fn)) {
672 mem_sql(db_return_callback, &ret_info,
673 "select distinct return from return_states where call_id = '%lu';",
674 (unsigned long)expr);
675 } else {
676 run_sql(db_return_callback, &ret_info,
677 "select distinct return from return_states where %s;",
678 get_static_filter(expr->fn->symbol));
680 return ret_info.return_range_list;
683 struct range_list *db_return_vals_from_str(const char *fn_name)
685 struct return_info ret_info;
687 ret_info.static_returns_call = NULL;
688 ret_info.return_type = &llong_ctype;
689 ret_info.return_range_list = NULL;
691 run_sql(db_return_callback, &ret_info,
692 "select distinct return from return_states where function = '%s';",
693 fn_name);
694 return ret_info.return_range_list;
697 static void match_call_marker(struct expression *expr)
699 struct symbol *type;
701 type = get_type(expr->fn);
702 if (type && type->type == SYM_PTR)
703 type = get_real_base_type(type);
706 * we just want to record something in the database so that if we have
707 * two calls like: frob(4); frob(some_unkown); then on the receiving
708 * side we know that sometimes frob is called with unknown parameters.
711 sql_insert_caller_info(expr, INTERNAL, -1, "%call_marker%", type_to_str(type));
/*
 * Format @offset as "(-<offset>)", or as an empty string when it is -1.
 * The result lives in a static buffer overwritten by the next call.
 */
static char *show_offset(int offset)
{
	static char text[64];

	if (offset == -1)
		text[0] = '\0';
	else
		snprintf(text, sizeof(text), "(-%d)", offset);
	return text;
}
724 static void print_struct_members(struct expression *call, struct expression *expr, int param, int offset, struct stree *stree,
725 void (*callback)(struct expression *call, int param, char *printed_name, struct sm_state *sm))
727 struct sm_state *sm;
728 char *name;
729 struct symbol *sym;
730 int len;
731 char printed_name[256];
732 int is_address = 0;
734 expr = strip_expr(expr);
735 if (!expr)
736 return;
737 if (expr->type == EXPR_PREOP && expr->op == '&') {
738 expr = strip_expr(expr->unop);
739 is_address = 1;
742 name = expr_to_var_sym(expr, &sym);
743 if (!name || !sym)
744 goto free;
746 len = strlen(name);
747 FOR_EACH_SM(stree, sm) {
748 if (sm->sym != sym)
749 continue;
750 if (strcmp(name, sm->name) == 0) {
751 if (is_address)
752 snprintf(printed_name, sizeof(printed_name), "*$%s", show_offset(offset));
753 else /* these are already handled. fixme: handle them here */
754 continue;
755 } else if (sm->name[0] == '*' && strcmp(name, sm->name + 1) == 0) {
756 snprintf(printed_name, sizeof(printed_name), "*$%s", show_offset(offset));
757 } else if (strncmp(name, sm->name, len) == 0) {
758 if (isalnum(sm->name[len]))
759 continue;
760 if (is_address)
761 snprintf(printed_name, sizeof(printed_name), "$%s->%s", show_offset(offset), sm->name + len + 1);
762 else
763 snprintf(printed_name, sizeof(printed_name), "$%s%s", show_offset(offset), sm->name + len);
764 } else {
765 continue;
767 callback(call, param, printed_name, sm);
768 } END_FOR_EACH_SM(sm);
769 free:
770 free_string(name);
/*
 * Row callback which copies the first column into a static buffer and
 * stores a pointer to that buffer in the char * that @_container points to.
 * The buffer is overwritten by the next row.
 */
static int param_used_callback(void *_container, int argc, char **argv, char **azColName)
{
	static char copy[256];
	char **out = _container;

	snprintf(copy, sizeof(copy), "%s", argv[0]);
	*out = copy;
	return 0;
}
783 static void print_container_struct_members(struct expression *call, struct expression *expr, int param, struct stree *stree,
784 void (*callback)(struct expression *call, int param, char *printed_name, struct sm_state *sm))
786 struct expression *tmp;
787 char *container = NULL;
788 int offset;
789 int holder_offset;
790 char *p;
792 if (!call->fn || call->fn->type != EXPR_SYMBOL)
793 return;
796 * We can't use the in-mem DB because we have to parse the function
797 * first, then we know if it takes a container, then we know to pass it
798 * the container data.
801 run_sql(&param_used_callback, &container,
802 "select key from call_implies where %s and type = %d and key like '%%$(%%' and parameter = %d limit 1;",
803 get_static_filter(call->fn->symbol), CONTAINER, param);
804 if (!container)
805 return;
807 p = strchr(container, '-');
808 if (!p)
809 return;
810 offset = atoi(p);
811 p = strchr(p, ')');
812 if (!p)
813 return;
814 p++;
816 tmp = get_assigned_expr(expr);
817 if (tmp)
818 expr = tmp;
820 if (expr->type != EXPR_PREOP || expr->op != '&')
821 return;
822 expr = strip_expr(expr->unop);
823 holder_offset = get_member_offset_from_deref(expr);
824 if (-holder_offset != offset)
825 return;
827 expr = strip_expr(expr->deref);
828 if (expr->type == EXPR_PREOP && expr->op == '*')
829 expr = strip_expr(expr->unop);
831 print_struct_members(call, expr, param, holder_offset, stree, callback);
834 static void match_call_info(struct expression *call)
836 struct member_info_callback *cb;
837 struct expression *arg;
838 struct stree *stree;
839 char *name;
840 int i;
842 name = get_fnptr_name(call->fn);
843 if (!name)
844 return;
846 FOR_EACH_PTR(member_callbacks, cb) {
847 stree = get_all_states_stree(cb->owner);
848 i = 0;
849 FOR_EACH_PTR(call->args, arg) {
850 print_struct_members(call, arg, i, -1, stree, cb->callback);
851 print_container_struct_members(call, arg, i, stree, cb->callback);
852 i++;
853 } END_FOR_EACH_PTR(arg);
854 free_stree(&stree);
855 } END_FOR_EACH_PTR(cb);
857 free_string(name);
860 static int get_param(int param, char **name, struct symbol **sym)
862 struct symbol *arg;
863 int i;
865 i = 0;
866 FOR_EACH_PTR(cur_func_sym->ctype.base_type->arguments, arg) {
868 * this is a temporary hack to work around a bug (I think in sparse?)
869 * 2.6.37-rc1:fs/reiserfs/journal.o
870 * If there is a function definition without parameter name found
871 * after a function implementation then it causes a crash.
872 * int foo() {}
873 * int bar(char *);
875 if (arg->ident->name < (char *)100)
876 continue;
877 if (i == param) {
878 *name = arg->ident->name;
879 *sym = arg;
880 return TRUE;
882 i++;
883 } END_FOR_EACH_PTR(arg);
885 return FALSE;
/*
 * Returns 1 when @sig equals the current function's signature, or when
 * either of the two is unavailable; 0 when they differ.
 */
static int function_signature_matches(const char *sig)
{
	const char *mine = function_signature();

	/* default to matching */
	if (!sig || !mine)
		return 1;
	return strcmp(mine, sig) == 0 ? 1 : 0;
}
900 static int caller_info_callback(void *_data, int argc, char **argv, char **azColName)
902 struct select_caller_info_data *data = _data;
903 int func_id;
904 long type;
905 long param;
906 char *key;
907 char *value;
908 char *name = NULL;
909 struct symbol *sym = NULL;
910 struct def_callback *def_callback;
911 struct stree *stree;
912 struct timeval cur_time;
914 data->results = 1;
916 if (argc != 5)
917 return 0;
919 gettimeofday(&cur_time, NULL);
920 if (cur_time.tv_sec - data->start_time.tv_sec > 10)
921 return 0;
923 func_id = atoi(argv[0]);
924 errno = 0;
925 type = strtol(argv[1], NULL, 10);
926 param = strtol(argv[2], NULL, 10);
927 if (errno)
928 return 0;
929 key = argv[3];
930 value = argv[4];
932 if (data->prev_func_id == -1)
933 data->prev_func_id = func_id;
934 if (func_id != data->prev_func_id) {
935 stree = __pop_fake_cur_stree();
936 if (!data->ignore)
937 merge_stree(&data->final_states, stree);
938 free_stree(&stree);
939 __push_fake_cur_stree();
940 __unnullify_path();
941 data->prev_func_id = func_id;
942 data->ignore = 0;
945 if (data->ignore)
946 return 0;
947 if (type == INTERNAL &&
948 !function_signature_matches(value)) {
949 data->ignore = 1;
950 return 0;
953 if (param >= 0 && !get_param(param, &name, &sym))
954 return 0;
956 FOR_EACH_PTR(select_caller_info_callbacks, def_callback) {
957 if (def_callback->hook_type == type)
958 def_callback->callback(name, sym, key, value);
959 } END_FOR_EACH_PTR(def_callback);
961 return 0;
/* Pointer names already handed out by get_next_ptr_name(). */
static struct string_list *ptr_names_done;
/* Every pointer name collected so far by get_ptr_name(). */
static struct string_list *ptr_names;

/* Row callback which adds a copy of the first column to ptr_names. */
static int get_ptr_name(void *unused, int argc, char **argv, char **azColName)
{
	char *copy = alloc_string(argv[0]);

	insert_string(&ptr_names, copy);
	return 0;
}
973 static char *get_next_ptr_name(void)
975 char *ptr;
977 FOR_EACH_PTR(ptr_names, ptr) {
978 if (list_has_string(ptr_names_done, ptr))
979 continue;
980 insert_string(&ptr_names_done, ptr);
981 return ptr;
982 } END_FOR_EACH_PTR(ptr);
983 return NULL;
986 static void get_ptr_names(const char *file, const char *name)
988 char sql_filter[1024];
989 int before, after;
991 if (file) {
992 snprintf(sql_filter, 1024, "file = '%s' and function = '%s';",
993 file, name);
994 } else {
995 snprintf(sql_filter, 1024, "function = '%s';", name);
998 before = ptr_list_size((struct ptr_list *)ptr_names);
1000 run_sql(get_ptr_name, NULL,
1001 "select distinct ptr from function_ptr where %s",
1002 sql_filter);
1004 after = ptr_list_size((struct ptr_list *)ptr_names);
1005 if (before == after)
1006 return;
1008 while ((name = get_next_ptr_name()))
1009 get_ptr_names(NULL, name);
1012 static void match_data_from_db(struct symbol *sym)
1014 struct select_caller_info_data data = { .prev_func_id = -1 };
1015 struct sm_state *sm;
1016 struct stree *stree;
1017 struct timeval end_time;
1019 if (!sym || !sym->ident)
1020 return;
1022 gettimeofday(&data.start_time, NULL);
1024 __push_fake_cur_stree();
1025 __unnullify_path();
1027 if (!__inline_fn) {
1028 char *ptr;
1030 if (sym->ctype.modifiers & MOD_STATIC)
1031 get_ptr_names(get_base_file(), sym->ident->name);
1032 else
1033 get_ptr_names(NULL, sym->ident->name);
1035 if (ptr_list_size((struct ptr_list *)ptr_names) > 20) {
1036 __free_ptr_list((struct ptr_list **)&ptr_names);
1037 __free_ptr_list((struct ptr_list **)&ptr_names_done);
1038 stree = __pop_fake_cur_stree();
1039 free_stree(&stree);
1040 return;
1043 sql_select_caller_info(&data,
1044 "call_id, type, parameter, key, value",
1045 sym);
1048 stree = __pop_fake_cur_stree();
1049 if (!data.ignore)
1050 merge_stree(&data.final_states, stree);
1051 free_stree(&stree);
1052 __push_fake_cur_stree();
1053 __unnullify_path();
1054 data.prev_func_id = -1;
1055 data.ignore = 0;
1057 FOR_EACH_PTR(ptr_names, ptr) {
1058 run_sql(caller_info_callback, &data,
1059 "select call_id, type, parameter, key, value"
1060 " from common_caller_info where function = '%s' order by call_id",
1061 ptr);
1062 } END_FOR_EACH_PTR(ptr);
1064 if (data.results) {
1065 FOR_EACH_PTR(ptr_names, ptr) {
1066 free_string(ptr);
1067 } END_FOR_EACH_PTR(ptr);
1068 goto free_ptr_names;
1071 FOR_EACH_PTR(ptr_names, ptr) {
1072 run_sql(caller_info_callback, &data,
1073 "select call_id, type, parameter, key, value"
1074 " from caller_info where function = '%s' order by call_id",
1075 ptr);
1076 free_string(ptr);
1077 } END_FOR_EACH_PTR(ptr);
1079 free_ptr_names:
1080 __free_ptr_list((struct ptr_list **)&ptr_names);
1081 __free_ptr_list((struct ptr_list **)&ptr_names_done);
1082 } else {
1083 sql_select_caller_info(&data,
1084 "call_id, type, parameter, key, value",
1085 sym);
1088 stree = __pop_fake_cur_stree();
1089 if (!data.ignore)
1090 merge_stree(&data.final_states, stree);
1091 free_stree(&stree);
1093 gettimeofday(&end_time, NULL);
1094 if (end_time.tv_sec - data.start_time.tv_sec <= 10) {
1095 FOR_EACH_SM(data.final_states, sm) {
1096 __set_sm(sm);
1097 } END_FOR_EACH_SM(sm);
1100 free_stree(&data.final_states);
1103 static int call_implies_callbacks(void *_call, int argc, char **argv, char **azColName)
1105 struct expression *call_expr = _call;
1106 struct call_implies_callback *cb;
1107 struct expression *arg = NULL;
1108 int type;
1109 int param;
1111 if (argc != 5)
1112 return 0;
1114 type = atoi(argv[1]);
1115 param = atoi(argv[2]);
1117 FOR_EACH_PTR(call_implies_cb_list, cb) {
1118 if (cb->type != type)
1119 continue;
1120 if (param != -1) {
1121 arg = get_argument_from_call_expr(call_expr->args, param);
1122 if (!arg)
1123 continue;
1125 cb->callback(call_expr, arg, argv[3], argv[4]);
1126 } END_FOR_EACH_PTR(cb);
1128 return 0;
1131 static void match_call_implies(struct expression *expr)
1133 sql_select_call_implies("function, type, parameter, key, value", expr,
1134 call_implies_callbacks);
1137 static void print_initializer_list(struct expression_list *expr_list,
1138 struct symbol *struct_type)
1140 struct expression *expr;
1141 struct symbol *base_type;
1142 char struct_name[256];
1144 FOR_EACH_PTR(expr_list, expr) {
1145 if (expr->type == EXPR_INDEX && expr->idx_expression && expr->idx_expression->type == EXPR_INITIALIZER) {
1146 print_initializer_list(expr->idx_expression->expr_list, struct_type);
1147 continue;
1149 if (expr->type != EXPR_IDENTIFIER)
1150 continue;
1151 if (!expr->expr_ident)
1152 continue;
1153 if (!expr->ident_expression || !expr->ident_expression->symbol_name)
1154 continue;
1155 base_type = get_type(expr->ident_expression);
1156 if (!base_type || base_type->type != SYM_FN)
1157 continue;
1158 snprintf(struct_name, sizeof(struct_name), "(struct %s)->%s",
1159 struct_type->ident->name, expr->expr_ident->name);
1160 sql_insert_function_ptr(expr->ident_expression->symbol_name->name,
1161 struct_name);
1162 } END_FOR_EACH_PTR(expr);
1165 static void global_variable(struct symbol *sym)
1167 struct symbol *struct_type;
1169 if (!sym->ident)
1170 return;
1171 if (!sym->initializer || sym->initializer->type != EXPR_INITIALIZER)
1172 return;
1173 struct_type = get_base_type(sym);
1174 if (!struct_type)
1175 return;
1176 if (struct_type->type == SYM_ARRAY) {
1177 struct_type = get_base_type(struct_type);
1178 if (!struct_type)
1179 return;
1181 if (struct_type->type != SYM_STRUCT || !struct_type->ident)
1182 return;
1183 print_initializer_list(sym->initializer->expr_list, struct_type);
1186 static void match_return_info(int return_id, char *return_ranges, struct expression *expr)
1188 sql_insert_return_states(return_id, return_ranges, INTERNAL, -1, "", function_signature());
1191 static void call_return_state_hooks_conditional(struct expression *expr)
1193 struct returned_state_callback *cb;
1194 struct range_list *rl;
1195 char *return_ranges;
1196 int final_pass_orig = final_pass;
1198 __push_fake_cur_stree();
1200 final_pass = 0;
1201 __split_whole_condition(expr->conditional);
1202 final_pass = final_pass_orig;
1204 if (get_implied_rl(expr->cond_true, &rl))
1205 rl = cast_rl(cur_func_return_type(), rl);
1206 else
1207 rl = cast_rl(cur_func_return_type(), alloc_whole_rl(get_type(expr->cond_true)));
1208 return_ranges = show_rl(rl);
1209 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(rl));
1211 return_id++;
1212 FOR_EACH_PTR(returned_state_callbacks, cb) {
1213 cb->callback(return_id, return_ranges, expr->cond_true);
1214 } END_FOR_EACH_PTR(cb);
1216 __push_true_states();
1217 __use_false_states();
1219 if (get_implied_rl(expr->cond_false, &rl))
1220 rl = cast_rl(cur_func_return_type(), rl);
1221 else
1222 rl = cast_rl(cur_func_return_type(), alloc_whole_rl(get_type(expr->cond_false)));
1223 return_ranges = show_rl(rl);
1224 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(rl));
1226 return_id++;
1227 FOR_EACH_PTR(returned_state_callbacks, cb) {
1228 cb->callback(return_id, return_ranges, expr->cond_false);
1229 } END_FOR_EACH_PTR(cb);
1231 __merge_true_states();
1232 __free_fake_cur_stree();
1235 static void call_return_state_hooks_compare(struct expression *expr)
1237 struct returned_state_callback *cb;
1238 char *return_ranges;
1239 int final_pass_orig = final_pass;
1240 sval_t sval = { .type = &int_ctype };
1241 sval_t ret;
1243 if (!get_implied_value(expr, &ret))
1244 ret.value = -1;
1246 __push_fake_cur_stree();
1248 final_pass = 0;
1249 __split_whole_condition(expr);
1250 final_pass = final_pass_orig;
1252 if (ret.value != 0) {
1253 return_ranges = alloc_sname("1");
1254 sval.value = 1;
1255 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_sval(sval));
1257 return_id++;
1258 FOR_EACH_PTR(returned_state_callbacks, cb) {
1259 cb->callback(return_id, return_ranges, expr);
1260 } END_FOR_EACH_PTR(cb);
1263 __push_true_states();
1264 __use_false_states();
1266 if (ret.value != 1) {
1267 return_ranges = alloc_sname("0");
1268 sval.value = 0;
1269 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_sval(sval));
1271 return_id++;
1272 FOR_EACH_PTR(returned_state_callbacks, cb) {
1273 cb->callback(return_id, return_ranges, expr);
1274 } END_FOR_EACH_PTR(cb);
1277 __merge_true_states();
1278 __free_fake_cur_stree();
1281 static int ptr_in_list(struct sm_state *sm, struct state_list *slist)
1283 struct sm_state *tmp;
1285 FOR_EACH_PTR(slist, tmp) {
1286 if (strcmp(tmp->state->name, sm->state->name) == 0)
1287 return 1;
1288 } END_FOR_EACH_PTR(tmp);
1290 return 0;
/*
 * Build the comparison suffix that gets appended to a return range string.
 *
 * The result of expr_lte_to_param(expr, -1) is used when available.
 * Otherwise, if @expr is a parameter, the recorded comparison between the
 * variable and "<variable> orig" is formatted as "[<op>$<param>]".
 *
 * Returns NULL when no comparison is known.
 */
static char *get_return_compare_str(struct expression *expr)
{
	char *lte_str;
	char *var_name;
	char buf[256];
	int cmp;
	int param_nr;

	lte_str = expr_lte_to_param(expr, -1);
	if (lte_str)
		return lte_str;

	param_nr = get_param_num(expr);
	if (param_nr < 0)
		return NULL;

	var_name = expr_to_var(expr);
	if (!var_name)
		return NULL;
	snprintf(buf, sizeof(buf), "%s orig", var_name);
	cmp = get_comparison_strings(var_name, buf);
	free_string(var_name);

	if (cmp == 0)
		return NULL;

	snprintf(buf, sizeof(buf), "[%s$%d]", show_special(cmp), param_nr);
	return alloc_sname(buf);
}
1322 static int split_possible_helper(struct sm_state *sm, struct expression *expr)
1324 struct returned_state_callback *cb;
1325 struct range_list *rl;
1326 char *return_ranges;
1327 struct sm_state *tmp;
1328 int ret = 0;
1329 int nr_possible, nr_states;
1330 char *compare_str = NULL;
1331 char buf[128];
1332 struct state_list *already_handled = NULL;
1334 if (!sm || !sm->merged)
1335 return 0;
1337 if (too_many_possible(sm))
1338 return 0;
1340 /* bail if it gets too complicated */
1341 nr_possible = ptr_list_size((struct ptr_list *)sm->possible);
1342 nr_states = stree_count(__get_cur_stree());
1343 if (nr_states * nr_possible >= 2000)
1344 return 0;
1346 FOR_EACH_PTR(sm->possible, tmp) {
1347 if (tmp->merged)
1348 continue;
1349 if (ptr_in_list(tmp, already_handled))
1350 continue;
1351 add_ptr_list(&already_handled, tmp);
1353 ret = 1;
1354 __push_fake_cur_stree();
1356 overwrite_states_using_pool(sm, tmp);
1358 rl = cast_rl(cur_func_return_type(), estate_rl(tmp->state));
1359 return_ranges = show_rl(rl);
1360 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(clone_rl(rl)));
1361 compare_str = get_return_compare_str(expr);
1362 if (compare_str) {
1363 snprintf(buf, sizeof(buf), "%s%s", return_ranges, compare_str);
1364 return_ranges = alloc_sname(buf);
1367 return_id++;
1368 FOR_EACH_PTR(returned_state_callbacks, cb) {
1369 cb->callback(return_id, return_ranges, expr);
1370 } END_FOR_EACH_PTR(cb);
1372 __free_fake_cur_stree();
1373 } END_FOR_EACH_PTR(tmp);
1375 free_slist(&already_handled);
1377 return ret;
1380 static int call_return_state_hooks_split_possible(struct expression *expr)
1382 struct sm_state *sm;
1384 if (!expr || expr_equal_to_param(expr, -1))
1385 return 0;
1387 sm = get_sm_state_expr(SMATCH_EXTRA, expr);
1388 return split_possible_helper(sm, expr);
1391 static const char *get_return_ranges_str(struct expression *expr, struct range_list **rl_p)
1393 struct range_list *rl;
1394 char *return_ranges;
1395 sval_t sval;
1396 char *compare_str;
1397 char *math_str;
1398 char buf[128];
1400 *rl_p = NULL;
1402 if (!expr)
1403 return alloc_sname("");
1405 if (get_implied_value(expr, &sval)) {
1406 sval = sval_cast(cur_func_return_type(), sval);
1407 *rl_p = alloc_rl(sval, sval);
1408 return sval_to_str(sval);
1411 compare_str = expr_equal_to_param(expr, -1);
1412 math_str = get_value_in_terms_of_parameter_math(expr);
1414 if (get_implied_rl(expr, &rl)) {
1415 rl = cast_rl(cur_func_return_type(), rl);
1416 return_ranges = show_rl(rl);
1417 } else if (get_imaginary_absolute(expr, &rl)){
1418 rl = cast_rl(cur_func_return_type(), rl);
1419 return alloc_sname(show_rl(rl));
1420 } else {
1421 rl = cast_rl(cur_func_return_type(), alloc_whole_rl(get_type(expr)));
1422 return_ranges = show_rl(rl);
1424 *rl_p = rl;
1426 if (compare_str) {
1427 snprintf(buf, sizeof(buf), "%s%s", return_ranges, compare_str);
1428 return alloc_sname(buf);
1430 if (math_str) {
1431 snprintf(buf, sizeof(buf), "%s[%s]", return_ranges, math_str);
1432 return alloc_sname(buf);
1434 compare_str = get_return_compare_str(expr);
1435 if (compare_str) {
1436 snprintf(buf, sizeof(buf), "%s%s", return_ranges, compare_str);
1437 return alloc_sname(buf);
1440 return return_ranges;
1443 static int split_positive_from_negative(struct expression *expr)
1445 struct returned_state_callback *cb;
1446 struct range_list *rl;
1447 const char *return_ranges;
1448 struct range_list *ret_rl;
1449 int undo;
1451 /* We're going to print the states 3 times */
1452 if (stree_count(__get_cur_stree()) > 10000 / 3)
1453 return 0;
1455 if (!get_implied_rl(expr, &rl) || !rl)
1456 return 0;
1457 if (is_whole_rl(rl) || is_whole_rl_non_zero(rl))
1458 return 0;
1459 /* Forget about INT_MAX and larger */
1460 if (rl_max(rl).value <= 0)
1461 return 0;
1462 if (!sval_is_negative(rl_min(rl)))
1463 return 0;
1465 if (!assume(compare_expression(expr, '>', zero_expr())))
1466 return 0;
1468 return_id++;
1469 return_ranges = get_return_ranges_str(expr, &ret_rl);
1470 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(ret_rl));
1471 FOR_EACH_PTR(returned_state_callbacks, cb) {
1472 cb->callback(return_id, (char *)return_ranges, expr);
1473 } END_FOR_EACH_PTR(cb);
1475 end_assume();
1477 if (rl_has_sval(rl, sval_type_val(rl_type(rl), 0))) {
1478 undo = assume(compare_expression(expr, SPECIAL_EQUAL, zero_expr()));
1480 return_id++;
1481 return_ranges = get_return_ranges_str(expr, &ret_rl);
1482 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(ret_rl));
1483 FOR_EACH_PTR(returned_state_callbacks, cb) {
1484 cb->callback(return_id, (char *)return_ranges, expr);
1485 } END_FOR_EACH_PTR(cb);
1487 if (undo)
1488 end_assume();
1491 undo = assume(compare_expression(expr, '<', zero_expr()));
1493 return_id++;
1494 return_ranges = get_return_ranges_str(expr, &ret_rl);
1495 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(ret_rl));
1496 FOR_EACH_PTR(returned_state_callbacks, cb) {
1497 cb->callback(return_id, (char *)return_ranges, expr);
1498 } END_FOR_EACH_PTR(cb);
1500 if (undo)
1501 end_assume();
1503 return 1;
1506 static int call_return_state_hooks_split_null_non_null(struct expression *expr)
1508 struct returned_state_callback *cb;
1509 struct range_list *rl;
1510 struct range_list *nonnull_rl;
1511 sval_t null_sval;
1512 struct range_list *null_rl = NULL;
1513 char *return_ranges;
1514 struct sm_state *sm;
1515 struct smatch_state *state;
1516 int nr_states;
1517 int final_pass_orig = final_pass;
1519 if (!expr || expr_equal_to_param(expr, -1))
1520 return 0;
1521 if (expr->type == EXPR_CALL)
1522 return 0;
1523 if (!is_pointer(expr))
1524 return 0;
1526 sm = get_sm_state_expr(SMATCH_EXTRA, expr);
1527 if (!sm)
1528 return 0;
1529 if (ptr_list_size((struct ptr_list *)sm->possible) == 1)
1530 return 0;
1531 state = sm->state;
1532 if (!estate_rl(state))
1533 return 0;
1534 if (estate_min(state).value == 0 && estate_max(state).value == 0)
1535 return 0;
1536 if (!rl_has_sval(estate_rl(state), sval_type_val(estate_type(state), 0)))
1537 return 0;
1539 nr_states = stree_count(__get_cur_stree());
1540 if (option_info && nr_states >= 1500)
1541 return 0;
1543 rl = estate_rl(state);
1545 __push_fake_cur_stree();
1547 final_pass = 0;
1548 __split_whole_condition(expr);
1549 final_pass = final_pass_orig;
1551 nonnull_rl = rl_filter(rl, rl_zero());
1552 return_ranges = show_rl(nonnull_rl);
1553 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(nonnull_rl));
1555 return_id++;
1556 FOR_EACH_PTR(returned_state_callbacks, cb) {
1557 cb->callback(return_id, return_ranges, expr);
1558 } END_FOR_EACH_PTR(cb);
1560 __push_true_states();
1561 __use_false_states();
1563 return_ranges = alloc_sname("0");
1564 null_sval = sval_type_val(rl_type(rl), 0);
1565 add_range(&null_rl, null_sval, null_sval);
1566 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(null_rl));
1567 return_id++;
1568 FOR_EACH_PTR(returned_state_callbacks, cb) {
1569 cb->callback(return_id, return_ranges, expr);
1570 } END_FOR_EACH_PTR(cb);
1572 __merge_true_states();
1573 __free_fake_cur_stree();
1575 return 1;
1578 static int call_return_state_hooks_split_success_fail(struct expression *expr)
1580 struct range_list *rl;
1581 struct range_list *nonzero_rl;
1582 sval_t zero_sval;
1583 struct range_list *zero_rl = NULL;
1584 int nr_states;
1585 struct returned_state_callback *cb;
1586 char *return_ranges;
1587 int final_pass_orig = final_pass;
1588 sval_t val;
1590 if (option_project != PROJ_KERNEL)
1591 return 0;
1593 nr_states = stree_count(__get_cur_stree());
1594 if (nr_states > 1500)
1595 return 0;
1597 if (get_value(expr, &val))
1598 return 0;
1599 if (!get_implied_rl(expr, &rl))
1600 return 0;
1601 if (rl_min(rl).value < -4095 || rl_min(rl).value >= 0)
1602 return 0;
1603 if (rl_max(rl).value != 0)
1604 return 0;
1606 __push_fake_cur_stree();
1608 final_pass = 0;
1609 __split_whole_condition(expr);
1610 final_pass = final_pass_orig;
1612 nonzero_rl = rl_filter(rl, rl_zero());
1613 return_ranges = show_rl(nonzero_rl);
1614 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(nonzero_rl));
1616 return_id++;
1617 FOR_EACH_PTR(returned_state_callbacks, cb) {
1618 cb->callback(return_id, return_ranges, expr);
1619 } END_FOR_EACH_PTR(cb);
1621 __push_true_states();
1622 __use_false_states();
1624 return_ranges = alloc_sname("0");
1625 zero_sval = sval_type_val(rl_type(rl), 0);
1626 add_range(&zero_rl, zero_sval, zero_sval);
1627 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(zero_rl));
1628 return_id++;
1629 FOR_EACH_PTR(returned_state_callbacks, cb) {
1630 cb->callback(return_id, return_ranges, expr);
1631 } END_FOR_EACH_PTR(cb);
1633 __merge_true_states();
1634 __free_fake_cur_stree();
1636 return 1;
1639 static int is_boolean(struct expression *expr)
1641 struct range_list *rl;
1643 if (!get_implied_rl(expr, &rl))
1644 return 0;
1645 if (rl_min(rl).value == 0 && rl_max(rl).value == 1)
1646 return 1;
1647 return 0;
1650 static int is_conditional(struct expression *expr)
1652 if (!expr)
1653 return 0;
1654 if (expr->type == EXPR_CONDITIONAL || expr->type == EXPR_SELECT)
1655 return 1;
1656 return 0;
1659 static int splitable_function_call(struct expression *expr)
1661 struct sm_state *sm;
1662 char buf[64];
1664 if (!expr || expr->type != EXPR_CALL)
1665 return 0;
1666 snprintf(buf, sizeof(buf), "return %p", expr);
1667 sm = get_sm_state(SMATCH_EXTRA, buf, NULL);
1668 return split_possible_helper(sm, expr);
1671 static struct sm_state *find_bool_param(void)
1673 struct stree *start_states;
1674 struct symbol *arg;
1675 struct sm_state *sm, *tmp;
1676 sval_t sval;
1678 start_states = get_start_states();
1680 FOR_EACH_PTR_REVERSE(cur_func_sym->ctype.base_type->arguments, arg) {
1681 if (!arg->ident)
1682 continue;
1683 sm = get_sm_state_stree(start_states, SMATCH_EXTRA, arg->ident->name, arg);
1684 if (!sm)
1685 continue;
1686 if (rl_min(estate_rl(sm->state)).value != 0 ||
1687 rl_max(estate_rl(sm->state)).value != 1)
1688 continue;
1689 goto found;
1690 } END_FOR_EACH_PTR_REVERSE(arg);
1692 return NULL;
1694 found:
1696 * Check if it's splitable. If not, then splitting it up is likely not
1697 * useful for the callers.
1699 FOR_EACH_PTR(sm->possible, tmp) {
1700 if (is_merged(tmp))
1701 continue;
1702 if (!estate_get_single_value(tmp->state, &sval))
1703 return NULL;
1704 } END_FOR_EACH_PTR(tmp);
1706 return sm;
1709 static int split_on_bool_sm(struct sm_state *sm, struct expression *expr)
1711 struct returned_state_callback *cb;
1712 struct range_list *ret_rl;
1713 const char *return_ranges;
1714 struct sm_state *tmp;
1715 int ret = 0;
1716 int nr_possible, nr_states;
1717 char *compare_str = NULL;
1718 char buf[128];
1719 struct state_list *already_handled = NULL;
1721 if (!sm || !sm->merged)
1722 return 0;
1724 if (too_many_possible(sm))
1725 return 0;
1727 /* bail if it gets too complicated */
1728 nr_possible = ptr_list_size((struct ptr_list *)sm->possible);
1729 nr_states = stree_count(__get_cur_stree());
1730 if (nr_states * nr_possible >= 2000)
1731 return 0;
1733 FOR_EACH_PTR(sm->possible, tmp) {
1734 if (tmp->merged)
1735 continue;
1736 if (ptr_in_list(tmp, already_handled))
1737 continue;
1738 add_ptr_list(&already_handled, tmp);
1740 ret = 1;
1741 __push_fake_cur_stree();
1743 overwrite_states_using_pool(sm, tmp);
1745 return_ranges = get_return_ranges_str(expr, &ret_rl);
1746 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(ret_rl));
1747 compare_str = get_return_compare_str(expr);
1748 if (compare_str) {
1749 snprintf(buf, sizeof(buf), "%s%s", return_ranges, compare_str);
1750 return_ranges = alloc_sname(buf);
1753 return_id++;
1754 FOR_EACH_PTR(returned_state_callbacks, cb) {
1755 cb->callback(return_id, (char *)return_ranges, expr);
1756 } END_FOR_EACH_PTR(cb);
1758 __free_fake_cur_stree();
1759 } END_FOR_EACH_PTR(tmp);
1761 free_slist(&already_handled);
1763 return ret;
1766 static int split_by_bool_param(struct expression *expr)
1768 struct sm_state *start_sm, *sm;
1769 sval_t sval;
1771 start_sm = find_bool_param();
1772 if (!start_sm)
1773 return 0;
1774 sm = get_sm_state(SMATCH_EXTRA, start_sm->name, start_sm->sym);
1775 if (!sm || estate_get_single_value(sm->state, &sval))
1776 return 0;
1777 return split_on_bool_sm(sm, expr);
1780 static int split_by_null_nonnull_param(struct expression *expr)
1782 struct symbol *arg;
1783 struct sm_state *sm;
1784 sval_t zero = {
1785 .type = &ulong_ctype,
1788 /* function must only take one pointer */
1789 if (ptr_list_size((struct ptr_list *)cur_func_sym->ctype.base_type->arguments) != 1)
1790 return 0;
1791 arg = first_ptr_list((struct ptr_list *)cur_func_sym->ctype.base_type->arguments);
1792 if (!arg->ident)
1793 return 0;
1794 if (get_real_base_type(arg)->type != SYM_PTR)
1795 return 0;
1797 if (param_was_set_var_sym(arg->ident->name, arg))
1798 return 0;
1799 sm = get_sm_state(SMATCH_EXTRA, arg->ident->name, arg);
1800 if (!sm)
1801 return 0;
1803 if (!rl_has_sval(estate_rl(sm->state), zero))
1804 return 0;
1806 return split_on_bool_sm(sm, expr);
1809 struct expression *strip_expr_statement(struct expression *expr)
1811 struct expression *orig = expr;
1812 struct statement *stmt, *last_stmt;
1814 if (!expr)
1815 return NULL;
1816 if (expr->type == EXPR_PREOP && expr->op == '(')
1817 expr = expr->unop;
1818 if (expr->type != EXPR_STATEMENT)
1819 return orig;
1820 stmt = expr->statement;
1821 if (!stmt || stmt->type != STMT_COMPOUND)
1822 return orig;
1824 last_stmt = last_ptr_list((struct ptr_list *)stmt->stmts);
1825 if (!last_stmt || last_stmt->type == STMT_LABEL)
1826 last_stmt = last_stmt->label_statement;
1827 if (!last_stmt || last_stmt->type != STMT_EXPRESSION)
1828 return orig;
1829 return strip_expr(last_stmt->expression);
1832 static void call_return_state_hooks(struct expression *expr)
1834 struct returned_state_callback *cb;
1835 struct range_list *ret_rl;
1836 const char *return_ranges;
1837 int nr_states;
1838 sval_t sval;
1840 if (__path_is_null())
1841 return;
1843 expr = strip_expr(expr);
1844 expr = strip_expr_statement(expr);
1846 if (is_impossible_path())
1847 goto vanilla;
1849 if (expr && (expr->type == EXPR_COMPARE ||
1850 !get_implied_value(expr, &sval)) &&
1851 (is_condition(expr) || is_boolean(expr))) {
1852 call_return_state_hooks_compare(expr);
1853 return;
1854 } else if (is_conditional(expr)) {
1855 call_return_state_hooks_conditional(expr);
1856 return;
1857 } else if (call_return_state_hooks_split_possible(expr)) {
1858 return;
1859 } else if (call_return_state_hooks_split_null_non_null(expr)) {
1860 return;
1861 } else if (call_return_state_hooks_split_success_fail(expr)) {
1862 return;
1863 } else if (splitable_function_call(expr)) {
1864 return;
1865 } else if (split_positive_from_negative(expr)) {
1866 return;
1867 } else if (split_by_bool_param(expr)) {
1868 } else if (split_by_null_nonnull_param(expr)) {
1869 return;
1872 vanilla:
1873 return_ranges = get_return_ranges_str(expr, &ret_rl);
1874 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(ret_rl));
1876 return_id++;
1877 nr_states = stree_count(__get_cur_stree());
1878 if (nr_states >= 10000) {
1879 match_return_info(return_id, (char *)return_ranges, expr);
1880 return;
1882 FOR_EACH_PTR(returned_state_callbacks, cb) {
1883 cb->callback(return_id, (char *)return_ranges, expr);
1884 } END_FOR_EACH_PTR(cb);
1887 static void print_returned_struct_members(int return_id, char *return_ranges, struct expression *expr)
1889 struct returned_member_callback *cb;
1890 struct stree *stree;
1891 struct sm_state *sm;
1892 struct symbol *type;
1893 char *name;
1894 char member_name[256];
1895 int len;
1897 type = get_type(expr);
1898 if (!type || type->type != SYM_PTR)
1899 return;
1900 name = expr_to_var(expr);
1901 if (!name)
1902 return;
1904 member_name[sizeof(member_name) - 1] = '\0';
1905 strcpy(member_name, "$");
1907 len = strlen(name);
1908 FOR_EACH_PTR(returned_member_callbacks, cb) {
1909 stree = __get_cur_stree();
1910 FOR_EACH_MY_SM(cb->owner, stree, sm) {
1911 if (sm->name[0] == '*' && strcmp(sm->name + 1, name) == 0) {
1912 strcpy(member_name, "*$");
1913 cb->callback(return_id, return_ranges, expr, member_name, sm->state);
1914 continue;
1916 if (strncmp(sm->name, name, len) != 0)
1917 continue;
1918 if (strncmp(sm->name + len, "->", 2) != 0)
1919 continue;
1920 snprintf(member_name, sizeof(member_name), "$%s", sm->name + len);
1921 cb->callback(return_id, return_ranges, expr, member_name, sm->state);
1922 } END_FOR_EACH_SM(sm);
1923 } END_FOR_EACH_PTR(cb);
1925 free_string(name);
1928 static void reset_memdb(struct symbol *sym)
1930 mem_sql(NULL, NULL, "delete from caller_info;");
1931 mem_sql(NULL, NULL, "delete from return_states;");
1932 mem_sql(NULL, NULL, "delete from call_implies;");
1935 static void match_end_func_info(struct symbol *sym)
1937 if (__path_is_null())
1938 return;
1939 call_return_state_hooks(NULL);
1942 static void match_after_func(struct symbol *sym)
1944 if (!__inline_fn)
1945 reset_memdb(sym);
1948 static void init_memdb(void)
1950 char *err = NULL;
1951 int rc;
1952 const char *schema_files[] = {
1953 "db/db.schema",
1954 "db/caller_info.schema",
1955 "db/return_states.schema",
1956 "db/function_type_size.schema",
1957 "db/type_size.schema",
1958 "db/call_implies.schema",
1959 "db/function_ptr.schema",
1960 "db/local_values.schema",
1961 "db/function_type_value.schema",
1962 "db/type_value.schema",
1963 "db/function_type.schema",
1964 "db/data_info.schema",
1965 "db/parameter_name.schema",
1966 "db/constraints.schema",
1967 "db/constraints_required.schema",
1968 "db/fn_ptr_data_link.schema",
1969 "db/fn_data_link.schema",
1970 "db/mtag_about.schema",
1971 "db/mtag_map.schema",
1972 "db/mtag_data.schema",
1973 "db/mtag_alias.schema",
1975 static char buf[4096];
1976 int fd;
1977 int ret;
1978 int i;
1980 rc = sqlite3_open(":memory:", &mem_db);
1981 if (rc != SQLITE_OK) {
1982 printf("Error starting In-Memory database.");
1983 return;
1986 for (i = 0; i < ARRAY_SIZE(schema_files); i++) {
1987 fd = open_data_file(schema_files[i]);
1988 if (fd < 0) {
1989 printf("failed to open: %s\n", schema_files[i]);
1990 continue;
1992 ret = read(fd, buf, sizeof(buf));
1993 if (ret < 0) {
1994 printf("failed to read: %s\n", schema_files[i]);
1995 continue;
1997 close(fd);
1998 if (ret == sizeof(buf)) {
1999 printf("Schema file too large: %s (limit %zd bytes)",
2000 schema_files[i], sizeof(buf));
2001 continue;
2003 buf[ret] = '\0';
2004 rc = sqlite3_exec(mem_db, buf, NULL, NULL, &err);
2005 if (rc != SQLITE_OK) {
2006 fprintf(stderr, "SQL error #2: %s\n", err);
2007 fprintf(stderr, "%s\n", buf);
2012 void open_smatch_db(void)
2014 int rc;
2016 if (option_no_db)
2017 return;
2019 init_memdb();
2021 rc = sqlite3_open_v2("smatch_db.sqlite", &db, SQLITE_OPEN_READONLY, NULL);
2022 if (rc != SQLITE_OK) {
2023 option_no_db = 1;
2024 return;
2026 return;
2029 static void register_common_funcs(void)
2031 struct token *token;
2032 char *func;
2033 char filename[256];
2035 if (option_project == PROJ_NONE)
2036 strcpy(filename, "common_functions");
2037 else
2038 snprintf(filename, 256, "%s.common_functions", option_project_str);
2040 token = get_tokens_file(filename);
2041 if (!token)
2042 return;
2043 if (token_type(token) != TOKEN_STREAMBEGIN)
2044 return;
2045 token = token->next;
2046 while (token_type(token) != TOKEN_STREAMEND) {
2047 if (token_type(token) != TOKEN_IDENT)
2048 return;
2049 func = alloc_string(show_ident(token->ident));
2050 add_ptr_list(&common_funcs, func);
2051 token = token->next;
2053 clear_token_alloc();
/*
 * Extract the next token from *@str.  Tokens are delimited by a space, a
 * newline or the end of the string.
 *
 * On success the token is copied into a static buffer (overwritten by the
 * next call), *@str is advanced past the token and its delimiter, and the
 * buffer is returned.
 *
 * Returns NULL at the end of the input.  A token that does not fit in the
 * buffer (255 characters plus terminator) is reported, the input is
 * truncated at the current position by writing a NUL so that callers
 * looping on **str stop, and NULL is returned.
 */
static char *get_next_string(char **str)
{
	static char string[256];
	char *start;
	char *p = *str;
	int len;

	if (*p == '\0')
		return NULL;
	start = p;

	while (*p != '\0' && *p != ' ' && *p != '\n')
		p++;

	len = p - start;
	/* ">=": a token of exactly sizeof(string) bytes leaves no room for the NUL. */
	if (len >= (int)sizeof(string)) {
		memcpy(string, start, sizeof(string) - 1);
		string[sizeof(string) - 1] = '\0';
		printf("return_fix: '%s' too long", string);
		**str = '\0';
		return NULL;
	}
	memcpy(string, start, len);
	string[len] = '\0';
	if (*p != '\0')
		p++;
	*str = p;
	return string;
}
2086 static void register_return_replacements(void)
2088 char *func, *orig, *new;
2089 char filename[256];
2090 char buf[4096];
2091 int fd, ret, i;
2092 char *p;
2094 snprintf(filename, 256, "db/%s.return_fixes", option_project_str);
2095 fd = open_data_file(filename);
2096 if (fd < 0)
2097 return;
2098 ret = read(fd, buf, sizeof(buf));
2099 close(fd);
2100 if (ret < 0)
2101 return;
2102 if (ret == sizeof(buf)) {
2103 printf("file too large: %s (limit %zd bytes)",
2104 filename, sizeof(buf));
2105 return;
2107 buf[ret] = '\0';
2109 p = buf;
2110 while (*p) {
2111 get_next_string(&p);
2112 replace_count++;
2114 if (replace_count == 0 || replace_count % 3 != 0) {
2115 replace_count = 0;
2116 return;
2118 replace_table = malloc(replace_count * sizeof(char *));
2120 p = buf;
2121 i = 0;
2122 while (*p) {
2123 func = alloc_string(get_next_string(&p));
2124 orig = alloc_string(get_next_string(&p));
2125 new = alloc_string(get_next_string(&p));
2127 replace_table[i++] = func;
2128 replace_table[i++] = orig;
2129 replace_table[i++] = new;
2133 void register_definition_db_callbacks(int id)
2135 add_hook(&match_call_info, FUNCTION_CALL_HOOK);
2136 add_hook(&global_variable, BASE_HOOK);
2137 add_hook(&global_variable, DECLARATION_HOOK);
2138 add_split_return_callback(match_return_info);
2139 add_split_return_callback(print_returned_struct_members);
2140 add_hook(&call_return_state_hooks, RETURN_HOOK);
2141 add_hook(&match_end_func_info, END_FUNC_HOOK);
2142 add_hook(&match_after_func, AFTER_FUNC_HOOK);
2144 add_hook(&match_data_from_db, FUNC_DEF_HOOK);
2145 add_hook(&match_call_implies, CALL_HOOK_AFTER_INLINE);
2147 register_common_funcs();
2148 register_return_replacements();
2151 void register_db_call_marker(int id)
2153 add_hook(&match_call_marker, FUNCTION_CALL_HOOK);
2156 char *return_state_to_var_sym(struct expression *expr, int param, const char *key, struct symbol **sym)
2158 struct expression *arg;
2159 char *name = NULL;
2160 char member_name[256];
2162 *sym = NULL;
2164 if (param == -1) {
2165 const char *star = "";
2167 if (expr->type != EXPR_ASSIGNMENT)
2168 return NULL;
2169 name = expr_to_var_sym(expr->left, sym);
2170 if (!name)
2171 return NULL;
2172 if (key[0] == '*') {
2173 star = "*";
2174 key++;
2176 if (strncmp(key, "$", 1) != 0)
2177 return name;
2178 snprintf(member_name, sizeof(member_name), "%s%s%s", star, name, key + 1);
2179 free_string(name);
2180 return alloc_string(member_name);
2183 while (expr->type == EXPR_ASSIGNMENT)
2184 expr = strip_expr(expr->right);
2185 if (expr->type != EXPR_CALL)
2186 return NULL;
2188 arg = get_argument_from_call_expr(expr->args, param);
2189 if (!arg)
2190 return NULL;
2192 return get_variable_from_key(arg, key, sym);
2195 char *get_variable_from_key(struct expression *arg, const char *key, struct symbol **sym)
2197 char buf[256];
2198 char *tmp;
2200 if (!arg)
2201 return NULL;
2203 arg = strip_expr(arg);
2205 if (strcmp(key, "$") == 0)
2206 return expr_to_var_sym(arg, sym);
2208 if (strcmp(key, "*$") == 0) {
2209 if (arg->type == EXPR_PREOP && arg->op == '&') {
2210 arg = strip_expr(arg->unop);
2211 return expr_to_var_sym(arg, sym);
2212 } else {
2213 tmp = expr_to_var_sym(arg, sym);
2214 if (!tmp)
2215 return NULL;
2216 snprintf(buf, sizeof(buf), "*%s", tmp);
2217 free_string(tmp);
2218 return alloc_string(buf);
2222 if (arg->type == EXPR_PREOP && arg->op == '&') {
2223 arg = strip_expr(arg->unop);
2224 tmp = expr_to_var_sym(arg, sym);
2225 if (!tmp)
2226 return NULL;
2227 snprintf(buf, sizeof(buf), "%s.%s", tmp, key + 3);
2228 return alloc_string(buf);
2231 tmp = expr_to_var_sym(arg, sym);
2232 if (!tmp)
2233 return NULL;
2234 snprintf(buf, sizeof(buf), "%s%s", tmp, key + 1);
2235 free_string(tmp);
2236 return alloc_string(buf);
/*
 * Like get_variable_from_key(), except that the plain "$" key is resolved
 * with expr_to_chunk_sym_vsl(), which also fills in *@vsl.  For every other
 * key *@vsl is left NULL.
 */
char *get_chunk_from_key(struct expression *arg, char *key, struct symbol **sym, struct var_sym_list **vsl)
{
	*vsl = NULL;

	if (strcmp("$", key) != 0)
		return get_variable_from_key(arg, key, sym);

	return expr_to_chunk_sym_vsl(arg, sym, vsl);
}
/*
 * Rewrite a state name in terms of "$", where "$" stands for @param_name.
 *
 *   "<param>"          -> "$"
 *   "<param>-..."      -> "$-..."   (e.g. "p->member" becomes "$->member")
 *   "*<param>"         -> "*$"
 *
 * Returns NULL when @state_name is not based on @param_name.  The "$-..."
 * form is returned in a static buffer that is overwritten by the next call.
 */
const char *state_name_to_param_name(const char *state_name, const char *param_name)
{
	size_t name_len;
	static char buf[256];

	name_len = strlen(param_name);

	if (strcmp(state_name, param_name) == 0)
		return "$";

	/*
	 * Compare the prefix first: only once it matches is state_name known
	 * to be at least name_len characters long, which makes the look at
	 * state_name[name_len] safe.
	 */
	if (strncmp(state_name, param_name, name_len) == 0 &&
	    state_name[name_len] == '-') { /* check for '-' from "->" */
		snprintf(buf, sizeof(buf), "$%s", state_name + name_len);
		return buf;
	}

	if (state_name[0] == '*' && strcmp(state_name + 1, param_name) == 0)
		return "*$";

	return NULL;
}
2267 const char *get_param_name_var_sym(const char *name, struct symbol *sym)
2269 if (!sym || !sym->ident)
2270 return NULL;
2272 return state_name_to_param_name(name, sym->ident->name);
2275 const char *get_mtag_name_var_sym(const char *state_name, struct symbol *sym)
2277 struct symbol *type;
2278 const char *sym_name;
2279 int name_len;
2280 static char buf[256];
2283 * mtag_name is different from param_name because mtags can be a struct
2284 * instead of a struct pointer. But we want to treat it like a pointer
2285 * because really an mtag is a pointer. Or in other words, if you pass
2286 * a struct foo then you want to talk about foo.bar but with an mtag
2287 * you want to refer to it as foo->bar.
2291 if (!sym || !sym->ident)
2292 return NULL;
2294 type = get_real_base_type(sym);
2295 if (type && type->type == SYM_BASETYPE)
2296 return "*$";
2298 sym_name = sym->ident->name;
2299 name_len = strlen(sym_name);
2301 if (state_name[name_len] == '.' && /* check for '-' from "->" */
2302 strncmp(state_name, sym_name, name_len) == 0) {
2303 snprintf(buf, sizeof(buf), "$->%s", state_name + name_len + 1);
2304 return buf;
2307 return state_name_to_param_name(state_name, sym_name);
2310 const char *get_mtag_name_expr(struct expression *expr)
2312 char *name;
2313 struct symbol *sym;
2314 const char *ret = NULL;
2316 name = expr_to_var_sym(expr, &sym);
2317 if (!name || !sym)
2318 goto free;
2320 ret = get_mtag_name_var_sym(name, sym);
2321 free:
2322 free_string(name);
2323 return ret;
2326 const char *get_param_name(struct sm_state *sm)
2328 return get_param_name_var_sym(sm->name, sm->sym);
2331 char *get_data_info_name(struct expression *expr)
2333 struct symbol *sym;
2334 char *name;
2335 char buf[256];
2336 char *ret = NULL;
2338 expr = strip_expr(expr);
2339 name = get_member_name(expr);
2340 if (name)
2341 return name;
2342 name = expr_to_var_sym(expr, &sym);
2343 if (!name || !sym)
2344 goto free;
2345 if (!(sym->ctype.modifiers & MOD_TOPLEVEL))
2346 goto free;
2347 if (sym->ctype.modifiers & MOD_STATIC)
2348 snprintf(buf, sizeof(buf), "static %s", name);
2349 else
2350 snprintf(buf, sizeof(buf), "global %s", name);
2351 ret = alloc_sname(buf);
2352 free:
2353 free_string(name);
2354 return ret;