2 * Copyright (C) 2011 Dan Carpenter.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version 2
7 * of the License, or (at your option) any later version.
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, see http://www.gnu.org/copyleft/gpl.txt
19 * There are a couple checks that try to see if a variable
20 * comes from the user. It would be better to unify them
21 * into one place. Also, we should follow the data down
22 * the call paths. Hence this file.
26 #include "smatch_slist.h"
27 #include "smatch_extra.h"
30 static int my_call_id
;
33 static bool func_gets_user_data
;
/*
 * Names of the kstrto*() parsers that get hooked with match_user_copy().
 *
 * Every entry must be followed by a comma: adjacent string literals are
 * concatenated by the compiler, so a missing comma silently fuses two names
 * into one bogus entry and neither function gets hooked.
 */
static const char *kstr_funcs[] = {
	"kstrtoull", "kstrtoll", "kstrtoul", "kstrtol", "kstrtouint",
	"kstrtoint", "kstrtou64", "kstrtos64", "kstrtou32", "kstrtos32",
	"kstrtou16", "kstrtos16", "kstrtou8", "kstrtos8", "kstrtoull_from_user",
	"kstrtoll_from_user", "kstrtoul_from_user", "kstrtol_from_user",
	"kstrtouint_from_user", "kstrtoint_from_user", "kstrtou16_from_user",
	"kstrtos16_from_user", "kstrtou8_from_user", "kstrtos8_from_user",
	"kstrtou64_from_user", "kstrtos64_from_user", "kstrtou32_from_user",
	"kstrtos32_from_user",
};
46 static void set_points_to_user_data(struct expression
*expr
);
48 static struct stree
*start_states
;
49 static struct stree_stack
*saved_stack
;
50 static void save_start_states(struct statement
*stmt
)
52 start_states
= clone_stree(__get_cur_stree());
55 static void free_start_states(void)
57 free_stree(&start_states
);
60 static void match_save_states(struct expression
*expr
)
62 push_stree(&saved_stack
, start_states
);
66 static void match_restore_states(struct expression
*expr
)
68 free_stree(&start_states
);
69 start_states
= pop_stree(&saved_stack
);
/*
 * empty_state() - unmatched-state hook for this check.
 * @sm: unused
 *
 * Returns a freshly allocated empty estate.
 */
static struct smatch_state *empty_state(struct sm_state *sm)
{
	return alloc_estate_empty();
}
77 static void pre_merge_hook(struct sm_state
*sm
)
79 struct smatch_state
*user
;
80 struct smatch_state
*extra
;
81 struct range_list
*rl
;
83 extra
= get_state(SMATCH_EXTRA
, sm
->name
, sm
->sym
);
84 if (!extra
|| !estate_rl(extra
))
86 user
= get_state(my_id
, sm
->name
, sm
->sym
);
87 if (!user
|| !estate_rl(user
))
89 rl
= rl_intersection(estate_rl(user
), estate_rl(extra
));
90 set_state(my_id
, sm
->name
, sm
->sym
, alloc_estate_rl(clone_rl(rl
)));
93 static void tag_inner_struct_members(struct expression
*expr
, struct symbol
*member
)
95 struct expression
*edge_member
;
96 struct symbol
*base
= get_real_base_type(member
);
100 expr
= member_expression(expr
, '.', member
->ident
);
102 FOR_EACH_PTR(base
->symbol_list
, tmp
) {
105 type
= get_real_base_type(tmp
);
109 if (type
->type
== SYM_UNION
|| type
->type
== SYM_STRUCT
) {
110 tag_inner_struct_members(expr
, tmp
);
117 edge_member
= member_expression(expr
, '.', tmp
->ident
);
118 set_state_expr(my_id
, edge_member
, alloc_estate_whole(type
));
119 } END_FOR_EACH_PTR(tmp
);
122 static void tag_struct_members(struct symbol
*type
, struct expression
*expr
)
125 struct expression
*member
;
128 if (expr
->type
== EXPR_PREOP
&& expr
->op
== '&') {
129 expr
= strip_expr(expr
->unop
);
133 FOR_EACH_PTR(type
->symbol_list
, tmp
) {
134 type
= get_real_base_type(tmp
);
138 if (type
->type
== SYM_UNION
|| type
->type
== SYM_STRUCT
) {
139 tag_inner_struct_members(expr
, tmp
);
146 member
= member_expression(expr
, op
, tmp
->ident
);
147 set_state_expr(my_id
, member
, alloc_estate_whole(get_type(member
)));
149 if (type
->type
== SYM_ARRAY
)
150 set_points_to_user_data(member
);
151 } END_FOR_EACH_PTR(tmp
);
154 static void tag_base_type(struct expression
*expr
)
156 if (expr
->type
== EXPR_PREOP
&& expr
->op
== '&')
157 expr
= strip_expr(expr
->unop
);
159 expr
= deref_expression(expr
);
160 set_state_expr(my_id
, expr
, alloc_estate_whole(get_type(expr
)));
163 static void tag_as_user_data(struct expression
*expr
)
167 expr
= strip_expr(expr
);
169 type
= get_type(expr
);
170 if (!type
|| type
->type
!= SYM_PTR
)
172 type
= get_real_base_type(type
);
175 if (type
== &void_ctype
) {
176 set_state_expr(my_id
, deref_expression(expr
), alloc_estate_whole(&ulong_ctype
));
179 if (type
->type
== SYM_BASETYPE
)
181 if (type
->type
== SYM_STRUCT
) {
182 if (expr
->type
!= EXPR_PREOP
|| expr
->op
!= '&')
183 expr
= deref_expression(expr
);
185 set_state_expr(my_id
, deref_expression(expr
), alloc_estate_whole(&ulong_ctype
));
186 tag_struct_members(type
, expr
);
190 static void match_user_copy(const char *fn
, struct expression
*expr
, void *_param
)
192 int param
= PTR_INT(_param
);
193 struct expression
*dest
;
195 func_gets_user_data
= true;
197 dest
= get_argument_from_call_expr(expr
->args
, param
);
198 dest
= strip_expr(dest
);
201 tag_as_user_data(dest
);
204 static void match_sscanf(const char *fn
, struct expression
*expr
, void *unused
)
206 struct expression
*arg
;
209 func_gets_user_data
= true;
212 FOR_EACH_PTR(expr
->args
, arg
) {
216 tag_as_user_data(arg
);
217 } END_FOR_EACH_PTR(arg
);
220 static int points_to_user_data(struct expression
*expr
)
222 struct smatch_state
*state
;
228 expr
= strip_expr(expr
);
230 if (expr
->type
== EXPR_BINOP
&& expr
->op
== '+') {
231 if (points_to_user_data(expr
->left
))
233 if (points_to_user_data(expr
->right
))
238 name
= expr_to_var_sym(expr
, &sym
);
241 snprintf(buf
, sizeof(buf
), "*%s", name
);
242 state
= get_state(my_id
, buf
, sym
);
243 if (state
&& estate_rl(state
))
250 static void set_points_to_user_data(struct expression
*expr
)
256 name
= expr_to_var_sym(expr
, &sym
);
259 snprintf(buf
, sizeof(buf
), "*%s", name
);
260 set_state(my_id
, buf
, sym
, alloc_estate_whole(&llong_ctype
));
265 static int is_skb_data(struct expression
*expr
)
269 if (expr
->type
== EXPR_BINOP
&& expr
->op
== '+')
270 return is_skb_data(expr
->left
);
272 expr
= strip_expr(expr
);
275 if (expr
->type
!= EXPR_DEREF
|| expr
->op
!= '.')
280 if (strcmp(expr
->member
->name
, "data") != 0)
283 sym
= expr_to_sym(expr
->deref
);
286 sym
= get_real_base_type(sym
);
287 if (!sym
|| sym
->type
!= SYM_PTR
)
289 sym
= get_real_base_type(sym
);
290 if (!sym
|| sym
->type
!= SYM_STRUCT
|| !sym
->ident
)
292 if (strcmp(sym
->ident
->name
, "sk_buff") != 0)
298 static int comes_from_skb_data(struct expression
*expr
)
300 expr
= strip_expr(expr
);
301 if (!expr
|| expr
->type
!= EXPR_PREOP
|| expr
->op
!= '*')
304 expr
= strip_expr(expr
->unop
);
305 if (expr
->type
== EXPR_BINOP
&& expr
->op
== '+')
306 expr
= strip_expr(expr
->left
);
308 return is_skb_data(expr
);
311 static int handle_struct_assignment(struct expression
*expr
)
313 struct expression
*right
;
314 struct symbol
*left_type
, *right_type
;
316 left_type
= get_type(expr
->left
);
317 if (!left_type
|| left_type
->type
!= SYM_PTR
)
319 left_type
= get_real_base_type(left_type
);
320 if (!left_type
|| left_type
->type
!= SYM_STRUCT
)
324 * Ignore struct to struct assignments because for those we look at the
325 * individual members.
327 right
= strip_expr(expr
->right
);
328 right_type
= get_type(right
);
329 if (!right_type
|| right_type
->type
!= SYM_PTR
)
332 /* If we are assigning struct members then normally that is handled
333 * by fake assignments; however, if we cast one struct to a different
334 * type of struct then we handle that here.
336 right_type
= get_real_base_type(right_type
);
337 if (right_type
== left_type
)
340 if (!points_to_user_data(right
) && !is_skb_data(right
))
343 tag_as_user_data(expr
->left
);
347 static int handle_get_user(struct expression
*expr
)
352 name
= get_macro_name(expr
->pos
);
353 if (!name
|| strcmp(name
, "get_user") != 0)
356 name
= expr_to_var(expr
->right
);
357 if (!name
|| strcmp(name
, "__val_gu") != 0)
359 set_state_expr(my_id
, expr
->left
, alloc_estate_whole(get_type(expr
->left
)));
366 static void match_assign(struct expression
*expr
)
368 struct range_list
*rl
;
370 if (is_fake_call(expr
->right
))
372 if (handle_get_user(expr
))
374 if (points_to_user_data(expr
->right
))
375 set_points_to_user_data(expr
->left
);
376 if (handle_struct_assignment(expr
))
379 if (!get_user_rl(expr
->right
, &rl
))
380 goto clear_old_state
;
382 rl
= cast_rl(get_type(expr
->left
), rl
);
383 set_state_expr(my_id
, expr
->left
, alloc_estate_rl(rl
));
388 if (get_state_expr(my_id
, expr
->left
))
389 set_state_expr(my_id
, expr
->left
, alloc_estate_empty());
392 static void match_condition(struct expression
*expr
)
394 struct smatch_state
*left_orig
= NULL
;
395 struct smatch_state
*right_orig
= NULL
;
397 if (expr
->type
!= EXPR_COMPARE
|| expr
->op
!= SPECIAL_EQUAL
)
400 left_orig
= get_state_expr(my_id
, expr
->left
);
401 right_orig
= get_state_expr(my_id
, expr
->right
);
403 if (!left_orig
&& !right_orig
)
405 if (left_orig
&& right_orig
)
409 set_true_false_states_expr(my_id
, expr
->left
, alloc_estate_empty(), NULL
);
411 set_true_false_states_expr(my_id
, expr
->right
, alloc_estate_empty(), NULL
);
414 static void match_user_assign_function(const char *fn
, struct expression
*expr
, void *unused
)
416 func_gets_user_data
= true;
418 tag_as_user_data(expr
->left
);
419 set_points_to_user_data(expr
->left
);
422 static void match_simple_strtoul(const char *fn
, struct expression
*expr
, void *unused
)
424 func_gets_user_data
= true;
426 set_state_expr(my_id
, expr
->left
, alloc_estate_whole(get_type(expr
->left
)));
429 static int get_user_macro_rl(struct expression
*expr
, struct range_list
**rl
)
435 macro
= get_macro_name(expr
->pos
);
440 if (strcmp(macro
, "ntohl") == 0) {
441 *rl
= alloc_whole_rl(&uint_ctype
);
444 if (strcmp(macro
, "ntohs") == 0) {
445 *rl
= alloc_whole_rl(&ushort_ctype
);
/*
 * Context handed to returned_rl_callback() through run_sql().
 * @rl: union of the user ranges collected from the matching rows
 * @call: the call expression the rows are being looked up for
 */
struct db_info {
	struct range_list *rl;
	struct expression *call;
};
455 static int returned_rl_callback(void *_info
, int argc
, char **argv
, char **azColName
)
457 struct db_info
*db_info
= _info
;
458 struct range_list
*rl
;
459 char *return_ranges
= argv
[0];
460 char *user_ranges
= argv
[1];
461 struct expression
*arg
;
467 call_results_to_rl(db_info
->call
, get_type(db_info
->call
), user_ranges
, &rl
);
468 if (str_to_comparison_arg(return_ranges
, db_info
->call
, &comparison
, &arg
) &&
469 comparison
== SPECIAL_EQUAL
) {
470 struct range_list
*orig_rl
;
472 if (!get_user_rl(arg
, &orig_rl
))
474 rl
= rl_intersection(rl
, orig_rl
);
478 db_info
->rl
= rl_union(db_info
->rl
, rl
);
483 static int has_user_data(struct symbol
*sym
)
485 struct sm_state
*tmp
;
487 FOR_EACH_MY_SM(my_id
, __get_cur_stree(), tmp
) {
490 } END_FOR_EACH_SM(tmp
);
494 static int we_pass_user_data(struct expression
*call
)
496 struct expression
*arg
;
499 FOR_EACH_PTR(call
->args
, arg
) {
500 sym
= expr_to_sym(arg
);
503 if (has_user_data(sym
))
505 } END_FOR_EACH_PTR(arg
);
510 static int db_returned_user_rl(struct expression
*call
, struct range_list
**rl
)
512 struct db_info db_info
= {};
514 /* for function pointers assume everything is used */
515 if (call
->fn
->type
!= EXPR_SYMBOL
)
517 if (is_fake_call(call
))
521 run_sql(&returned_rl_callback
, &db_info
,
522 "select return, value from return_states where %s and type = %d and parameter = -1 and key = '$';",
523 get_static_filter(call
->fn
->symbol
), USER_DATA3_SET
);
525 func_gets_user_data
= true;
530 run_sql(&returned_rl_callback
, &db_info
,
531 "select return, value from return_states where %s and type = %d and parameter = -1 and key = '$';",
532 get_static_filter(call
->fn
->symbol
), USER_DATA3
);
534 if (!we_pass_user_data(call
))
536 func_gets_user_data
= true;
544 static int user_data_flag
;
545 static struct range_list
*var_user_rl(struct expression
*expr
)
547 struct smatch_state
*state
;
548 struct range_list
*rl
;
549 struct range_list
*absolute_rl
;
551 if (get_user_macro_rl(expr
, &rl
))
554 if (comes_from_skb_data(expr
)) {
555 rl
= alloc_whole_rl(get_type(expr
));
559 state
= get_state_expr(my_id
, expr
);
560 if (state
&& estate_rl(state
)) {
561 rl
= estate_rl(state
);
565 if (expr
->type
== EXPR_CALL
&& db_returned_user_rl(expr
, &rl
))
571 absolute_rl
= var_to_absolute_rl(expr
);
572 return clone_rl(rl_intersection(rl
, absolute_rl
));
575 int get_user_rl(struct expression
*expr
, struct range_list
**rl
)
579 custom_get_absolute_rl(expr
, &var_user_rl
, rl
);
580 if (!user_data_flag
) {
587 int get_user_rl_var_sym(const char *name
, struct symbol
*sym
, struct range_list
**rl
)
589 struct smatch_state
*state
;
591 state
= get_state(my_id
, name
, sym
);
592 if (state
&& estate_rl(state
)) {
593 *rl
= estate_rl(state
);
599 static void match_call_info(struct expression
*expr
)
601 struct range_list
*rl
;
602 struct expression
*arg
;
606 FOR_EACH_PTR(expr
->args
, arg
) {
609 if (!get_user_rl(arg
, &rl
))
612 sql_insert_caller_info(expr
, USER_DATA3
, i
, "$", show_rl(rl
));
613 } END_FOR_EACH_PTR(arg
);
616 static void struct_member_callback(struct expression
*call
, int param
, char *printed_name
, struct sm_state
*sm
)
618 struct smatch_state
*state
;
619 struct range_list
*rl
;
621 if (strcmp(sm
->state
->name
, "") == 0)
624 state
= get_state(SMATCH_EXTRA
, sm
->name
, sm
->sym
);
625 if (!state
|| !estate_rl(state
))
626 rl
= estate_rl(sm
->state
);
628 rl
= rl_intersection(estate_rl(sm
->state
), estate_rl(state
));
630 sql_insert_caller_info(call
, USER_DATA3
, param
, printed_name
, show_rl(rl
));
633 static void set_param_user_data(const char *name
, struct symbol
*sym
, char *key
, char *value
)
635 struct range_list
*rl
= NULL
;
636 struct smatch_state
*state
;
640 if (strcmp(key
, "*$") == 0)
641 snprintf(fullname
, sizeof(fullname
), "*%s", name
);
642 else if (strncmp(key
, "$", 1) == 0)
643 snprintf(fullname
, 256, "%s%s", name
, key
+ 1);
647 type
= get_member_type_from_key(symbol_expression(sym
), key
);
649 /* if the caller passes a void pointer with user data */
650 if (strcmp(key
, "*$") == 0 && type
&& type
!= &void_ctype
) {
651 struct expression
*expr
= symbol_expression(sym
);
653 tag_as_user_data(expr
);
654 set_points_to_user_data(expr
);
657 str_to_rl(type
, value
, &rl
);
658 state
= alloc_estate_rl(rl
);
659 set_state(my_id
, fullname
, sym
, state
);
662 static void set_called(const char *name
, struct symbol
*sym
, char *key
, char *value
)
664 set_state(my_call_id
, "this_function", NULL
, &called
);
667 static void match_syscall_definition(struct symbol
*sym
)
674 macro
= get_macro_name(sym
->pos
);
676 (strncmp("SYSCALL_DEFINE", macro
, strlen("SYSCALL_DEFINE")) == 0 ||
677 strncmp("COMPAT_SYSCALL_DEFINE", macro
, strlen("COMPAT_SYSCALL_DEFINE")) == 0))
680 name
= get_function();
681 if (!option_no_db
&& get_state(my_call_id
, "this_function", NULL
) != &called
) {
682 if (name
&& strncmp(name
, "sys_", 4) == 0)
686 if (name
&& strncmp(name
, "compat_sys_", 11) == 0)
692 FOR_EACH_PTR(sym
->ctype
.base_type
->arguments
, arg
) {
693 set_state(my_id
, arg
->ident
->name
, arg
, alloc_estate_whole(get_real_base_type(arg
)));
694 } END_FOR_EACH_PTR(arg
);
697 static void set_to_user_data(struct expression
*expr
, char *key
, char *value
)
702 struct range_list
*rl
= NULL
;
704 type
= get_member_type_from_key(expr
, key
);
705 name
= get_variable_from_key(expr
, key
, &sym
);
709 call_results_to_rl(expr
, type
, value
, &rl
);
711 set_state(my_id
, name
, sym
, alloc_estate_rl(rl
));
717 static void returns_param_user_data(struct expression
*expr
, int param
, char *key
, char *value
)
719 struct expression
*arg
;
720 struct expression
*call
;
723 while (call
->type
== EXPR_ASSIGNMENT
)
724 call
= strip_expr(call
->right
);
725 if (call
->type
!= EXPR_CALL
)
728 if (!we_pass_user_data(call
))
732 if (expr
->type
!= EXPR_ASSIGNMENT
)
734 set_to_user_data(expr
->left
, key
, value
);
738 arg
= get_argument_from_call_expr(call
->args
, param
);
741 set_to_user_data(arg
, key
, value
);
744 static void returns_param_user_data_set(struct expression
*expr
, int param
, char *key
, char *value
)
746 struct expression
*arg
;
748 func_gets_user_data
= true;
751 if (expr
->type
!= EXPR_ASSIGNMENT
)
753 set_to_user_data(expr
->left
, key
, value
);
757 while (expr
->type
== EXPR_ASSIGNMENT
)
758 expr
= strip_expr(expr
->right
);
759 if (expr
->type
!= EXPR_CALL
)
762 arg
= get_argument_from_call_expr(expr
->args
, param
);
765 set_to_user_data(arg
, key
, value
);
768 static int has_empty_state(struct sm_state
*sm
)
770 struct sm_state
*tmp
;
772 FOR_EACH_PTR(sm
->possible
, tmp
) {
773 if (!estate_rl(tmp
->state
))
775 } END_FOR_EACH_PTR(tmp
);
780 static void param_set_to_user_data(int return_id
, char *return_ranges
, struct expression
*expr
)
783 struct smatch_state
*start_state
;
784 struct range_list
*rl
;
786 const char *param_name
;
788 FOR_EACH_MY_SM(my_id
, __get_cur_stree(), sm
) {
789 if (has_empty_state(sm
))
792 param
= get_param_num_from_sym(sm
->sym
);
794 if (expr_to_sym(expr
) == sm
->sym
)
800 /* The logic here was that if we were passed in a user data then
801 * we don't record that. It's like the difference between
802 * param_filter and param_set. When I think about it, I'm not
803 * sure it actually works. It's probably harmless because we
804 * checked earlier that we're not returning a parameter...
805 * Let's mark this as a TODO.
807 start_state
= get_state_stree(start_states
, my_id
, sm
->name
, sm
->sym
);
808 if (start_state
&& rl_equiv(estate_rl(sm
->state
), estate_rl(start_state
)))
811 param_name
= get_param_name(sm
);
814 if (strcmp(param_name
, "$") == 0)
817 sql_insert_return_states(return_id
, return_ranges
,
818 func_gets_user_data
? USER_DATA3_SET
: USER_DATA3
,
819 param
, param_name
, show_rl(estate_rl(sm
->state
)));
820 } END_FOR_EACH_SM(sm
);
822 if (get_user_rl(expr
, &rl
)) {
823 sql_insert_return_states(return_id
, return_ranges
,
824 func_gets_user_data
? USER_DATA3_SET
: USER_DATA3
,
825 -1, "$", show_rl(rl
));
829 static void match_function_def(struct symbol
*sym
)
831 func_gets_user_data
= false;
834 void check_user_data2(int id
)
840 if (option_project
!= PROJ_KERNEL
)
843 add_hook(&match_function_def
, FUNC_DEF_HOOK
);
845 add_hook(&save_start_states
, AFTER_DEF_HOOK
);
846 add_hook(&free_start_states
, AFTER_FUNC_HOOK
);
847 add_hook(&match_save_states
, INLINE_FN_START
);
848 add_hook(&match_restore_states
, INLINE_FN_END
);
850 add_unmatched_state_hook(my_id
, &empty_state
);
851 add_pre_merge_hook(my_id
, &pre_merge_hook
);
852 add_merge_hook(my_id
, &merge_estates
);
854 add_function_hook("copy_from_user", &match_user_copy
, INT_PTR(0));
855 add_function_hook("__copy_from_user", &match_user_copy
, INT_PTR(0));
856 add_function_hook("memcpy_fromiovec", &match_user_copy
, INT_PTR(0));
857 for (i
= 0; i
< ARRAY_SIZE(kstr_funcs
); i
++)
858 add_function_hook(kstr_funcs
[i
], &match_user_copy
, INT_PTR(2));
860 add_function_assign_hook("simple_strtol", &match_simple_strtoul
, NULL
);
861 add_function_assign_hook("simple_strtoll", &match_simple_strtoul
, NULL
);
862 add_function_assign_hook("simple_strtoul", &match_simple_strtoul
, NULL
);
863 add_function_assign_hook("simple_strtoull", &match_simple_strtoul
, NULL
);
865 add_function_hook("sscanf", &match_sscanf
, NULL
);
867 add_function_assign_hook("memdup_user", &match_user_assign_function
, NULL
);
868 add_function_assign_hook("kmap_atomic", &match_user_assign_function
, NULL
);
869 add_function_assign_hook("skb_network_header", &match_user_assign_function
, NULL
);
871 add_hook(&match_syscall_definition
, AFTER_DEF_HOOK
);
873 add_hook(&match_assign
, ASSIGNMENT_HOOK
);
874 add_hook(&match_condition
, CONDITION_HOOK
);
876 add_hook(&match_call_info
, FUNCTION_CALL_HOOK
);
877 add_member_info_callback(my_id
, struct_member_callback
);
878 select_caller_info_hook(set_param_user_data
, USER_DATA3
);
879 select_return_states_hook(USER_DATA3
, &returns_param_user_data
);
880 select_return_states_hook(USER_DATA3_SET
, &returns_param_user_data_set
);
881 add_split_return_callback(¶m_set_to_user_data
);
884 void check_user_data3(int id
)
888 if (option_project
!= PROJ_KERNEL
)
890 select_caller_info_hook(set_called
, INTERNAL
);