smatch: save less stuff, run faster
[smatch.git] / check_arm64_tagged.c
blobe126552e59646dcbc477c774549d8e9112862a33
1 /*
2 * Copyright (C) 2019 ARM.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version 2
7 * of the License, or (at your option) any later version.
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, see http://www.gnu.org/copyleft/gpl.txt
18 #include "smatch.h"
19 #include "smatch_extra.h"
20 #include "smatch_function_hashtable.h"
/* Forward declaration: match_assign() below calls this before it is defined. */
22 static bool expr_has_memory_addr(struct expression *expr);
/*
 * Declare the search_symbol() and insert_symbol() helpers used by this
 * check; both the key and the value type are given as char.
 */
24 static DEFINE_HASHTABLE_SEARCH(search_symbol, char, char);
25 static DEFINE_HASHTABLE_INSERT(insert_symbol, char, char);
/*
 * Variable names recorded by match_assign() and looked up by
 * expr_has_untagged_symbol(). The table is created in check_arm64_tagged()
 * and destroyed and recreated by match_endfunc().
 */
26 static struct hashtable *symbols;
28 static void match_assign(struct expression *expr)
30 char *left_name;
31 struct symbol *left_sym;
33 left_name = expr_to_var_sym(expr->left, &left_sym);
34 if (!left_name || !left_sym)
35 return;
38 * Once we have spotted a symbol of interest (one that may hold
39 * an untagged memory address), we keep track of any assignments
40 * made, such that we can also treat the assigned symbol as something
41 * of interest. This tracking is limited in scope to the function.
43 if (expr_has_memory_addr(expr->right))
44 insert_symbol(symbols, left_name, left_name);
47 static void match_endfunc(struct symbol *sym)
49 destroy_function_hashtable(symbols);
50 symbols = create_function_hashtable(4000);
53 static bool expr_has_untagged_symbol(struct expression *expr)
55 char *name;
56 struct symbol *sym;
58 if (expr->type != EXPR_SYMBOL)
59 return false;
61 name = expr_to_var_sym(expr, &sym);
62 if (!name || !sym)
63 return false;
65 /* See if this is something we already know is of interest */
66 if (search_symbol(symbols, name))
67 return true;
69 return false;
72 static bool expr_has_untagged_member(struct expression *expr)
74 if (expr->type != EXPR_DEREF)
75 return false;
77 if (!strcmp(expr->member->name, "vm_start") ||
78 !strcmp(expr->member->name, "vm_end") ||
79 !strcmp(expr->member->name, "addr_limit"))
80 return true;
82 return false;
85 static bool expr_has_macro_with_name(struct expression *expr, const char *macro_name)
87 char *name;
89 name = get_macro_name(expr->pos);
90 return (name && !strcmp(name, macro_name));
/*
 * Report whether @expr comes from one of the macros this check treats as
 * producing an untagged value.
 */
static bool expr_has_untagged_macro(struct expression *expr)
{
	/*
	 * We can't detect a macro (such as PAGE_MASK) inside another macro
	 * such as offset_in_page, therefore the outer macro is listed here
	 * as well. The names are tried in the order given.
	 */
	static const char *const untagged_macros[] = {
		"PAGE_SIZE",
		"PAGE_MASK",
		"TASK_SIZE",
		"offset_in_page",
	};
	unsigned int i;

	for (i = 0; i < sizeof(untagged_macros) / sizeof(untagged_macros[0]); i++) {
		if (expr_has_macro_with_name(expr, untagged_macros[i]))
			return true;
	}

	return false;
}
112 * Identify expressions that contain memory addresses, in the future
113 * we may use annotations on symbols or function parameters.
115 static bool expr_has_memory_addr(struct expression *expr)
117 if (expr->type == EXPR_PREOP || expr->type == EXPR_POSTOP)
118 expr = strip_expr(expr->unop);
120 if (expr_has_untagged_member(expr))
121 return true;
123 if (expr_has_untagged_macro(expr))
124 return true;
126 if (expr_has_untagged_symbol(expr))
127 return true;
129 return false;
132 int rl_is_larger_or_equal(struct range_list *rl, sval_t sval)
134 struct data_range *tmp;
136 FOR_EACH_PTR(rl, tmp) {
137 if (sval_cmp(tmp->max, sval) >= 0)
138 return 1;
139 } END_FOR_EACH_PTR(tmp);
140 return 0;
143 int rl_range_has_min_value(struct range_list *rl, sval_t sval)
145 struct data_range *tmp;
147 FOR_EACH_PTR(rl, tmp) {
148 if (!sval_cmp(tmp->min, sval)) {
149 return 1;
151 } END_FOR_EACH_PTR(tmp);
152 return 0;
155 static bool rl_is_tagged(struct range_list *rl)
157 sval_t invalid = { .type = &ullong_ctype, .value = (1ULL << 56) };
158 sval_t invalid_kernel = { .type = &ullong_ctype, .value = (0xff8ULL << 52) };
161 * We only care for tagged addresses, thus ignore anything where the
162 * ranges of potential values cannot possibly have any of the top byte
163 * bits set.
165 if (!rl_is_larger_or_equal(rl, invalid))
166 return false;
169 * Tagged addresses are untagged in the kernel by using sign_extend64 in
170 * the untagged_addr macro. For userspace addresses bit 55 will always
171 * be 0 and thus this has the effect of clearing the top byte. However
172 * for kernel addresses this is not true and the top bits end up set to
173 * all 1s. The untagged_addr macro results in leaving a gap in the range
174 * of possible values which can exist, thus let's look for a tell-tale
175 * range which starts from (0xff8ULL << 52).
177 if (rl_range_has_min_value(rl, invalid_kernel))
178 return false;
180 return true;
183 static void match_condition(struct expression *expr)
185 struct range_list *rl = NULL;
186 struct expression *val = NULL;
187 struct symbol *type;
188 char *var_name;
191 * Match instances where something is compared against something
192 * else - we include binary operators as these are commonly used
193 * to make a comparison, e.g. if (start & ~PAGE_MASK).
195 if (expr->type != EXPR_COMPARE &&
196 expr->type != EXPR_BINOP)
197 return;
200 * Look on both sides of the comparison for something that shouldn't
201 * be compared with a tagged address, e.g. macros such as PAGE_MASK
202 * or struct members named .vm_start.
204 if (expr_has_memory_addr(expr->left))
205 val = expr->right;
208 * The macro 'offset_in_page' has the PAGE_MASK macro inside it, this
209 * results in 'expr_has_memory_addr' returning true for both sides. To
210 * work around this we assume PAGE_MASK (or similar) is on the right
211 * side, thus we do the following test last.
213 if (expr_has_memory_addr(expr->right))
214 val = expr->left;
216 if (!val)
217 return;
219 /* We only care about memory addresses which are 64 bits */
220 type = get_type(val);
221 if (!type || type_bits(type) != 64)
222 return;
224 /* We only care for comparison against user originated data */
225 if (!get_user_rl(val, &rl))
226 return;
228 /* We only care for tagged addresses */
229 if (!rl_is_tagged(rl))
230 return;
232 /* Finally, we believe we may have spotted a risky comparison */
233 var_name = expr_to_var(val);
234 if (var_name)
235 sm_warning("comparison of a potentially tagged address (%s, %d, %s)", get_function(), get_param_num(val), var_name);
238 void check_arm64_tagged(int id)
240 char *arch;
242 if (option_project != PROJ_KERNEL)
243 return;
245 /* Limit to aarch64 */
246 arch = getenv("ARCH");
247 if (!arch || strcmp(arch, "arm64"))
248 return;
250 symbols = create_function_hashtable(4000);
252 add_hook(&match_assign, ASSIGNMENT_HOOK);
253 add_hook(&match_condition, CONDITION_HOOK);
254 add_hook(&match_endfunc, END_FUNC_HOOK);