pet_expr_insert_arg: use pet_expr_access_get_domain_space
[pet.git] / expr_arg.c
blob6660c5f80bef5ebbb5a889dcb567b183fbad590e
1 /*
2 * Copyright 2011 Leiden University. All rights reserved.
3 * Copyright 2012-2014 Ecole Normale Superieure. All rights reserved.
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above
13 * copyright notice, this list of conditions and the following
14 * disclaimer in the documentation and/or other materials provided
15 * with the distribution.
17 * THIS SOFTWARE IS PROVIDED BY LEIDEN UNIVERSITY ''AS IS'' AND ANY
18 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
20 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL LEIDEN UNIVERSITY OR
21 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
22 * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
23 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA,
24 * OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
27 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 * The views and conclusions contained in the software and documentation
30 * are those of the authors and should not be interpreted as
31 * representing official policies, either expressed or implied, of
32 * Leiden University.
35 #include "context.h"
36 #include "expr.h"
37 #include "expr_arg.h"
39 /* Equate the arguments "pos1" and "pos2" of the access expression "expr".
41 * We may assume that "pos1" is smaller than "pos2".
42 * We replace all references to the argument at position "pos2"
43 * to references to the argument at position "pos1" (leaving all other
44 * variables untouched) and then drop argument "pos2".
46 static __isl_give pet_expr *equate_arg(__isl_take pet_expr *expr, int pos1,
47 int pos2)
49 int in;
50 isl_space *space;
51 isl_multi_aff *ma;
53 if (!expr)
54 return NULL;
55 if (pos1 == pos2)
56 return expr;
57 if (pos1 > pos2)
58 return equate_arg(expr, pos2, pos1);
59 if (pos1 < 0 || pos2 >= expr->n_arg)
60 isl_die(pet_expr_get_ctx(expr), isl_error_invalid,
61 "position out of bounds", return pet_expr_free(expr));
63 space = isl_multi_pw_aff_get_domain_space(expr->acc.index);
64 space = isl_space_unwrap(space);
65 in = isl_space_dim(space, isl_dim_in);
66 isl_space_free(space);
68 pos1 += in;
69 pos2 += in;
70 space = isl_multi_pw_aff_get_domain_space(expr->acc.index);
71 space = isl_space_map_from_set(space);
72 ma = isl_multi_aff_identity(space);
73 ma = isl_multi_aff_set_aff(ma, pos2, isl_multi_aff_get_aff(ma, pos1));
74 expr = pet_expr_access_pullback_multi_aff(expr, ma);
75 expr = pet_expr_access_project_out_arg(expr, in, pos2 - in);
77 return expr;
80 /* Remove all arguments of the access expression "expr" that are duplicates
81 * of earlier arguments.
83 __isl_give pet_expr *pet_expr_remove_duplicate_args(__isl_take pet_expr *expr)
85 int i, j;
87 if (!expr)
88 return NULL;
89 if (expr->n_arg < 2)
90 return expr;
92 for (i = expr->n_arg - 1; i >= 0; --i) {
93 for (j = 0; j < i; ++j)
94 if (pet_expr_is_equal(expr->args[i], expr->args[j]))
95 break;
96 if (j >= i)
97 continue;
98 expr = equate_arg(expr, j, i);
99 if (!expr)
100 return NULL;
103 return expr;
106 /* Insert argument "arg" at position "pos" in the arguments
107 * of access expression "expr".
109 * Besides actually inserting the argument, we also need to make
110 * sure that we adjust the references to the original arguments.
112 * If "expr" has no arguments to start with, then its domain is of the form
114 * S[i]
116 * otherwise, it is of the form
118 * [S[i] -> [args]]
120 * In the first case, we compute the pullback over
122 * [S[i] -> [arg]] -> S[i]
124 * In the second case, we compute the pullback over
126 * [S[i] -> [args_before_pos,arg,args_after_pos]] -> [S[i] -> [args]]
128 __isl_give pet_expr *pet_expr_insert_arg(__isl_take pet_expr *expr, int pos,
129 __isl_take pet_expr *arg)
131 int i, n;
132 isl_space *space;
133 isl_multi_aff *ma;
135 if (!expr || !arg)
136 goto error;
137 if (expr->type != pet_expr_access)
138 isl_die(pet_expr_get_ctx(expr), isl_error_invalid,
139 "not an access pet_expr", goto error);
141 n = pet_expr_get_n_arg(expr);
142 if (pos < 0 || pos > n)
143 isl_die(pet_expr_get_ctx(expr), isl_error_invalid,
144 "position out of bounds", goto error);
146 expr = pet_expr_set_n_arg(expr, n + 1);
147 for (i = n; i > pos; --i)
148 pet_expr_set_arg(expr, i, pet_expr_get_arg(expr, i - 1));
149 expr = pet_expr_set_arg(expr, pos, arg);
151 space = pet_expr_access_get_domain_space(expr);
152 space = isl_space_from_domain(space);
153 space = isl_space_add_dims(space, isl_dim_out, n + 1);
155 if (n == 0) {
156 ma = isl_multi_aff_domain_map(space);
157 } else {
158 isl_multi_aff *ma2, *proj;
160 ma = isl_multi_aff_domain_map(isl_space_copy(space));
161 ma2 = isl_multi_aff_range_map(space);
162 space = isl_space_range(isl_multi_aff_get_space(ma2));
163 proj = isl_multi_aff_project_out_map(space,
164 isl_dim_set, pos, 1);
165 ma2 = isl_multi_aff_pullback_multi_aff(proj, ma2);
166 ma = isl_multi_aff_range_product(ma, ma2);
169 expr = pet_expr_access_pullback_multi_aff(expr, ma);
171 return expr;
172 error:
173 pet_expr_free(expr);
174 pet_expr_free(arg);
175 return NULL;
178 /* Remove the argument at position "pos" in the arguments
179 * of access expression "expr", making sure it is not referenced
180 * from the index expression.
181 * "dim" is the dimension of the iteration domain.
183 * Besides actually removing the argument, we also need to make sure that
184 * we eliminate any reference from the access relation (if any) and that
185 * we adjust the references to the remaining arguments.
187 * If "expr" has a single argument, then we compute the pullback over
189 * S[i] -> [S[i] -> [arg]]
191 * Otherwise, we compute the pullback over
193 * [S[i] -> [args]] -> [S[i] -> [args_before_pos,args_after_pos]]
195 __isl_give pet_expr *pet_expr_access_project_out_arg(__isl_take pet_expr *expr,
196 int dim, int pos)
198 int i, n;
199 isl_space *space, *dom, *ran;
200 isl_multi_aff *ma1, *ma2;
201 enum pet_expr_access_type type;
202 isl_map *map;
203 isl_union_map *umap;
205 expr = pet_expr_cow(expr);
206 if (!expr)
207 return NULL;
208 if (expr->type != pet_expr_access)
209 isl_die(pet_expr_get_ctx(expr), isl_error_invalid,
210 "not an access pet_expr", return pet_expr_free(expr));
211 n = pet_expr_get_n_arg(expr);
212 if (pos < 0 || pos >= n)
213 isl_die(pet_expr_get_ctx(expr), isl_error_invalid,
214 "position out of bounds", return pet_expr_free(expr));
216 if (isl_multi_pw_aff_involves_dims(expr->acc.index,
217 isl_dim_in, dim + pos, 1))
218 isl_die(pet_expr_get_ctx(expr), isl_error_invalid,
219 "cannot project out", return pet_expr_free(expr));
220 space = isl_multi_pw_aff_get_domain_space(expr->acc.index);
221 map = isl_map_identity(isl_space_map_from_set(space));
222 map = isl_map_eliminate(map, isl_dim_out, dim + pos, 1);
223 umap = isl_union_map_from_map(map);
224 for (type = pet_expr_access_begin; type < pet_expr_access_end; ++type) {
225 if (!expr->acc.access[type])
226 continue;
227 expr->acc.access[type] =
228 isl_union_map_apply_domain(expr->acc.access[type],
229 isl_union_map_copy(umap));
230 if (!expr->acc.access[type])
231 break;
233 isl_union_map_free(umap);
234 if (!expr->acc.index || type < pet_expr_access_end)
235 return pet_expr_free(expr);
237 space = isl_multi_pw_aff_get_domain_space(expr->acc.index);
238 space = isl_space_unwrap(space);
239 dom = isl_space_map_from_set(isl_space_domain(isl_space_copy(space)));
240 ma1 = isl_multi_aff_identity(dom);
241 if (n == 1) {
242 ma2 = isl_multi_aff_zero(space);
243 ma1 = isl_multi_aff_range_product(ma1, ma2);
244 } else {
245 ran = isl_space_map_from_set(isl_space_range(space));
246 ma2 = isl_multi_aff_identity(ran);
247 ma2 = isl_multi_aff_drop_dims(ma2, isl_dim_in, pos, 1);
248 ma1 = isl_multi_aff_product(ma1, ma2);
251 expr = pet_expr_access_pullback_multi_aff(expr, ma1);
252 if (!expr)
253 return NULL;
254 pet_expr_free(expr->args[pos]);
255 for (i = pos; i + 1 < n; ++i)
256 expr->args[i] = expr->args[i + 1];
257 expr->n_arg = n - 1;
259 return expr;
262 /* Plug in "value" for the argument at position "pos" of "expr".
264 * The input "value" is of the form
266 * S[i] -> [value(i)]
268 * while the index expression of "expr" has domain
270 * [S[i] -> [args]]
272 * We therefore first pullback "value" to this domain, resulting in
274 * [S[i] -> [args]] -> [value(i)]
276 * Then we compute the pullback of "expr" over
278 * [S[i] -> [args]] -> [S[i] -> [args_before_pos,value(i),args_after_pos]]
280 * and drop the now redundant argument at position "pos".
282 static __isl_give pet_expr *plug_in(__isl_take pet_expr *expr, int pos,
283 __isl_take isl_pw_aff *value)
285 int n_in;
286 isl_space *space;
287 isl_multi_aff *ma;
288 isl_multi_pw_aff *mpa;
290 space = isl_multi_pw_aff_get_space(expr->acc.index);
291 space = isl_space_unwrap(isl_space_domain(space));
292 n_in = isl_space_dim(space, isl_dim_in);
293 ma = isl_multi_aff_domain_map(space);
294 value = isl_pw_aff_pullback_multi_aff(value, ma);
296 space = isl_multi_pw_aff_get_space(expr->acc.index);
297 space = isl_space_map_from_set(isl_space_domain(space));
298 mpa = isl_multi_pw_aff_identity(space);
299 mpa = isl_multi_pw_aff_set_pw_aff(mpa, n_in + pos, value);
301 expr = pet_expr_access_pullback_multi_pw_aff(expr, mpa);
302 expr = pet_expr_access_project_out_arg(expr, n_in, pos);
304 return expr;
307 /* Given that the argument of "expr" at position "pos" is a sum
308 * of two expressions, replace references to this argument by the sum
309 * of references to the two expressions.
310 * "dim" is the dimension of the iteration domain.
312 * That is, replace
314 * [S[i] -> [args]] -> [f(i,args_before_pos,arg_pos,args_after_pos)]
316 * by
318 * [S[i] -> [args_before_pos,arg0,arg1,args_after_pos]] ->
319 * [f(i, args_before_pos, arg0 + arg1, args_after_pos)]
321 * where arg0 and arg1 refer to the arguments of the sum expression
322 * that the original arg_pos referred to.
324 * We introduce (an unreferenced) arg1 and replace arg_pos by arg0
325 * in the arguments and then we compute the pullback over
327 * [S[i] -> [args_before_pos,arg0,arg1,args_after_pos]] ->
328 * [S[i] -> [args_before_pos,arg0+arg1,arg1,args_after_pos]]
330 static __isl_give pet_expr *splice_sum(__isl_take pet_expr *expr, int dim,
331 int pos)
333 isl_space *space;
334 pet_expr *arg;
335 isl_multi_aff *ma;
336 isl_aff *aff1, *aff2;
338 arg = expr->args[pos];
339 expr = pet_expr_insert_arg(expr, pos + 1, pet_expr_get_arg(arg, 1));
340 expr = pet_expr_set_arg(expr, pos, pet_expr_get_arg(arg, 0));
341 if (!expr)
342 return NULL;
344 space = isl_multi_pw_aff_get_space(expr->acc.index);
345 space = isl_space_map_from_set(isl_space_domain(space));
346 ma = isl_multi_aff_identity(space);
347 aff1 = isl_multi_aff_get_aff(ma, dim + pos);
348 aff2 = isl_multi_aff_get_aff(ma, dim + pos + 1);
349 aff1 = isl_aff_add(aff1, aff2);
350 ma = isl_multi_aff_set_aff(ma, dim + pos, aff1);
352 expr = pet_expr_access_pullback_multi_aff(expr, ma);
354 return expr;
357 /* Try and integrate the arguments of "expr" into the index expression
358 * of "expr" by trying to convert the arguments to affine expressions.
359 * "pc" is the context in which the affine expressions are created.
361 * For example, given an access expression with index expression
363 * [S[i] -> [arg0]] -> A[arg0]
365 * where the first argument is itself an access to a variable "i"
366 * that is assigned the value
368 * S[i] -> [i]
370 * by "pc", this value is plugged into
371 * the index expression of "expr", resulting in
373 * [i] -> { S[] -> A[i] }
374 * S[i] -> A[i]
377 * In particular, we first remove duplicate arguments so that we
378 * only need to convert a given expression once.
380 * Then we try and convert the arguments to affine expressions and
381 * (if successful) we plug them into the index expression.
383 * Occasionally, we may be unable to convert an entire argument, while
384 * we could convert a sub-argument. In particular, this may happen
385 * if the top-level argument is an addition of two expressions
386 * of which only one can be converted to an affine expression.
387 * We therefore replace a reference to a "+" argument by the sum
388 * of references to the summands.
390 __isl_give pet_expr *pet_expr_access_plug_in_args(__isl_take pet_expr *expr,
391 __isl_keep pet_context *pc)
393 int i, n;
395 expr = pet_expr_remove_duplicate_args(expr);
396 if (!expr)
397 return NULL;
398 if (expr->type != pet_expr_access)
399 isl_die(pet_expr_get_ctx(expr), isl_error_invalid,
400 "not an access pet_expr", return pet_expr_free(expr));
402 n = pet_expr_get_n_arg(expr);
403 if (n == 0)
404 return expr;
406 for (i = n - 1; expr && i >= 0; --i) {
407 isl_pw_aff *pa;
408 pet_expr *arg = expr->args[i];
410 pa = pet_expr_extract_affine(arg, pc);
411 if (!pa)
412 return pet_expr_free(expr);
413 if (!isl_pw_aff_involves_nan(pa)) {
414 expr = plug_in(expr, i, pa);
415 continue;
417 isl_pw_aff_free(pa);
419 if (pet_expr_get_type(arg) == pet_expr_op &&
420 pet_expr_op_get_type(arg) == pet_op_add) {
421 int dim = pet_context_dim(pc);
422 expr = splice_sum(expr, dim, i);
423 i += 2;
427 return expr;
430 /* A wrapper around pet_expr_access_plug_in_args for use
431 * as a pet_expr_map_access callback.
433 static __isl_give pet_expr *plug_in_args(__isl_take pet_expr *expr, void *user)
435 struct pet_context *pc = user;
436 return pet_expr_access_plug_in_args(expr, pc);
439 /* For each access subexpression of "expr", try and integrate its arguments in
440 * its index expression by trying to convert the arguments
441 * to affine expressions.
442 * "pc" is the context in which the affine expressions are created.
444 __isl_give pet_expr *pet_expr_plug_in_args(__isl_take pet_expr *expr,
445 __isl_keep pet_context *pc)
447 return pet_expr_map_access(expr, &plug_in_args, pc);