2 * Simplify - do instruction simplification before CSE
4 * Copyright (C) 2004 Linus Torvalds
10 #include "expression.h"
11 #include "linearize.h"
15 /* Find the trivial parent for a phi-source */
16 static struct basic_block
*phi_parent(struct basic_block
*source
, pseudo_t pseudo
)
18 /* Can't go upwards if the pseudo is defined in the bb it came from.. */
19 if (pseudo
->type
== PSEUDO_REG
) {
20 struct instruction
*def
= pseudo
->def
;
21 if (def
->bb
== source
)
24 if (bb_list_size(source
->children
) != 1 || bb_list_size(source
->parents
) != 1)
26 return first_basic_block(source
->parents
);
29 static void clear_phi(struct instruction
*insn
)
34 FOR_EACH_PTR(insn
->phi_list
, phi
) {
35 *THIS_ADDRESS(phi
) = VOID
;
36 } END_FOR_EACH_PTR(phi
);
39 static int if_convert_phi(struct instruction
*insn
)
42 struct basic_block
*parents
[3];
43 struct basic_block
*bb
, *bb1
, *bb2
, *source
;
44 struct instruction
*br
;
48 if (linearize_ptr_list((struct ptr_list
*)insn
->phi_list
, (void **)array
, 3) != 2)
50 if (linearize_ptr_list((struct ptr_list
*)bb
->parents
, (void **)parents
, 3) != 2)
52 p1
= array
[0]->def
->src1
;
53 bb1
= array
[0]->def
->bb
;
54 p2
= array
[1]->def
->src1
;
55 bb2
= array
[1]->def
->bb
;
57 /* Only try the simple "direct parents" case */
58 if ((bb1
!= parents
[0] || bb2
!= parents
[1]) &&
59 (bb1
!= parents
[1] || bb2
!= parents
[0]))
63 * See if we can find a common source for this..
65 source
= phi_parent(bb1
, p1
);
66 if (source
!= phi_parent(bb2
, p2
))
70 * Cool. We now know that 'source' is the exclusive
71 * parent of both phi-nodes, so the exit at the
72 * end of it fully determines which one it is, and
73 * we can turn it into a select.
75 * HOWEVER, right now we only handle regular
76 * conditional branches. No multijumps or computed
77 * stuff. Verify that here.
79 br
= last_instruction(source
->insns
);
80 if (!br
|| br
->opcode
!= OP_BR
)
87 * We're in business. Match up true/false with p1/p2.
89 if (br
->bb_true
== bb2
|| br
->bb_false
== bb1
) {
96 * OK, we can now replace that last
103 * select pseudo, p1, p2
106 * and remove the phi-node. If it then
107 * turns out that 'a' or 'b' is entirely
108 * empty (common case), and now no longer
109 * a phi-source, we'll be able to simplify
110 * the conditional branch too.
112 insert_select(source
, br
, insn
, p1
, p2
);
117 static int clean_up_phi(struct instruction
*insn
)
120 struct instruction
*last
;
125 FOR_EACH_PTR(insn
->phi_list
, phi
) {
126 struct instruction
*def
;
130 if (def
->src1
== VOID
|| !def
->bb
)
133 if (last
->src1
!= def
->src1
)
138 } END_FOR_EACH_PTR(phi
);
141 pseudo_t pseudo
= last
? last
->src1
: VOID
;
142 convert_instruction_target(insn
, pseudo
);
147 return if_convert_phi(insn
);
150 static int delete_pseudo_user_list_entry(struct pseudo_user_list
**list
, pseudo_t
*entry
, int count
)
152 struct pseudo_user
*pu
;
154 FOR_EACH_PTR(*list
, pu
) {
155 if (pu
->userp
== entry
) {
156 DELETE_CURRENT_PTR(pu
);
160 } END_FOR_EACH_PTR(pu
);
163 pack_ptr_list((struct ptr_list
**)list
);
167 static inline void remove_usage(pseudo_t p
, pseudo_t
*usep
)
169 if (has_use_list(p
)) {
170 delete_pseudo_user_list_entry(&p
->users
, usep
, 1);
172 kill_instruction(p
->def
);
176 void kill_use(pseudo_t
*usep
)
181 remove_usage(p
, usep
);
185 void kill_instruction(struct instruction
*insn
)
187 if (!insn
|| !insn
->bb
)
190 switch (insn
->opcode
) {
193 kill_use(&insn
->src3
);
196 case OP_BINARY
... OP_BINCMP_END
:
197 kill_use(&insn
->src2
);
204 case OP_NOT
: case OP_NEG
:
205 kill_use(&insn
->src1
);
213 repeat_phase
|= REPEAT_SYMBOL_CLEANUP
;
217 if (!insn
->bb_true
|| !insn
->bb_false
)
221 case OP_COMPUTEDGOTO
:
222 kill_use(&insn
->cond
);
232 repeat_phase
|= REPEAT_CSE
;
237 * Kill trivially dead instructions
239 static int dead_insn(struct instruction
*insn
, pseudo_t
*src1
, pseudo_t
*src2
, pseudo_t
*src3
)
241 struct pseudo_user
*pu
;
242 FOR_EACH_PTR(insn
->target
->users
, pu
) {
243 if (*pu
->userp
!= VOID
)
245 } END_FOR_EACH_PTR(pu
);
254 static inline int constant(pseudo_t pseudo
)
256 return pseudo
->type
== PSEUDO_VAL
;
259 static int replace_with_pseudo(struct instruction
*insn
, pseudo_t pseudo
)
261 convert_instruction_target(insn
, pseudo
);
263 switch (insn
->opcode
) {
266 kill_use(&insn
->src3
);
267 case OP_BINARY
... OP_BINCMP_END
:
268 kill_use(&insn
->src2
);
276 kill_use(&insn
->src1
);
286 static unsigned int value_size(long long value
)
301 * Try to determine the maximum size of bits in a pseudo.
303 * Right now this only follow casts and constant values, but we
304 * could look at things like logical 'and' instructions etc.
306 static unsigned int operand_size(struct instruction
*insn
, pseudo_t pseudo
)
308 unsigned int size
= insn
->size
;
310 if (pseudo
->type
== PSEUDO_REG
) {
311 struct instruction
*src
= pseudo
->def
;
312 if (src
&& src
->opcode
== OP_CAST
&& src
->orig_type
) {
313 unsigned int orig_size
= src
->orig_type
->bit_size
;
314 if (orig_size
< size
)
318 if (pseudo
->type
== PSEUDO_VAL
) {
319 unsigned int orig_size
= value_size(pseudo
->value
);
320 if (orig_size
< size
)
326 static int simplify_asr(struct instruction
*insn
, pseudo_t pseudo
, long long value
)
328 unsigned int size
= operand_size(insn
, pseudo
);
331 warning(insn
->pos
, "right shift by bigger than source value");
332 return replace_with_pseudo(insn
, value_pseudo(0));
335 return replace_with_pseudo(insn
, pseudo
);
339 static int simplify_constant_rightside(struct instruction
*insn
)
341 long long value
= insn
->src2
->value
;
343 switch (insn
->opcode
) {
346 insn
->opcode
= OP_ADD
;
347 insn
->src2
= value_pseudo(-value
);
352 case OP_OR
: case OP_XOR
:
357 return replace_with_pseudo(insn
, insn
->src1
);
360 return simplify_asr(insn
, insn
->src1
, value
);
362 case OP_MULU
: case OP_MULS
:
365 return replace_with_pseudo(insn
, insn
->src1
);
369 return replace_with_pseudo(insn
, insn
->src2
);
375 static int simplify_constant_leftside(struct instruction
*insn
)
377 long long value
= insn
->src1
->value
;
379 switch (insn
->opcode
) {
380 case OP_ADD
: case OP_OR
: case OP_XOR
:
382 return replace_with_pseudo(insn
, insn
->src2
);
386 case OP_LSR
: case OP_ASR
:
388 case OP_MULU
: case OP_MULS
:
390 return replace_with_pseudo(insn
, insn
->src1
);
396 static int simplify_constant_binop(struct instruction
*insn
)
398 /* FIXME! Verify signs and sizes!! */
399 long long left
= insn
->src1
->value
;
400 long long right
= insn
->src2
->value
;
401 unsigned long long ul
, ur
;
402 long long res
, mask
, bits
;
404 mask
= 1ULL << (insn
->size
-1);
405 bits
= mask
| (mask
-1);
414 switch (insn
->opcode
) {
435 if (left
== mask
&& right
== -1)
447 if (left
== mask
&& right
== -1)
477 /* Binary comparison */
513 replace_with_pseudo(insn
, value_pseudo(res
));
517 static int simplify_binop(struct instruction
*insn
)
519 if (dead_insn(insn
, &insn
->src1
, &insn
->src2
, NULL
))
521 if (constant(insn
->src1
)) {
522 if (constant(insn
->src2
))
523 return simplify_constant_binop(insn
);
524 return simplify_constant_leftside(insn
);
526 if (constant(insn
->src2
))
527 return simplify_constant_rightside(insn
);
531 static void switch_pseudo(struct instruction
*insn1
, pseudo_t
*pp1
, struct instruction
*insn2
, pseudo_t
*pp2
)
533 pseudo_t p1
= *pp1
, p2
= *pp2
;
535 use_pseudo(insn1
, p2
, pp1
);
536 use_pseudo(insn2
, p1
, pp2
);
537 remove_usage(p1
, pp1
);
538 remove_usage(p2
, pp2
);
541 static int canonical_order(pseudo_t p1
, pseudo_t p2
)
543 /* symbol/constants on the right */
544 if (p1
->type
== PSEUDO_VAL
)
545 return p2
->type
== PSEUDO_VAL
;
547 if (p1
->type
== PSEUDO_SYM
)
548 return p2
->type
== PSEUDO_SYM
|| p2
->type
== PSEUDO_VAL
;
553 static int simplify_commutative_binop(struct instruction
*insn
)
555 if (!canonical_order(insn
->src1
, insn
->src2
)) {
556 switch_pseudo(insn
, &insn
->src1
, insn
, &insn
->src2
);
562 static inline int simple_pseudo(pseudo_t pseudo
)
564 return pseudo
->type
== PSEUDO_VAL
|| pseudo
->type
== PSEUDO_SYM
;
567 static int simplify_associative_binop(struct instruction
*insn
)
569 struct instruction
*def
;
570 pseudo_t pseudo
= insn
->src1
;
572 if (!simple_pseudo(insn
->src2
))
574 if (pseudo
->type
!= PSEUDO_REG
)
579 if (def
->opcode
!= insn
->opcode
)
581 if (!simple_pseudo(def
->src2
))
583 if (ptr_list_size((struct ptr_list
*)def
->target
->users
) != 1)
585 switch_pseudo(def
, &def
->src1
, insn
, &insn
->src2
);
589 static int simplify_constant_unop(struct instruction
*insn
)
591 long long val
= insn
->src1
->value
;
594 switch (insn
->opcode
) {
604 mask
= 1ULL << (insn
->size
-1);
605 res
&= mask
| (mask
-1);
607 replace_with_pseudo(insn
, value_pseudo(res
));
611 static int simplify_unop(struct instruction
*insn
)
613 if (dead_insn(insn
, &insn
->src1
, NULL
, NULL
))
615 if (constant(insn
->src1
))
616 return simplify_constant_unop(insn
);
620 static int simplify_one_memop(struct instruction
*insn
, pseudo_t orig
)
622 pseudo_t addr
= insn
->src
;
625 if (addr
->type
== PSEUDO_REG
) {
626 struct instruction
*def
= addr
->def
;
627 if (def
->opcode
== OP_SYMADDR
&& def
->src
) {
628 kill_use(&insn
->src
);
629 use_pseudo(insn
, def
->src
, &insn
->src
);
630 return REPEAT_CSE
| REPEAT_SYMBOL_CLEANUP
;
632 if (def
->opcode
== OP_ADD
) {
652 warning(insn
->pos
, "crazy programmer");
654 insn
->offset
+= off
->value
;
655 use_pseudo(insn
, new, &insn
->src
);
656 remove_usage(addr
, &insn
->src
);
657 return REPEAT_CSE
| REPEAT_SYMBOL_CLEANUP
;
661 * We walk the whole chain of adds/subs backwards. That's not
662 * only more efficient, but it allows us to find loops.
664 static int simplify_memop(struct instruction
*insn
)
667 pseudo_t orig
= insn
->src
;
670 one
= simplify_one_memop(insn
, orig
);
/*
 * Compute the value a constant takes after an integer cast.
 *
 * @val:      the constant, held in the low @old_size bits
 * @old_size: width in bits of the source type
 * @new_size: width in bits of the destination type
 * @sign:     non-zero when the source type is signed
 *
 * When the source is signed and the cast widens, the value is first
 * sign-extended from bit (@old_size - 1).  The result is then truncated
 * to its low @new_size bits.
 *
 * All mask arithmetic is done in unsigned long long.  Building the masks
 * with a plain int "1 << (size-1)" is undefined for sizes of 32 and
 * above and in practice leaves high bits set after a narrowing cast.
 *
 * Returns the converted value.  A destination at least as wide as
 * long long keeps every bit; a non-positive @new_size yields 0.
 */
static long long get_cast_value(long long val, int old_size, int new_size, int sign)
{
	const int width = (int)(8 * sizeof(unsigned long long));
	unsigned long long bits = (unsigned long long)val;
	unsigned long long mask;

	/* Sign-extend only for a widening cast of a signed source. */
	if (sign && new_size > old_size && old_size > 0 && old_size <= width) {
		mask = 1ULL << (old_size - 1);
		if (bits & mask)
			bits |= ~(mask | (mask - 1));
	}

	/* Keep the shift count inside [0, width) before truncating. */
	if (new_size <= 0)
		return 0;
	if (new_size >= width)
		return (long long)bits;

	mask = 1ULL << (new_size - 1);
	return (long long)(bits & (mask | (mask - 1)));
}
689 static int simplify_cast(struct instruction
*insn
)
691 struct symbol
*orig_type
;
695 if (dead_insn(insn
, &insn
->src
, NULL
, NULL
))
698 orig_type
= insn
->orig_type
;
702 /* Keep casts with pointer on either side (not only case of OP_PTRCAST) */
703 if (is_ptr_type(orig_type
) || is_ptr_type(insn
->type
))
706 orig_size
= orig_type
->bit_size
;
710 /* A cast of a constant? */
712 int sign
= orig_type
->ctype
.modifiers
& MOD_SIGNED
;
713 long long val
= get_cast_value(src
->value
, orig_size
, size
, sign
);
714 src
= value_pseudo(val
);
718 /* A cast of a "and" might be a no-op.. */
719 if (src
->type
== PSEUDO_REG
) {
720 struct instruction
*def
= src
->def
;
721 if (def
->opcode
== OP_AND
&& def
->size
>= size
) {
722 pseudo_t val
= def
->src2
;
723 if (val
->type
== PSEUDO_VAL
) {
724 unsigned long long value
= val
->value
;
725 if (!(value
>> (size
-1)))
731 if (size
== orig_size
) {
732 int op
= (orig_type
->ctype
.modifiers
& MOD_SIGNED
) ? OP_SCAST
: OP_CAST
;
733 if (insn
->opcode
== op
)
740 return replace_with_pseudo(insn
, src
);
743 static int simplify_select(struct instruction
*insn
)
745 pseudo_t cond
, src1
, src2
;
747 if (dead_insn(insn
, &insn
->src1
, &insn
->src2
, &insn
->src3
))
753 if (constant(cond
) || src1
== src2
) {
754 pseudo_t
*kill
, take
;
755 kill_use(&insn
->src1
);
756 take
= cond
->value
? src1
: src2
;
757 kill
= cond
->value
? &insn
->src3
: &insn
->src2
;
759 replace_with_pseudo(insn
, take
);
762 if (constant(src1
) && constant(src2
)) {
763 long long val1
= src1
->value
;
764 long long val2
= src2
->value
;
766 /* The pair 0/1 is special - replace with SETNE/SETEQ */
767 if ((val1
| val2
) == 1) {
768 int opcode
= OP_SET_EQ
;
773 insn
->opcode
= opcode
;
774 /* insn->src1 is already cond */
775 insn
->src2
= src1
; /* Zero */
782 static int is_in_range(pseudo_t src
, long long low
, long long high
)
789 return value
>= low
&& value
<= high
;
795 static int simplify_range(struct instruction
*insn
)
797 pseudo_t src1
, src2
, src3
;
802 if (src2
->type
!= PSEUDO_VAL
|| src3
->type
!= PSEUDO_VAL
)
804 if (is_in_range(src1
, src2
->value
, src3
->value
)) {
805 kill_instruction(insn
);
812 * Simplify "set_ne/eq $0 + br"
814 static int simplify_cond_branch(struct instruction
*br
, pseudo_t cond
, struct instruction
*def
, pseudo_t
*pp
)
816 use_pseudo(br
, *pp
, &br
->cond
);
817 remove_usage(cond
, &br
->cond
);
818 if (def
->opcode
== OP_SET_EQ
) {
819 struct basic_block
*true = br
->bb_true
;
820 struct basic_block
*false = br
->bb_false
;
827 static int simplify_branch(struct instruction
*insn
)
829 pseudo_t cond
= insn
->cond
;
834 /* Constant conditional */
835 if (constant(cond
)) {
836 insert_branch(insn
->bb
, insn
, cond
->value
? insn
->bb_true
: insn
->bb_false
);
841 if (insn
->bb_true
== insn
->bb_false
) {
842 struct basic_block
*bb
= insn
->bb
;
843 struct basic_block
*target
= insn
->bb_false
;
844 remove_bb_from_list(&target
->parents
, bb
, 1);
845 remove_bb_from_list(&bb
->children
, target
, 1);
846 insn
->bb_false
= NULL
;
847 kill_use(&insn
->cond
);
852 /* Conditional on a SETNE $0 or SETEQ $0 */
853 if (cond
->type
== PSEUDO_REG
) {
854 struct instruction
*def
= cond
->def
;
856 if (def
->opcode
== OP_SET_NE
|| def
->opcode
== OP_SET_EQ
) {
857 if (constant(def
->src1
) && !def
->src1
->value
)
858 return simplify_cond_branch(insn
, cond
, def
, &def
->src2
);
859 if (constant(def
->src2
) && !def
->src2
->value
)
860 return simplify_cond_branch(insn
, cond
, def
, &def
->src1
);
862 if (def
->opcode
== OP_SEL
) {
863 if (constant(def
->src2
) && constant(def
->src3
)) {
864 long long val1
= def
->src2
->value
;
865 long long val2
= def
->src3
->value
;
866 if (!val1
&& !val2
) {
867 insert_branch(insn
->bb
, insn
, insn
->bb_false
);
871 insert_branch(insn
->bb
, insn
, insn
->bb_true
);
875 struct basic_block
*true = insn
->bb_true
;
876 struct basic_block
*false = insn
->bb_false
;
877 insn
->bb_false
= true;
878 insn
->bb_true
= false;
880 use_pseudo(insn
, def
->src1
, &insn
->cond
);
881 remove_usage(cond
, &insn
->cond
);
885 if (def
->opcode
== OP_CAST
|| def
->opcode
== OP_SCAST
) {
886 int orig_size
= def
->orig_type
? def
->orig_type
->bit_size
: 0;
887 if (def
->size
> orig_size
) {
888 use_pseudo(insn
, def
->src
, &insn
->cond
);
889 remove_usage(cond
, &insn
->cond
);
897 static int simplify_switch(struct instruction
*insn
)
899 pseudo_t cond
= insn
->cond
;
901 struct multijmp
*jmp
;
905 val
= insn
->cond
->value
;
907 FOR_EACH_PTR(insn
->multijmp_list
, jmp
) {
909 if (jmp
->begin
> jmp
->end
)
911 if (val
>= jmp
->begin
&& val
<= jmp
->end
)
913 } END_FOR_EACH_PTR(jmp
);
914 warning(insn
->pos
, "Impossible case statement");
918 insert_branch(insn
->bb
, insn
, jmp
->target
);
922 int simplify_instruction(struct instruction
*insn
)
926 switch (insn
->opcode
) {
927 case OP_ADD
: case OP_MULS
:
928 case OP_AND
: case OP_OR
: case OP_XOR
:
929 case OP_AND_BOOL
: case OP_OR_BOOL
:
930 if (simplify_binop(insn
))
932 if (simplify_commutative_binop(insn
))
934 return simplify_associative_binop(insn
);
937 case OP_SET_EQ
: case OP_SET_NE
:
938 if (simplify_binop(insn
))
940 return simplify_commutative_binop(insn
);
943 case OP_DIVU
: case OP_DIVS
:
944 case OP_MODU
: case OP_MODS
:
946 case OP_LSR
: case OP_ASR
:
947 case OP_SET_LE
: case OP_SET_GE
:
948 case OP_SET_LT
: case OP_SET_GT
:
949 case OP_SET_B
: case OP_SET_A
:
950 case OP_SET_BE
: case OP_SET_AE
:
951 return simplify_binop(insn
);
953 case OP_NOT
: case OP_NEG
:
954 return simplify_unop(insn
);
955 case OP_LOAD
: case OP_STORE
:
956 return simplify_memop(insn
);
958 if (dead_insn(insn
, NULL
, NULL
, NULL
))
959 return REPEAT_CSE
| REPEAT_SYMBOL_CLEANUP
;
960 return replace_with_pseudo(insn
, insn
->symbol
);
965 return simplify_cast(insn
);
967 if (dead_insn(insn
, NULL
, NULL
, NULL
)) {
971 return clean_up_phi(insn
);
973 if (dead_insn(insn
, &insn
->phi_src
, NULL
, NULL
))
977 return simplify_select(insn
);
979 return simplify_branch(insn
);
981 return simplify_switch(insn
);
983 return simplify_range(insn
);