2 * Simplify - do instruction simplification before CSE
4 * Copyright (C) 2004 Linus Torvalds
10 #include "expression.h"
11 #include "linearize.h"
14 /* Find the trivial parent for a phi-source */
15 static struct basic_block
*phi_parent(struct basic_block
*source
, pseudo_t pseudo
)
17 /* Can't go upwards if the pseudo is defined in the bb it came from.. */
18 if (pseudo
->type
== PSEUDO_REG
) {
19 struct instruction
*def
= pseudo
->def
;
20 if (def
->bb
== source
)
23 if (bb_list_size(source
->children
) != 1 || bb_list_size(source
->parents
) != 1)
25 return first_basic_block(source
->parents
);
28 static void clear_phi(struct instruction
*insn
)
33 FOR_EACH_PTR(insn
->phi_list
, phi
) {
34 *THIS_ADDRESS(phi
) = VOID
;
35 } END_FOR_EACH_PTR(phi
);
38 static int if_convert_phi(struct instruction
*insn
)
41 struct basic_block
*parents
[3];
42 struct basic_block
*bb
, *bb1
, *bb2
, *source
;
43 struct instruction
*br
;
47 if (linearize_ptr_list((struct ptr_list
*)insn
->phi_list
, (void **)array
, 3) != 2)
49 if (linearize_ptr_list((struct ptr_list
*)bb
->parents
, (void **)parents
, 3) != 2)
51 p1
= array
[0]->def
->src1
;
52 bb1
= array
[0]->def
->bb
;
53 p2
= array
[1]->def
->src1
;
54 bb2
= array
[1]->def
->bb
;
56 /* Only try the simple "direct parents" case */
57 if ((bb1
!= parents
[0] || bb2
!= parents
[1]) &&
58 (bb1
!= parents
[1] || bb2
!= parents
[0]))
62 * See if we can find a common source for this..
64 source
= phi_parent(bb1
, p1
);
65 if (source
!= phi_parent(bb2
, p2
))
69 * Cool. We now know that 'source' is the exclusive
70 * parent of both phi-nodes, so the exit at the
71 * end of it fully determines which one it is, and
72 * we can turn it into a select.
74 * HOWEVER, right now we only handle regular
75 * conditional branches. No multijumps or computed
76 * stuff. Verify that here.
78 br
= last_instruction(source
->insns
);
79 if (!br
|| br
->opcode
!= OP_BR
)
86 * We're in business. Match up true/false with p1/p2.
88 if (br
->bb_true
== bb2
|| br
->bb_false
== bb1
) {
95 * Ok, we can now replace that last
102 * select pseudo, p1, p2
105 * and remove the phi-node. If it then
106 * turns out that 'a' or 'b' is entirely
107 * empty (common case), and now no longer
108 * a phi-source, we'll be able to simplify
109 * the conditional branch too.
111 insert_select(source
, br
, insn
, p1
, p2
);
116 static int clean_up_phi(struct instruction
*insn
)
119 struct instruction
*last
;
124 FOR_EACH_PTR(insn
->phi_list
, phi
) {
125 struct instruction
*def
;
129 if (def
->src1
== VOID
|| !def
->bb
)
132 if (last
->src1
!= def
->src1
)
137 } END_FOR_EACH_PTR(phi
);
140 pseudo_t pseudo
= last
? last
->src1
: VOID
;
141 convert_instruction_target(insn
, pseudo
);
146 return if_convert_phi(insn
);
149 static inline void remove_usage(pseudo_t p
, pseudo_t
*usep
)
151 if (has_use_list(p
)) {
152 delete_ptr_list_entry((struct ptr_list
**)&p
->users
, usep
, 1);
154 kill_instruction(p
->def
);
158 void kill_use(pseudo_t
*usep
)
163 remove_usage(p
, usep
);
167 void kill_instruction(struct instruction
*insn
)
169 if (!insn
|| !insn
->bb
)
172 switch (insn
->opcode
) {
173 case OP_BINARY
... OP_BINCMP_END
:
175 kill_use(&insn
->src1
);
176 kill_use(&insn
->src2
);
177 repeat_phase
|= REPEAT_CSE
;
180 case OP_NOT
: case OP_NEG
:
182 kill_use(&insn
->src1
);
183 repeat_phase
|= REPEAT_CSE
;
188 repeat_phase
|= REPEAT_CSE
;
193 repeat_phase
|= REPEAT_CSE
| REPEAT_SYMBOL_CLEANUP
;
198 repeat_phase
|= REPEAT_CSE
;
199 kill_use(&insn
->src1
);
200 kill_use(&insn
->src2
);
201 kill_use(&insn
->src3
);
207 * Kill trivially dead instructions
209 static int dead_insn(struct instruction
*insn
, pseudo_t
*src1
, pseudo_t
*src2
, pseudo_t
*src3
)
212 FOR_EACH_PTR(insn
->target
->users
, usep
) {
215 } END_FOR_EACH_PTR(usep
);
224 static inline int constant(pseudo_t pseudo
)
226 return pseudo
->type
== PSEUDO_VAL
;
229 static int replace_with_pseudo(struct instruction
*insn
, pseudo_t pseudo
)
231 convert_instruction_target(insn
, pseudo
);
236 static int simplify_constant_rightside(struct instruction
*insn
)
238 long long value
= insn
->src2
->value
;
240 switch (insn
->opcode
) {
243 insn
->opcode
= OP_ADD
;
244 insn
->src2
= value_pseudo(-value
);
249 case OP_OR
: case OP_XOR
:
251 case OP_LSR
: case OP_ASR
:
253 return replace_with_pseudo(insn
, insn
->src1
);
257 case OP_MULU
: case OP_MULS
:
259 return replace_with_pseudo(insn
, insn
->src2
);
265 static int simplify_constant_leftside(struct instruction
*insn
)
267 long long value
= insn
->src1
->value
;
269 switch (insn
->opcode
) {
270 case OP_ADD
: case OP_OR
: case OP_XOR
:
272 return replace_with_pseudo(insn
, insn
->src2
);
276 case OP_LSR
: case OP_ASR
:
278 case OP_MULU
: case OP_MULS
:
280 return replace_with_pseudo(insn
, insn
->src1
);
286 static int simplify_constant_binop(struct instruction
*insn
)
288 /* FIXME! Verify signs and sizes!! */
289 long long left
= insn
->src1
->value
;
290 long long right
= insn
->src2
->value
;
291 unsigned long long ul
, ur
;
292 long long res
, mask
, bits
;
294 mask
= 1ULL << (insn
->size
-1);
295 bits
= mask
| (mask
-1);
304 switch (insn
->opcode
) {
363 /* Binary comparison */
399 replace_with_pseudo(insn
, value_pseudo(res
));
403 static int simplify_binop(struct instruction
*insn
)
405 if (dead_insn(insn
, &insn
->src1
, &insn
->src2
, NULL
))
407 if (constant(insn
->src1
)) {
408 if (constant(insn
->src2
))
409 return simplify_constant_binop(insn
);
410 return simplify_constant_leftside(insn
);
412 if (constant(insn
->src2
))
413 return simplify_constant_rightside(insn
);
417 static void switch_pseudo(pseudo_t
*pp1
, pseudo_t
*pp2
)
419 pseudo_t p1
= *pp1
, p2
= *pp2
;
423 remove_usage(p1
, pp1
);
424 remove_usage(p2
, pp2
);
427 static int canonical_order(pseudo_t p1
, pseudo_t p2
)
429 /* symbol/constants on the right */
430 if (p1
->type
== PSEUDO_VAL
)
431 return p2
->type
== PSEUDO_VAL
;
433 if (p1
->type
== PSEUDO_SYM
)
434 return p2
->type
== PSEUDO_SYM
|| p2
->type
== PSEUDO_VAL
;
439 static int simplify_commutative_binop(struct instruction
*insn
)
441 if (!canonical_order(insn
->src1
, insn
->src2
)) {
442 switch_pseudo(&insn
->src1
, &insn
->src2
);
448 static inline int simple_pseudo(pseudo_t pseudo
)
450 return pseudo
->type
== PSEUDO_VAL
|| pseudo
->type
== PSEUDO_SYM
;
453 static int simplify_associative_binop(struct instruction
*insn
)
455 struct instruction
*def
;
456 pseudo_t pseudo
= insn
->src1
;
458 if (!simple_pseudo(insn
->src2
))
460 if (pseudo
->type
!= PSEUDO_REG
)
465 if (def
->opcode
!= insn
->opcode
)
467 if (!simple_pseudo(def
->src2
))
469 if (ptr_list_size((struct ptr_list
*)def
->target
->users
) != 1)
471 switch_pseudo(&def
->src1
, &insn
->src2
);
475 static int simplify_constant_unop(struct instruction
*insn
)
477 long long val
= insn
->src1
->value
;
480 switch (insn
->opcode
) {
490 mask
= 1ULL << (insn
->size
-1);
491 res
&= mask
| (mask
-1);
493 replace_with_pseudo(insn
, value_pseudo(res
));
497 static int simplify_unop(struct instruction
*insn
)
499 if (dead_insn(insn
, &insn
->src1
, NULL
, NULL
))
501 if (constant(insn
->src1
))
502 return simplify_constant_unop(insn
);
506 static int simplify_one_memop(struct instruction
*insn
, pseudo_t orig
)
508 pseudo_t addr
= insn
->src
;
511 if (addr
->type
== PSEUDO_REG
) {
512 struct instruction
*def
= addr
->def
;
513 if (def
->opcode
== OP_SYMADDR
&& def
->src
) {
514 kill_use(&insn
->src
);
515 use_pseudo(def
->src
, &insn
->src
);
516 return REPEAT_CSE
| REPEAT_SYMBOL_CLEANUP
;
518 if (def
->opcode
== OP_ADD
) {
538 warning(insn
->pos
, "crazy programmer");
540 insn
->offset
+= off
->value
;
541 use_pseudo(new, &insn
->src
);
542 remove_usage(addr
, &insn
->src
);
543 return REPEAT_CSE
| REPEAT_SYMBOL_CLEANUP
;
547 * We walk the whole chain of adds/subs backwards. That's not
548 * only more efficient, but it allows us to find loops.
550 static int simplify_memop(struct instruction
*insn
)
553 pseudo_t orig
= insn
->src
;
556 one
= simplify_one_memop(insn
, orig
);
562 static int simplify_cast(struct instruction
*insn
)
564 struct symbol
*orig_type
;
568 if (dead_insn(insn
, &insn
->src
, NULL
, NULL
))
571 orig_type
= insn
->orig_type
;
574 orig_size
= orig_type
->bit_size
;
578 /* A cast of a "and" might be a no-op.. */
579 if (src
->type
== PSEUDO_REG
) {
580 struct instruction
*def
= src
->def
;
581 if (def
->opcode
== OP_AND
&& def
->size
>= size
) {
582 pseudo_t val
= def
->src2
;
583 if (val
->type
== PSEUDO_VAL
) {
584 unsigned long long value
= val
->value
;
585 if (!(value
>> (size
-1)))
591 if (size
== orig_size
) {
592 int op
= (orig_type
->ctype
.modifiers
& MOD_SIGNED
) ? OP_SCAST
: OP_CAST
;
593 if (insn
->opcode
== op
)
600 return replace_with_pseudo(insn
, insn
->src
);
603 static int simplify_select(struct instruction
*insn
)
605 pseudo_t cond
, src1
, src2
;
607 if (dead_insn(insn
, &insn
->src1
, &insn
->src2
, &insn
->src3
))
613 if (constant(cond
) || src1
== src2
) {
614 pseudo_t
*kill
, take
;
615 kill_use(&insn
->src1
);
616 take
= cond
->value
? src1
: src2
;
617 kill
= cond
->value
? &insn
->src3
: &insn
->src2
;
619 replace_with_pseudo(insn
, take
);
622 if (constant(src1
) && constant(src2
)) {
623 long long val1
= src1
->value
;
624 long long val2
= src2
->value
;
626 /* The pair 0/1 is special - replace with SETNE/SETEQ */
627 if ((val1
| val2
) == 1) {
628 int opcode
= OP_SET_EQ
;
633 insn
->opcode
= opcode
;
634 /* insn->src1 is already cond */
635 insn
->src2
= src1
; /* Zero */
642 static int is_in_range(pseudo_t src
, long long low
, long long high
)
649 return value
>= low
&& value
<= high
;
655 static int simplify_range(struct instruction
*insn
)
657 pseudo_t src1
, src2
, src3
;
662 if (src2
->type
!= PSEUDO_VAL
|| src3
->type
!= PSEUDO_VAL
)
664 if (is_in_range(src1
, src2
->value
, src3
->value
)) {
665 kill_instruction(insn
);
672 * Simplify "set_ne/eq $0 + br"
674 static int simplify_cond_branch(struct instruction
*br
, pseudo_t cond
, struct instruction
*def
, pseudo_t
*pp
)
676 use_pseudo(*pp
, &br
->cond
);
677 remove_usage(cond
, &br
->cond
);
678 if (def
->opcode
== OP_SET_EQ
) {
679 struct basic_block
*true = br
->bb_true
;
680 struct basic_block
*false = br
->bb_false
;
687 static int simplify_branch(struct instruction
*insn
)
689 pseudo_t cond
= insn
->cond
;
694 /* Constant conditional */
695 if (constant(cond
)) {
696 insert_branch(insn
->bb
, insn
, cond
->value
? insn
->bb_true
: insn
->bb_false
);
701 if (insn
->bb_true
== insn
->bb_false
) {
702 struct basic_block
*bb
= insn
->bb
;
703 struct basic_block
*target
= insn
->bb_false
;
704 remove_bb_from_list(&target
->parents
, bb
, 1);
705 remove_bb_from_list(&bb
->children
, target
, 1);
706 insn
->bb_false
= NULL
;
707 kill_use(&insn
->cond
);
712 /* Conditional on a SETNE $0 or SETEQ $0 */
713 if (cond
->type
== PSEUDO_REG
) {
714 struct instruction
*def
= cond
->def
;
716 if (def
->opcode
== OP_SET_NE
|| def
->opcode
== OP_SET_EQ
) {
717 if (constant(def
->src1
) && !def
->src1
->value
)
718 return simplify_cond_branch(insn
, cond
, def
, &def
->src2
);
719 if (constant(def
->src2
) && !def
->src2
->value
)
720 return simplify_cond_branch(insn
, cond
, def
, &def
->src1
);
722 if (def
->opcode
== OP_SEL
) {
723 if (constant(def
->src2
) && constant(def
->src3
)) {
724 long long val1
= def
->src2
->value
;
725 long long val2
= def
->src3
->value
;
726 if (!val1
&& !val2
) {
727 insert_branch(insn
->bb
, insn
, insn
->bb_false
);
731 insert_branch(insn
->bb
, insn
, insn
->bb_true
);
735 struct basic_block
*true = insn
->bb_true
;
736 struct basic_block
*false = insn
->bb_false
;
737 insn
->bb_false
= true;
738 insn
->bb_true
= false;
740 use_pseudo(def
->src1
, &insn
->cond
);
741 remove_usage(cond
, &insn
->cond
);
745 if (def
->opcode
== OP_CAST
|| def
->opcode
== OP_SCAST
) {
746 int orig_size
= def
->orig_type
? def
->orig_type
->bit_size
: 0;
747 if (def
->size
> orig_size
) {
748 use_pseudo(def
->src
, &insn
->cond
);
749 remove_usage(cond
, &insn
->cond
);
757 static int simplify_switch(struct instruction
*insn
)
759 pseudo_t cond
= insn
->cond
;
761 struct multijmp
*jmp
;
765 val
= insn
->cond
->value
;
767 FOR_EACH_PTR(insn
->multijmp_list
, jmp
) {
769 if (jmp
->begin
> jmp
->end
)
771 if (val
>= jmp
->begin
&& val
<= jmp
->end
)
773 } END_FOR_EACH_PTR(jmp
);
774 warning(insn
->pos
, "Impossible case statement");
778 insert_branch(insn
->bb
, insn
, jmp
->target
);
782 int simplify_instruction(struct instruction
*insn
)
786 switch (insn
->opcode
) {
787 case OP_ADD
: case OP_MULS
:
788 case OP_AND
: case OP_OR
: case OP_XOR
:
789 case OP_AND_BOOL
: case OP_OR_BOOL
:
790 if (simplify_binop(insn
))
792 if (simplify_commutative_binop(insn
))
794 return simplify_associative_binop(insn
);
797 case OP_SET_EQ
: case OP_SET_NE
:
798 if (simplify_binop(insn
))
800 return simplify_commutative_binop(insn
);
803 case OP_DIVU
: case OP_DIVS
:
804 case OP_MODU
: case OP_MODS
:
806 case OP_LSR
: case OP_ASR
:
807 case OP_SET_LE
: case OP_SET_GE
:
808 case OP_SET_LT
: case OP_SET_GT
:
809 case OP_SET_B
: case OP_SET_A
:
810 case OP_SET_BE
: case OP_SET_AE
:
811 return simplify_binop(insn
);
813 case OP_NOT
: case OP_NEG
:
814 return simplify_unop(insn
);
815 case OP_LOAD
: case OP_STORE
:
816 return simplify_memop(insn
);
818 if (dead_insn(insn
, NULL
, NULL
, NULL
))
819 return REPEAT_CSE
| REPEAT_SYMBOL_CLEANUP
;
820 return replace_with_pseudo(insn
, insn
->symbol
);
825 return simplify_cast(insn
);
827 if (dead_insn(insn
, NULL
, NULL
, NULL
)) {
831 return clean_up_phi(insn
);
833 if (dead_insn(insn
, &insn
->phi_src
, NULL
, NULL
))
837 return simplify_select(insn
);
839 return simplify_branch(insn
);
841 return simplify_switch(insn
);
843 return simplify_range(insn
);