[gcc]
[official-gcc.git] / gcc / sched-int.h
blobde5d32692663620af67b5dac06dd5efb5c40e303
1 /* Instruction scheduling pass. This file contains definitions used
2 internally in the scheduler.
3 Copyright (C) 1992-2016 Free Software Foundation, Inc.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #ifndef GCC_SCHED_INT_H
22 #define GCC_SCHED_INT_H
24 #ifdef INSN_SCHEDULING
26 /* Identificator of a scheduler pass. */
27 enum sched_pass_id_t { SCHED_PASS_UNKNOWN, SCHED_RGN_PASS, SCHED_EBB_PASS,
28 SCHED_SMS_PASS, SCHED_SEL_PASS };
30 /* The algorithm used to implement -fsched-pressure. */
31 enum sched_pressure_algorithm
33 SCHED_PRESSURE_NONE,
34 SCHED_PRESSURE_WEIGHTED,
35 SCHED_PRESSURE_MODEL
38 typedef vec<basic_block> bb_vec_t;
39 typedef vec<rtx_insn *> insn_vec_t;
40 typedef vec<rtx_insn *> rtx_vec_t;
42 extern void sched_init_bbs (void);
44 extern void sched_extend_luids (void);
45 extern void sched_init_insn_luid (rtx_insn *);
46 extern void sched_init_luids (bb_vec_t);
47 extern void sched_finish_luids (void);
49 extern void sched_extend_target (void);
51 extern void haifa_init_h_i_d (bb_vec_t);
52 extern void haifa_finish_h_i_d (void);
54 /* Hooks that are common to all the schedulers. */
55 struct common_sched_info_def
57 /* Called after blocks were rearranged due to movement of jump instruction.
58 The first parameter - index of basic block, in which jump currently is.
59 The second parameter - index of basic block, in which jump used
60 to be.
61 The third parameter - index of basic block, that follows the second
62 parameter. */
63 void (*fix_recovery_cfg) (int, int, int);
65 /* Called to notify frontend, that new basic block is being added.
66 The first parameter - new basic block.
67 The second parameter - block, after which new basic block is being added,
68 or the exit block, if recovery block is being added,
69 or NULL, if standalone block is being added. */
70 void (*add_block) (basic_block, basic_block);
72 /* Estimate number of insns in the basic block. */
73 int (*estimate_number_of_insns) (basic_block);
75 /* Given a non-insn (!INSN_P (x)) return
76 -1 - if this rtx don't need a luid.
77 0 - if it should have the same luid as the previous insn.
78 1 - if it needs a separate luid. */
79 int (*luid_for_non_insn) (rtx);
81 /* Scheduler pass identifier. It is preferably used in assertions. */
82 enum sched_pass_id_t sched_pass_id;
85 extern struct common_sched_info_def *common_sched_info;
87 extern const struct common_sched_info_def haifa_common_sched_info;
89 /* Return true if selective scheduling pass is working. */
90 static inline bool
91 sel_sched_p (void)
93 return common_sched_info->sched_pass_id == SCHED_SEL_PASS;
96 /* Returns maximum priority that an insn was assigned to. */
97 extern int get_rgn_sched_max_insns_priority (void);
99 /* Increases effective priority for INSN by AMOUNT. */
100 extern void sel_add_to_insn_priority (rtx, int);
102 /* True if during selective scheduling we need to emulate some of haifa
103 scheduler behavior. */
104 extern int sched_emulate_haifa_p;
106 /* Mapping from INSN_UID to INSN_LUID. In the end all other per insn data
107 structures should be indexed by luid. */
108 extern vec<int> sched_luids;
109 #define INSN_LUID(INSN) (sched_luids[INSN_UID (INSN)])
110 #define LUID_BY_UID(UID) (sched_luids[UID])
112 #define SET_INSN_LUID(INSN, LUID) \
113 (sched_luids[INSN_UID (INSN)] = (LUID))
115 /* The highest INSN_LUID. */
116 extern int sched_max_luid;
118 extern int insn_luid (rtx);
120 /* This list holds ripped off notes from the current block. These notes will
121 be attached to the beginning of the block when its scheduling is
122 finished. */
123 extern rtx_insn *note_list;
125 extern void remove_notes (rtx_insn *, rtx_insn *);
126 extern rtx_insn *restore_other_notes (rtx_insn *, basic_block);
127 extern void sched_insns_init (rtx);
128 extern void sched_insns_finish (void);
130 extern void *xrecalloc (void *, size_t, size_t, size_t);
132 extern void reemit_notes (rtx_insn *);
134 /* Functions in haifa-sched.c. */
135 extern int haifa_classify_insn (const_rtx);
137 /* Functions in sel-sched-ir.c. */
138 extern void sel_find_rgns (void);
139 extern void sel_mark_hard_insn (rtx);
141 extern size_t dfa_state_size;
143 extern void advance_state (state_t);
145 extern void setup_sched_dump (void);
146 extern void sched_init (void);
147 extern void sched_finish (void);
149 extern bool sel_insn_is_speculation_check (rtx);
151 /* Describe the ready list of the scheduler.
152 VEC holds space enough for all insns in the current region. VECLEN
153 says how many exactly.
154 FIRST is the index of the element with the highest priority; i.e. the
155 last one in the ready list, since elements are ordered by ascending
156 priority.
157 N_READY determines how many insns are on the ready list.
158 N_DEBUG determines how many debug insns are on the ready list. */
159 struct ready_list
161 rtx_insn **vec;
162 int veclen;
163 int first;
164 int n_ready;
165 int n_debug;
168 extern signed char *ready_try;
169 extern struct ready_list ready;
171 extern int max_issue (struct ready_list *, int, state_t, bool, int *);
173 extern void ebb_compute_jump_reg_dependencies (rtx, regset);
175 extern edge find_fallthru_edge_from (basic_block);
177 extern void (* sched_init_only_bb) (basic_block, basic_block);
178 extern basic_block (* sched_split_block) (basic_block, rtx);
179 extern basic_block sched_split_block_1 (basic_block, rtx);
180 extern basic_block (* sched_create_empty_bb) (basic_block);
181 extern basic_block sched_create_empty_bb_1 (basic_block);
183 extern basic_block sched_create_recovery_block (basic_block *);
184 extern void sched_create_recovery_edges (basic_block, basic_block,
185 basic_block);
187 /* Pointer to data describing the current DFA state. */
188 extern state_t curr_state;
190 /* Type to represent status of a dependence. */
191 typedef unsigned int ds_t;
192 #define BITS_PER_DEP_STATUS HOST_BITS_PER_INT
194 /* Type to represent weakness of speculative dependence. */
195 typedef unsigned int dw_t;
197 extern enum reg_note ds_to_dk (ds_t);
198 extern ds_t dk_to_ds (enum reg_note);
200 /* Describe a dependency that can be broken by making a replacement
201 in one of the patterns. LOC is the location, ORIG and NEWVAL the
202 two alternative contents, and INSN the instruction that must be
203 changed. */
204 struct dep_replacement
206 rtx *loc;
207 rtx orig;
208 rtx newval;
209 rtx_insn *insn;
212 /* Information about the dependency. */
213 struct _dep
215 /* Producer. */
216 rtx_insn *pro;
218 /* Consumer. */
219 rtx_insn *con;
221 /* If nonnull, holds a pointer to information about how to break the
222 dependency by making a replacement in one of the insns. There is
223 only one such dependency for each insn that must be modified in
224 order to break such a dependency. */
225 struct dep_replacement *replace;
227 /* Dependency status. This field holds all dependency types and additional
228 information for speculative dependencies. */
229 ds_t status;
231 /* Dependency major type. This field is superseded by STATUS above.
232 Though, it is still in place because some targets use it. */
233 ENUM_BITFIELD(reg_note) type:6;
235 unsigned nonreg:1;
236 unsigned multiple:1;
238 /* Cached cost of the dependency. Make sure to update UNKNOWN_DEP_COST
239 when changing the size of this field. */
240 int cost:20;
243 #define UNKNOWN_DEP_COST ((int) ((unsigned int) -1 << 19))
245 typedef struct _dep dep_def;
246 typedef dep_def *dep_t;
248 #define DEP_PRO(D) ((D)->pro)
249 #define DEP_CON(D) ((D)->con)
250 #define DEP_TYPE(D) ((D)->type)
251 #define DEP_STATUS(D) ((D)->status)
252 #define DEP_COST(D) ((D)->cost)
253 #define DEP_NONREG(D) ((D)->nonreg)
254 #define DEP_MULTIPLE(D) ((D)->multiple)
255 #define DEP_REPLACE(D) ((D)->replace)
257 /* Functions to work with dep. */
259 extern void init_dep_1 (dep_t, rtx_insn *, rtx_insn *, enum reg_note, ds_t);
260 extern void init_dep (dep_t, rtx_insn *, rtx_insn *, enum reg_note);
262 extern void sd_debug_dep (dep_t);
264 /* Definition of this struct resides below. */
265 struct _dep_node;
266 typedef struct _dep_node *dep_node_t;
268 /* A link in the dependency list. This is essentially an equivalent of a
269 single {INSN, DEPS}_LIST rtx. */
270 struct _dep_link
272 /* Dep node with all the data. */
273 dep_node_t node;
275 /* Next link in the list. For the last one it is NULL. */
276 struct _dep_link *next;
278 /* Pointer to the next field of the previous link in the list.
279 For the first link this points to the deps_list->first.
281 With help of this field it is easy to remove and insert links to the
282 list. */
283 struct _dep_link **prev_nextp;
285 typedef struct _dep_link *dep_link_t;
287 #define DEP_LINK_NODE(N) ((N)->node)
288 #define DEP_LINK_NEXT(N) ((N)->next)
289 #define DEP_LINK_PREV_NEXTP(N) ((N)->prev_nextp)
291 /* Macros to work dep_link. For most usecases only part of the dependency
292 information is need. These macros conveniently provide that piece of
293 information. */
295 #define DEP_LINK_DEP(N) (DEP_NODE_DEP (DEP_LINK_NODE (N)))
296 #define DEP_LINK_PRO(N) (DEP_PRO (DEP_LINK_DEP (N)))
297 #define DEP_LINK_CON(N) (DEP_CON (DEP_LINK_DEP (N)))
298 #define DEP_LINK_TYPE(N) (DEP_TYPE (DEP_LINK_DEP (N)))
299 #define DEP_LINK_STATUS(N) (DEP_STATUS (DEP_LINK_DEP (N)))
301 /* A list of dep_links. */
302 struct _deps_list
304 /* First element. */
305 dep_link_t first;
307 /* Total number of elements in the list. */
308 int n_links;
310 typedef struct _deps_list *deps_list_t;
312 #define DEPS_LIST_FIRST(L) ((L)->first)
313 #define DEPS_LIST_N_LINKS(L) ((L)->n_links)
315 /* Suppose we have a dependence Y between insn pro1 and con1, where pro1 has
316 additional dependents con0 and con2, and con1 is dependent on additional
317 insns pro0 and pro1:
319 .con0 pro0
320 . ^ |
321 . | |
322 . | |
323 . X A
324 . | |
325 . | |
326 . | V
327 .pro1--Y-->con1
328 . | ^
329 . | |
330 . | |
331 . Z B
332 . | |
333 . | |
334 . V |
335 .con2 pro2
337 This is represented using a "dep_node" for each dependence arc, which are
338 connected as follows (diagram is centered around Y which is fully shown;
339 other dep_nodes shown partially):
341 . +------------+ +--------------+ +------------+
342 . : dep_node X : | dep_node Y | : dep_node Z :
343 . : : | | : :
344 . : : | | : :
345 . : forw : | forw | : forw :
346 . : +--------+ : | +--------+ | : +--------+ :
347 forw_deps : |dep_link| : | |dep_link| | : |dep_link| :
348 +-----+ : | +----+ | : | | +----+ | | : | +----+ | :
349 |first|----->| |next|-+------+->| |next|-+--+----->| |next|-+--->NULL
350 +-----+ : | +----+ | : | | +----+ | | : | +----+ | :
351 . ^ ^ : | ^ | : | | ^ | | : | | :
352 . | | : | | | : | | | | | : | | :
353 . | +--<----+--+ +--+---<--+--+--+ +--+--+--<---+--+ | :
354 . | : | | | : | | | | | : | | | :
355 . | : | +----+ | : | | +----+ | | : | +----+ | :
356 . | : | |prev| | : | | |prev| | | : | |prev| | :
357 . | : | |next| | : | | |next| | | : | |next| | :
358 . | : | +----+ | : | | +----+ | | : | +----+ | :
359 . | : | | :<-+ | | | |<-+ : | | :<-+
360 . | : | +----+ | : | | | +----+ | | | : | +----+ | : |
361 . | : | |node|-+----+ | | |node|-+--+--+ : | |node|-+----+
362 . | : | +----+ | : | | +----+ | | : | +----+ | :
363 . | : | | : | | | | : | | :
364 . | : +--------+ : | +--------+ | : +--------+ :
365 . | : : | | : :
366 . | : SAME pro1 : | +--------+ | : SAME pro1 :
367 . | : DIFF con0 : | |dep | | : DIFF con2 :
368 . | : : | | | | : :
369 . | | | +----+ | |
370 .RTX<------------------------+--+-|pro1| | |
371 .pro1 | | +----+ | |
372 . | | | |
373 . | | +----+ | |
374 .RTX<------------------------+--+-|con1| | |
375 .con1 | | +----+ | |
376 . | | | | |
377 . | | | +----+ | |
378 . | | | |kind| | |
379 . | | | +----+ | |
380 . | : : | | |stat| | | : :
381 . | : DIFF pro0 : | | +----+ | | : DIFF pro2 :
382 . | : SAME con1 : | | | | : SAME con1 :
383 . | : : | +--------+ | : :
384 . | : : | | : :
385 . | : back : | back | : back :
386 . v : +--------+ : | +--------+ | : +--------+ :
387 back_deps : |dep_link| : | |dep_link| | : |dep_link| :
388 +-----+ : | +----+ | : | | +----+ | | : | +----+ | :
389 |first|----->| |next|-+------+->| |next|-+--+----->| |next|-+--->NULL
390 +-----+ : | +----+ | : | | +----+ | | : | +----+ | :
391 . ^ : | ^ | : | | ^ | | : | | :
392 . | : | | | : | | | | | : | | :
393 . +--<----+--+ +--+---<--+--+--+ +--+--+--<---+--+ | :
394 . : | | | : | | | | | : | | | :
395 . : | +----+ | : | | +----+ | | : | +----+ | :
396 . : | |prev| | : | | |prev| | | : | |prev| | :
397 . : | |next| | : | | |next| | | : | |next| | :
398 . : | +----+ | : | | +----+ | | : | +----+ | :
399 . : | | :<-+ | | | |<-+ : | | :<-+
400 . : | +----+ | : | | | +----+ | | | : | +----+ | : |
401 . : | |node|-+----+ | | |node|-+--+--+ : | |node|-+----+
402 . : | +----+ | : | | +----+ | | : | +----+ | :
403 . : | | : | | | | : | | :
404 . : +--------+ : | +--------+ | : +--------+ :
405 . : : | | : :
406 . : dep_node A : | dep_node Y | : dep_node B :
407 . +------------+ +--------------+ +------------+
410 struct _dep_node
412 /* Backward link. */
413 struct _dep_link back;
415 /* The dep. */
416 struct _dep dep;
418 /* Forward link. */
419 struct _dep_link forw;
422 #define DEP_NODE_BACK(N) (&(N)->back)
423 #define DEP_NODE_DEP(N) (&(N)->dep)
424 #define DEP_NODE_FORW(N) (&(N)->forw)
426 /* The following enumeration values tell us what dependencies we
427 should use to implement the barrier. We use true-dependencies for
428 TRUE_BARRIER and anti-dependencies for MOVE_BARRIER. */
429 enum reg_pending_barrier_mode
431 NOT_A_BARRIER = 0,
432 MOVE_BARRIER,
433 TRUE_BARRIER
436 /* Whether a register movement is associated with a call. */
437 enum post_call_group
439 not_post_call,
440 post_call,
441 post_call_initial
444 /* Insns which affect pseudo-registers. */
445 struct deps_reg
447 rtx_insn_list *uses;
448 rtx_insn_list *sets;
449 rtx_insn_list *implicit_sets;
450 rtx_insn_list *control_uses;
451 rtx_insn_list *clobbers;
452 int uses_length;
453 int clobbers_length;
456 /* Describe state of dependencies used during sched_analyze phase. */
457 struct deps_desc
459 /* The *_insns and *_mems are paired lists. Each pending memory operation
460 will have a pointer to the MEM rtx on one list and a pointer to the
461 containing insn on the other list in the same place in the list. */
463 /* We can't use add_dependence like the old code did, because a single insn
464 may have multiple memory accesses, and hence needs to be on the list
465 once for each memory access. Add_dependence won't let you add an insn
466 to a list more than once. */
468 /* An INSN_LIST containing all insns with pending read operations. */
469 rtx_insn_list *pending_read_insns;
471 /* An EXPR_LIST containing all MEM rtx's which are pending reads. */
472 rtx_expr_list *pending_read_mems;
474 /* An INSN_LIST containing all insns with pending write operations. */
475 rtx_insn_list *pending_write_insns;
477 /* An EXPR_LIST containing all MEM rtx's which are pending writes. */
478 rtx_expr_list *pending_write_mems;
480 /* An INSN_LIST containing all jump insns. */
481 rtx_insn_list *pending_jump_insns;
483 /* We must prevent the above lists from ever growing too large since
484 the number of dependencies produced is at least O(N*N),
485 and execution time is at least O(4*N*N), as a function of the
486 length of these pending lists. */
488 /* Indicates the length of the pending_read list. */
489 int pending_read_list_length;
491 /* Indicates the length of the pending_write list. */
492 int pending_write_list_length;
494 /* Length of the pending memory flush list plus the length of the pending
495 jump insn list. Large functions with no calls may build up extremely
496 large lists. */
497 int pending_flush_length;
499 /* The last insn upon which all memory references must depend.
500 This is an insn which flushed the pending lists, creating a dependency
501 between it and all previously pending memory references. This creates
502 a barrier (or a checkpoint) which no memory reference is allowed to cross.
504 This includes all non constant CALL_INSNs. When we do interprocedural
505 alias analysis, this restriction can be relaxed.
506 This may also be an INSN that writes memory if the pending lists grow
507 too large. */
508 rtx_insn_list *last_pending_memory_flush;
510 /* A list of the last function calls we have seen. We use a list to
511 represent last function calls from multiple predecessor blocks.
512 Used to prevent register lifetimes from expanding unnecessarily. */
513 rtx_insn_list *last_function_call;
515 /* A list of the last function calls that may not return normally
516 we have seen. We use a list to represent last function calls from
517 multiple predecessor blocks. Used to prevent moving trapping insns
518 across such calls. */
519 rtx_insn_list *last_function_call_may_noreturn;
521 /* A list of insns which use a pseudo register that does not already
522 cross a call. We create dependencies between each of those insn
523 and the next call insn, to ensure that they won't cross a call after
524 scheduling is done. */
525 rtx_insn_list *sched_before_next_call;
527 /* Similarly, a list of insns which should not cross a branch. */
528 rtx_insn_list *sched_before_next_jump;
530 /* Used to keep post-call pseudo/hard reg movements together with
531 the call. */
532 enum post_call_group in_post_call_group_p;
534 /* The last debug insn we've seen. */
535 rtx_insn *last_debug_insn;
537 /* The last insn bearing REG_ARGS_SIZE that we've seen. */
538 rtx_insn *last_args_size;
540 /* The maximum register number for the following arrays. Before reload
541 this is max_reg_num; after reload it is FIRST_PSEUDO_REGISTER. */
542 int max_reg;
544 /* Element N is the next insn that sets (hard or pseudo) register
545 N within the current basic block; or zero, if there is no
546 such insn. Needed for new registers which may be introduced
547 by splitting insns. */
548 struct deps_reg *reg_last;
550 /* Element N is set for each register that has any nonzero element
551 in reg_last[N].{uses,sets,clobbers}. */
552 regset_head reg_last_in_use;
554 /* Shows the last value of reg_pending_barrier associated with the insn. */
555 enum reg_pending_barrier_mode last_reg_pending_barrier;
557 /* True when this context should be treated as a readonly by
558 the analysis. */
559 BOOL_BITFIELD readonly : 1;
562 typedef struct deps_desc *deps_t;
564 /* This structure holds some state of the current scheduling pass, and
565 contains some function pointers that abstract out some of the non-generic
566 functionality from functions such as schedule_block or schedule_insn.
567 There is one global variable, current_sched_info, which points to the
568 sched_info structure currently in use. */
569 struct haifa_sched_info
571 /* Add all insns that are initially ready to the ready list. Called once
572 before scheduling a set of insns. */
573 void (*init_ready_list) (void);
574 /* Called after taking an insn from the ready list. Returns nonzero if
575 this insn can be scheduled, nonzero if we should silently discard it. */
576 int (*can_schedule_ready_p) (rtx_insn *);
577 /* Return nonzero if there are more insns that should be scheduled. */
578 int (*schedule_more_p) (void);
579 /* Called after an insn has all its hard dependencies resolved.
580 Adjusts status of instruction (which is passed through second parameter)
581 to indicate if instruction should be moved to the ready list or the
582 queue, or if it should silently discard it (until next resolved
583 dependence). */
584 ds_t (*new_ready) (rtx_insn *, ds_t);
585 /* Compare priority of two insns. Return a positive number if the second
586 insn is to be preferred for scheduling, and a negative one if the first
587 is to be preferred. Zero if they are equally good. */
588 int (*rank) (rtx_insn *, rtx_insn *);
589 /* Return a string that contains the insn uid and optionally anything else
590 necessary to identify this insn in an output. It's valid to use a
591 static buffer for this. The ALIGNED parameter should cause the string
592 to be formatted so that multiple output lines will line up nicely. */
593 const char *(*print_insn) (const rtx_insn *, int);
594 /* Return nonzero if an insn should be included in priority
595 calculations. */
596 int (*contributes_to_priority) (rtx_insn *, rtx_insn *);
598 /* Return true if scheduling insn (passed as the parameter) will trigger
599 finish of scheduling current block. */
600 bool (*insn_finishes_block_p) (rtx_insn *);
602 /* The boundaries of the set of insns to be scheduled. */
603 rtx_insn *prev_head, *next_tail;
605 /* Filled in after the schedule is finished; the first and last scheduled
606 insns. */
607 rtx_insn *head, *tail;
609 /* If nonzero, enables an additional sanity check in schedule_block. */
610 unsigned int queue_must_finish_empty:1;
612 /* Maximum priority that has been assigned to an insn. */
613 int sched_max_insns_priority;
615 /* Hooks to support speculative scheduling. */
617 /* Called to notify frontend that instruction is being added (second
618 parameter == 0) or removed (second parameter == 1). */
619 void (*add_remove_insn) (rtx_insn *, int);
621 /* Called to notify the frontend that instruction INSN is being
622 scheduled. */
623 void (*begin_schedule_ready) (rtx_insn *insn);
625 /* Called to notify the frontend that an instruction INSN is about to be
626 moved to its correct place in the final schedule. This is done for all
627 insns in order of the schedule. LAST indicates the last scheduled
628 instruction. */
629 void (*begin_move_insn) (rtx_insn *insn, rtx_insn *last);
631 /* If the second parameter is not NULL, return nonnull value, if the
632 basic block should be advanced.
633 If the second parameter is NULL, return the next basic block in EBB.
634 The first parameter is the current basic block in EBB. */
635 basic_block (*advance_target_bb) (basic_block, rtx_insn *);
637 /* Allocate memory, store the frontend scheduler state in it, and
638 return it. */
639 void *(*save_state) (void);
640 /* Restore frontend scheduler state from the argument, and free the
641 memory. */
642 void (*restore_state) (void *);
644 /* ??? FIXME: should use straight bitfields inside sched_info instead of
645 this flag field. */
646 unsigned int flags;
649 /* This structure holds description of the properties for speculative
650 scheduling. */
651 struct spec_info_def
653 /* Holds types of allowed speculations: BEGIN_{DATA|CONTROL},
654 BE_IN_{DATA_CONTROL}. */
655 int mask;
657 /* A dump file for additional information on speculative scheduling. */
658 FILE *dump;
660 /* Minimal cumulative weakness of speculative instruction's
661 dependencies, so that insn will be scheduled. */
662 dw_t data_weakness_cutoff;
664 /* Minimal usefulness of speculative instruction to be considered for
665 scheduling. */
666 int control_weakness_cutoff;
668 /* Flags from the enum SPEC_SCHED_FLAGS. */
669 int flags;
671 typedef struct spec_info_def *spec_info_t;
673 extern spec_info_t spec_info;
675 extern struct haifa_sched_info *current_sched_info;
677 /* Do register pressure sensitive insn scheduling if the flag is set
678 up. */
679 extern enum sched_pressure_algorithm sched_pressure;
681 /* Map regno -> its pressure class. The map defined only when
682 SCHED_PRESSURE_P is true. */
683 extern enum reg_class *sched_regno_pressure_class;
685 /* Indexed by INSN_UID, the collection of all data associated with
686 a single instruction. */
688 struct _haifa_deps_insn_data
690 /* The number of incoming edges in the forward dependency graph.
691 As scheduling proceeds, counts are decreased. An insn moves to
692 the ready queue when its counter reaches zero. */
693 int dep_count;
695 /* Nonzero if instruction has internal dependence
696 (e.g. add_dependence was invoked with (insn == elem)). */
697 unsigned int has_internal_dep;
699 /* NB: We can't place 'struct _deps_list' here instead of deps_list_t into
700 h_i_d because when h_i_d extends, addresses of the deps_list->first
701 change without updating deps_list->first->next->prev_nextp. Thus
702 BACK_DEPS and RESOLVED_BACK_DEPS are allocated on the heap and FORW_DEPS
703 list is allocated on the obstack. */
705 /* A list of hard backward dependencies. The insn is a consumer of all the
706 deps mentioned here. */
707 deps_list_t hard_back_deps;
709 /* A list of speculative (weak) dependencies. The insn is a consumer of all
710 the deps mentioned here. */
711 deps_list_t spec_back_deps;
713 /* A list of insns which depend on the instruction. Unlike 'back_deps',
714 it represents forward dependencies. */
715 deps_list_t forw_deps;
717 /* A list of scheduled producers of the instruction. Links are being moved
718 from 'back_deps' to 'resolved_back_deps' while scheduling. */
719 deps_list_t resolved_back_deps;
721 /* A list of scheduled consumers of the instruction. Links are being moved
722 from 'forw_deps' to 'resolved_forw_deps' while scheduling to fasten the
723 search in 'forw_deps'. */
724 deps_list_t resolved_forw_deps;
726 /* If the insn is conditional (either through COND_EXEC, or because
727 it is a conditional branch), this records the condition. NULL
728 for insns that haven't been seen yet or don't have a condition;
729 const_true_rtx to mark an insn without a condition, or with a
730 condition that has been clobbered by a subsequent insn. */
731 rtx cond;
733 /* For a conditional insn, a list of insns that could set the condition
734 register. Used when generating control dependencies. */
735 rtx_insn_list *cond_deps;
737 /* True if the condition in 'cond' should be reversed to get the actual
738 condition. */
739 unsigned int reverse_cond : 1;
741 /* Some insns (e.g. call) are not allowed to move across blocks. */
742 unsigned int cant_move : 1;
746 /* Bits used for storing values of the fields in the following
747 structure. */
748 #define INCREASE_BITS 8
750 /* The structure describes how the corresponding insn increases the
751 register pressure for each pressure class. */
752 struct reg_pressure_data
754 /* Pressure increase for given class because of clobber. */
755 unsigned int clobber_increase : INCREASE_BITS;
756 /* Increase in register pressure for given class because of register
757 sets. */
758 unsigned int set_increase : INCREASE_BITS;
759 /* Pressure increase for given class because of unused register
760 set. */
761 unsigned int unused_set_increase : INCREASE_BITS;
762 /* Pressure change: #sets - #deaths. */
763 int change : INCREASE_BITS;
766 /* The following structure describes usage of registers by insns. */
767 struct reg_use_data
769 /* Regno used in the insn. */
770 int regno;
771 /* Insn using the regno. */
772 rtx_insn *insn;
773 /* Cyclic list of elements with the same regno. */
774 struct reg_use_data *next_regno_use;
775 /* List of elements with the same insn. */
776 struct reg_use_data *next_insn_use;
779 /* The following structure describes used sets of registers by insns.
780 Registers are pseudos whose pressure class is not NO_REGS or hard
781 registers available for allocations. */
782 struct reg_set_data
784 /* Regno used in the insn. */
785 int regno;
786 /* Insn setting the regno. */
787 rtx insn;
788 /* List of elements with the same insn. */
789 struct reg_set_data *next_insn_set;
792 enum autopref_multipass_data_status {
793 /* Entry is irrelevant for auto-prefetcher. */
794 AUTOPREF_MULTIPASS_DATA_IRRELEVANT = -2,
795 /* Entry is uninitialized. */
796 AUTOPREF_MULTIPASS_DATA_UNINITIALIZED = -1,
797 /* Entry is relevant for auto-prefetcher and insn can be delayed
798 to allow another insn through. */
799 AUTOPREF_MULTIPASS_DATA_NORMAL = 0,
800 /* Entry is relevant for auto-prefetcher, but insn should not be
801 delayed as that will break scheduling. */
802 AUTOPREF_MULTIPASS_DATA_DONT_DELAY = 1
805 /* Data for modeling cache auto-prefetcher. */
806 struct autopref_multipass_data_
808 /* Base part of memory address. */
809 rtx base;
811 /* Memory offsets from the base. For single simple sets
812 only min_offset is valid. For multi-set insns min_offset
813 and max_offset record the minimum and maximum offsets from the same
814 base among the sets inside the PARALLEL. */
815 int min_offset;
816 int max_offset;
818 /* True if this is a load/store-multiple instruction. */
819 bool multi_mem_insn_p;
821 /* Entry status. */
822 enum autopref_multipass_data_status status;
824 typedef struct autopref_multipass_data_ autopref_multipass_data_def;
825 typedef autopref_multipass_data_def *autopref_multipass_data_t;
827 struct _haifa_insn_data
829 /* We can't place 'struct _deps_list' into h_i_d instead of deps_list_t
830 because when h_i_d extends, addresses of the deps_list->first
831 change without updating deps_list->first->next->prev_nextp. */
833 /* Logical uid gives the original ordering of the insns. */
834 int luid;
836 /* A priority for each insn. */
837 int priority;
839 /* The fusion priority for each insn. */
840 int fusion_priority;
842 /* The minimum clock tick at which the insn becomes ready. This is
843 used to note timing constraints for the insns in the pending list. */
844 int tick;
846 /* For insns that are scheduled at a fixed difference from another,
847 this records the tick in which they must be ready. */
848 int exact_tick;
850 /* INTER_TICK is used to adjust INSN_TICKs of instructions from the
851 subsequent blocks in a region. */
852 int inter_tick;
854 /* Used temporarily to estimate an INSN_TICK value for an insn given
855 current knowledge. */
856 int tick_estimate;
858 /* See comment on QUEUE_INDEX macro in haifa-sched.c. */
859 int queue_index;
861 short cost;
863 /* '> 0' if priority is valid,
864 '== 0' if priority was not yet computed,
865 '< 0' if priority in invalid and should be recomputed. */
866 signed char priority_status;
868 /* Set if there's DEF-USE dependence between some speculatively
869 moved load insn and this one. */
870 unsigned int fed_by_spec_load : 1;
871 unsigned int is_load_insn : 1;
872 /* Nonzero if this insn has negative-cost forward dependencies against
873 an already scheduled insn. */
874 unsigned int feeds_backtrack_insn : 1;
876 /* Nonzero if this insn is a shadow of another, scheduled after a fixed
877 delay. We only emit shadows at the end of a cycle, with no other
878 real insns following them. */
879 unsigned int shadow_p : 1;
881 /* Used internally in unschedule_insns_until to mark insns that must have
882 their TODO_SPEC recomputed. */
883 unsigned int must_recompute_spec : 1;
885 /* What speculations are necessary to apply to schedule the instruction. */
886 ds_t todo_spec;
888 /* What speculations were already applied. */
889 ds_t done_spec;
891 /* What speculations are checked by this instruction. */
892 ds_t check_spec;
894 /* Recovery block for speculation checks. */
895 basic_block recovery_block;
897 /* Original pattern of the instruction. */
898 rtx orig_pat;
900 /* For insns with DEP_CONTROL dependencies, the predicated pattern if it
901 was ever successfully constructed. */
902 rtx predicated_pat;
904 /* The following array contains info how the insn increases register
905 pressure. There is an element for each cover class of pseudos
906 referenced in insns. */
907 struct reg_pressure_data *reg_pressure;
908 /* The following array contains maximal reg pressure between last
909 scheduled insn and given insn. There is an element for each
910 pressure class of pseudos referenced in insns. This info updated
911 after scheduling each insn for each insn between the two
912 mentioned insns. */
913 int *max_reg_pressure;
914 /* The following list contains info about used pseudos and hard
915 registers available for allocation. */
916 struct reg_use_data *reg_use_list;
917 /* The following list contains info about set pseudos and hard
918 registers available for allocation. */
919 struct reg_set_data *reg_set_list;
920 /* Info about how scheduling the insn changes cost of register
921 pressure excess (between source and target). */
922 int reg_pressure_excess_cost_change;
923 int model_index;
925 /* Original order of insns in the ready list. */
926 int rfs_debug_orig_order;
928 /* The deciding reason for INSN's place in the ready list. */
929 int last_rfs_win;
931 /* Two entries for cache auto-prefetcher model: one for mem reads,
932 and one for mem writes. */
933 autopref_multipass_data_def autopref_multipass_data[2];
936 typedef struct _haifa_insn_data haifa_insn_data_def;
937 typedef haifa_insn_data_def *haifa_insn_data_t;
940 extern vec<haifa_insn_data_def> h_i_d;
942 #define HID(INSN) (&h_i_d[INSN_UID (INSN)])
944 /* Accessor macros for h_i_d. There are more in haifa-sched.c and
945 sched-rgn.c. */
946 #define INSN_PRIORITY(INSN) (HID (INSN)->priority)
947 #define INSN_FUSION_PRIORITY(INSN) (HID (INSN)->fusion_priority)
948 #define INSN_REG_PRESSURE(INSN) (HID (INSN)->reg_pressure)
949 #define INSN_MAX_REG_PRESSURE(INSN) (HID (INSN)->max_reg_pressure)
950 #define INSN_REG_USE_LIST(INSN) (HID (INSN)->reg_use_list)
951 #define INSN_REG_SET_LIST(INSN) (HID (INSN)->reg_set_list)
952 #define INSN_REG_PRESSURE_EXCESS_COST_CHANGE(INSN) \
953 (HID (INSN)->reg_pressure_excess_cost_change)
954 #define INSN_PRIORITY_STATUS(INSN) (HID (INSN)->priority_status)
955 #define INSN_MODEL_INDEX(INSN) (HID (INSN)->model_index)
956 #define INSN_AUTOPREF_MULTIPASS_DATA(INSN) \
957 (HID (INSN)->autopref_multipass_data)
959 typedef struct _haifa_deps_insn_data haifa_deps_insn_data_def;
960 typedef haifa_deps_insn_data_def *haifa_deps_insn_data_t;
963 extern vec<haifa_deps_insn_data_def> h_d_i_d;
965 #define HDID(INSN) (&h_d_i_d[INSN_LUID (INSN)])
966 #define INSN_DEP_COUNT(INSN) (HDID (INSN)->dep_count)
967 #define HAS_INTERNAL_DEP(INSN) (HDID (INSN)->has_internal_dep)
968 #define INSN_FORW_DEPS(INSN) (HDID (INSN)->forw_deps)
969 #define INSN_RESOLVED_BACK_DEPS(INSN) (HDID (INSN)->resolved_back_deps)
970 #define INSN_RESOLVED_FORW_DEPS(INSN) (HDID (INSN)->resolved_forw_deps)
971 #define INSN_HARD_BACK_DEPS(INSN) (HDID (INSN)->hard_back_deps)
972 #define INSN_SPEC_BACK_DEPS(INSN) (HDID (INSN)->spec_back_deps)
973 #define INSN_CACHED_COND(INSN) (HDID (INSN)->cond)
974 #define INSN_REVERSE_COND(INSN) (HDID (INSN)->reverse_cond)
975 #define INSN_COND_DEPS(INSN) (HDID (INSN)->cond_deps)
976 #define CANT_MOVE(INSN) (HDID (INSN)->cant_move)
977 #define CANT_MOVE_BY_LUID(LUID) (h_d_i_d[LUID].cant_move)
980 #define INSN_PRIORITY(INSN) (HID (INSN)->priority)
981 #define INSN_PRIORITY_STATUS(INSN) (HID (INSN)->priority_status)
982 #define INSN_PRIORITY_KNOWN(INSN) (INSN_PRIORITY_STATUS (INSN) > 0)
983 #define TODO_SPEC(INSN) (HID (INSN)->todo_spec)
984 #define DONE_SPEC(INSN) (HID (INSN)->done_spec)
985 #define CHECK_SPEC(INSN) (HID (INSN)->check_spec)
986 #define RECOVERY_BLOCK(INSN) (HID (INSN)->recovery_block)
987 #define ORIG_PAT(INSN) (HID (INSN)->orig_pat)
988 #define PREDICATED_PAT(INSN) (HID (INSN)->predicated_pat)
990 /* INSN is either a simple or a branchy speculation check. */
991 #define IS_SPECULATION_CHECK_P(INSN) \
992 (sel_sched_p () ? sel_insn_is_speculation_check (INSN) : RECOVERY_BLOCK (INSN) != NULL)
994 /* INSN is a speculation check that will simply reexecute the speculatively
995 scheduled instruction if the speculation fails. */
996 #define IS_SPECULATION_SIMPLE_CHECK_P(INSN) \
997 (RECOVERY_BLOCK (INSN) == EXIT_BLOCK_PTR_FOR_FN (cfun))
999 /* INSN is a speculation check that will branch to RECOVERY_BLOCK if the
1000 speculation fails. Insns in that block will reexecute the speculatively
1001 scheduled code and then will return immediately after INSN thus preserving
1002 semantics of the program. */
1003 #define IS_SPECULATION_BRANCHY_CHECK_P(INSN) \
1004 (RECOVERY_BLOCK (INSN) != NULL \
1005 && RECOVERY_BLOCK (INSN) != EXIT_BLOCK_PTR_FOR_FN (cfun))
1008 /* Dep status (aka ds_t) of the link encapsulates all information for a given
1009 dependency, including everything that is needed for speculative scheduling.
1011 The lay-out of a ds_t is as follows:
1013 1. Integers corresponding to the probability of the dependence to *not*
1014 exist. This is the probability that overcoming this dependence will
1015 not be followed by execution of the recovery code. Note that however
1016 high this probability is, the recovery code should still always be
1017 generated to preserve semantics of the program.
1019 The probability values can be set or retrieved using the functions
1020 the set_dep_weak() and get_dep_weak() in sched-deps.c. The values
1021 are always in the range [0, MAX_DEP_WEAK].
1023 BEGIN_DATA : BITS_PER_DEP_WEAK
1024 BE_IN_DATA : BITS_PER_DEP_WEAK
1025 BEGIN_CONTROL : BITS_PER_DEP_WEAK
1026 BE_IN_CONTROL : BITS_PER_DEP_WEAK
1028 The basic type of DS_T is a host int. For a 32-bits int, the values
1029 will each take 6 bits.
1031 2. The type of dependence. This supercedes the old-style REG_NOTE_KIND
1032 values. TODO: Use this field instead of DEP_TYPE, or make DEP_TYPE
1033 extract the dependence type from here.
1035 dep_type : 4 => DEP_{TRUE|OUTPUT|ANTI|CONTROL}
1037 3. Various flags:
1039 HARD_DEP : 1 => Set if an instruction has a non-speculative
1040 dependence. This is an instruction property
1041 so this bit can only appear in the TODO_SPEC
1042 field of an instruction.
1043 DEP_POSTPONED : 1 => Like HARD_DEP, but the hard dependence may
1044 still be broken by adjusting the instruction.
1045 DEP_CANCELLED : 1 => Set if a dependency has been broken using
1046 some form of speculation.
1047 RESERVED : 1 => Reserved for use in the delay slot scheduler.
1049 See also: check_dep_status () in sched-deps.c . */
1051 /* The number of bits per weakness probability. There are 4 weakness types
1052 and we need 8 bits for other data in a DS_T. */
1053 #define BITS_PER_DEP_WEAK ((BITS_PER_DEP_STATUS - 8) / 4)
1055 /* Mask of speculative weakness in dep_status. */
1056 #define DEP_WEAK_MASK ((1 << BITS_PER_DEP_WEAK) - 1)
1058 /* This constant means that dependence is fake with 99.999...% probability.
1059 This is the maximum value, that can appear in dep_status.
1060 Note, that we don't want MAX_DEP_WEAK to be the same as DEP_WEAK_MASK for
1061 debugging reasons. Though, it can be set to DEP_WEAK_MASK, and, when
1062 done so, we'll get fast (mul for)/(div by) NO_DEP_WEAK. */
1063 #define MAX_DEP_WEAK (DEP_WEAK_MASK - 1)
1065 /* This constant means that dependence is 99.999...% real and it is a really
1066 bad idea to overcome it (though this can be done, preserving program
1067 semantics). */
1068 #define MIN_DEP_WEAK 1
1070 /* This constant represents 100% probability.
1071 E.g. it is used to represent weakness of dependence, that doesn't exist.
1072 This value never appears in a ds_t, it is only used for computing the
1073 weakness of a dependence. */
1074 #define NO_DEP_WEAK (MAX_DEP_WEAK + MIN_DEP_WEAK)
1076 /* Default weakness of speculative dependence. Used when we can't say
1077 neither bad nor good about the dependence. */
1078 #define UNCERTAIN_DEP_WEAK (MAX_DEP_WEAK - MAX_DEP_WEAK / 4)
1080 /* Offset for speculative weaknesses in dep_status. */
1081 enum SPEC_TYPES_OFFSETS {
1082 BEGIN_DATA_BITS_OFFSET = 0,
1083 BE_IN_DATA_BITS_OFFSET = BEGIN_DATA_BITS_OFFSET + BITS_PER_DEP_WEAK,
1084 BEGIN_CONTROL_BITS_OFFSET = BE_IN_DATA_BITS_OFFSET + BITS_PER_DEP_WEAK,
1085 BE_IN_CONTROL_BITS_OFFSET = BEGIN_CONTROL_BITS_OFFSET + BITS_PER_DEP_WEAK
1088 /* The following defines provide numerous constants used to distinguish
1089 between different types of speculative dependencies. They are also
1090 used as masks to clear/preserve the bits corresponding to the type
1091 of dependency weakness. */
1093 /* Dependence can be overcome with generation of new data speculative
1094 instruction. */
1095 #define BEGIN_DATA (((ds_t) DEP_WEAK_MASK) << BEGIN_DATA_BITS_OFFSET)
1097 /* This dependence is to the instruction in the recovery block, that was
1098 formed to recover after data-speculation failure.
1099 Thus, this dependence can overcome with generating of the copy of
1100 this instruction in the recovery block. */
1101 #define BE_IN_DATA (((ds_t) DEP_WEAK_MASK) << BE_IN_DATA_BITS_OFFSET)
1103 /* Dependence can be overcome with generation of new control speculative
1104 instruction. */
1105 #define BEGIN_CONTROL (((ds_t) DEP_WEAK_MASK) << BEGIN_CONTROL_BITS_OFFSET)
1107 /* This dependence is to the instruction in the recovery block, that was
1108 formed to recover after control-speculation failure.
1109 Thus, this dependence can be overcome with generating of the copy of
1110 this instruction in the recovery block. */
1111 #define BE_IN_CONTROL (((ds_t) DEP_WEAK_MASK) << BE_IN_CONTROL_BITS_OFFSET)
1113 /* A few convenient combinations. */
1114 #define BEGIN_SPEC (BEGIN_DATA | BEGIN_CONTROL)
1115 #define DATA_SPEC (BEGIN_DATA | BE_IN_DATA)
1116 #define CONTROL_SPEC (BEGIN_CONTROL | BE_IN_CONTROL)
1117 #define SPECULATIVE (DATA_SPEC | CONTROL_SPEC)
1118 #define BE_IN_SPEC (BE_IN_DATA | BE_IN_CONTROL)
1120 /* Constants, that are helpful in iterating through dep_status. */
1121 #define FIRST_SPEC_TYPE BEGIN_DATA
1122 #define LAST_SPEC_TYPE BE_IN_CONTROL
1123 #define SPEC_TYPE_SHIFT BITS_PER_DEP_WEAK
1125 /* Dependence on instruction can be of multiple types
1126 (e.g. true and output). This fields enhance REG_NOTE_KIND information
1127 of the dependence. */
1128 #define DEP_TRUE (((ds_t) 1) << (BE_IN_CONTROL_BITS_OFFSET + BITS_PER_DEP_WEAK))
1129 #define DEP_OUTPUT (DEP_TRUE << 1)
1130 #define DEP_ANTI (DEP_OUTPUT << 1)
1131 #define DEP_CONTROL (DEP_ANTI << 1)
1133 #define DEP_TYPES (DEP_TRUE | DEP_OUTPUT | DEP_ANTI | DEP_CONTROL)
1135 /* Instruction has non-speculative dependence. This bit represents the
1136 property of an instruction - not the one of a dependence.
1137 Therefore, it can appear only in the TODO_SPEC field of an instruction. */
1138 #define HARD_DEP (DEP_CONTROL << 1)
1140 /* Like HARD_DEP, but dependencies can perhaps be broken by modifying
1141 the instructions. This is used for example to change:
1143 rn++ => rm=[rn + 4]
1144 rm=[rn] rn++
1146 For instructions that have this bit set, one of the dependencies of
1147 the instructions will have a non-NULL REPLACE field in its DEP_T.
1148 Just like HARD_DEP, this bit is only ever set in TODO_SPEC. */
1149 #define DEP_POSTPONED (HARD_DEP << 1)
1151 /* Set if a dependency is cancelled via speculation. */
1152 #define DEP_CANCELLED (DEP_POSTPONED << 1)
1155 /* This represents the results of calling sched-deps.c functions,
1156 which modify dependencies. */
1157 enum DEPS_ADJUST_RESULT {
1158 /* No dependence needed (e.g. producer == consumer). */
1159 DEP_NODEP,
1160 /* Dependence is already present and wasn't modified. */
1161 DEP_PRESENT,
1162 /* Existing dependence was modified to include additional information. */
1163 DEP_CHANGED,
1164 /* New dependence has been created. */
1165 DEP_CREATED
1168 /* Represents the bits that can be set in the flags field of the
1169 sched_info structure. */
1170 enum SCHED_FLAGS {
1171 /* If set, generate links between instruction as DEPS_LIST.
1172 Otherwise, generate usual INSN_LIST links. */
1173 USE_DEPS_LIST = 1,
1174 /* Perform data or control (or both) speculation.
1175 Results in generation of data and control speculative dependencies.
1176 Requires USE_DEPS_LIST set. */
1177 DO_SPECULATION = USE_DEPS_LIST << 1,
1178 DO_BACKTRACKING = DO_SPECULATION << 1,
1179 DO_PREDICATION = DO_BACKTRACKING << 1,
1180 DONT_BREAK_DEPENDENCIES = DO_PREDICATION << 1,
1181 SCHED_RGN = DONT_BREAK_DEPENDENCIES << 1,
1182 SCHED_EBB = SCHED_RGN << 1,
1183 /* Scheduler can possibly create new basic blocks. Used for assertions. */
1184 NEW_BBS = SCHED_EBB << 1,
1185 SEL_SCHED = NEW_BBS << 1
1188 enum SPEC_SCHED_FLAGS {
1189 COUNT_SPEC_IN_CRITICAL_PATH = 1,
1190 SEL_SCHED_SPEC_DONT_CHECK_CONTROL = COUNT_SPEC_IN_CRITICAL_PATH << 1
1193 #define NOTE_NOT_BB_P(NOTE) (NOTE_P (NOTE) && (NOTE_KIND (NOTE) \
1194 != NOTE_INSN_BASIC_BLOCK))
1196 extern FILE *sched_dump;
1197 extern int sched_verbose;
1199 extern spec_info_t spec_info;
1200 extern bool haifa_recovery_bb_ever_added_p;
1202 /* Exception Free Loads:
1204 We define five classes of speculative loads: IFREE, IRISKY,
1205 PFREE, PRISKY, and MFREE.
1207 IFREE loads are loads that are proved to be exception-free, just
1208 by examining the load insn. Examples for such loads are loads
1209 from TOC and loads of global data.
1211 IRISKY loads are loads that are proved to be exception-risky,
1212 just by examining the load insn. Examples for such loads are
1213 volatile loads and loads from shared memory.
1215 PFREE loads are loads for which we can prove, by examining other
1216 insns, that they are exception-free. Currently, this class consists
1217 of loads for which we are able to find a "similar load", either in
1218 the target block, or, if only one split-block exists, in that split
1219 block. Load2 is similar to load1 if both have same single base
1220 register. We identify only part of the similar loads, by finding
1221 an insn upon which both load1 and load2 have a DEF-USE dependence.
1223 PRISKY loads are loads for which we can prove, by examining other
1224 insns, that they are exception-risky. Currently we have two proofs for
1225 such loads. The first proof detects loads that are probably guarded by a
1226 test on the memory address. This proof is based on the
1227 backward and forward data dependence information for the region.
1228 Let load-insn be the examined load.
1229 Load-insn is PRISKY iff ALL the following hold:
1231 - insn1 is not in the same block as load-insn
1232 - there is a DEF-USE dependence chain (insn1, ..., load-insn)
1233 - test-insn is either a compare or a branch, not in the same block
1234 as load-insn
1235 - load-insn is reachable from test-insn
1236 - there is a DEF-USE dependence chain (insn1, ..., test-insn)
1238 This proof might fail when the compare and the load are fed
1239 by an insn not in the region. To solve this, we will add to this
1240 group all loads that have no input DEF-USE dependence.
1242 The second proof detects loads that are directly or indirectly
1243 fed by a speculative load. This proof is affected by the
1244 scheduling process. We will use the flag fed_by_spec_load.
1245 Initially, all insns have this flag reset. After a speculative
1246 motion of an insn, if insn is either a load, or marked as
1247 fed_by_spec_load, we will also mark as fed_by_spec_load every
1248 insn1 for which a DEF-USE dependence (insn, insn1) exists. A
1249 load which is fed_by_spec_load is also PRISKY.
1251 MFREE (maybe-free) loads are all the remaining loads. They may be
1252 exception-free, but we cannot prove it.
1254 Now, all loads in IFREE and PFREE classes are considered
1255 exception-free, while all loads in IRISKY and PRISKY classes are
1256 considered exception-risky. As for loads in the MFREE class,
1257 these are considered either exception-free or exception-risky,
1258 depending on whether we are pessimistic or optimistic. We have
1259 to take the pessimistic approach to assure the safety of
1260 speculative scheduling, but we can take the optimistic approach
1261 by invoking the -fsched_spec_load_dangerous option. */
1263 enum INSN_TRAP_CLASS
1265 TRAP_FREE = 0, IFREE = 1, PFREE_CANDIDATE = 2,
1266 PRISKY_CANDIDATE = 3, IRISKY = 4, TRAP_RISKY = 5
1269 #define WORST_CLASS(class1, class2) \
1270 ((class1 > class2) ? class1 : class2)
1272 #ifndef __GNUC__
1273 #define __inline
1274 #endif
1276 #ifndef HAIFA_INLINE
1277 #define HAIFA_INLINE __inline
1278 #endif
1280 struct sched_deps_info_def
1282 /* Called when computing dependencies for a JUMP_INSN. This function
1283 should store the set of registers that must be considered as set by
1284 the jump in the regset. */
1285 void (*compute_jump_reg_dependencies) (rtx, regset);
1287 /* Start analyzing insn. */
1288 void (*start_insn) (rtx_insn *);
1290 /* Finish analyzing insn. */
1291 void (*finish_insn) (void);
1293 /* Start analyzing insn LHS (Left Hand Side). */
1294 void (*start_lhs) (rtx);
1296 /* Finish analyzing insn LHS. */
1297 void (*finish_lhs) (void);
1299 /* Start analyzing insn RHS (Right Hand Side). */
1300 void (*start_rhs) (rtx);
1302 /* Finish analyzing insn RHS. */
1303 void (*finish_rhs) (void);
1305 /* Note set of the register. */
1306 void (*note_reg_set) (int);
1308 /* Note clobber of the register. */
1309 void (*note_reg_clobber) (int);
1311 /* Note use of the register. */
1312 void (*note_reg_use) (int);
1314 /* Note memory dependence of type DS between MEM1 and MEM2 (which is
1315 in the INSN2). */
1316 void (*note_mem_dep) (rtx mem1, rtx mem2, rtx_insn *insn2, ds_t ds);
1318 /* Note a dependence of type DS from the INSN. */
1319 void (*note_dep) (rtx_insn *, ds_t ds);
1321 /* Nonzero if we should use cselib for better alias analysis. This
1322 must be 0 if the dependency information is used after sched_analyze
1323 has completed, e.g. if we're using it to initialize state for successor
1324 blocks in region scheduling. */
1325 unsigned int use_cselib : 1;
1327 /* If set, generate links between instruction as DEPS_LIST.
1328 Otherwise, generate usual INSN_LIST links. */
1329 unsigned int use_deps_list : 1;
1331 /* Generate data and control speculative dependencies.
1332 Requires USE_DEPS_LIST set. */
1333 unsigned int generate_spec_deps : 1;
1336 extern struct sched_deps_info_def *sched_deps_info;
1339 /* Functions in sched-deps.c. */
1340 extern rtx sched_get_reverse_condition_uncached (const rtx_insn *);
1341 extern bool sched_insns_conditions_mutex_p (const rtx_insn *,
1342 const rtx_insn *);
1343 extern bool sched_insn_is_legitimate_for_speculation_p (const rtx_insn *, ds_t);
1344 extern void add_dependence (rtx_insn *, rtx_insn *, enum reg_note);
1345 extern void sched_analyze (struct deps_desc *, rtx_insn *, rtx_insn *);
1346 extern void init_deps (struct deps_desc *, bool);
1347 extern void init_deps_reg_last (struct deps_desc *);
1348 extern void free_deps (struct deps_desc *);
1349 extern void init_deps_global (void);
1350 extern void finish_deps_global (void);
1351 extern void deps_analyze_insn (struct deps_desc *, rtx_insn *);
1352 extern void remove_from_deps (struct deps_desc *, rtx_insn *);
1353 extern void init_insn_reg_pressure_info (rtx_insn *);
1354 extern void get_implicit_reg_pending_clobbers (HARD_REG_SET *, rtx_insn *);
1356 extern dw_t get_dep_weak (ds_t, ds_t);
1357 extern ds_t set_dep_weak (ds_t, ds_t, dw_t);
1358 extern dw_t estimate_dep_weak (rtx, rtx);
1359 extern ds_t ds_merge (ds_t, ds_t);
1360 extern ds_t ds_full_merge (ds_t, ds_t, rtx, rtx);
1361 extern ds_t ds_max_merge (ds_t, ds_t);
1362 extern dw_t ds_weak (ds_t);
1363 extern ds_t ds_get_speculation_types (ds_t);
1364 extern ds_t ds_get_max_dep_weak (ds_t);
1366 extern void sched_deps_init (bool);
1367 extern void sched_deps_finish (void);
1369 extern void haifa_note_reg_set (int);
1370 extern void haifa_note_reg_clobber (int);
1371 extern void haifa_note_reg_use (int);
1373 extern void maybe_extend_reg_info_p (void);
1375 extern void deps_start_bb (struct deps_desc *, rtx_insn *);
1376 extern enum reg_note ds_to_dt (ds_t);
1378 extern bool deps_pools_are_empty_p (void);
1379 extern void sched_free_deps (rtx_insn *, rtx_insn *, bool);
1380 extern void extend_dependency_caches (int, bool);
1382 extern void debug_ds (ds_t);
1385 /* Functions in haifa-sched.c. */
1386 extern void initialize_live_range_shrinkage (void);
1387 extern void finish_live_range_shrinkage (void);
1388 extern void sched_init_region_reg_pressure_info (void);
1389 extern void free_global_sched_pressure_data (void);
1390 extern int haifa_classify_insn (const_rtx);
1391 extern void get_ebb_head_tail (basic_block, basic_block,
1392 rtx_insn **, rtx_insn **);
1393 extern int no_real_insns_p (const rtx_insn *, const rtx_insn *);
1395 extern int insn_cost (rtx_insn *);
1396 extern int dep_cost_1 (dep_t, dw_t);
1397 extern int dep_cost (dep_t);
1398 extern int set_priorities (rtx_insn *, rtx_insn *);
1400 extern void sched_setup_bb_reg_pressure_info (basic_block, rtx_insn *);
1401 extern bool schedule_block (basic_block *, state_t);
1403 extern int cycle_issued_insns;
1404 extern int issue_rate;
1405 extern int dfa_lookahead;
1407 extern int autopref_multipass_dfa_lookahead_guard (rtx_insn *, int);
1409 extern rtx_insn *ready_element (struct ready_list *, int);
1410 extern rtx_insn **ready_lastpos (struct ready_list *);
1412 extern int try_ready (rtx_insn *);
1413 extern void sched_extend_ready_list (int);
1414 extern void sched_finish_ready_list (void);
1415 extern void sched_change_pattern (rtx, rtx);
1416 extern int sched_speculate_insn (rtx_insn *, ds_t, rtx *);
1417 extern void unlink_bb_notes (basic_block, basic_block);
1418 extern void add_block (basic_block, basic_block);
1419 extern rtx_note *bb_note (basic_block);
1420 extern void concat_note_lists (rtx_insn *, rtx_insn **);
1421 extern rtx_insn *sched_emit_insn (rtx);
1422 extern rtx_insn *get_ready_element (int);
1423 extern int number_in_ready (void);
1425 /* Types and functions in sched-ebb.c. */
1427 extern basic_block schedule_ebb (rtx_insn *, rtx_insn *, bool);
1428 extern void schedule_ebbs_init (void);
1429 extern void schedule_ebbs_finish (void);
1431 /* Types and functions in sched-rgn.c. */
1433 /* A region is the main entity for interblock scheduling: insns
1434 are allowed to move between blocks in the same region, along
1435 control flow graph edges, in the 'up' direction. */
1436 struct region
1438 /* Number of extended basic blocks in region. */
1439 int rgn_nr_blocks;
1440 /* cblocks in the region (actually index in rgn_bb_table). */
1441 int rgn_blocks;
1442 /* Dependencies for this region are already computed. Basically, indicates,
1443 that this is a recovery block. */
1444 unsigned int dont_calc_deps : 1;
1445 /* This region has at least one non-trivial ebb. */
1446 unsigned int has_real_ebb : 1;
1449 extern int nr_regions;
1450 extern region *rgn_table;
1451 extern int *rgn_bb_table;
1452 extern int *block_to_bb;
1453 extern int *containing_rgn;
1455 /* Often used short-hand in the scheduler. The rest of the compiler uses
1456 BLOCK_FOR_INSN(INSN) and an indirect reference to get the basic block
1457 number ("index"). For historical reasons, the scheduler does not. */
1458 #define BLOCK_NUM(INSN) (BLOCK_FOR_INSN (INSN)->index + 0)
1460 #define RGN_NR_BLOCKS(rgn) (rgn_table[rgn].rgn_nr_blocks)
1461 #define RGN_BLOCKS(rgn) (rgn_table[rgn].rgn_blocks)
1462 #define RGN_DONT_CALC_DEPS(rgn) (rgn_table[rgn].dont_calc_deps)
1463 #define RGN_HAS_REAL_EBB(rgn) (rgn_table[rgn].has_real_ebb)
1464 #define BLOCK_TO_BB(block) (block_to_bb[block])
1465 #define CONTAINING_RGN(block) (containing_rgn[block])
1467 /* The mapping from ebb to block. */
1468 extern int *ebb_head;
1469 #define BB_TO_BLOCK(ebb) (rgn_bb_table[ebb_head[ebb]])
1470 #define EBB_FIRST_BB(ebb) BASIC_BLOCK_FOR_FN (cfun, BB_TO_BLOCK (ebb))
1471 #define EBB_LAST_BB(ebb) \
1472 BASIC_BLOCK_FOR_FN (cfun, rgn_bb_table[ebb_head[ebb + 1] - 1])
1473 #define INSN_BB(INSN) (BLOCK_TO_BB (BLOCK_NUM (INSN)))
1475 extern int current_nr_blocks;
1476 extern int current_blocks;
1477 extern int target_bb;
1478 extern bool sched_no_dce;
1480 extern void set_modulo_params (int, int, int, int);
1481 extern void record_delay_slot_pair (rtx_insn *, rtx_insn *, int, int);
1482 extern rtx_insn *real_insn_for_shadow (rtx_insn *);
1483 extern void discard_delay_pairs_above (int);
1484 extern void free_delay_pairs (void);
1485 extern void add_delay_dependencies (rtx_insn *);
1486 extern bool sched_is_disabled_for_current_region_p (void);
1487 extern void sched_rgn_init (bool);
1488 extern void sched_rgn_finish (void);
1489 extern void rgn_setup_region (int);
1490 extern void sched_rgn_compute_dependencies (int);
1491 extern void sched_rgn_local_init (int);
1492 extern void sched_rgn_local_finish (void);
1493 extern void sched_rgn_local_free (void);
1494 extern void extend_regions (void);
1495 extern void rgn_make_new_region_out_of_new_block (basic_block);
1497 extern void compute_priorities (void);
1498 extern void increase_insn_priority (rtx_insn *, int);
1499 extern void debug_rgn_dependencies (int);
1500 extern void debug_dependencies (rtx_insn *, rtx_insn *);
1501 extern void dump_rgn_dependencies_dot (FILE *);
1502 extern void dump_rgn_dependencies_dot (const char *);
1504 extern void free_rgn_deps (void);
1505 extern int contributes_to_priority (rtx_insn *, rtx_insn *);
1506 extern void extend_rgns (int *, int *, sbitmap, int *);
1507 extern void deps_join (struct deps_desc *, struct deps_desc *);
1509 extern void rgn_setup_common_sched_info (void);
1510 extern void rgn_setup_sched_infos (void);
1512 extern void debug_regions (void);
1513 extern void debug_region (int);
1514 extern void dump_region_dot (FILE *, int);
1515 extern void dump_region_dot_file (const char *, int);
1517 extern void haifa_sched_init (void);
1518 extern void haifa_sched_finish (void);
1520 extern void find_modifiable_mems (rtx_insn *, rtx_insn *);
1522 /* sched-deps.c interface to walk, add, search, update, resolve, delete
1523 and debug instruction dependencies. */
1525 /* Constants defining dependences lists. */
1527 /* No list. */
1528 #define SD_LIST_NONE (0)
1530 /* hard_back_deps. */
1531 #define SD_LIST_HARD_BACK (1)
1533 /* spec_back_deps. */
1534 #define SD_LIST_SPEC_BACK (2)
1536 /* forw_deps. */
1537 #define SD_LIST_FORW (4)
1539 /* resolved_back_deps. */
1540 #define SD_LIST_RES_BACK (8)
1542 /* resolved_forw_deps. */
1543 #define SD_LIST_RES_FORW (16)
1545 #define SD_LIST_BACK (SD_LIST_HARD_BACK | SD_LIST_SPEC_BACK)
1547 /* A type to hold above flags. */
1548 typedef int sd_list_types_def;
1550 extern void sd_next_list (const_rtx, sd_list_types_def *, deps_list_t *, bool *);
1552 /* Iterator to walk through, resolve and delete dependencies. */
1553 struct _sd_iterator
1555 /* What lists to walk. Can be any combination of SD_LIST_* flags. */
1556 sd_list_types_def types;
1558 /* Instruction dependencies lists of which will be walked. */
1559 rtx insn;
1561 /* Pointer to the next field of the previous element. This is not
1562 simply a pointer to the next element to allow easy deletion from the
1563 list. When a dep is being removed from the list the iterator
1564 will automatically advance because the value in *linkp will start
1565 referring to the next element. */
1566 dep_link_t *linkp;
1568 /* True if the current list is a resolved one. */
1569 bool resolved_p;
1572 typedef struct _sd_iterator sd_iterator_def;
1574 /* ??? We can move some definitions that are used in below inline functions
1575 out of sched-int.h to sched-deps.c provided that the below functions will
1576 become global externals.
1577 These definitions include:
1578 * struct _deps_list: opaque pointer is needed at global scope.
1579 * struct _dep_link: opaque pointer is needed at scope of sd_iterator_def.
1580 * struct _dep_node: opaque pointer is needed at scope of
1581 struct _deps_link. */
1583 /* Return initialized iterator. */
1584 static inline sd_iterator_def
1585 sd_iterator_start (rtx insn, sd_list_types_def types)
1587 /* Some dep_link a pointer to which will return NULL. */
1588 static dep_link_t null_link = NULL;
1590 sd_iterator_def i;
1592 i.types = types;
1593 i.insn = insn;
1594 i.linkp = &null_link;
1596 /* Avoid 'uninitialized warning'. */
1597 i.resolved_p = false;
1599 return i;
1602 /* Return the current element. */
1603 static inline bool
1604 sd_iterator_cond (sd_iterator_def *it_ptr, dep_t *dep_ptr)
1606 while (true)
1608 dep_link_t link = *it_ptr->linkp;
1610 if (link != NULL)
1612 *dep_ptr = DEP_LINK_DEP (link);
1613 return true;
1615 else
1617 sd_list_types_def types = it_ptr->types;
1619 if (types != SD_LIST_NONE)
1620 /* Switch to next list. */
1622 deps_list_t list;
1624 sd_next_list (it_ptr->insn,
1625 &it_ptr->types, &list, &it_ptr->resolved_p);
1627 it_ptr->linkp = &DEPS_LIST_FIRST (list);
1629 if (list)
1630 continue;
1633 *dep_ptr = NULL;
1634 return false;
1639 /* Advance iterator. */
1640 static inline void
1641 sd_iterator_next (sd_iterator_def *it_ptr)
1643 it_ptr->linkp = &DEP_LINK_NEXT (*it_ptr->linkp);
1646 /* A cycle wrapper. */
1647 #define FOR_EACH_DEP(INSN, LIST_TYPES, ITER, DEP) \
1648 for ((ITER) = sd_iterator_start ((INSN), (LIST_TYPES)); \
1649 sd_iterator_cond (&(ITER), &(DEP)); \
1650 sd_iterator_next (&(ITER)))
1652 #define IS_DISPATCH_ON 1
1653 #define IS_CMP 2
1654 #define DISPATCH_VIOLATION 3
1655 #define FITS_DISPATCH_WINDOW 4
1656 #define DISPATCH_INIT 5
1657 #define ADD_TO_DISPATCH_WINDOW 6
1659 extern int sd_lists_size (const_rtx, sd_list_types_def);
1660 extern bool sd_lists_empty_p (const_rtx, sd_list_types_def);
1661 extern void sd_init_insn (rtx_insn *);
1662 extern void sd_finish_insn (rtx_insn *);
1663 extern dep_t sd_find_dep_between (rtx, rtx, bool);
1664 extern void sd_add_dep (dep_t, bool);
1665 extern enum DEPS_ADJUST_RESULT sd_add_or_update_dep (dep_t, bool);
1666 extern void sd_resolve_dep (sd_iterator_def);
1667 extern void sd_unresolve_dep (sd_iterator_def);
1668 extern void sd_copy_back_deps (rtx_insn *, rtx_insn *, bool);
1669 extern void sd_delete_dep (sd_iterator_def);
1670 extern void sd_debug_lists (rtx, sd_list_types_def);
1672 /* Macros and declarations for scheduling fusion. */
1673 #define FUSION_MAX_PRIORITY (INT_MAX)
1674 extern bool sched_fusion;
1676 #endif /* INSN_SCHEDULING */
1678 #endif /* GCC_SCHED_INT_H */