1 ;; Goldmont(GLM) Scheduling
2 ;; Copyright (C) 2018 Free Software Foundation, Inc.
4 ;; This file is part of GCC.
6 ;; GCC is free software; you can redistribute it and/or modify
7 ;; it under the terms of the GNU General Public License as published by
8 ;; the Free Software Foundation; either version 3, or (at your option)
11 ;; GCC is distributed in the hope that it will be useful,
12 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
13 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 ;; GNU General Public License for more details.
16 ;; You should have received a copy of the GNU General Public License
17 ;; along with GCC; see the file COPYING3. If not see
18 ;; <http://www.gnu.org/licenses/>.
20 ;; Goldmont has 3 out-of-order IEC, 2 out-of--order FEC and out-of-order MEC.
23 (define_automaton "glm")
26 ;; Goldmont has 3 clusters - IEC, FPC, MEC
28 ;; IEC has three execution ports - IEC-0, IEC-1 and IEC-2.
29 ;; FPC has two execution ports - FPC-0 and FPC-1.
30 ;; MEC has two execution ports - MEC-0 (load) and MEC-1 (store0.
31 (define_cpu_unit "glm-iec-0,glm-iec-1,glm-iec-2" "glm")
32 (define_cpu_unit "glm-fec-0,glm-fec-1,glm-load,glm-store" "glm")
34 ;; Some EUs have duplicated copied and can be accessed via either ports 0, 1 or 2.
35 (define_reservation "glm-iec-any" "(glm-iec-0 | glm-iec-1 | glm-iec-2)")
36 (define_reservation "glm-iec-any-load" "(glm-iec-0|glm-iec-1|glm-iec-2)+glm-load")
37 (define_reservation "glm-iec-any-store" "(glm-iec-0|glm-iec-1|glm-iec-2)+glm-store")
38 (define_reservation "glm-iec-any-both" "(glm-iec-0 | glm-iec-1 | glm-iec-2) + glm-load + glm-store")
39 (define_reservation "glm-fec-all" "(glm-fec-0 + glm-fec-1)")
40 (define_reservation "glm-all" "(glm-iec-0+glm-iec-1+glm-iec-2)+(glm-fec-0+glm-fec-1)+(glm-load+glm-store)")
41 (define_reservation "glm-int-0" "glm-iec-0")
42 (define_reservation "glm-int-0-load" "glm-iec-0 + glm-load")
43 (define_reservation "glm-int-0-both" "glm-iec-0 + glm-load + glm-store")
44 (define_reservation "glm-int-1" "glm-iec-1")
45 (define_reservation "glm-int-1-mem" "glm-iec-1 + glm-load")
46 (define_reservation "glm-int-2" "glm-iec-2")
47 (define_reservation "glm-int-2-mem" "glm-iec-2 + glm-load")
48 (define_reservation "glm-fp-0" "glm-fec-0")
49 (define_reservation "glm-fec-any" "(glm-fec-0 | glm-fec-1)")
51 ;;; fmul insn can have 4 or 5 cycles latency for scalar and vector types.
52 (define_reservation "glm-fmul-4c" "glm-fec-0, nothing*3")
53 (define_reservation "glm-fmul-4c-mem" "glm-fec-0+glm-load, nothing*3")
54 (define_reservation "glm-fmul-5c" "glm-fec-0, nothing*4")
56 ;;; fadd has 3 cycles latency.
57 (define_reservation "glm-fadd-3c" "glm-fec-1, nothing*2")
58 (define_reservation "glm-fadd-3c-mem" "glm-fec-1+glm-load, nothing*2")
60 ;;; imul insn has 3 cycles latency for SI operands
61 (define_reservation "glm-imul-32" "glm-iec-1, nothing*2")
62 (define_reservation "glm-imul-mem-32"
63 "(glm-iec-1+glm-load), nothing*2")
64 ;;; imul has 5 cycles latency for DI operands with 1/2 tput
65 (define_reservation "glm-imul-64"
66 "glm-iec-1, glm-iec-1, nothing*3")
67 (define_reservation "glm-imul-mem-64"
68 "glm-iec-1+glm-load, glm-iec-1, nothing*3")
71 (define_insn_reservation "glm_other" 9
72 (and (eq_attr "cpu" "glm")
73 (and (eq_attr "type" "other")
74 (eq_attr "atom_unit" "!jeu")))
77 ;; return has type "other" with atom_unit "jeu"
78 (define_insn_reservation "glm_other_2" 1
79 (and (eq_attr "cpu" "glm")
80 (and (eq_attr "type" "other")
81 (eq_attr "atom_unit" "jeu")))
84 (define_insn_reservation "glm_multi" 9
85 (and (eq_attr "cpu" "glm")
86 (eq_attr "type" "multi"))
89 ;; Normal alu insns without carry
90 (define_insn_reservation "glm_alu" 1
91 (and (eq_attr "cpu" "glm")
92 (and (eq_attr "type" "alu")
93 (and (eq_attr "memory" "none")
94 (eq_attr "use_carry" "0"))))
97 ;; Normal alu insns without carry, but use MEC.
98 (define_insn_reservation "glm_alu_load" 1
99 (and (eq_attr "cpu" "glm")
100 (and (eq_attr "type" "alu")
101 (and (eq_attr "memory" "load")
102 (eq_attr "use_carry" "0"))))
105 (define_insn_reservation "glm_alu_mem" 1
106 (and (eq_attr "cpu" "glm")
107 (and (eq_attr "type" "alu")
108 (and (eq_attr "memory" "both")
109 (eq_attr "use_carry" "0"))))
113 ;; Alu insn consuming CF, such as add/sbb
114 (define_insn_reservation "glm_alu_carry" 2
115 (and (eq_attr "cpu" "glm")
116 (and (eq_attr "type" "alu")
117 (and (eq_attr "memory" "none")
118 (eq_attr "use_carry" "1"))))
119 "glm-int-2, nothing")
121 ;; Alu insn consuming CF, such as add/sbb
122 (define_insn_reservation "glm_alu_carry_mem" 2
123 (and (eq_attr "cpu" "glm")
124 (and (eq_attr "type" "alu")
125 (and (eq_attr "memory" "!none")
126 (eq_attr "use_carry" "1"))))
127 "glm-int-2-mem, nothing")
129 (define_insn_reservation "glm_alu1" 1
130 (and (eq_attr "cpu" "glm")
131 (and (eq_attr "type" "alu1")
132 (eq_attr "memory" "none") (eq_attr "prefix_0f" "0")))
136 (define_insn_reservation "glm_alu1_1" 10
137 (and (eq_attr "cpu" "glm")
138 (and (eq_attr "type" "alu1")
139 (eq_attr "memory" "none") (eq_attr "prefix_0f" "1")))
140 "glm-int-1*8,nothing*2")
142 (define_insn_reservation "glm_alu1_mem" 1
143 (and (eq_attr "cpu" "glm")
144 (and (eq_attr "type" "alu1")
145 (eq_attr "memory" "!none")))
148 (define_insn_reservation "glm_negnot" 1
149 (and (eq_attr "cpu" "glm")
150 (and (eq_attr "type" "negnot")
151 (eq_attr "memory" "none")))
154 (define_insn_reservation "glm_negnot_mem" 1
155 (and (eq_attr "cpu" "glm")
156 (and (eq_attr "type" "negnot")
157 (eq_attr "memory" "!none")))
160 (define_insn_reservation "glm_imov" 1
161 (and (eq_attr "cpu" "glm")
162 (and (eq_attr "type" "imov")
163 (eq_attr "memory" "none")))
166 (define_insn_reservation "glm_imov_load" 2
167 (and (eq_attr "cpu" "glm")
168 (and (eq_attr "type" "imov")
169 (eq_attr "memory" "load")))
170 "glm-iec-any-load,nothing")
172 (define_insn_reservation "glm_imov_store" 1
173 (and (eq_attr "cpu" "glm")
174 (and (eq_attr "type" "imov")
175 (eq_attr "memory" "store")))
179 (define_insn_reservation "glm_imovx" 1
180 (and (eq_attr "cpu" "glm")
181 (and (eq_attr "type" "imovx")
182 (and (eq_attr "memory" "none")
183 (ior (and (match_operand:HI 0 "register_operand")
184 (match_operand:HI 1 "general_operand"))
185 (and (match_operand:SI 0 "register_operand")
186 (match_operand:SI 1 "general_operand"))))))
189 ;; 16<-16, 32<-32, mem
190 (define_insn_reservation "glm_imovx_mem" 1
191 (and (eq_attr "cpu" "glm")
192 (and (eq_attr "type" "imovx")
193 (and (eq_attr "memory" "!none")
194 (ior (and (match_operand:HI 0 "register_operand")
195 (match_operand:HI 1 "general_operand"))
196 (and (match_operand:SI 0 "register_operand")
197 (match_operand:SI 1 "general_operand"))))))
201 ;; 32<-16, 32<-8, 64<-16, 64<-8, 64<-32, 8<-8
202 (define_insn_reservation "glm_imovx_2" 1
203 (and (eq_attr "cpu" "glm")
204 (and (eq_attr "type" "imovx")
205 (and (eq_attr "memory" "none")
206 (ior (match_operand:QI 0 "register_operand")
207 (ior (and (match_operand:SI 0 "register_operand")
208 (not (match_operand:SI 1 "general_operand")))
209 (match_operand:DI 0 "register_operand"))))))
212 ;; 32<-16, 32<-8, 64<-16, 64<-8, 64<-32, 8<-8, mem
213 (define_insn_reservation "glm_imovx_2_load" 2
214 (and (eq_attr "cpu" "glm")
215 (and (eq_attr "type" "imovx")
216 (and (eq_attr "memory" "load")
217 (ior (match_operand:QI 0 "register_operand")
218 (ior (and (match_operand:SI 0 "register_operand")
219 (not (match_operand:SI 1 "general_operand")))
220 (match_operand:DI 0 "register_operand"))))))
221 "glm-iec-any-load,nothing")
223 (define_insn_reservation "glm_imovx_2_mem" 1
224 (and (eq_attr "cpu" "glm")
225 (and (eq_attr "type" "imovx")
226 (and (eq_attr "memory" "!none")
227 (ior (match_operand:QI 0 "register_operand")
228 (ior (and (match_operand:SI 0 "register_operand")
229 (not (match_operand:SI 1 "general_operand")))
230 (match_operand:DI 0 "register_operand"))))))
235 (define_insn_reservation "glm_imovx_3" 3
236 (and (eq_attr "cpu" "glm")
237 (and (eq_attr "type" "imovx")
238 (and (match_operand:HI 0 "register_operand")
239 (match_operand:QI 1 "general_operand"))))
240 "glm-int-0, nothing*2")
242 (define_insn_reservation "glm_lea" 1
243 (and (eq_attr "cpu" "glm")
244 (and (eq_attr "type" "lea")
245 (eq_attr "mode" "!HI")))
248 ;; lea 16bit address is complex insn
249 (define_insn_reservation "glm_lea_2" 2
250 (and (eq_attr "cpu" "glm")
251 (and (eq_attr "type" "lea")
252 (eq_attr "mode" "HI")))
255 (define_insn_reservation "glm_incdec" 1
256 (and (eq_attr "cpu" "glm")
257 (and (eq_attr "type" "incdec")
258 (eq_attr "memory" "none")))
261 (define_insn_reservation "glm_incdec_mem" 3
262 (and (eq_attr "cpu" "glm")
263 (and (eq_attr "type" "incdec")
264 (eq_attr "memory" "!none")))
265 "glm-int-0-both, nothing*2")
267 ;; simple shift instruction use SHIFT eu, none memory
268 (define_insn_reservation "glm_ishift" 1
269 (and (eq_attr "cpu" "glm")
270 (and (eq_attr "type" "ishift")
271 (and (eq_attr "memory" "none") (eq_attr "prefix_0f" "0"))))
274 ;; simple shift instruction use SHIFT eu, memory
275 (define_insn_reservation "glm_ishift_mem" 2
276 (and (eq_attr "cpu" "glm")
277 (and (eq_attr "type" "ishift")
278 (and (eq_attr "memory" "!none") (eq_attr "prefix_0f" "0"))))
279 "glm-int-0-both,nothing")
281 ;; DF shift (prefixed with 0f) is complex insn with latency of 4 cycles
282 (define_insn_reservation "glm_ishift_3" 4
283 (and (eq_attr "cpu" "glm")
284 (and (eq_attr "type" "ishift")
285 (eq_attr "prefix_0f" "1")))
288 (define_insn_reservation "glm_ishift1" 1
289 (and (eq_attr "cpu" "glm")
290 (and (eq_attr "type" "ishift1")
291 (eq_attr "memory" "none")))
294 (define_insn_reservation "glm_ishift1_mem" 2
295 (and (eq_attr "cpu" "glm")
296 (and (eq_attr "type" "ishift1")
297 (eq_attr "memory" "!none")))
298 "glm-int-0-both,nothing")
300 (define_insn_reservation "glm_rotate" 1
301 (and (eq_attr "cpu" "glm")
302 (and (eq_attr "type" "rotate")
303 (eq_attr "memory" "none")))
306 (define_insn_reservation "glm_rotate_mem" 2
307 (and (eq_attr "cpu" "glm")
308 (and (eq_attr "type" "rotate")
309 (eq_attr "memory" "!none")))
310 "glm-int-0-both,nothing")
312 (define_insn_reservation "glm_imul" 3
313 (and (eq_attr "cpu" "glm")
314 (and (eq_attr "type" "imul")
315 (and (eq_attr "memory" "none") (eq_attr "mode" "SI"))))
318 (define_insn_reservation "glm_imul_load" 3
319 (and (eq_attr "cpu" "glm")
320 (and (eq_attr "type" "imul")
321 (and (eq_attr "memory" "!none") (eq_attr "mode" "SI"))))
325 ;; latency set to 5 as common 64x64 imul with 1/2 tput
326 (define_insn_reservation "glm_imul64" 5
327 (and (eq_attr "cpu" "glm")
328 (and (eq_attr "type" "imul")
329 (and (eq_attr "memory" "none") (eq_attr "mode" "!SI"))))
332 (define_insn_reservation "glm_imul64-load" 5
333 (and (eq_attr "cpu" "glm")
334 (and (eq_attr "type" "imul")
335 (and (eq_attr "memory" "!none") (eq_attr "mode" "!SI"))))
338 (define_insn_reservation "glm_idiv" 25
339 (and (eq_attr "cpu" "glm")
340 (eq_attr "type" "idiv"))
341 "glm-all*16, nothing*9")
343 (define_insn_reservation "glm_icmp" 1
344 (and (eq_attr "cpu" "glm")
345 (and (eq_attr "type" "icmp")
346 (eq_attr "memory" "none")))
349 (define_insn_reservation "glm_icmp_mem" 2
350 (and (eq_attr "cpu" "glm")
351 (and (eq_attr "type" "icmp")
352 (eq_attr "memory" "!none")))
353 "glm-int-0-load,nothing")
355 (define_insn_reservation "glm_test" 1
356 (and (eq_attr "cpu" "glm")
357 (and (eq_attr "type" "test")
358 (eq_attr "memory" "none")))
361 (define_insn_reservation "glm_test_mem" 2
362 (and (eq_attr "cpu" "glm")
363 (and (eq_attr "type" "test")
364 (eq_attr "memory" "!none")))
365 "glm-int-0-load,nothing")
367 (define_insn_reservation "glm_ibr" 1
368 (and (eq_attr "cpu" "glm")
369 (and (eq_attr "type" "ibr")
370 (eq_attr "memory" "!load")))
373 ;; complex if jump target is from address
374 (define_insn_reservation "glm_ibr_2" 2
375 (and (eq_attr "cpu" "glm")
376 (and (eq_attr "type" "ibr")
377 (eq_attr "memory" "load")))
380 (define_insn_reservation "glm_setcc" 1
381 (and (eq_attr "cpu" "glm")
382 (and (eq_attr "type" "setcc")
383 (eq_attr "memory" "!store")))
386 ;; 2 cycles complex if target is in memory
387 (define_insn_reservation "glm_setcc_2" 2
388 (and (eq_attr "cpu" "glm")
389 (and (eq_attr "type" "setcc")
390 (eq_attr "memory" "store")))
393 (define_insn_reservation "glm_icmov" 2
394 (and (eq_attr "cpu" "glm")
395 (and (eq_attr "type" "icmov")
396 (eq_attr "memory" "none")))
397 "glm-iec-any, nothing")
399 (define_insn_reservation "glm_icmov_mem" 2
400 (and (eq_attr "cpu" "glm")
401 (and (eq_attr "type" "icmov")
402 (eq_attr "memory" "!none")))
403 "glm-int-0-load, nothing")
405 ;; UCODE if segreg, ignored
406 (define_insn_reservation "glm_push" 2
407 (and (eq_attr "cpu" "glm")
408 (eq_attr "type" "push"))
409 "(glm-int-1+glm-int-2)*2")
411 ;; pop r64 is 1 cycle. UCODE if segreg, ignored
412 (define_insn_reservation "glm_pop" 1
413 (and (eq_attr "cpu" "glm")
414 (and (eq_attr "type" "pop")
415 (eq_attr "mode" "DI")))
416 "glm-int-1+glm-int-2")
418 ;; pop non-r64 is 2 cycles. UCODE if segreg, ignored
419 (define_insn_reservation "glm_pop_2" 2
420 (and (eq_attr "cpu" "glm")
421 (and (eq_attr "type" "pop")
422 (eq_attr "mode" "!DI")))
423 "(glm-int-1+glm-int-2)*2")
425 ;; UCODE if segreg, ignored
426 (define_insn_reservation "glm_call" 1
427 (and (eq_attr "cpu" "glm")
428 (eq_attr "type" "call,callv"))
429 "(glm-int-0+glm-int-1)")
431 (define_insn_reservation "glm_leave" 3
432 (and (eq_attr "cpu" "glm")
433 (eq_attr "type" "leave"))
436 (define_insn_reservation "glm_str" 3
437 (and (eq_attr "cpu" "glm")
438 (eq_attr "type" "str"))
441 (define_insn_reservation "glm_sselog" 1
442 (and (eq_attr "cpu" "glm")
443 (and (eq_attr "type" "sselog")
444 (eq_attr "memory" "none")))
447 (define_insn_reservation "glm_sselog_mem" 1
448 (and (eq_attr "cpu" "glm")
449 (and (eq_attr "type" "sselog")
450 (eq_attr "memory" "!none")))
451 "glm-fec-all+glm-load")
453 (define_insn_reservation "glm_sselog1" 1
454 (and (eq_attr "cpu" "glm")
455 (and (eq_attr "type" "sselog1")
456 (eq_attr "memory" "none")))
459 (define_insn_reservation "glm_sselog1_mem" 1
460 (and (eq_attr "cpu" "glm")
461 (and (eq_attr "type" "sselog1")
462 (eq_attr "memory" "!none")))
465 ;; not pmad, not psad
466 (define_insn_reservation "glm_sseiadd" 3
467 (and (eq_attr "cpu" "glm")
468 (and (eq_attr "type" "sseiadd")
469 (and (not (match_operand:V2DI 0 "register_operand"))
470 (and (eq_attr "atom_unit" "!simul")
471 (eq_attr "atom_unit" "!complex")))))
475 (define_insn_reservation "glm_sseiadd_2" 4
476 (and (eq_attr "cpu" "glm")
477 (and (eq_attr "type" "sseiadd")
478 (and (not (match_operand:V2DI 0 "register_operand"))
479 (and (eq_attr "atom_unit" "simul")
480 (eq_attr "mode" "DI,TI")))))
483 ;; if paddq(64 bit op), phadd/phsub
484 (define_insn_reservation "glm_sseiadd_3" 5
485 (and (eq_attr "cpu" "glm")
486 (and (eq_attr "type" "sseiadd")
487 (ior (match_operand:V2DI 0 "register_operand")
488 (eq_attr "atom_unit" "complex"))))
492 (define_insn_reservation "glm_sseishft" 2
493 (and (eq_attr "cpu" "glm")
494 (and (eq_attr "type" "sseishft")
495 (match_operand 2 "immediate_operand")))
498 (define_insn_reservation "glm_sseimul" 4
499 (and (eq_attr "cpu" "glm")
500 (and (eq_attr "type" "sseimul")
501 (eq_attr "memory" "none")))
504 (define_insn_reservation "glm_sseimul_load" 4
505 (and (eq_attr "cpu" "glm")
506 (and (eq_attr "type" "sseimul")
507 (eq_attr "memory" "!none")))
512 (define_insn_reservation "glm_sse" 4
513 (and (eq_attr "cpu" "glm")
514 (and (eq_attr "type" "sse")
515 (and (eq_attr "atom_sse_attr" "rcp") (eq_attr "mode" "SF"))))
518 ;; movshdup, movsldup. Suggest to type sseishft
519 (define_insn_reservation "glm_sse_2" 1
520 (and (eq_attr "cpu" "glm")
521 (and (eq_attr "type" "sse")
522 (eq_attr "atom_sse_attr" "movdup")))
526 (define_insn_reservation "glm_sse_3" 1
527 (and (eq_attr "cpu" "glm")
528 (and (eq_attr "type" "sse")
529 (eq_attr "atom_sse_attr" "lfence")))
532 ;; sfence,clflush,mfence, prefetch
533 (define_insn_reservation "glm_sse_4" 1
534 (and (eq_attr "cpu" "glm")
535 (and (eq_attr "type" "sse")
536 (ior (eq_attr "atom_sse_attr" "fence")
537 (eq_attr "atom_sse_attr" "prefetch"))))
540 ;; rcpps, rsqrtss, sqrt, ldmxcsr
541 (define_insn_reservation "glm_sse_5" 9
542 (and (eq_attr "cpu" "glm")
543 (and (eq_attr "type" "sse")
544 (ior (ior (eq_attr "atom_sse_attr" "sqrt")
545 (eq_attr "atom_sse_attr" "mxcsr"))
546 (and (eq_attr "atom_sse_attr" "rcp")
547 (eq_attr "mode" "V4SF")))))
548 "glm-fec-all*6, nothing*3")
551 (define_insn_reservation "glm_ssemov" 1
552 (and (eq_attr "cpu" "glm")
553 (and (eq_attr "type" "ssemov")
554 (and (match_operand 0 "register_operand" "xy")
555 (match_operand 1 "register_operand" "xy"))))
559 (define_insn_reservation "glm_ssemov_2" 1
560 (and (eq_attr "cpu" "glm")
561 (and (eq_attr "type" "ssemov")
562 (and (match_operand 0 "register_operand" "xy")
563 (match_operand 1 "register_operand" "r"))))
567 (define_insn_reservation "glm_ssemov_3" 3
568 (and (eq_attr "cpu" "glm")
569 (and (eq_attr "type" "ssemov")
570 (and (match_operand 0 "register_operand" "r")
571 (match_operand 1 "register_operand" "xy"))))
572 "glm-fp-0, nothing*2")
575 (define_insn_reservation "glm_ssemov_load" 2
576 (and (eq_attr "cpu" "glm")
577 (and (eq_attr "type" "ssemov")
578 (eq_attr "memory" "load")))
579 "glm-fec-any+glm-load,nothing")
581 (define_insn_reservation "glm_ssemov_store" 1
582 (and (eq_attr "cpu" "glm")
583 (and (eq_attr "type" "ssemov")
584 (eq_attr "memory" "store")))
585 "glm-fec-any+glm-store")
588 (define_insn_reservation "glm_sseadd" 3
589 (and (eq_attr "cpu" "glm")
590 (and (eq_attr "type" "sseadd")
591 (eq_attr "memory" "none")))
595 (define_insn_reservation "glm_sseadd_mem" 3
596 (and (eq_attr "cpu" "glm")
597 (and (eq_attr "type" "sseadd")
598 (eq_attr "memory" "!none")))
602 (define_insn_reservation "glm_ssemul" 4
603 (and (eq_attr "cpu" "glm")
604 (and (eq_attr "type" "ssemul")
605 (eq_attr "memory" "none")))
608 (define_insn_reservation "glm_ssemul_mem" 4
609 (and (eq_attr "cpu" "glm")
610 (and (eq_attr "type" "ssemul")
611 (eq_attr "memory" "!none")))
614 (define_insn_reservation "glm_ssecmp" 1
615 (and (eq_attr "cpu" "glm")
616 (eq_attr "type" "ssecmp"))
619 (define_insn_reservation "glm_ssecomi" 1
620 (and (eq_attr "cpu" "glm")
621 (eq_attr "type" "ssecomi"))
624 ;; no memory and cvtpi2ps, cvtps2pi, cvttps2pi
625 (define_insn_reservation "glm_ssecvt" 4
626 (and (eq_attr "cpu" "glm")
627 (and (eq_attr "type" "ssecvt")
628 (ior (and (match_operand:V2SI 0 "register_operand")
629 (match_operand:V4SF 1 "register_operand"))
630 (and (match_operand:V4SF 0 "register_operand")
631 (match_operand:V2SI 1 "register_operand")))))
632 "glm-fp-0, nothing*3")
634 ;; memory and cvtpi2ps, cvtps2pi, cvttps2pi
635 (define_insn_reservation "glm_ssecvt_mem" 4
636 (and (eq_attr "cpu" "glm")
637 (and (eq_attr "type" "ssecvt")
638 (ior (and (match_operand:V2SI 0 "register_operand")
639 (match_operand:V4SF 1 "memory_operand"))
640 (and (match_operand:V4SF 0 "register_operand")
641 (match_operand:V2SI 1 "memory_operand")))))
642 "glm-fp-0+glm-load, nothing*3")
644 ;; memory and cvtsi2sd
645 (define_insn_reservation "glm_sseicvt" 1
646 (and (eq_attr "cpu" "glm")
647 (and (eq_attr "type" "sseicvt")
648 (and (match_operand:V2DF 0 "register_operand")
649 (match_operand:SI 1 "nonimmediate_operand"))))
652 ;; otherwise. 8 cycles average for cvtsd2si
653 (define_insn_reservation "glm_sseicvt_2" 4
654 (and (eq_attr "cpu" "glm")
655 (and (eq_attr "type" "sseicvt")
656 (not (and (match_operand:V2DF 0 "register_operand")
657 (match_operand:SI 1 "memory_operand")))))
658 "glm-fp-0, nothing*3")
660 (define_insn_reservation "glm_ssediv" 13
661 (and (eq_attr "cpu" "glm")
662 (eq_attr "type" "ssediv"))
663 "glm-fec-all*12, nothing")
666 (define_insn_reservation "glm_fmov" 1
667 (and (eq_attr "cpu" "glm")
668 (and (eq_attr "type" "fmov")
669 (eq_attr "memory" "none")))
673 (define_insn_reservation "glm_fmov_load" 3
674 (and (eq_attr "cpu" "glm")
675 (and (eq_attr "type" "fmov")
676 (eq_attr "memory" "load")))
677 "glm-fec-any+glm-load, nothing*2")
679 (define_insn_reservation "glm_fmov_store" 1
680 (and (eq_attr "cpu" "glm")
681 (and (eq_attr "type" "fmov")
682 (eq_attr "memory" "store")))
683 "glm-fec-any+glm-store")
685 ;; Define bypass here
687 ;; There will be 0 cycle stall from cmp/test to jcc
689 ;; There will be 1 cycle stall from flag producer to cmov and adc/sbb
690 (define_bypass 2 "glm_icmp, glm_test, glm_alu, glm_alu_carry,
691 glm_alu1, glm_negnot, glm_incdec, glm_ishift,
692 glm_ishift1, glm_rotate"
693 "glm_icmov, glm_alu_carry")
695 ;; lea to shift source stall is 1 cycle
696 (define_bypass 2 "glm_lea"
697 "glm_ishift, glm_ishift1, glm_rotate"
698 "!ix86_dep_by_shift_count")
700 ;; non-lea to shift count stall is 1 cycle
701 (define_bypass 2 "glm_alu_carry,
702 glm_alu,glm_alu1,glm_negnot,glm_imov,glm_imovx,
703 glm_incdec,glm_ishift,glm_ishift1,glm_rotate,
704 glm_setcc, glm_icmov, glm_pop, glm_imov_store,
705 glm_alu_mem, glm_alu_carry_mem, glm_alu1_mem,
706 glm_alu_load, glm_imovx_mem, glm_imovx_2_mem,
707 glm_imov_load, glm_icmov_mem, glm_fmov_load, glm_fmov_store"
708 "glm_ishift, glm_ishift1, glm_rotate,
709 glm_ishift_mem, glm_ishift1_mem,
711 "ix86_dep_by_shift_count")