1 |
709 |
jeremybenn |
;; GCC machine description for IA-32 and x86-64.
|
2 |
|
|
;; Copyright (C) 1988, 1994, 1995, 1996, 1997, 1998, 1999, 2000,
|
3 |
|
|
;; 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012
|
4 |
|
|
;; Free Software Foundation, Inc.
|
5 |
|
|
;; Mostly by William Schelter.
|
6 |
|
|
;; x86_64 support added by Jan Hubicka
|
7 |
|
|
;;
|
8 |
|
|
;; This file is part of GCC.
|
9 |
|
|
;;
|
10 |
|
|
;; GCC is free software; you can redistribute it and/or modify
|
11 |
|
|
;; it under the terms of the GNU General Public License as published by
|
12 |
|
|
;; the Free Software Foundation; either version 3, or (at your option)
|
13 |
|
|
;; any later version.
|
14 |
|
|
;;
|
15 |
|
|
;; GCC is distributed in the hope that it will be useful,
|
16 |
|
|
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
|
17 |
|
|
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
18 |
|
|
;; GNU General Public License for more details.
|
19 |
|
|
;;
|
20 |
|
|
;; You should have received a copy of the GNU General Public License
|
21 |
|
|
;; along with GCC; see the file COPYING3. If not see
|
22 |
|
|
;; . */
|
23 |
|
|
;;
|
24 |
|
|
;; The original PO technology requires these to be ordered by speed,
|
25 |
|
|
;; so that assigner will pick the fastest.
|
26 |
|
|
;;
|
27 |
|
|
;; See file "rtl.def" for documentation on define_insn, match_*, et. al.
|
28 |
|
|
;;
|
29 |
|
|
;; The special asm out single letter directives following a '%' are:
|
30 |
|
|
;; L,W,B,Q,S,T -- print the opcode suffix for specified size of operand.
|
31 |
|
|
;; C -- print opcode suffix for set/cmov insn.
|
32 |
|
|
;; c -- like C, but print reversed condition
|
33 |
|
|
;; F,f -- likewise, but for floating-point.
|
34 |
|
|
;; O -- if HAVE_AS_IX86_CMOV_SUN_SYNTAX, expand to "w.", "l." or "q.",
|
35 |
|
|
;; otherwise nothing
|
36 |
|
|
;; R -- print the prefix for register names.
|
37 |
|
|
;; z -- print the opcode suffix for the size of the current operand.
|
38 |
|
|
;; Z -- likewise, with special suffixes for x87 instructions.
|
39 |
|
|
;; * -- print a star (in certain assembler syntax)
|
40 |
|
|
;; A -- print an absolute memory reference.
|
41 |
|
|
;; w -- print the operand as if it's a "word" (HImode) even if it isn't.
|
42 |
|
|
;; s -- print a shift double count, followed by the assemblers argument
|
43 |
|
|
;; delimiter.
|
44 |
|
|
;; b -- print the QImode name of the register for the indicated operand.
|
45 |
|
|
;; %b0 would print %al if operands[0] is reg 0.
|
46 |
|
|
;; w -- likewise, print the HImode name of the register.
|
47 |
|
|
;; k -- likewise, print the SImode name of the register.
|
48 |
|
|
;; q -- likewise, print the DImode name of the register.
|
49 |
|
|
;; x -- likewise, print the V4SFmode name of the register.
|
50 |
|
|
;; t -- likewise, print the V8SFmode name of the register.
|
51 |
|
|
;; h -- print the QImode name for a "high" register, either ah, bh, ch or dh.
|
52 |
|
|
;; y -- print "st(0)" instead of "st" as a register.
|
53 |
|
|
;; d -- print duplicated register operand for AVX instruction.
|
54 |
|
|
;; D -- print condition for SSE cmp instruction.
|
55 |
|
|
;; P -- if PIC, print an @PLT suffix.
|
56 |
|
|
;; p -- print raw symbol name.
|
57 |
|
|
;; X -- don't print any sort of PIC '@' suffix for a symbol.
|
58 |
|
|
;; & -- print some in-use local-dynamic symbol name.
|
59 |
|
|
;; H -- print a memory address offset by 8; used for sse high-parts
|
60 |
|
|
;; Y -- print condition for XOP pcom* instruction.
|
61 |
|
|
;; + -- print a branch hint as 'cs' or 'ds' prefix
|
62 |
|
|
;; ; -- print a semicolon (after prefixes due to bug in older gas).
|
63 |
|
|
;; @ -- print a segment register of thread base pointer load
|
64 |
|
|
|
65 |
|
|
(define_c_enum "unspec" [
|
66 |
|
|
;; Relocation specifiers
|
67 |
|
|
UNSPEC_GOT
|
68 |
|
|
UNSPEC_GOTOFF
|
69 |
|
|
UNSPEC_GOTPCREL
|
70 |
|
|
UNSPEC_GOTTPOFF
|
71 |
|
|
UNSPEC_TPOFF
|
72 |
|
|
UNSPEC_NTPOFF
|
73 |
|
|
UNSPEC_DTPOFF
|
74 |
|
|
UNSPEC_GOTNTPOFF
|
75 |
|
|
UNSPEC_INDNTPOFF
|
76 |
|
|
UNSPEC_PLTOFF
|
77 |
|
|
UNSPEC_MACHOPIC_OFFSET
|
78 |
|
|
UNSPEC_PCREL
|
79 |
|
|
|
80 |
|
|
;; Prologue support
|
81 |
|
|
UNSPEC_STACK_ALLOC
|
82 |
|
|
UNSPEC_SET_GOT
|
83 |
|
|
UNSPEC_REG_SAVE
|
84 |
|
|
UNSPEC_DEF_CFA
|
85 |
|
|
UNSPEC_SET_RIP
|
86 |
|
|
UNSPEC_SET_GOT_OFFSET
|
87 |
|
|
UNSPEC_MEMORY_BLOCKAGE
|
88 |
|
|
UNSPEC_STACK_CHECK
|
89 |
|
|
|
90 |
|
|
;; TLS support
|
91 |
|
|
UNSPEC_TP
|
92 |
|
|
UNSPEC_TLS_GD
|
93 |
|
|
UNSPEC_TLS_LD_BASE
|
94 |
|
|
UNSPEC_TLSDESC
|
95 |
|
|
UNSPEC_TLS_IE_SUN
|
96 |
|
|
|
97 |
|
|
;; Other random patterns
|
98 |
|
|
UNSPEC_SCAS
|
99 |
|
|
UNSPEC_FNSTSW
|
100 |
|
|
UNSPEC_SAHF
|
101 |
|
|
UNSPEC_PARITY
|
102 |
|
|
UNSPEC_FSTCW
|
103 |
|
|
UNSPEC_ADD_CARRY
|
104 |
|
|
UNSPEC_FLDCW
|
105 |
|
|
UNSPEC_REP
|
106 |
|
|
UNSPEC_LD_MPIC ; load_macho_picbase
|
107 |
|
|
UNSPEC_TRUNC_NOOP
|
108 |
|
|
UNSPEC_DIV_ALREADY_SPLIT
|
109 |
|
|
UNSPEC_MS_TO_SYSV_CALL
|
110 |
|
|
UNSPEC_CALL_NEEDS_VZEROUPPER
|
111 |
|
|
UNSPEC_PAUSE
|
112 |
|
|
|
113 |
|
|
;; For SSE/MMX support:
|
114 |
|
|
UNSPEC_FIX_NOTRUNC
|
115 |
|
|
UNSPEC_MASKMOV
|
116 |
|
|
UNSPEC_MOVMSK
|
117 |
|
|
UNSPEC_RCP
|
118 |
|
|
UNSPEC_RSQRT
|
119 |
|
|
UNSPEC_PSADBW
|
120 |
|
|
|
121 |
|
|
;; Generic math support
|
122 |
|
|
UNSPEC_COPYSIGN
|
123 |
|
|
UNSPEC_IEEE_MIN ; not commutative
|
124 |
|
|
UNSPEC_IEEE_MAX ; not commutative
|
125 |
|
|
|
126 |
|
|
;; x87 Floating point
|
127 |
|
|
UNSPEC_SIN
|
128 |
|
|
UNSPEC_COS
|
129 |
|
|
UNSPEC_FPATAN
|
130 |
|
|
UNSPEC_FYL2X
|
131 |
|
|
UNSPEC_FYL2XP1
|
132 |
|
|
UNSPEC_FRNDINT
|
133 |
|
|
UNSPEC_FIST
|
134 |
|
|
UNSPEC_F2XM1
|
135 |
|
|
UNSPEC_TAN
|
136 |
|
|
UNSPEC_FXAM
|
137 |
|
|
|
138 |
|
|
;; x87 Rounding
|
139 |
|
|
UNSPEC_FRNDINT_FLOOR
|
140 |
|
|
UNSPEC_FRNDINT_CEIL
|
141 |
|
|
UNSPEC_FRNDINT_TRUNC
|
142 |
|
|
UNSPEC_FRNDINT_MASK_PM
|
143 |
|
|
UNSPEC_FIST_FLOOR
|
144 |
|
|
UNSPEC_FIST_CEIL
|
145 |
|
|
|
146 |
|
|
;; x87 Double output FP
|
147 |
|
|
UNSPEC_SINCOS_COS
|
148 |
|
|
UNSPEC_SINCOS_SIN
|
149 |
|
|
UNSPEC_XTRACT_FRACT
|
150 |
|
|
UNSPEC_XTRACT_EXP
|
151 |
|
|
UNSPEC_FSCALE_FRACT
|
152 |
|
|
UNSPEC_FSCALE_EXP
|
153 |
|
|
UNSPEC_FPREM_F
|
154 |
|
|
UNSPEC_FPREM_U
|
155 |
|
|
UNSPEC_FPREM1_F
|
156 |
|
|
UNSPEC_FPREM1_U
|
157 |
|
|
|
158 |
|
|
UNSPEC_C2_FLAG
|
159 |
|
|
UNSPEC_FXAM_MEM
|
160 |
|
|
|
161 |
|
|
;; SSP patterns
|
162 |
|
|
UNSPEC_SP_SET
|
163 |
|
|
UNSPEC_SP_TEST
|
164 |
|
|
UNSPEC_SP_TLS_SET
|
165 |
|
|
UNSPEC_SP_TLS_TEST
|
166 |
|
|
|
167 |
|
|
;; For ROUND support
|
168 |
|
|
UNSPEC_ROUND
|
169 |
|
|
|
170 |
|
|
;; For CRC32 support
|
171 |
|
|
UNSPEC_CRC32
|
172 |
|
|
|
173 |
|
|
;; For RDRAND support
|
174 |
|
|
UNSPEC_RDRAND
|
175 |
|
|
|
176 |
|
|
;; For BMI support
|
177 |
|
|
UNSPEC_BEXTR
|
178 |
|
|
|
179 |
|
|
;; For BMI2 support
|
180 |
|
|
UNSPEC_PDEP
|
181 |
|
|
UNSPEC_PEXT
|
182 |
|
|
])
|
183 |
|
|
|
184 |
|
|
(define_c_enum "unspecv" [
|
185 |
|
|
UNSPECV_BLOCKAGE
|
186 |
|
|
UNSPECV_STACK_PROBE
|
187 |
|
|
UNSPECV_PROBE_STACK_RANGE
|
188 |
|
|
UNSPECV_ALIGN
|
189 |
|
|
UNSPECV_PROLOGUE_USE
|
190 |
|
|
UNSPECV_SPLIT_STACK_RETURN
|
191 |
|
|
UNSPECV_CLD
|
192 |
|
|
UNSPECV_NOPS
|
193 |
|
|
UNSPECV_RDTSC
|
194 |
|
|
UNSPECV_RDTSCP
|
195 |
|
|
UNSPECV_RDPMC
|
196 |
|
|
UNSPECV_LLWP_INTRINSIC
|
197 |
|
|
UNSPECV_SLWP_INTRINSIC
|
198 |
|
|
UNSPECV_LWPVAL_INTRINSIC
|
199 |
|
|
UNSPECV_LWPINS_INTRINSIC
|
200 |
|
|
UNSPECV_RDFSBASE
|
201 |
|
|
UNSPECV_RDGSBASE
|
202 |
|
|
UNSPECV_WRFSBASE
|
203 |
|
|
UNSPECV_WRGSBASE
|
204 |
|
|
])
|
205 |
|
|
|
206 |
|
|
;; Constants to represent rounding modes in the ROUND instruction
|
207 |
|
|
(define_constants
|
208 |
|
|
[(ROUND_FLOOR 0x1)
|
209 |
|
|
(ROUND_CEIL 0x2)
|
210 |
|
|
(ROUND_TRUNC 0x3)
|
211 |
|
|
(ROUND_MXCSR 0x4)
|
212 |
|
|
(ROUND_NO_EXC 0x8)
|
213 |
|
|
])
|
214 |
|
|
|
215 |
|
|
;; Constants to represent pcomtrue/pcomfalse variants
|
216 |
|
|
(define_constants
|
217 |
|
|
[(PCOM_FALSE 0)
|
218 |
|
|
(PCOM_TRUE 1)
|
219 |
|
|
(COM_FALSE_S 2)
|
220 |
|
|
(COM_FALSE_P 3)
|
221 |
|
|
(COM_TRUE_S 4)
|
222 |
|
|
(COM_TRUE_P 5)
|
223 |
|
|
])
|
224 |
|
|
|
225 |
|
|
;; Constants used in the XOP pperm instruction
|
226 |
|
|
(define_constants
|
227 |
|
|
[(PPERM_SRC 0x00) /* copy source */
|
228 |
|
|
(PPERM_INVERT 0x20) /* invert source */
|
229 |
|
|
(PPERM_REVERSE 0x40) /* bit reverse source */
|
230 |
|
|
(PPERM_REV_INV 0x60) /* bit reverse & invert src */
|
231 |
|
|
(PPERM_ZERO 0x80) /* all 0's */
|
232 |
|
|
(PPERM_ONES 0xa0) /* all 1's */
|
233 |
|
|
(PPERM_SIGN 0xc0) /* propagate sign bit */
|
234 |
|
|
(PPERM_INV_SIGN 0xe0) /* invert & propagate sign */
|
235 |
|
|
(PPERM_SRC1 0x00) /* use first source byte */
|
236 |
|
|
(PPERM_SRC2 0x10) /* use second source byte */
|
237 |
|
|
])
|
238 |
|
|
|
239 |
|
|
;; Registers by name.
|
240 |
|
|
(define_constants
|
241 |
|
|
[(AX_REG 0)
|
242 |
|
|
(DX_REG 1)
|
243 |
|
|
(CX_REG 2)
|
244 |
|
|
(BX_REG 3)
|
245 |
|
|
(SI_REG 4)
|
246 |
|
|
(DI_REG 5)
|
247 |
|
|
(BP_REG 6)
|
248 |
|
|
(SP_REG 7)
|
249 |
|
|
(ST0_REG 8)
|
250 |
|
|
(ST1_REG 9)
|
251 |
|
|
(ST2_REG 10)
|
252 |
|
|
(ST3_REG 11)
|
253 |
|
|
(ST4_REG 12)
|
254 |
|
|
(ST5_REG 13)
|
255 |
|
|
(ST6_REG 14)
|
256 |
|
|
(ST7_REG 15)
|
257 |
|
|
(FLAGS_REG 17)
|
258 |
|
|
(FPSR_REG 18)
|
259 |
|
|
(FPCR_REG 19)
|
260 |
|
|
(XMM0_REG 21)
|
261 |
|
|
(XMM1_REG 22)
|
262 |
|
|
(XMM2_REG 23)
|
263 |
|
|
(XMM3_REG 24)
|
264 |
|
|
(XMM4_REG 25)
|
265 |
|
|
(XMM5_REG 26)
|
266 |
|
|
(XMM6_REG 27)
|
267 |
|
|
(XMM7_REG 28)
|
268 |
|
|
(MM0_REG 29)
|
269 |
|
|
(MM1_REG 30)
|
270 |
|
|
(MM2_REG 31)
|
271 |
|
|
(MM3_REG 32)
|
272 |
|
|
(MM4_REG 33)
|
273 |
|
|
(MM5_REG 34)
|
274 |
|
|
(MM6_REG 35)
|
275 |
|
|
(MM7_REG 36)
|
276 |
|
|
(R8_REG 37)
|
277 |
|
|
(R9_REG 38)
|
278 |
|
|
(R10_REG 39)
|
279 |
|
|
(R11_REG 40)
|
280 |
|
|
(R12_REG 41)
|
281 |
|
|
(R13_REG 42)
|
282 |
|
|
(XMM8_REG 45)
|
283 |
|
|
(XMM9_REG 46)
|
284 |
|
|
(XMM10_REG 47)
|
285 |
|
|
(XMM11_REG 48)
|
286 |
|
|
(XMM12_REG 49)
|
287 |
|
|
(XMM13_REG 50)
|
288 |
|
|
(XMM14_REG 51)
|
289 |
|
|
(XMM15_REG 52)
|
290 |
|
|
])
|
291 |
|
|
|
292 |
|
|
;; Insns whose names begin with "x86_" are emitted by gen_FOO calls
|
293 |
|
|
;; from i386.c.
|
294 |
|
|
|
295 |
|
|
;; In C guard expressions, put expressions which may be compile-time
|
296 |
|
|
;; constants first. This allows for better optimization. For
|
297 |
|
|
;; example, write "TARGET_64BIT && reload_completed", not
|
298 |
|
|
;; "reload_completed && TARGET_64BIT".
|
299 |
|
|
|
300 |
|
|
|
301 |
|
|
;; Processor type.
|
302 |
|
|
(define_attr "cpu" "none,pentium,pentiumpro,geode,k6,athlon,k8,core2,corei7,
|
303 |
|
|
atom,generic64,amdfam10,bdver1,bdver2,btver1"
|
304 |
|
|
(const (symbol_ref "ix86_schedule")))
|
305 |
|
|
|
306 |
|
|
;; A basic instruction type. Refinements due to arguments to be
|
307 |
|
|
;; provided in other attributes.
|
308 |
|
|
(define_attr "type"
|
309 |
|
|
"other,multi,
|
310 |
|
|
alu,alu1,negnot,imov,imovx,lea,
|
311 |
|
|
incdec,ishift,ishiftx,ishift1,rotate,rotatex,rotate1,imul,imulx,idiv,
|
312 |
|
|
icmp,test,ibr,setcc,icmov,
|
313 |
|
|
push,pop,call,callv,leave,
|
314 |
|
|
str,bitmanip,
|
315 |
|
|
fmov,fop,fsgn,fmul,fdiv,fpspc,fcmov,fcmp,fxch,fistp,fisttp,frndint,
|
316 |
|
|
sselog,sselog1,sseiadd,sseiadd1,sseishft,sseishft1,sseimul,
|
317 |
|
|
sse,ssemov,sseadd,ssemul,ssecmp,ssecomi,ssecvt,ssecvt1,sseicvt,ssediv,sseins,
|
318 |
|
|
ssemuladd,sse4arg,lwp,
|
319 |
|
|
mmx,mmxmov,mmxadd,mmxmul,mmxcmp,mmxcvt,mmxshft"
|
320 |
|
|
(const_string "other"))
|
321 |
|
|
|
322 |
|
|
;; Main data type used by the insn
|
323 |
|
|
(define_attr "mode"
|
324 |
|
|
"unknown,none,QI,HI,SI,DI,TI,OI,SF,DF,XF,TF,V8SF,V4DF,V4SF,V2DF,V2SF,V1DF"
|
325 |
|
|
(const_string "unknown"))
|
326 |
|
|
|
327 |
|
|
;; The CPU unit operations uses.
|
328 |
|
|
(define_attr "unit" "integer,i387,sse,mmx,unknown"
|
329 |
|
|
(cond [(eq_attr "type" "fmov,fop,fsgn,fmul,fdiv,fpspc,fcmov,fcmp,fxch,fistp,fisttp,frndint")
|
330 |
|
|
(const_string "i387")
|
331 |
|
|
(eq_attr "type" "sselog,sselog1,sseiadd,sseiadd1,sseishft,sseishft1,sseimul,
|
332 |
|
|
sse,ssemov,sseadd,ssemul,ssecmp,ssecomi,ssecvt,
|
333 |
|
|
ssecvt1,sseicvt,ssediv,sseins,ssemuladd,sse4arg")
|
334 |
|
|
(const_string "sse")
|
335 |
|
|
(eq_attr "type" "mmx,mmxmov,mmxadd,mmxmul,mmxcmp,mmxcvt,mmxshft")
|
336 |
|
|
(const_string "mmx")
|
337 |
|
|
(eq_attr "type" "other")
|
338 |
|
|
(const_string "unknown")]
|
339 |
|
|
(const_string "integer")))
|
340 |
|
|
|
341 |
|
|
;; The (bounding maximum) length of an instruction immediate.
|
342 |
|
|
(define_attr "length_immediate" ""
|
343 |
|
|
(cond [(eq_attr "type" "incdec,setcc,icmov,str,lea,other,multi,idiv,leave,
|
344 |
|
|
bitmanip,imulx")
|
345 |
|
|
(const_int 0)
|
346 |
|
|
(eq_attr "unit" "i387,sse,mmx")
|
347 |
|
|
(const_int 0)
|
348 |
|
|
(eq_attr "type" "alu,alu1,negnot,imovx,ishift,ishiftx,ishift1,
|
349 |
|
|
rotate,rotatex,rotate1,imul,icmp,push,pop")
|
350 |
|
|
(symbol_ref "ix86_attr_length_immediate_default (insn, true)")
|
351 |
|
|
(eq_attr "type" "imov,test")
|
352 |
|
|
(symbol_ref "ix86_attr_length_immediate_default (insn, false)")
|
353 |
|
|
(eq_attr "type" "call")
|
354 |
|
|
(if_then_else (match_operand 0 "constant_call_address_operand" "")
|
355 |
|
|
(const_int 4)
|
356 |
|
|
(const_int 0))
|
357 |
|
|
(eq_attr "type" "callv")
|
358 |
|
|
(if_then_else (match_operand 1 "constant_call_address_operand" "")
|
359 |
|
|
(const_int 4)
|
360 |
|
|
(const_int 0))
|
361 |
|
|
;; We don't know the size before shorten_branches. Expect
|
362 |
|
|
;; the instruction to fit for better scheduling.
|
363 |
|
|
(eq_attr "type" "ibr")
|
364 |
|
|
(const_int 1)
|
365 |
|
|
]
|
366 |
|
|
(symbol_ref "/* Update immediate_length and other attributes! */
|
367 |
|
|
gcc_unreachable (),1")))
|
368 |
|
|
|
369 |
|
|
;; The (bounding maximum) length of an instruction address.
|
370 |
|
|
(define_attr "length_address" ""
|
371 |
|
|
(cond [(eq_attr "type" "str,other,multi,fxch")
|
372 |
|
|
(const_int 0)
|
373 |
|
|
(and (eq_attr "type" "call")
|
374 |
|
|
(match_operand 0 "constant_call_address_operand" ""))
|
375 |
|
|
(const_int 0)
|
376 |
|
|
(and (eq_attr "type" "callv")
|
377 |
|
|
(match_operand 1 "constant_call_address_operand" ""))
|
378 |
|
|
(const_int 0)
|
379 |
|
|
]
|
380 |
|
|
(symbol_ref "ix86_attr_length_address_default (insn)")))
|
381 |
|
|
|
382 |
|
|
;; Set when length prefix is used.
|
383 |
|
|
(define_attr "prefix_data16" ""
|
384 |
|
|
(cond [(eq_attr "type" "ssemuladd,sse4arg,sseiadd1,ssecvt1")
|
385 |
|
|
(const_int 0)
|
386 |
|
|
(eq_attr "mode" "HI")
|
387 |
|
|
(const_int 1)
|
388 |
|
|
(and (eq_attr "unit" "sse") (eq_attr "mode" "V2DF,TI"))
|
389 |
|
|
(const_int 1)
|
390 |
|
|
]
|
391 |
|
|
(const_int 0)))
|
392 |
|
|
|
393 |
|
|
;; Set when string REP prefix is used.
|
394 |
|
|
(define_attr "prefix_rep" ""
|
395 |
|
|
(cond [(eq_attr "type" "ssemuladd,sse4arg,sseiadd1,ssecvt1")
|
396 |
|
|
(const_int 0)
|
397 |
|
|
(and (eq_attr "unit" "sse") (eq_attr "mode" "SF,DF"))
|
398 |
|
|
(const_int 1)
|
399 |
|
|
]
|
400 |
|
|
(const_int 0)))
|
401 |
|
|
|
402 |
|
|
;; Set when 0f opcode prefix is used.
|
403 |
|
|
(define_attr "prefix_0f" ""
|
404 |
|
|
(if_then_else
|
405 |
|
|
(ior (eq_attr "type" "imovx,setcc,icmov,bitmanip")
|
406 |
|
|
(eq_attr "unit" "sse,mmx"))
|
407 |
|
|
(const_int 1)
|
408 |
|
|
(const_int 0)))
|
409 |
|
|
|
410 |
|
|
;; Set when REX opcode prefix is used.
|
411 |
|
|
(define_attr "prefix_rex" ""
|
412 |
|
|
(cond [(not (match_test "TARGET_64BIT"))
|
413 |
|
|
(const_int 0)
|
414 |
|
|
(and (eq_attr "mode" "DI")
|
415 |
|
|
(and (eq_attr "type" "!push,pop,call,callv,leave,ibr")
|
416 |
|
|
(eq_attr "unit" "!mmx")))
|
417 |
|
|
(const_int 1)
|
418 |
|
|
(and (eq_attr "mode" "QI")
|
419 |
|
|
(match_test "x86_extended_QIreg_mentioned_p (insn)"))
|
420 |
|
|
(const_int 1)
|
421 |
|
|
(match_test "x86_extended_reg_mentioned_p (insn)")
|
422 |
|
|
(const_int 1)
|
423 |
|
|
(and (eq_attr "type" "imovx")
|
424 |
|
|
(match_operand:QI 1 "ext_QIreg_operand" ""))
|
425 |
|
|
(const_int 1)
|
426 |
|
|
]
|
427 |
|
|
(const_int 0)))
|
428 |
|
|
|
429 |
|
|
;; There are also additional prefixes in 3DNOW, SSSE3.
|
430 |
|
|
;; ssemuladd,sse4arg default to 0f24/0f25 and DREX byte,
|
431 |
|
|
;; sseiadd1,ssecvt1 to 0f7a with no DREX byte.
|
432 |
|
|
;; 3DNOW has 0f0f prefix, SSSE3 and SSE4_{1,2} 0f38/0f3a.
|
433 |
|
|
(define_attr "prefix_extra" ""
|
434 |
|
|
(cond [(eq_attr "type" "ssemuladd,sse4arg")
|
435 |
|
|
(const_int 2)
|
436 |
|
|
(eq_attr "type" "sseiadd1,ssecvt1")
|
437 |
|
|
(const_int 1)
|
438 |
|
|
]
|
439 |
|
|
(const_int 0)))
|
440 |
|
|
|
441 |
|
|
;; Prefix used: original, VEX or maybe VEX.
|
442 |
|
|
(define_attr "prefix" "orig,vex,maybe_vex"
|
443 |
|
|
(if_then_else (eq_attr "mode" "OI,V8SF,V4DF")
|
444 |
|
|
(const_string "vex")
|
445 |
|
|
(const_string "orig")))
|
446 |
|
|
|
447 |
|
|
;; VEX W bit is used.
|
448 |
|
|
(define_attr "prefix_vex_w" "" (const_int 0))
|
449 |
|
|
|
450 |
|
|
;; The length of VEX prefix
|
451 |
|
|
;; Only instructions with 0f prefix can have 2 byte VEX prefix,
|
452 |
|
|
;; 0f38/0f3a prefixes can't. In i386.md 0f3[8a] is
|
453 |
|
|
;; still prefix_0f 1, with prefix_extra 1.
|
454 |
|
|
(define_attr "length_vex" ""
|
455 |
|
|
(if_then_else (and (eq_attr "prefix_0f" "1")
|
456 |
|
|
(eq_attr "prefix_extra" "0"))
|
457 |
|
|
(if_then_else (eq_attr "prefix_vex_w" "1")
|
458 |
|
|
(symbol_ref "ix86_attr_length_vex_default (insn, true, true)")
|
459 |
|
|
(symbol_ref "ix86_attr_length_vex_default (insn, true, false)"))
|
460 |
|
|
(if_then_else (eq_attr "prefix_vex_w" "1")
|
461 |
|
|
(symbol_ref "ix86_attr_length_vex_default (insn, false, true)")
|
462 |
|
|
(symbol_ref "ix86_attr_length_vex_default (insn, false, false)"))))
|
463 |
|
|
|
464 |
|
|
;; Set when modrm byte is used.
|
465 |
|
|
(define_attr "modrm" ""
|
466 |
|
|
(cond [(eq_attr "type" "str,leave")
|
467 |
|
|
(const_int 0)
|
468 |
|
|
(eq_attr "unit" "i387")
|
469 |
|
|
(const_int 0)
|
470 |
|
|
(and (eq_attr "type" "incdec")
|
471 |
|
|
(and (not (match_test "TARGET_64BIT"))
|
472 |
|
|
(ior (match_operand:SI 1 "register_operand" "")
|
473 |
|
|
(match_operand:HI 1 "register_operand" ""))))
|
474 |
|
|
(const_int 0)
|
475 |
|
|
(and (eq_attr "type" "push")
|
476 |
|
|
(not (match_operand 1 "memory_operand" "")))
|
477 |
|
|
(const_int 0)
|
478 |
|
|
(and (eq_attr "type" "pop")
|
479 |
|
|
(not (match_operand 0 "memory_operand" "")))
|
480 |
|
|
(const_int 0)
|
481 |
|
|
(and (eq_attr "type" "imov")
|
482 |
|
|
(and (not (eq_attr "mode" "DI"))
|
483 |
|
|
(ior (and (match_operand 0 "register_operand" "")
|
484 |
|
|
(match_operand 1 "immediate_operand" ""))
|
485 |
|
|
(ior (and (match_operand 0 "ax_reg_operand" "")
|
486 |
|
|
(match_operand 1 "memory_displacement_only_operand" ""))
|
487 |
|
|
(and (match_operand 0 "memory_displacement_only_operand" "")
|
488 |
|
|
(match_operand 1 "ax_reg_operand" ""))))))
|
489 |
|
|
(const_int 0)
|
490 |
|
|
(and (eq_attr "type" "call")
|
491 |
|
|
(match_operand 0 "constant_call_address_operand" ""))
|
492 |
|
|
(const_int 0)
|
493 |
|
|
(and (eq_attr "type" "callv")
|
494 |
|
|
(match_operand 1 "constant_call_address_operand" ""))
|
495 |
|
|
(const_int 0)
|
496 |
|
|
(and (eq_attr "type" "alu,alu1,icmp,test")
|
497 |
|
|
(match_operand 0 "ax_reg_operand" ""))
|
498 |
|
|
(symbol_ref "(get_attr_length_immediate (insn) <= (get_attr_mode (insn) != MODE_QI))")
|
499 |
|
|
]
|
500 |
|
|
(const_int 1)))
|
501 |
|
|
|
502 |
|
|
;; The (bounding maximum) length of an instruction in bytes.
|
503 |
|
|
;; ??? fistp and frndint are in fact fldcw/{fistp,frndint}/fldcw sequences.
|
504 |
|
|
;; Later we may want to split them and compute proper length as for
|
505 |
|
|
;; other insns.
|
506 |
|
|
(define_attr "length" ""
|
507 |
|
|
(cond [(eq_attr "type" "other,multi,fistp,frndint")
|
508 |
|
|
(const_int 16)
|
509 |
|
|
(eq_attr "type" "fcmp")
|
510 |
|
|
(const_int 4)
|
511 |
|
|
(eq_attr "unit" "i387")
|
512 |
|
|
(plus (const_int 2)
|
513 |
|
|
(plus (attr "prefix_data16")
|
514 |
|
|
(attr "length_address")))
|
515 |
|
|
(ior (eq_attr "prefix" "vex")
|
516 |
|
|
(and (eq_attr "prefix" "maybe_vex")
|
517 |
|
|
(match_test "TARGET_AVX")))
|
518 |
|
|
(plus (attr "length_vex")
|
519 |
|
|
(plus (attr "length_immediate")
|
520 |
|
|
(plus (attr "modrm")
|
521 |
|
|
(attr "length_address"))))]
|
522 |
|
|
(plus (plus (attr "modrm")
|
523 |
|
|
(plus (attr "prefix_0f")
|
524 |
|
|
(plus (attr "prefix_rex")
|
525 |
|
|
(plus (attr "prefix_extra")
|
526 |
|
|
(const_int 1)))))
|
527 |
|
|
(plus (attr "prefix_rep")
|
528 |
|
|
(plus (attr "prefix_data16")
|
529 |
|
|
(plus (attr "length_immediate")
|
530 |
|
|
(attr "length_address")))))))
|
531 |
|
|
|
532 |
|
|
;; The `memory' attribute is `none' if no memory is referenced, `load' or
|
533 |
|
|
;; `store' if there is a simple memory reference therein, or `unknown'
|
534 |
|
|
;; if the instruction is complex.
|
535 |
|
|
|
536 |
|
|
(define_attr "memory" "none,load,store,both,unknown"
|
537 |
|
|
(cond [(eq_attr "type" "other,multi,str,lwp")
|
538 |
|
|
(const_string "unknown")
|
539 |
|
|
(eq_attr "type" "lea,fcmov,fpspc")
|
540 |
|
|
(const_string "none")
|
541 |
|
|
(eq_attr "type" "fistp,leave")
|
542 |
|
|
(const_string "both")
|
543 |
|
|
(eq_attr "type" "frndint")
|
544 |
|
|
(const_string "load")
|
545 |
|
|
(eq_attr "type" "push")
|
546 |
|
|
(if_then_else (match_operand 1 "memory_operand" "")
|
547 |
|
|
(const_string "both")
|
548 |
|
|
(const_string "store"))
|
549 |
|
|
(eq_attr "type" "pop")
|
550 |
|
|
(if_then_else (match_operand 0 "memory_operand" "")
|
551 |
|
|
(const_string "both")
|
552 |
|
|
(const_string "load"))
|
553 |
|
|
(eq_attr "type" "setcc")
|
554 |
|
|
(if_then_else (match_operand 0 "memory_operand" "")
|
555 |
|
|
(const_string "store")
|
556 |
|
|
(const_string "none"))
|
557 |
|
|
(eq_attr "type" "icmp,test,ssecmp,ssecomi,mmxcmp,fcmp")
|
558 |
|
|
(if_then_else (ior (match_operand 0 "memory_operand" "")
|
559 |
|
|
(match_operand 1 "memory_operand" ""))
|
560 |
|
|
(const_string "load")
|
561 |
|
|
(const_string "none"))
|
562 |
|
|
(eq_attr "type" "ibr")
|
563 |
|
|
(if_then_else (match_operand 0 "memory_operand" "")
|
564 |
|
|
(const_string "load")
|
565 |
|
|
(const_string "none"))
|
566 |
|
|
(eq_attr "type" "call")
|
567 |
|
|
(if_then_else (match_operand 0 "constant_call_address_operand" "")
|
568 |
|
|
(const_string "none")
|
569 |
|
|
(const_string "load"))
|
570 |
|
|
(eq_attr "type" "callv")
|
571 |
|
|
(if_then_else (match_operand 1 "constant_call_address_operand" "")
|
572 |
|
|
(const_string "none")
|
573 |
|
|
(const_string "load"))
|
574 |
|
|
(and (eq_attr "type" "alu1,negnot,ishift1,sselog1")
|
575 |
|
|
(match_operand 1 "memory_operand" ""))
|
576 |
|
|
(const_string "both")
|
577 |
|
|
(and (match_operand 0 "memory_operand" "")
|
578 |
|
|
(match_operand 1 "memory_operand" ""))
|
579 |
|
|
(const_string "both")
|
580 |
|
|
(match_operand 0 "memory_operand" "")
|
581 |
|
|
(const_string "store")
|
582 |
|
|
(match_operand 1 "memory_operand" "")
|
583 |
|
|
(const_string "load")
|
584 |
|
|
(and (eq_attr "type"
|
585 |
|
|
"!alu1,negnot,ishift1,
|
586 |
|
|
imov,imovx,icmp,test,bitmanip,
|
587 |
|
|
fmov,fcmp,fsgn,
|
588 |
|
|
sse,ssemov,ssecmp,ssecomi,ssecvt,ssecvt1,sseicvt,sselog1,
|
589 |
|
|
sseiadd1,mmx,mmxmov,mmxcmp,mmxcvt")
|
590 |
|
|
(match_operand 2 "memory_operand" ""))
|
591 |
|
|
(const_string "load")
|
592 |
|
|
(and (eq_attr "type" "icmov,ssemuladd,sse4arg")
|
593 |
|
|
(match_operand 3 "memory_operand" ""))
|
594 |
|
|
(const_string "load")
|
595 |
|
|
]
|
596 |
|
|
(const_string "none")))
|
597 |
|
|
|
598 |
|
|
;; Indicates if an instruction has both an immediate and a displacement.
|
599 |
|
|
|
600 |
|
|
(define_attr "imm_disp" "false,true,unknown"
|
601 |
|
|
(cond [(eq_attr "type" "other,multi")
|
602 |
|
|
(const_string "unknown")
|
603 |
|
|
(and (eq_attr "type" "icmp,test,imov,alu1,ishift1,rotate1")
|
604 |
|
|
(and (match_operand 0 "memory_displacement_operand" "")
|
605 |
|
|
(match_operand 1 "immediate_operand" "")))
|
606 |
|
|
(const_string "true")
|
607 |
|
|
(and (eq_attr "type" "alu,ishift,ishiftx,rotate,rotatex,imul,idiv")
|
608 |
|
|
(and (match_operand 0 "memory_displacement_operand" "")
|
609 |
|
|
(match_operand 2 "immediate_operand" "")))
|
610 |
|
|
(const_string "true")
|
611 |
|
|
]
|
612 |
|
|
(const_string "false")))
|
613 |
|
|
|
614 |
|
|
;; Indicates if an FP operation has an integer source.
|
615 |
|
|
|
616 |
|
|
(define_attr "fp_int_src" "false,true"
|
617 |
|
|
(const_string "false"))
|
618 |
|
|
|
619 |
|
|
;; Defines rounding mode of an FP operation.
|
620 |
|
|
|
621 |
|
|
(define_attr "i387_cw" "trunc,floor,ceil,mask_pm,uninitialized,any"
|
622 |
|
|
(const_string "any"))
|
623 |
|
|
|
624 |
|
|
;; Define attribute to classify add/sub insns that consumes carry flag (CF)
|
625 |
|
|
(define_attr "use_carry" "0,1" (const_string "0"))
|
626 |
|
|
|
627 |
|
|
;; Define attribute to indicate unaligned ssemov insns
|
628 |
|
|
(define_attr "movu" "0,1" (const_string "0"))
|
629 |
|
|
|
630 |
|
|
;; Used to control the "enabled" attribute on a per-instruction basis.
|
631 |
|
|
(define_attr "isa" "base,sse2,sse2_noavx,sse3,sse4,sse4_noavx,noavx,avx,bmi2"
|
632 |
|
|
(const_string "base"))
|
633 |
|
|
|
634 |
|
|
(define_attr "enabled" ""
|
635 |
|
|
(cond [(eq_attr "isa" "sse2") (symbol_ref "TARGET_SSE2")
|
636 |
|
|
(eq_attr "isa" "sse2_noavx")
|
637 |
|
|
(symbol_ref "TARGET_SSE2 && !TARGET_AVX")
|
638 |
|
|
(eq_attr "isa" "sse3") (symbol_ref "TARGET_SSE3")
|
639 |
|
|
(eq_attr "isa" "sse4") (symbol_ref "TARGET_SSE4_1")
|
640 |
|
|
(eq_attr "isa" "sse4_noavx")
|
641 |
|
|
(symbol_ref "TARGET_SSE4_1 && !TARGET_AVX")
|
642 |
|
|
(eq_attr "isa" "avx") (symbol_ref "TARGET_AVX")
|
643 |
|
|
(eq_attr "isa" "noavx") (symbol_ref "!TARGET_AVX")
|
644 |
|
|
(eq_attr "isa" "bmi2") (symbol_ref "TARGET_BMI2")
|
645 |
|
|
]
|
646 |
|
|
(const_int 1)))
|
647 |
|
|
|
648 |
|
|
;; Describe a user's asm statement.
|
649 |
|
|
(define_asm_attributes
|
650 |
|
|
[(set_attr "length" "128")
|
651 |
|
|
(set_attr "type" "multi")])
|
652 |
|
|
|
653 |
|
|
(define_code_iterator plusminus [plus minus])
|
654 |
|
|
|
655 |
|
|
(define_code_iterator sat_plusminus [ss_plus us_plus ss_minus us_minus])
|
656 |
|
|
|
657 |
|
|
;; Base name for define_insn
|
658 |
|
|
(define_code_attr plusminus_insn
|
659 |
|
|
[(plus "add") (ss_plus "ssadd") (us_plus "usadd")
|
660 |
|
|
(minus "sub") (ss_minus "sssub") (us_minus "ussub")])
|
661 |
|
|
|
662 |
|
|
;; Base name for insn mnemonic.
|
663 |
|
|
(define_code_attr plusminus_mnemonic
|
664 |
|
|
[(plus "add") (ss_plus "adds") (us_plus "addus")
|
665 |
|
|
(minus "sub") (ss_minus "subs") (us_minus "subus")])
|
666 |
|
|
(define_code_attr plusminus_carry_mnemonic
|
667 |
|
|
[(plus "adc") (minus "sbb")])
|
668 |
|
|
|
669 |
|
|
;; Mark commutative operators as such in constraints.
|
670 |
|
|
(define_code_attr comm [(plus "%") (ss_plus "%") (us_plus "%")
|
671 |
|
|
(minus "") (ss_minus "") (us_minus "")])
|
672 |
|
|
|
673 |
|
|
;; Mapping of max and min
|
674 |
|
|
(define_code_iterator maxmin [smax smin umax umin])
|
675 |
|
|
|
676 |
|
|
;; Mapping of signed max and min
|
677 |
|
|
(define_code_iterator smaxmin [smax smin])
|
678 |
|
|
|
679 |
|
|
;; Mapping of unsigned max and min
|
680 |
|
|
(define_code_iterator umaxmin [umax umin])
|
681 |
|
|
|
682 |
|
|
;; Base name for integer and FP insn mnemonic
|
683 |
|
|
(define_code_attr maxmin_int [(smax "maxs") (smin "mins")
|
684 |
|
|
(umax "maxu") (umin "minu")])
|
685 |
|
|
(define_code_attr maxmin_float [(smax "max") (smin "min")])
|
686 |
|
|
|
687 |
|
|
;; Mapping of logic operators
|
688 |
|
|
(define_code_iterator any_logic [and ior xor])
|
689 |
|
|
(define_code_iterator any_or [ior xor])
|
690 |
|
|
|
691 |
|
|
;; Base name for insn mnemonic.
|
692 |
|
|
(define_code_attr logic [(and "and") (ior "or") (xor "xor")])
|
693 |
|
|
|
694 |
|
|
;; Mapping of logic-shift operators
|
695 |
|
|
(define_code_iterator any_lshift [ashift lshiftrt])
|
696 |
|
|
|
697 |
|
|
;; Mapping of shift-right operators
|
698 |
|
|
(define_code_iterator any_shiftrt [lshiftrt ashiftrt])
|
699 |
|
|
|
700 |
|
|
;; Base name for define_insn
|
701 |
|
|
(define_code_attr shift_insn
|
702 |
|
|
[(ashift "ashl") (lshiftrt "lshr") (ashiftrt "ashr")])
|
703 |
|
|
|
704 |
|
|
;; Base name for insn mnemonic.
|
705 |
|
|
(define_code_attr shift [(ashift "sll") (lshiftrt "shr") (ashiftrt "sar")])
|
706 |
|
|
(define_code_attr vshift [(ashift "sll") (lshiftrt "srl") (ashiftrt "sra")])
|
707 |
|
|
|
708 |
|
|
;; Mapping of rotate operators
|
709 |
|
|
(define_code_iterator any_rotate [rotate rotatert])
|
710 |
|
|
|
711 |
|
|
;; Base name for define_insn
|
712 |
|
|
(define_code_attr rotate_insn [(rotate "rotl") (rotatert "rotr")])
|
713 |
|
|
|
714 |
|
|
;; Base name for insn mnemonic.
|
715 |
|
|
(define_code_attr rotate [(rotate "rol") (rotatert "ror")])
|
716 |
|
|
|
717 |
|
|
;; Mapping of abs neg operators
|
718 |
|
|
(define_code_iterator absneg [abs neg])
|
719 |
|
|
|
720 |
|
|
;; Base name for x87 insn mnemonic.
|
721 |
|
|
(define_code_attr absneg_mnemonic [(abs "abs") (neg "chs")])
|
722 |
|
|
|
723 |
|
|
;; Used in signed and unsigned widening multiplications.
|
724 |
|
|
(define_code_iterator any_extend [sign_extend zero_extend])
|
725 |
|
|
|
726 |
|
|
;; Prefix for insn menmonic.
|
727 |
|
|
(define_code_attr sgnprefix [(sign_extend "i") (zero_extend "")])
|
728 |
|
|
|
729 |
|
|
;; Prefix for define_insn
|
730 |
|
|
(define_code_attr u [(sign_extend "") (zero_extend "u")])
|
731 |
|
|
(define_code_attr s [(sign_extend "s") (zero_extend "u")])
|
732 |
|
|
|
733 |
|
|
;; All integer modes.
|
734 |
|
|
(define_mode_iterator SWI1248x [QI HI SI DI])
|
735 |
|
|
|
736 |
|
|
;; All integer modes without QImode.
|
737 |
|
|
(define_mode_iterator SWI248x [HI SI DI])
|
738 |
|
|
|
739 |
|
|
;; All integer modes without QImode and HImode.
|
740 |
|
|
(define_mode_iterator SWI48x [SI DI])
|
741 |
|
|
|
742 |
|
|
;; All integer modes without SImode and DImode.
|
743 |
|
|
(define_mode_iterator SWI12 [QI HI])
|
744 |
|
|
|
745 |
|
|
;; All integer modes without DImode.
|
746 |
|
|
(define_mode_iterator SWI124 [QI HI SI])
|
747 |
|
|
|
748 |
|
|
;; All integer modes without QImode and DImode.
|
749 |
|
|
(define_mode_iterator SWI24 [HI SI])
|
750 |
|
|
|
751 |
|
|
;; Single word integer modes.
|
752 |
|
|
(define_mode_iterator SWI [QI HI SI (DI "TARGET_64BIT")])
|
753 |
|
|
|
754 |
|
|
;; Single word integer modes without QImode.
|
755 |
|
|
(define_mode_iterator SWI248 [HI SI (DI "TARGET_64BIT")])
|
756 |
|
|
|
757 |
|
|
;; Single word integer modes without QImode and HImode.
|
758 |
|
|
(define_mode_iterator SWI48 [SI (DI "TARGET_64BIT")])
|
759 |
|
|
|
760 |
|
|
;; All math-dependant single and double word integer modes.
|
761 |
|
|
(define_mode_iterator SDWIM [(QI "TARGET_QIMODE_MATH")
|
762 |
|
|
(HI "TARGET_HIMODE_MATH")
|
763 |
|
|
SI DI (TI "TARGET_64BIT")])
|
764 |
|
|
|
765 |
|
|
;; Math-dependant single word integer modes.
|
766 |
|
|
(define_mode_iterator SWIM [(QI "TARGET_QIMODE_MATH")
|
767 |
|
|
(HI "TARGET_HIMODE_MATH")
|
768 |
|
|
SI (DI "TARGET_64BIT")])
|
769 |
|
|
|
770 |
|
|
;; Math-dependant integer modes without DImode.
|
771 |
|
|
(define_mode_iterator SWIM124 [(QI "TARGET_QIMODE_MATH")
|
772 |
|
|
(HI "TARGET_HIMODE_MATH")
|
773 |
|
|
SI])
|
774 |
|
|
|
775 |
|
|
;; Math-dependant single word integer modes without QImode.
|
776 |
|
|
(define_mode_iterator SWIM248 [(HI "TARGET_HIMODE_MATH")
|
777 |
|
|
SI (DI "TARGET_64BIT")])
|
778 |
|
|
|
779 |
|
|
;; Double word integer modes.
|
780 |
|
|
(define_mode_iterator DWI [(DI "!TARGET_64BIT")
|
781 |
|
|
(TI "TARGET_64BIT")])
|
782 |
|
|
|
783 |
|
|
;; Double word integer modes as mode attribute.
|
784 |
|
|
(define_mode_attr DWI [(SI "DI") (DI "TI")])
|
785 |
|
|
(define_mode_attr dwi [(SI "di") (DI "ti")])
|
786 |
|
|
|
787 |
|
|
;; Half mode for double word integer modes.
|
788 |
|
|
(define_mode_iterator DWIH [(SI "!TARGET_64BIT")
|
789 |
|
|
(DI "TARGET_64BIT")])
|
790 |
|
|
|
791 |
|
|
;; Instruction suffix for integer modes.
|
792 |
|
|
(define_mode_attr imodesuffix [(QI "b") (HI "w") (SI "l") (DI "q")])
|
793 |
|
|
|
794 |
|
|
;; Pointer size prefix for integer modes (Intel asm dialect)
|
795 |
|
|
(define_mode_attr iptrsize [(QI "BYTE")
|
796 |
|
|
(HI "WORD")
|
797 |
|
|
(SI "DWORD")
|
798 |
|
|
(DI "QWORD")])
|
799 |
|
|
|
800 |
|
|
;; Register class for integer modes.
|
801 |
|
|
(define_mode_attr r [(QI "q") (HI "r") (SI "r") (DI "r")])
|
802 |
|
|
|
803 |
|
|
;; Immediate operand constraint for integer modes.
|
804 |
|
|
(define_mode_attr i [(QI "n") (HI "n") (SI "e") (DI "e")])
|
805 |
|
|
|
806 |
|
|
;; General operand constraint for word modes.
|
807 |
|
|
(define_mode_attr g [(QI "qmn") (HI "rmn") (SI "rme") (DI "rme")])
|
808 |
|
|
|
809 |
|
|
;; Immediate operand constraint for double integer modes.
|
810 |
|
|
(define_mode_attr di [(SI "nF") (DI "e")])
|
811 |
|
|
|
812 |
|
|
;; Immediate operand constraint for shifts.
|
813 |
|
|
(define_mode_attr S [(QI "I") (HI "I") (SI "I") (DI "J") (TI "O")])
|
814 |
|
|
|
815 |
|
|
;; General operand predicate for integer modes.
|
816 |
|
|
(define_mode_attr general_operand
|
817 |
|
|
[(QI "general_operand")
|
818 |
|
|
(HI "general_operand")
|
819 |
|
|
(SI "x86_64_general_operand")
|
820 |
|
|
(DI "x86_64_general_operand")
|
821 |
|
|
(TI "x86_64_general_operand")])
|
822 |
|
|
|
823 |
|
|
;; General sign/zero extend operand predicate for integer modes.
|
824 |
|
|
(define_mode_attr general_szext_operand
|
825 |
|
|
[(QI "general_operand")
|
826 |
|
|
(HI "general_operand")
|
827 |
|
|
(SI "x86_64_szext_general_operand")
|
828 |
|
|
(DI "x86_64_szext_general_operand")])
|
829 |
|
|
|
830 |
|
|
;; Immediate operand predicate for integer modes.
|
831 |
|
|
(define_mode_attr immediate_operand
|
832 |
|
|
[(QI "immediate_operand")
|
833 |
|
|
(HI "immediate_operand")
|
834 |
|
|
(SI "x86_64_immediate_operand")
|
835 |
|
|
(DI "x86_64_immediate_operand")])
|
836 |
|
|
|
837 |
|
|
;; Nonmemory operand predicate for integer modes.
|
838 |
|
|
(define_mode_attr nonmemory_operand
|
839 |
|
|
[(QI "nonmemory_operand")
|
840 |
|
|
(HI "nonmemory_operand")
|
841 |
|
|
(SI "x86_64_nonmemory_operand")
|
842 |
|
|
(DI "x86_64_nonmemory_operand")])
|
843 |
|
|
|
844 |
|
|
;; Operand predicate for shifts.
|
845 |
|
|
(define_mode_attr shift_operand
|
846 |
|
|
[(QI "nonimmediate_operand")
|
847 |
|
|
(HI "nonimmediate_operand")
|
848 |
|
|
(SI "nonimmediate_operand")
|
849 |
|
|
(DI "shiftdi_operand")
|
850 |
|
|
(TI "register_operand")])
|
851 |
|
|
|
852 |
|
|
;; Operand predicate for shift argument.
|
853 |
|
|
(define_mode_attr shift_immediate_operand
|
854 |
|
|
[(QI "const_1_to_31_operand")
|
855 |
|
|
(HI "const_1_to_31_operand")
|
856 |
|
|
(SI "const_1_to_31_operand")
|
857 |
|
|
(DI "const_1_to_63_operand")])
|
858 |
|
|
|
859 |
|
|
;; Input operand predicate for arithmetic left shifts.
|
860 |
|
|
(define_mode_attr ashl_input_operand
|
861 |
|
|
[(QI "nonimmediate_operand")
|
862 |
|
|
(HI "nonimmediate_operand")
|
863 |
|
|
(SI "nonimmediate_operand")
|
864 |
|
|
(DI "ashldi_input_operand")
|
865 |
|
|
(TI "reg_or_pm1_operand")])
|
866 |
|
|
|
867 |
|
|
;; SSE and x87 SFmode and DFmode floating point modes
|
868 |
|
|
(define_mode_iterator MODEF [SF DF])
|
869 |
|
|
|
870 |
|
|
;; All x87 floating point modes
|
871 |
|
|
(define_mode_iterator X87MODEF [SF DF XF])
|
872 |
|
|
|
873 |
|
|
;; SSE instruction suffix for various modes
|
874 |
|
|
(define_mode_attr ssemodesuffix
|
875 |
|
|
[(SF "ss") (DF "sd")
|
876 |
|
|
(V8SF "ps") (V4DF "pd")
|
877 |
|
|
(V4SF "ps") (V2DF "pd")
|
878 |
|
|
(V16QI "b") (V8HI "w") (V4SI "d") (V2DI "q")
|
879 |
|
|
(V32QI "b") (V16HI "w") (V8SI "d") (V4DI "q")])
|
880 |
|
|
|
881 |
|
|
;; SSE vector suffix for floating point modes
|
882 |
|
|
(define_mode_attr ssevecmodesuffix [(SF "ps") (DF "pd")])
|
883 |
|
|
|
884 |
|
|
;; SSE vector mode corresponding to a scalar mode
|
885 |
|
|
(define_mode_attr ssevecmode
|
886 |
|
|
[(QI "V16QI") (HI "V8HI") (SI "V4SI") (DI "V2DI") (SF "V4SF") (DF "V2DF")])
|
887 |
|
|
|
888 |
|
|
;; Instruction suffix for REX 64bit operators.
|
889 |
|
|
(define_mode_attr rex64suffix [(SI "") (DI "{q}")])
|
890 |
|
|
|
891 |
|
|
;; This mode iterator allows :P to be used for patterns that operate on
|
892 |
|
|
;; pointer-sized quantities. Exactly one of the two alternatives will match.
|
893 |
|
|
(define_mode_iterator P [(SI "Pmode == SImode") (DI "Pmode == DImode")])
|
894 |
|
|
|
895 |
|
|
;; This mode iterator allows :PTR to be used for patterns that operate on
|
896 |
|
|
;; ptr_mode sized quantities.
|
897 |
|
|
(define_mode_iterator PTR
|
898 |
|
|
[(SI "ptr_mode == SImode") (DI "ptr_mode == DImode")])
|
899 |
|
|
|
900 |
|
|
;; Scheduling descriptions
|
901 |
|
|
|
902 |
|
|
(include "pentium.md")
|
903 |
|
|
(include "ppro.md")
|
904 |
|
|
(include "k6.md")
|
905 |
|
|
(include "athlon.md")
|
906 |
|
|
(include "bdver1.md")
|
907 |
|
|
(include "geode.md")
|
908 |
|
|
(include "atom.md")
|
909 |
|
|
(include "core2.md")
|
910 |
|
|
|
911 |
|
|
|
912 |
|
|
;; Operand and operator predicates and constraints
|
913 |
|
|
|
914 |
|
|
(include "predicates.md")
|
915 |
|
|
(include "constraints.md")
|
916 |
|
|
|
917 |
|
|
|
918 |
|
|
;; Compare and branch/compare and store instructions.
|
919 |
|
|
|
920 |
|
|
(define_expand "cbranch4"
|
921 |
|
|
[(set (reg:CC FLAGS_REG)
|
922 |
|
|
(compare:CC (match_operand:SDWIM 1 "nonimmediate_operand" "")
|
923 |
|
|
(match_operand:SDWIM 2 "" "")))
|
924 |
|
|
(set (pc) (if_then_else
|
925 |
|
|
(match_operator 0 "ordered_comparison_operator"
|
926 |
|
|
[(reg:CC FLAGS_REG) (const_int 0)])
|
927 |
|
|
(label_ref (match_operand 3 "" ""))
|
928 |
|
|
(pc)))]
|
929 |
|
|
""
|
930 |
|
|
{
|
931 |
|
|
if (MEM_P (operands[1]) && MEM_P (operands[2]))
|
932 |
|
|
operands[1] = force_reg (mode, operands[1]);
|
933 |
|
|
ix86_expand_branch (GET_CODE (operands[0]),
|
934 |
|
|
operands[1], operands[2], operands[3]);
|
935 |
|
|
DONE;
|
936 |
|
|
})
|
937 |
|
|
|
938 |
|
|
(define_expand "cstore4"
|
939 |
|
|
[(set (reg:CC FLAGS_REG)
|
940 |
|
|
(compare:CC (match_operand:SWIM 2 "nonimmediate_operand" "")
|
941 |
|
|
(match_operand:SWIM 3 "" "")))
|
942 |
|
|
(set (match_operand:QI 0 "register_operand" "")
|
943 |
|
|
(match_operator 1 "ordered_comparison_operator"
|
944 |
|
|
[(reg:CC FLAGS_REG) (const_int 0)]))]
|
945 |
|
|
""
|
946 |
|
|
{
|
947 |
|
|
if (MEM_P (operands[2]) && MEM_P (operands[3]))
|
948 |
|
|
operands[2] = force_reg (mode, operands[2]);
|
949 |
|
|
ix86_expand_setcc (operands[0], GET_CODE (operands[1]),
|
950 |
|
|
operands[2], operands[3]);
|
951 |
|
|
DONE;
|
952 |
|
|
})
|
953 |
|
|
|
954 |
|
|
(define_expand "cmp_1"
|
955 |
|
|
[(set (reg:CC FLAGS_REG)
|
956 |
|
|
(compare:CC (match_operand:SWI48 0 "nonimmediate_operand" "")
|
957 |
|
|
(match_operand:SWI48 1 "" "")))])
|
958 |
|
|
|
959 |
|
|
(define_insn "*cmp_ccno_1"
|
960 |
|
|
[(set (reg FLAGS_REG)
|
961 |
|
|
(compare (match_operand:SWI 0 "nonimmediate_operand" ",?m")
|
962 |
|
|
(match_operand:SWI 1 "const0_operand" "")))]
|
963 |
|
|
"ix86_match_ccmode (insn, CCNOmode)"
|
964 |
|
|
"@
|
965 |
|
|
test{}\t%0, %0
|
966 |
|
|
cmp{}\t{%1, %0|%0, %1}"
|
967 |
|
|
[(set_attr "type" "test,icmp")
|
968 |
|
|
(set_attr "length_immediate" "0,1")
|
969 |
|
|
(set_attr "mode" "")])
|
970 |
|
|
|
971 |
|
|
(define_insn "*cmp_1"
|
972 |
|
|
[(set (reg FLAGS_REG)
|
973 |
|
|
(compare (match_operand:SWI 0 "nonimmediate_operand" "m,")
|
974 |
|
|
(match_operand:SWI 1 "" ",m")))]
|
975 |
|
|
"ix86_match_ccmode (insn, CCmode)"
|
976 |
|
|
"cmp{}\t{%1, %0|%0, %1}"
|
977 |
|
|
[(set_attr "type" "icmp")
|
978 |
|
|
(set_attr "mode" "")])
|
979 |
|
|
|
980 |
|
|
(define_insn "*cmp_minus_1"
|
981 |
|
|
[(set (reg FLAGS_REG)
|
982 |
|
|
(compare
|
983 |
|
|
(minus:SWI (match_operand:SWI 0 "nonimmediate_operand" "m,")
|
984 |
|
|
(match_operand:SWI 1 "" ",m"))
|
985 |
|
|
(const_int 0)))]
|
986 |
|
|
"ix86_match_ccmode (insn, CCGOCmode)"
|
987 |
|
|
"cmp{}\t{%1, %0|%0, %1}"
|
988 |
|
|
[(set_attr "type" "icmp")
|
989 |
|
|
(set_attr "mode" "")])
|
990 |
|
|
|
991 |
|
|
(define_insn "*cmpqi_ext_1"
|
992 |
|
|
[(set (reg FLAGS_REG)
|
993 |
|
|
(compare
|
994 |
|
|
(match_operand:QI 0 "general_operand" "Qm")
|
995 |
|
|
(subreg:QI
|
996 |
|
|
(zero_extract:SI
|
997 |
|
|
(match_operand 1 "ext_register_operand" "Q")
|
998 |
|
|
(const_int 8)
|
999 |
|
|
(const_int 8)) 0)))]
|
1000 |
|
|
"!TARGET_64BIT && ix86_match_ccmode (insn, CCmode)"
|
1001 |
|
|
"cmp{b}\t{%h1, %0|%0, %h1}"
|
1002 |
|
|
[(set_attr "type" "icmp")
|
1003 |
|
|
(set_attr "mode" "QI")])
|
1004 |
|
|
|
1005 |
|
|
(define_insn "*cmpqi_ext_1_rex64"
|
1006 |
|
|
[(set (reg FLAGS_REG)
|
1007 |
|
|
(compare
|
1008 |
|
|
(match_operand:QI 0 "register_operand" "Q")
|
1009 |
|
|
(subreg:QI
|
1010 |
|
|
(zero_extract:SI
|
1011 |
|
|
(match_operand 1 "ext_register_operand" "Q")
|
1012 |
|
|
(const_int 8)
|
1013 |
|
|
(const_int 8)) 0)))]
|
1014 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCmode)"
|
1015 |
|
|
"cmp{b}\t{%h1, %0|%0, %h1}"
|
1016 |
|
|
[(set_attr "type" "icmp")
|
1017 |
|
|
(set_attr "mode" "QI")])
|
1018 |
|
|
|
1019 |
|
|
(define_insn "*cmpqi_ext_2"
|
1020 |
|
|
[(set (reg FLAGS_REG)
|
1021 |
|
|
(compare
|
1022 |
|
|
(subreg:QI
|
1023 |
|
|
(zero_extract:SI
|
1024 |
|
|
(match_operand 0 "ext_register_operand" "Q")
|
1025 |
|
|
(const_int 8)
|
1026 |
|
|
(const_int 8)) 0)
|
1027 |
|
|
(match_operand:QI 1 "const0_operand" "")))]
|
1028 |
|
|
"ix86_match_ccmode (insn, CCNOmode)"
|
1029 |
|
|
"test{b}\t%h0, %h0"
|
1030 |
|
|
[(set_attr "type" "test")
|
1031 |
|
|
(set_attr "length_immediate" "0")
|
1032 |
|
|
(set_attr "mode" "QI")])
|
1033 |
|
|
|
1034 |
|
|
(define_expand "cmpqi_ext_3"
|
1035 |
|
|
[(set (reg:CC FLAGS_REG)
|
1036 |
|
|
(compare:CC
|
1037 |
|
|
(subreg:QI
|
1038 |
|
|
(zero_extract:SI
|
1039 |
|
|
(match_operand 0 "ext_register_operand" "")
|
1040 |
|
|
(const_int 8)
|
1041 |
|
|
(const_int 8)) 0)
|
1042 |
|
|
(match_operand:QI 1 "immediate_operand" "")))])
|
1043 |
|
|
|
1044 |
|
|
(define_insn "*cmpqi_ext_3_insn"
|
1045 |
|
|
[(set (reg FLAGS_REG)
|
1046 |
|
|
(compare
|
1047 |
|
|
(subreg:QI
|
1048 |
|
|
(zero_extract:SI
|
1049 |
|
|
(match_operand 0 "ext_register_operand" "Q")
|
1050 |
|
|
(const_int 8)
|
1051 |
|
|
(const_int 8)) 0)
|
1052 |
|
|
(match_operand:QI 1 "general_operand" "Qmn")))]
|
1053 |
|
|
"!TARGET_64BIT && ix86_match_ccmode (insn, CCmode)"
|
1054 |
|
|
"cmp{b}\t{%1, %h0|%h0, %1}"
|
1055 |
|
|
[(set_attr "type" "icmp")
|
1056 |
|
|
(set_attr "modrm" "1")
|
1057 |
|
|
(set_attr "mode" "QI")])
|
1058 |
|
|
|
1059 |
|
|
(define_insn "*cmpqi_ext_3_insn_rex64"
|
1060 |
|
|
[(set (reg FLAGS_REG)
|
1061 |
|
|
(compare
|
1062 |
|
|
(subreg:QI
|
1063 |
|
|
(zero_extract:SI
|
1064 |
|
|
(match_operand 0 "ext_register_operand" "Q")
|
1065 |
|
|
(const_int 8)
|
1066 |
|
|
(const_int 8)) 0)
|
1067 |
|
|
(match_operand:QI 1 "nonmemory_operand" "Qn")))]
|
1068 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCmode)"
|
1069 |
|
|
"cmp{b}\t{%1, %h0|%h0, %1}"
|
1070 |
|
|
[(set_attr "type" "icmp")
|
1071 |
|
|
(set_attr "modrm" "1")
|
1072 |
|
|
(set_attr "mode" "QI")])
|
1073 |
|
|
|
1074 |
|
|
(define_insn "*cmpqi_ext_4"
|
1075 |
|
|
[(set (reg FLAGS_REG)
|
1076 |
|
|
(compare
|
1077 |
|
|
(subreg:QI
|
1078 |
|
|
(zero_extract:SI
|
1079 |
|
|
(match_operand 0 "ext_register_operand" "Q")
|
1080 |
|
|
(const_int 8)
|
1081 |
|
|
(const_int 8)) 0)
|
1082 |
|
|
(subreg:QI
|
1083 |
|
|
(zero_extract:SI
|
1084 |
|
|
(match_operand 1 "ext_register_operand" "Q")
|
1085 |
|
|
(const_int 8)
|
1086 |
|
|
(const_int 8)) 0)))]
|
1087 |
|
|
"ix86_match_ccmode (insn, CCmode)"
|
1088 |
|
|
"cmp{b}\t{%h1, %h0|%h0, %h1}"
|
1089 |
|
|
[(set_attr "type" "icmp")
|
1090 |
|
|
(set_attr "mode" "QI")])
|
1091 |
|
|
|
1092 |
|
|
;; These implement float point compares.
|
1093 |
|
|
;; %%% See if we can get away with VOIDmode operands on the actual insns,
|
1094 |
|
|
;; which would allow mix and match FP modes on the compares. Which is what
|
1095 |
|
|
;; the old patterns did, but with many more of them.
|
1096 |
|
|
|
1097 |
|
|
(define_expand "cbranchxf4"
|
1098 |
|
|
[(set (reg:CC FLAGS_REG)
|
1099 |
|
|
(compare:CC (match_operand:XF 1 "nonmemory_operand" "")
|
1100 |
|
|
(match_operand:XF 2 "nonmemory_operand" "")))
|
1101 |
|
|
(set (pc) (if_then_else
|
1102 |
|
|
(match_operator 0 "ix86_fp_comparison_operator"
|
1103 |
|
|
[(reg:CC FLAGS_REG)
|
1104 |
|
|
(const_int 0)])
|
1105 |
|
|
(label_ref (match_operand 3 "" ""))
|
1106 |
|
|
(pc)))]
|
1107 |
|
|
"TARGET_80387"
|
1108 |
|
|
{
|
1109 |
|
|
ix86_expand_branch (GET_CODE (operands[0]),
|
1110 |
|
|
operands[1], operands[2], operands[3]);
|
1111 |
|
|
DONE;
|
1112 |
|
|
})
|
1113 |
|
|
|
1114 |
|
|
(define_expand "cstorexf4"
|
1115 |
|
|
[(set (reg:CC FLAGS_REG)
|
1116 |
|
|
(compare:CC (match_operand:XF 2 "nonmemory_operand" "")
|
1117 |
|
|
(match_operand:XF 3 "nonmemory_operand" "")))
|
1118 |
|
|
(set (match_operand:QI 0 "register_operand" "")
|
1119 |
|
|
(match_operator 1 "ix86_fp_comparison_operator"
|
1120 |
|
|
[(reg:CC FLAGS_REG)
|
1121 |
|
|
(const_int 0)]))]
|
1122 |
|
|
"TARGET_80387"
|
1123 |
|
|
{
|
1124 |
|
|
ix86_expand_setcc (operands[0], GET_CODE (operands[1]),
|
1125 |
|
|
operands[2], operands[3]);
|
1126 |
|
|
DONE;
|
1127 |
|
|
})
|
1128 |
|
|
|
1129 |
|
|
(define_expand "cbranch4"
|
1130 |
|
|
[(set (reg:CC FLAGS_REG)
|
1131 |
|
|
(compare:CC (match_operand:MODEF 1 "cmp_fp_expander_operand" "")
|
1132 |
|
|
(match_operand:MODEF 2 "cmp_fp_expander_operand" "")))
|
1133 |
|
|
(set (pc) (if_then_else
|
1134 |
|
|
(match_operator 0 "ix86_fp_comparison_operator"
|
1135 |
|
|
[(reg:CC FLAGS_REG)
|
1136 |
|
|
(const_int 0)])
|
1137 |
|
|
(label_ref (match_operand 3 "" ""))
|
1138 |
|
|
(pc)))]
|
1139 |
|
|
"TARGET_80387 || (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)"
|
1140 |
|
|
{
|
1141 |
|
|
ix86_expand_branch (GET_CODE (operands[0]),
|
1142 |
|
|
operands[1], operands[2], operands[3]);
|
1143 |
|
|
DONE;
|
1144 |
|
|
})
|
1145 |
|
|
|
1146 |
|
|
(define_expand "cstore4"
|
1147 |
|
|
[(set (reg:CC FLAGS_REG)
|
1148 |
|
|
(compare:CC (match_operand:MODEF 2 "cmp_fp_expander_operand" "")
|
1149 |
|
|
(match_operand:MODEF 3 "cmp_fp_expander_operand" "")))
|
1150 |
|
|
(set (match_operand:QI 0 "register_operand" "")
|
1151 |
|
|
(match_operator 1 "ix86_fp_comparison_operator"
|
1152 |
|
|
[(reg:CC FLAGS_REG)
|
1153 |
|
|
(const_int 0)]))]
|
1154 |
|
|
"TARGET_80387 || (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)"
|
1155 |
|
|
{
|
1156 |
|
|
ix86_expand_setcc (operands[0], GET_CODE (operands[1]),
|
1157 |
|
|
operands[2], operands[3]);
|
1158 |
|
|
DONE;
|
1159 |
|
|
})
|
1160 |
|
|
|
1161 |
|
|
(define_expand "cbranchcc4"
|
1162 |
|
|
[(set (pc) (if_then_else
|
1163 |
|
|
(match_operator 0 "comparison_operator"
|
1164 |
|
|
[(match_operand 1 "flags_reg_operand" "")
|
1165 |
|
|
(match_operand 2 "const0_operand" "")])
|
1166 |
|
|
(label_ref (match_operand 3 "" ""))
|
1167 |
|
|
(pc)))]
|
1168 |
|
|
""
|
1169 |
|
|
{
|
1170 |
|
|
ix86_expand_branch (GET_CODE (operands[0]),
|
1171 |
|
|
operands[1], operands[2], operands[3]);
|
1172 |
|
|
DONE;
|
1173 |
|
|
})
|
1174 |
|
|
|
1175 |
|
|
(define_expand "cstorecc4"
|
1176 |
|
|
[(set (match_operand:QI 0 "register_operand" "")
|
1177 |
|
|
(match_operator 1 "comparison_operator"
|
1178 |
|
|
[(match_operand 2 "flags_reg_operand" "")
|
1179 |
|
|
(match_operand 3 "const0_operand" "")]))]
|
1180 |
|
|
""
|
1181 |
|
|
{
|
1182 |
|
|
ix86_expand_setcc (operands[0], GET_CODE (operands[1]),
|
1183 |
|
|
operands[2], operands[3]);
|
1184 |
|
|
DONE;
|
1185 |
|
|
})
|
1186 |
|
|
|
1187 |
|
|
|
1188 |
|
|
;; FP compares, step 1:
|
1189 |
|
|
;; Set the FP condition codes.
|
1190 |
|
|
;;
|
1191 |
|
|
;; CCFPmode compare with exceptions
|
1192 |
|
|
;; CCFPUmode compare with no exceptions
|
1193 |
|
|
|
1194 |
|
|
;; We may not use "#" to split and emit these, since the REG_DEAD notes
|
1195 |
|
|
;; used to manage the reg stack popping would not be preserved.
|
1196 |
|
|
|
1197 |
|
|
(define_insn "*cmpfp_0"
|
1198 |
|
|
[(set (match_operand:HI 0 "register_operand" "=a")
|
1199 |
|
|
(unspec:HI
|
1200 |
|
|
[(compare:CCFP
|
1201 |
|
|
(match_operand 1 "register_operand" "f")
|
1202 |
|
|
(match_operand 2 "const0_operand" ""))]
|
1203 |
|
|
UNSPEC_FNSTSW))]
|
1204 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
1205 |
|
|
&& GET_MODE (operands[1]) == GET_MODE (operands[2])"
|
1206 |
|
|
"* return output_fp_compare (insn, operands, false, false);"
|
1207 |
|
|
[(set_attr "type" "multi")
|
1208 |
|
|
(set_attr "unit" "i387")
|
1209 |
|
|
(set (attr "mode")
|
1210 |
|
|
(cond [(match_operand:SF 1 "" "")
|
1211 |
|
|
(const_string "SF")
|
1212 |
|
|
(match_operand:DF 1 "" "")
|
1213 |
|
|
(const_string "DF")
|
1214 |
|
|
]
|
1215 |
|
|
(const_string "XF")))])
|
1216 |
|
|
|
1217 |
|
|
(define_insn_and_split "*cmpfp_0_cc"
|
1218 |
|
|
[(set (reg:CCFP FLAGS_REG)
|
1219 |
|
|
(compare:CCFP
|
1220 |
|
|
(match_operand 1 "register_operand" "f")
|
1221 |
|
|
(match_operand 2 "const0_operand" "")))
|
1222 |
|
|
(clobber (match_operand:HI 0 "register_operand" "=a"))]
|
1223 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
1224 |
|
|
&& TARGET_SAHF && !TARGET_CMOVE
|
1225 |
|
|
&& GET_MODE (operands[1]) == GET_MODE (operands[2])"
|
1226 |
|
|
"#"
|
1227 |
|
|
"&& reload_completed"
|
1228 |
|
|
[(set (match_dup 0)
|
1229 |
|
|
(unspec:HI
|
1230 |
|
|
[(compare:CCFP (match_dup 1)(match_dup 2))]
|
1231 |
|
|
UNSPEC_FNSTSW))
|
1232 |
|
|
(set (reg:CC FLAGS_REG)
|
1233 |
|
|
(unspec:CC [(match_dup 0)] UNSPEC_SAHF))]
|
1234 |
|
|
""
|
1235 |
|
|
[(set_attr "type" "multi")
|
1236 |
|
|
(set_attr "unit" "i387")
|
1237 |
|
|
(set (attr "mode")
|
1238 |
|
|
(cond [(match_operand:SF 1 "" "")
|
1239 |
|
|
(const_string "SF")
|
1240 |
|
|
(match_operand:DF 1 "" "")
|
1241 |
|
|
(const_string "DF")
|
1242 |
|
|
]
|
1243 |
|
|
(const_string "XF")))])
|
1244 |
|
|
|
1245 |
|
|
(define_insn "*cmpfp_xf"
|
1246 |
|
|
[(set (match_operand:HI 0 "register_operand" "=a")
|
1247 |
|
|
(unspec:HI
|
1248 |
|
|
[(compare:CCFP
|
1249 |
|
|
(match_operand:XF 1 "register_operand" "f")
|
1250 |
|
|
(match_operand:XF 2 "register_operand" "f"))]
|
1251 |
|
|
UNSPEC_FNSTSW))]
|
1252 |
|
|
"TARGET_80387"
|
1253 |
|
|
"* return output_fp_compare (insn, operands, false, false);"
|
1254 |
|
|
[(set_attr "type" "multi")
|
1255 |
|
|
(set_attr "unit" "i387")
|
1256 |
|
|
(set_attr "mode" "XF")])
|
1257 |
|
|
|
1258 |
|
|
(define_insn_and_split "*cmpfp_xf_cc"
|
1259 |
|
|
[(set (reg:CCFP FLAGS_REG)
|
1260 |
|
|
(compare:CCFP
|
1261 |
|
|
(match_operand:XF 1 "register_operand" "f")
|
1262 |
|
|
(match_operand:XF 2 "register_operand" "f")))
|
1263 |
|
|
(clobber (match_operand:HI 0 "register_operand" "=a"))]
|
1264 |
|
|
"TARGET_80387
|
1265 |
|
|
&& TARGET_SAHF && !TARGET_CMOVE"
|
1266 |
|
|
"#"
|
1267 |
|
|
"&& reload_completed"
|
1268 |
|
|
[(set (match_dup 0)
|
1269 |
|
|
(unspec:HI
|
1270 |
|
|
[(compare:CCFP (match_dup 1)(match_dup 2))]
|
1271 |
|
|
UNSPEC_FNSTSW))
|
1272 |
|
|
(set (reg:CC FLAGS_REG)
|
1273 |
|
|
(unspec:CC [(match_dup 0)] UNSPEC_SAHF))]
|
1274 |
|
|
""
|
1275 |
|
|
[(set_attr "type" "multi")
|
1276 |
|
|
(set_attr "unit" "i387")
|
1277 |
|
|
(set_attr "mode" "XF")])
|
1278 |
|
|
|
1279 |
|
|
(define_insn "*cmpfp_"
|
1280 |
|
|
[(set (match_operand:HI 0 "register_operand" "=a")
|
1281 |
|
|
(unspec:HI
|
1282 |
|
|
[(compare:CCFP
|
1283 |
|
|
(match_operand:MODEF 1 "register_operand" "f")
|
1284 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "fm"))]
|
1285 |
|
|
UNSPEC_FNSTSW))]
|
1286 |
|
|
"TARGET_80387"
|
1287 |
|
|
"* return output_fp_compare (insn, operands, false, false);"
|
1288 |
|
|
[(set_attr "type" "multi")
|
1289 |
|
|
(set_attr "unit" "i387")
|
1290 |
|
|
(set_attr "mode" "")])
|
1291 |
|
|
|
1292 |
|
|
(define_insn_and_split "*cmpfp__cc"
|
1293 |
|
|
[(set (reg:CCFP FLAGS_REG)
|
1294 |
|
|
(compare:CCFP
|
1295 |
|
|
(match_operand:MODEF 1 "register_operand" "f")
|
1296 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "fm")))
|
1297 |
|
|
(clobber (match_operand:HI 0 "register_operand" "=a"))]
|
1298 |
|
|
"TARGET_80387
|
1299 |
|
|
&& TARGET_SAHF && !TARGET_CMOVE"
|
1300 |
|
|
"#"
|
1301 |
|
|
"&& reload_completed"
|
1302 |
|
|
[(set (match_dup 0)
|
1303 |
|
|
(unspec:HI
|
1304 |
|
|
[(compare:CCFP (match_dup 1)(match_dup 2))]
|
1305 |
|
|
UNSPEC_FNSTSW))
|
1306 |
|
|
(set (reg:CC FLAGS_REG)
|
1307 |
|
|
(unspec:CC [(match_dup 0)] UNSPEC_SAHF))]
|
1308 |
|
|
""
|
1309 |
|
|
[(set_attr "type" "multi")
|
1310 |
|
|
(set_attr "unit" "i387")
|
1311 |
|
|
(set_attr "mode" "")])
|
1312 |
|
|
|
1313 |
|
|
(define_insn "*cmpfp_u"
|
1314 |
|
|
[(set (match_operand:HI 0 "register_operand" "=a")
|
1315 |
|
|
(unspec:HI
|
1316 |
|
|
[(compare:CCFPU
|
1317 |
|
|
(match_operand 1 "register_operand" "f")
|
1318 |
|
|
(match_operand 2 "register_operand" "f"))]
|
1319 |
|
|
UNSPEC_FNSTSW))]
|
1320 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
1321 |
|
|
&& GET_MODE (operands[1]) == GET_MODE (operands[2])"
|
1322 |
|
|
"* return output_fp_compare (insn, operands, false, true);"
|
1323 |
|
|
[(set_attr "type" "multi")
|
1324 |
|
|
(set_attr "unit" "i387")
|
1325 |
|
|
(set (attr "mode")
|
1326 |
|
|
(cond [(match_operand:SF 1 "" "")
|
1327 |
|
|
(const_string "SF")
|
1328 |
|
|
(match_operand:DF 1 "" "")
|
1329 |
|
|
(const_string "DF")
|
1330 |
|
|
]
|
1331 |
|
|
(const_string "XF")))])
|
1332 |
|
|
|
1333 |
|
|
(define_insn_and_split "*cmpfp_u_cc"
|
1334 |
|
|
[(set (reg:CCFPU FLAGS_REG)
|
1335 |
|
|
(compare:CCFPU
|
1336 |
|
|
(match_operand 1 "register_operand" "f")
|
1337 |
|
|
(match_operand 2 "register_operand" "f")))
|
1338 |
|
|
(clobber (match_operand:HI 0 "register_operand" "=a"))]
|
1339 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
1340 |
|
|
&& TARGET_SAHF && !TARGET_CMOVE
|
1341 |
|
|
&& GET_MODE (operands[1]) == GET_MODE (operands[2])"
|
1342 |
|
|
"#"
|
1343 |
|
|
"&& reload_completed"
|
1344 |
|
|
[(set (match_dup 0)
|
1345 |
|
|
(unspec:HI
|
1346 |
|
|
[(compare:CCFPU (match_dup 1)(match_dup 2))]
|
1347 |
|
|
UNSPEC_FNSTSW))
|
1348 |
|
|
(set (reg:CC FLAGS_REG)
|
1349 |
|
|
(unspec:CC [(match_dup 0)] UNSPEC_SAHF))]
|
1350 |
|
|
""
|
1351 |
|
|
[(set_attr "type" "multi")
|
1352 |
|
|
(set_attr "unit" "i387")
|
1353 |
|
|
(set (attr "mode")
|
1354 |
|
|
(cond [(match_operand:SF 1 "" "")
|
1355 |
|
|
(const_string "SF")
|
1356 |
|
|
(match_operand:DF 1 "" "")
|
1357 |
|
|
(const_string "DF")
|
1358 |
|
|
]
|
1359 |
|
|
(const_string "XF")))])
|
1360 |
|
|
|
1361 |
|
|
(define_insn "*cmpfp_"
|
1362 |
|
|
[(set (match_operand:HI 0 "register_operand" "=a")
|
1363 |
|
|
(unspec:HI
|
1364 |
|
|
[(compare:CCFP
|
1365 |
|
|
(match_operand 1 "register_operand" "f")
|
1366 |
|
|
(match_operator 3 "float_operator"
|
1367 |
|
|
[(match_operand:SWI24 2 "memory_operand" "m")]))]
|
1368 |
|
|
UNSPEC_FNSTSW))]
|
1369 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
1370 |
|
|
&& (TARGET_USE_MODE_FIOP || optimize_function_for_size_p (cfun))
|
1371 |
|
|
&& (GET_MODE (operands [3]) == GET_MODE (operands[1]))"
|
1372 |
|
|
"* return output_fp_compare (insn, operands, false, false);"
|
1373 |
|
|
[(set_attr "type" "multi")
|
1374 |
|
|
(set_attr "unit" "i387")
|
1375 |
|
|
(set_attr "fp_int_src" "true")
|
1376 |
|
|
(set_attr "mode" "")])
|
1377 |
|
|
|
1378 |
|
|
(define_insn_and_split "*cmpfp__cc"
|
1379 |
|
|
[(set (reg:CCFP FLAGS_REG)
|
1380 |
|
|
(compare:CCFP
|
1381 |
|
|
(match_operand 1 "register_operand" "f")
|
1382 |
|
|
(match_operator 3 "float_operator"
|
1383 |
|
|
[(match_operand:SWI24 2 "memory_operand" "m")])))
|
1384 |
|
|
(clobber (match_operand:HI 0 "register_operand" "=a"))]
|
1385 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
1386 |
|
|
&& TARGET_SAHF && !TARGET_CMOVE
|
1387 |
|
|
&& (TARGET_USE_MODE_FIOP || optimize_function_for_size_p (cfun))
|
1388 |
|
|
&& (GET_MODE (operands [3]) == GET_MODE (operands[1]))"
|
1389 |
|
|
"#"
|
1390 |
|
|
"&& reload_completed"
|
1391 |
|
|
[(set (match_dup 0)
|
1392 |
|
|
(unspec:HI
|
1393 |
|
|
[(compare:CCFP
|
1394 |
|
|
(match_dup 1)
|
1395 |
|
|
(match_op_dup 3 [(match_dup 2)]))]
|
1396 |
|
|
UNSPEC_FNSTSW))
|
1397 |
|
|
(set (reg:CC FLAGS_REG)
|
1398 |
|
|
(unspec:CC [(match_dup 0)] UNSPEC_SAHF))]
|
1399 |
|
|
""
|
1400 |
|
|
[(set_attr "type" "multi")
|
1401 |
|
|
(set_attr "unit" "i387")
|
1402 |
|
|
(set_attr "fp_int_src" "true")
|
1403 |
|
|
(set_attr "mode" "")])
|
1404 |
|
|
|
1405 |
|
|
;; FP compares, step 2
|
1406 |
|
|
;; Move the fpsw to ax.
|
1407 |
|
|
|
1408 |
|
|
(define_insn "x86_fnstsw_1"
|
1409 |
|
|
[(set (match_operand:HI 0 "register_operand" "=a")
|
1410 |
|
|
(unspec:HI [(reg:CCFP FPSR_REG)] UNSPEC_FNSTSW))]
|
1411 |
|
|
"TARGET_80387"
|
1412 |
|
|
"fnstsw\t%0"
|
1413 |
|
|
[(set (attr "length")
|
1414 |
|
|
(symbol_ref "ix86_attr_length_address_default (insn) + 2"))
|
1415 |
|
|
(set_attr "mode" "SI")
|
1416 |
|
|
(set_attr "unit" "i387")])
|
1417 |
|
|
|
1418 |
|
|
;; FP compares, step 3
|
1419 |
|
|
;; Get ax into flags, general case.
|
1420 |
|
|
|
1421 |
|
|
(define_insn "x86_sahf_1"
|
1422 |
|
|
[(set (reg:CC FLAGS_REG)
|
1423 |
|
|
(unspec:CC [(match_operand:HI 0 "register_operand" "a")]
|
1424 |
|
|
UNSPEC_SAHF))]
|
1425 |
|
|
"TARGET_SAHF"
|
1426 |
|
|
{
|
1427 |
|
|
#ifndef HAVE_AS_IX86_SAHF
|
1428 |
|
|
if (TARGET_64BIT)
|
1429 |
|
|
return ASM_BYTE "0x9e";
|
1430 |
|
|
else
|
1431 |
|
|
#endif
|
1432 |
|
|
return "sahf";
|
1433 |
|
|
}
|
1434 |
|
|
[(set_attr "length" "1")
|
1435 |
|
|
(set_attr "athlon_decode" "vector")
|
1436 |
|
|
(set_attr "amdfam10_decode" "direct")
|
1437 |
|
|
(set_attr "bdver1_decode" "direct")
|
1438 |
|
|
(set_attr "mode" "SI")])
|
1439 |
|
|
|
1440 |
|
|
;; Pentium Pro can do steps 1 through 3 in one go.
|
1441 |
|
|
;; comi*, ucomi*, fcomi*, ficomi*, fucomi*
|
1442 |
|
|
;; (these i387 instructions set flags directly)
|
1443 |
|
|
(define_insn "*cmpfp_i_mixed"
|
1444 |
|
|
[(set (reg:CCFP FLAGS_REG)
|
1445 |
|
|
(compare:CCFP (match_operand 0 "register_operand" "f,x")
|
1446 |
|
|
(match_operand 1 "nonimmediate_operand" "f,xm")))]
|
1447 |
|
|
"TARGET_MIX_SSE_I387
|
1448 |
|
|
&& SSE_FLOAT_MODE_P (GET_MODE (operands[0]))
|
1449 |
|
|
&& GET_MODE (operands[0]) == GET_MODE (operands[1])"
|
1450 |
|
|
"* return output_fp_compare (insn, operands, true, false);"
|
1451 |
|
|
[(set_attr "type" "fcmp,ssecomi")
|
1452 |
|
|
(set_attr "prefix" "orig,maybe_vex")
|
1453 |
|
|
(set (attr "mode")
|
1454 |
|
|
(if_then_else (match_operand:SF 1 "" "")
|
1455 |
|
|
(const_string "SF")
|
1456 |
|
|
(const_string "DF")))
|
1457 |
|
|
(set (attr "prefix_rep")
|
1458 |
|
|
(if_then_else (eq_attr "type" "ssecomi")
|
1459 |
|
|
(const_string "0")
|
1460 |
|
|
(const_string "*")))
|
1461 |
|
|
(set (attr "prefix_data16")
|
1462 |
|
|
(cond [(eq_attr "type" "fcmp")
|
1463 |
|
|
(const_string "*")
|
1464 |
|
|
(eq_attr "mode" "DF")
|
1465 |
|
|
(const_string "1")
|
1466 |
|
|
]
|
1467 |
|
|
(const_string "0")))
|
1468 |
|
|
(set_attr "athlon_decode" "vector")
|
1469 |
|
|
(set_attr "amdfam10_decode" "direct")
|
1470 |
|
|
(set_attr "bdver1_decode" "double")])
|
1471 |
|
|
|
1472 |
|
|
(define_insn "*cmpfp_i_sse"
|
1473 |
|
|
[(set (reg:CCFP FLAGS_REG)
|
1474 |
|
|
(compare:CCFP (match_operand 0 "register_operand" "x")
|
1475 |
|
|
(match_operand 1 "nonimmediate_operand" "xm")))]
|
1476 |
|
|
"TARGET_SSE_MATH
|
1477 |
|
|
&& SSE_FLOAT_MODE_P (GET_MODE (operands[0]))
|
1478 |
|
|
&& GET_MODE (operands[0]) == GET_MODE (operands[1])"
|
1479 |
|
|
"* return output_fp_compare (insn, operands, true, false);"
|
1480 |
|
|
[(set_attr "type" "ssecomi")
|
1481 |
|
|
(set_attr "prefix" "maybe_vex")
|
1482 |
|
|
(set (attr "mode")
|
1483 |
|
|
(if_then_else (match_operand:SF 1 "" "")
|
1484 |
|
|
(const_string "SF")
|
1485 |
|
|
(const_string "DF")))
|
1486 |
|
|
(set_attr "prefix_rep" "0")
|
1487 |
|
|
(set (attr "prefix_data16")
|
1488 |
|
|
(if_then_else (eq_attr "mode" "DF")
|
1489 |
|
|
(const_string "1")
|
1490 |
|
|
(const_string "0")))
|
1491 |
|
|
(set_attr "athlon_decode" "vector")
|
1492 |
|
|
(set_attr "amdfam10_decode" "direct")
|
1493 |
|
|
(set_attr "bdver1_decode" "double")])
|
1494 |
|
|
|
1495 |
|
|
(define_insn "*cmpfp_i_i387"
|
1496 |
|
|
[(set (reg:CCFP FLAGS_REG)
|
1497 |
|
|
(compare:CCFP (match_operand 0 "register_operand" "f")
|
1498 |
|
|
(match_operand 1 "register_operand" "f")))]
|
1499 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[0]))
|
1500 |
|
|
&& TARGET_CMOVE
|
1501 |
|
|
&& !(SSE_FLOAT_MODE_P (GET_MODE (operands[0])) && TARGET_SSE_MATH)
|
1502 |
|
|
&& GET_MODE (operands[0]) == GET_MODE (operands[1])"
|
1503 |
|
|
"* return output_fp_compare (insn, operands, true, false);"
|
1504 |
|
|
[(set_attr "type" "fcmp")
|
1505 |
|
|
(set (attr "mode")
|
1506 |
|
|
(cond [(match_operand:SF 1 "" "")
|
1507 |
|
|
(const_string "SF")
|
1508 |
|
|
(match_operand:DF 1 "" "")
|
1509 |
|
|
(const_string "DF")
|
1510 |
|
|
]
|
1511 |
|
|
(const_string "XF")))
|
1512 |
|
|
(set_attr "athlon_decode" "vector")
|
1513 |
|
|
(set_attr "amdfam10_decode" "direct")
|
1514 |
|
|
(set_attr "bdver1_decode" "double")])
|
1515 |
|
|
|
1516 |
|
|
(define_insn "*cmpfp_iu_mixed"
|
1517 |
|
|
[(set (reg:CCFPU FLAGS_REG)
|
1518 |
|
|
(compare:CCFPU (match_operand 0 "register_operand" "f,x")
|
1519 |
|
|
(match_operand 1 "nonimmediate_operand" "f,xm")))]
|
1520 |
|
|
"TARGET_MIX_SSE_I387
|
1521 |
|
|
&& SSE_FLOAT_MODE_P (GET_MODE (operands[0]))
|
1522 |
|
|
&& GET_MODE (operands[0]) == GET_MODE (operands[1])"
|
1523 |
|
|
"* return output_fp_compare (insn, operands, true, true);"
|
1524 |
|
|
[(set_attr "type" "fcmp,ssecomi")
|
1525 |
|
|
(set_attr "prefix" "orig,maybe_vex")
|
1526 |
|
|
(set (attr "mode")
|
1527 |
|
|
(if_then_else (match_operand:SF 1 "" "")
|
1528 |
|
|
(const_string "SF")
|
1529 |
|
|
(const_string "DF")))
|
1530 |
|
|
(set (attr "prefix_rep")
|
1531 |
|
|
(if_then_else (eq_attr "type" "ssecomi")
|
1532 |
|
|
(const_string "0")
|
1533 |
|
|
(const_string "*")))
|
1534 |
|
|
(set (attr "prefix_data16")
|
1535 |
|
|
(cond [(eq_attr "type" "fcmp")
|
1536 |
|
|
(const_string "*")
|
1537 |
|
|
(eq_attr "mode" "DF")
|
1538 |
|
|
(const_string "1")
|
1539 |
|
|
]
|
1540 |
|
|
(const_string "0")))
|
1541 |
|
|
(set_attr "athlon_decode" "vector")
|
1542 |
|
|
(set_attr "amdfam10_decode" "direct")
|
1543 |
|
|
(set_attr "bdver1_decode" "double")])
|
1544 |
|
|
|
1545 |
|
|
(define_insn "*cmpfp_iu_sse"
|
1546 |
|
|
[(set (reg:CCFPU FLAGS_REG)
|
1547 |
|
|
(compare:CCFPU (match_operand 0 "register_operand" "x")
|
1548 |
|
|
(match_operand 1 "nonimmediate_operand" "xm")))]
|
1549 |
|
|
"TARGET_SSE_MATH
|
1550 |
|
|
&& SSE_FLOAT_MODE_P (GET_MODE (operands[0]))
|
1551 |
|
|
&& GET_MODE (operands[0]) == GET_MODE (operands[1])"
|
1552 |
|
|
"* return output_fp_compare (insn, operands, true, true);"
|
1553 |
|
|
[(set_attr "type" "ssecomi")
|
1554 |
|
|
(set_attr "prefix" "maybe_vex")
|
1555 |
|
|
(set (attr "mode")
|
1556 |
|
|
(if_then_else (match_operand:SF 1 "" "")
|
1557 |
|
|
(const_string "SF")
|
1558 |
|
|
(const_string "DF")))
|
1559 |
|
|
(set_attr "prefix_rep" "0")
|
1560 |
|
|
(set (attr "prefix_data16")
|
1561 |
|
|
(if_then_else (eq_attr "mode" "DF")
|
1562 |
|
|
(const_string "1")
|
1563 |
|
|
(const_string "0")))
|
1564 |
|
|
(set_attr "athlon_decode" "vector")
|
1565 |
|
|
(set_attr "amdfam10_decode" "direct")
|
1566 |
|
|
(set_attr "bdver1_decode" "double")])
|
1567 |
|
|
|
1568 |
|
|
(define_insn "*cmpfp_iu_387"
|
1569 |
|
|
[(set (reg:CCFPU FLAGS_REG)
|
1570 |
|
|
(compare:CCFPU (match_operand 0 "register_operand" "f")
|
1571 |
|
|
(match_operand 1 "register_operand" "f")))]
|
1572 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[0]))
|
1573 |
|
|
&& TARGET_CMOVE
|
1574 |
|
|
&& !(SSE_FLOAT_MODE_P (GET_MODE (operands[0])) && TARGET_SSE_MATH)
|
1575 |
|
|
&& GET_MODE (operands[0]) == GET_MODE (operands[1])"
|
1576 |
|
|
"* return output_fp_compare (insn, operands, true, true);"
|
1577 |
|
|
[(set_attr "type" "fcmp")
|
1578 |
|
|
(set (attr "mode")
|
1579 |
|
|
(cond [(match_operand:SF 1 "" "")
|
1580 |
|
|
(const_string "SF")
|
1581 |
|
|
(match_operand:DF 1 "" "")
|
1582 |
|
|
(const_string "DF")
|
1583 |
|
|
]
|
1584 |
|
|
(const_string "XF")))
|
1585 |
|
|
(set_attr "athlon_decode" "vector")
|
1586 |
|
|
(set_attr "amdfam10_decode" "direct")
|
1587 |
|
|
(set_attr "bdver1_decode" "direct")])
|
1588 |
|
|
|
1589 |
|
|
;; Push/pop instructions.
|
1590 |
|
|
|
1591 |
|
|
(define_insn "*push2"
|
1592 |
|
|
[(set (match_operand:DWI 0 "push_operand" "=<")
|
1593 |
|
|
(match_operand:DWI 1 "general_no_elim_operand" "riF*o"))]
|
1594 |
|
|
""
|
1595 |
|
|
"#"
|
1596 |
|
|
[(set_attr "type" "multi")
|
1597 |
|
|
(set_attr "mode" "")])
|
1598 |
|
|
|
1599 |
|
|
(define_split
|
1600 |
|
|
[(set (match_operand:TI 0 "push_operand" "")
|
1601 |
|
|
(match_operand:TI 1 "general_operand" ""))]
|
1602 |
|
|
"TARGET_64BIT && reload_completed
|
1603 |
|
|
&& !SSE_REG_P (operands[1])"
|
1604 |
|
|
[(const_int 0)]
|
1605 |
|
|
"ix86_split_long_move (operands); DONE;")
|
1606 |
|
|
|
1607 |
|
|
(define_insn "*pushdi2_rex64"
|
1608 |
|
|
[(set (match_operand:DI 0 "push_operand" "=<,!<")
|
1609 |
|
|
(match_operand:DI 1 "general_no_elim_operand" "re*m,n"))]
|
1610 |
|
|
"TARGET_64BIT"
|
1611 |
|
|
"@
|
1612 |
|
|
push{q}\t%1
|
1613 |
|
|
#"
|
1614 |
|
|
[(set_attr "type" "push,multi")
|
1615 |
|
|
(set_attr "mode" "DI")])
|
1616 |
|
|
|
1617 |
|
|
;; Convert impossible pushes of immediate to existing instructions.
|
1618 |
|
|
;; First try to get scratch register and go through it. In case this
|
1619 |
|
|
;; fails, push sign extended lower part first and then overwrite
|
1620 |
|
|
;; upper part by 32bit move.
|
1621 |
|
|
(define_peephole2
|
1622 |
|
|
[(match_scratch:DI 2 "r")
|
1623 |
|
|
(set (match_operand:DI 0 "push_operand" "")
|
1624 |
|
|
(match_operand:DI 1 "immediate_operand" ""))]
|
1625 |
|
|
"TARGET_64BIT && !symbolic_operand (operands[1], DImode)
|
1626 |
|
|
&& !x86_64_immediate_operand (operands[1], DImode)"
|
1627 |
|
|
[(set (match_dup 2) (match_dup 1))
|
1628 |
|
|
(set (match_dup 0) (match_dup 2))])
|
1629 |
|
|
|
1630 |
|
|
;; We need to define this as both peepholer and splitter for case
|
1631 |
|
|
;; peephole2 pass is not run.
|
1632 |
|
|
;; "&& 1" is needed to keep it from matching the previous pattern.
|
1633 |
|
|
(define_peephole2
|
1634 |
|
|
[(set (match_operand:DI 0 "push_operand" "")
|
1635 |
|
|
(match_operand:DI 1 "immediate_operand" ""))]
|
1636 |
|
|
"TARGET_64BIT && !symbolic_operand (operands[1], DImode)
|
1637 |
|
|
&& !x86_64_immediate_operand (operands[1], DImode) && 1"
|
1638 |
|
|
[(set (match_dup 0) (match_dup 1))
|
1639 |
|
|
(set (match_dup 2) (match_dup 3))]
|
1640 |
|
|
{
|
1641 |
|
|
split_double_mode (DImode, &operands[1], 1, &operands[2], &operands[3]);
|
1642 |
|
|
|
1643 |
|
|
operands[1] = gen_lowpart (DImode, operands[2]);
|
1644 |
|
|
operands[2] = gen_rtx_MEM (SImode, gen_rtx_PLUS (DImode, stack_pointer_rtx,
|
1645 |
|
|
GEN_INT (4)));
|
1646 |
|
|
})
|
1647 |
|
|
|
1648 |
|
|
(define_split
|
1649 |
|
|
[(set (match_operand:DI 0 "push_operand" "")
|
1650 |
|
|
(match_operand:DI 1 "immediate_operand" ""))]
|
1651 |
|
|
"TARGET_64BIT && ((optimize > 0 && flag_peephole2)
|
1652 |
|
|
? epilogue_completed : reload_completed)
|
1653 |
|
|
&& !symbolic_operand (operands[1], DImode)
|
1654 |
|
|
&& !x86_64_immediate_operand (operands[1], DImode)"
|
1655 |
|
|
[(set (match_dup 0) (match_dup 1))
|
1656 |
|
|
(set (match_dup 2) (match_dup 3))]
|
1657 |
|
|
{
|
1658 |
|
|
split_double_mode (DImode, &operands[1], 1, &operands[2], &operands[3]);
|
1659 |
|
|
|
1660 |
|
|
operands[1] = gen_lowpart (DImode, operands[2]);
|
1661 |
|
|
operands[2] = gen_rtx_MEM (SImode, gen_rtx_PLUS (DImode, stack_pointer_rtx,
|
1662 |
|
|
GEN_INT (4)));
|
1663 |
|
|
})
|
1664 |
|
|
|
1665 |
|
|
(define_split
|
1666 |
|
|
[(set (match_operand:DI 0 "push_operand" "")
|
1667 |
|
|
(match_operand:DI 1 "general_operand" ""))]
|
1668 |
|
|
"!TARGET_64BIT && reload_completed
|
1669 |
|
|
&& !(MMX_REG_P (operands[1]) || SSE_REG_P (operands[1]))"
|
1670 |
|
|
[(const_int 0)]
|
1671 |
|
|
"ix86_split_long_move (operands); DONE;")
|
1672 |
|
|
|
1673 |
|
|
(define_insn "*pushsi2"
|
1674 |
|
|
[(set (match_operand:SI 0 "push_operand" "=<")
|
1675 |
|
|
(match_operand:SI 1 "general_no_elim_operand" "ri*m"))]
|
1676 |
|
|
"!TARGET_64BIT"
|
1677 |
|
|
"push{l}\t%1"
|
1678 |
|
|
[(set_attr "type" "push")
|
1679 |
|
|
(set_attr "mode" "SI")])
|
1680 |
|
|
|
1681 |
|
|
;; emit_push_insn when it calls move_by_pieces requires an insn to
|
1682 |
|
|
;; "push a byte/word". But actually we use pushl, which has the effect
|
1683 |
|
|
;; of rounding the amount pushed up to a word.
|
1684 |
|
|
|
1685 |
|
|
;; For TARGET_64BIT we always round up to 8 bytes.
|
1686 |
|
|
(define_insn "*push2_rex64"
|
1687 |
|
|
[(set (match_operand:SWI124 0 "push_operand" "=X")
|
1688 |
|
|
(match_operand:SWI124 1 "nonmemory_no_elim_operand" "r"))]
|
1689 |
|
|
"TARGET_64BIT"
|
1690 |
|
|
"push{q}\t%q1"
|
1691 |
|
|
[(set_attr "type" "push")
|
1692 |
|
|
(set_attr "mode" "DI")])
|
1693 |
|
|
|
1694 |
|
|
(define_insn "*push2"
|
1695 |
|
|
[(set (match_operand:SWI12 0 "push_operand" "=X")
|
1696 |
|
|
(match_operand:SWI12 1 "nonmemory_no_elim_operand" "rn"))]
|
1697 |
|
|
"!TARGET_64BIT"
|
1698 |
|
|
"push{l}\t%k1"
|
1699 |
|
|
[(set_attr "type" "push")
|
1700 |
|
|
(set_attr "mode" "SI")])
|
1701 |
|
|
|
1702 |
|
|
(define_insn "*push2_prologue"
|
1703 |
|
|
[(set (match_operand:P 0 "push_operand" "=<")
|
1704 |
|
|
(match_operand:P 1 "general_no_elim_operand" "r*m"))
|
1705 |
|
|
(clobber (mem:BLK (scratch)))]
|
1706 |
|
|
""
|
1707 |
|
|
"push{}\t%1"
|
1708 |
|
|
[(set_attr "type" "push")
|
1709 |
|
|
(set_attr "mode" "")])
|
1710 |
|
|
|
1711 |
|
|
(define_insn "*pop1"
|
1712 |
|
|
[(set (match_operand:P 0 "nonimmediate_operand" "=r*m")
|
1713 |
|
|
(match_operand:P 1 "pop_operand" ">"))]
|
1714 |
|
|
""
|
1715 |
|
|
"pop{}\t%0"
|
1716 |
|
|
[(set_attr "type" "pop")
|
1717 |
|
|
(set_attr "mode" "")])
|
1718 |
|
|
|
1719 |
|
|
(define_insn "*pop1_epilogue"
|
1720 |
|
|
[(set (match_operand:P 0 "nonimmediate_operand" "=r*m")
|
1721 |
|
|
(match_operand:P 1 "pop_operand" ">"))
|
1722 |
|
|
(clobber (mem:BLK (scratch)))]
|
1723 |
|
|
""
|
1724 |
|
|
"pop{}\t%0"
|
1725 |
|
|
[(set_attr "type" "pop")
|
1726 |
|
|
(set_attr "mode" "")])
|
1727 |
|
|
|
1728 |
|
|
;; Move instructions.
|
1729 |
|
|
|
1730 |
|
|
(define_expand "movoi"
|
1731 |
|
|
[(set (match_operand:OI 0 "nonimmediate_operand" "")
|
1732 |
|
|
(match_operand:OI 1 "general_operand" ""))]
|
1733 |
|
|
"TARGET_AVX"
|
1734 |
|
|
"ix86_expand_move (OImode, operands); DONE;")
|
1735 |
|
|
|
1736 |
|
|
(define_expand "movti"
|
1737 |
|
|
[(set (match_operand:TI 0 "nonimmediate_operand" "")
|
1738 |
|
|
(match_operand:TI 1 "nonimmediate_operand" ""))]
|
1739 |
|
|
"TARGET_64BIT || TARGET_SSE"
|
1740 |
|
|
{
|
1741 |
|
|
if (TARGET_64BIT)
|
1742 |
|
|
ix86_expand_move (TImode, operands);
|
1743 |
|
|
else if (push_operand (operands[0], TImode))
|
1744 |
|
|
ix86_expand_push (TImode, operands[1]);
|
1745 |
|
|
else
|
1746 |
|
|
ix86_expand_vector_move (TImode, operands);
|
1747 |
|
|
DONE;
|
1748 |
|
|
})
|
1749 |
|
|
|
1750 |
|
|
;; This expands to what emit_move_complex would generate if we didn't
|
1751 |
|
|
;; have a movti pattern. Having this avoids problems with reload on
|
1752 |
|
|
;; 32-bit targets when SSE is present, but doesn't seem to be harmful
|
1753 |
|
|
;; to have around all the time.
|
1754 |
|
|
(define_expand "movcdi"
|
1755 |
|
|
[(set (match_operand:CDI 0 "nonimmediate_operand" "")
|
1756 |
|
|
(match_operand:CDI 1 "general_operand" ""))]
|
1757 |
|
|
""
|
1758 |
|
|
{
|
1759 |
|
|
if (push_operand (operands[0], CDImode))
|
1760 |
|
|
emit_move_complex_push (CDImode, operands[0], operands[1]);
|
1761 |
|
|
else
|
1762 |
|
|
emit_move_complex_parts (operands[0], operands[1]);
|
1763 |
|
|
DONE;
|
1764 |
|
|
})
|
1765 |
|
|
|
1766 |
|
|
(define_expand "mov"
|
1767 |
|
|
[(set (match_operand:SWI1248x 0 "nonimmediate_operand" "")
|
1768 |
|
|
(match_operand:SWI1248x 1 "general_operand" ""))]
|
1769 |
|
|
""
|
1770 |
|
|
"ix86_expand_move (mode, operands); DONE;")
|
1771 |
|
|
|
1772 |
|
|
(define_insn "*mov_xor"
|
1773 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
1774 |
|
|
(match_operand:SWI48 1 "const0_operand" ""))
|
1775 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
1776 |
|
|
"reload_completed"
|
1777 |
|
|
"xor{l}\t%k0, %k0"
|
1778 |
|
|
[(set_attr "type" "alu1")
|
1779 |
|
|
(set_attr "mode" "SI")
|
1780 |
|
|
(set_attr "length_immediate" "0")])
|
1781 |
|
|
|
1782 |
|
|
(define_insn "*mov_or"
|
1783 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
1784 |
|
|
(match_operand:SWI48 1 "const_int_operand" ""))
|
1785 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
1786 |
|
|
"reload_completed
|
1787 |
|
|
&& operands[1] == constm1_rtx"
|
1788 |
|
|
"or{}\t{%1, %0|%0, %1}"
|
1789 |
|
|
[(set_attr "type" "alu1")
|
1790 |
|
|
(set_attr "mode" "")
|
1791 |
|
|
(set_attr "length_immediate" "1")])
|
1792 |
|
|
|
1793 |
|
|
(define_insn "*movoi_internal_avx"
|
1794 |
|
|
[(set (match_operand:OI 0 "nonimmediate_operand" "=x,x,m")
|
1795 |
|
|
(match_operand:OI 1 "vector_move_operand" "C,xm,x"))]
|
1796 |
|
|
"TARGET_AVX && !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
1797 |
|
|
{
|
1798 |
|
|
switch (which_alternative)
|
1799 |
|
|
{
|
1800 |
|
|
case 0:
|
1801 |
|
|
return standard_sse_constant_opcode (insn, operands[1]);
|
1802 |
|
|
case 1:
|
1803 |
|
|
case 2:
|
1804 |
|
|
if (misaligned_operand (operands[0], OImode)
|
1805 |
|
|
|| misaligned_operand (operands[1], OImode))
|
1806 |
|
|
return "vmovdqu\t{%1, %0|%0, %1}";
|
1807 |
|
|
else
|
1808 |
|
|
return "vmovdqa\t{%1, %0|%0, %1}";
|
1809 |
|
|
default:
|
1810 |
|
|
gcc_unreachable ();
|
1811 |
|
|
}
|
1812 |
|
|
}
|
1813 |
|
|
[(set_attr "type" "sselog1,ssemov,ssemov")
|
1814 |
|
|
(set_attr "prefix" "vex")
|
1815 |
|
|
(set_attr "mode" "OI")])
|
1816 |
|
|
|
1817 |
|
|
(define_insn "*movti_internal_rex64"
|
1818 |
|
|
[(set (match_operand:TI 0 "nonimmediate_operand" "=!r,o,x,x,xm")
|
1819 |
|
|
(match_operand:TI 1 "general_operand" "riFo,riF,C,xm,x"))]
|
1820 |
|
|
"TARGET_64BIT && !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
1821 |
|
|
{
|
1822 |
|
|
switch (which_alternative)
|
1823 |
|
|
{
|
1824 |
|
|
case 0:
|
1825 |
|
|
case 1:
|
1826 |
|
|
return "#";
|
1827 |
|
|
case 2:
|
1828 |
|
|
return standard_sse_constant_opcode (insn, operands[1]);
|
1829 |
|
|
case 3:
|
1830 |
|
|
case 4:
|
1831 |
|
|
/* TDmode values are passed as TImode on the stack. Moving them
|
1832 |
|
|
to stack may result in unaligned memory access. */
|
1833 |
|
|
if (misaligned_operand (operands[0], TImode)
|
1834 |
|
|
|| misaligned_operand (operands[1], TImode))
|
1835 |
|
|
{
|
1836 |
|
|
if (get_attr_mode (insn) == MODE_V4SF)
|
1837 |
|
|
return "%vmovups\t{%1, %0|%0, %1}";
|
1838 |
|
|
else
|
1839 |
|
|
return "%vmovdqu\t{%1, %0|%0, %1}";
|
1840 |
|
|
}
|
1841 |
|
|
else
|
1842 |
|
|
{
|
1843 |
|
|
if (get_attr_mode (insn) == MODE_V4SF)
|
1844 |
|
|
return "%vmovaps\t{%1, %0|%0, %1}";
|
1845 |
|
|
else
|
1846 |
|
|
return "%vmovdqa\t{%1, %0|%0, %1}";
|
1847 |
|
|
}
|
1848 |
|
|
default:
|
1849 |
|
|
gcc_unreachable ();
|
1850 |
|
|
}
|
1851 |
|
|
}
|
1852 |
|
|
[(set_attr "type" "*,*,sselog1,ssemov,ssemov")
|
1853 |
|
|
(set_attr "prefix" "*,*,maybe_vex,maybe_vex,maybe_vex")
|
1854 |
|
|
(set (attr "mode")
|
1855 |
|
|
(cond [(eq_attr "alternative" "2,3")
|
1856 |
|
|
(if_then_else
|
1857 |
|
|
(match_test "optimize_function_for_size_p (cfun)")
|
1858 |
|
|
(const_string "V4SF")
|
1859 |
|
|
(const_string "TI"))
|
1860 |
|
|
(eq_attr "alternative" "4")
|
1861 |
|
|
(if_then_else
|
1862 |
|
|
(ior (match_test "TARGET_SSE_TYPELESS_STORES")
|
1863 |
|
|
(match_test "optimize_function_for_size_p (cfun)"))
|
1864 |
|
|
(const_string "V4SF")
|
1865 |
|
|
(const_string "TI"))]
|
1866 |
|
|
(const_string "DI")))])
|
1867 |
|
|
|
1868 |
|
|
(define_split
|
1869 |
|
|
[(set (match_operand:TI 0 "nonimmediate_operand" "")
|
1870 |
|
|
(match_operand:TI 1 "general_operand" ""))]
|
1871 |
|
|
"reload_completed
|
1872 |
|
|
&& !SSE_REG_P (operands[0]) && !SSE_REG_P (operands[1])"
|
1873 |
|
|
[(const_int 0)]
|
1874 |
|
|
"ix86_split_long_move (operands); DONE;")
|
1875 |
|
|
|
1876 |
|
|
(define_insn "*movti_internal_sse"
|
1877 |
|
|
[(set (match_operand:TI 0 "nonimmediate_operand" "=x,x,m")
|
1878 |
|
|
(match_operand:TI 1 "vector_move_operand" "C,xm,x"))]
|
1879 |
|
|
"TARGET_SSE && !TARGET_64BIT
|
1880 |
|
|
&& !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
1881 |
|
|
{
|
1882 |
|
|
switch (which_alternative)
|
1883 |
|
|
{
|
1884 |
|
|
case 0:
|
1885 |
|
|
return standard_sse_constant_opcode (insn, operands[1]);
|
1886 |
|
|
case 1:
|
1887 |
|
|
case 2:
|
1888 |
|
|
/* TDmode values are passed as TImode on the stack. Moving them
|
1889 |
|
|
to stack may result in unaligned memory access. */
|
1890 |
|
|
if (misaligned_operand (operands[0], TImode)
|
1891 |
|
|
|| misaligned_operand (operands[1], TImode))
|
1892 |
|
|
{
|
1893 |
|
|
if (get_attr_mode (insn) == MODE_V4SF)
|
1894 |
|
|
return "%vmovups\t{%1, %0|%0, %1}";
|
1895 |
|
|
else
|
1896 |
|
|
return "%vmovdqu\t{%1, %0|%0, %1}";
|
1897 |
|
|
}
|
1898 |
|
|
else
|
1899 |
|
|
{
|
1900 |
|
|
if (get_attr_mode (insn) == MODE_V4SF)
|
1901 |
|
|
return "%vmovaps\t{%1, %0|%0, %1}";
|
1902 |
|
|
else
|
1903 |
|
|
return "%vmovdqa\t{%1, %0|%0, %1}";
|
1904 |
|
|
}
|
1905 |
|
|
default:
|
1906 |
|
|
gcc_unreachable ();
|
1907 |
|
|
}
|
1908 |
|
|
}
|
1909 |
|
|
[(set_attr "type" "sselog1,ssemov,ssemov")
|
1910 |
|
|
(set_attr "prefix" "maybe_vex")
|
1911 |
|
|
(set (attr "mode")
|
1912 |
|
|
(cond [(ior (not (match_test "TARGET_SSE2"))
|
1913 |
|
|
(match_test "optimize_function_for_size_p (cfun)"))
|
1914 |
|
|
(const_string "V4SF")
|
1915 |
|
|
(and (eq_attr "alternative" "2")
|
1916 |
|
|
(match_test "TARGET_SSE_TYPELESS_STORES"))
|
1917 |
|
|
(const_string "V4SF")]
|
1918 |
|
|
(const_string "TI")))])
|
1919 |
|
|
|
1920 |
|
|
(define_insn "*movdi_internal_rex64"
|
1921 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand"
|
1922 |
|
|
"=r,r ,r,m ,!o,*y,m*y,?*y,?r ,?*Ym,*x,m ,*x,*x,?r ,?*Yi,?*x,?*Ym")
|
1923 |
|
|
(match_operand:DI 1 "general_operand"
|
1924 |
|
|
"Z ,rem,i,re,n ,C ,*y ,m ,*Ym,r ,C ,*x,*x,m ,*Yi,r ,*Ym,*x"))]
|
1925 |
|
|
"TARGET_64BIT && !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
1926 |
|
|
{
|
1927 |
|
|
switch (get_attr_type (insn))
|
1928 |
|
|
{
|
1929 |
|
|
case TYPE_SSECVT:
|
1930 |
|
|
if (SSE_REG_P (operands[0]))
|
1931 |
|
|
return "movq2dq\t{%1, %0|%0, %1}";
|
1932 |
|
|
else
|
1933 |
|
|
return "movdq2q\t{%1, %0|%0, %1}";
|
1934 |
|
|
|
1935 |
|
|
case TYPE_SSEMOV:
|
1936 |
|
|
if (get_attr_mode (insn) == MODE_TI)
|
1937 |
|
|
return "%vmovdqa\t{%1, %0|%0, %1}";
|
1938 |
|
|
/* Handle broken assemblers that require movd instead of movq. */
|
1939 |
|
|
if (GENERAL_REG_P (operands[0]) || GENERAL_REG_P (operands[1]))
|
1940 |
|
|
return "%vmovd\t{%1, %0|%0, %1}";
|
1941 |
|
|
else
|
1942 |
|
|
return "%vmovq\t{%1, %0|%0, %1}";
|
1943 |
|
|
|
1944 |
|
|
case TYPE_MMXMOV:
|
1945 |
|
|
/* Handle broken assemblers that require movd instead of movq. */
|
1946 |
|
|
if (GENERAL_REG_P (operands[0]) || GENERAL_REG_P (operands[1]))
|
1947 |
|
|
return "movd\t{%1, %0|%0, %1}";
|
1948 |
|
|
else
|
1949 |
|
|
return "movq\t{%1, %0|%0, %1}";
|
1950 |
|
|
|
1951 |
|
|
case TYPE_SSELOG1:
|
1952 |
|
|
return standard_sse_constant_opcode (insn, operands[1]);
|
1953 |
|
|
|
1954 |
|
|
case TYPE_MMX:
|
1955 |
|
|
return "pxor\t%0, %0";
|
1956 |
|
|
|
1957 |
|
|
case TYPE_MULTI:
|
1958 |
|
|
return "#";
|
1959 |
|
|
|
1960 |
|
|
case TYPE_LEA:
|
1961 |
|
|
return "lea{q}\t{%a1, %0|%0, %a1}";
|
1962 |
|
|
|
1963 |
|
|
default:
|
1964 |
|
|
gcc_assert (!flag_pic || LEGITIMATE_PIC_OPERAND_P (operands[1]));
|
1965 |
|
|
if (get_attr_mode (insn) == MODE_SI)
|
1966 |
|
|
return "mov{l}\t{%k1, %k0|%k0, %k1}";
|
1967 |
|
|
else if (which_alternative == 2)
|
1968 |
|
|
return "movabs{q}\t{%1, %0|%0, %1}";
|
1969 |
|
|
else if (ix86_use_lea_for_mov (insn, operands))
|
1970 |
|
|
return "lea{q}\t{%a1, %0|%0, %a1}";
|
1971 |
|
|
else
|
1972 |
|
|
return "mov{q}\t{%1, %0|%0, %1}";
|
1973 |
|
|
}
|
1974 |
|
|
}
|
1975 |
|
|
[(set (attr "type")
|
1976 |
|
|
(cond [(eq_attr "alternative" "4")
|
1977 |
|
|
(const_string "multi")
|
1978 |
|
|
(eq_attr "alternative" "5")
|
1979 |
|
|
(const_string "mmx")
|
1980 |
|
|
(eq_attr "alternative" "6,7,8,9")
|
1981 |
|
|
(const_string "mmxmov")
|
1982 |
|
|
(eq_attr "alternative" "10")
|
1983 |
|
|
(const_string "sselog1")
|
1984 |
|
|
(eq_attr "alternative" "11,12,13,14,15")
|
1985 |
|
|
(const_string "ssemov")
|
1986 |
|
|
(eq_attr "alternative" "16,17")
|
1987 |
|
|
(const_string "ssecvt")
|
1988 |
|
|
(match_operand 1 "pic_32bit_operand" "")
|
1989 |
|
|
(const_string "lea")
|
1990 |
|
|
]
|
1991 |
|
|
(const_string "imov")))
|
1992 |
|
|
(set (attr "modrm")
|
1993 |
|
|
(if_then_else
|
1994 |
|
|
(and (eq_attr "alternative" "2") (eq_attr "type" "imov"))
|
1995 |
|
|
(const_string "0")
|
1996 |
|
|
(const_string "*")))
|
1997 |
|
|
(set (attr "length_immediate")
|
1998 |
|
|
(if_then_else
|
1999 |
|
|
(and (eq_attr "alternative" "2") (eq_attr "type" "imov"))
|
2000 |
|
|
(const_string "8")
|
2001 |
|
|
(const_string "*")))
|
2002 |
|
|
(set (attr "prefix_rex")
|
2003 |
|
|
(if_then_else (eq_attr "alternative" "8,9")
|
2004 |
|
|
(const_string "1")
|
2005 |
|
|
(const_string "*")))
|
2006 |
|
|
(set (attr "prefix_data16")
|
2007 |
|
|
(if_then_else (eq_attr "alternative" "11")
|
2008 |
|
|
(const_string "1")
|
2009 |
|
|
(const_string "*")))
|
2010 |
|
|
(set (attr "prefix")
|
2011 |
|
|
(if_then_else (eq_attr "alternative" "10,11,12,13,14,15")
|
2012 |
|
|
(const_string "maybe_vex")
|
2013 |
|
|
(const_string "orig")))
|
2014 |
|
|
(set_attr "mode" "SI,DI,DI,DI,SI,DI,DI,DI,DI,DI,TI,DI,TI,DI,DI,DI,DI,DI")])
|
2015 |
|
|
|
2016 |
|
|
;; Reload patterns to support multi-word load/store
|
2017 |
|
|
;; with non-offsetable address.
|
2018 |
|
|
(define_expand "reload_noff_store"
|
2019 |
|
|
[(parallel [(match_operand 0 "memory_operand" "=m")
|
2020 |
|
|
(match_operand 1 "register_operand" "r")
|
2021 |
|
|
(match_operand:DI 2 "register_operand" "=&r")])]
|
2022 |
|
|
"TARGET_64BIT"
|
2023 |
|
|
{
|
2024 |
|
|
rtx mem = operands[0];
|
2025 |
|
|
rtx addr = XEXP (mem, 0);
|
2026 |
|
|
|
2027 |
|
|
emit_move_insn (operands[2], addr);
|
2028 |
|
|
mem = replace_equiv_address_nv (mem, operands[2]);
|
2029 |
|
|
|
2030 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, mem, operands[1]));
|
2031 |
|
|
DONE;
|
2032 |
|
|
})
|
2033 |
|
|
|
2034 |
|
|
(define_expand "reload_noff_load"
|
2035 |
|
|
[(parallel [(match_operand 0 "register_operand" "=r")
|
2036 |
|
|
(match_operand 1 "memory_operand" "m")
|
2037 |
|
|
(match_operand:DI 2 "register_operand" "=r")])]
|
2038 |
|
|
"TARGET_64BIT"
|
2039 |
|
|
{
|
2040 |
|
|
rtx mem = operands[1];
|
2041 |
|
|
rtx addr = XEXP (mem, 0);
|
2042 |
|
|
|
2043 |
|
|
emit_move_insn (operands[2], addr);
|
2044 |
|
|
mem = replace_equiv_address_nv (mem, operands[2]);
|
2045 |
|
|
|
2046 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0], mem));
|
2047 |
|
|
DONE;
|
2048 |
|
|
})
|
2049 |
|
|
|
2050 |
|
|
;; Convert impossible stores of immediate to existing instructions.
|
2051 |
|
|
;; First try to get scratch register and go through it. In case this
|
2052 |
|
|
;; fails, move by 32bit parts.
|
2053 |
|
|
(define_peephole2
|
2054 |
|
|
[(match_scratch:DI 2 "r")
|
2055 |
|
|
(set (match_operand:DI 0 "memory_operand" "")
|
2056 |
|
|
(match_operand:DI 1 "immediate_operand" ""))]
|
2057 |
|
|
"TARGET_64BIT && !symbolic_operand (operands[1], DImode)
|
2058 |
|
|
&& !x86_64_immediate_operand (operands[1], DImode)"
|
2059 |
|
|
[(set (match_dup 2) (match_dup 1))
|
2060 |
|
|
(set (match_dup 0) (match_dup 2))])
|
2061 |
|
|
|
2062 |
|
|
;; We need to define this as both peepholer and splitter for case
|
2063 |
|
|
;; peephole2 pass is not run.
|
2064 |
|
|
;; "&& 1" is needed to keep it from matching the previous pattern.
|
2065 |
|
|
(define_peephole2
|
2066 |
|
|
[(set (match_operand:DI 0 "memory_operand" "")
|
2067 |
|
|
(match_operand:DI 1 "immediate_operand" ""))]
|
2068 |
|
|
"TARGET_64BIT && !symbolic_operand (operands[1], DImode)
|
2069 |
|
|
&& !x86_64_immediate_operand (operands[1], DImode) && 1"
|
2070 |
|
|
[(set (match_dup 2) (match_dup 3))
|
2071 |
|
|
(set (match_dup 4) (match_dup 5))]
|
2072 |
|
|
"split_double_mode (DImode, &operands[0], 2, &operands[2], &operands[4]);")
|
2073 |
|
|
|
2074 |
|
|
(define_split
|
2075 |
|
|
[(set (match_operand:DI 0 "memory_operand" "")
|
2076 |
|
|
(match_operand:DI 1 "immediate_operand" ""))]
|
2077 |
|
|
"TARGET_64BIT && ((optimize > 0 && flag_peephole2)
|
2078 |
|
|
? epilogue_completed : reload_completed)
|
2079 |
|
|
&& !symbolic_operand (operands[1], DImode)
|
2080 |
|
|
&& !x86_64_immediate_operand (operands[1], DImode)"
|
2081 |
|
|
[(set (match_dup 2) (match_dup 3))
|
2082 |
|
|
(set (match_dup 4) (match_dup 5))]
|
2083 |
|
|
"split_double_mode (DImode, &operands[0], 2, &operands[2], &operands[4]);")
|
2084 |
|
|
|
2085 |
|
|
(define_insn "*movdi_internal"
|
2086 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand"
|
2087 |
|
|
"=r ,o ,*y,m*y,*y,*x,m ,*x,*x,*x,m ,*x,*x,?*x,?*Ym")
|
2088 |
|
|
(match_operand:DI 1 "general_operand"
|
2089 |
|
|
"riFo,riF,C ,*y ,m ,C ,*x,*x,m ,C ,*x,*x,m ,*Ym,*x"))]
|
2090 |
|
|
"!TARGET_64BIT && !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
2091 |
|
|
{
|
2092 |
|
|
switch (get_attr_type (insn))
|
2093 |
|
|
{
|
2094 |
|
|
case TYPE_SSECVT:
|
2095 |
|
|
if (SSE_REG_P (operands[0]))
|
2096 |
|
|
return "movq2dq\t{%1, %0|%0, %1}";
|
2097 |
|
|
else
|
2098 |
|
|
return "movdq2q\t{%1, %0|%0, %1}";
|
2099 |
|
|
|
2100 |
|
|
case TYPE_SSEMOV:
|
2101 |
|
|
switch (get_attr_mode (insn))
|
2102 |
|
|
{
|
2103 |
|
|
case MODE_TI:
|
2104 |
|
|
return "%vmovdqa\t{%1, %0|%0, %1}";
|
2105 |
|
|
case MODE_DI:
|
2106 |
|
|
return "%vmovq\t{%1, %0|%0, %1}";
|
2107 |
|
|
case MODE_V4SF:
|
2108 |
|
|
return "movaps\t{%1, %0|%0, %1}";
|
2109 |
|
|
case MODE_V2SF:
|
2110 |
|
|
return "movlps\t{%1, %0|%0, %1}";
|
2111 |
|
|
default:
|
2112 |
|
|
gcc_unreachable ();
|
2113 |
|
|
}
|
2114 |
|
|
|
2115 |
|
|
case TYPE_MMXMOV:
|
2116 |
|
|
return "movq\t{%1, %0|%0, %1}";
|
2117 |
|
|
|
2118 |
|
|
case TYPE_SSELOG1:
|
2119 |
|
|
return standard_sse_constant_opcode (insn, operands[1]);
|
2120 |
|
|
|
2121 |
|
|
case TYPE_MMX:
|
2122 |
|
|
return "pxor\t%0, %0";
|
2123 |
|
|
|
2124 |
|
|
case TYPE_MULTI:
|
2125 |
|
|
return "#";
|
2126 |
|
|
|
2127 |
|
|
default:
|
2128 |
|
|
gcc_unreachable ();
|
2129 |
|
|
}
|
2130 |
|
|
}
|
2131 |
|
|
[(set (attr "isa")
|
2132 |
|
|
(cond [(eq_attr "alternative" "5,6,7,8,13,14")
|
2133 |
|
|
(const_string "sse2")
|
2134 |
|
|
(eq_attr "alternative" "9,10,11,12")
|
2135 |
|
|
(const_string "noavx")
|
2136 |
|
|
]
|
2137 |
|
|
(const_string "*")))
|
2138 |
|
|
(set (attr "type")
|
2139 |
|
|
(cond [(eq_attr "alternative" "0,1")
|
2140 |
|
|
(const_string "multi")
|
2141 |
|
|
(eq_attr "alternative" "2")
|
2142 |
|
|
(const_string "mmx")
|
2143 |
|
|
(eq_attr "alternative" "3,4")
|
2144 |
|
|
(const_string "mmxmov")
|
2145 |
|
|
(eq_attr "alternative" "5,9")
|
2146 |
|
|
(const_string "sselog1")
|
2147 |
|
|
(eq_attr "alternative" "13,14")
|
2148 |
|
|
(const_string "ssecvt")
|
2149 |
|
|
]
|
2150 |
|
|
(const_string "ssemov")))
|
2151 |
|
|
(set (attr "prefix")
|
2152 |
|
|
(if_then_else (eq_attr "alternative" "5,6,7,8")
|
2153 |
|
|
(const_string "maybe_vex")
|
2154 |
|
|
(const_string "orig")))
|
2155 |
|
|
(set_attr "mode" "DI,DI,DI,DI,DI,TI,DI,TI,DI,V4SF,V2SF,V4SF,V2SF,DI,DI")])
|
2156 |
|
|
|
2157 |
|
|
(define_split
|
2158 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "")
|
2159 |
|
|
(match_operand:DI 1 "general_operand" ""))]
|
2160 |
|
|
"!TARGET_64BIT && reload_completed
|
2161 |
|
|
&& !(MMX_REG_P (operands[0]) || SSE_REG_P (operands[0]))
|
2162 |
|
|
&& !(MMX_REG_P (operands[1]) || SSE_REG_P (operands[1]))"
|
2163 |
|
|
[(const_int 0)]
|
2164 |
|
|
"ix86_split_long_move (operands); DONE;")
|
2165 |
|
|
|
2166 |
|
|
(define_insn "*movsi_internal"
|
2167 |
|
|
[(set (match_operand:SI 0 "nonimmediate_operand"
|
2168 |
|
|
"=r,m ,*y,*y,?rm,?*y,*x,*x,?r ,m ,?*Yi,*x")
|
2169 |
|
|
(match_operand:SI 1 "general_operand"
|
2170 |
|
|
"g ,re,C ,*y,*y ,rm ,C ,*x,*Yi,*x,r ,m "))]
|
2171 |
|
|
"!(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
2172 |
|
|
{
|
2173 |
|
|
switch (get_attr_type (insn))
|
2174 |
|
|
{
|
2175 |
|
|
case TYPE_SSELOG1:
|
2176 |
|
|
return standard_sse_constant_opcode (insn, operands[1]);
|
2177 |
|
|
|
2178 |
|
|
case TYPE_SSEMOV:
|
2179 |
|
|
switch (get_attr_mode (insn))
|
2180 |
|
|
{
|
2181 |
|
|
case MODE_TI:
|
2182 |
|
|
return "%vmovdqa\t{%1, %0|%0, %1}";
|
2183 |
|
|
case MODE_V4SF:
|
2184 |
|
|
return "%vmovaps\t{%1, %0|%0, %1}";
|
2185 |
|
|
case MODE_SI:
|
2186 |
|
|
return "%vmovd\t{%1, %0|%0, %1}";
|
2187 |
|
|
case MODE_SF:
|
2188 |
|
|
return "%vmovss\t{%1, %0|%0, %1}";
|
2189 |
|
|
default:
|
2190 |
|
|
gcc_unreachable ();
|
2191 |
|
|
}
|
2192 |
|
|
|
2193 |
|
|
case TYPE_MMX:
|
2194 |
|
|
return "pxor\t%0, %0";
|
2195 |
|
|
|
2196 |
|
|
case TYPE_MMXMOV:
|
2197 |
|
|
if (get_attr_mode (insn) == MODE_DI)
|
2198 |
|
|
return "movq\t{%1, %0|%0, %1}";
|
2199 |
|
|
return "movd\t{%1, %0|%0, %1}";
|
2200 |
|
|
|
2201 |
|
|
case TYPE_LEA:
|
2202 |
|
|
return "lea{l}\t{%a1, %0|%0, %a1}";
|
2203 |
|
|
|
2204 |
|
|
default:
|
2205 |
|
|
gcc_assert (!flag_pic || LEGITIMATE_PIC_OPERAND_P (operands[1]));
|
2206 |
|
|
if (ix86_use_lea_for_mov (insn, operands))
|
2207 |
|
|
return "lea{l}\t{%a1, %0|%0, %a1}";
|
2208 |
|
|
else
|
2209 |
|
|
return "mov{l}\t{%1, %0|%0, %1}";
|
2210 |
|
|
}
|
2211 |
|
|
}
|
2212 |
|
|
[(set (attr "type")
|
2213 |
|
|
(cond [(eq_attr "alternative" "2")
|
2214 |
|
|
(const_string "mmx")
|
2215 |
|
|
(eq_attr "alternative" "3,4,5")
|
2216 |
|
|
(const_string "mmxmov")
|
2217 |
|
|
(eq_attr "alternative" "6")
|
2218 |
|
|
(const_string "sselog1")
|
2219 |
|
|
(eq_attr "alternative" "7,8,9,10,11")
|
2220 |
|
|
(const_string "ssemov")
|
2221 |
|
|
(match_operand 1 "pic_32bit_operand" "")
|
2222 |
|
|
(const_string "lea")
|
2223 |
|
|
]
|
2224 |
|
|
(const_string "imov")))
|
2225 |
|
|
(set (attr "prefix")
|
2226 |
|
|
(if_then_else (eq_attr "alternative" "0,1,2,3,4,5")
|
2227 |
|
|
(const_string "orig")
|
2228 |
|
|
(const_string "maybe_vex")))
|
2229 |
|
|
(set (attr "prefix_data16")
|
2230 |
|
|
(if_then_else (and (eq_attr "type" "ssemov") (eq_attr "mode" "SI"))
|
2231 |
|
|
(const_string "1")
|
2232 |
|
|
(const_string "*")))
|
2233 |
|
|
(set (attr "mode")
|
2234 |
|
|
(cond [(eq_attr "alternative" "2,3")
|
2235 |
|
|
(const_string "DI")
|
2236 |
|
|
(eq_attr "alternative" "6,7")
|
2237 |
|
|
(if_then_else
|
2238 |
|
|
(not (match_test "TARGET_SSE2"))
|
2239 |
|
|
(const_string "V4SF")
|
2240 |
|
|
(const_string "TI"))
|
2241 |
|
|
(and (eq_attr "alternative" "8,9,10,11")
|
2242 |
|
|
(not (match_test "TARGET_SSE2")))
|
2243 |
|
|
(const_string "SF")
|
2244 |
|
|
]
|
2245 |
|
|
(const_string "SI")))])
|
2246 |
|
|
|
2247 |
|
|
(define_insn "*movhi_internal"
|
2248 |
|
|
[(set (match_operand:HI 0 "nonimmediate_operand" "=r,r,r,m")
|
2249 |
|
|
(match_operand:HI 1 "general_operand" "r,rn,rm,rn"))]
|
2250 |
|
|
"!(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
2251 |
|
|
{
|
2252 |
|
|
switch (get_attr_type (insn))
|
2253 |
|
|
{
|
2254 |
|
|
case TYPE_IMOVX:
|
2255 |
|
|
/* movzwl is faster than movw on p2 due to partial word stalls,
|
2256 |
|
|
though not as fast as an aligned movl. */
|
2257 |
|
|
return "movz{wl|x}\t{%1, %k0|%k0, %1}";
|
2258 |
|
|
default:
|
2259 |
|
|
if (get_attr_mode (insn) == MODE_SI)
|
2260 |
|
|
return "mov{l}\t{%k1, %k0|%k0, %k1}";
|
2261 |
|
|
else
|
2262 |
|
|
return "mov{w}\t{%1, %0|%0, %1}";
|
2263 |
|
|
}
|
2264 |
|
|
}
|
2265 |
|
|
[(set (attr "type")
|
2266 |
|
|
(cond [(match_test "optimize_function_for_size_p (cfun)")
|
2267 |
|
|
(const_string "imov")
|
2268 |
|
|
(and (eq_attr "alternative" "0")
|
2269 |
|
|
(ior (not (match_test "TARGET_PARTIAL_REG_STALL"))
|
2270 |
|
|
(not (match_test "TARGET_HIMODE_MATH"))))
|
2271 |
|
|
(const_string "imov")
|
2272 |
|
|
(and (eq_attr "alternative" "1,2")
|
2273 |
|
|
(match_operand:HI 1 "aligned_operand" ""))
|
2274 |
|
|
(const_string "imov")
|
2275 |
|
|
(and (match_test "TARGET_MOVX")
|
2276 |
|
|
(eq_attr "alternative" "0,2"))
|
2277 |
|
|
(const_string "imovx")
|
2278 |
|
|
]
|
2279 |
|
|
(const_string "imov")))
|
2280 |
|
|
(set (attr "mode")
|
2281 |
|
|
(cond [(eq_attr "type" "imovx")
|
2282 |
|
|
(const_string "SI")
|
2283 |
|
|
(and (eq_attr "alternative" "1,2")
|
2284 |
|
|
(match_operand:HI 1 "aligned_operand" ""))
|
2285 |
|
|
(const_string "SI")
|
2286 |
|
|
(and (eq_attr "alternative" "0")
|
2287 |
|
|
(ior (not (match_test "TARGET_PARTIAL_REG_STALL"))
|
2288 |
|
|
(not (match_test "TARGET_HIMODE_MATH"))))
|
2289 |
|
|
(const_string "SI")
|
2290 |
|
|
]
|
2291 |
|
|
(const_string "HI")))])
|
2292 |
|
|
|
2293 |
|
|
;; Situation is quite tricky about when to choose full sized (SImode) move
|
2294 |
|
|
;; over QImode moves. For Q_REG -> Q_REG move we use full size only for
|
2295 |
|
|
;; partial register dependency machines (such as AMD Athlon), where QImode
|
2296 |
|
|
;; moves issue extra dependency and for partial register stalls machines
|
2297 |
|
|
;; that don't use QImode patterns (and QImode move cause stall on the next
|
2298 |
|
|
;; instruction).
|
2299 |
|
|
;;
|
2300 |
|
|
;; For loads of Q_REG to NONQ_REG we use full sized moves except for partial
|
2301 |
|
|
;; register stall machines with, where we use QImode instructions, since
|
2302 |
|
|
;; partial register stall can be caused there. Then we use movzx.
|
2303 |
|
|
(define_insn "*movqi_internal"
|
2304 |
|
|
[(set (match_operand:QI 0 "nonimmediate_operand" "=q,q ,q ,r,r ,?r,m")
|
2305 |
|
|
(match_operand:QI 1 "general_operand" " q,qn,qm,q,rn,qm,qn"))]
|
2306 |
|
|
"!(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
2307 |
|
|
{
|
2308 |
|
|
switch (get_attr_type (insn))
|
2309 |
|
|
{
|
2310 |
|
|
case TYPE_IMOVX:
|
2311 |
|
|
gcc_assert (ANY_QI_REG_P (operands[1]) || MEM_P (operands[1]));
|
2312 |
|
|
return "movz{bl|x}\t{%1, %k0|%k0, %1}";
|
2313 |
|
|
default:
|
2314 |
|
|
if (get_attr_mode (insn) == MODE_SI)
|
2315 |
|
|
return "mov{l}\t{%k1, %k0|%k0, %k1}";
|
2316 |
|
|
else
|
2317 |
|
|
return "mov{b}\t{%1, %0|%0, %1}";
|
2318 |
|
|
}
|
2319 |
|
|
}
|
2320 |
|
|
[(set (attr "type")
|
2321 |
|
|
(cond [(and (eq_attr "alternative" "5")
|
2322 |
|
|
(not (match_operand:QI 1 "aligned_operand" "")))
|
2323 |
|
|
(const_string "imovx")
|
2324 |
|
|
(match_test "optimize_function_for_size_p (cfun)")
|
2325 |
|
|
(const_string "imov")
|
2326 |
|
|
(and (eq_attr "alternative" "3")
|
2327 |
|
|
(ior (not (match_test "TARGET_PARTIAL_REG_STALL"))
|
2328 |
|
|
(not (match_test "TARGET_QIMODE_MATH"))))
|
2329 |
|
|
(const_string "imov")
|
2330 |
|
|
(eq_attr "alternative" "3,5")
|
2331 |
|
|
(const_string "imovx")
|
2332 |
|
|
(and (match_test "TARGET_MOVX")
|
2333 |
|
|
(eq_attr "alternative" "2"))
|
2334 |
|
|
(const_string "imovx")
|
2335 |
|
|
]
|
2336 |
|
|
(const_string "imov")))
|
2337 |
|
|
(set (attr "mode")
|
2338 |
|
|
(cond [(eq_attr "alternative" "3,4,5")
|
2339 |
|
|
(const_string "SI")
|
2340 |
|
|
(eq_attr "alternative" "6")
|
2341 |
|
|
(const_string "QI")
|
2342 |
|
|
(eq_attr "type" "imovx")
|
2343 |
|
|
(const_string "SI")
|
2344 |
|
|
(and (eq_attr "type" "imov")
|
2345 |
|
|
(and (eq_attr "alternative" "0,1")
|
2346 |
|
|
(and (match_test "TARGET_PARTIAL_REG_DEPENDENCY")
|
2347 |
|
|
(and (not (match_test "optimize_function_for_size_p (cfun)"))
|
2348 |
|
|
(not (match_test "TARGET_PARTIAL_REG_STALL"))))))
|
2349 |
|
|
(const_string "SI")
|
2350 |
|
|
;; Avoid partial register stalls when not using QImode arithmetic
|
2351 |
|
|
(and (eq_attr "type" "imov")
|
2352 |
|
|
(and (eq_attr "alternative" "0,1")
|
2353 |
|
|
(and (match_test "TARGET_PARTIAL_REG_STALL")
|
2354 |
|
|
(not (match_test "TARGET_QIMODE_MATH")))))
|
2355 |
|
|
(const_string "SI")
|
2356 |
|
|
]
|
2357 |
|
|
(const_string "QI")))])
|
2358 |
|
|
|
2359 |
|
|
;; Stores and loads of ax to arbitrary constant address.
|
2360 |
|
|
;; We fake an second form of instruction to force reload to load address
|
2361 |
|
|
;; into register when rax is not available
|
2362 |
|
|
(define_insn "*movabs_1"
|
2363 |
|
|
[(set (mem:SWI1248x (match_operand:DI 0 "x86_64_movabs_operand" "i,r"))
|
2364 |
|
|
(match_operand:SWI1248x 1 "nonmemory_operand" "a,r"))]
|
2365 |
|
|
"TARGET_LP64 && ix86_check_movabs (insn, 0)"
|
2366 |
|
|
"@
|
2367 |
|
|
movabs{}\t{%1, %P0|%P0, %1}
|
2368 |
|
|
mov{}\t{%1, %a0|%a0, %1}"
|
2369 |
|
|
[(set_attr "type" "imov")
|
2370 |
|
|
(set_attr "modrm" "0,*")
|
2371 |
|
|
(set_attr "length_address" "8,0")
|
2372 |
|
|
(set_attr "length_immediate" "0,*")
|
2373 |
|
|
(set_attr "memory" "store")
|
2374 |
|
|
(set_attr "mode" "")])
|
2375 |
|
|
|
2376 |
|
|
(define_insn "*movabs_2"
|
2377 |
|
|
[(set (match_operand:SWI1248x 0 "register_operand" "=a,r")
|
2378 |
|
|
(mem:SWI1248x (match_operand:DI 1 "x86_64_movabs_operand" "i,r")))]
|
2379 |
|
|
"TARGET_LP64 && ix86_check_movabs (insn, 1)"
|
2380 |
|
|
"@
|
2381 |
|
|
movabs{}\t{%P1, %0|%0, %P1}
|
2382 |
|
|
mov{}\t{%a1, %0|%0, %a1}"
|
2383 |
|
|
[(set_attr "type" "imov")
|
2384 |
|
|
(set_attr "modrm" "0,*")
|
2385 |
|
|
(set_attr "length_address" "8,0")
|
2386 |
|
|
(set_attr "length_immediate" "0")
|
2387 |
|
|
(set_attr "memory" "load")
|
2388 |
|
|
(set_attr "mode" "")])
|
2389 |
|
|
|
2390 |
|
|
(define_insn "*swap"
|
2391 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "+r")
|
2392 |
|
|
(match_operand:SWI48 1 "register_operand" "+r"))
|
2393 |
|
|
(set (match_dup 1)
|
2394 |
|
|
(match_dup 0))]
|
2395 |
|
|
""
|
2396 |
|
|
"xchg{}\t%1, %0"
|
2397 |
|
|
[(set_attr "type" "imov")
|
2398 |
|
|
(set_attr "mode" "")
|
2399 |
|
|
(set_attr "pent_pair" "np")
|
2400 |
|
|
(set_attr "athlon_decode" "vector")
|
2401 |
|
|
(set_attr "amdfam10_decode" "double")
|
2402 |
|
|
(set_attr "bdver1_decode" "double")])
|
2403 |
|
|
|
2404 |
|
|
(define_insn "*swap_1"
|
2405 |
|
|
[(set (match_operand:SWI12 0 "register_operand" "+r")
|
2406 |
|
|
(match_operand:SWI12 1 "register_operand" "+r"))
|
2407 |
|
|
(set (match_dup 1)
|
2408 |
|
|
(match_dup 0))]
|
2409 |
|
|
"!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun)"
|
2410 |
|
|
"xchg{l}\t%k1, %k0"
|
2411 |
|
|
[(set_attr "type" "imov")
|
2412 |
|
|
(set_attr "mode" "SI")
|
2413 |
|
|
(set_attr "pent_pair" "np")
|
2414 |
|
|
(set_attr "athlon_decode" "vector")
|
2415 |
|
|
(set_attr "amdfam10_decode" "double")
|
2416 |
|
|
(set_attr "bdver1_decode" "double")])
|
2417 |
|
|
|
2418 |
|
|
;; Not added amdfam10_decode since TARGET_PARTIAL_REG_STALL
|
2419 |
|
|
;; is disabled for AMDFAM10
|
2420 |
|
|
(define_insn "*swap_2"
|
2421 |
|
|
[(set (match_operand:SWI12 0 "register_operand" "+")
|
2422 |
|
|
(match_operand:SWI12 1 "register_operand" "+"))
|
2423 |
|
|
(set (match_dup 1)
|
2424 |
|
|
(match_dup 0))]
|
2425 |
|
|
"TARGET_PARTIAL_REG_STALL"
|
2426 |
|
|
"xchg{}\t%1, %0"
|
2427 |
|
|
[(set_attr "type" "imov")
|
2428 |
|
|
(set_attr "mode" "")
|
2429 |
|
|
(set_attr "pent_pair" "np")
|
2430 |
|
|
(set_attr "athlon_decode" "vector")])
|
2431 |
|
|
|
2432 |
|
|
(define_expand "movstrict"
|
2433 |
|
|
[(set (strict_low_part (match_operand:SWI12 0 "nonimmediate_operand" ""))
|
2434 |
|
|
(match_operand:SWI12 1 "general_operand" ""))]
|
2435 |
|
|
""
|
2436 |
|
|
{
|
2437 |
|
|
if (TARGET_PARTIAL_REG_STALL && optimize_function_for_speed_p (cfun))
|
2438 |
|
|
FAIL;
|
2439 |
|
|
if (GET_CODE (operands[0]) == SUBREG
|
2440 |
|
|
&& GET_MODE_CLASS (GET_MODE (SUBREG_REG (operands[0]))) != MODE_INT)
|
2441 |
|
|
FAIL;
|
2442 |
|
|
/* Don't generate memory->memory moves, go through a register */
|
2443 |
|
|
if (MEM_P (operands[0]) && MEM_P (operands[1]))
|
2444 |
|
|
operands[1] = force_reg (mode, operands[1]);
|
2445 |
|
|
})
|
2446 |
|
|
|
2447 |
|
|
(define_insn "*movstrict_1"
|
2448 |
|
|
[(set (strict_low_part
|
2449 |
|
|
(match_operand:SWI12 0 "nonimmediate_operand" "+m,"))
|
2450 |
|
|
(match_operand:SWI12 1 "general_operand" "n,m"))]
|
2451 |
|
|
"(!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
2452 |
|
|
&& !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
2453 |
|
|
"mov{}\t{%1, %0|%0, %1}"
|
2454 |
|
|
[(set_attr "type" "imov")
|
2455 |
|
|
(set_attr "mode" "")])
|
2456 |
|
|
|
2457 |
|
|
(define_insn "*movstrict_xor"
|
2458 |
|
|
[(set (strict_low_part (match_operand:SWI12 0 "register_operand" "+"))
|
2459 |
|
|
(match_operand:SWI12 1 "const0_operand" ""))
|
2460 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
2461 |
|
|
"reload_completed"
|
2462 |
|
|
"xor{}\t%0, %0"
|
2463 |
|
|
[(set_attr "type" "alu1")
|
2464 |
|
|
(set_attr "mode" "")
|
2465 |
|
|
(set_attr "length_immediate" "0")])
|
2466 |
|
|
|
2467 |
|
|
(define_insn "*mov_extv_1"
|
2468 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "=R")
|
2469 |
|
|
(sign_extract:SWI24 (match_operand 1 "ext_register_operand" "Q")
|
2470 |
|
|
(const_int 8)
|
2471 |
|
|
(const_int 8)))]
|
2472 |
|
|
""
|
2473 |
|
|
"movs{bl|x}\t{%h1, %k0|%k0, %h1}"
|
2474 |
|
|
[(set_attr "type" "imovx")
|
2475 |
|
|
(set_attr "mode" "SI")])
|
2476 |
|
|
|
2477 |
|
|
(define_insn "*movqi_extv_1_rex64"
|
2478 |
|
|
[(set (match_operand:QI 0 "register_operand" "=Q,?R")
|
2479 |
|
|
(sign_extract:QI (match_operand 1 "ext_register_operand" "Q,Q")
|
2480 |
|
|
(const_int 8)
|
2481 |
|
|
(const_int 8)))]
|
2482 |
|
|
"TARGET_64BIT"
|
2483 |
|
|
{
|
2484 |
|
|
switch (get_attr_type (insn))
|
2485 |
|
|
{
|
2486 |
|
|
case TYPE_IMOVX:
|
2487 |
|
|
return "movs{bl|x}\t{%h1, %k0|%k0, %h1}";
|
2488 |
|
|
default:
|
2489 |
|
|
return "mov{b}\t{%h1, %0|%0, %h1}";
|
2490 |
|
|
}
|
2491 |
|
|
}
|
2492 |
|
|
[(set (attr "type")
|
2493 |
|
|
(if_then_else (ior (not (match_operand:QI 0 "QIreg_operand" ""))
|
2494 |
|
|
(match_test "TARGET_MOVX"))
|
2495 |
|
|
(const_string "imovx")
|
2496 |
|
|
(const_string "imov")))
|
2497 |
|
|
(set (attr "mode")
|
2498 |
|
|
(if_then_else (eq_attr "type" "imovx")
|
2499 |
|
|
(const_string "SI")
|
2500 |
|
|
(const_string "QI")))])
|
2501 |
|
|
|
2502 |
|
|
(define_insn "*movqi_extv_1"
|
2503 |
|
|
[(set (match_operand:QI 0 "nonimmediate_operand" "=Qm,?r")
|
2504 |
|
|
(sign_extract:QI (match_operand 1 "ext_register_operand" "Q,Q")
|
2505 |
|
|
(const_int 8)
|
2506 |
|
|
(const_int 8)))]
|
2507 |
|
|
"!TARGET_64BIT"
|
2508 |
|
|
{
|
2509 |
|
|
switch (get_attr_type (insn))
|
2510 |
|
|
{
|
2511 |
|
|
case TYPE_IMOVX:
|
2512 |
|
|
return "movs{bl|x}\t{%h1, %k0|%k0, %h1}";
|
2513 |
|
|
default:
|
2514 |
|
|
return "mov{b}\t{%h1, %0|%0, %h1}";
|
2515 |
|
|
}
|
2516 |
|
|
}
|
2517 |
|
|
[(set (attr "type")
|
2518 |
|
|
(if_then_else (and (match_operand:QI 0 "register_operand" "")
|
2519 |
|
|
(ior (not (match_operand:QI 0 "QIreg_operand" ""))
|
2520 |
|
|
(match_test "TARGET_MOVX")))
|
2521 |
|
|
(const_string "imovx")
|
2522 |
|
|
(const_string "imov")))
|
2523 |
|
|
(set (attr "mode")
|
2524 |
|
|
(if_then_else (eq_attr "type" "imovx")
|
2525 |
|
|
(const_string "SI")
|
2526 |
|
|
(const_string "QI")))])
|
2527 |
|
|
|
2528 |
|
|
(define_insn "*mov_extzv_1"
|
2529 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=R")
|
2530 |
|
|
(zero_extract:SWI48 (match_operand 1 "ext_register_operand" "Q")
|
2531 |
|
|
(const_int 8)
|
2532 |
|
|
(const_int 8)))]
|
2533 |
|
|
""
|
2534 |
|
|
"movz{bl|x}\t{%h1, %k0|%k0, %h1}"
|
2535 |
|
|
[(set_attr "type" "imovx")
|
2536 |
|
|
(set_attr "mode" "SI")])
|
2537 |
|
|
|
2538 |
|
|
(define_insn "*movqi_extzv_2_rex64"
|
2539 |
|
|
[(set (match_operand:QI 0 "register_operand" "=Q,?R")
|
2540 |
|
|
(subreg:QI
|
2541 |
|
|
(zero_extract:SI (match_operand 1 "ext_register_operand" "Q,Q")
|
2542 |
|
|
(const_int 8)
|
2543 |
|
|
(const_int 8)) 0))]
|
2544 |
|
|
"TARGET_64BIT"
|
2545 |
|
|
{
|
2546 |
|
|
switch (get_attr_type (insn))
|
2547 |
|
|
{
|
2548 |
|
|
case TYPE_IMOVX:
|
2549 |
|
|
return "movz{bl|x}\t{%h1, %k0|%k0, %h1}";
|
2550 |
|
|
default:
|
2551 |
|
|
return "mov{b}\t{%h1, %0|%0, %h1}";
|
2552 |
|
|
}
|
2553 |
|
|
}
|
2554 |
|
|
[(set (attr "type")
|
2555 |
|
|
(if_then_else (ior (not (match_operand:QI 0 "QIreg_operand" ""))
|
2556 |
|
|
(match_test "TARGET_MOVX"))
|
2557 |
|
|
(const_string "imovx")
|
2558 |
|
|
(const_string "imov")))
|
2559 |
|
|
(set (attr "mode")
|
2560 |
|
|
(if_then_else (eq_attr "type" "imovx")
|
2561 |
|
|
(const_string "SI")
|
2562 |
|
|
(const_string "QI")))])
|
2563 |
|
|
|
2564 |
|
|
(define_insn "*movqi_extzv_2"
|
2565 |
|
|
[(set (match_operand:QI 0 "nonimmediate_operand" "=Qm,?R")
|
2566 |
|
|
(subreg:QI
|
2567 |
|
|
(zero_extract:SI (match_operand 1 "ext_register_operand" "Q,Q")
|
2568 |
|
|
(const_int 8)
|
2569 |
|
|
(const_int 8)) 0))]
|
2570 |
|
|
"!TARGET_64BIT"
|
2571 |
|
|
{
|
2572 |
|
|
switch (get_attr_type (insn))
|
2573 |
|
|
{
|
2574 |
|
|
case TYPE_IMOVX:
|
2575 |
|
|
return "movz{bl|x}\t{%h1, %k0|%k0, %h1}";
|
2576 |
|
|
default:
|
2577 |
|
|
return "mov{b}\t{%h1, %0|%0, %h1}";
|
2578 |
|
|
}
|
2579 |
|
|
}
|
2580 |
|
|
[(set (attr "type")
|
2581 |
|
|
(if_then_else (and (match_operand:QI 0 "register_operand" "")
|
2582 |
|
|
(ior (not (match_operand:QI 0 "QIreg_operand" ""))
|
2583 |
|
|
(match_test "TARGET_MOVX")))
|
2584 |
|
|
(const_string "imovx")
|
2585 |
|
|
(const_string "imov")))
|
2586 |
|
|
(set (attr "mode")
|
2587 |
|
|
(if_then_else (eq_attr "type" "imovx")
|
2588 |
|
|
(const_string "SI")
|
2589 |
|
|
(const_string "QI")))])
|
2590 |
|
|
|
2591 |
|
|
(define_expand "mov_insv_1"
|
2592 |
|
|
[(set (zero_extract:SWI48 (match_operand 0 "ext_register_operand" "")
|
2593 |
|
|
(const_int 8)
|
2594 |
|
|
(const_int 8))
|
2595 |
|
|
(match_operand:SWI48 1 "nonmemory_operand" ""))])
|
2596 |
|
|
|
2597 |
|
|
(define_insn "*mov_insv_1_rex64"
|
2598 |
|
|
[(set (zero_extract:SWI48x (match_operand 0 "ext_register_operand" "+Q")
|
2599 |
|
|
(const_int 8)
|
2600 |
|
|
(const_int 8))
|
2601 |
|
|
(match_operand:SWI48x 1 "nonmemory_operand" "Qn"))]
|
2602 |
|
|
"TARGET_64BIT"
|
2603 |
|
|
"mov{b}\t{%b1, %h0|%h0, %b1}"
|
2604 |
|
|
[(set_attr "type" "imov")
|
2605 |
|
|
(set_attr "mode" "QI")])
|
2606 |
|
|
|
2607 |
|
|
(define_insn "*movsi_insv_1"
|
2608 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "+Q")
|
2609 |
|
|
(const_int 8)
|
2610 |
|
|
(const_int 8))
|
2611 |
|
|
(match_operand:SI 1 "general_operand" "Qmn"))]
|
2612 |
|
|
"!TARGET_64BIT"
|
2613 |
|
|
"mov{b}\t{%b1, %h0|%h0, %b1}"
|
2614 |
|
|
[(set_attr "type" "imov")
|
2615 |
|
|
(set_attr "mode" "QI")])
|
2616 |
|
|
|
2617 |
|
|
(define_insn "*movqi_insv_2"
|
2618 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "+Q")
|
2619 |
|
|
(const_int 8)
|
2620 |
|
|
(const_int 8))
|
2621 |
|
|
(lshiftrt:SI (match_operand:SI 1 "register_operand" "Q")
|
2622 |
|
|
(const_int 8)))]
|
2623 |
|
|
""
|
2624 |
|
|
"mov{b}\t{%h1, %h0|%h0, %h1}"
|
2625 |
|
|
[(set_attr "type" "imov")
|
2626 |
|
|
(set_attr "mode" "QI")])
|
2627 |
|
|
|
2628 |
|
|
;; Floating point push instructions.
|
2629 |
|
|
|
2630 |
|
|
(define_insn "*pushtf"
|
2631 |
|
|
[(set (match_operand:TF 0 "push_operand" "=<,<,<")
|
2632 |
|
|
(match_operand:TF 1 "general_no_elim_operand" "x,Fo,*r"))]
|
2633 |
|
|
"TARGET_SSE2"
|
2634 |
|
|
{
|
2635 |
|
|
/* This insn should be already split before reg-stack. */
|
2636 |
|
|
gcc_unreachable ();
|
2637 |
|
|
}
|
2638 |
|
|
[(set_attr "type" "multi")
|
2639 |
|
|
(set_attr "unit" "sse,*,*")
|
2640 |
|
|
(set_attr "mode" "TF,SI,SI")])
|
2641 |
|
|
|
2642 |
|
|
;; %%% Kill this when call knows how to work this out.
|
2643 |
|
|
(define_split
|
2644 |
|
|
[(set (match_operand:TF 0 "push_operand" "")
|
2645 |
|
|
(match_operand:TF 1 "sse_reg_operand" ""))]
|
2646 |
|
|
"TARGET_SSE2 && reload_completed"
|
2647 |
|
|
[(set (reg:P SP_REG) (plus:P (reg:P SP_REG) (const_int -16)))
|
2648 |
|
|
(set (mem:TF (reg:P SP_REG)) (match_dup 1))])
|
2649 |
|
|
|
2650 |
|
|
(define_insn "*pushxf"
|
2651 |
|
|
[(set (match_operand:XF 0 "push_operand" "=<,<")
|
2652 |
|
|
(match_operand:XF 1 "general_no_elim_operand" "f,ro"))]
|
2653 |
|
|
"optimize_function_for_speed_p (cfun)"
|
2654 |
|
|
{
|
2655 |
|
|
/* This insn should be already split before reg-stack. */
|
2656 |
|
|
gcc_unreachable ();
|
2657 |
|
|
}
|
2658 |
|
|
[(set_attr "type" "multi")
|
2659 |
|
|
(set_attr "unit" "i387,*")
|
2660 |
|
|
(set_attr "mode" "XF,SI")])
|
2661 |
|
|
|
2662 |
|
|
;; Size of pushxf is 3 (for sub) + 2 (for fstp) + memory operand size.
|
2663 |
|
|
;; Size of pushxf using integer instructions is 3+3*memory operand size
|
2664 |
|
|
;; Pushing using integer instructions is longer except for constants
|
2665 |
|
|
;; and direct memory references (assuming that any given constant is pushed
|
2666 |
|
|
;; only once, but this ought to be handled elsewhere).
|
2667 |
|
|
|
2668 |
|
|
(define_insn "*pushxf_nointeger"
|
2669 |
|
|
[(set (match_operand:XF 0 "push_operand" "=<,<")
|
2670 |
|
|
(match_operand:XF 1 "general_no_elim_operand" "f,*rFo"))]
|
2671 |
|
|
"optimize_function_for_size_p (cfun)"
|
2672 |
|
|
{
|
2673 |
|
|
/* This insn should be already split before reg-stack. */
|
2674 |
|
|
gcc_unreachable ();
|
2675 |
|
|
}
|
2676 |
|
|
[(set_attr "type" "multi")
|
2677 |
|
|
(set_attr "unit" "i387,*")
|
2678 |
|
|
(set_attr "mode" "XF,SI")])
|
2679 |
|
|
|
2680 |
|
|
;; %%% Kill this when call knows how to work this out.
|
2681 |
|
|
(define_split
|
2682 |
|
|
[(set (match_operand:XF 0 "push_operand" "")
|
2683 |
|
|
(match_operand:XF 1 "fp_register_operand" ""))]
|
2684 |
|
|
"reload_completed"
|
2685 |
|
|
[(set (reg:P SP_REG) (plus:P (reg:P SP_REG) (match_dup 2)))
|
2686 |
|
|
(set (mem:XF (reg:P SP_REG)) (match_dup 1))]
|
2687 |
|
|
"operands[2] = GEN_INT (-GET_MODE_SIZE (XFmode));")
|
2688 |
|
|
|
2689 |
|
|
(define_insn "*pushdf_rex64"
|
2690 |
|
|
[(set (match_operand:DF 0 "push_operand" "=<,<,<")
|
2691 |
|
|
(match_operand:DF 1 "general_no_elim_operand" "f,Yd*rFm,x"))]
|
2692 |
|
|
"TARGET_64BIT"
|
2693 |
|
|
{
|
2694 |
|
|
/* This insn should be already split before reg-stack. */
|
2695 |
|
|
gcc_unreachable ();
|
2696 |
|
|
}
|
2697 |
|
|
[(set_attr "type" "multi")
|
2698 |
|
|
(set_attr "unit" "i387,*,*")
|
2699 |
|
|
(set_attr "mode" "DF,DI,DF")])
|
2700 |
|
|
|
2701 |
|
|
;; Size of pushdf is 3 (for sub) + 2 (for fstp) + memory operand size.
|
2702 |
|
|
;; Size of pushdf using integer instructions is 2+2*memory operand size
|
2703 |
|
|
;; On the average, pushdf using integers can be still shorter.
|
2704 |
|
|
|
2705 |
|
|
(define_insn "*pushdf"
|
2706 |
|
|
[(set (match_operand:DF 0 "push_operand" "=<,<,<")
|
2707 |
|
|
(match_operand:DF 1 "general_no_elim_operand" "f,Yd*rFo,x"))]
|
2708 |
|
|
"!TARGET_64BIT"
|
2709 |
|
|
{
|
2710 |
|
|
/* This insn should be already split before reg-stack. */
|
2711 |
|
|
gcc_unreachable ();
|
2712 |
|
|
}
|
2713 |
|
|
[(set_attr "isa" "*,*,sse2")
|
2714 |
|
|
(set_attr "type" "multi")
|
2715 |
|
|
(set_attr "unit" "i387,*,*")
|
2716 |
|
|
(set_attr "mode" "DF,DI,DF")])
|
2717 |
|
|
|
2718 |
|
|
;; %%% Kill this when call knows how to work this out.
|
2719 |
|
|
(define_split
|
2720 |
|
|
[(set (match_operand:DF 0 "push_operand" "")
|
2721 |
|
|
(match_operand:DF 1 "any_fp_register_operand" ""))]
|
2722 |
|
|
"reload_completed"
|
2723 |
|
|
[(set (reg:P SP_REG) (plus:P (reg:P SP_REG) (const_int -8)))
|
2724 |
|
|
(set (mem:DF (reg:P SP_REG)) (match_dup 1))])
|
2725 |
|
|
|
2726 |
|
|
(define_insn "*pushsf_rex64"
|
2727 |
|
|
[(set (match_operand:SF 0 "push_operand" "=X,X,X")
|
2728 |
|
|
(match_operand:SF 1 "nonmemory_no_elim_operand" "f,rF,x"))]
|
2729 |
|
|
"TARGET_64BIT"
|
2730 |
|
|
{
|
2731 |
|
|
/* Anything else should be already split before reg-stack. */
|
2732 |
|
|
gcc_assert (which_alternative == 1);
|
2733 |
|
|
return "push{q}\t%q1";
|
2734 |
|
|
}
|
2735 |
|
|
[(set_attr "type" "multi,push,multi")
|
2736 |
|
|
(set_attr "unit" "i387,*,*")
|
2737 |
|
|
(set_attr "mode" "SF,DI,SF")])
|
2738 |
|
|
|
2739 |
|
|
(define_insn "*pushsf"
|
2740 |
|
|
[(set (match_operand:SF 0 "push_operand" "=<,<,<")
|
2741 |
|
|
(match_operand:SF 1 "general_no_elim_operand" "f,rFm,x"))]
|
2742 |
|
|
"!TARGET_64BIT"
|
2743 |
|
|
{
|
2744 |
|
|
/* Anything else should be already split before reg-stack. */
|
2745 |
|
|
gcc_assert (which_alternative == 1);
|
2746 |
|
|
return "push{l}\t%1";
|
2747 |
|
|
}
|
2748 |
|
|
[(set_attr "type" "multi,push,multi")
|
2749 |
|
|
(set_attr "unit" "i387,*,*")
|
2750 |
|
|
(set_attr "mode" "SF,SI,SF")])
|
2751 |
|
|
|
2752 |
|
|
;; %%% Kill this when call knows how to work this out.
|
2753 |
|
|
(define_split
|
2754 |
|
|
[(set (match_operand:SF 0 "push_operand" "")
|
2755 |
|
|
(match_operand:SF 1 "any_fp_register_operand" ""))]
|
2756 |
|
|
"reload_completed"
|
2757 |
|
|
[(set (reg:P SP_REG) (plus:P (reg:P SP_REG) (match_dup 2)))
|
2758 |
|
|
(set (mem:SF (reg:P SP_REG)) (match_dup 1))]
|
2759 |
|
|
"operands[2] = GEN_INT (-GET_MODE_SIZE (mode));")
|
2760 |
|
|
|
2761 |
|
|
(define_split
|
2762 |
|
|
[(set (match_operand:SF 0 "push_operand" "")
|
2763 |
|
|
(match_operand:SF 1 "memory_operand" ""))]
|
2764 |
|
|
"reload_completed
|
2765 |
|
|
&& (operands[2] = find_constant_src (insn))"
|
2766 |
|
|
[(set (match_dup 0) (match_dup 2))])
|
2767 |
|
|
|
2768 |
|
|
(define_split
|
2769 |
|
|
[(set (match_operand 0 "push_operand" "")
|
2770 |
|
|
(match_operand 1 "general_operand" ""))]
|
2771 |
|
|
"reload_completed
|
2772 |
|
|
&& (GET_MODE (operands[0]) == TFmode
|
2773 |
|
|
|| GET_MODE (operands[0]) == XFmode
|
2774 |
|
|
|| GET_MODE (operands[0]) == DFmode)
|
2775 |
|
|
&& !ANY_FP_REG_P (operands[1])"
|
2776 |
|
|
[(const_int 0)]
|
2777 |
|
|
"ix86_split_long_move (operands); DONE;")
|
2778 |
|
|
|
2779 |
|
|
;; Floating point move instructions.
|
2780 |
|
|
|
2781 |
|
|
(define_expand "movtf"
|
2782 |
|
|
[(set (match_operand:TF 0 "nonimmediate_operand" "")
|
2783 |
|
|
(match_operand:TF 1 "nonimmediate_operand" ""))]
|
2784 |
|
|
"TARGET_SSE2"
|
2785 |
|
|
{
|
2786 |
|
|
ix86_expand_move (TFmode, operands);
|
2787 |
|
|
DONE;
|
2788 |
|
|
})
|
2789 |
|
|
|
2790 |
|
|
(define_expand "mov"
|
2791 |
|
|
[(set (match_operand:X87MODEF 0 "nonimmediate_operand" "")
|
2792 |
|
|
(match_operand:X87MODEF 1 "general_operand" ""))]
|
2793 |
|
|
""
|
2794 |
|
|
"ix86_expand_move (mode, operands); DONE;")
|
2795 |
|
|
|
2796 |
|
|
(define_insn "*movtf_internal"
|
2797 |
|
|
[(set (match_operand:TF 0 "nonimmediate_operand" "=x,m,x,?*r ,!o")
|
2798 |
|
|
(match_operand:TF 1 "general_operand" "xm,x,C,*roF,F*r"))]
|
2799 |
|
|
"TARGET_SSE2
|
2800 |
|
|
&& !(MEM_P (operands[0]) && MEM_P (operands[1]))
|
2801 |
|
|
&& (!can_create_pseudo_p ()
|
2802 |
|
|
|| (ix86_cmodel == CM_MEDIUM || ix86_cmodel == CM_LARGE)
|
2803 |
|
|
|| GET_CODE (operands[1]) != CONST_DOUBLE
|
2804 |
|
|
|| (optimize_function_for_size_p (cfun)
|
2805 |
|
|
&& standard_sse_constant_p (operands[1])
|
2806 |
|
|
&& !memory_operand (operands[0], TFmode))
|
2807 |
|
|
|| (!TARGET_MEMORY_MISMATCH_STALL
|
2808 |
|
|
&& memory_operand (operands[0], TFmode)))"
|
2809 |
|
|
{
|
2810 |
|
|
switch (which_alternative)
|
2811 |
|
|
{
|
2812 |
|
|
case 0:
|
2813 |
|
|
case 1:
|
2814 |
|
|
/* Handle misaligned load/store since we
|
2815 |
|
|
don't have movmisaligntf pattern. */
|
2816 |
|
|
if (misaligned_operand (operands[0], TFmode)
|
2817 |
|
|
|| misaligned_operand (operands[1], TFmode))
|
2818 |
|
|
{
|
2819 |
|
|
if (get_attr_mode (insn) == MODE_V4SF)
|
2820 |
|
|
return "%vmovups\t{%1, %0|%0, %1}";
|
2821 |
|
|
else
|
2822 |
|
|
return "%vmovdqu\t{%1, %0|%0, %1}";
|
2823 |
|
|
}
|
2824 |
|
|
else
|
2825 |
|
|
{
|
2826 |
|
|
if (get_attr_mode (insn) == MODE_V4SF)
|
2827 |
|
|
return "%vmovaps\t{%1, %0|%0, %1}";
|
2828 |
|
|
else
|
2829 |
|
|
return "%vmovdqa\t{%1, %0|%0, %1}";
|
2830 |
|
|
}
|
2831 |
|
|
|
2832 |
|
|
case 2:
|
2833 |
|
|
return standard_sse_constant_opcode (insn, operands[1]);
|
2834 |
|
|
|
2835 |
|
|
case 3:
|
2836 |
|
|
case 4:
|
2837 |
|
|
return "#";
|
2838 |
|
|
|
2839 |
|
|
default:
|
2840 |
|
|
gcc_unreachable ();
|
2841 |
|
|
}
|
2842 |
|
|
}
|
2843 |
|
|
[(set_attr "type" "ssemov,ssemov,sselog1,*,*")
|
2844 |
|
|
(set_attr "prefix" "maybe_vex,maybe_vex,maybe_vex,*,*")
|
2845 |
|
|
(set (attr "mode")
|
2846 |
|
|
(cond [(eq_attr "alternative" "0,2")
|
2847 |
|
|
(if_then_else
|
2848 |
|
|
(match_test "optimize_function_for_size_p (cfun)")
|
2849 |
|
|
(const_string "V4SF")
|
2850 |
|
|
(const_string "TI"))
|
2851 |
|
|
(eq_attr "alternative" "1")
|
2852 |
|
|
(if_then_else
|
2853 |
|
|
(ior (match_test "TARGET_SSE_TYPELESS_STORES")
|
2854 |
|
|
(match_test "optimize_function_for_size_p (cfun)"))
|
2855 |
|
|
(const_string "V4SF")
|
2856 |
|
|
(const_string "TI"))]
|
2857 |
|
|
(const_string "DI")))])
|
2858 |
|
|
|
2859 |
|
|
;; Possible store forwarding (partial memory) stall in alternative 4.
|
2860 |
|
|
(define_insn "*movxf_internal"
|
2861 |
|
|
[(set (match_operand:XF 0 "nonimmediate_operand" "=f,m,f,?Yx*r ,!o")
|
2862 |
|
|
(match_operand:XF 1 "general_operand" "fm,f,G,Yx*roF,FYx*r"))]
|
2863 |
|
|
"!(MEM_P (operands[0]) && MEM_P (operands[1]))
|
2864 |
|
|
&& (!can_create_pseudo_p ()
|
2865 |
|
|
|| (ix86_cmodel == CM_MEDIUM || ix86_cmodel == CM_LARGE)
|
2866 |
|
|
|| GET_CODE (operands[1]) != CONST_DOUBLE
|
2867 |
|
|
|| (optimize_function_for_size_p (cfun)
|
2868 |
|
|
&& standard_80387_constant_p (operands[1]) > 0
|
2869 |
|
|
&& !memory_operand (operands[0], XFmode))
|
2870 |
|
|
|| (!TARGET_MEMORY_MISMATCH_STALL
|
2871 |
|
|
&& memory_operand (operands[0], XFmode)))"
|
2872 |
|
|
{
|
2873 |
|
|
switch (which_alternative)
|
2874 |
|
|
{
|
2875 |
|
|
case 0:
|
2876 |
|
|
case 1:
|
2877 |
|
|
return output_387_reg_move (insn, operands);
|
2878 |
|
|
|
2879 |
|
|
case 2:
|
2880 |
|
|
return standard_80387_constant_opcode (operands[1]);
|
2881 |
|
|
|
2882 |
|
|
case 3:
|
2883 |
|
|
case 4:
|
2884 |
|
|
return "#";
|
2885 |
|
|
|
2886 |
|
|
default:
|
2887 |
|
|
gcc_unreachable ();
|
2888 |
|
|
}
|
2889 |
|
|
}
|
2890 |
|
|
[(set_attr "type" "fmov,fmov,fmov,multi,multi")
|
2891 |
|
|
(set_attr "mode" "XF,XF,XF,SI,SI")])
|
2892 |
|
|
|
2893 |
|
|
(define_insn "*movdf_internal_rex64"
|
2894 |
|
|
[(set (match_operand:DF 0 "nonimmediate_operand"
|
2895 |
|
|
"=f,m,f,?r,?m,?r,!o,x,x,x,m,Yi,r ")
|
2896 |
|
|
(match_operand:DF 1 "general_operand"
|
2897 |
|
|
"fm,f,G,rm,r ,F ,F ,C,x,m,x,r ,Yi"))]
|
2898 |
|
|
"TARGET_64BIT && !(MEM_P (operands[0]) && MEM_P (operands[1]))
|
2899 |
|
|
&& (!can_create_pseudo_p ()
|
2900 |
|
|
|| (ix86_cmodel == CM_MEDIUM || ix86_cmodel == CM_LARGE)
|
2901 |
|
|
|| GET_CODE (operands[1]) != CONST_DOUBLE
|
2902 |
|
|
|| (optimize_function_for_size_p (cfun)
|
2903 |
|
|
&& ((!(TARGET_SSE2 && TARGET_SSE_MATH)
|
2904 |
|
|
&& standard_80387_constant_p (operands[1]) > 0)
|
2905 |
|
|
|| (TARGET_SSE2 && TARGET_SSE_MATH
|
2906 |
|
|
&& standard_sse_constant_p (operands[1]))))
|
2907 |
|
|
|| memory_operand (operands[0], DFmode))"
|
2908 |
|
|
{
|
2909 |
|
|
switch (which_alternative)
|
2910 |
|
|
{
|
2911 |
|
|
case 0:
|
2912 |
|
|
case 1:
|
2913 |
|
|
return output_387_reg_move (insn, operands);
|
2914 |
|
|
|
2915 |
|
|
case 2:
|
2916 |
|
|
return standard_80387_constant_opcode (operands[1]);
|
2917 |
|
|
|
2918 |
|
|
case 3:
|
2919 |
|
|
case 4:
|
2920 |
|
|
return "mov{q}\t{%1, %0|%0, %1}";
|
2921 |
|
|
|
2922 |
|
|
case 5:
|
2923 |
|
|
return "movabs{q}\t{%1, %0|%0, %1}";
|
2924 |
|
|
|
2925 |
|
|
case 6:
|
2926 |
|
|
return "#";
|
2927 |
|
|
|
2928 |
|
|
case 7:
|
2929 |
|
|
return standard_sse_constant_opcode (insn, operands[1]);
|
2930 |
|
|
|
2931 |
|
|
case 8:
|
2932 |
|
|
case 9:
|
2933 |
|
|
case 10:
|
2934 |
|
|
switch (get_attr_mode (insn))
|
2935 |
|
|
{
|
2936 |
|
|
case MODE_V2DF:
|
2937 |
|
|
if (!TARGET_SSE_PACKED_SINGLE_INSN_OPTIMAL)
|
2938 |
|
|
return "%vmovapd\t{%1, %0|%0, %1}";
|
2939 |
|
|
case MODE_V4SF:
|
2940 |
|
|
return "%vmovaps\t{%1, %0|%0, %1}";
|
2941 |
|
|
|
2942 |
|
|
case MODE_DI:
|
2943 |
|
|
return "%vmovq\t{%1, %0|%0, %1}";
|
2944 |
|
|
case MODE_DF:
|
2945 |
|
|
if (TARGET_AVX && REG_P (operands[0]) && REG_P (operands[1]))
|
2946 |
|
|
return "vmovsd\t{%1, %0, %0|%0, %0, %1}";
|
2947 |
|
|
return "%vmovsd\t{%1, %0|%0, %1}";
|
2948 |
|
|
case MODE_V1DF:
|
2949 |
|
|
return "%vmovlpd\t{%1, %d0|%d0, %1}";
|
2950 |
|
|
case MODE_V2SF:
|
2951 |
|
|
return "%vmovlps\t{%1, %d0|%d0, %1}";
|
2952 |
|
|
default:
|
2953 |
|
|
gcc_unreachable ();
|
2954 |
|
|
}
|
2955 |
|
|
|
2956 |
|
|
case 11:
|
2957 |
|
|
case 12:
|
2958 |
|
|
/* Handle broken assemblers that require movd instead of movq. */
|
2959 |
|
|
return "%vmovd\t{%1, %0|%0, %1}";
|
2960 |
|
|
|
2961 |
|
|
default:
|
2962 |
|
|
gcc_unreachable();
|
2963 |
|
|
}
|
2964 |
|
|
}
|
2965 |
|
|
[(set (attr "type")
|
2966 |
|
|
(cond [(eq_attr "alternative" "0,1,2")
|
2967 |
|
|
(const_string "fmov")
|
2968 |
|
|
(eq_attr "alternative" "3,4,5")
|
2969 |
|
|
(const_string "imov")
|
2970 |
|
|
(eq_attr "alternative" "6")
|
2971 |
|
|
(const_string "multi")
|
2972 |
|
|
(eq_attr "alternative" "7")
|
2973 |
|
|
(const_string "sselog1")
|
2974 |
|
|
]
|
2975 |
|
|
(const_string "ssemov")))
|
2976 |
|
|
(set (attr "modrm")
|
2977 |
|
|
(if_then_else
|
2978 |
|
|
(and (eq_attr "alternative" "5") (eq_attr "type" "imov"))
|
2979 |
|
|
(const_string "0")
|
2980 |
|
|
(const_string "*")))
|
2981 |
|
|
(set (attr "length_immediate")
|
2982 |
|
|
(if_then_else
|
2983 |
|
|
(and (eq_attr "alternative" "5") (eq_attr "type" "imov"))
|
2984 |
|
|
(const_string "8")
|
2985 |
|
|
(const_string "*")))
|
2986 |
|
|
(set (attr "prefix")
|
2987 |
|
|
(if_then_else (eq_attr "alternative" "0,1,2,3,4,5,6")
|
2988 |
|
|
(const_string "orig")
|
2989 |
|
|
(const_string "maybe_vex")))
|
2990 |
|
|
(set (attr "prefix_data16")
|
2991 |
|
|
(if_then_else (eq_attr "mode" "V1DF")
|
2992 |
|
|
(const_string "1")
|
2993 |
|
|
(const_string "*")))
|
2994 |
|
|
(set (attr "mode")
|
2995 |
|
|
(cond [(eq_attr "alternative" "0,1,2")
|
2996 |
|
|
(const_string "DF")
|
2997 |
|
|
(eq_attr "alternative" "3,4,5,6,11,12")
|
2998 |
|
|
(const_string "DI")
|
2999 |
|
|
|
3000 |
|
|
/* xorps is one byte shorter. */
|
3001 |
|
|
(eq_attr "alternative" "7")
|
3002 |
|
|
(cond [(match_test "optimize_function_for_size_p (cfun)")
|
3003 |
|
|
(const_string "V4SF")
|
3004 |
|
|
(match_test "TARGET_SSE_LOAD0_BY_PXOR")
|
3005 |
|
|
(const_string "TI")
|
3006 |
|
|
]
|
3007 |
|
|
(const_string "V2DF"))
|
3008 |
|
|
|
3009 |
|
|
/* For architectures resolving dependencies on
|
3010 |
|
|
whole SSE registers use APD move to break dependency
|
3011 |
|
|
chains, otherwise use short move to avoid extra work.
|
3012 |
|
|
|
3013 |
|
|
movaps encodes one byte shorter. */
|
3014 |
|
|
(eq_attr "alternative" "8")
|
3015 |
|
|
(cond
|
3016 |
|
|
[(match_test "optimize_function_for_size_p (cfun)")
|
3017 |
|
|
(const_string "V4SF")
|
3018 |
|
|
(match_test "TARGET_SSE_PARTIAL_REG_DEPENDENCY")
|
3019 |
|
|
(const_string "V2DF")
|
3020 |
|
|
]
|
3021 |
|
|
(const_string "DF"))
|
3022 |
|
|
/* For architectures resolving dependencies on register
|
3023 |
|
|
parts we may avoid extra work to zero out upper part
|
3024 |
|
|
of register. */
|
3025 |
|
|
(eq_attr "alternative" "9")
|
3026 |
|
|
(if_then_else
|
3027 |
|
|
(match_test "TARGET_SSE_SPLIT_REGS")
|
3028 |
|
|
(const_string "V1DF")
|
3029 |
|
|
(const_string "DF"))
|
3030 |
|
|
]
|
3031 |
|
|
(const_string "DF")))])
|
3032 |
|
|
|
3033 |
|
|
;; Possible store forwarding (partial memory) stall in alternative 4.
|
3034 |
|
|
(define_insn "*movdf_internal"
|
3035 |
|
|
[(set (match_operand:DF 0 "nonimmediate_operand"
|
3036 |
|
|
"=f,m,f,?Yd*r ,!o ,x,x,x,m,*x,*x,*x,m")
|
3037 |
|
|
(match_operand:DF 1 "general_operand"
|
3038 |
|
|
"fm,f,G,Yd*roF,FYd*r,C,x,m,x,C ,*x,m ,*x"))]
|
3039 |
|
|
"!TARGET_64BIT && !(MEM_P (operands[0]) && MEM_P (operands[1]))
|
3040 |
|
|
&& (!can_create_pseudo_p ()
|
3041 |
|
|
|| (ix86_cmodel == CM_MEDIUM || ix86_cmodel == CM_LARGE)
|
3042 |
|
|
|| GET_CODE (operands[1]) != CONST_DOUBLE
|
3043 |
|
|
|| (optimize_function_for_size_p (cfun)
|
3044 |
|
|
&& ((!(TARGET_SSE2 && TARGET_SSE_MATH)
|
3045 |
|
|
&& standard_80387_constant_p (operands[1]) > 0)
|
3046 |
|
|
|| (TARGET_SSE2 && TARGET_SSE_MATH
|
3047 |
|
|
&& standard_sse_constant_p (operands[1])))
|
3048 |
|
|
&& !memory_operand (operands[0], DFmode))
|
3049 |
|
|
|| (!TARGET_MEMORY_MISMATCH_STALL
|
3050 |
|
|
&& memory_operand (operands[0], DFmode)))"
|
3051 |
|
|
{
|
3052 |
|
|
switch (which_alternative)
|
3053 |
|
|
{
|
3054 |
|
|
case 0:
|
3055 |
|
|
case 1:
|
3056 |
|
|
return output_387_reg_move (insn, operands);
|
3057 |
|
|
|
3058 |
|
|
case 2:
|
3059 |
|
|
return standard_80387_constant_opcode (operands[1]);
|
3060 |
|
|
|
3061 |
|
|
case 3:
|
3062 |
|
|
case 4:
|
3063 |
|
|
return "#";
|
3064 |
|
|
|
3065 |
|
|
case 5:
|
3066 |
|
|
case 9:
|
3067 |
|
|
return standard_sse_constant_opcode (insn, operands[1]);
|
3068 |
|
|
|
3069 |
|
|
case 6:
|
3070 |
|
|
case 7:
|
3071 |
|
|
case 8:
|
3072 |
|
|
case 10:
|
3073 |
|
|
case 11:
|
3074 |
|
|
case 12:
|
3075 |
|
|
switch (get_attr_mode (insn))
|
3076 |
|
|
{
|
3077 |
|
|
case MODE_V2DF:
|
3078 |
|
|
if (!TARGET_SSE_PACKED_SINGLE_INSN_OPTIMAL)
|
3079 |
|
|
return "%vmovapd\t{%1, %0|%0, %1}";
|
3080 |
|
|
case MODE_V4SF:
|
3081 |
|
|
return "%vmovaps\t{%1, %0|%0, %1}";
|
3082 |
|
|
|
3083 |
|
|
case MODE_DI:
|
3084 |
|
|
return "%vmovq\t{%1, %0|%0, %1}";
|
3085 |
|
|
case MODE_DF:
|
3086 |
|
|
if (TARGET_AVX && REG_P (operands[0]) && REG_P (operands[1]))
|
3087 |
|
|
return "vmovsd\t{%1, %0, %0|%0, %0, %1}";
|
3088 |
|
|
return "%vmovsd\t{%1, %0|%0, %1}";
|
3089 |
|
|
case MODE_V1DF:
|
3090 |
|
|
return "%vmovlpd\t{%1, %d0|%d0, %1}";
|
3091 |
|
|
case MODE_V2SF:
|
3092 |
|
|
return "%vmovlps\t{%1, %d0|%d0, %1}";
|
3093 |
|
|
default:
|
3094 |
|
|
gcc_unreachable ();
|
3095 |
|
|
}
|
3096 |
|
|
|
3097 |
|
|
default:
|
3098 |
|
|
gcc_unreachable ();
|
3099 |
|
|
}
|
3100 |
|
|
}
|
3101 |
|
|
[(set (attr "isa")
|
3102 |
|
|
(if_then_else (eq_attr "alternative" "5,6,7,8")
|
3103 |
|
|
(const_string "sse2")
|
3104 |
|
|
(const_string "*")))
|
3105 |
|
|
(set (attr "type")
|
3106 |
|
|
(cond [(eq_attr "alternative" "0,1,2")
|
3107 |
|
|
(const_string "fmov")
|
3108 |
|
|
(eq_attr "alternative" "3,4")
|
3109 |
|
|
(const_string "multi")
|
3110 |
|
|
(eq_attr "alternative" "5,9")
|
3111 |
|
|
(const_string "sselog1")
|
3112 |
|
|
]
|
3113 |
|
|
(const_string "ssemov")))
|
3114 |
|
|
(set (attr "prefix")
|
3115 |
|
|
(if_then_else (eq_attr "alternative" "0,1,2,3,4")
|
3116 |
|
|
(const_string "orig")
|
3117 |
|
|
(const_string "maybe_vex")))
|
3118 |
|
|
(set (attr "prefix_data16")
|
3119 |
|
|
(if_then_else (eq_attr "mode" "V1DF")
|
3120 |
|
|
(const_string "1")
|
3121 |
|
|
(const_string "*")))
|
3122 |
|
|
(set (attr "mode")
|
3123 |
|
|
(cond [(eq_attr "alternative" "0,1,2")
|
3124 |
|
|
(const_string "DF")
|
3125 |
|
|
(eq_attr "alternative" "3,4")
|
3126 |
|
|
(const_string "SI")
|
3127 |
|
|
|
3128 |
|
|
/* For SSE1, we have many fewer alternatives. */
|
3129 |
|
|
(not (match_test "TARGET_SSE2"))
|
3130 |
|
|
(if_then_else
|
3131 |
|
|
(eq_attr "alternative" "5,6,9,10")
|
3132 |
|
|
(const_string "V4SF")
|
3133 |
|
|
(const_string "V2SF"))
|
3134 |
|
|
|
3135 |
|
|
/* xorps is one byte shorter. */
|
3136 |
|
|
(eq_attr "alternative" "5,9")
|
3137 |
|
|
(cond [(match_test "optimize_function_for_size_p (cfun)")
|
3138 |
|
|
(const_string "V4SF")
|
3139 |
|
|
(match_test "TARGET_SSE_LOAD0_BY_PXOR")
|
3140 |
|
|
(const_string "TI")
|
3141 |
|
|
]
|
3142 |
|
|
(const_string "V2DF"))
|
3143 |
|
|
|
3144 |
|
|
/* For architectures resolving dependencies on
|
3145 |
|
|
whole SSE registers use APD move to break dependency
|
3146 |
|
|
chains, otherwise use short move to avoid extra work.
|
3147 |
|
|
|
3148 |
|
|
movaps encodes one byte shorter. */
|
3149 |
|
|
(eq_attr "alternative" "6,10")
|
3150 |
|
|
(cond
|
3151 |
|
|
[(match_test "optimize_function_for_size_p (cfun)")
|
3152 |
|
|
(const_string "V4SF")
|
3153 |
|
|
(match_test "TARGET_SSE_PARTIAL_REG_DEPENDENCY")
|
3154 |
|
|
(const_string "V2DF")
|
3155 |
|
|
]
|
3156 |
|
|
(const_string "DF"))
|
3157 |
|
|
/* For architectures resolving dependencies on register
|
3158 |
|
|
parts we may avoid extra work to zero out upper part
|
3159 |
|
|
of register. */
|
3160 |
|
|
(eq_attr "alternative" "7,11")
|
3161 |
|
|
(if_then_else
|
3162 |
|
|
(match_test "TARGET_SSE_SPLIT_REGS")
|
3163 |
|
|
(const_string "V1DF")
|
3164 |
|
|
(const_string "DF"))
|
3165 |
|
|
]
|
3166 |
|
|
(const_string "DF")))])
|
3167 |
|
|
|
3168 |
|
|
(define_insn "*movsf_internal"
|
3169 |
|
|
[(set (match_operand:SF 0 "nonimmediate_operand"
|
3170 |
|
|
"=f,m,f,?r ,?m,x,x,x,m,!*y,!m,!*y,?Yi,?r,!*Ym,!r")
|
3171 |
|
|
(match_operand:SF 1 "general_operand"
|
3172 |
|
|
"fm,f,G,rmF,Fr,C,x,m,x,m ,*y,*y ,r ,Yi,r ,*Ym"))]
|
3173 |
|
|
"!(MEM_P (operands[0]) && MEM_P (operands[1]))
|
3174 |
|
|
&& (!can_create_pseudo_p ()
|
3175 |
|
|
|| (ix86_cmodel == CM_MEDIUM || ix86_cmodel == CM_LARGE)
|
3176 |
|
|
|| GET_CODE (operands[1]) != CONST_DOUBLE
|
3177 |
|
|
|| (optimize_function_for_size_p (cfun)
|
3178 |
|
|
&& ((!TARGET_SSE_MATH
|
3179 |
|
|
&& standard_80387_constant_p (operands[1]) > 0)
|
3180 |
|
|
|| (TARGET_SSE_MATH
|
3181 |
|
|
&& standard_sse_constant_p (operands[1]))))
|
3182 |
|
|
|| memory_operand (operands[0], SFmode))"
|
3183 |
|
|
{
|
3184 |
|
|
switch (which_alternative)
|
3185 |
|
|
{
|
3186 |
|
|
case 0:
|
3187 |
|
|
case 1:
|
3188 |
|
|
return output_387_reg_move (insn, operands);
|
3189 |
|
|
|
3190 |
|
|
case 2:
|
3191 |
|
|
return standard_80387_constant_opcode (operands[1]);
|
3192 |
|
|
|
3193 |
|
|
case 3:
|
3194 |
|
|
case 4:
|
3195 |
|
|
return "mov{l}\t{%1, %0|%0, %1}";
|
3196 |
|
|
|
3197 |
|
|
case 5:
|
3198 |
|
|
return standard_sse_constant_opcode (insn, operands[1]);
|
3199 |
|
|
|
3200 |
|
|
case 6:
|
3201 |
|
|
if (get_attr_mode (insn) == MODE_V4SF)
|
3202 |
|
|
return "%vmovaps\t{%1, %0|%0, %1}";
|
3203 |
|
|
if (TARGET_AVX)
|
3204 |
|
|
return "vmovss\t{%1, %0, %0|%0, %0, %1}";
|
3205 |
|
|
|
3206 |
|
|
case 7:
|
3207 |
|
|
case 8:
|
3208 |
|
|
return "%vmovss\t{%1, %0|%0, %1}";
|
3209 |
|
|
|
3210 |
|
|
case 9:
|
3211 |
|
|
case 10:
|
3212 |
|
|
case 14:
|
3213 |
|
|
case 15:
|
3214 |
|
|
return "movd\t{%1, %0|%0, %1}";
|
3215 |
|
|
|
3216 |
|
|
case 11:
|
3217 |
|
|
return "movq\t{%1, %0|%0, %1}";
|
3218 |
|
|
|
3219 |
|
|
case 12:
|
3220 |
|
|
case 13:
|
3221 |
|
|
return "%vmovd\t{%1, %0|%0, %1}";
|
3222 |
|
|
|
3223 |
|
|
default:
|
3224 |
|
|
gcc_unreachable ();
|
3225 |
|
|
}
|
3226 |
|
|
}
|
3227 |
|
|
[(set (attr "type")
|
3228 |
|
|
(cond [(eq_attr "alternative" "0,1,2")
|
3229 |
|
|
(const_string "fmov")
|
3230 |
|
|
(eq_attr "alternative" "3,4")
|
3231 |
|
|
(const_string "multi")
|
3232 |
|
|
(eq_attr "alternative" "5")
|
3233 |
|
|
(const_string "sselog1")
|
3234 |
|
|
(eq_attr "alternative" "9,10,11,14,15")
|
3235 |
|
|
(const_string "mmxmov")
|
3236 |
|
|
]
|
3237 |
|
|
(const_string "ssemov")))
|
3238 |
|
|
(set (attr "prefix")
|
3239 |
|
|
(if_then_else (eq_attr "alternative" "5,6,7,8,12,13")
|
3240 |
|
|
(const_string "maybe_vex")
|
3241 |
|
|
(const_string "orig")))
|
3242 |
|
|
(set (attr "mode")
|
3243 |
|
|
(cond [(eq_attr "alternative" "3,4,9,10")
|
3244 |
|
|
(const_string "SI")
|
3245 |
|
|
(eq_attr "alternative" "5")
|
3246 |
|
|
(if_then_else
|
3247 |
|
|
(and (and (match_test "TARGET_SSE_LOAD0_BY_PXOR")
|
3248 |
|
|
(match_test "TARGET_SSE2"))
|
3249 |
|
|
(not (match_test "optimize_function_for_size_p (cfun)")))
|
3250 |
|
|
(const_string "TI")
|
3251 |
|
|
(const_string "V4SF"))
|
3252 |
|
|
/* For architectures resolving dependencies on
|
3253 |
|
|
whole SSE registers use APS move to break dependency
|
3254 |
|
|
chains, otherwise use short move to avoid extra work.
|
3255 |
|
|
|
3256 |
|
|
Do the same for architectures resolving dependencies on
|
3257 |
|
|
the parts. While in DF mode it is better to always handle
|
3258 |
|
|
just register parts, the SF mode is different due to lack
|
3259 |
|
|
of instructions to load just part of the register. It is
|
3260 |
|
|
better to maintain the whole registers in single format
|
3261 |
|
|
to avoid problems on using packed logical operations. */
|
3262 |
|
|
(eq_attr "alternative" "6")
|
3263 |
|
|
(if_then_else
|
3264 |
|
|
(ior (match_test "TARGET_SSE_PARTIAL_REG_DEPENDENCY")
|
3265 |
|
|
(match_test "TARGET_SSE_SPLIT_REGS"))
|
3266 |
|
|
(const_string "V4SF")
|
3267 |
|
|
(const_string "SF"))
|
3268 |
|
|
(eq_attr "alternative" "11")
|
3269 |
|
|
(const_string "DI")]
|
3270 |
|
|
(const_string "SF")))])
|
3271 |
|
|
|
3272 |
|
|
(define_split
|
3273 |
|
|
[(set (match_operand 0 "any_fp_register_operand" "")
|
3274 |
|
|
(match_operand 1 "memory_operand" ""))]
|
3275 |
|
|
"reload_completed
|
3276 |
|
|
&& (GET_MODE (operands[0]) == TFmode
|
3277 |
|
|
|| GET_MODE (operands[0]) == XFmode
|
3278 |
|
|
|| GET_MODE (operands[0]) == DFmode
|
3279 |
|
|
|| GET_MODE (operands[0]) == SFmode)
|
3280 |
|
|
&& (operands[2] = find_constant_src (insn))"
|
3281 |
|
|
[(set (match_dup 0) (match_dup 2))]
|
3282 |
|
|
{
|
3283 |
|
|
rtx c = operands[2];
|
3284 |
|
|
int r = REGNO (operands[0]);
|
3285 |
|
|
|
3286 |
|
|
if ((SSE_REGNO_P (r) && !standard_sse_constant_p (c))
|
3287 |
|
|
|| (FP_REGNO_P (r) && standard_80387_constant_p (c) < 1))
|
3288 |
|
|
FAIL;
|
3289 |
|
|
})
|
3290 |
|
|
|
3291 |
|
|
(define_split
|
3292 |
|
|
[(set (match_operand 0 "any_fp_register_operand" "")
|
3293 |
|
|
(float_extend (match_operand 1 "memory_operand" "")))]
|
3294 |
|
|
"reload_completed
|
3295 |
|
|
&& (GET_MODE (operands[0]) == TFmode
|
3296 |
|
|
|| GET_MODE (operands[0]) == XFmode
|
3297 |
|
|
|| GET_MODE (operands[0]) == DFmode)
|
3298 |
|
|
&& (operands[2] = find_constant_src (insn))"
|
3299 |
|
|
[(set (match_dup 0) (match_dup 2))]
|
3300 |
|
|
{
|
3301 |
|
|
rtx c = operands[2];
|
3302 |
|
|
int r = REGNO (operands[0]);
|
3303 |
|
|
|
3304 |
|
|
if ((SSE_REGNO_P (r) && !standard_sse_constant_p (c))
|
3305 |
|
|
|| (FP_REGNO_P (r) && standard_80387_constant_p (c) < 1))
|
3306 |
|
|
FAIL;
|
3307 |
|
|
})
|
3308 |
|
|
|
3309 |
|
|
;; Split the load of -0.0 or -1.0 into fldz;fchs or fld1;fchs sequence
|
3310 |
|
|
(define_split
|
3311 |
|
|
[(set (match_operand:X87MODEF 0 "fp_register_operand" "")
|
3312 |
|
|
(match_operand:X87MODEF 1 "immediate_operand" ""))]
|
3313 |
|
|
"reload_completed
|
3314 |
|
|
&& (standard_80387_constant_p (operands[1]) == 8
|
3315 |
|
|
|| standard_80387_constant_p (operands[1]) == 9)"
|
3316 |
|
|
[(set (match_dup 0)(match_dup 1))
|
3317 |
|
|
(set (match_dup 0)
|
3318 |
|
|
(neg:X87MODEF (match_dup 0)))]
|
3319 |
|
|
{
|
3320 |
|
|
REAL_VALUE_TYPE r;
|
3321 |
|
|
|
3322 |
|
|
REAL_VALUE_FROM_CONST_DOUBLE (r, operands[1]);
|
3323 |
|
|
if (real_isnegzero (&r))
|
3324 |
|
|
operands[1] = CONST0_RTX (mode);
|
3325 |
|
|
else
|
3326 |
|
|
operands[1] = CONST1_RTX (mode);
|
3327 |
|
|
})
|
3328 |
|
|
|
3329 |
|
|
(define_split
|
3330 |
|
|
[(set (match_operand 0 "nonimmediate_operand" "")
|
3331 |
|
|
(match_operand 1 "general_operand" ""))]
|
3332 |
|
|
"reload_completed
|
3333 |
|
|
&& (GET_MODE (operands[0]) == TFmode
|
3334 |
|
|
|| GET_MODE (operands[0]) == XFmode
|
3335 |
|
|
|| GET_MODE (operands[0]) == DFmode)
|
3336 |
|
|
&& !(ANY_FP_REG_P (operands[0]) || ANY_FP_REG_P (operands[1]))"
|
3337 |
|
|
[(const_int 0)]
|
3338 |
|
|
"ix86_split_long_move (operands); DONE;")
|
3339 |
|
|
|
3340 |
|
|
(define_insn "swapxf"
|
3341 |
|
|
[(set (match_operand:XF 0 "register_operand" "+f")
|
3342 |
|
|
(match_operand:XF 1 "register_operand" "+f"))
|
3343 |
|
|
(set (match_dup 1)
|
3344 |
|
|
(match_dup 0))]
|
3345 |
|
|
"TARGET_80387"
|
3346 |
|
|
{
|
3347 |
|
|
if (STACK_TOP_P (operands[0]))
|
3348 |
|
|
return "fxch\t%1";
|
3349 |
|
|
else
|
3350 |
|
|
return "fxch\t%0";
|
3351 |
|
|
}
|
3352 |
|
|
[(set_attr "type" "fxch")
|
3353 |
|
|
(set_attr "mode" "XF")])
|
3354 |
|
|
|
3355 |
|
|
(define_insn "*swap"
|
3356 |
|
|
[(set (match_operand:MODEF 0 "fp_register_operand" "+f")
|
3357 |
|
|
(match_operand:MODEF 1 "fp_register_operand" "+f"))
|
3358 |
|
|
(set (match_dup 1)
|
3359 |
|
|
(match_dup 0))]
|
3360 |
|
|
"TARGET_80387 || reload_completed"
|
3361 |
|
|
{
|
3362 |
|
|
if (STACK_TOP_P (operands[0]))
|
3363 |
|
|
return "fxch\t%1";
|
3364 |
|
|
else
|
3365 |
|
|
return "fxch\t%0";
|
3366 |
|
|
}
|
3367 |
|
|
[(set_attr "type" "fxch")
|
3368 |
|
|
(set_attr "mode" "")])
|
3369 |
|
|
|
3370 |
|
|
;; Zero extension instructions
|
3371 |
|
|
|
3372 |
|
|
(define_expand "zero_extendsidi2"
|
3373 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "")
|
3374 |
|
|
(zero_extend:DI (match_operand:SI 1 "nonimmediate_operand" "")))]
|
3375 |
|
|
""
|
3376 |
|
|
{
|
3377 |
|
|
if (!TARGET_64BIT)
|
3378 |
|
|
{
|
3379 |
|
|
emit_insn (gen_zero_extendsidi2_1 (operands[0], operands[1]));
|
3380 |
|
|
DONE;
|
3381 |
|
|
}
|
3382 |
|
|
})
|
3383 |
|
|
|
3384 |
|
|
(define_insn "*zero_extendsidi2_rex64"
|
3385 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "=r,o,?*Ym,?*y,?*Yi,*x")
|
3386 |
|
|
(zero_extend:DI
|
3387 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "rm,0,r ,m ,r ,m")))]
|
3388 |
|
|
"TARGET_64BIT"
|
3389 |
|
|
"@
|
3390 |
|
|
mov{l}\t{%1, %k0|%k0, %1}
|
3391 |
|
|
#
|
3392 |
|
|
movd\t{%1, %0|%0, %1}
|
3393 |
|
|
movd\t{%1, %0|%0, %1}
|
3394 |
|
|
%vmovd\t{%1, %0|%0, %1}
|
3395 |
|
|
%vmovd\t{%1, %0|%0, %1}"
|
3396 |
|
|
[(set_attr "type" "imovx,imov,mmxmov,mmxmov,ssemov,ssemov")
|
3397 |
|
|
(set_attr "prefix" "orig,*,orig,orig,maybe_vex,maybe_vex")
|
3398 |
|
|
(set_attr "prefix_0f" "0,*,*,*,*,*")
|
3399 |
|
|
(set_attr "mode" "SI,DI,DI,DI,TI,TI")])
|
3400 |
|
|
|
3401 |
|
|
(define_split
|
3402 |
|
|
[(set (match_operand:DI 0 "memory_operand" "")
|
3403 |
|
|
(zero_extend:DI (match_dup 0)))]
|
3404 |
|
|
"TARGET_64BIT"
|
3405 |
|
|
[(set (match_dup 4) (const_int 0))]
|
3406 |
|
|
"split_double_mode (DImode, &operands[0], 1, &operands[3], &operands[4]);")
|
3407 |
|
|
|
3408 |
|
|
;; %%% Kill me once multi-word ops are sane.
|
3409 |
|
|
(define_insn "zero_extendsidi2_1"
|
3410 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "=r,?r,?o,?*Ym,?*y,?*Yi,*x")
|
3411 |
|
|
(zero_extend:DI
|
3412 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "0,rm,r ,r ,m ,r ,m")))
|
3413 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
3414 |
|
|
"!TARGET_64BIT"
|
3415 |
|
|
"@
|
3416 |
|
|
#
|
3417 |
|
|
#
|
3418 |
|
|
#
|
3419 |
|
|
movd\t{%1, %0|%0, %1}
|
3420 |
|
|
movd\t{%1, %0|%0, %1}
|
3421 |
|
|
%vmovd\t{%1, %0|%0, %1}
|
3422 |
|
|
%vmovd\t{%1, %0|%0, %1}"
|
3423 |
|
|
[(set_attr "isa" "*,*,*,*,*,*,sse2")
|
3424 |
|
|
(set_attr "type" "multi,multi,multi,mmxmov,mmxmov,ssemov,ssemov")
|
3425 |
|
|
(set_attr "prefix" "*,*,*,orig,orig,maybe_vex,maybe_vex")
|
3426 |
|
|
(set_attr "mode" "SI,SI,SI,DI,DI,TI,TI")])
|
3427 |
|
|
|
3428 |
|
|
(define_split
|
3429 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
3430 |
|
|
(zero_extend:DI (match_operand:SI 1 "register_operand" "")))
|
3431 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
3432 |
|
|
"!TARGET_64BIT && reload_completed
|
3433 |
|
|
&& true_regnum (operands[0]) == true_regnum (operands[1])"
|
3434 |
|
|
[(set (match_dup 4) (const_int 0))]
|
3435 |
|
|
"split_double_mode (DImode, &operands[0], 1, &operands[3], &operands[4]);")
|
3436 |
|
|
|
3437 |
|
|
(define_split
|
3438 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "")
|
3439 |
|
|
(zero_extend:DI (match_operand:SI 1 "general_operand" "")))
|
3440 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
3441 |
|
|
"!TARGET_64BIT && reload_completed
|
3442 |
|
|
&& !(MMX_REG_P (operands[0]) || SSE_REG_P (operands[0]))"
|
3443 |
|
|
[(set (match_dup 3) (match_dup 1))
|
3444 |
|
|
(set (match_dup 4) (const_int 0))]
|
3445 |
|
|
"split_double_mode (DImode, &operands[0], 1, &operands[3], &operands[4]);")
|
3446 |
|
|
|
3447 |
|
|
(define_insn "zero_extenddi2"
|
3448 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
3449 |
|
|
(zero_extend:DI
|
3450 |
|
|
(match_operand:SWI12 1 "nonimmediate_operand" "m")))]
|
3451 |
|
|
"TARGET_64BIT"
|
3452 |
|
|
"movz{l|x}\t{%1, %k0|%k0, %1}"
|
3453 |
|
|
[(set_attr "type" "imovx")
|
3454 |
|
|
(set_attr "mode" "SI")])
|
3455 |
|
|
|
3456 |
|
|
(define_expand "zero_extendhisi2"
|
3457 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
3458 |
|
|
(zero_extend:SI (match_operand:HI 1 "nonimmediate_operand" "")))]
|
3459 |
|
|
""
|
3460 |
|
|
{
|
3461 |
|
|
if (TARGET_ZERO_EXTEND_WITH_AND && optimize_function_for_speed_p (cfun))
|
3462 |
|
|
{
|
3463 |
|
|
operands[1] = force_reg (HImode, operands[1]);
|
3464 |
|
|
emit_insn (gen_zero_extendhisi2_and (operands[0], operands[1]));
|
3465 |
|
|
DONE;
|
3466 |
|
|
}
|
3467 |
|
|
})
|
3468 |
|
|
|
3469 |
|
|
(define_insn_and_split "zero_extendhisi2_and"
|
3470 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
3471 |
|
|
(zero_extend:SI (match_operand:HI 1 "register_operand" "0")))
|
3472 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
3473 |
|
|
"TARGET_ZERO_EXTEND_WITH_AND && optimize_function_for_speed_p (cfun)"
|
3474 |
|
|
"#"
|
3475 |
|
|
"&& reload_completed"
|
3476 |
|
|
[(parallel [(set (match_dup 0) (and:SI (match_dup 0) (const_int 65535)))
|
3477 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
3478 |
|
|
""
|
3479 |
|
|
[(set_attr "type" "alu1")
|
3480 |
|
|
(set_attr "mode" "SI")])
|
3481 |
|
|
|
3482 |
|
|
(define_insn "*zero_extendhisi2_movzwl"
|
3483 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
3484 |
|
|
(zero_extend:SI (match_operand:HI 1 "nonimmediate_operand" "rm")))]
|
3485 |
|
|
"!TARGET_ZERO_EXTEND_WITH_AND
|
3486 |
|
|
|| optimize_function_for_size_p (cfun)"
|
3487 |
|
|
"movz{wl|x}\t{%1, %0|%0, %1}"
|
3488 |
|
|
[(set_attr "type" "imovx")
|
3489 |
|
|
(set_attr "mode" "SI")])
|
3490 |
|
|
|
3491 |
|
|
(define_expand "zero_extendqi2"
|
3492 |
|
|
[(parallel
|
3493 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "")
|
3494 |
|
|
(zero_extend:SWI24 (match_operand:QI 1 "nonimmediate_operand" "")))
|
3495 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
3496 |
|
|
|
3497 |
|
|
(define_insn "*zero_extendqi2_and"
|
3498 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "=r,?&q")
|
3499 |
|
|
(zero_extend:SWI24 (match_operand:QI 1 "nonimmediate_operand" "0,qm")))
|
3500 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
3501 |
|
|
"TARGET_ZERO_EXTEND_WITH_AND && optimize_function_for_speed_p (cfun)"
|
3502 |
|
|
"#"
|
3503 |
|
|
[(set_attr "type" "alu1")
|
3504 |
|
|
(set_attr "mode" "")])
|
3505 |
|
|
|
3506 |
|
|
;; When source and destination does not overlap, clear destination
|
3507 |
|
|
;; first and then do the movb
|
3508 |
|
|
(define_split
|
3509 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "")
|
3510 |
|
|
(zero_extend:SWI24 (match_operand:QI 1 "nonimmediate_operand" "")))
|
3511 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
3512 |
|
|
"reload_completed
|
3513 |
|
|
&& (TARGET_ZERO_EXTEND_WITH_AND && optimize_function_for_speed_p (cfun))
|
3514 |
|
|
&& ANY_QI_REG_P (operands[0])
|
3515 |
|
|
&& (ANY_QI_REG_P (operands[1]) || MEM_P (operands[1]))
|
3516 |
|
|
&& !reg_overlap_mentioned_p (operands[0], operands[1])"
|
3517 |
|
|
[(set (strict_low_part (match_dup 2)) (match_dup 1))]
|
3518 |
|
|
{
|
3519 |
|
|
operands[2] = gen_lowpart (QImode, operands[0]);
|
3520 |
|
|
ix86_expand_clear (operands[0]);
|
3521 |
|
|
})
|
3522 |
|
|
|
3523 |
|
|
(define_insn "*zero_extendqi2_movzbl_and"
|
3524 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "=r,r")
|
3525 |
|
|
(zero_extend:SWI24 (match_operand:QI 1 "nonimmediate_operand" "qm,0")))
|
3526 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
3527 |
|
|
"!TARGET_ZERO_EXTEND_WITH_AND || optimize_function_for_size_p (cfun)"
|
3528 |
|
|
"#"
|
3529 |
|
|
[(set_attr "type" "imovx,alu1")
|
3530 |
|
|
(set_attr "mode" "")])
|
3531 |
|
|
|
3532 |
|
|
;; For the movzbl case strip only the clobber
|
3533 |
|
|
(define_split
|
3534 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "")
|
3535 |
|
|
(zero_extend:SWI24 (match_operand:QI 1 "nonimmediate_operand" "")))
|
3536 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
3537 |
|
|
"reload_completed
|
3538 |
|
|
&& (!TARGET_ZERO_EXTEND_WITH_AND || optimize_function_for_size_p (cfun))
|
3539 |
|
|
&& (!REG_P (operands[1]) || ANY_QI_REG_P (operands[1]))"
|
3540 |
|
|
[(set (match_dup 0)
|
3541 |
|
|
(zero_extend:SWI24 (match_dup 1)))])
|
3542 |
|
|
|
3543 |
|
|
; zero extend to SImode to avoid partial register stalls
|
3544 |
|
|
(define_insn "*zero_extendqi2_movzbl"
|
3545 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "=r")
|
3546 |
|
|
(zero_extend:SWI24 (match_operand:QI 1 "nonimmediate_operand" "qm")))]
|
3547 |
|
|
"reload_completed
|
3548 |
|
|
&& (!TARGET_ZERO_EXTEND_WITH_AND || optimize_function_for_size_p (cfun))"
|
3549 |
|
|
"movz{bl|x}\t{%1, %k0|%k0, %1}"
|
3550 |
|
|
[(set_attr "type" "imovx")
|
3551 |
|
|
(set_attr "mode" "SI")])
|
3552 |
|
|
|
3553 |
|
|
;; Rest is handled by single and.
|
3554 |
|
|
(define_split
|
3555 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "")
|
3556 |
|
|
(zero_extend:SWI24 (match_operand:QI 1 "register_operand" "")))
|
3557 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
3558 |
|
|
"reload_completed
|
3559 |
|
|
&& true_regnum (operands[0]) == true_regnum (operands[1])"
|
3560 |
|
|
[(parallel [(set (match_dup 0) (and:SWI24 (match_dup 0) (const_int 255)))
|
3561 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
3562 |
|
|
|
3563 |
|
|
;; Sign extension instructions
|
3564 |
|
|
|
3565 |
|
|
(define_expand "extendsidi2"
|
3566 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
3567 |
|
|
(sign_extend:DI (match_operand:SI 1 "register_operand" "")))]
|
3568 |
|
|
""
|
3569 |
|
|
{
|
3570 |
|
|
if (!TARGET_64BIT)
|
3571 |
|
|
{
|
3572 |
|
|
emit_insn (gen_extendsidi2_1 (operands[0], operands[1]));
|
3573 |
|
|
DONE;
|
3574 |
|
|
}
|
3575 |
|
|
})
|
3576 |
|
|
|
3577 |
|
|
(define_insn "*extendsidi2_rex64"
|
3578 |
|
|
[(set (match_operand:DI 0 "register_operand" "=*a,r")
|
3579 |
|
|
(sign_extend:DI (match_operand:SI 1 "nonimmediate_operand" "*0,rm")))]
|
3580 |
|
|
"TARGET_64BIT"
|
3581 |
|
|
"@
|
3582 |
|
|
{cltq|cdqe}
|
3583 |
|
|
movs{lq|x}\t{%1, %0|%0, %1}"
|
3584 |
|
|
[(set_attr "type" "imovx")
|
3585 |
|
|
(set_attr "mode" "DI")
|
3586 |
|
|
(set_attr "prefix_0f" "0")
|
3587 |
|
|
(set_attr "modrm" "0,1")])
|
3588 |
|
|
|
3589 |
|
|
(define_insn "extendsidi2_1"
|
3590 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "=*A,r,?r,?*o")
|
3591 |
|
|
(sign_extend:DI (match_operand:SI 1 "register_operand" "0,0,r,r")))
|
3592 |
|
|
(clobber (reg:CC FLAGS_REG))
|
3593 |
|
|
(clobber (match_scratch:SI 2 "=X,X,X,&r"))]
|
3594 |
|
|
"!TARGET_64BIT"
|
3595 |
|
|
"#")
|
3596 |
|
|
|
3597 |
|
|
;; Extend to memory case when source register does die.
|
3598 |
|
|
(define_split
|
3599 |
|
|
[(set (match_operand:DI 0 "memory_operand" "")
|
3600 |
|
|
(sign_extend:DI (match_operand:SI 1 "register_operand" "")))
|
3601 |
|
|
(clobber (reg:CC FLAGS_REG))
|
3602 |
|
|
(clobber (match_operand:SI 2 "register_operand" ""))]
|
3603 |
|
|
"(reload_completed
|
3604 |
|
|
&& dead_or_set_p (insn, operands[1])
|
3605 |
|
|
&& !reg_mentioned_p (operands[1], operands[0]))"
|
3606 |
|
|
[(set (match_dup 3) (match_dup 1))
|
3607 |
|
|
(parallel [(set (match_dup 1) (ashiftrt:SI (match_dup 1) (const_int 31)))
|
3608 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
3609 |
|
|
(set (match_dup 4) (match_dup 1))]
|
3610 |
|
|
"split_double_mode (DImode, &operands[0], 1, &operands[3], &operands[4]);")
|
3611 |
|
|
|
3612 |
|
|
;; Extend to memory case when source register does not die.
|
3613 |
|
|
(define_split
|
3614 |
|
|
[(set (match_operand:DI 0 "memory_operand" "")
|
3615 |
|
|
(sign_extend:DI (match_operand:SI 1 "register_operand" "")))
|
3616 |
|
|
(clobber (reg:CC FLAGS_REG))
|
3617 |
|
|
(clobber (match_operand:SI 2 "register_operand" ""))]
|
3618 |
|
|
"reload_completed"
|
3619 |
|
|
[(const_int 0)]
|
3620 |
|
|
{
|
3621 |
|
|
split_double_mode (DImode, &operands[0], 1, &operands[3], &operands[4]);
|
3622 |
|
|
|
3623 |
|
|
emit_move_insn (operands[3], operands[1]);
|
3624 |
|
|
|
3625 |
|
|
/* Generate a cltd if possible and doing so it profitable. */
|
3626 |
|
|
if ((optimize_function_for_size_p (cfun) || TARGET_USE_CLTD)
|
3627 |
|
|
&& true_regnum (operands[1]) == AX_REG
|
3628 |
|
|
&& true_regnum (operands[2]) == DX_REG)
|
3629 |
|
|
{
|
3630 |
|
|
emit_insn (gen_ashrsi3_cvt (operands[2], operands[1], GEN_INT (31)));
|
3631 |
|
|
}
|
3632 |
|
|
else
|
3633 |
|
|
{
|
3634 |
|
|
emit_move_insn (operands[2], operands[1]);
|
3635 |
|
|
emit_insn (gen_ashrsi3_cvt (operands[2], operands[2], GEN_INT (31)));
|
3636 |
|
|
}
|
3637 |
|
|
emit_move_insn (operands[4], operands[2]);
|
3638 |
|
|
DONE;
|
3639 |
|
|
})
|
3640 |
|
|
|
3641 |
|
|
;; Extend to register case. Optimize case where source and destination
|
3642 |
|
|
;; registers match and cases where we can use cltd.
|
3643 |
|
|
(define_split
|
3644 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
3645 |
|
|
(sign_extend:DI (match_operand:SI 1 "register_operand" "")))
|
3646 |
|
|
(clobber (reg:CC FLAGS_REG))
|
3647 |
|
|
(clobber (match_scratch:SI 2 ""))]
|
3648 |
|
|
"reload_completed"
|
3649 |
|
|
[(const_int 0)]
|
3650 |
|
|
{
|
3651 |
|
|
split_double_mode (DImode, &operands[0], 1, &operands[3], &operands[4]);
|
3652 |
|
|
|
3653 |
|
|
if (true_regnum (operands[3]) != true_regnum (operands[1]))
|
3654 |
|
|
emit_move_insn (operands[3], operands[1]);
|
3655 |
|
|
|
3656 |
|
|
/* Generate a cltd if possible and doing so it profitable. */
|
3657 |
|
|
if ((optimize_function_for_size_p (cfun) || TARGET_USE_CLTD)
|
3658 |
|
|
&& true_regnum (operands[3]) == AX_REG
|
3659 |
|
|
&& true_regnum (operands[4]) == DX_REG)
|
3660 |
|
|
{
|
3661 |
|
|
emit_insn (gen_ashrsi3_cvt (operands[4], operands[3], GEN_INT (31)));
|
3662 |
|
|
DONE;
|
3663 |
|
|
}
|
3664 |
|
|
|
3665 |
|
|
if (true_regnum (operands[4]) != true_regnum (operands[1]))
|
3666 |
|
|
emit_move_insn (operands[4], operands[1]);
|
3667 |
|
|
|
3668 |
|
|
emit_insn (gen_ashrsi3_cvt (operands[4], operands[4], GEN_INT (31)));
|
3669 |
|
|
DONE;
|
3670 |
|
|
})
|
3671 |
|
|
|
3672 |
|
|
(define_insn "extenddi2"
|
3673 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
3674 |
|
|
(sign_extend:DI
|
3675 |
|
|
(match_operand:SWI12 1 "nonimmediate_operand" "m")))]
|
3676 |
|
|
"TARGET_64BIT"
|
3677 |
|
|
"movs{q|x}\t{%1, %0|%0, %1}"
|
3678 |
|
|
[(set_attr "type" "imovx")
|
3679 |
|
|
(set_attr "mode" "DI")])
|
3680 |
|
|
|
3681 |
|
|
(define_insn "extendhisi2"
|
3682 |
|
|
[(set (match_operand:SI 0 "register_operand" "=*a,r")
|
3683 |
|
|
(sign_extend:SI (match_operand:HI 1 "nonimmediate_operand" "*0,rm")))]
|
3684 |
|
|
""
|
3685 |
|
|
{
|
3686 |
|
|
switch (get_attr_prefix_0f (insn))
|
3687 |
|
|
{
|
3688 |
|
|
case 0:
|
3689 |
|
|
return "{cwtl|cwde}";
|
3690 |
|
|
default:
|
3691 |
|
|
return "movs{wl|x}\t{%1, %0|%0, %1}";
|
3692 |
|
|
}
|
3693 |
|
|
}
|
3694 |
|
|
[(set_attr "type" "imovx")
|
3695 |
|
|
(set_attr "mode" "SI")
|
3696 |
|
|
(set (attr "prefix_0f")
|
3697 |
|
|
;; movsx is short decodable while cwtl is vector decoded.
|
3698 |
|
|
(if_then_else (and (eq_attr "cpu" "!k6")
|
3699 |
|
|
(eq_attr "alternative" "0"))
|
3700 |
|
|
(const_string "0")
|
3701 |
|
|
(const_string "1")))
|
3702 |
|
|
(set (attr "modrm")
|
3703 |
|
|
(if_then_else (eq_attr "prefix_0f" "0")
|
3704 |
|
|
(const_string "0")
|
3705 |
|
|
(const_string "1")))])
|
3706 |
|
|
|
3707 |
|
|
(define_insn "*extendhisi2_zext"
|
3708 |
|
|
[(set (match_operand:DI 0 "register_operand" "=*a,r")
|
3709 |
|
|
(zero_extend:DI
|
3710 |
|
|
(sign_extend:SI
|
3711 |
|
|
(match_operand:HI 1 "nonimmediate_operand" "*0,rm"))))]
|
3712 |
|
|
"TARGET_64BIT"
|
3713 |
|
|
{
|
3714 |
|
|
switch (get_attr_prefix_0f (insn))
|
3715 |
|
|
{
|
3716 |
|
|
case 0:
|
3717 |
|
|
return "{cwtl|cwde}";
|
3718 |
|
|
default:
|
3719 |
|
|
return "movs{wl|x}\t{%1, %k0|%k0, %1}";
|
3720 |
|
|
}
|
3721 |
|
|
}
|
3722 |
|
|
[(set_attr "type" "imovx")
|
3723 |
|
|
(set_attr "mode" "SI")
|
3724 |
|
|
(set (attr "prefix_0f")
|
3725 |
|
|
;; movsx is short decodable while cwtl is vector decoded.
|
3726 |
|
|
(if_then_else (and (eq_attr "cpu" "!k6")
|
3727 |
|
|
(eq_attr "alternative" "0"))
|
3728 |
|
|
(const_string "0")
|
3729 |
|
|
(const_string "1")))
|
3730 |
|
|
(set (attr "modrm")
|
3731 |
|
|
(if_then_else (eq_attr "prefix_0f" "0")
|
3732 |
|
|
(const_string "0")
|
3733 |
|
|
(const_string "1")))])
|
3734 |
|
|
|
3735 |
|
|
(define_insn "extendqisi2"
|
3736 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
3737 |
|
|
(sign_extend:SI (match_operand:QI 1 "nonimmediate_operand" "qm")))]
|
3738 |
|
|
""
|
3739 |
|
|
"movs{bl|x}\t{%1, %0|%0, %1}"
|
3740 |
|
|
[(set_attr "type" "imovx")
|
3741 |
|
|
(set_attr "mode" "SI")])
|
3742 |
|
|
|
3743 |
|
|
(define_insn "*extendqisi2_zext"
|
3744 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
3745 |
|
|
(zero_extend:DI
|
3746 |
|
|
(sign_extend:SI (match_operand:QI 1 "nonimmediate_operand" "qm"))))]
|
3747 |
|
|
"TARGET_64BIT"
|
3748 |
|
|
"movs{bl|x}\t{%1, %k0|%k0, %1}"
|
3749 |
|
|
[(set_attr "type" "imovx")
|
3750 |
|
|
(set_attr "mode" "SI")])
|
3751 |
|
|
|
3752 |
|
|
(define_insn "extendqihi2"
|
3753 |
|
|
[(set (match_operand:HI 0 "register_operand" "=*a,r")
|
3754 |
|
|
(sign_extend:HI (match_operand:QI 1 "nonimmediate_operand" "*0,qm")))]
|
3755 |
|
|
""
|
3756 |
|
|
{
|
3757 |
|
|
switch (get_attr_prefix_0f (insn))
|
3758 |
|
|
{
|
3759 |
|
|
case 0:
|
3760 |
|
|
return "{cbtw|cbw}";
|
3761 |
|
|
default:
|
3762 |
|
|
return "movs{bw|x}\t{%1, %0|%0, %1}";
|
3763 |
|
|
}
|
3764 |
|
|
}
|
3765 |
|
|
[(set_attr "type" "imovx")
|
3766 |
|
|
(set_attr "mode" "HI")
|
3767 |
|
|
(set (attr "prefix_0f")
|
3768 |
|
|
;; movsx is short decodable while cwtl is vector decoded.
|
3769 |
|
|
(if_then_else (and (eq_attr "cpu" "!k6")
|
3770 |
|
|
(eq_attr "alternative" "0"))
|
3771 |
|
|
(const_string "0")
|
3772 |
|
|
(const_string "1")))
|
3773 |
|
|
(set (attr "modrm")
|
3774 |
|
|
(if_then_else (eq_attr "prefix_0f" "0")
|
3775 |
|
|
(const_string "0")
|
3776 |
|
|
(const_string "1")))])
|
3777 |
|
|
|
3778 |
|
|
;; Conversions between float and double.
|
3779 |
|
|
|
3780 |
|
|
;; These are all no-ops in the model used for the 80387.
|
3781 |
|
|
;; So just emit moves.
|
3782 |
|
|
|
3783 |
|
|
;; %%% Kill these when call knows how to work out a DFmode push earlier.
|
3784 |
|
|
(define_split
|
3785 |
|
|
[(set (match_operand:DF 0 "push_operand" "")
|
3786 |
|
|
(float_extend:DF (match_operand:SF 1 "fp_register_operand" "")))]
|
3787 |
|
|
"reload_completed"
|
3788 |
|
|
[(set (reg:P SP_REG) (plus:P (reg:P SP_REG) (const_int -8)))
|
3789 |
|
|
(set (mem:DF (reg:P SP_REG)) (float_extend:DF (match_dup 1)))])
|
3790 |
|
|
|
3791 |
|
|
(define_split
|
3792 |
|
|
[(set (match_operand:XF 0 "push_operand" "")
|
3793 |
|
|
(float_extend:XF (match_operand:MODEF 1 "fp_register_operand" "")))]
|
3794 |
|
|
"reload_completed"
|
3795 |
|
|
[(set (reg:P SP_REG) (plus:P (reg:P SP_REG) (match_dup 2)))
|
3796 |
|
|
(set (mem:XF (reg:P SP_REG)) (float_extend:XF (match_dup 1)))]
|
3797 |
|
|
"operands[2] = GEN_INT (-GET_MODE_SIZE (XFmode));")
|
3798 |
|
|
|
3799 |
|
|
(define_expand "extendsfdf2"
|
3800 |
|
|
[(set (match_operand:DF 0 "nonimmediate_operand" "")
|
3801 |
|
|
(float_extend:DF (match_operand:SF 1 "general_operand" "")))]
|
3802 |
|
|
"TARGET_80387 || (TARGET_SSE2 && TARGET_SSE_MATH)"
|
3803 |
|
|
{
|
3804 |
|
|
/* ??? Needed for compress_float_constant since all fp constants
|
3805 |
|
|
are TARGET_LEGITIMATE_CONSTANT_P. */
|
3806 |
|
|
if (GET_CODE (operands[1]) == CONST_DOUBLE)
|
3807 |
|
|
{
|
3808 |
|
|
if ((!TARGET_SSE2 || TARGET_MIX_SSE_I387)
|
3809 |
|
|
&& standard_80387_constant_p (operands[1]) > 0)
|
3810 |
|
|
{
|
3811 |
|
|
operands[1] = simplify_const_unary_operation
|
3812 |
|
|
(FLOAT_EXTEND, DFmode, operands[1], SFmode);
|
3813 |
|
|
emit_move_insn_1 (operands[0], operands[1]);
|
3814 |
|
|
DONE;
|
3815 |
|
|
}
|
3816 |
|
|
operands[1] = validize_mem (force_const_mem (SFmode, operands[1]));
|
3817 |
|
|
}
|
3818 |
|
|
})
|
3819 |
|
|
|
3820 |
|
|
/* For converting SF(xmm2) to DF(xmm1), use the following code instead of
|
3821 |
|
|
cvtss2sd:
|
3822 |
|
|
unpcklps xmm2,xmm2 ; packed conversion might crash on signaling NaNs
|
3823 |
|
|
cvtps2pd xmm2,xmm1
|
3824 |
|
|
We do the conversion post reload to avoid producing of 128bit spills
|
3825 |
|
|
that might lead to ICE on 32bit target. The sequence unlikely combine
|
3826 |
|
|
anyway. */
|
3827 |
|
|
(define_split
|
3828 |
|
|
[(set (match_operand:DF 0 "register_operand" "")
|
3829 |
|
|
(float_extend:DF
|
3830 |
|
|
(match_operand:SF 1 "nonimmediate_operand" "")))]
|
3831 |
|
|
"TARGET_USE_VECTOR_FP_CONVERTS
|
3832 |
|
|
&& optimize_insn_for_speed_p ()
|
3833 |
|
|
&& reload_completed && SSE_REG_P (operands[0])"
|
3834 |
|
|
[(set (match_dup 2)
|
3835 |
|
|
(float_extend:V2DF
|
3836 |
|
|
(vec_select:V2SF
|
3837 |
|
|
(match_dup 3)
|
3838 |
|
|
(parallel [(const_int 0) (const_int 1)]))))]
|
3839 |
|
|
{
|
3840 |
|
|
operands[2] = simplify_gen_subreg (V2DFmode, operands[0], DFmode, 0);
|
3841 |
|
|
operands[3] = simplify_gen_subreg (V4SFmode, operands[0], DFmode, 0);
|
3842 |
|
|
/* Use movss for loading from memory, unpcklps reg, reg for registers.
|
3843 |
|
|
Try to avoid move when unpacking can be done in source. */
|
3844 |
|
|
if (REG_P (operands[1]))
|
3845 |
|
|
{
|
3846 |
|
|
/* If it is unsafe to overwrite upper half of source, we need
|
3847 |
|
|
to move to destination and unpack there. */
|
3848 |
|
|
if ((ORIGINAL_REGNO (operands[1]) < FIRST_PSEUDO_REGISTER
|
3849 |
|
|
|| PSEUDO_REGNO_BYTES (ORIGINAL_REGNO (operands[1])) > 4)
|
3850 |
|
|
&& true_regnum (operands[0]) != true_regnum (operands[1]))
|
3851 |
|
|
{
|
3852 |
|
|
rtx tmp = gen_rtx_REG (SFmode, true_regnum (operands[0]));
|
3853 |
|
|
emit_move_insn (tmp, operands[1]);
|
3854 |
|
|
}
|
3855 |
|
|
else
|
3856 |
|
|
operands[3] = simplify_gen_subreg (V4SFmode, operands[1], SFmode, 0);
|
3857 |
|
|
emit_insn (gen_vec_interleave_lowv4sf (operands[3], operands[3],
|
3858 |
|
|
operands[3]));
|
3859 |
|
|
}
|
3860 |
|
|
else
|
3861 |
|
|
emit_insn (gen_vec_setv4sf_0 (operands[3],
|
3862 |
|
|
CONST0_RTX (V4SFmode), operands[1]));
|
3863 |
|
|
})
|
3864 |
|
|
|
3865 |
|
|
(define_insn "*extendsfdf2_mixed"
|
3866 |
|
|
[(set (match_operand:DF 0 "nonimmediate_operand" "=f,m,x")
|
3867 |
|
|
(float_extend:DF
|
3868 |
|
|
(match_operand:SF 1 "nonimmediate_operand" "fm,f,xm")))]
|
3869 |
|
|
"TARGET_SSE2 && TARGET_MIX_SSE_I387"
|
3870 |
|
|
{
|
3871 |
|
|
switch (which_alternative)
|
3872 |
|
|
{
|
3873 |
|
|
case 0:
|
3874 |
|
|
case 1:
|
3875 |
|
|
return output_387_reg_move (insn, operands);
|
3876 |
|
|
|
3877 |
|
|
case 2:
|
3878 |
|
|
return "%vcvtss2sd\t{%1, %d0|%d0, %1}";
|
3879 |
|
|
|
3880 |
|
|
default:
|
3881 |
|
|
gcc_unreachable ();
|
3882 |
|
|
}
|
3883 |
|
|
}
|
3884 |
|
|
[(set_attr "type" "fmov,fmov,ssecvt")
|
3885 |
|
|
(set_attr "prefix" "orig,orig,maybe_vex")
|
3886 |
|
|
(set_attr "mode" "SF,XF,DF")])
|
3887 |
|
|
|
3888 |
|
|
(define_insn "*extendsfdf2_sse"
|
3889 |
|
|
[(set (match_operand:DF 0 "nonimmediate_operand" "=x")
|
3890 |
|
|
(float_extend:DF (match_operand:SF 1 "nonimmediate_operand" "xm")))]
|
3891 |
|
|
"TARGET_SSE2 && TARGET_SSE_MATH"
|
3892 |
|
|
"%vcvtss2sd\t{%1, %d0|%d0, %1}"
|
3893 |
|
|
[(set_attr "type" "ssecvt")
|
3894 |
|
|
(set_attr "prefix" "maybe_vex")
|
3895 |
|
|
(set_attr "mode" "DF")])
|
3896 |
|
|
|
3897 |
|
|
(define_insn "*extendsfdf2_i387"
|
3898 |
|
|
[(set (match_operand:DF 0 "nonimmediate_operand" "=f,m")
|
3899 |
|
|
(float_extend:DF (match_operand:SF 1 "nonimmediate_operand" "fm,f")))]
|
3900 |
|
|
"TARGET_80387"
|
3901 |
|
|
"* return output_387_reg_move (insn, operands);"
|
3902 |
|
|
[(set_attr "type" "fmov")
|
3903 |
|
|
(set_attr "mode" "SF,XF")])
|
3904 |
|
|
|
3905 |
|
|
(define_expand "extendxf2"
|
3906 |
|
|
[(set (match_operand:XF 0 "nonimmediate_operand" "")
|
3907 |
|
|
(float_extend:XF (match_operand:MODEF 1 "general_operand" "")))]
|
3908 |
|
|
"TARGET_80387"
|
3909 |
|
|
{
|
3910 |
|
|
/* ??? Needed for compress_float_constant since all fp constants
|
3911 |
|
|
are TARGET_LEGITIMATE_CONSTANT_P. */
|
3912 |
|
|
if (GET_CODE (operands[1]) == CONST_DOUBLE)
|
3913 |
|
|
{
|
3914 |
|
|
if (standard_80387_constant_p (operands[1]) > 0)
|
3915 |
|
|
{
|
3916 |
|
|
operands[1] = simplify_const_unary_operation
|
3917 |
|
|
(FLOAT_EXTEND, XFmode, operands[1], mode);
|
3918 |
|
|
emit_move_insn_1 (operands[0], operands[1]);
|
3919 |
|
|
DONE;
|
3920 |
|
|
}
|
3921 |
|
|
operands[1] = validize_mem (force_const_mem (mode, operands[1]));
|
3922 |
|
|
}
|
3923 |
|
|
})
|
3924 |
|
|
|
3925 |
|
|
(define_insn "*extendxf2_i387"
|
3926 |
|
|
[(set (match_operand:XF 0 "nonimmediate_operand" "=f,m")
|
3927 |
|
|
(float_extend:XF
|
3928 |
|
|
(match_operand:MODEF 1 "nonimmediate_operand" "fm,f")))]
|
3929 |
|
|
"TARGET_80387"
|
3930 |
|
|
"* return output_387_reg_move (insn, operands);"
|
3931 |
|
|
[(set_attr "type" "fmov")
|
3932 |
|
|
(set_attr "mode" ",XF")])
|
3933 |
|
|
|
3934 |
|
|
;; %%% This seems bad bad news.
|
3935 |
|
|
;; This cannot output into an f-reg because there is no way to be sure
|
3936 |
|
|
;; of truncating in that case. Otherwise this is just like a simple move
|
3937 |
|
|
;; insn. So we pretend we can output to a reg in order to get better
|
3938 |
|
|
;; register preferencing, but we really use a stack slot.
|
3939 |
|
|
|
3940 |
|
|
;; Conversion from DFmode to SFmode.
|
3941 |
|
|
|
3942 |
|
|
(define_expand "truncdfsf2"
|
3943 |
|
|
[(set (match_operand:SF 0 "nonimmediate_operand" "")
|
3944 |
|
|
(float_truncate:SF
|
3945 |
|
|
(match_operand:DF 1 "nonimmediate_operand" "")))]
|
3946 |
|
|
"TARGET_80387 || (TARGET_SSE2 && TARGET_SSE_MATH)"
|
3947 |
|
|
{
|
3948 |
|
|
if (TARGET_SSE2 && TARGET_SSE_MATH && !TARGET_MIX_SSE_I387)
|
3949 |
|
|
;
|
3950 |
|
|
else if (flag_unsafe_math_optimizations)
|
3951 |
|
|
;
|
3952 |
|
|
else
|
3953 |
|
|
{
|
3954 |
|
|
enum ix86_stack_slot slot = (virtuals_instantiated
|
3955 |
|
|
? SLOT_TEMP
|
3956 |
|
|
: SLOT_VIRTUAL);
|
3957 |
|
|
rtx temp = assign_386_stack_local (SFmode, slot);
|
3958 |
|
|
emit_insn (gen_truncdfsf2_with_temp (operands[0], operands[1], temp));
|
3959 |
|
|
DONE;
|
3960 |
|
|
}
|
3961 |
|
|
})
|
3962 |
|
|
|
3963 |
|
|
/* For converting DF(xmm2) to SF(xmm1), use the following code instead of
|
3964 |
|
|
cvtsd2ss:
|
3965 |
|
|
unpcklpd xmm2,xmm2 ; packed conversion might crash on signaling NaNs
|
3966 |
|
|
cvtpd2ps xmm2,xmm1
|
3967 |
|
|
We do the conversion post reload to avoid producing of 128bit spills
|
3968 |
|
|
that might lead to ICE on 32bit target. The sequence unlikely combine
|
3969 |
|
|
anyway. */
|
3970 |
|
|
(define_split
|
3971 |
|
|
[(set (match_operand:SF 0 "register_operand" "")
|
3972 |
|
|
(float_truncate:SF
|
3973 |
|
|
(match_operand:DF 1 "nonimmediate_operand" "")))]
|
3974 |
|
|
"TARGET_USE_VECTOR_FP_CONVERTS
|
3975 |
|
|
&& optimize_insn_for_speed_p ()
|
3976 |
|
|
&& reload_completed && SSE_REG_P (operands[0])"
|
3977 |
|
|
[(set (match_dup 2)
|
3978 |
|
|
(vec_concat:V4SF
|
3979 |
|
|
(float_truncate:V2SF
|
3980 |
|
|
(match_dup 4))
|
3981 |
|
|
(match_dup 3)))]
|
3982 |
|
|
{
|
3983 |
|
|
operands[2] = simplify_gen_subreg (V4SFmode, operands[0], SFmode, 0);
|
3984 |
|
|
operands[3] = CONST0_RTX (V2SFmode);
|
3985 |
|
|
operands[4] = simplify_gen_subreg (V2DFmode, operands[0], SFmode, 0);
|
3986 |
|
|
/* Use movsd for loading from memory, unpcklpd for registers.
|
3987 |
|
|
Try to avoid move when unpacking can be done in source, or SSE3
|
3988 |
|
|
movddup is available. */
|
3989 |
|
|
if (REG_P (operands[1]))
|
3990 |
|
|
{
|
3991 |
|
|
if (!TARGET_SSE3
|
3992 |
|
|
&& true_regnum (operands[0]) != true_regnum (operands[1])
|
3993 |
|
|
&& (ORIGINAL_REGNO (operands[1]) < FIRST_PSEUDO_REGISTER
|
3994 |
|
|
|| PSEUDO_REGNO_BYTES (ORIGINAL_REGNO (operands[1])) > 8))
|
3995 |
|
|
{
|
3996 |
|
|
rtx tmp = simplify_gen_subreg (DFmode, operands[0], SFmode, 0);
|
3997 |
|
|
emit_move_insn (tmp, operands[1]);
|
3998 |
|
|
operands[1] = tmp;
|
3999 |
|
|
}
|
4000 |
|
|
else if (!TARGET_SSE3)
|
4001 |
|
|
operands[4] = simplify_gen_subreg (V2DFmode, operands[1], DFmode, 0);
|
4002 |
|
|
emit_insn (gen_vec_dupv2df (operands[4], operands[1]));
|
4003 |
|
|
}
|
4004 |
|
|
else
|
4005 |
|
|
emit_insn (gen_sse2_loadlpd (operands[4],
|
4006 |
|
|
CONST0_RTX (V2DFmode), operands[1]));
|
4007 |
|
|
})
|
4008 |
|
|
|
4009 |
|
|
(define_expand "truncdfsf2_with_temp"
|
4010 |
|
|
[(parallel [(set (match_operand:SF 0 "" "")
|
4011 |
|
|
(float_truncate:SF (match_operand:DF 1 "" "")))
|
4012 |
|
|
(clobber (match_operand:SF 2 "" ""))])])
|
4013 |
|
|
|
4014 |
|
|
(define_insn "*truncdfsf_fast_mixed"
|
4015 |
|
|
[(set (match_operand:SF 0 "nonimmediate_operand" "=fm,x")
|
4016 |
|
|
(float_truncate:SF
|
4017 |
|
|
(match_operand:DF 1 "nonimmediate_operand" "f ,xm")))]
|
4018 |
|
|
"TARGET_SSE2 && TARGET_MIX_SSE_I387 && flag_unsafe_math_optimizations"
|
4019 |
|
|
{
|
4020 |
|
|
switch (which_alternative)
|
4021 |
|
|
{
|
4022 |
|
|
case 0:
|
4023 |
|
|
return output_387_reg_move (insn, operands);
|
4024 |
|
|
case 1:
|
4025 |
|
|
return "%vcvtsd2ss\t{%1, %d0|%d0, %1}";
|
4026 |
|
|
default:
|
4027 |
|
|
gcc_unreachable ();
|
4028 |
|
|
}
|
4029 |
|
|
}
|
4030 |
|
|
[(set_attr "type" "fmov,ssecvt")
|
4031 |
|
|
(set_attr "prefix" "orig,maybe_vex")
|
4032 |
|
|
(set_attr "mode" "SF")])
|
4033 |
|
|
|
4034 |
|
|
;; Yes, this one doesn't depend on flag_unsafe_math_optimizations,
|
4035 |
|
|
;; because nothing we do here is unsafe.
|
4036 |
|
|
(define_insn "*truncdfsf_fast_sse"
|
4037 |
|
|
[(set (match_operand:SF 0 "nonimmediate_operand" "=x")
|
4038 |
|
|
(float_truncate:SF
|
4039 |
|
|
(match_operand:DF 1 "nonimmediate_operand" "xm")))]
|
4040 |
|
|
"TARGET_SSE2 && TARGET_SSE_MATH"
|
4041 |
|
|
"%vcvtsd2ss\t{%1, %d0|%d0, %1}"
|
4042 |
|
|
[(set_attr "type" "ssecvt")
|
4043 |
|
|
(set_attr "prefix" "maybe_vex")
|
4044 |
|
|
(set_attr "mode" "SF")])
|
4045 |
|
|
|
4046 |
|
|
(define_insn "*truncdfsf_fast_i387"
|
4047 |
|
|
[(set (match_operand:SF 0 "nonimmediate_operand" "=fm")
|
4048 |
|
|
(float_truncate:SF
|
4049 |
|
|
(match_operand:DF 1 "nonimmediate_operand" "f")))]
|
4050 |
|
|
"TARGET_80387 && flag_unsafe_math_optimizations"
|
4051 |
|
|
"* return output_387_reg_move (insn, operands);"
|
4052 |
|
|
[(set_attr "type" "fmov")
|
4053 |
|
|
(set_attr "mode" "SF")])
|
4054 |
|
|
|
4055 |
|
|
(define_insn "*truncdfsf_mixed"
|
4056 |
|
|
[(set (match_operand:SF 0 "nonimmediate_operand" "=m,x ,?f,?x,?*r")
|
4057 |
|
|
(float_truncate:SF
|
4058 |
|
|
(match_operand:DF 1 "nonimmediate_operand" "f ,xm,f ,f ,f")))
|
4059 |
|
|
(clobber (match_operand:SF 2 "memory_operand" "=X,X ,m ,m ,m"))]
|
4060 |
|
|
"TARGET_MIX_SSE_I387"
|
4061 |
|
|
{
|
4062 |
|
|
switch (which_alternative)
|
4063 |
|
|
{
|
4064 |
|
|
case 0:
|
4065 |
|
|
return output_387_reg_move (insn, operands);
|
4066 |
|
|
case 1:
|
4067 |
|
|
return "%vcvtsd2ss\t{%1, %d0|%d0, %1}";
|
4068 |
|
|
|
4069 |
|
|
default:
|
4070 |
|
|
return "#";
|
4071 |
|
|
}
|
4072 |
|
|
}
|
4073 |
|
|
[(set_attr "isa" "*,sse2,*,*,*")
|
4074 |
|
|
(set_attr "type" "fmov,ssecvt,multi,multi,multi")
|
4075 |
|
|
(set_attr "unit" "*,*,i387,i387,i387")
|
4076 |
|
|
(set_attr "prefix" "orig,maybe_vex,orig,orig,orig")
|
4077 |
|
|
(set_attr "mode" "SF")])
|
4078 |
|
|
|
4079 |
|
|
(define_insn "*truncdfsf_i387"
|
4080 |
|
|
[(set (match_operand:SF 0 "nonimmediate_operand" "=m,?f,?x,?*r")
|
4081 |
|
|
(float_truncate:SF
|
4082 |
|
|
(match_operand:DF 1 "nonimmediate_operand" "f ,f ,f ,f")))
|
4083 |
|
|
(clobber (match_operand:SF 2 "memory_operand" "=X,m ,m ,m"))]
|
4084 |
|
|
"TARGET_80387"
|
4085 |
|
|
{
|
4086 |
|
|
switch (which_alternative)
|
4087 |
|
|
{
|
4088 |
|
|
case 0:
|
4089 |
|
|
return output_387_reg_move (insn, operands);
|
4090 |
|
|
|
4091 |
|
|
default:
|
4092 |
|
|
return "#";
|
4093 |
|
|
}
|
4094 |
|
|
}
|
4095 |
|
|
[(set_attr "type" "fmov,multi,multi,multi")
|
4096 |
|
|
(set_attr "unit" "*,i387,i387,i387")
|
4097 |
|
|
(set_attr "mode" "SF")])
|
4098 |
|
|
|
4099 |
|
|
(define_insn "*truncdfsf2_i387_1"
|
4100 |
|
|
[(set (match_operand:SF 0 "memory_operand" "=m")
|
4101 |
|
|
(float_truncate:SF
|
4102 |
|
|
(match_operand:DF 1 "register_operand" "f")))]
|
4103 |
|
|
"TARGET_80387
|
4104 |
|
|
&& !(TARGET_SSE2 && TARGET_SSE_MATH)
|
4105 |
|
|
&& !TARGET_MIX_SSE_I387"
|
4106 |
|
|
"* return output_387_reg_move (insn, operands);"
|
4107 |
|
|
[(set_attr "type" "fmov")
|
4108 |
|
|
(set_attr "mode" "SF")])
|
4109 |
|
|
|
4110 |
|
|
(define_split
|
4111 |
|
|
[(set (match_operand:SF 0 "register_operand" "")
|
4112 |
|
|
(float_truncate:SF
|
4113 |
|
|
(match_operand:DF 1 "fp_register_operand" "")))
|
4114 |
|
|
(clobber (match_operand 2 "" ""))]
|
4115 |
|
|
"reload_completed"
|
4116 |
|
|
[(set (match_dup 2) (match_dup 1))
|
4117 |
|
|
(set (match_dup 0) (match_dup 2))]
|
4118 |
|
|
"operands[1] = gen_rtx_REG (SFmode, true_regnum (operands[1]));")
|
4119 |
|
|
|
4120 |
|
|
;; Conversion from XFmode to {SF,DF}mode
|
4121 |
|
|
|
4122 |
|
|
(define_expand "truncxf2"
|
4123 |
|
|
[(parallel [(set (match_operand:MODEF 0 "nonimmediate_operand" "")
|
4124 |
|
|
(float_truncate:MODEF
|
4125 |
|
|
(match_operand:XF 1 "register_operand" "")))
|
4126 |
|
|
(clobber (match_dup 2))])]
|
4127 |
|
|
"TARGET_80387"
|
4128 |
|
|
{
|
4129 |
|
|
if (flag_unsafe_math_optimizations)
|
4130 |
|
|
{
|
4131 |
|
|
rtx reg = REG_P (operands[0]) ? operands[0] : gen_reg_rtx (mode);
|
4132 |
|
|
emit_insn (gen_truncxf2_i387_noop (reg, operands[1]));
|
4133 |
|
|
if (reg != operands[0])
|
4134 |
|
|
emit_move_insn (operands[0], reg);
|
4135 |
|
|
DONE;
|
4136 |
|
|
}
|
4137 |
|
|
else
|
4138 |
|
|
{
|
4139 |
|
|
enum ix86_stack_slot slot = (virtuals_instantiated
|
4140 |
|
|
? SLOT_TEMP
|
4141 |
|
|
: SLOT_VIRTUAL);
|
4142 |
|
|
operands[2] = assign_386_stack_local (mode, slot);
|
4143 |
|
|
}
|
4144 |
|
|
})
|
4145 |
|
|
|
4146 |
|
|
(define_insn "*truncxfsf2_mixed"
|
4147 |
|
|
[(set (match_operand:SF 0 "nonimmediate_operand" "=m,?f,?x,?*r")
|
4148 |
|
|
(float_truncate:SF
|
4149 |
|
|
(match_operand:XF 1 "register_operand" "f ,f ,f ,f")))
|
4150 |
|
|
(clobber (match_operand:SF 2 "memory_operand" "=X,m ,m ,m"))]
|
4151 |
|
|
"TARGET_80387"
|
4152 |
|
|
{
|
4153 |
|
|
gcc_assert (!which_alternative);
|
4154 |
|
|
return output_387_reg_move (insn, operands);
|
4155 |
|
|
}
|
4156 |
|
|
[(set_attr "type" "fmov,multi,multi,multi")
|
4157 |
|
|
(set_attr "unit" "*,i387,i387,i387")
|
4158 |
|
|
(set_attr "mode" "SF")])
|
4159 |
|
|
|
4160 |
|
|
(define_insn "*truncxfdf2_mixed"
|
4161 |
|
|
[(set (match_operand:DF 0 "nonimmediate_operand" "=m,?f,?x,?*r")
|
4162 |
|
|
(float_truncate:DF
|
4163 |
|
|
(match_operand:XF 1 "register_operand" "f ,f ,f ,f")))
|
4164 |
|
|
(clobber (match_operand:DF 2 "memory_operand" "=X,m ,m ,m"))]
|
4165 |
|
|
"TARGET_80387"
|
4166 |
|
|
{
|
4167 |
|
|
gcc_assert (!which_alternative);
|
4168 |
|
|
return output_387_reg_move (insn, operands);
|
4169 |
|
|
}
|
4170 |
|
|
[(set_attr "isa" "*,*,sse2,*")
|
4171 |
|
|
(set_attr "type" "fmov,multi,multi,multi")
|
4172 |
|
|
(set_attr "unit" "*,i387,i387,i387")
|
4173 |
|
|
(set_attr "mode" "DF")])
|
4174 |
|
|
|
4175 |
|
|
(define_insn "truncxf2_i387_noop"
|
4176 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f")
|
4177 |
|
|
(float_truncate:MODEF
|
4178 |
|
|
(match_operand:XF 1 "register_operand" "f")))]
|
4179 |
|
|
"TARGET_80387 && flag_unsafe_math_optimizations"
|
4180 |
|
|
"* return output_387_reg_move (insn, operands);"
|
4181 |
|
|
[(set_attr "type" "fmov")
|
4182 |
|
|
(set_attr "mode" "")])
|
4183 |
|
|
|
4184 |
|
|
(define_insn "*truncxf2_i387"
|
4185 |
|
|
[(set (match_operand:MODEF 0 "memory_operand" "=m")
|
4186 |
|
|
(float_truncate:MODEF
|
4187 |
|
|
(match_operand:XF 1 "register_operand" "f")))]
|
4188 |
|
|
"TARGET_80387"
|
4189 |
|
|
"* return output_387_reg_move (insn, operands);"
|
4190 |
|
|
[(set_attr "type" "fmov")
|
4191 |
|
|
(set_attr "mode" "")])
|
4192 |
|
|
|
4193 |
|
|
(define_split
|
4194 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
4195 |
|
|
(float_truncate:MODEF
|
4196 |
|
|
(match_operand:XF 1 "register_operand" "")))
|
4197 |
|
|
(clobber (match_operand:MODEF 2 "memory_operand" ""))]
|
4198 |
|
|
"TARGET_80387 && reload_completed"
|
4199 |
|
|
[(set (match_dup 2) (float_truncate:MODEF (match_dup 1)))
|
4200 |
|
|
(set (match_dup 0) (match_dup 2))])
|
4201 |
|
|
|
4202 |
|
|
(define_split
|
4203 |
|
|
[(set (match_operand:MODEF 0 "memory_operand" "")
|
4204 |
|
|
(float_truncate:MODEF
|
4205 |
|
|
(match_operand:XF 1 "register_operand" "")))
|
4206 |
|
|
(clobber (match_operand:MODEF 2 "memory_operand" ""))]
|
4207 |
|
|
"TARGET_80387"
|
4208 |
|
|
[(set (match_dup 0) (float_truncate:MODEF (match_dup 1)))])
|
4209 |
|
|
|
4210 |
|
|
;; Signed conversion to DImode.
|
4211 |
|
|
|
4212 |
|
|
(define_expand "fix_truncxfdi2"
|
4213 |
|
|
[(parallel [(set (match_operand:DI 0 "nonimmediate_operand" "")
|
4214 |
|
|
(fix:DI (match_operand:XF 1 "register_operand" "")))
|
4215 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
4216 |
|
|
"TARGET_80387"
|
4217 |
|
|
{
|
4218 |
|
|
if (TARGET_FISTTP)
|
4219 |
|
|
{
|
4220 |
|
|
emit_insn (gen_fix_truncdi_fisttp_i387_1 (operands[0], operands[1]));
|
4221 |
|
|
DONE;
|
4222 |
|
|
}
|
4223 |
|
|
})
|
4224 |
|
|
|
4225 |
|
|
(define_expand "fix_truncdi2"
|
4226 |
|
|
[(parallel [(set (match_operand:DI 0 "nonimmediate_operand" "")
|
4227 |
|
|
(fix:DI (match_operand:MODEF 1 "register_operand" "")))
|
4228 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
4229 |
|
|
"TARGET_80387 || (TARGET_64BIT && SSE_FLOAT_MODE_P (mode))"
|
4230 |
|
|
{
|
4231 |
|
|
if (TARGET_FISTTP
|
4232 |
|
|
&& !(TARGET_64BIT && SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH))
|
4233 |
|
|
{
|
4234 |
|
|
emit_insn (gen_fix_truncdi_fisttp_i387_1 (operands[0], operands[1]));
|
4235 |
|
|
DONE;
|
4236 |
|
|
}
|
4237 |
|
|
if (TARGET_64BIT && SSE_FLOAT_MODE_P (mode))
|
4238 |
|
|
{
|
4239 |
|
|
rtx out = REG_P (operands[0]) ? operands[0] : gen_reg_rtx (DImode);
|
4240 |
|
|
emit_insn (gen_fix_truncdi_sse (out, operands[1]));
|
4241 |
|
|
if (out != operands[0])
|
4242 |
|
|
emit_move_insn (operands[0], out);
|
4243 |
|
|
DONE;
|
4244 |
|
|
}
|
4245 |
|
|
})
|
4246 |
|
|
|
4247 |
|
|
;; Signed conversion to SImode.
|
4248 |
|
|
|
4249 |
|
|
(define_expand "fix_truncxfsi2"
|
4250 |
|
|
[(parallel [(set (match_operand:SI 0 "nonimmediate_operand" "")
|
4251 |
|
|
(fix:SI (match_operand:XF 1 "register_operand" "")))
|
4252 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
4253 |
|
|
"TARGET_80387"
|
4254 |
|
|
{
|
4255 |
|
|
if (TARGET_FISTTP)
|
4256 |
|
|
{
|
4257 |
|
|
emit_insn (gen_fix_truncsi_fisttp_i387_1 (operands[0], operands[1]));
|
4258 |
|
|
DONE;
|
4259 |
|
|
}
|
4260 |
|
|
})
|
4261 |
|
|
|
4262 |
|
|
(define_expand "fix_truncsi2"
|
4263 |
|
|
[(parallel [(set (match_operand:SI 0 "nonimmediate_operand" "")
|
4264 |
|
|
(fix:SI (match_operand:MODEF 1 "register_operand" "")))
|
4265 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
4266 |
|
|
"TARGET_80387 || SSE_FLOAT_MODE_P (mode)"
|
4267 |
|
|
{
|
4268 |
|
|
if (TARGET_FISTTP
|
4269 |
|
|
&& !(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH))
|
4270 |
|
|
{
|
4271 |
|
|
emit_insn (gen_fix_truncsi_fisttp_i387_1 (operands[0], operands[1]));
|
4272 |
|
|
DONE;
|
4273 |
|
|
}
|
4274 |
|
|
if (SSE_FLOAT_MODE_P (mode))
|
4275 |
|
|
{
|
4276 |
|
|
rtx out = REG_P (operands[0]) ? operands[0] : gen_reg_rtx (SImode);
|
4277 |
|
|
emit_insn (gen_fix_truncsi_sse (out, operands[1]));
|
4278 |
|
|
if (out != operands[0])
|
4279 |
|
|
emit_move_insn (operands[0], out);
|
4280 |
|
|
DONE;
|
4281 |
|
|
}
|
4282 |
|
|
})
|
4283 |
|
|
|
4284 |
|
|
;; Signed conversion to HImode.
|
4285 |
|
|
|
4286 |
|
|
(define_expand "fix_trunchi2"
|
4287 |
|
|
[(parallel [(set (match_operand:HI 0 "nonimmediate_operand" "")
|
4288 |
|
|
(fix:HI (match_operand:X87MODEF 1 "register_operand" "")))
|
4289 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
4290 |
|
|
"TARGET_80387
|
4291 |
|
|
&& !(SSE_FLOAT_MODE_P (mode) && (!TARGET_FISTTP || TARGET_SSE_MATH))"
|
4292 |
|
|
{
|
4293 |
|
|
if (TARGET_FISTTP)
|
4294 |
|
|
{
|
4295 |
|
|
emit_insn (gen_fix_trunchi_fisttp_i387_1 (operands[0], operands[1]));
|
4296 |
|
|
DONE;
|
4297 |
|
|
}
|
4298 |
|
|
})
|
4299 |
|
|
|
4300 |
|
|
;; Unsigned conversion to SImode.
|
4301 |
|
|
|
4302 |
|
|
(define_expand "fixuns_truncsi2"
|
4303 |
|
|
[(parallel
|
4304 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
4305 |
|
|
(unsigned_fix:SI
|
4306 |
|
|
(match_operand:MODEF 1 "nonimmediate_operand" "")))
|
4307 |
|
|
(use (match_dup 2))
|
4308 |
|
|
(clobber (match_scratch: 3 ""))
|
4309 |
|
|
(clobber (match_scratch: 4 ""))])]
|
4310 |
|
|
"!TARGET_64BIT && TARGET_SSE2 && TARGET_SSE_MATH"
|
4311 |
|
|
{
|
4312 |
|
|
enum machine_mode mode = mode;
|
4313 |
|
|
enum machine_mode vecmode = mode;
|
4314 |
|
|
REAL_VALUE_TYPE TWO31r;
|
4315 |
|
|
rtx two31;
|
4316 |
|
|
|
4317 |
|
|
if (optimize_insn_for_size_p ())
|
4318 |
|
|
FAIL;
|
4319 |
|
|
|
4320 |
|
|
real_ldexp (&TWO31r, &dconst1, 31);
|
4321 |
|
|
two31 = const_double_from_real_value (TWO31r, mode);
|
4322 |
|
|
two31 = ix86_build_const_vector (vecmode, true, two31);
|
4323 |
|
|
operands[2] = force_reg (vecmode, two31);
|
4324 |
|
|
})
|
4325 |
|
|
|
4326 |
|
|
(define_insn_and_split "*fixuns_trunc_1"
|
4327 |
|
|
[(set (match_operand:SI 0 "register_operand" "=&x,&x")
|
4328 |
|
|
(unsigned_fix:SI
|
4329 |
|
|
(match_operand:MODEF 3 "nonimmediate_operand" "xm,xm")))
|
4330 |
|
|
(use (match_operand: 4 "nonimmediate_operand" "m,x"))
|
4331 |
|
|
(clobber (match_scratch: 1 "=x,&x"))
|
4332 |
|
|
(clobber (match_scratch: 2 "=x,x"))]
|
4333 |
|
|
"!TARGET_64BIT && TARGET_SSE2 && TARGET_SSE_MATH
|
4334 |
|
|
&& optimize_function_for_speed_p (cfun)"
|
4335 |
|
|
"#"
|
4336 |
|
|
"&& reload_completed"
|
4337 |
|
|
[(const_int 0)]
|
4338 |
|
|
{
|
4339 |
|
|
ix86_split_convert_uns_si_sse (operands);
|
4340 |
|
|
DONE;
|
4341 |
|
|
})
|
4342 |
|
|
|
4343 |
|
|
;; Unsigned conversion to HImode.
|
4344 |
|
|
;; Without these patterns, we'll try the unsigned SI conversion which
|
4345 |
|
|
;; is complex for SSE, rather than the signed SI conversion, which isn't.
|
4346 |
|
|
|
4347 |
|
|
(define_expand "fixuns_trunchi2"
|
4348 |
|
|
[(set (match_dup 2)
|
4349 |
|
|
(fix:SI (match_operand:MODEF 1 "nonimmediate_operand" "")))
|
4350 |
|
|
(set (match_operand:HI 0 "nonimmediate_operand" "")
|
4351 |
|
|
(subreg:HI (match_dup 2) 0))]
|
4352 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH"
|
4353 |
|
|
"operands[2] = gen_reg_rtx (SImode);")
|
4354 |
|
|
|
4355 |
|
|
;; When SSE is available, it is always faster to use it!
|
4356 |
|
|
(define_insn "fix_truncdi_sse"
|
4357 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r,r")
|
4358 |
|
|
(fix:DI (match_operand:MODEF 1 "nonimmediate_operand" "x,m")))]
|
4359 |
|
|
"TARGET_64BIT && SSE_FLOAT_MODE_P (mode)
|
4360 |
|
|
&& (!TARGET_FISTTP || TARGET_SSE_MATH)"
|
4361 |
|
|
"%vcvtt2si{q}\t{%1, %0|%0, %1}"
|
4362 |
|
|
[(set_attr "type" "sseicvt")
|
4363 |
|
|
(set_attr "prefix" "maybe_vex")
|
4364 |
|
|
(set_attr "prefix_rex" "1")
|
4365 |
|
|
(set_attr "mode" "")
|
4366 |
|
|
(set_attr "athlon_decode" "double,vector")
|
4367 |
|
|
(set_attr "amdfam10_decode" "double,double")
|
4368 |
|
|
(set_attr "bdver1_decode" "double,double")])
|
4369 |
|
|
|
4370 |
|
|
(define_insn "fix_truncsi_sse"
|
4371 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r,r")
|
4372 |
|
|
(fix:SI (match_operand:MODEF 1 "nonimmediate_operand" "x,m")))]
|
4373 |
|
|
"SSE_FLOAT_MODE_P (mode)
|
4374 |
|
|
&& (!TARGET_FISTTP || TARGET_SSE_MATH)"
|
4375 |
|
|
"%vcvtt2si\t{%1, %0|%0, %1}"
|
4376 |
|
|
[(set_attr "type" "sseicvt")
|
4377 |
|
|
(set_attr "prefix" "maybe_vex")
|
4378 |
|
|
(set_attr "mode" "")
|
4379 |
|
|
(set_attr "athlon_decode" "double,vector")
|
4380 |
|
|
(set_attr "amdfam10_decode" "double,double")
|
4381 |
|
|
(set_attr "bdver1_decode" "double,double")])
|
4382 |
|
|
|
4383 |
|
|
;; Shorten x87->SSE reload sequences of fix_trunc?f?i_sse patterns.
|
4384 |
|
|
(define_peephole2
|
4385 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
4386 |
|
|
(match_operand:MODEF 1 "memory_operand" ""))
|
4387 |
|
|
(set (match_operand:SWI48x 2 "register_operand" "")
|
4388 |
|
|
(fix:SWI48x (match_dup 0)))]
|
4389 |
|
|
"TARGET_SHORTEN_X87_SSE
|
4390 |
|
|
&& !(TARGET_AVOID_VECTOR_DECODE && optimize_insn_for_speed_p ())
|
4391 |
|
|
&& peep2_reg_dead_p (2, operands[0])"
|
4392 |
|
|
[(set (match_dup 2) (fix:SWI48x (match_dup 1)))])
|
4393 |
|
|
|
4394 |
|
|
;; Avoid vector decoded forms of the instruction.
|
4395 |
|
|
(define_peephole2
|
4396 |
|
|
[(match_scratch:DF 2 "x")
|
4397 |
|
|
(set (match_operand:SWI48x 0 "register_operand" "")
|
4398 |
|
|
(fix:SWI48x (match_operand:DF 1 "memory_operand" "")))]
|
4399 |
|
|
"TARGET_SSE2 && TARGET_AVOID_VECTOR_DECODE && optimize_insn_for_speed_p ()"
|
4400 |
|
|
[(set (match_dup 2) (match_dup 1))
|
4401 |
|
|
(set (match_dup 0) (fix:SWI48x (match_dup 2)))])
|
4402 |
|
|
|
4403 |
|
|
(define_peephole2
|
4404 |
|
|
[(match_scratch:SF 2 "x")
|
4405 |
|
|
(set (match_operand:SWI48x 0 "register_operand" "")
|
4406 |
|
|
(fix:SWI48x (match_operand:SF 1 "memory_operand" "")))]
|
4407 |
|
|
"TARGET_AVOID_VECTOR_DECODE && optimize_insn_for_speed_p ()"
|
4408 |
|
|
[(set (match_dup 2) (match_dup 1))
|
4409 |
|
|
(set (match_dup 0) (fix:SWI48x (match_dup 2)))])
|
4410 |
|
|
|
4411 |
|
|
(define_insn_and_split "fix_trunc_fisttp_i387_1"
|
4412 |
|
|
[(set (match_operand:SWI248x 0 "nonimmediate_operand" "")
|
4413 |
|
|
(fix:SWI248x (match_operand 1 "register_operand" "")))]
|
4414 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
4415 |
|
|
&& TARGET_FISTTP
|
4416 |
|
|
&& !((SSE_FLOAT_MODE_P (GET_MODE (operands[1]))
|
4417 |
|
|
&& (TARGET_64BIT || mode != DImode))
|
4418 |
|
|
&& TARGET_SSE_MATH)
|
4419 |
|
|
&& can_create_pseudo_p ()"
|
4420 |
|
|
"#"
|
4421 |
|
|
"&& 1"
|
4422 |
|
|
[(const_int 0)]
|
4423 |
|
|
{
|
4424 |
|
|
if (memory_operand (operands[0], VOIDmode))
|
4425 |
|
|
emit_insn (gen_fix_trunc_i387_fisttp (operands[0], operands[1]));
|
4426 |
|
|
else
|
4427 |
|
|
{
|
4428 |
|
|
operands[2] = assign_386_stack_local (mode, SLOT_TEMP);
|
4429 |
|
|
emit_insn (gen_fix_trunc_i387_fisttp_with_temp (operands[0],
|
4430 |
|
|
operands[1],
|
4431 |
|
|
operands[2]));
|
4432 |
|
|
}
|
4433 |
|
|
DONE;
|
4434 |
|
|
}
|
4435 |
|
|
[(set_attr "type" "fisttp")
|
4436 |
|
|
(set_attr "mode" "")])
|
4437 |
|
|
|
4438 |
|
|
(define_insn "fix_trunc_i387_fisttp"
|
4439 |
|
|
[(set (match_operand:SWI248x 0 "memory_operand" "=m")
|
4440 |
|
|
(fix:SWI248x (match_operand 1 "register_operand" "f")))
|
4441 |
|
|
(clobber (match_scratch:XF 2 "=&1f"))]
|
4442 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
4443 |
|
|
&& TARGET_FISTTP
|
4444 |
|
|
&& !((SSE_FLOAT_MODE_P (GET_MODE (operands[1]))
|
4445 |
|
|
&& (TARGET_64BIT || mode != DImode))
|
4446 |
|
|
&& TARGET_SSE_MATH)"
|
4447 |
|
|
"* return output_fix_trunc (insn, operands, true);"
|
4448 |
|
|
[(set_attr "type" "fisttp")
|
4449 |
|
|
(set_attr "mode" "")])
|
4450 |
|
|
|
4451 |
|
|
(define_insn "fix_trunc_i387_fisttp_with_temp"
|
4452 |
|
|
[(set (match_operand:SWI248x 0 "nonimmediate_operand" "=m,?r")
|
4453 |
|
|
(fix:SWI248x (match_operand 1 "register_operand" "f,f")))
|
4454 |
|
|
(clobber (match_operand:SWI248x 2 "memory_operand" "=X,m"))
|
4455 |
|
|
(clobber (match_scratch:XF 3 "=&1f,&1f"))]
|
4456 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
4457 |
|
|
&& TARGET_FISTTP
|
4458 |
|
|
&& !((SSE_FLOAT_MODE_P (GET_MODE (operands[1]))
|
4459 |
|
|
&& (TARGET_64BIT || mode != DImode))
|
4460 |
|
|
&& TARGET_SSE_MATH)"
|
4461 |
|
|
"#"
|
4462 |
|
|
[(set_attr "type" "fisttp")
|
4463 |
|
|
(set_attr "mode" "")])
|
4464 |
|
|
|
4465 |
|
|
(define_split
|
4466 |
|
|
[(set (match_operand:SWI248x 0 "register_operand" "")
|
4467 |
|
|
(fix:SWI248x (match_operand 1 "register_operand" "")))
|
4468 |
|
|
(clobber (match_operand:SWI248x 2 "memory_operand" ""))
|
4469 |
|
|
(clobber (match_scratch 3 ""))]
|
4470 |
|
|
"reload_completed"
|
4471 |
|
|
[(parallel [(set (match_dup 2) (fix:SWI248x (match_dup 1)))
|
4472 |
|
|
(clobber (match_dup 3))])
|
4473 |
|
|
(set (match_dup 0) (match_dup 2))])
|
4474 |
|
|
|
4475 |
|
|
(define_split
|
4476 |
|
|
[(set (match_operand:SWI248x 0 "memory_operand" "")
|
4477 |
|
|
(fix:SWI248x (match_operand 1 "register_operand" "")))
|
4478 |
|
|
(clobber (match_operand:SWI248x 2 "memory_operand" ""))
|
4479 |
|
|
(clobber (match_scratch 3 ""))]
|
4480 |
|
|
"reload_completed"
|
4481 |
|
|
[(parallel [(set (match_dup 0) (fix:SWI248x (match_dup 1)))
|
4482 |
|
|
(clobber (match_dup 3))])])
|
4483 |
|
|
|
4484 |
|
|
;; See the comments in i386.h near OPTIMIZE_MODE_SWITCHING for the description
|
4485 |
|
|
;; of the machinery. Please note the clobber of FLAGS_REG. In i387 control
|
4486 |
|
|
;; word calculation (inserted by LCM in mode switching pass) a FLAGS_REG
|
4487 |
|
|
;; clobbering insns can be used. Look at emit_i387_cw_initialization ()
|
4488 |
|
|
;; function in i386.c.
|
4489 |
|
|
(define_insn_and_split "*fix_trunc_i387_1"
|
4490 |
|
|
[(set (match_operand:SWI248x 0 "nonimmediate_operand" "")
|
4491 |
|
|
(fix:SWI248x (match_operand 1 "register_operand" "")))
|
4492 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
4493 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
4494 |
|
|
&& !TARGET_FISTTP
|
4495 |
|
|
&& !(SSE_FLOAT_MODE_P (GET_MODE (operands[1]))
|
4496 |
|
|
&& (TARGET_64BIT || mode != DImode))
|
4497 |
|
|
&& can_create_pseudo_p ()"
|
4498 |
|
|
"#"
|
4499 |
|
|
"&& 1"
|
4500 |
|
|
[(const_int 0)]
|
4501 |
|
|
{
|
4502 |
|
|
ix86_optimize_mode_switching[I387_TRUNC] = 1;
|
4503 |
|
|
|
4504 |
|
|
operands[2] = assign_386_stack_local (HImode, SLOT_CW_STORED);
|
4505 |
|
|
operands[3] = assign_386_stack_local (HImode, SLOT_CW_TRUNC);
|
4506 |
|
|
if (memory_operand (operands[0], VOIDmode))
|
4507 |
|
|
emit_insn (gen_fix_trunc_i387 (operands[0], operands[1],
|
4508 |
|
|
operands[2], operands[3]));
|
4509 |
|
|
else
|
4510 |
|
|
{
|
4511 |
|
|
operands[4] = assign_386_stack_local (mode, SLOT_TEMP);
|
4512 |
|
|
emit_insn (gen_fix_trunc_i387_with_temp (operands[0], operands[1],
|
4513 |
|
|
operands[2], operands[3],
|
4514 |
|
|
operands[4]));
|
4515 |
|
|
}
|
4516 |
|
|
DONE;
|
4517 |
|
|
}
|
4518 |
|
|
[(set_attr "type" "fistp")
|
4519 |
|
|
(set_attr "i387_cw" "trunc")
|
4520 |
|
|
(set_attr "mode" "")])
|
4521 |
|
|
|
4522 |
|
|
(define_insn "fix_truncdi_i387"
|
4523 |
|
|
[(set (match_operand:DI 0 "memory_operand" "=m")
|
4524 |
|
|
(fix:DI (match_operand 1 "register_operand" "f")))
|
4525 |
|
|
(use (match_operand:HI 2 "memory_operand" "m"))
|
4526 |
|
|
(use (match_operand:HI 3 "memory_operand" "m"))
|
4527 |
|
|
(clobber (match_scratch:XF 4 "=&1f"))]
|
4528 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
4529 |
|
|
&& !TARGET_FISTTP
|
4530 |
|
|
&& !(TARGET_64BIT && SSE_FLOAT_MODE_P (GET_MODE (operands[1])))"
|
4531 |
|
|
"* return output_fix_trunc (insn, operands, false);"
|
4532 |
|
|
[(set_attr "type" "fistp")
|
4533 |
|
|
(set_attr "i387_cw" "trunc")
|
4534 |
|
|
(set_attr "mode" "DI")])
|
4535 |
|
|
|
4536 |
|
|
(define_insn "fix_truncdi_i387_with_temp"
|
4537 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "=m,?r")
|
4538 |
|
|
(fix:DI (match_operand 1 "register_operand" "f,f")))
|
4539 |
|
|
(use (match_operand:HI 2 "memory_operand" "m,m"))
|
4540 |
|
|
(use (match_operand:HI 3 "memory_operand" "m,m"))
|
4541 |
|
|
(clobber (match_operand:DI 4 "memory_operand" "=X,m"))
|
4542 |
|
|
(clobber (match_scratch:XF 5 "=&1f,&1f"))]
|
4543 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
4544 |
|
|
&& !TARGET_FISTTP
|
4545 |
|
|
&& !(TARGET_64BIT && SSE_FLOAT_MODE_P (GET_MODE (operands[1])))"
|
4546 |
|
|
"#"
|
4547 |
|
|
[(set_attr "type" "fistp")
|
4548 |
|
|
(set_attr "i387_cw" "trunc")
|
4549 |
|
|
(set_attr "mode" "DI")])
|
4550 |
|
|
|
4551 |
|
|
(define_split
|
4552 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
4553 |
|
|
(fix:DI (match_operand 1 "register_operand" "")))
|
4554 |
|
|
(use (match_operand:HI 2 "memory_operand" ""))
|
4555 |
|
|
(use (match_operand:HI 3 "memory_operand" ""))
|
4556 |
|
|
(clobber (match_operand:DI 4 "memory_operand" ""))
|
4557 |
|
|
(clobber (match_scratch 5 ""))]
|
4558 |
|
|
"reload_completed"
|
4559 |
|
|
[(parallel [(set (match_dup 4) (fix:DI (match_dup 1)))
|
4560 |
|
|
(use (match_dup 2))
|
4561 |
|
|
(use (match_dup 3))
|
4562 |
|
|
(clobber (match_dup 5))])
|
4563 |
|
|
(set (match_dup 0) (match_dup 4))])
|
4564 |
|
|
|
4565 |
|
|
(define_split
|
4566 |
|
|
[(set (match_operand:DI 0 "memory_operand" "")
|
4567 |
|
|
(fix:DI (match_operand 1 "register_operand" "")))
|
4568 |
|
|
(use (match_operand:HI 2 "memory_operand" ""))
|
4569 |
|
|
(use (match_operand:HI 3 "memory_operand" ""))
|
4570 |
|
|
(clobber (match_operand:DI 4 "memory_operand" ""))
|
4571 |
|
|
(clobber (match_scratch 5 ""))]
|
4572 |
|
|
"reload_completed"
|
4573 |
|
|
[(parallel [(set (match_dup 0) (fix:DI (match_dup 1)))
|
4574 |
|
|
(use (match_dup 2))
|
4575 |
|
|
(use (match_dup 3))
|
4576 |
|
|
(clobber (match_dup 5))])])
|
4577 |
|
|
|
4578 |
|
|
(define_insn "fix_trunc_i387"
|
4579 |
|
|
[(set (match_operand:SWI24 0 "memory_operand" "=m")
|
4580 |
|
|
(fix:SWI24 (match_operand 1 "register_operand" "f")))
|
4581 |
|
|
(use (match_operand:HI 2 "memory_operand" "m"))
|
4582 |
|
|
(use (match_operand:HI 3 "memory_operand" "m"))]
|
4583 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
4584 |
|
|
&& !TARGET_FISTTP
|
4585 |
|
|
&& !SSE_FLOAT_MODE_P (GET_MODE (operands[1]))"
|
4586 |
|
|
"* return output_fix_trunc (insn, operands, false);"
|
4587 |
|
|
[(set_attr "type" "fistp")
|
4588 |
|
|
(set_attr "i387_cw" "trunc")
|
4589 |
|
|
(set_attr "mode" "")])
|
4590 |
|
|
|
4591 |
|
|
(define_insn "fix_trunc_i387_with_temp"
|
4592 |
|
|
[(set (match_operand:SWI24 0 "nonimmediate_operand" "=m,?r")
|
4593 |
|
|
(fix:SWI24 (match_operand 1 "register_operand" "f,f")))
|
4594 |
|
|
(use (match_operand:HI 2 "memory_operand" "m,m"))
|
4595 |
|
|
(use (match_operand:HI 3 "memory_operand" "m,m"))
|
4596 |
|
|
(clobber (match_operand:SWI24 4 "memory_operand" "=X,m"))]
|
4597 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
4598 |
|
|
&& !TARGET_FISTTP
|
4599 |
|
|
&& !SSE_FLOAT_MODE_P (GET_MODE (operands[1]))"
|
4600 |
|
|
"#"
|
4601 |
|
|
[(set_attr "type" "fistp")
|
4602 |
|
|
(set_attr "i387_cw" "trunc")
|
4603 |
|
|
(set_attr "mode" "")])
|
4604 |
|
|
|
4605 |
|
|
(define_split
|
4606 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "")
|
4607 |
|
|
(fix:SWI24 (match_operand 1 "register_operand" "")))
|
4608 |
|
|
(use (match_operand:HI 2 "memory_operand" ""))
|
4609 |
|
|
(use (match_operand:HI 3 "memory_operand" ""))
|
4610 |
|
|
(clobber (match_operand:SWI24 4 "memory_operand" ""))]
|
4611 |
|
|
"reload_completed"
|
4612 |
|
|
[(parallel [(set (match_dup 4) (fix:SWI24 (match_dup 1)))
|
4613 |
|
|
(use (match_dup 2))
|
4614 |
|
|
(use (match_dup 3))])
|
4615 |
|
|
(set (match_dup 0) (match_dup 4))])
|
4616 |
|
|
|
4617 |
|
|
(define_split
|
4618 |
|
|
[(set (match_operand:SWI24 0 "memory_operand" "")
|
4619 |
|
|
(fix:SWI24 (match_operand 1 "register_operand" "")))
|
4620 |
|
|
(use (match_operand:HI 2 "memory_operand" ""))
|
4621 |
|
|
(use (match_operand:HI 3 "memory_operand" ""))
|
4622 |
|
|
(clobber (match_operand:SWI24 4 "memory_operand" ""))]
|
4623 |
|
|
"reload_completed"
|
4624 |
|
|
[(parallel [(set (match_dup 0) (fix:SWI24 (match_dup 1)))
|
4625 |
|
|
(use (match_dup 2))
|
4626 |
|
|
(use (match_dup 3))])])
|
4627 |
|
|
|
4628 |
|
|
(define_insn "x86_fnstcw_1"
|
4629 |
|
|
[(set (match_operand:HI 0 "memory_operand" "=m")
|
4630 |
|
|
(unspec:HI [(reg:HI FPCR_REG)] UNSPEC_FSTCW))]
|
4631 |
|
|
"TARGET_80387"
|
4632 |
|
|
"fnstcw\t%0"
|
4633 |
|
|
[(set (attr "length")
|
4634 |
|
|
(symbol_ref "ix86_attr_length_address_default (insn) + 2"))
|
4635 |
|
|
(set_attr "mode" "HI")
|
4636 |
|
|
(set_attr "unit" "i387")
|
4637 |
|
|
(set_attr "bdver1_decode" "vector")])
|
4638 |
|
|
|
4639 |
|
|
(define_insn "x86_fldcw_1"
|
4640 |
|
|
[(set (reg:HI FPCR_REG)
|
4641 |
|
|
(unspec:HI [(match_operand:HI 0 "memory_operand" "m")] UNSPEC_FLDCW))]
|
4642 |
|
|
"TARGET_80387"
|
4643 |
|
|
"fldcw\t%0"
|
4644 |
|
|
[(set (attr "length")
|
4645 |
|
|
(symbol_ref "ix86_attr_length_address_default (insn) + 2"))
|
4646 |
|
|
(set_attr "mode" "HI")
|
4647 |
|
|
(set_attr "unit" "i387")
|
4648 |
|
|
(set_attr "athlon_decode" "vector")
|
4649 |
|
|
(set_attr "amdfam10_decode" "vector")
|
4650 |
|
|
(set_attr "bdver1_decode" "vector")])
|
4651 |
|
|
|
4652 |
|
|
;; Conversion between fixed point and floating point.
|
4653 |
|
|
|
4654 |
|
|
;; Even though we only accept memory inputs, the backend _really_
|
4655 |
|
|
;; wants to be able to do this between registers.
|
4656 |
|
|
|
4657 |
|
|
(define_expand "floathi2"
|
4658 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "")
|
4659 |
|
|
(float:X87MODEF (match_operand:HI 1 "nonimmediate_operand" "")))]
|
4660 |
|
|
"TARGET_80387
|
4661 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
4662 |
|
|
|| TARGET_MIX_SSE_I387)")
|
4663 |
|
|
|
4664 |
|
|
;; Pre-reload splitter to add memory clobber to the pattern.
|
4665 |
|
|
(define_insn_and_split "*floathi2_1"
|
4666 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "")
|
4667 |
|
|
(float:X87MODEF (match_operand:HI 1 "register_operand" "")))]
|
4668 |
|
|
"TARGET_80387
|
4669 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
4670 |
|
|
|| TARGET_MIX_SSE_I387)
|
4671 |
|
|
&& can_create_pseudo_p ()"
|
4672 |
|
|
"#"
|
4673 |
|
|
"&& 1"
|
4674 |
|
|
[(parallel [(set (match_dup 0)
|
4675 |
|
|
(float:X87MODEF (match_dup 1)))
|
4676 |
|
|
(clobber (match_dup 2))])]
|
4677 |
|
|
"operands[2] = assign_386_stack_local (HImode, SLOT_TEMP);")
|
4678 |
|
|
|
4679 |
|
|
(define_insn "*floathi2_i387_with_temp"
|
4680 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "=f,f")
|
4681 |
|
|
(float:X87MODEF (match_operand:HI 1 "nonimmediate_operand" "m,?r")))
|
4682 |
|
|
(clobber (match_operand:HI 2 "memory_operand" "=X,m"))]
|
4683 |
|
|
"TARGET_80387
|
4684 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
4685 |
|
|
|| TARGET_MIX_SSE_I387)"
|
4686 |
|
|
"#"
|
4687 |
|
|
[(set_attr "type" "fmov,multi")
|
4688 |
|
|
(set_attr "mode" "")
|
4689 |
|
|
(set_attr "unit" "*,i387")
|
4690 |
|
|
(set_attr "fp_int_src" "true")])
|
4691 |
|
|
|
4692 |
|
|
(define_insn "*floathi2_i387"
|
4693 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "=f")
|
4694 |
|
|
(float:X87MODEF (match_operand:HI 1 "memory_operand" "m")))]
|
4695 |
|
|
"TARGET_80387
|
4696 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
4697 |
|
|
|| TARGET_MIX_SSE_I387)"
|
4698 |
|
|
"fild%Z1\t%1"
|
4699 |
|
|
[(set_attr "type" "fmov")
|
4700 |
|
|
(set_attr "mode" "")
|
4701 |
|
|
(set_attr "fp_int_src" "true")])
|
4702 |
|
|
|
4703 |
|
|
(define_split
|
4704 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "")
|
4705 |
|
|
(float:X87MODEF (match_operand:HI 1 "register_operand" "")))
|
4706 |
|
|
(clobber (match_operand:HI 2 "memory_operand" ""))]
|
4707 |
|
|
"TARGET_80387
|
4708 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
4709 |
|
|
|| TARGET_MIX_SSE_I387)
|
4710 |
|
|
&& reload_completed"
|
4711 |
|
|
[(set (match_dup 2) (match_dup 1))
|
4712 |
|
|
(set (match_dup 0) (float:X87MODEF (match_dup 2)))])
|
4713 |
|
|
|
4714 |
|
|
(define_split
|
4715 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "")
|
4716 |
|
|
(float:X87MODEF (match_operand:HI 1 "memory_operand" "")))
|
4717 |
|
|
(clobber (match_operand:HI 2 "memory_operand" ""))]
|
4718 |
|
|
"TARGET_80387
|
4719 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
4720 |
|
|
|| TARGET_MIX_SSE_I387)
|
4721 |
|
|
&& reload_completed"
|
4722 |
|
|
[(set (match_dup 0) (float:X87MODEF (match_dup 1)))])
|
4723 |
|
|
|
4724 |
|
|
(define_expand "float2"
|
4725 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "")
|
4726 |
|
|
(float:X87MODEF
|
4727 |
|
|
(match_operand:SWI48x 1 "nonimmediate_operand" "")))]
|
4728 |
|
|
"TARGET_80387
|
4729 |
|
|
|| ((mode != DImode || TARGET_64BIT)
|
4730 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)"
|
4731 |
|
|
{
|
4732 |
|
|
if (!((mode != DImode || TARGET_64BIT)
|
4733 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
4734 |
|
|
&& !X87_ENABLE_FLOAT (mode, mode))
|
4735 |
|
|
{
|
4736 |
|
|
rtx reg = gen_reg_rtx (XFmode);
|
4737 |
|
|
rtx (*insn)(rtx, rtx);
|
4738 |
|
|
|
4739 |
|
|
emit_insn (gen_floatxf2 (reg, operands[1]));
|
4740 |
|
|
|
4741 |
|
|
if (mode == SFmode)
|
4742 |
|
|
insn = gen_truncxfsf2;
|
4743 |
|
|
else if (mode == DFmode)
|
4744 |
|
|
insn = gen_truncxfdf2;
|
4745 |
|
|
else
|
4746 |
|
|
gcc_unreachable ();
|
4747 |
|
|
|
4748 |
|
|
emit_insn (insn (operands[0], reg));
|
4749 |
|
|
DONE;
|
4750 |
|
|
}
|
4751 |
|
|
})
|
4752 |
|
|
|
4753 |
|
|
;; Pre-reload splitter to add memory clobber to the pattern.
|
4754 |
|
|
(define_insn_and_split "*float2_1"
|
4755 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "")
|
4756 |
|
|
(float:X87MODEF (match_operand:SWI48x 1 "register_operand" "")))]
|
4757 |
|
|
"((TARGET_80387
|
4758 |
|
|
&& X87_ENABLE_FLOAT (mode, mode)
|
4759 |
|
|
&& (!((mode != DImode || TARGET_64BIT)
|
4760 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
4761 |
|
|
|| TARGET_MIX_SSE_I387))
|
4762 |
|
|
|| ((mode != DImode || TARGET_64BIT)
|
4763 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
4764 |
|
|
&& ((mode == SImode
|
4765 |
|
|
&& TARGET_SSE2 && TARGET_USE_VECTOR_CONVERTS
|
4766 |
|
|
&& optimize_function_for_speed_p (cfun)
|
4767 |
|
|
&& flag_trapping_math)
|
4768 |
|
|
|| !(TARGET_INTER_UNIT_CONVERSIONS
|
4769 |
|
|
|| optimize_function_for_size_p (cfun)))))
|
4770 |
|
|
&& can_create_pseudo_p ()"
|
4771 |
|
|
"#"
|
4772 |
|
|
"&& 1"
|
4773 |
|
|
[(parallel [(set (match_dup 0) (float:X87MODEF (match_dup 1)))
|
4774 |
|
|
(clobber (match_dup 2))])]
|
4775 |
|
|
{
|
4776 |
|
|
operands[2] = assign_386_stack_local (mode, SLOT_TEMP);
|
4777 |
|
|
|
4778 |
|
|
/* Avoid store forwarding (partial memory) stall penalty
|
4779 |
|
|
by passing DImode value through XMM registers. */
|
4780 |
|
|
if (mode == DImode && !TARGET_64BIT
|
4781 |
|
|
&& TARGET_80387 && TARGET_SSE2 && TARGET_INTER_UNIT_MOVES
|
4782 |
|
|
&& optimize_function_for_speed_p (cfun))
|
4783 |
|
|
{
|
4784 |
|
|
emit_insn (gen_floatdi2_i387_with_xmm (operands[0],
|
4785 |
|
|
operands[1],
|
4786 |
|
|
operands[2]));
|
4787 |
|
|
DONE;
|
4788 |
|
|
}
|
4789 |
|
|
})
|
4790 |
|
|
|
4791 |
|
|
(define_insn "*floatsi2_vector_mixed_with_temp"
|
4792 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f,f,x,x,x")
|
4793 |
|
|
(float:MODEF
|
4794 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "m,?r,r,m,!x")))
|
4795 |
|
|
(clobber (match_operand:SI 2 "memory_operand" "=X,m,m,X,m"))]
|
4796 |
|
|
"TARGET_SSE2 && TARGET_MIX_SSE_I387
|
4797 |
|
|
&& TARGET_USE_VECTOR_CONVERTS && optimize_function_for_speed_p (cfun)"
|
4798 |
|
|
"#"
|
4799 |
|
|
[(set_attr "type" "fmov,multi,sseicvt,sseicvt,sseicvt")
|
4800 |
|
|
(set_attr "mode" ",,,,")
|
4801 |
|
|
(set_attr "unit" "*,i387,*,*,*")
|
4802 |
|
|
(set_attr "athlon_decode" "*,*,double,direct,double")
|
4803 |
|
|
(set_attr "amdfam10_decode" "*,*,vector,double,double")
|
4804 |
|
|
(set_attr "bdver1_decode" "*,*,double,direct,double")
|
4805 |
|
|
(set_attr "fp_int_src" "true")])
|
4806 |
|
|
|
4807 |
|
|
(define_insn "*floatsi2_vector_mixed"
|
4808 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f,x")
|
4809 |
|
|
(float:MODEF (match_operand:SI 1 "memory_operand" "m,m")))]
|
4810 |
|
|
"TARGET_SSE2 && TARGET_MIX_SSE_I387
|
4811 |
|
|
&& TARGET_USE_VECTOR_CONVERTS && optimize_function_for_speed_p (cfun)"
|
4812 |
|
|
"@
|
4813 |
|
|
fild%Z1\t%1
|
4814 |
|
|
#"
|
4815 |
|
|
[(set_attr "type" "fmov,sseicvt")
|
4816 |
|
|
(set_attr "mode" ",")
|
4817 |
|
|
(set_attr "unit" "i387,*")
|
4818 |
|
|
(set_attr "athlon_decode" "*,direct")
|
4819 |
|
|
(set_attr "amdfam10_decode" "*,double")
|
4820 |
|
|
(set_attr "bdver1_decode" "*,direct")
|
4821 |
|
|
(set_attr "fp_int_src" "true")])
|
4822 |
|
|
|
4823 |
|
|
(define_insn "*float2_mixed_with_temp"
|
4824 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f,f,x,x")
|
4825 |
|
|
(float:MODEF
|
4826 |
|
|
(match_operand:SWI48x 1 "nonimmediate_operand" "m,?r,r,m")))
|
4827 |
|
|
(clobber (match_operand:SWI48x 2 "memory_operand" "=X,m,m,X"))]
|
4828 |
|
|
"(mode != DImode || TARGET_64BIT)
|
4829 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_MIX_SSE_I387"
|
4830 |
|
|
"#"
|
4831 |
|
|
[(set_attr "type" "fmov,multi,sseicvt,sseicvt")
|
4832 |
|
|
(set_attr "mode" "")
|
4833 |
|
|
(set_attr "unit" "*,i387,*,*")
|
4834 |
|
|
(set_attr "athlon_decode" "*,*,double,direct")
|
4835 |
|
|
(set_attr "amdfam10_decode" "*,*,vector,double")
|
4836 |
|
|
(set_attr "bdver1_decode" "*,*,double,direct")
|
4837 |
|
|
(set_attr "fp_int_src" "true")])
|
4838 |
|
|
|
4839 |
|
|
(define_split
|
4840 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
4841 |
|
|
(float:MODEF (match_operand:SWI48x 1 "register_operand" "")))
|
4842 |
|
|
(clobber (match_operand:SWI48x 2 "memory_operand" ""))]
|
4843 |
|
|
"(mode != DImode || TARGET_64BIT)
|
4844 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_MIX_SSE_I387
|
4845 |
|
|
&& TARGET_INTER_UNIT_CONVERSIONS
|
4846 |
|
|
&& reload_completed
|
4847 |
|
|
&& (SSE_REG_P (operands[0])
|
4848 |
|
|
|| (GET_CODE (operands[0]) == SUBREG
|
4849 |
|
|
&& SSE_REG_P (SUBREG_REG (operands[0]))))"
|
4850 |
|
|
[(set (match_dup 0) (float:MODEF (match_dup 1)))])
|
4851 |
|
|
|
4852 |
|
|
(define_split
|
4853 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
4854 |
|
|
(float:MODEF (match_operand:SWI48x 1 "register_operand" "")))
|
4855 |
|
|
(clobber (match_operand:SWI48x 2 "memory_operand" ""))]
|
4856 |
|
|
"(mode != DImode || TARGET_64BIT)
|
4857 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_MIX_SSE_I387
|
4858 |
|
|
&& !(TARGET_INTER_UNIT_CONVERSIONS || optimize_function_for_size_p (cfun))
|
4859 |
|
|
&& reload_completed
|
4860 |
|
|
&& (SSE_REG_P (operands[0])
|
4861 |
|
|
|| (GET_CODE (operands[0]) == SUBREG
|
4862 |
|
|
&& SSE_REG_P (SUBREG_REG (operands[0]))))"
|
4863 |
|
|
[(set (match_dup 2) (match_dup 1))
|
4864 |
|
|
(set (match_dup 0) (float:MODEF (match_dup 2)))])
|
4865 |
|
|
|
4866 |
|
|
(define_insn "*float2_mixed_interunit"
|
4867 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f,x,x")
|
4868 |
|
|
(float:MODEF
|
4869 |
|
|
(match_operand:SWI48x 1 "nonimmediate_operand" "m,r,m")))]
|
4870 |
|
|
"(mode != DImode || TARGET_64BIT)
|
4871 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_MIX_SSE_I387
|
4872 |
|
|
&& (TARGET_INTER_UNIT_CONVERSIONS || optimize_function_for_size_p (cfun))"
|
4873 |
|
|
"@
|
4874 |
|
|
fild%Z1\t%1
|
4875 |
|
|
%vcvtsi2\t{%1, %d0|%d0, %1}
|
4876 |
|
|
%vcvtsi2\t{%1, %d0|%d0, %1}"
|
4877 |
|
|
[(set_attr "type" "fmov,sseicvt,sseicvt")
|
4878 |
|
|
(set_attr "prefix" "orig,maybe_vex,maybe_vex")
|
4879 |
|
|
(set_attr "mode" "")
|
4880 |
|
|
(set (attr "prefix_rex")
|
4881 |
|
|
(if_then_else
|
4882 |
|
|
(and (eq_attr "prefix" "maybe_vex")
|
4883 |
|
|
(match_test "mode == DImode"))
|
4884 |
|
|
(const_string "1")
|
4885 |
|
|
(const_string "*")))
|
4886 |
|
|
(set_attr "unit" "i387,*,*")
|
4887 |
|
|
(set_attr "athlon_decode" "*,double,direct")
|
4888 |
|
|
(set_attr "amdfam10_decode" "*,vector,double")
|
4889 |
|
|
(set_attr "bdver1_decode" "*,double,direct")
|
4890 |
|
|
(set_attr "fp_int_src" "true")])
|
4891 |
|
|
|
4892 |
|
|
(define_insn "*float2_mixed_nointerunit"
|
4893 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f,x")
|
4894 |
|
|
(float:MODEF
|
4895 |
|
|
(match_operand:SWI48x 1 "memory_operand" "m,m")))]
|
4896 |
|
|
"(mode != DImode || TARGET_64BIT)
|
4897 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_MIX_SSE_I387
|
4898 |
|
|
&& !(TARGET_INTER_UNIT_CONVERSIONS || optimize_function_for_size_p (cfun))"
|
4899 |
|
|
"@
|
4900 |
|
|
fild%Z1\t%1
|
4901 |
|
|
%vcvtsi2\t{%1, %d0|%d0, %1}"
|
4902 |
|
|
[(set_attr "type" "fmov,sseicvt")
|
4903 |
|
|
(set_attr "prefix" "orig,maybe_vex")
|
4904 |
|
|
(set_attr "mode" "")
|
4905 |
|
|
(set (attr "prefix_rex")
|
4906 |
|
|
(if_then_else
|
4907 |
|
|
(and (eq_attr "prefix" "maybe_vex")
|
4908 |
|
|
(match_test "mode == DImode"))
|
4909 |
|
|
(const_string "1")
|
4910 |
|
|
(const_string "*")))
|
4911 |
|
|
(set_attr "athlon_decode" "*,direct")
|
4912 |
|
|
(set_attr "amdfam10_decode" "*,double")
|
4913 |
|
|
(set_attr "bdver1_decode" "*,direct")
|
4914 |
|
|
(set_attr "fp_int_src" "true")])
|
4915 |
|
|
|
4916 |
|
|
(define_insn "*floatsi2_vector_sse_with_temp"
|
4917 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x,x,x")
|
4918 |
|
|
(float:MODEF
|
4919 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "r,m,!x")))
|
4920 |
|
|
(clobber (match_operand:SI 2 "memory_operand" "=m,X,m"))]
|
4921 |
|
|
"TARGET_SSE2 && TARGET_SSE_MATH
|
4922 |
|
|
&& TARGET_USE_VECTOR_CONVERTS && optimize_function_for_speed_p (cfun)"
|
4923 |
|
|
"#"
|
4924 |
|
|
[(set_attr "type" "sseicvt")
|
4925 |
|
|
(set_attr "mode" ",,")
|
4926 |
|
|
(set_attr "athlon_decode" "double,direct,double")
|
4927 |
|
|
(set_attr "amdfam10_decode" "vector,double,double")
|
4928 |
|
|
(set_attr "bdver1_decode" "double,direct,double")
|
4929 |
|
|
(set_attr "fp_int_src" "true")])
|
4930 |
|
|
|
4931 |
|
|
(define_insn "*floatsi2_vector_sse"
|
4932 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x")
|
4933 |
|
|
(float:MODEF (match_operand:SI 1 "memory_operand" "m")))]
|
4934 |
|
|
"TARGET_SSE2 && TARGET_SSE_MATH
|
4935 |
|
|
&& TARGET_USE_VECTOR_CONVERTS && optimize_function_for_speed_p (cfun)"
|
4936 |
|
|
"#"
|
4937 |
|
|
[(set_attr "type" "sseicvt")
|
4938 |
|
|
(set_attr "mode" "")
|
4939 |
|
|
(set_attr "athlon_decode" "direct")
|
4940 |
|
|
(set_attr "amdfam10_decode" "double")
|
4941 |
|
|
(set_attr "bdver1_decode" "direct")
|
4942 |
|
|
(set_attr "fp_int_src" "true")])
|
4943 |
|
|
|
4944 |
|
|
(define_split
|
4945 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
4946 |
|
|
(float:MODEF (match_operand:SI 1 "register_operand" "")))
|
4947 |
|
|
(clobber (match_operand:SI 2 "memory_operand" ""))]
|
4948 |
|
|
"TARGET_SSE2 && TARGET_SSE_MATH
|
4949 |
|
|
&& TARGET_USE_VECTOR_CONVERTS && optimize_function_for_speed_p (cfun)
|
4950 |
|
|
&& reload_completed
|
4951 |
|
|
&& (SSE_REG_P (operands[0])
|
4952 |
|
|
|| (GET_CODE (operands[0]) == SUBREG
|
4953 |
|
|
&& SSE_REG_P (SUBREG_REG (operands[0]))))"
|
4954 |
|
|
[(const_int 0)]
|
4955 |
|
|
{
|
4956 |
|
|
rtx op1 = operands[1];
|
4957 |
|
|
|
4958 |
|
|
operands[3] = simplify_gen_subreg (mode, operands[0],
|
4959 |
|
|
mode, 0);
|
4960 |
|
|
if (GET_CODE (op1) == SUBREG)
|
4961 |
|
|
op1 = SUBREG_REG (op1);
|
4962 |
|
|
|
4963 |
|
|
if (GENERAL_REG_P (op1) && TARGET_INTER_UNIT_MOVES)
|
4964 |
|
|
{
|
4965 |
|
|
operands[4] = simplify_gen_subreg (V4SImode, operands[0], mode, 0);
|
4966 |
|
|
emit_insn (gen_sse2_loadld (operands[4],
|
4967 |
|
|
CONST0_RTX (V4SImode), operands[1]));
|
4968 |
|
|
}
|
4969 |
|
|
/* We can ignore possible trapping value in the
|
4970 |
|
|
high part of SSE register for non-trapping math. */
|
4971 |
|
|
else if (SSE_REG_P (op1) && !flag_trapping_math)
|
4972 |
|
|
operands[4] = simplify_gen_subreg (V4SImode, operands[1], SImode, 0);
|
4973 |
|
|
else
|
4974 |
|
|
{
|
4975 |
|
|
operands[4] = simplify_gen_subreg (V4SImode, operands[0], mode, 0);
|
4976 |
|
|
emit_move_insn (operands[2], operands[1]);
|
4977 |
|
|
emit_insn (gen_sse2_loadld (operands[4],
|
4978 |
|
|
CONST0_RTX (V4SImode), operands[2]));
|
4979 |
|
|
}
|
4980 |
|
|
if (mode == V4SFmode)
|
4981 |
|
|
emit_insn (gen_floatv4siv4sf2 (operands[3], operands[4]));
|
4982 |
|
|
else
|
4983 |
|
|
emit_insn (gen_sse2_cvtdq2pd (operands[3], operands[4]));
|
4984 |
|
|
DONE;
|
4985 |
|
|
})
|
4986 |
|
|
|
4987 |
|
|
(define_split
|
4988 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
4989 |
|
|
(float:MODEF (match_operand:SI 1 "memory_operand" "")))
|
4990 |
|
|
(clobber (match_operand:SI 2 "memory_operand" ""))]
|
4991 |
|
|
"TARGET_SSE2 && TARGET_SSE_MATH
|
4992 |
|
|
&& TARGET_USE_VECTOR_CONVERTS && optimize_function_for_speed_p (cfun)
|
4993 |
|
|
&& reload_completed
|
4994 |
|
|
&& (SSE_REG_P (operands[0])
|
4995 |
|
|
|| (GET_CODE (operands[0]) == SUBREG
|
4996 |
|
|
&& SSE_REG_P (SUBREG_REG (operands[0]))))"
|
4997 |
|
|
[(const_int 0)]
|
4998 |
|
|
{
|
4999 |
|
|
operands[3] = simplify_gen_subreg (mode, operands[0],
|
5000 |
|
|
mode, 0);
|
5001 |
|
|
operands[4] = simplify_gen_subreg (V4SImode, operands[0], mode, 0);
|
5002 |
|
|
|
5003 |
|
|
emit_insn (gen_sse2_loadld (operands[4],
|
5004 |
|
|
CONST0_RTX (V4SImode), operands[1]));
|
5005 |
|
|
if (mode == V4SFmode)
|
5006 |
|
|
emit_insn (gen_floatv4siv4sf2 (operands[3], operands[4]));
|
5007 |
|
|
else
|
5008 |
|
|
emit_insn (gen_sse2_cvtdq2pd (operands[3], operands[4]));
|
5009 |
|
|
DONE;
|
5010 |
|
|
})
|
5011 |
|
|
|
5012 |
|
|
(define_split
|
5013 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
5014 |
|
|
(float:MODEF (match_operand:SI 1 "register_operand" "")))]
|
5015 |
|
|
"TARGET_SSE2 && TARGET_SSE_MATH
|
5016 |
|
|
&& TARGET_USE_VECTOR_CONVERTS && optimize_function_for_speed_p (cfun)
|
5017 |
|
|
&& reload_completed
|
5018 |
|
|
&& (SSE_REG_P (operands[0])
|
5019 |
|
|
|| (GET_CODE (operands[0]) == SUBREG
|
5020 |
|
|
&& SSE_REG_P (SUBREG_REG (operands[0]))))"
|
5021 |
|
|
[(const_int 0)]
|
5022 |
|
|
{
|
5023 |
|
|
rtx op1 = operands[1];
|
5024 |
|
|
|
5025 |
|
|
operands[3] = simplify_gen_subreg (mode, operands[0],
|
5026 |
|
|
mode, 0);
|
5027 |
|
|
if (GET_CODE (op1) == SUBREG)
|
5028 |
|
|
op1 = SUBREG_REG (op1);
|
5029 |
|
|
|
5030 |
|
|
if (GENERAL_REG_P (op1))
|
5031 |
|
|
{
|
5032 |
|
|
operands[4] = simplify_gen_subreg (V4SImode, operands[0], mode, 0);
|
5033 |
|
|
if (TARGET_INTER_UNIT_MOVES)
|
5034 |
|
|
emit_insn (gen_sse2_loadld (operands[4],
|
5035 |
|
|
CONST0_RTX (V4SImode), operands[1]));
|
5036 |
|
|
else
|
5037 |
|
|
{
|
5038 |
|
|
operands[5] = ix86_force_to_memory (GET_MODE (operands[1]),
|
5039 |
|
|
operands[1]);
|
5040 |
|
|
emit_insn (gen_sse2_loadld (operands[4],
|
5041 |
|
|
CONST0_RTX (V4SImode), operands[5]));
|
5042 |
|
|
ix86_free_from_memory (GET_MODE (operands[1]));
|
5043 |
|
|
}
|
5044 |
|
|
}
|
5045 |
|
|
/* We can ignore possible trapping value in the
|
5046 |
|
|
high part of SSE register for non-trapping math. */
|
5047 |
|
|
else if (SSE_REG_P (op1) && !flag_trapping_math)
|
5048 |
|
|
operands[4] = simplify_gen_subreg (V4SImode, operands[1], SImode, 0);
|
5049 |
|
|
else
|
5050 |
|
|
gcc_unreachable ();
|
5051 |
|
|
if (mode == V4SFmode)
|
5052 |
|
|
emit_insn (gen_floatv4siv4sf2 (operands[3], operands[4]));
|
5053 |
|
|
else
|
5054 |
|
|
emit_insn (gen_sse2_cvtdq2pd (operands[3], operands[4]));
|
5055 |
|
|
DONE;
|
5056 |
|
|
})
|
5057 |
|
|
|
5058 |
|
|
(define_split
|
5059 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
5060 |
|
|
(float:MODEF (match_operand:SI 1 "memory_operand" "")))]
|
5061 |
|
|
"TARGET_SSE2 && TARGET_SSE_MATH
|
5062 |
|
|
&& TARGET_USE_VECTOR_CONVERTS && optimize_function_for_speed_p (cfun)
|
5063 |
|
|
&& reload_completed
|
5064 |
|
|
&& (SSE_REG_P (operands[0])
|
5065 |
|
|
|| (GET_CODE (operands[0]) == SUBREG
|
5066 |
|
|
&& SSE_REG_P (SUBREG_REG (operands[0]))))"
|
5067 |
|
|
[(const_int 0)]
|
5068 |
|
|
{
|
5069 |
|
|
operands[3] = simplify_gen_subreg (mode, operands[0],
|
5070 |
|
|
mode, 0);
|
5071 |
|
|
operands[4] = simplify_gen_subreg (V4SImode, operands[0], mode, 0);
|
5072 |
|
|
|
5073 |
|
|
emit_insn (gen_sse2_loadld (operands[4],
|
5074 |
|
|
CONST0_RTX (V4SImode), operands[1]));
|
5075 |
|
|
if (mode == V4SFmode)
|
5076 |
|
|
emit_insn (gen_floatv4siv4sf2 (operands[3], operands[4]));
|
5077 |
|
|
else
|
5078 |
|
|
emit_insn (gen_sse2_cvtdq2pd (operands[3], operands[4]));
|
5079 |
|
|
DONE;
|
5080 |
|
|
})
|
5081 |
|
|
|
5082 |
|
|
(define_insn "*float2_sse_with_temp"
|
5083 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x,x")
|
5084 |
|
|
(float:MODEF
|
5085 |
|
|
(match_operand:SWI48x 1 "nonimmediate_operand" "r,m")))
|
5086 |
|
|
(clobber (match_operand:SWI48x 2 "memory_operand" "=m,X"))]
|
5087 |
|
|
"(mode != DImode || TARGET_64BIT)
|
5088 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH"
|
5089 |
|
|
"#"
|
5090 |
|
|
[(set_attr "type" "sseicvt")
|
5091 |
|
|
(set_attr "mode" "")
|
5092 |
|
|
(set_attr "athlon_decode" "double,direct")
|
5093 |
|
|
(set_attr "amdfam10_decode" "vector,double")
|
5094 |
|
|
(set_attr "bdver1_decode" "double,direct")
|
5095 |
|
|
(set_attr "fp_int_src" "true")])
|
5096 |
|
|
|
5097 |
|
|
(define_insn "*float2_sse_interunit"
|
5098 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x,x")
|
5099 |
|
|
(float:MODEF
|
5100 |
|
|
(match_operand:SWI48x 1 "nonimmediate_operand" "r,m")))]
|
5101 |
|
|
"(mode != DImode || TARGET_64BIT)
|
5102 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
5103 |
|
|
&& (TARGET_INTER_UNIT_CONVERSIONS || optimize_function_for_size_p (cfun))"
|
5104 |
|
|
"%vcvtsi2\t{%1, %d0|%d0, %1}"
|
5105 |
|
|
[(set_attr "type" "sseicvt")
|
5106 |
|
|
(set_attr "prefix" "maybe_vex")
|
5107 |
|
|
(set_attr "mode" "")
|
5108 |
|
|
(set (attr "prefix_rex")
|
5109 |
|
|
(if_then_else
|
5110 |
|
|
(and (eq_attr "prefix" "maybe_vex")
|
5111 |
|
|
(match_test "mode == DImode"))
|
5112 |
|
|
(const_string "1")
|
5113 |
|
|
(const_string "*")))
|
5114 |
|
|
(set_attr "athlon_decode" "double,direct")
|
5115 |
|
|
(set_attr "amdfam10_decode" "vector,double")
|
5116 |
|
|
(set_attr "bdver1_decode" "double,direct")
|
5117 |
|
|
(set_attr "fp_int_src" "true")])
|
5118 |
|
|
|
5119 |
|
|
(define_split
|
5120 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
5121 |
|
|
(float:MODEF (match_operand:SWI48x 1 "nonimmediate_operand" "")))
|
5122 |
|
|
(clobber (match_operand:SWI48x 2 "memory_operand" ""))]
|
5123 |
|
|
"(mode != DImode || TARGET_64BIT)
|
5124 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
5125 |
|
|
&& (TARGET_INTER_UNIT_CONVERSIONS || optimize_function_for_size_p (cfun))
|
5126 |
|
|
&& reload_completed
|
5127 |
|
|
&& (SSE_REG_P (operands[0])
|
5128 |
|
|
|| (GET_CODE (operands[0]) == SUBREG
|
5129 |
|
|
&& SSE_REG_P (SUBREG_REG (operands[0]))))"
|
5130 |
|
|
[(set (match_dup 0) (float:MODEF (match_dup 1)))])
|
5131 |
|
|
|
5132 |
|
|
(define_insn "*float2_sse_nointerunit"
|
5133 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x")
|
5134 |
|
|
(float:MODEF
|
5135 |
|
|
(match_operand:SWI48x 1 "memory_operand" "m")))]
|
5136 |
|
|
"(mode != DImode || TARGET_64BIT)
|
5137 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
5138 |
|
|
&& !(TARGET_INTER_UNIT_CONVERSIONS || optimize_function_for_size_p (cfun))"
|
5139 |
|
|
"%vcvtsi2\t{%1, %d0|%d0, %1}"
|
5140 |
|
|
[(set_attr "type" "sseicvt")
|
5141 |
|
|
(set_attr "prefix" "maybe_vex")
|
5142 |
|
|
(set_attr "mode" "")
|
5143 |
|
|
(set (attr "prefix_rex")
|
5144 |
|
|
(if_then_else
|
5145 |
|
|
(and (eq_attr "prefix" "maybe_vex")
|
5146 |
|
|
(match_test "mode == DImode"))
|
5147 |
|
|
(const_string "1")
|
5148 |
|
|
(const_string "*")))
|
5149 |
|
|
(set_attr "athlon_decode" "direct")
|
5150 |
|
|
(set_attr "amdfam10_decode" "double")
|
5151 |
|
|
(set_attr "bdver1_decode" "direct")
|
5152 |
|
|
(set_attr "fp_int_src" "true")])
|
5153 |
|
|
|
5154 |
|
|
(define_split
|
5155 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
5156 |
|
|
(float:MODEF (match_operand:SWI48x 1 "register_operand" "")))
|
5157 |
|
|
(clobber (match_operand:SWI48x 2 "memory_operand" ""))]
|
5158 |
|
|
"(mode != DImode || TARGET_64BIT)
|
5159 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
5160 |
|
|
&& !(TARGET_INTER_UNIT_CONVERSIONS || optimize_function_for_size_p (cfun))
|
5161 |
|
|
&& reload_completed
|
5162 |
|
|
&& (SSE_REG_P (operands[0])
|
5163 |
|
|
|| (GET_CODE (operands[0]) == SUBREG
|
5164 |
|
|
&& SSE_REG_P (SUBREG_REG (operands[0]))))"
|
5165 |
|
|
[(set (match_dup 2) (match_dup 1))
|
5166 |
|
|
(set (match_dup 0) (float:MODEF (match_dup 2)))])
|
5167 |
|
|
|
5168 |
|
|
(define_split
|
5169 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
5170 |
|
|
(float:MODEF (match_operand:SWI48x 1 "memory_operand" "")))
|
5171 |
|
|
(clobber (match_operand:SWI48x 2 "memory_operand" ""))]
|
5172 |
|
|
"(mode != DImode || TARGET_64BIT)
|
5173 |
|
|
&& SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
5174 |
|
|
&& reload_completed
|
5175 |
|
|
&& (SSE_REG_P (operands[0])
|
5176 |
|
|
|| (GET_CODE (operands[0]) == SUBREG
|
5177 |
|
|
&& SSE_REG_P (SUBREG_REG (operands[0]))))"
|
5178 |
|
|
[(set (match_dup 0) (float:MODEF (match_dup 1)))])
|
5179 |
|
|
|
5180 |
|
|
(define_insn "*float2_i387_with_temp"
|
5181 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "=f,f")
|
5182 |
|
|
(float:X87MODEF
|
5183 |
|
|
(match_operand:SWI48x 1 "nonimmediate_operand" "m,?r")))
|
5184 |
|
|
(clobber (match_operand:SWI48x 2 "memory_operand" "=X,m"))]
|
5185 |
|
|
"TARGET_80387
|
5186 |
|
|
&& X87_ENABLE_FLOAT (mode, mode)"
|
5187 |
|
|
"@
|
5188 |
|
|
fild%Z1\t%1
|
5189 |
|
|
#"
|
5190 |
|
|
[(set_attr "type" "fmov,multi")
|
5191 |
|
|
(set_attr "mode" "")
|
5192 |
|
|
(set_attr "unit" "*,i387")
|
5193 |
|
|
(set_attr "fp_int_src" "true")])
|
5194 |
|
|
|
5195 |
|
|
(define_insn "*float2_i387"
|
5196 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "=f")
|
5197 |
|
|
(float:X87MODEF
|
5198 |
|
|
(match_operand:SWI48x 1 "memory_operand" "m")))]
|
5199 |
|
|
"TARGET_80387
|
5200 |
|
|
&& X87_ENABLE_FLOAT (mode, mode)"
|
5201 |
|
|
"fild%Z1\t%1"
|
5202 |
|
|
[(set_attr "type" "fmov")
|
5203 |
|
|
(set_attr "mode" "")
|
5204 |
|
|
(set_attr "fp_int_src" "true")])
|
5205 |
|
|
|
5206 |
|
|
(define_split
|
5207 |
|
|
[(set (match_operand:X87MODEF 0 "fp_register_operand" "")
|
5208 |
|
|
(float:X87MODEF (match_operand:SWI48x 1 "register_operand" "")))
|
5209 |
|
|
(clobber (match_operand:SWI48x 2 "memory_operand" ""))]
|
5210 |
|
|
"TARGET_80387
|
5211 |
|
|
&& X87_ENABLE_FLOAT (mode, mode)
|
5212 |
|
|
&& reload_completed"
|
5213 |
|
|
[(set (match_dup 2) (match_dup 1))
|
5214 |
|
|
(set (match_dup 0) (float:X87MODEF (match_dup 2)))])
|
5215 |
|
|
|
5216 |
|
|
(define_split
|
5217 |
|
|
[(set (match_operand:X87MODEF 0 "fp_register_operand" "")
|
5218 |
|
|
(float:X87MODEF (match_operand:SWI48x 1 "memory_operand" "")))
|
5219 |
|
|
(clobber (match_operand:SWI48x 2 "memory_operand" ""))]
|
5220 |
|
|
"TARGET_80387
|
5221 |
|
|
&& X87_ENABLE_FLOAT (mode, mode)
|
5222 |
|
|
&& reload_completed"
|
5223 |
|
|
[(set (match_dup 0) (float:X87MODEF (match_dup 1)))])
|
5224 |
|
|
|
5225 |
|
|
;; Avoid store forwarding (partial memory) stall penalty
|
5226 |
|
|
;; by passing DImode value through XMM registers. */
|
5227 |
|
|
|
5228 |
|
|
(define_insn "floatdi2_i387_with_xmm"
|
5229 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "=f,f")
|
5230 |
|
|
(float:X87MODEF
|
5231 |
|
|
(match_operand:DI 1 "nonimmediate_operand" "m,?r")))
|
5232 |
|
|
(clobber (match_scratch:V4SI 3 "=X,x"))
|
5233 |
|
|
(clobber (match_scratch:V4SI 4 "=X,x"))
|
5234 |
|
|
(clobber (match_operand:DI 2 "memory_operand" "=X,m"))]
|
5235 |
|
|
"TARGET_80387 && X87_ENABLE_FLOAT (mode, DImode)
|
5236 |
|
|
&& TARGET_SSE2 && TARGET_INTER_UNIT_MOVES
|
5237 |
|
|
&& !TARGET_64BIT && optimize_function_for_speed_p (cfun)"
|
5238 |
|
|
"#"
|
5239 |
|
|
[(set_attr "type" "multi")
|
5240 |
|
|
(set_attr "mode" "")
|
5241 |
|
|
(set_attr "unit" "i387")
|
5242 |
|
|
(set_attr "fp_int_src" "true")])
|
5243 |
|
|
|
5244 |
|
|
(define_split
|
5245 |
|
|
[(set (match_operand:X87MODEF 0 "fp_register_operand" "")
|
5246 |
|
|
(float:X87MODEF (match_operand:DI 1 "register_operand" "")))
|
5247 |
|
|
(clobber (match_scratch:V4SI 3 ""))
|
5248 |
|
|
(clobber (match_scratch:V4SI 4 ""))
|
5249 |
|
|
(clobber (match_operand:DI 2 "memory_operand" ""))]
|
5250 |
|
|
"TARGET_80387 && X87_ENABLE_FLOAT (mode, DImode)
|
5251 |
|
|
&& TARGET_SSE2 && TARGET_INTER_UNIT_MOVES
|
5252 |
|
|
&& !TARGET_64BIT && optimize_function_for_speed_p (cfun)
|
5253 |
|
|
&& reload_completed"
|
5254 |
|
|
[(set (match_dup 2) (match_dup 3))
|
5255 |
|
|
(set (match_dup 0) (float:X87MODEF (match_dup 2)))]
|
5256 |
|
|
{
|
5257 |
|
|
/* The DImode arrived in a pair of integral registers (e.g. %edx:%eax).
|
5258 |
|
|
Assemble the 64-bit DImode value in an xmm register. */
|
5259 |
|
|
emit_insn (gen_sse2_loadld (operands[3], CONST0_RTX (V4SImode),
|
5260 |
|
|
gen_rtx_SUBREG (SImode, operands[1], 0)));
|
5261 |
|
|
emit_insn (gen_sse2_loadld (operands[4], CONST0_RTX (V4SImode),
|
5262 |
|
|
gen_rtx_SUBREG (SImode, operands[1], 4)));
|
5263 |
|
|
emit_insn (gen_vec_interleave_lowv4si (operands[3], operands[3],
|
5264 |
|
|
operands[4]));
|
5265 |
|
|
|
5266 |
|
|
operands[3] = gen_rtx_REG (DImode, REGNO (operands[3]));
|
5267 |
|
|
})
|
5268 |
|
|
|
5269 |
|
|
(define_split
|
5270 |
|
|
[(set (match_operand:X87MODEF 0 "fp_register_operand" "")
|
5271 |
|
|
(float:X87MODEF (match_operand:DI 1 "memory_operand" "")))
|
5272 |
|
|
(clobber (match_scratch:V4SI 3 ""))
|
5273 |
|
|
(clobber (match_scratch:V4SI 4 ""))
|
5274 |
|
|
(clobber (match_operand:DI 2 "memory_operand" ""))]
|
5275 |
|
|
"TARGET_80387 && X87_ENABLE_FLOAT (mode, DImode)
|
5276 |
|
|
&& TARGET_SSE2 && TARGET_INTER_UNIT_MOVES
|
5277 |
|
|
&& !TARGET_64BIT && optimize_function_for_speed_p (cfun)
|
5278 |
|
|
&& reload_completed"
|
5279 |
|
|
[(set (match_dup 0) (float:X87MODEF (match_dup 1)))])
|
5280 |
|
|
|
5281 |
|
|
;; Avoid store forwarding (partial memory) stall penalty by extending
|
5282 |
|
|
;; SImode value to DImode through XMM register instead of pushing two
|
5283 |
|
|
;; SImode values to stack. Note that even !TARGET_INTER_UNIT_MOVES
|
5284 |
|
|
;; targets benefit from this optimization. Also note that fild
|
5285 |
|
|
;; loads from memory only.
|
5286 |
|
|
|
5287 |
|
|
(define_insn "*floatunssi2_1"
|
5288 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "=f,f")
|
5289 |
|
|
(unsigned_float:X87MODEF
|
5290 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "x,m")))
|
5291 |
|
|
(clobber (match_operand:DI 2 "memory_operand" "=m,m"))
|
5292 |
|
|
(clobber (match_scratch:SI 3 "=X,x"))]
|
5293 |
|
|
"!TARGET_64BIT
|
5294 |
|
|
&& TARGET_80387 && X87_ENABLE_FLOAT (mode, DImode)
|
5295 |
|
|
&& TARGET_SSE"
|
5296 |
|
|
"#"
|
5297 |
|
|
[(set_attr "type" "multi")
|
5298 |
|
|
(set_attr "mode" "")])
|
5299 |
|
|
|
5300 |
|
|
(define_split
|
5301 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "")
|
5302 |
|
|
(unsigned_float:X87MODEF
|
5303 |
|
|
(match_operand:SI 1 "register_operand" "")))
|
5304 |
|
|
(clobber (match_operand:DI 2 "memory_operand" ""))
|
5305 |
|
|
(clobber (match_scratch:SI 3 ""))]
|
5306 |
|
|
"!TARGET_64BIT
|
5307 |
|
|
&& TARGET_80387 && X87_ENABLE_FLOAT (mode, DImode)
|
5308 |
|
|
&& TARGET_SSE
|
5309 |
|
|
&& reload_completed"
|
5310 |
|
|
[(set (match_dup 2) (match_dup 1))
|
5311 |
|
|
(set (match_dup 0)
|
5312 |
|
|
(float:X87MODEF (match_dup 2)))]
|
5313 |
|
|
"operands[1] = simplify_gen_subreg (DImode, operands[1], SImode, 0);")
|
5314 |
|
|
|
5315 |
|
|
(define_split
|
5316 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "")
|
5317 |
|
|
(unsigned_float:X87MODEF
|
5318 |
|
|
(match_operand:SI 1 "memory_operand" "")))
|
5319 |
|
|
(clobber (match_operand:DI 2 "memory_operand" ""))
|
5320 |
|
|
(clobber (match_scratch:SI 3 ""))]
|
5321 |
|
|
"!TARGET_64BIT
|
5322 |
|
|
&& TARGET_80387 && X87_ENABLE_FLOAT (mode, DImode)
|
5323 |
|
|
&& TARGET_SSE
|
5324 |
|
|
&& reload_completed"
|
5325 |
|
|
[(set (match_dup 2) (match_dup 3))
|
5326 |
|
|
(set (match_dup 0)
|
5327 |
|
|
(float:X87MODEF (match_dup 2)))]
|
5328 |
|
|
{
|
5329 |
|
|
emit_move_insn (operands[3], operands[1]);
|
5330 |
|
|
operands[3] = simplify_gen_subreg (DImode, operands[3], SImode, 0);
|
5331 |
|
|
})
|
5332 |
|
|
|
5333 |
|
|
(define_expand "floatunssi2"
|
5334 |
|
|
[(parallel
|
5335 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "")
|
5336 |
|
|
(unsigned_float:X87MODEF
|
5337 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "")))
|
5338 |
|
|
(clobber (match_dup 2))
|
5339 |
|
|
(clobber (match_scratch:SI 3 ""))])]
|
5340 |
|
|
"!TARGET_64BIT
|
5341 |
|
|
&& ((TARGET_80387 && X87_ENABLE_FLOAT (mode, DImode)
|
5342 |
|
|
&& TARGET_SSE)
|
5343 |
|
|
|| (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH))"
|
5344 |
|
|
{
|
5345 |
|
|
if (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
5346 |
|
|
{
|
5347 |
|
|
ix86_expand_convert_uns_si_sse (operands[0], operands[1]);
|
5348 |
|
|
DONE;
|
5349 |
|
|
}
|
5350 |
|
|
else
|
5351 |
|
|
{
|
5352 |
|
|
enum ix86_stack_slot slot = (virtuals_instantiated
|
5353 |
|
|
? SLOT_TEMP
|
5354 |
|
|
: SLOT_VIRTUAL);
|
5355 |
|
|
operands[2] = assign_386_stack_local (DImode, slot);
|
5356 |
|
|
}
|
5357 |
|
|
})
|
5358 |
|
|
|
5359 |
|
|
(define_expand "floatunsdisf2"
|
5360 |
|
|
[(use (match_operand:SF 0 "register_operand" ""))
|
5361 |
|
|
(use (match_operand:DI 1 "nonimmediate_operand" ""))]
|
5362 |
|
|
"TARGET_64BIT && TARGET_SSE_MATH"
|
5363 |
|
|
"x86_emit_floatuns (operands); DONE;")
|
5364 |
|
|
|
5365 |
|
|
(define_expand "floatunsdidf2"
|
5366 |
|
|
[(use (match_operand:DF 0 "register_operand" ""))
|
5367 |
|
|
(use (match_operand:DI 1 "nonimmediate_operand" ""))]
|
5368 |
|
|
"(TARGET_64BIT || TARGET_KEEPS_VECTOR_ALIGNED_STACK)
|
5369 |
|
|
&& TARGET_SSE2 && TARGET_SSE_MATH"
|
5370 |
|
|
{
|
5371 |
|
|
if (TARGET_64BIT)
|
5372 |
|
|
x86_emit_floatuns (operands);
|
5373 |
|
|
else
|
5374 |
|
|
ix86_expand_convert_uns_didf_sse (operands[0], operands[1]);
|
5375 |
|
|
DONE;
|
5376 |
|
|
})
|
5377 |
|
|
|
5378 |
|
|
;; Add instructions
|
5379 |
|
|
|
5380 |
|
|
(define_expand "add3"
|
5381 |
|
|
[(set (match_operand:SDWIM 0 "nonimmediate_operand" "")
|
5382 |
|
|
(plus:SDWIM (match_operand:SDWIM 1 "nonimmediate_operand" "")
|
5383 |
|
|
(match_operand:SDWIM 2 "" "")))]
|
5384 |
|
|
""
|
5385 |
|
|
"ix86_expand_binary_operator (PLUS, mode, operands); DONE;")
|
5386 |
|
|
|
5387 |
|
|
(define_insn_and_split "*add3_doubleword"
|
5388 |
|
|
[(set (match_operand: 0 "nonimmediate_operand" "=r,o")
|
5389 |
|
|
(plus:
|
5390 |
|
|
(match_operand: 1 "nonimmediate_operand" "%0,0")
|
5391 |
|
|
(match_operand: 2 "" "ro,r")))
|
5392 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
5393 |
|
|
"ix86_binary_operator_ok (PLUS, mode, operands)"
|
5394 |
|
|
"#"
|
5395 |
|
|
"reload_completed"
|
5396 |
|
|
[(parallel [(set (reg:CC FLAGS_REG)
|
5397 |
|
|
(unspec:CC [(match_dup 1) (match_dup 2)]
|
5398 |
|
|
UNSPEC_ADD_CARRY))
|
5399 |
|
|
(set (match_dup 0)
|
5400 |
|
|
(plus:DWIH (match_dup 1) (match_dup 2)))])
|
5401 |
|
|
(parallel [(set (match_dup 3)
|
5402 |
|
|
(plus:DWIH
|
5403 |
|
|
(match_dup 4)
|
5404 |
|
|
(plus:DWIH
|
5405 |
|
|
(ltu:DWIH (reg:CC FLAGS_REG) (const_int 0))
|
5406 |
|
|
(match_dup 5))))
|
5407 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
5408 |
|
|
"split_double_mode (mode, &operands[0], 3, &operands[0], &operands[3]);")
|
5409 |
|
|
|
5410 |
|
|
(define_insn "*add3_cc"
|
5411 |
|
|
[(set (reg:CC FLAGS_REG)
|
5412 |
|
|
(unspec:CC
|
5413 |
|
|
[(match_operand:SWI48 1 "nonimmediate_operand" "%0,0")
|
5414 |
|
|
(match_operand:SWI48 2 "" "r,rm")]
|
5415 |
|
|
UNSPEC_ADD_CARRY))
|
5416 |
|
|
(set (match_operand:SWI48 0 "nonimmediate_operand" "=rm,r")
|
5417 |
|
|
(plus:SWI48 (match_dup 1) (match_dup 2)))]
|
5418 |
|
|
"ix86_binary_operator_ok (PLUS, mode, operands)"
|
5419 |
|
|
"add{}\t{%2, %0|%0, %2}"
|
5420 |
|
|
[(set_attr "type" "alu")
|
5421 |
|
|
(set_attr "mode" "")])
|
5422 |
|
|
|
5423 |
|
|
(define_insn "addqi3_cc"
|
5424 |
|
|
[(set (reg:CC FLAGS_REG)
|
5425 |
|
|
(unspec:CC
|
5426 |
|
|
[(match_operand:QI 1 "nonimmediate_operand" "%0,0")
|
5427 |
|
|
(match_operand:QI 2 "general_operand" "qn,qm")]
|
5428 |
|
|
UNSPEC_ADD_CARRY))
|
5429 |
|
|
(set (match_operand:QI 0 "nonimmediate_operand" "=qm,q")
|
5430 |
|
|
(plus:QI (match_dup 1) (match_dup 2)))]
|
5431 |
|
|
"ix86_binary_operator_ok (PLUS, QImode, operands)"
|
5432 |
|
|
"add{b}\t{%2, %0|%0, %2}"
|
5433 |
|
|
[(set_attr "type" "alu")
|
5434 |
|
|
(set_attr "mode" "QI")])
|
5435 |
|
|
|
5436 |
|
|
(define_insn_and_split "*lea_1"
|
5437 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
5438 |
|
|
(subreg:SI (match_operand:DI 1 "lea_address_operand" "p") 0))]
|
5439 |
|
|
"TARGET_64BIT"
|
5440 |
|
|
"lea{l}\t{%a1, %0|%0, %a1}"
|
5441 |
|
|
"&& reload_completed && ix86_avoid_lea_for_addr (insn, operands)"
|
5442 |
|
|
[(const_int 0)]
|
5443 |
|
|
{
|
5444 |
|
|
ix86_split_lea_for_addr (operands, SImode);
|
5445 |
|
|
DONE;
|
5446 |
|
|
}
|
5447 |
|
|
[(set_attr "type" "lea")
|
5448 |
|
|
(set_attr "mode" "SI")])
|
5449 |
|
|
|
5450 |
|
|
(define_insn_and_split "*lea_2"
|
5451 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
5452 |
|
|
(match_operand:SWI48 1 "lea_address_operand" "p"))]
|
5453 |
|
|
""
|
5454 |
|
|
"lea{}\t{%a1, %0|%0, %a1}"
|
5455 |
|
|
"reload_completed && ix86_avoid_lea_for_addr (insn, operands)"
|
5456 |
|
|
[(const_int 0)]
|
5457 |
|
|
{
|
5458 |
|
|
ix86_split_lea_for_addr (operands, mode);
|
5459 |
|
|
DONE;
|
5460 |
|
|
}
|
5461 |
|
|
[(set_attr "type" "lea")
|
5462 |
|
|
(set_attr "mode" "")])
|
5463 |
|
|
|
5464 |
|
|
(define_insn "*lea_3_zext"
|
5465 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
5466 |
|
|
(zero_extend:DI
|
5467 |
|
|
(subreg:SI (match_operand:DI 1 "lea_address_operand" "j") 0)))]
|
5468 |
|
|
"TARGET_64BIT"
|
5469 |
|
|
"lea{l}\t{%a1, %k0|%k0, %a1}"
|
5470 |
|
|
[(set_attr "type" "lea")
|
5471 |
|
|
(set_attr "mode" "SI")])
|
5472 |
|
|
|
5473 |
|
|
(define_insn "*lea_4_zext"
|
5474 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
5475 |
|
|
(zero_extend:DI
|
5476 |
|
|
(match_operand:SI 1 "lea_address_operand" "j")))]
|
5477 |
|
|
"TARGET_64BIT"
|
5478 |
|
|
"lea{l}\t{%a1, %k0|%k0, %a1}"
|
5479 |
|
|
[(set_attr "type" "lea")
|
5480 |
|
|
(set_attr "mode" "SI")])
|
5481 |
|
|
|
5482 |
|
|
(define_insn "*lea_5_zext"
|
5483 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
5484 |
|
|
(and:DI
|
5485 |
|
|
(subreg:DI (match_operand:SI 1 "lea_address_operand" "p") 0)
|
5486 |
|
|
(match_operand:DI 2 "const_32bit_mask" "n")))]
|
5487 |
|
|
"TARGET_64BIT"
|
5488 |
|
|
"lea{l}\t{%a1, %k0|%k0, %a1}"
|
5489 |
|
|
[(set_attr "type" "lea")
|
5490 |
|
|
(set_attr "mode" "SI")])
|
5491 |
|
|
|
5492 |
|
|
(define_insn "*lea_6_zext"
|
5493 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
5494 |
|
|
(and:DI
|
5495 |
|
|
(match_operand:DI 1 "lea_address_operand" "p")
|
5496 |
|
|
(match_operand:DI 2 "const_32bit_mask" "n")))]
|
5497 |
|
|
"TARGET_64BIT"
|
5498 |
|
|
"lea{l}\t{%a1, %k0|%k0, %a1}"
|
5499 |
|
|
[(set_attr "type" "lea")
|
5500 |
|
|
(set_attr "mode" "SI")])
|
5501 |
|
|
|
5502 |
|
|
(define_insn "*add_1"
|
5503 |
|
|
[(set (match_operand:SWI48 0 "nonimmediate_operand" "=r,rm,r,r")
|
5504 |
|
|
(plus:SWI48
|
5505 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "%0,0,r,r")
|
5506 |
|
|
(match_operand:SWI48 2 "x86_64_general_operand" "rme,re,0,le")))
|
5507 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
5508 |
|
|
"ix86_binary_operator_ok (PLUS, mode, operands)"
|
5509 |
|
|
{
|
5510 |
|
|
switch (get_attr_type (insn))
|
5511 |
|
|
{
|
5512 |
|
|
case TYPE_LEA:
|
5513 |
|
|
return "#";
|
5514 |
|
|
|
5515 |
|
|
case TYPE_INCDEC:
|
5516 |
|
|
gcc_assert (rtx_equal_p (operands[0], operands[1]));
|
5517 |
|
|
if (operands[2] == const1_rtx)
|
5518 |
|
|
return "inc{}\t%0";
|
5519 |
|
|
else
|
5520 |
|
|
{
|
5521 |
|
|
gcc_assert (operands[2] == constm1_rtx);
|
5522 |
|
|
return "dec{}\t%0";
|
5523 |
|
|
}
|
5524 |
|
|
|
5525 |
|
|
default:
|
5526 |
|
|
/* For most processors, ADD is faster than LEA. This alternative
|
5527 |
|
|
was added to use ADD as much as possible. */
|
5528 |
|
|
if (which_alternative == 2)
|
5529 |
|
|
{
|
5530 |
|
|
rtx tmp;
|
5531 |
|
|
tmp = operands[1], operands[1] = operands[2], operands[2] = tmp;
|
5532 |
|
|
}
|
5533 |
|
|
|
5534 |
|
|
gcc_assert (rtx_equal_p (operands[0], operands[1]));
|
5535 |
|
|
if (x86_maybe_negate_const_int (&operands[2], mode))
|
5536 |
|
|
return "sub{}\t{%2, %0|%0, %2}";
|
5537 |
|
|
|
5538 |
|
|
return "add{}\t{%2, %0|%0, %2}";
|
5539 |
|
|
}
|
5540 |
|
|
}
|
5541 |
|
|
[(set (attr "type")
|
5542 |
|
|
(cond [(eq_attr "alternative" "3")
|
5543 |
|
|
(const_string "lea")
|
5544 |
|
|
(match_operand:SWI48 2 "incdec_operand" "")
|
5545 |
|
|
(const_string "incdec")
|
5546 |
|
|
]
|
5547 |
|
|
(const_string "alu")))
|
5548 |
|
|
(set (attr "length_immediate")
|
5549 |
|
|
(if_then_else
|
5550 |
|
|
(and (eq_attr "type" "alu") (match_operand 2 "const128_operand" ""))
|
5551 |
|
|
(const_string "1")
|
5552 |
|
|
(const_string "*")))
|
5553 |
|
|
(set_attr "mode" "")])
|
5554 |
|
|
|
5555 |
|
|
;; It may seem that nonimmediate operand is proper one for operand 1.
|
5556 |
|
|
;; The addsi_1 pattern allows nonimmediate operand at that place and
|
5557 |
|
|
;; we take care in ix86_binary_operator_ok to not allow two memory
|
5558 |
|
|
;; operands so proper swapping will be done in reload. This allow
|
5559 |
|
|
;; patterns constructed from addsi_1 to match.
|
5560 |
|
|
|
5561 |
|
|
(define_insn "addsi_1_zext"
|
5562 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r,r,r")
|
5563 |
|
|
(zero_extend:DI
|
5564 |
|
|
(plus:SI (match_operand:SI 1 "nonimmediate_operand" "%0,r,r")
|
5565 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "rme,0,le"))))
|
5566 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
5567 |
|
|
"TARGET_64BIT && ix86_binary_operator_ok (PLUS, SImode, operands)"
|
5568 |
|
|
{
|
5569 |
|
|
switch (get_attr_type (insn))
|
5570 |
|
|
{
|
5571 |
|
|
case TYPE_LEA:
|
5572 |
|
|
return "#";
|
5573 |
|
|
|
5574 |
|
|
case TYPE_INCDEC:
|
5575 |
|
|
if (operands[2] == const1_rtx)
|
5576 |
|
|
return "inc{l}\t%k0";
|
5577 |
|
|
else
|
5578 |
|
|
{
|
5579 |
|
|
gcc_assert (operands[2] == constm1_rtx);
|
5580 |
|
|
return "dec{l}\t%k0";
|
5581 |
|
|
}
|
5582 |
|
|
|
5583 |
|
|
default:
|
5584 |
|
|
/* For most processors, ADD is faster than LEA. This alternative
|
5585 |
|
|
was added to use ADD as much as possible. */
|
5586 |
|
|
if (which_alternative == 1)
|
5587 |
|
|
{
|
5588 |
|
|
rtx tmp;
|
5589 |
|
|
tmp = operands[1], operands[1] = operands[2], operands[2] = tmp;
|
5590 |
|
|
}
|
5591 |
|
|
|
5592 |
|
|
if (x86_maybe_negate_const_int (&operands[2], SImode))
|
5593 |
|
|
return "sub{l}\t{%2, %k0|%k0, %2}";
|
5594 |
|
|
|
5595 |
|
|
return "add{l}\t{%2, %k0|%k0, %2}";
|
5596 |
|
|
}
|
5597 |
|
|
}
|
5598 |
|
|
[(set (attr "type")
|
5599 |
|
|
(cond [(eq_attr "alternative" "2")
|
5600 |
|
|
(const_string "lea")
|
5601 |
|
|
(match_operand:SI 2 "incdec_operand" "")
|
5602 |
|
|
(const_string "incdec")
|
5603 |
|
|
]
|
5604 |
|
|
(const_string "alu")))
|
5605 |
|
|
(set (attr "length_immediate")
|
5606 |
|
|
(if_then_else
|
5607 |
|
|
(and (eq_attr "type" "alu") (match_operand 2 "const128_operand" ""))
|
5608 |
|
|
(const_string "1")
|
5609 |
|
|
(const_string "*")))
|
5610 |
|
|
(set_attr "mode" "SI")])
|
5611 |
|
|
|
5612 |
|
|
(define_insn "*addhi_1"
|
5613 |
|
|
[(set (match_operand:HI 0 "nonimmediate_operand" "=rm,r,r,Yp")
|
5614 |
|
|
(plus:HI (match_operand:HI 1 "nonimmediate_operand" "%0,0,r,Yp")
|
5615 |
|
|
(match_operand:HI 2 "general_operand" "rn,rm,0,ln")))
|
5616 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
5617 |
|
|
"ix86_binary_operator_ok (PLUS, HImode, operands)"
|
5618 |
|
|
{
|
5619 |
|
|
switch (get_attr_type (insn))
|
5620 |
|
|
{
|
5621 |
|
|
case TYPE_LEA:
|
5622 |
|
|
return "#";
|
5623 |
|
|
|
5624 |
|
|
case TYPE_INCDEC:
|
5625 |
|
|
gcc_assert (rtx_equal_p (operands[0], operands[1]));
|
5626 |
|
|
if (operands[2] == const1_rtx)
|
5627 |
|
|
return "inc{w}\t%0";
|
5628 |
|
|
else
|
5629 |
|
|
{
|
5630 |
|
|
gcc_assert (operands[2] == constm1_rtx);
|
5631 |
|
|
return "dec{w}\t%0";
|
5632 |
|
|
}
|
5633 |
|
|
|
5634 |
|
|
default:
|
5635 |
|
|
/* For most processors, ADD is faster than LEA. This alternative
|
5636 |
|
|
was added to use ADD as much as possible. */
|
5637 |
|
|
if (which_alternative == 2)
|
5638 |
|
|
{
|
5639 |
|
|
rtx tmp;
|
5640 |
|
|
tmp = operands[1], operands[1] = operands[2], operands[2] = tmp;
|
5641 |
|
|
}
|
5642 |
|
|
|
5643 |
|
|
gcc_assert (rtx_equal_p (operands[0], operands[1]));
|
5644 |
|
|
if (x86_maybe_negate_const_int (&operands[2], HImode))
|
5645 |
|
|
return "sub{w}\t{%2, %0|%0, %2}";
|
5646 |
|
|
|
5647 |
|
|
return "add{w}\t{%2, %0|%0, %2}";
|
5648 |
|
|
}
|
5649 |
|
|
}
|
5650 |
|
|
[(set (attr "type")
|
5651 |
|
|
(cond [(eq_attr "alternative" "3")
|
5652 |
|
|
(const_string "lea")
|
5653 |
|
|
(match_operand:HI 2 "incdec_operand" "")
|
5654 |
|
|
(const_string "incdec")
|
5655 |
|
|
]
|
5656 |
|
|
(const_string "alu")))
|
5657 |
|
|
(set (attr "length_immediate")
|
5658 |
|
|
(if_then_else
|
5659 |
|
|
(and (eq_attr "type" "alu") (match_operand 2 "const128_operand" ""))
|
5660 |
|
|
(const_string "1")
|
5661 |
|
|
(const_string "*")))
|
5662 |
|
|
(set_attr "mode" "HI,HI,HI,SI")])
|
5663 |
|
|
|
5664 |
|
|
;; %%% Potential partial reg stall on alternatives 3 and 4. What to do?
|
5665 |
|
|
(define_insn "*addqi_1"
|
5666 |
|
|
[(set (match_operand:QI 0 "nonimmediate_operand" "=qm,q,q,r,r,Yp")
|
5667 |
|
|
(plus:QI (match_operand:QI 1 "nonimmediate_operand" "%0,0,q,0,r,Yp")
|
5668 |
|
|
(match_operand:QI 2 "general_operand" "qn,qm,0,rn,0,ln")))
|
5669 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
5670 |
|
|
"ix86_binary_operator_ok (PLUS, QImode, operands)"
|
5671 |
|
|
{
|
5672 |
|
|
bool widen = (which_alternative == 3 || which_alternative == 4);
|
5673 |
|
|
|
5674 |
|
|
switch (get_attr_type (insn))
|
5675 |
|
|
{
|
5676 |
|
|
case TYPE_LEA:
|
5677 |
|
|
return "#";
|
5678 |
|
|
|
5679 |
|
|
case TYPE_INCDEC:
|
5680 |
|
|
gcc_assert (rtx_equal_p (operands[0], operands[1]));
|
5681 |
|
|
if (operands[2] == const1_rtx)
|
5682 |
|
|
return widen ? "inc{l}\t%k0" : "inc{b}\t%0";
|
5683 |
|
|
else
|
5684 |
|
|
{
|
5685 |
|
|
gcc_assert (operands[2] == constm1_rtx);
|
5686 |
|
|
return widen ? "dec{l}\t%k0" : "dec{b}\t%0";
|
5687 |
|
|
}
|
5688 |
|
|
|
5689 |
|
|
default:
|
5690 |
|
|
/* For most processors, ADD is faster than LEA. These alternatives
|
5691 |
|
|
were added to use ADD as much as possible. */
|
5692 |
|
|
if (which_alternative == 2 || which_alternative == 4)
|
5693 |
|
|
{
|
5694 |
|
|
rtx tmp;
|
5695 |
|
|
tmp = operands[1], operands[1] = operands[2], operands[2] = tmp;
|
5696 |
|
|
}
|
5697 |
|
|
|
5698 |
|
|
gcc_assert (rtx_equal_p (operands[0], operands[1]));
|
5699 |
|
|
if (x86_maybe_negate_const_int (&operands[2], QImode))
|
5700 |
|
|
{
|
5701 |
|
|
if (widen)
|
5702 |
|
|
return "sub{l}\t{%2, %k0|%k0, %2}";
|
5703 |
|
|
else
|
5704 |
|
|
return "sub{b}\t{%2, %0|%0, %2}";
|
5705 |
|
|
}
|
5706 |
|
|
if (widen)
|
5707 |
|
|
return "add{l}\t{%k2, %k0|%k0, %k2}";
|
5708 |
|
|
else
|
5709 |
|
|
return "add{b}\t{%2, %0|%0, %2}";
|
5710 |
|
|
}
|
5711 |
|
|
}
|
5712 |
|
|
[(set (attr "type")
|
5713 |
|
|
(cond [(eq_attr "alternative" "5")
|
5714 |
|
|
(const_string "lea")
|
5715 |
|
|
(match_operand:QI 2 "incdec_operand" "")
|
5716 |
|
|
(const_string "incdec")
|
5717 |
|
|
]
|
5718 |
|
|
(const_string "alu")))
|
5719 |
|
|
(set (attr "length_immediate")
|
5720 |
|
|
(if_then_else
|
5721 |
|
|
(and (eq_attr "type" "alu") (match_operand 2 "const128_operand" ""))
|
5722 |
|
|
(const_string "1")
|
5723 |
|
|
(const_string "*")))
|
5724 |
|
|
(set_attr "mode" "QI,QI,QI,SI,SI,SI")])
|
5725 |
|
|
|
5726 |
|
|
(define_insn "*addqi_1_slp"
|
5727 |
|
|
[(set (strict_low_part (match_operand:QI 0 "nonimmediate_operand" "+qm,q"))
|
5728 |
|
|
(plus:QI (match_dup 0)
|
5729 |
|
|
(match_operand:QI 1 "general_operand" "qn,qm")))
|
5730 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
5731 |
|
|
"(! TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
5732 |
|
|
&& !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
5733 |
|
|
{
|
5734 |
|
|
switch (get_attr_type (insn))
|
5735 |
|
|
{
|
5736 |
|
|
case TYPE_INCDEC:
|
5737 |
|
|
if (operands[1] == const1_rtx)
|
5738 |
|
|
return "inc{b}\t%0";
|
5739 |
|
|
else
|
5740 |
|
|
{
|
5741 |
|
|
gcc_assert (operands[1] == constm1_rtx);
|
5742 |
|
|
return "dec{b}\t%0";
|
5743 |
|
|
}
|
5744 |
|
|
|
5745 |
|
|
default:
|
5746 |
|
|
if (x86_maybe_negate_const_int (&operands[1], QImode))
|
5747 |
|
|
return "sub{b}\t{%1, %0|%0, %1}";
|
5748 |
|
|
|
5749 |
|
|
return "add{b}\t{%1, %0|%0, %1}";
|
5750 |
|
|
}
|
5751 |
|
|
}
|
5752 |
|
|
[(set (attr "type")
|
5753 |
|
|
(if_then_else (match_operand:QI 1 "incdec_operand" "")
|
5754 |
|
|
(const_string "incdec")
|
5755 |
|
|
(const_string "alu1")))
|
5756 |
|
|
(set (attr "memory")
|
5757 |
|
|
(if_then_else (match_operand 1 "memory_operand" "")
|
5758 |
|
|
(const_string "load")
|
5759 |
|
|
(const_string "none")))
|
5760 |
|
|
(set_attr "mode" "QI")])
|
5761 |
|
|
|
5762 |
|
|
;; Split non destructive adds if we cannot use lea.
|
5763 |
|
|
(define_split
|
5764 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
5765 |
|
|
(plus:SWI48 (match_operand:SWI48 1 "register_operand" "")
|
5766 |
|
|
(match_operand:SWI48 2 "nonmemory_operand" "")))
|
5767 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
5768 |
|
|
"reload_completed && ix86_avoid_lea_for_add (insn, operands)"
|
5769 |
|
|
[(set (match_dup 0) (match_dup 1))
|
5770 |
|
|
(parallel [(set (match_dup 0) (plus: (match_dup 0) (match_dup 2)))
|
5771 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
5772 |
|
|
|
5773 |
|
|
;; Convert add to the lea pattern to avoid flags dependency.
|
5774 |
|
|
(define_split
|
5775 |
|
|
[(set (match_operand:SWI 0 "register_operand" "")
|
5776 |
|
|
(plus:SWI (match_operand:SWI 1 "register_operand" "")
|
5777 |
|
|
(match_operand:SWI 2 "" "")))
|
5778 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
5779 |
|
|
"reload_completed && ix86_lea_for_add_ok (insn, operands)"
|
5780 |
|
|
[(const_int 0)]
|
5781 |
|
|
{
|
5782 |
|
|
enum machine_mode mode = mode;
|
5783 |
|
|
rtx pat;
|
5784 |
|
|
|
5785 |
|
|
if (GET_MODE_SIZE (mode) < GET_MODE_SIZE (SImode))
|
5786 |
|
|
{
|
5787 |
|
|
mode = SImode;
|
5788 |
|
|
operands[0] = gen_lowpart (mode, operands[0]);
|
5789 |
|
|
operands[1] = gen_lowpart (mode, operands[1]);
|
5790 |
|
|
operands[2] = gen_lowpart (mode, operands[2]);
|
5791 |
|
|
}
|
5792 |
|
|
|
5793 |
|
|
pat = gen_rtx_PLUS (mode, operands[1], operands[2]);
|
5794 |
|
|
|
5795 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0], pat));
|
5796 |
|
|
DONE;
|
5797 |
|
|
})
|
5798 |
|
|
|
5799 |
|
|
;; Convert add to the lea pattern to avoid flags dependency.
|
5800 |
|
|
(define_split
|
5801 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
5802 |
|
|
(zero_extend:DI
|
5803 |
|
|
(plus:SI (match_operand:SI 1 "register_operand" "")
|
5804 |
|
|
(match_operand:SI 2 "x86_64_nonmemory_operand" ""))))
|
5805 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
5806 |
|
|
"TARGET_64BIT && reload_completed && ix86_lea_for_add_ok (insn, operands)"
|
5807 |
|
|
[(set (match_dup 0)
|
5808 |
|
|
(zero_extend:DI (plus:SI (match_dup 1) (match_dup 2))))])
|
5809 |
|
|
|
5810 |
|
|
(define_insn "*add_2"
|
5811 |
|
|
[(set (reg FLAGS_REG)
|
5812 |
|
|
(compare
|
5813 |
|
|
(plus:SWI
|
5814 |
|
|
(match_operand:SWI 1 "nonimmediate_operand" "%0,0")
|
5815 |
|
|
(match_operand:SWI 2 "" ","))
|
5816 |
|
|
(const_int 0)))
|
5817 |
|
|
(set (match_operand:SWI 0 "nonimmediate_operand" "=,m")
|
5818 |
|
|
(plus:SWI (match_dup 1) (match_dup 2)))]
|
5819 |
|
|
"ix86_match_ccmode (insn, CCGOCmode)
|
5820 |
|
|
&& ix86_binary_operator_ok (PLUS, mode, operands)"
|
5821 |
|
|
{
|
5822 |
|
|
switch (get_attr_type (insn))
|
5823 |
|
|
{
|
5824 |
|
|
case TYPE_INCDEC:
|
5825 |
|
|
if (operands[2] == const1_rtx)
|
5826 |
|
|
return "inc{}\t%0";
|
5827 |
|
|
else
|
5828 |
|
|
{
|
5829 |
|
|
gcc_assert (operands[2] == constm1_rtx);
|
5830 |
|
|
return "dec{}\t%0";
|
5831 |
|
|
}
|
5832 |
|
|
|
5833 |
|
|
default:
|
5834 |
|
|
if (x86_maybe_negate_const_int (&operands[2], mode))
|
5835 |
|
|
return "sub{}\t{%2, %0|%0, %2}";
|
5836 |
|
|
|
5837 |
|
|
return "add{}\t{%2, %0|%0, %2}";
|
5838 |
|
|
}
|
5839 |
|
|
}
|
5840 |
|
|
[(set (attr "type")
|
5841 |
|
|
(if_then_else (match_operand:SWI 2 "incdec_operand" "")
|
5842 |
|
|
(const_string "incdec")
|
5843 |
|
|
(const_string "alu")))
|
5844 |
|
|
(set (attr "length_immediate")
|
5845 |
|
|
(if_then_else
|
5846 |
|
|
(and (eq_attr "type" "alu") (match_operand 2 "const128_operand" ""))
|
5847 |
|
|
(const_string "1")
|
5848 |
|
|
(const_string "*")))
|
5849 |
|
|
(set_attr "mode" "")])
|
5850 |
|
|
|
5851 |
|
|
;; See comment for addsi_1_zext why we do use nonimmediate_operand
|
5852 |
|
|
(define_insn "*addsi_2_zext"
|
5853 |
|
|
[(set (reg FLAGS_REG)
|
5854 |
|
|
(compare
|
5855 |
|
|
(plus:SI (match_operand:SI 1 "nonimmediate_operand" "%0")
|
5856 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "rme"))
|
5857 |
|
|
(const_int 0)))
|
5858 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
5859 |
|
|
(zero_extend:DI (plus:SI (match_dup 1) (match_dup 2))))]
|
5860 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCGOCmode)
|
5861 |
|
|
&& ix86_binary_operator_ok (PLUS, SImode, operands)"
|
5862 |
|
|
{
|
5863 |
|
|
switch (get_attr_type (insn))
|
5864 |
|
|
{
|
5865 |
|
|
case TYPE_INCDEC:
|
5866 |
|
|
if (operands[2] == const1_rtx)
|
5867 |
|
|
return "inc{l}\t%k0";
|
5868 |
|
|
else
|
5869 |
|
|
{
|
5870 |
|
|
gcc_assert (operands[2] == constm1_rtx);
|
5871 |
|
|
return "dec{l}\t%k0";
|
5872 |
|
|
}
|
5873 |
|
|
|
5874 |
|
|
default:
|
5875 |
|
|
if (x86_maybe_negate_const_int (&operands[2], SImode))
|
5876 |
|
|
return "sub{l}\t{%2, %k0|%k0, %2}";
|
5877 |
|
|
|
5878 |
|
|
return "add{l}\t{%2, %k0|%k0, %2}";
|
5879 |
|
|
}
|
5880 |
|
|
}
|
5881 |
|
|
[(set (attr "type")
|
5882 |
|
|
(if_then_else (match_operand:SI 2 "incdec_operand" "")
|
5883 |
|
|
(const_string "incdec")
|
5884 |
|
|
(const_string "alu")))
|
5885 |
|
|
(set (attr "length_immediate")
|
5886 |
|
|
(if_then_else
|
5887 |
|
|
(and (eq_attr "type" "alu") (match_operand 2 "const128_operand" ""))
|
5888 |
|
|
(const_string "1")
|
5889 |
|
|
(const_string "*")))
|
5890 |
|
|
(set_attr "mode" "SI")])
|
5891 |
|
|
|
5892 |
|
|
(define_insn "*add_3"
|
5893 |
|
|
[(set (reg FLAGS_REG)
|
5894 |
|
|
(compare
|
5895 |
|
|
(neg:SWI (match_operand:SWI 2 "" ""))
|
5896 |
|
|
(match_operand:SWI 1 "nonimmediate_operand" "%0")))
|
5897 |
|
|
(clobber (match_scratch:SWI 0 "="))]
|
5898 |
|
|
"ix86_match_ccmode (insn, CCZmode)
|
5899 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
5900 |
|
|
{
|
5901 |
|
|
switch (get_attr_type (insn))
|
5902 |
|
|
{
|
5903 |
|
|
case TYPE_INCDEC:
|
5904 |
|
|
if (operands[2] == const1_rtx)
|
5905 |
|
|
return "inc{}\t%0";
|
5906 |
|
|
else
|
5907 |
|
|
{
|
5908 |
|
|
gcc_assert (operands[2] == constm1_rtx);
|
5909 |
|
|
return "dec{}\t%0";
|
5910 |
|
|
}
|
5911 |
|
|
|
5912 |
|
|
default:
|
5913 |
|
|
if (x86_maybe_negate_const_int (&operands[2], mode))
|
5914 |
|
|
return "sub{}\t{%2, %0|%0, %2}";
|
5915 |
|
|
|
5916 |
|
|
return "add{}\t{%2, %0|%0, %2}";
|
5917 |
|
|
}
|
5918 |
|
|
}
|
5919 |
|
|
[(set (attr "type")
|
5920 |
|
|
(if_then_else (match_operand:SWI 2 "incdec_operand" "")
|
5921 |
|
|
(const_string "incdec")
|
5922 |
|
|
(const_string "alu")))
|
5923 |
|
|
(set (attr "length_immediate")
|
5924 |
|
|
(if_then_else
|
5925 |
|
|
(and (eq_attr "type" "alu") (match_operand 2 "const128_operand" ""))
|
5926 |
|
|
(const_string "1")
|
5927 |
|
|
(const_string "*")))
|
5928 |
|
|
(set_attr "mode" "")])
|
5929 |
|
|
|
5930 |
|
|
;; See comment for addsi_1_zext why we do use nonimmediate_operand
|
5931 |
|
|
(define_insn "*addsi_3_zext"
|
5932 |
|
|
[(set (reg FLAGS_REG)
|
5933 |
|
|
(compare
|
5934 |
|
|
(neg:SI (match_operand:SI 2 "x86_64_general_operand" "rme"))
|
5935 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "%0")))
|
5936 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
5937 |
|
|
(zero_extend:DI (plus:SI (match_dup 1) (match_dup 2))))]
|
5938 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCZmode)
|
5939 |
|
|
&& ix86_binary_operator_ok (PLUS, SImode, operands)"
|
5940 |
|
|
{
|
5941 |
|
|
switch (get_attr_type (insn))
|
5942 |
|
|
{
|
5943 |
|
|
case TYPE_INCDEC:
|
5944 |
|
|
if (operands[2] == const1_rtx)
|
5945 |
|
|
return "inc{l}\t%k0";
|
5946 |
|
|
else
|
5947 |
|
|
{
|
5948 |
|
|
gcc_assert (operands[2] == constm1_rtx);
|
5949 |
|
|
return "dec{l}\t%k0";
|
5950 |
|
|
}
|
5951 |
|
|
|
5952 |
|
|
default:
|
5953 |
|
|
if (x86_maybe_negate_const_int (&operands[2], SImode))
|
5954 |
|
|
return "sub{l}\t{%2, %k0|%k0, %2}";
|
5955 |
|
|
|
5956 |
|
|
return "add{l}\t{%2, %k0|%k0, %2}";
|
5957 |
|
|
}
|
5958 |
|
|
}
|
5959 |
|
|
[(set (attr "type")
|
5960 |
|
|
(if_then_else (match_operand:SI 2 "incdec_operand" "")
|
5961 |
|
|
(const_string "incdec")
|
5962 |
|
|
(const_string "alu")))
|
5963 |
|
|
(set (attr "length_immediate")
|
5964 |
|
|
(if_then_else
|
5965 |
|
|
(and (eq_attr "type" "alu") (match_operand 2 "const128_operand" ""))
|
5966 |
|
|
(const_string "1")
|
5967 |
|
|
(const_string "*")))
|
5968 |
|
|
(set_attr "mode" "SI")])
|
5969 |
|
|
|
5970 |
|
|
; For comparisons against 1, -1 and 128, we may generate better code
|
5971 |
|
|
; by converting cmp to add, inc or dec as done by peephole2. This pattern
|
5972 |
|
|
; is matched then. We can't accept general immediate, because for
|
5973 |
|
|
; case of overflows, the result is messed up.
|
5974 |
|
|
; Also carry flag is reversed compared to cmp, so this conversion is valid
|
5975 |
|
|
; only for comparisons not depending on it.
|
5976 |
|
|
|
5977 |
|
|
(define_insn "*adddi_4"
|
5978 |
|
|
[(set (reg FLAGS_REG)
|
5979 |
|
|
(compare
|
5980 |
|
|
(match_operand:DI 1 "nonimmediate_operand" "0")
|
5981 |
|
|
(match_operand:DI 2 "x86_64_immediate_operand" "e")))
|
5982 |
|
|
(clobber (match_scratch:DI 0 "=rm"))]
|
5983 |
|
|
"TARGET_64BIT
|
5984 |
|
|
&& ix86_match_ccmode (insn, CCGCmode)"
|
5985 |
|
|
{
|
5986 |
|
|
switch (get_attr_type (insn))
|
5987 |
|
|
{
|
5988 |
|
|
case TYPE_INCDEC:
|
5989 |
|
|
if (operands[2] == constm1_rtx)
|
5990 |
|
|
return "inc{q}\t%0";
|
5991 |
|
|
else
|
5992 |
|
|
{
|
5993 |
|
|
gcc_assert (operands[2] == const1_rtx);
|
5994 |
|
|
return "dec{q}\t%0";
|
5995 |
|
|
}
|
5996 |
|
|
|
5997 |
|
|
default:
|
5998 |
|
|
if (x86_maybe_negate_const_int (&operands[2], DImode))
|
5999 |
|
|
return "add{q}\t{%2, %0|%0, %2}";
|
6000 |
|
|
|
6001 |
|
|
return "sub{q}\t{%2, %0|%0, %2}";
|
6002 |
|
|
}
|
6003 |
|
|
}
|
6004 |
|
|
[(set (attr "type")
|
6005 |
|
|
(if_then_else (match_operand:DI 2 "incdec_operand" "")
|
6006 |
|
|
(const_string "incdec")
|
6007 |
|
|
(const_string "alu")))
|
6008 |
|
|
(set (attr "length_immediate")
|
6009 |
|
|
(if_then_else
|
6010 |
|
|
(and (eq_attr "type" "alu") (match_operand 2 "const128_operand" ""))
|
6011 |
|
|
(const_string "1")
|
6012 |
|
|
(const_string "*")))
|
6013 |
|
|
(set_attr "mode" "DI")])
|
6014 |
|
|
|
6015 |
|
|
; For comparisons against 1, -1 and 128, we may generate better code
|
6016 |
|
|
; by converting cmp to add, inc or dec as done by peephole2. This pattern
|
6017 |
|
|
; is matched then. We can't accept general immediate, because for
|
6018 |
|
|
; case of overflows, the result is messed up.
|
6019 |
|
|
; Also carry flag is reversed compared to cmp, so this conversion is valid
|
6020 |
|
|
; only for comparisons not depending on it.
|
6021 |
|
|
|
6022 |
|
|
(define_insn "*add_4"
|
6023 |
|
|
[(set (reg FLAGS_REG)
|
6024 |
|
|
(compare
|
6025 |
|
|
(match_operand:SWI124 1 "nonimmediate_operand" "0")
|
6026 |
|
|
(match_operand:SWI124 2 "const_int_operand" "n")))
|
6027 |
|
|
(clobber (match_scratch:SWI124 0 "=m"))]
|
6028 |
|
|
"ix86_match_ccmode (insn, CCGCmode)"
|
6029 |
|
|
{
|
6030 |
|
|
switch (get_attr_type (insn))
|
6031 |
|
|
{
|
6032 |
|
|
case TYPE_INCDEC:
|
6033 |
|
|
if (operands[2] == constm1_rtx)
|
6034 |
|
|
return "inc{}\t%0";
|
6035 |
|
|
else
|
6036 |
|
|
{
|
6037 |
|
|
gcc_assert (operands[2] == const1_rtx);
|
6038 |
|
|
return "dec{}\t%0";
|
6039 |
|
|
}
|
6040 |
|
|
|
6041 |
|
|
default:
|
6042 |
|
|
if (x86_maybe_negate_const_int (&operands[2], mode))
|
6043 |
|
|
return "add{}\t{%2, %0|%0, %2}";
|
6044 |
|
|
|
6045 |
|
|
return "sub{}\t{%2, %0|%0, %2}";
|
6046 |
|
|
}
|
6047 |
|
|
}
|
6048 |
|
|
[(set (attr "type")
|
6049 |
|
|
(if_then_else (match_operand: 2 "incdec_operand" "")
|
6050 |
|
|
(const_string "incdec")
|
6051 |
|
|
(const_string "alu")))
|
6052 |
|
|
(set (attr "length_immediate")
|
6053 |
|
|
(if_then_else
|
6054 |
|
|
(and (eq_attr "type" "alu") (match_operand 2 "const128_operand" ""))
|
6055 |
|
|
(const_string "1")
|
6056 |
|
|
(const_string "*")))
|
6057 |
|
|
(set_attr "mode" "")])
|
6058 |
|
|
|
6059 |
|
|
(define_insn "*add_5"
|
6060 |
|
|
[(set (reg FLAGS_REG)
|
6061 |
|
|
(compare
|
6062 |
|
|
(plus:SWI
|
6063 |
|
|
(match_operand:SWI 1 "nonimmediate_operand" "%0")
|
6064 |
|
|
(match_operand:SWI 2 "" ""))
|
6065 |
|
|
(const_int 0)))
|
6066 |
|
|
(clobber (match_scratch:SWI 0 "="))]
|
6067 |
|
|
"ix86_match_ccmode (insn, CCGOCmode)
|
6068 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6069 |
|
|
{
|
6070 |
|
|
switch (get_attr_type (insn))
|
6071 |
|
|
{
|
6072 |
|
|
case TYPE_INCDEC:
|
6073 |
|
|
if (operands[2] == const1_rtx)
|
6074 |
|
|
return "inc{}\t%0";
|
6075 |
|
|
else
|
6076 |
|
|
{
|
6077 |
|
|
gcc_assert (operands[2] == constm1_rtx);
|
6078 |
|
|
return "dec{}\t%0";
|
6079 |
|
|
}
|
6080 |
|
|
|
6081 |
|
|
default:
|
6082 |
|
|
if (x86_maybe_negate_const_int (&operands[2], mode))
|
6083 |
|
|
return "sub{}\t{%2, %0|%0, %2}";
|
6084 |
|
|
|
6085 |
|
|
return "add{}\t{%2, %0|%0, %2}";
|
6086 |
|
|
}
|
6087 |
|
|
}
|
6088 |
|
|
[(set (attr "type")
|
6089 |
|
|
(if_then_else (match_operand:SWI 2 "incdec_operand" "")
|
6090 |
|
|
(const_string "incdec")
|
6091 |
|
|
(const_string "alu")))
|
6092 |
|
|
(set (attr "length_immediate")
|
6093 |
|
|
(if_then_else
|
6094 |
|
|
(and (eq_attr "type" "alu") (match_operand 2 "const128_operand" ""))
|
6095 |
|
|
(const_string "1")
|
6096 |
|
|
(const_string "*")))
|
6097 |
|
|
(set_attr "mode" "")])
|
6098 |
|
|
|
6099 |
|
|
(define_insn "*addqi_ext_1_rex64"
|
6100 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
6101 |
|
|
(const_int 8)
|
6102 |
|
|
(const_int 8))
|
6103 |
|
|
(plus:SI
|
6104 |
|
|
(zero_extract:SI
|
6105 |
|
|
(match_operand 1 "ext_register_operand" "0")
|
6106 |
|
|
(const_int 8)
|
6107 |
|
|
(const_int 8))
|
6108 |
|
|
(match_operand:QI 2 "nonmemory_operand" "Qn")))
|
6109 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6110 |
|
|
"TARGET_64BIT"
|
6111 |
|
|
{
|
6112 |
|
|
switch (get_attr_type (insn))
|
6113 |
|
|
{
|
6114 |
|
|
case TYPE_INCDEC:
|
6115 |
|
|
if (operands[2] == const1_rtx)
|
6116 |
|
|
return "inc{b}\t%h0";
|
6117 |
|
|
else
|
6118 |
|
|
{
|
6119 |
|
|
gcc_assert (operands[2] == constm1_rtx);
|
6120 |
|
|
return "dec{b}\t%h0";
|
6121 |
|
|
}
|
6122 |
|
|
|
6123 |
|
|
default:
|
6124 |
|
|
return "add{b}\t{%2, %h0|%h0, %2}";
|
6125 |
|
|
}
|
6126 |
|
|
}
|
6127 |
|
|
[(set (attr "type")
|
6128 |
|
|
(if_then_else (match_operand:QI 2 "incdec_operand" "")
|
6129 |
|
|
(const_string "incdec")
|
6130 |
|
|
(const_string "alu")))
|
6131 |
|
|
(set_attr "modrm" "1")
|
6132 |
|
|
(set_attr "mode" "QI")])
|
6133 |
|
|
|
6134 |
|
|
(define_insn "addqi_ext_1"
|
6135 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
6136 |
|
|
(const_int 8)
|
6137 |
|
|
(const_int 8))
|
6138 |
|
|
(plus:SI
|
6139 |
|
|
(zero_extract:SI
|
6140 |
|
|
(match_operand 1 "ext_register_operand" "0")
|
6141 |
|
|
(const_int 8)
|
6142 |
|
|
(const_int 8))
|
6143 |
|
|
(match_operand:QI 2 "general_operand" "Qmn")))
|
6144 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6145 |
|
|
"!TARGET_64BIT"
|
6146 |
|
|
{
|
6147 |
|
|
switch (get_attr_type (insn))
|
6148 |
|
|
{
|
6149 |
|
|
case TYPE_INCDEC:
|
6150 |
|
|
if (operands[2] == const1_rtx)
|
6151 |
|
|
return "inc{b}\t%h0";
|
6152 |
|
|
else
|
6153 |
|
|
{
|
6154 |
|
|
gcc_assert (operands[2] == constm1_rtx);
|
6155 |
|
|
return "dec{b}\t%h0";
|
6156 |
|
|
}
|
6157 |
|
|
|
6158 |
|
|
default:
|
6159 |
|
|
return "add{b}\t{%2, %h0|%h0, %2}";
|
6160 |
|
|
}
|
6161 |
|
|
}
|
6162 |
|
|
[(set (attr "type")
|
6163 |
|
|
(if_then_else (match_operand:QI 2 "incdec_operand" "")
|
6164 |
|
|
(const_string "incdec")
|
6165 |
|
|
(const_string "alu")))
|
6166 |
|
|
(set_attr "modrm" "1")
|
6167 |
|
|
(set_attr "mode" "QI")])
|
6168 |
|
|
|
6169 |
|
|
(define_insn "*addqi_ext_2"
|
6170 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
6171 |
|
|
(const_int 8)
|
6172 |
|
|
(const_int 8))
|
6173 |
|
|
(plus:SI
|
6174 |
|
|
(zero_extract:SI
|
6175 |
|
|
(match_operand 1 "ext_register_operand" "%0")
|
6176 |
|
|
(const_int 8)
|
6177 |
|
|
(const_int 8))
|
6178 |
|
|
(zero_extract:SI
|
6179 |
|
|
(match_operand 2 "ext_register_operand" "Q")
|
6180 |
|
|
(const_int 8)
|
6181 |
|
|
(const_int 8))))
|
6182 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6183 |
|
|
""
|
6184 |
|
|
"add{b}\t{%h2, %h0|%h0, %h2}"
|
6185 |
|
|
[(set_attr "type" "alu")
|
6186 |
|
|
(set_attr "mode" "QI")])
|
6187 |
|
|
|
6188 |
|
|
;; The lea patterns for modes less than 32 bits need to be matched by
|
6189 |
|
|
;; several insns converted to real lea by splitters.
|
6190 |
|
|
|
6191 |
|
|
(define_insn_and_split "*lea_general_1"
|
6192 |
|
|
[(set (match_operand 0 "register_operand" "=r")
|
6193 |
|
|
(plus (plus (match_operand 1 "index_register_operand" "l")
|
6194 |
|
|
(match_operand 2 "register_operand" "r"))
|
6195 |
|
|
(match_operand 3 "immediate_operand" "i")))]
|
6196 |
|
|
"(GET_MODE (operands[0]) == QImode || GET_MODE (operands[0]) == HImode)
|
6197 |
|
|
&& (!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
6198 |
|
|
&& GET_MODE (operands[0]) == GET_MODE (operands[1])
|
6199 |
|
|
&& GET_MODE (operands[0]) == GET_MODE (operands[2])
|
6200 |
|
|
&& (GET_MODE (operands[0]) == GET_MODE (operands[3])
|
6201 |
|
|
|| GET_MODE (operands[3]) == VOIDmode)"
|
6202 |
|
|
"#"
|
6203 |
|
|
"&& reload_completed"
|
6204 |
|
|
[(const_int 0)]
|
6205 |
|
|
{
|
6206 |
|
|
enum machine_mode mode = SImode;
|
6207 |
|
|
rtx pat;
|
6208 |
|
|
|
6209 |
|
|
operands[0] = gen_lowpart (mode, operands[0]);
|
6210 |
|
|
operands[1] = gen_lowpart (mode, operands[1]);
|
6211 |
|
|
operands[2] = gen_lowpart (mode, operands[2]);
|
6212 |
|
|
operands[3] = gen_lowpart (mode, operands[3]);
|
6213 |
|
|
|
6214 |
|
|
pat = gen_rtx_PLUS (mode, gen_rtx_PLUS (mode, operands[1], operands[2]),
|
6215 |
|
|
operands[3]);
|
6216 |
|
|
|
6217 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0], pat));
|
6218 |
|
|
DONE;
|
6219 |
|
|
}
|
6220 |
|
|
[(set_attr "type" "lea")
|
6221 |
|
|
(set_attr "mode" "SI")])
|
6222 |
|
|
|
6223 |
|
|
(define_insn_and_split "*lea_general_2"
|
6224 |
|
|
[(set (match_operand 0 "register_operand" "=r")
|
6225 |
|
|
(plus (mult (match_operand 1 "index_register_operand" "l")
|
6226 |
|
|
(match_operand 2 "const248_operand" "n"))
|
6227 |
|
|
(match_operand 3 "nonmemory_operand" "ri")))]
|
6228 |
|
|
"(GET_MODE (operands[0]) == QImode || GET_MODE (operands[0]) == HImode)
|
6229 |
|
|
&& (!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
6230 |
|
|
&& GET_MODE (operands[0]) == GET_MODE (operands[1])
|
6231 |
|
|
&& (GET_MODE (operands[0]) == GET_MODE (operands[3])
|
6232 |
|
|
|| GET_MODE (operands[3]) == VOIDmode)"
|
6233 |
|
|
"#"
|
6234 |
|
|
"&& reload_completed"
|
6235 |
|
|
[(const_int 0)]
|
6236 |
|
|
{
|
6237 |
|
|
enum machine_mode mode = SImode;
|
6238 |
|
|
rtx pat;
|
6239 |
|
|
|
6240 |
|
|
operands[0] = gen_lowpart (mode, operands[0]);
|
6241 |
|
|
operands[1] = gen_lowpart (mode, operands[1]);
|
6242 |
|
|
operands[3] = gen_lowpart (mode, operands[3]);
|
6243 |
|
|
|
6244 |
|
|
pat = gen_rtx_PLUS (mode, gen_rtx_MULT (mode, operands[1], operands[2]),
|
6245 |
|
|
operands[3]);
|
6246 |
|
|
|
6247 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0], pat));
|
6248 |
|
|
DONE;
|
6249 |
|
|
}
|
6250 |
|
|
[(set_attr "type" "lea")
|
6251 |
|
|
(set_attr "mode" "SI")])
|
6252 |
|
|
|
6253 |
|
|
(define_insn_and_split "*lea_general_3"
|
6254 |
|
|
[(set (match_operand 0 "register_operand" "=r")
|
6255 |
|
|
(plus (plus (mult (match_operand 1 "index_register_operand" "l")
|
6256 |
|
|
(match_operand 2 "const248_operand" "n"))
|
6257 |
|
|
(match_operand 3 "register_operand" "r"))
|
6258 |
|
|
(match_operand 4 "immediate_operand" "i")))]
|
6259 |
|
|
"(GET_MODE (operands[0]) == QImode || GET_MODE (operands[0]) == HImode)
|
6260 |
|
|
&& (!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
6261 |
|
|
&& GET_MODE (operands[0]) == GET_MODE (operands[1])
|
6262 |
|
|
&& GET_MODE (operands[0]) == GET_MODE (operands[3])"
|
6263 |
|
|
"#"
|
6264 |
|
|
"&& reload_completed"
|
6265 |
|
|
[(const_int 0)]
|
6266 |
|
|
{
|
6267 |
|
|
enum machine_mode mode = SImode;
|
6268 |
|
|
rtx pat;
|
6269 |
|
|
|
6270 |
|
|
operands[0] = gen_lowpart (mode, operands[0]);
|
6271 |
|
|
operands[1] = gen_lowpart (mode, operands[1]);
|
6272 |
|
|
operands[3] = gen_lowpart (mode, operands[3]);
|
6273 |
|
|
operands[4] = gen_lowpart (mode, operands[4]);
|
6274 |
|
|
|
6275 |
|
|
pat = gen_rtx_PLUS (mode,
|
6276 |
|
|
gen_rtx_PLUS (mode,
|
6277 |
|
|
gen_rtx_MULT (mode, operands[1],
|
6278 |
|
|
operands[2]),
|
6279 |
|
|
operands[3]),
|
6280 |
|
|
operands[4]);
|
6281 |
|
|
|
6282 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0], pat));
|
6283 |
|
|
DONE;
|
6284 |
|
|
}
|
6285 |
|
|
[(set_attr "type" "lea")
|
6286 |
|
|
(set_attr "mode" "SI")])
|
6287 |
|
|
|
6288 |
|
|
(define_insn_and_split "*lea_general_4"
|
6289 |
|
|
[(set (match_operand 0 "register_operand" "=r")
|
6290 |
|
|
(any_or (ashift
|
6291 |
|
|
(match_operand 1 "index_register_operand" "l")
|
6292 |
|
|
(match_operand 2 "const_int_operand" "n"))
|
6293 |
|
|
(match_operand 3 "const_int_operand" "n")))]
|
6294 |
|
|
"(((GET_MODE (operands[0]) == QImode || GET_MODE (operands[0]) == HImode)
|
6295 |
|
|
&& (!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun)))
|
6296 |
|
|
|| GET_MODE (operands[0]) == SImode
|
6297 |
|
|
|| (TARGET_64BIT && GET_MODE (operands[0]) == DImode))
|
6298 |
|
|
&& GET_MODE (operands[0]) == GET_MODE (operands[1])
|
6299 |
|
|
&& ((unsigned HOST_WIDE_INT) INTVAL (operands[2])) - 1 < 3
|
6300 |
|
|
&& ((unsigned HOST_WIDE_INT) INTVAL (operands[3])
|
6301 |
|
|
< ((unsigned HOST_WIDE_INT) 1 << INTVAL (operands[2])))"
|
6302 |
|
|
"#"
|
6303 |
|
|
"&& reload_completed"
|
6304 |
|
|
[(const_int 0)]
|
6305 |
|
|
{
|
6306 |
|
|
enum machine_mode mode = GET_MODE (operands[0]);
|
6307 |
|
|
rtx pat;
|
6308 |
|
|
|
6309 |
|
|
if (GET_MODE_SIZE (mode) < GET_MODE_SIZE (SImode))
|
6310 |
|
|
{
|
6311 |
|
|
mode = SImode;
|
6312 |
|
|
operands[0] = gen_lowpart (mode, operands[0]);
|
6313 |
|
|
operands[1] = gen_lowpart (mode, operands[1]);
|
6314 |
|
|
}
|
6315 |
|
|
|
6316 |
|
|
operands[2] = GEN_INT (1 << INTVAL (operands[2]));
|
6317 |
|
|
|
6318 |
|
|
pat = plus_constant (gen_rtx_MULT (mode, operands[1], operands[2]),
|
6319 |
|
|
INTVAL (operands[3]));
|
6320 |
|
|
|
6321 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0], pat));
|
6322 |
|
|
DONE;
|
6323 |
|
|
}
|
6324 |
|
|
[(set_attr "type" "lea")
|
6325 |
|
|
(set (attr "mode")
|
6326 |
|
|
(if_then_else (match_operand:DI 0 "" "")
|
6327 |
|
|
(const_string "DI")
|
6328 |
|
|
(const_string "SI")))])
|
6329 |
|
|
|
6330 |
|
|
;; Subtract instructions
|
6331 |
|
|
|
6332 |
|
|
(define_expand "sub3"
|
6333 |
|
|
[(set (match_operand:SDWIM 0 "nonimmediate_operand" "")
|
6334 |
|
|
(minus:SDWIM (match_operand:SDWIM 1 "nonimmediate_operand" "")
|
6335 |
|
|
(match_operand:SDWIM 2 "" "")))]
|
6336 |
|
|
""
|
6337 |
|
|
"ix86_expand_binary_operator (MINUS, mode, operands); DONE;")
|
6338 |
|
|
|
6339 |
|
|
(define_insn_and_split "*sub3_doubleword"
|
6340 |
|
|
[(set (match_operand: 0 "nonimmediate_operand" "=r,o")
|
6341 |
|
|
(minus:
|
6342 |
|
|
(match_operand: 1 "nonimmediate_operand" "0,0")
|
6343 |
|
|
(match_operand: 2 "" "ro,r")))
|
6344 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6345 |
|
|
"ix86_binary_operator_ok (MINUS, mode, operands)"
|
6346 |
|
|
"#"
|
6347 |
|
|
"reload_completed"
|
6348 |
|
|
[(parallel [(set (reg:CC FLAGS_REG)
|
6349 |
|
|
(compare:CC (match_dup 1) (match_dup 2)))
|
6350 |
|
|
(set (match_dup 0)
|
6351 |
|
|
(minus:DWIH (match_dup 1) (match_dup 2)))])
|
6352 |
|
|
(parallel [(set (match_dup 3)
|
6353 |
|
|
(minus:DWIH
|
6354 |
|
|
(match_dup 4)
|
6355 |
|
|
(plus:DWIH
|
6356 |
|
|
(ltu:DWIH (reg:CC FLAGS_REG) (const_int 0))
|
6357 |
|
|
(match_dup 5))))
|
6358 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
6359 |
|
|
"split_double_mode (mode, &operands[0], 3, &operands[0], &operands[3]);")
|
6360 |
|
|
|
6361 |
|
|
(define_insn "*sub_1"
|
6362 |
|
|
[(set (match_operand:SWI 0 "nonimmediate_operand" "=m,")
|
6363 |
|
|
(minus:SWI
|
6364 |
|
|
(match_operand:SWI 1 "nonimmediate_operand" "0,0")
|
6365 |
|
|
(match_operand:SWI 2 "" ",m")))
|
6366 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6367 |
|
|
"ix86_binary_operator_ok (MINUS, mode, operands)"
|
6368 |
|
|
"sub{}\t{%2, %0|%0, %2}"
|
6369 |
|
|
[(set_attr "type" "alu")
|
6370 |
|
|
(set_attr "mode" "")])
|
6371 |
|
|
|
6372 |
|
|
(define_insn "*subsi_1_zext"
|
6373 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
6374 |
|
|
(zero_extend:DI
|
6375 |
|
|
(minus:SI (match_operand:SI 1 "register_operand" "0")
|
6376 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "rme"))))
|
6377 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6378 |
|
|
"TARGET_64BIT && ix86_binary_operator_ok (MINUS, SImode, operands)"
|
6379 |
|
|
"sub{l}\t{%2, %k0|%k0, %2}"
|
6380 |
|
|
[(set_attr "type" "alu")
|
6381 |
|
|
(set_attr "mode" "SI")])
|
6382 |
|
|
|
6383 |
|
|
(define_insn "*subqi_1_slp"
|
6384 |
|
|
[(set (strict_low_part (match_operand:QI 0 "nonimmediate_operand" "+qm,q"))
|
6385 |
|
|
(minus:QI (match_dup 0)
|
6386 |
|
|
(match_operand:QI 1 "general_operand" "qn,qm")))
|
6387 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6388 |
|
|
"(! TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
6389 |
|
|
&& !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
6390 |
|
|
"sub{b}\t{%1, %0|%0, %1}"
|
6391 |
|
|
[(set_attr "type" "alu1")
|
6392 |
|
|
(set_attr "mode" "QI")])
|
6393 |
|
|
|
6394 |
|
|
(define_insn "*sub_2"
|
6395 |
|
|
[(set (reg FLAGS_REG)
|
6396 |
|
|
(compare
|
6397 |
|
|
(minus:SWI
|
6398 |
|
|
(match_operand:SWI 1 "nonimmediate_operand" "0,0")
|
6399 |
|
|
(match_operand:SWI 2 "" ",m"))
|
6400 |
|
|
(const_int 0)))
|
6401 |
|
|
(set (match_operand:SWI 0 "nonimmediate_operand" "=m,")
|
6402 |
|
|
(minus:SWI (match_dup 1) (match_dup 2)))]
|
6403 |
|
|
"ix86_match_ccmode (insn, CCGOCmode)
|
6404 |
|
|
&& ix86_binary_operator_ok (MINUS, mode, operands)"
|
6405 |
|
|
"sub{}\t{%2, %0|%0, %2}"
|
6406 |
|
|
[(set_attr "type" "alu")
|
6407 |
|
|
(set_attr "mode" "")])
|
6408 |
|
|
|
6409 |
|
|
(define_insn "*subsi_2_zext"
|
6410 |
|
|
[(set (reg FLAGS_REG)
|
6411 |
|
|
(compare
|
6412 |
|
|
(minus:SI (match_operand:SI 1 "register_operand" "0")
|
6413 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "rme"))
|
6414 |
|
|
(const_int 0)))
|
6415 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
6416 |
|
|
(zero_extend:DI
|
6417 |
|
|
(minus:SI (match_dup 1)
|
6418 |
|
|
(match_dup 2))))]
|
6419 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCGOCmode)
|
6420 |
|
|
&& ix86_binary_operator_ok (MINUS, SImode, operands)"
|
6421 |
|
|
"sub{l}\t{%2, %k0|%k0, %2}"
|
6422 |
|
|
[(set_attr "type" "alu")
|
6423 |
|
|
(set_attr "mode" "SI")])
|
6424 |
|
|
|
6425 |
|
|
(define_insn "*sub_3"
|
6426 |
|
|
[(set (reg FLAGS_REG)
|
6427 |
|
|
(compare (match_operand:SWI 1 "nonimmediate_operand" "0,0")
|
6428 |
|
|
(match_operand:SWI 2 "" ",m")))
|
6429 |
|
|
(set (match_operand:SWI 0 "nonimmediate_operand" "=m,")
|
6430 |
|
|
(minus:SWI (match_dup 1) (match_dup 2)))]
|
6431 |
|
|
"ix86_match_ccmode (insn, CCmode)
|
6432 |
|
|
&& ix86_binary_operator_ok (MINUS, mode, operands)"
|
6433 |
|
|
"sub{}\t{%2, %0|%0, %2}"
|
6434 |
|
|
[(set_attr "type" "alu")
|
6435 |
|
|
(set_attr "mode" "")])
|
6436 |
|
|
|
6437 |
|
|
(define_insn "*subsi_3_zext"
|
6438 |
|
|
[(set (reg FLAGS_REG)
|
6439 |
|
|
(compare (match_operand:SI 1 "register_operand" "0")
|
6440 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "rme")))
|
6441 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
6442 |
|
|
(zero_extend:DI
|
6443 |
|
|
(minus:SI (match_dup 1)
|
6444 |
|
|
(match_dup 2))))]
|
6445 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCmode)
|
6446 |
|
|
&& ix86_binary_operator_ok (MINUS, SImode, operands)"
|
6447 |
|
|
"sub{l}\t{%2, %1|%1, %2}"
|
6448 |
|
|
[(set_attr "type" "alu")
|
6449 |
|
|
(set_attr "mode" "SI")])
|
6450 |
|
|
|
6451 |
|
|
;; Add with carry and subtract with borrow
|
6452 |
|
|
|
6453 |
|
|
(define_expand "3_carry"
|
6454 |
|
|
[(parallel
|
6455 |
|
|
[(set (match_operand:SWI 0 "nonimmediate_operand" "")
|
6456 |
|
|
(plusminus:SWI
|
6457 |
|
|
(match_operand:SWI 1 "nonimmediate_operand" "")
|
6458 |
|
|
(plus:SWI (match_operator:SWI 4 "ix86_carry_flag_operator"
|
6459 |
|
|
[(match_operand 3 "flags_reg_operand" "")
|
6460 |
|
|
(const_int 0)])
|
6461 |
|
|
(match_operand:SWI 2 "" ""))))
|
6462 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
6463 |
|
|
"ix86_binary_operator_ok (, mode, operands)")
|
6464 |
|
|
|
6465 |
|
|
(define_insn "*3_carry"
|
6466 |
|
|
[(set (match_operand:SWI 0 "nonimmediate_operand" "=m,")
|
6467 |
|
|
(plusminus:SWI
|
6468 |
|
|
(match_operand:SWI 1 "nonimmediate_operand" "0,0")
|
6469 |
|
|
(plus:SWI
|
6470 |
|
|
(match_operator 3 "ix86_carry_flag_operator"
|
6471 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
6472 |
|
|
(match_operand:SWI 2 "" ",m"))))
|
6473 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6474 |
|
|
"ix86_binary_operator_ok (PLUS, mode, operands)"
|
6475 |
|
|
"{}\t{%2, %0|%0, %2}"
|
6476 |
|
|
[(set_attr "type" "alu")
|
6477 |
|
|
(set_attr "use_carry" "1")
|
6478 |
|
|
(set_attr "pent_pair" "pu")
|
6479 |
|
|
(set_attr "mode" "")])
|
6480 |
|
|
|
6481 |
|
|
(define_insn "*addsi3_carry_zext"
|
6482 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
6483 |
|
|
(zero_extend:DI
|
6484 |
|
|
(plus:SI (match_operand:SI 1 "nonimmediate_operand" "%0")
|
6485 |
|
|
(plus:SI (match_operator 3 "ix86_carry_flag_operator"
|
6486 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
6487 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "rme")))))
|
6488 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6489 |
|
|
"TARGET_64BIT && ix86_binary_operator_ok (PLUS, SImode, operands)"
|
6490 |
|
|
"adc{l}\t{%2, %k0|%k0, %2}"
|
6491 |
|
|
[(set_attr "type" "alu")
|
6492 |
|
|
(set_attr "use_carry" "1")
|
6493 |
|
|
(set_attr "pent_pair" "pu")
|
6494 |
|
|
(set_attr "mode" "SI")])
|
6495 |
|
|
|
6496 |
|
|
(define_insn "*subsi3_carry_zext"
|
6497 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
6498 |
|
|
(zero_extend:DI
|
6499 |
|
|
(minus:SI (match_operand:SI 1 "register_operand" "0")
|
6500 |
|
|
(plus:SI (match_operator 3 "ix86_carry_flag_operator"
|
6501 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
6502 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "rme")))))
|
6503 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6504 |
|
|
"TARGET_64BIT && ix86_binary_operator_ok (MINUS, SImode, operands)"
|
6505 |
|
|
"sbb{l}\t{%2, %k0|%k0, %2}"
|
6506 |
|
|
[(set_attr "type" "alu")
|
6507 |
|
|
(set_attr "pent_pair" "pu")
|
6508 |
|
|
(set_attr "mode" "SI")])
|
6509 |
|
|
|
6510 |
|
|
;; Overflow setting add and subtract instructions
|
6511 |
|
|
|
6512 |
|
|
(define_insn "*add3_cconly_overflow"
|
6513 |
|
|
[(set (reg:CCC FLAGS_REG)
|
6514 |
|
|
(compare:CCC
|
6515 |
|
|
(plus:SWI
|
6516 |
|
|
(match_operand:SWI 1 "nonimmediate_operand" "%0")
|
6517 |
|
|
(match_operand:SWI 2 "" ""))
|
6518 |
|
|
(match_dup 1)))
|
6519 |
|
|
(clobber (match_scratch:SWI 0 "="))]
|
6520 |
|
|
"!(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6521 |
|
|
"add{}\t{%2, %0|%0, %2}"
|
6522 |
|
|
[(set_attr "type" "alu")
|
6523 |
|
|
(set_attr "mode" "")])
|
6524 |
|
|
|
6525 |
|
|
(define_insn "*sub3_cconly_overflow"
|
6526 |
|
|
[(set (reg:CCC FLAGS_REG)
|
6527 |
|
|
(compare:CCC
|
6528 |
|
|
(minus:SWI
|
6529 |
|
|
(match_operand:SWI 0 "nonimmediate_operand" "m,")
|
6530 |
|
|
(match_operand:SWI 1 "" ",m"))
|
6531 |
|
|
(match_dup 0)))]
|
6532 |
|
|
""
|
6533 |
|
|
"cmp{}\t{%1, %0|%0, %1}"
|
6534 |
|
|
[(set_attr "type" "icmp")
|
6535 |
|
|
(set_attr "mode" "")])
|
6536 |
|
|
|
6537 |
|
|
(define_insn "*3_cc_overflow"
|
6538 |
|
|
[(set (reg:CCC FLAGS_REG)
|
6539 |
|
|
(compare:CCC
|
6540 |
|
|
(plusminus:SWI
|
6541 |
|
|
(match_operand:SWI 1 "nonimmediate_operand" "0,0")
|
6542 |
|
|
(match_operand:SWI 2 "" ",m"))
|
6543 |
|
|
(match_dup 1)))
|
6544 |
|
|
(set (match_operand:SWI 0 "nonimmediate_operand" "=m,")
|
6545 |
|
|
(plusminus:SWI (match_dup 1) (match_dup 2)))]
|
6546 |
|
|
"ix86_binary_operator_ok (, mode, operands)"
|
6547 |
|
|
"{}\t{%2, %0|%0, %2}"
|
6548 |
|
|
[(set_attr "type" "alu")
|
6549 |
|
|
(set_attr "mode" "")])
|
6550 |
|
|
|
6551 |
|
|
(define_insn "*si3_zext_cc_overflow"
|
6552 |
|
|
[(set (reg:CCC FLAGS_REG)
|
6553 |
|
|
(compare:CCC
|
6554 |
|
|
(plusminus:SI
|
6555 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "0")
|
6556 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "rme"))
|
6557 |
|
|
(match_dup 1)))
|
6558 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
6559 |
|
|
(zero_extend:DI (plusminus:SI (match_dup 1) (match_dup 2))))]
|
6560 |
|
|
"TARGET_64BIT && ix86_binary_operator_ok (, SImode, operands)"
|
6561 |
|
|
"{l}\t{%2, %k0|%k0, %2}"
|
6562 |
|
|
[(set_attr "type" "alu")
|
6563 |
|
|
(set_attr "mode" "SI")])
|
6564 |
|
|
|
6565 |
|
|
;; The patterns that match these are at the end of this file.
|
6566 |
|
|
|
6567 |
|
|
(define_expand "xf3"
|
6568 |
|
|
[(set (match_operand:XF 0 "register_operand" "")
|
6569 |
|
|
(plusminus:XF
|
6570 |
|
|
(match_operand:XF 1 "register_operand" "")
|
6571 |
|
|
(match_operand:XF 2 "register_operand" "")))]
|
6572 |
|
|
"TARGET_80387")
|
6573 |
|
|
|
6574 |
|
|
(define_expand "3"
|
6575 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
6576 |
|
|
(plusminus:MODEF
|
6577 |
|
|
(match_operand:MODEF 1 "register_operand" "")
|
6578 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "")))]
|
6579 |
|
|
"(TARGET_80387 && X87_ENABLE_ARITH (mode))
|
6580 |
|
|
|| (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)")
|
6581 |
|
|
|
6582 |
|
|
;; Multiply instructions
|
6583 |
|
|
|
6584 |
|
|
(define_expand "mul3"
|
6585 |
|
|
[(parallel [(set (match_operand:SWIM248 0 "register_operand" "")
|
6586 |
|
|
(mult:SWIM248
|
6587 |
|
|
(match_operand:SWIM248 1 "register_operand" "")
|
6588 |
|
|
(match_operand:SWIM248 2 "" "")))
|
6589 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
6590 |
|
|
|
6591 |
|
|
(define_expand "mulqi3"
|
6592 |
|
|
[(parallel [(set (match_operand:QI 0 "register_operand" "")
|
6593 |
|
|
(mult:QI
|
6594 |
|
|
(match_operand:QI 1 "register_operand" "")
|
6595 |
|
|
(match_operand:QI 2 "nonimmediate_operand" "")))
|
6596 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
6597 |
|
|
"TARGET_QIMODE_MATH")
|
6598 |
|
|
|
6599 |
|
|
;; On AMDFAM10
|
6600 |
|
|
;; IMUL reg32/64, reg32/64, imm8 Direct
|
6601 |
|
|
;; IMUL reg32/64, mem32/64, imm8 VectorPath
|
6602 |
|
|
;; IMUL reg32/64, reg32/64, imm32 Direct
|
6603 |
|
|
;; IMUL reg32/64, mem32/64, imm32 VectorPath
|
6604 |
|
|
;; IMUL reg32/64, reg32/64 Direct
|
6605 |
|
|
;; IMUL reg32/64, mem32/64 Direct
|
6606 |
|
|
;;
|
6607 |
|
|
;; On BDVER1, all above IMULs use DirectPath
|
6608 |
|
|
|
6609 |
|
|
(define_insn "*mul3_1"
|
6610 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r,r,r")
|
6611 |
|
|
(mult:SWI48
|
6612 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "%rm,rm,0")
|
6613 |
|
|
(match_operand:SWI48 2 "" "K,,mr")))
|
6614 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6615 |
|
|
"!(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6616 |
|
|
"@
|
6617 |
|
|
imul{}\t{%2, %1, %0|%0, %1, %2}
|
6618 |
|
|
imul{}\t{%2, %1, %0|%0, %1, %2}
|
6619 |
|
|
imul{}\t{%2, %0|%0, %2}"
|
6620 |
|
|
[(set_attr "type" "imul")
|
6621 |
|
|
(set_attr "prefix_0f" "0,0,1")
|
6622 |
|
|
(set (attr "athlon_decode")
|
6623 |
|
|
(cond [(eq_attr "cpu" "athlon")
|
6624 |
|
|
(const_string "vector")
|
6625 |
|
|
(eq_attr "alternative" "1")
|
6626 |
|
|
(const_string "vector")
|
6627 |
|
|
(and (eq_attr "alternative" "2")
|
6628 |
|
|
(match_operand 1 "memory_operand" ""))
|
6629 |
|
|
(const_string "vector")]
|
6630 |
|
|
(const_string "direct")))
|
6631 |
|
|
(set (attr "amdfam10_decode")
|
6632 |
|
|
(cond [(and (eq_attr "alternative" "0,1")
|
6633 |
|
|
(match_operand 1 "memory_operand" ""))
|
6634 |
|
|
(const_string "vector")]
|
6635 |
|
|
(const_string "direct")))
|
6636 |
|
|
(set_attr "bdver1_decode" "direct")
|
6637 |
|
|
(set_attr "mode" "")])
|
6638 |
|
|
|
6639 |
|
|
(define_insn "*mulsi3_1_zext"
|
6640 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r,r,r")
|
6641 |
|
|
(zero_extend:DI
|
6642 |
|
|
(mult:SI (match_operand:SI 1 "nonimmediate_operand" "%rm,rm,0")
|
6643 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "K,e,mr"))))
|
6644 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6645 |
|
|
"TARGET_64BIT
|
6646 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6647 |
|
|
"@
|
6648 |
|
|
imul{l}\t{%2, %1, %k0|%k0, %1, %2}
|
6649 |
|
|
imul{l}\t{%2, %1, %k0|%k0, %1, %2}
|
6650 |
|
|
imul{l}\t{%2, %k0|%k0, %2}"
|
6651 |
|
|
[(set_attr "type" "imul")
|
6652 |
|
|
(set_attr "prefix_0f" "0,0,1")
|
6653 |
|
|
(set (attr "athlon_decode")
|
6654 |
|
|
(cond [(eq_attr "cpu" "athlon")
|
6655 |
|
|
(const_string "vector")
|
6656 |
|
|
(eq_attr "alternative" "1")
|
6657 |
|
|
(const_string "vector")
|
6658 |
|
|
(and (eq_attr "alternative" "2")
|
6659 |
|
|
(match_operand 1 "memory_operand" ""))
|
6660 |
|
|
(const_string "vector")]
|
6661 |
|
|
(const_string "direct")))
|
6662 |
|
|
(set (attr "amdfam10_decode")
|
6663 |
|
|
(cond [(and (eq_attr "alternative" "0,1")
|
6664 |
|
|
(match_operand 1 "memory_operand" ""))
|
6665 |
|
|
(const_string "vector")]
|
6666 |
|
|
(const_string "direct")))
|
6667 |
|
|
(set_attr "bdver1_decode" "direct")
|
6668 |
|
|
(set_attr "mode" "SI")])
|
6669 |
|
|
|
6670 |
|
|
;; On AMDFAM10
|
6671 |
|
|
;; IMUL reg16, reg16, imm8 VectorPath
|
6672 |
|
|
;; IMUL reg16, mem16, imm8 VectorPath
|
6673 |
|
|
;; IMUL reg16, reg16, imm16 VectorPath
|
6674 |
|
|
;; IMUL reg16, mem16, imm16 VectorPath
|
6675 |
|
|
;; IMUL reg16, reg16 Direct
|
6676 |
|
|
;; IMUL reg16, mem16 Direct
|
6677 |
|
|
;;
|
6678 |
|
|
;; On BDVER1, all HI MULs use DoublePath
|
6679 |
|
|
|
6680 |
|
|
(define_insn "*mulhi3_1"
|
6681 |
|
|
[(set (match_operand:HI 0 "register_operand" "=r,r,r")
|
6682 |
|
|
(mult:HI (match_operand:HI 1 "nonimmediate_operand" "%rm,rm,0")
|
6683 |
|
|
(match_operand:HI 2 "general_operand" "K,n,mr")))
|
6684 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6685 |
|
|
"TARGET_HIMODE_MATH
|
6686 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6687 |
|
|
"@
|
6688 |
|
|
imul{w}\t{%2, %1, %0|%0, %1, %2}
|
6689 |
|
|
imul{w}\t{%2, %1, %0|%0, %1, %2}
|
6690 |
|
|
imul{w}\t{%2, %0|%0, %2}"
|
6691 |
|
|
[(set_attr "type" "imul")
|
6692 |
|
|
(set_attr "prefix_0f" "0,0,1")
|
6693 |
|
|
(set (attr "athlon_decode")
|
6694 |
|
|
(cond [(eq_attr "cpu" "athlon")
|
6695 |
|
|
(const_string "vector")
|
6696 |
|
|
(eq_attr "alternative" "1,2")
|
6697 |
|
|
(const_string "vector")]
|
6698 |
|
|
(const_string "direct")))
|
6699 |
|
|
(set (attr "amdfam10_decode")
|
6700 |
|
|
(cond [(eq_attr "alternative" "0,1")
|
6701 |
|
|
(const_string "vector")]
|
6702 |
|
|
(const_string "direct")))
|
6703 |
|
|
(set_attr "bdver1_decode" "double")
|
6704 |
|
|
(set_attr "mode" "HI")])
|
6705 |
|
|
|
6706 |
|
|
;;On AMDFAM10 and BDVER1
|
6707 |
|
|
;; MUL reg8 Direct
|
6708 |
|
|
;; MUL mem8 Direct
|
6709 |
|
|
|
6710 |
|
|
(define_insn "*mulqi3_1"
|
6711 |
|
|
[(set (match_operand:QI 0 "register_operand" "=a")
|
6712 |
|
|
(mult:QI (match_operand:QI 1 "nonimmediate_operand" "%0")
|
6713 |
|
|
(match_operand:QI 2 "nonimmediate_operand" "qm")))
|
6714 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6715 |
|
|
"TARGET_QIMODE_MATH
|
6716 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6717 |
|
|
"mul{b}\t%2"
|
6718 |
|
|
[(set_attr "type" "imul")
|
6719 |
|
|
(set_attr "length_immediate" "0")
|
6720 |
|
|
(set (attr "athlon_decode")
|
6721 |
|
|
(if_then_else (eq_attr "cpu" "athlon")
|
6722 |
|
|
(const_string "vector")
|
6723 |
|
|
(const_string "direct")))
|
6724 |
|
|
(set_attr "amdfam10_decode" "direct")
|
6725 |
|
|
(set_attr "bdver1_decode" "direct")
|
6726 |
|
|
(set_attr "mode" "QI")])
|
6727 |
|
|
|
6728 |
|
|
(define_expand "mul3"
|
6729 |
|
|
[(parallel [(set (match_operand: 0 "register_operand" "")
|
6730 |
|
|
(mult:
|
6731 |
|
|
(any_extend:
|
6732 |
|
|
(match_operand:DWIH 1 "nonimmediate_operand" ""))
|
6733 |
|
|
(any_extend:
|
6734 |
|
|
(match_operand:DWIH 2 "register_operand" ""))))
|
6735 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
6736 |
|
|
|
6737 |
|
|
(define_expand "mulqihi3"
|
6738 |
|
|
[(parallel [(set (match_operand:HI 0 "register_operand" "")
|
6739 |
|
|
(mult:HI
|
6740 |
|
|
(any_extend:HI
|
6741 |
|
|
(match_operand:QI 1 "nonimmediate_operand" ""))
|
6742 |
|
|
(any_extend:HI
|
6743 |
|
|
(match_operand:QI 2 "register_operand" ""))))
|
6744 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
6745 |
|
|
"TARGET_QIMODE_MATH")
|
6746 |
|
|
|
6747 |
|
|
(define_insn "*bmi2_umulditi3_1"
|
6748 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
6749 |
|
|
(mult:DI
|
6750 |
|
|
(match_operand:DI 2 "nonimmediate_operand" "%d")
|
6751 |
|
|
(match_operand:DI 3 "nonimmediate_operand" "rm")))
|
6752 |
|
|
(set (match_operand:DI 1 "register_operand" "=r")
|
6753 |
|
|
(truncate:DI
|
6754 |
|
|
(lshiftrt:TI
|
6755 |
|
|
(mult:TI (zero_extend:TI (match_dup 2))
|
6756 |
|
|
(zero_extend:TI (match_dup 3)))
|
6757 |
|
|
(const_int 64))))]
|
6758 |
|
|
"TARGET_64BIT && TARGET_BMI2
|
6759 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6760 |
|
|
"mulx\t{%3, %0, %1|%1, %0, %3}"
|
6761 |
|
|
[(set_attr "type" "imulx")
|
6762 |
|
|
(set_attr "prefix" "vex")
|
6763 |
|
|
(set_attr "mode" "DI")])
|
6764 |
|
|
|
6765 |
|
|
(define_insn "*bmi2_umulsidi3_1"
|
6766 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
6767 |
|
|
(mult:SI
|
6768 |
|
|
(match_operand:SI 2 "nonimmediate_operand" "%d")
|
6769 |
|
|
(match_operand:SI 3 "nonimmediate_operand" "rm")))
|
6770 |
|
|
(set (match_operand:SI 1 "register_operand" "=r")
|
6771 |
|
|
(truncate:SI
|
6772 |
|
|
(lshiftrt:DI
|
6773 |
|
|
(mult:DI (zero_extend:DI (match_dup 2))
|
6774 |
|
|
(zero_extend:DI (match_dup 3)))
|
6775 |
|
|
(const_int 32))))]
|
6776 |
|
|
"!TARGET_64BIT && TARGET_BMI2
|
6777 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6778 |
|
|
"mulx\t{%3, %0, %1|%1, %0, %3}"
|
6779 |
|
|
[(set_attr "type" "imulx")
|
6780 |
|
|
(set_attr "prefix" "vex")
|
6781 |
|
|
(set_attr "mode" "SI")])
|
6782 |
|
|
|
6783 |
|
|
(define_insn "*umul3_1"
|
6784 |
|
|
[(set (match_operand: 0 "register_operand" "=A,r")
|
6785 |
|
|
(mult:
|
6786 |
|
|
(zero_extend:
|
6787 |
|
|
(match_operand:DWIH 1 "nonimmediate_operand" "%0,d"))
|
6788 |
|
|
(zero_extend:
|
6789 |
|
|
(match_operand:DWIH 2 "nonimmediate_operand" "rm,rm"))))
|
6790 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6791 |
|
|
"!(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6792 |
|
|
"@
|
6793 |
|
|
mul{}\t%2
|
6794 |
|
|
#"
|
6795 |
|
|
[(set_attr "isa" "*,bmi2")
|
6796 |
|
|
(set_attr "type" "imul,imulx")
|
6797 |
|
|
(set_attr "length_immediate" "0,*")
|
6798 |
|
|
(set (attr "athlon_decode")
|
6799 |
|
|
(cond [(eq_attr "alternative" "0")
|
6800 |
|
|
(if_then_else (eq_attr "cpu" "athlon")
|
6801 |
|
|
(const_string "vector")
|
6802 |
|
|
(const_string "double"))]
|
6803 |
|
|
(const_string "*")))
|
6804 |
|
|
(set_attr "amdfam10_decode" "double,*")
|
6805 |
|
|
(set_attr "bdver1_decode" "direct,*")
|
6806 |
|
|
(set_attr "prefix" "orig,vex")
|
6807 |
|
|
(set_attr "mode" "")])
|
6808 |
|
|
|
6809 |
|
|
;; Convert mul to the mulx pattern to avoid flags dependency.
|
6810 |
|
|
(define_split
|
6811 |
|
|
[(set (match_operand: 0 "register_operand" "")
|
6812 |
|
|
(mult:
|
6813 |
|
|
(zero_extend:
|
6814 |
|
|
(match_operand:DWIH 1 "register_operand" ""))
|
6815 |
|
|
(zero_extend:
|
6816 |
|
|
(match_operand:DWIH 2 "nonimmediate_operand" ""))))
|
6817 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6818 |
|
|
"TARGET_BMI2 && reload_completed
|
6819 |
|
|
&& true_regnum (operands[1]) == DX_REG"
|
6820 |
|
|
[(parallel [(set (match_dup 3)
|
6821 |
|
|
(mult:DWIH (match_dup 1) (match_dup 2)))
|
6822 |
|
|
(set (match_dup 4)
|
6823 |
|
|
(truncate:DWIH
|
6824 |
|
|
(lshiftrt:
|
6825 |
|
|
(mult: (zero_extend: (match_dup 1))
|
6826 |
|
|
(zero_extend: (match_dup 2)))
|
6827 |
|
|
(match_dup 5))))])]
|
6828 |
|
|
{
|
6829 |
|
|
split_double_mode (mode, &operands[0], 1, &operands[3], &operands[4]);
|
6830 |
|
|
|
6831 |
|
|
operands[5] = GEN_INT (GET_MODE_BITSIZE (mode));
|
6832 |
|
|
})
|
6833 |
|
|
|
6834 |
|
|
(define_insn "*mul3_1"
|
6835 |
|
|
[(set (match_operand: 0 "register_operand" "=A")
|
6836 |
|
|
(mult:
|
6837 |
|
|
(sign_extend:
|
6838 |
|
|
(match_operand:DWIH 1 "nonimmediate_operand" "%0"))
|
6839 |
|
|
(sign_extend:
|
6840 |
|
|
(match_operand:DWIH 2 "nonimmediate_operand" "rm"))))
|
6841 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6842 |
|
|
"!(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6843 |
|
|
"imul{}\t%2"
|
6844 |
|
|
[(set_attr "type" "imul")
|
6845 |
|
|
(set_attr "length_immediate" "0")
|
6846 |
|
|
(set (attr "athlon_decode")
|
6847 |
|
|
(if_then_else (eq_attr "cpu" "athlon")
|
6848 |
|
|
(const_string "vector")
|
6849 |
|
|
(const_string "double")))
|
6850 |
|
|
(set_attr "amdfam10_decode" "double")
|
6851 |
|
|
(set_attr "bdver1_decode" "direct")
|
6852 |
|
|
(set_attr "mode" "")])
|
6853 |
|
|
|
6854 |
|
|
(define_insn "*mulqihi3_1"
|
6855 |
|
|
[(set (match_operand:HI 0 "register_operand" "=a")
|
6856 |
|
|
(mult:HI
|
6857 |
|
|
(any_extend:HI
|
6858 |
|
|
(match_operand:QI 1 "nonimmediate_operand" "%0"))
|
6859 |
|
|
(any_extend:HI
|
6860 |
|
|
(match_operand:QI 2 "nonimmediate_operand" "qm"))))
|
6861 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6862 |
|
|
"TARGET_QIMODE_MATH
|
6863 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6864 |
|
|
"mul{b}\t%2"
|
6865 |
|
|
[(set_attr "type" "imul")
|
6866 |
|
|
(set_attr "length_immediate" "0")
|
6867 |
|
|
(set (attr "athlon_decode")
|
6868 |
|
|
(if_then_else (eq_attr "cpu" "athlon")
|
6869 |
|
|
(const_string "vector")
|
6870 |
|
|
(const_string "direct")))
|
6871 |
|
|
(set_attr "amdfam10_decode" "direct")
|
6872 |
|
|
(set_attr "bdver1_decode" "direct")
|
6873 |
|
|
(set_attr "mode" "QI")])
|
6874 |
|
|
|
6875 |
|
|
(define_expand "mul3_highpart"
|
6876 |
|
|
[(parallel [(set (match_operand:SWI48 0 "register_operand" "")
|
6877 |
|
|
(truncate:SWI48
|
6878 |
|
|
(lshiftrt:
|
6879 |
|
|
(mult:
|
6880 |
|
|
(any_extend:
|
6881 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" ""))
|
6882 |
|
|
(any_extend:
|
6883 |
|
|
(match_operand:SWI48 2 "register_operand" "")))
|
6884 |
|
|
(match_dup 4))))
|
6885 |
|
|
(clobber (match_scratch:SWI48 3 ""))
|
6886 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
6887 |
|
|
""
|
6888 |
|
|
"operands[4] = GEN_INT (GET_MODE_BITSIZE (mode));")
|
6889 |
|
|
|
6890 |
|
|
(define_insn "*muldi3_highpart_1"
|
6891 |
|
|
[(set (match_operand:DI 0 "register_operand" "=d")
|
6892 |
|
|
(truncate:DI
|
6893 |
|
|
(lshiftrt:TI
|
6894 |
|
|
(mult:TI
|
6895 |
|
|
(any_extend:TI
|
6896 |
|
|
(match_operand:DI 1 "nonimmediate_operand" "%a"))
|
6897 |
|
|
(any_extend:TI
|
6898 |
|
|
(match_operand:DI 2 "nonimmediate_operand" "rm")))
|
6899 |
|
|
(const_int 64))))
|
6900 |
|
|
(clobber (match_scratch:DI 3 "=1"))
|
6901 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6902 |
|
|
"TARGET_64BIT
|
6903 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6904 |
|
|
"mul{q}\t%2"
|
6905 |
|
|
[(set_attr "type" "imul")
|
6906 |
|
|
(set_attr "length_immediate" "0")
|
6907 |
|
|
(set (attr "athlon_decode")
|
6908 |
|
|
(if_then_else (eq_attr "cpu" "athlon")
|
6909 |
|
|
(const_string "vector")
|
6910 |
|
|
(const_string "double")))
|
6911 |
|
|
(set_attr "amdfam10_decode" "double")
|
6912 |
|
|
(set_attr "bdver1_decode" "direct")
|
6913 |
|
|
(set_attr "mode" "DI")])
|
6914 |
|
|
|
6915 |
|
|
(define_insn "*mulsi3_highpart_1"
|
6916 |
|
|
[(set (match_operand:SI 0 "register_operand" "=d")
|
6917 |
|
|
(truncate:SI
|
6918 |
|
|
(lshiftrt:DI
|
6919 |
|
|
(mult:DI
|
6920 |
|
|
(any_extend:DI
|
6921 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "%a"))
|
6922 |
|
|
(any_extend:DI
|
6923 |
|
|
(match_operand:SI 2 "nonimmediate_operand" "rm")))
|
6924 |
|
|
(const_int 32))))
|
6925 |
|
|
(clobber (match_scratch:SI 3 "=1"))
|
6926 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6927 |
|
|
"!(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6928 |
|
|
"mul{l}\t%2"
|
6929 |
|
|
[(set_attr "type" "imul")
|
6930 |
|
|
(set_attr "length_immediate" "0")
|
6931 |
|
|
(set (attr "athlon_decode")
|
6932 |
|
|
(if_then_else (eq_attr "cpu" "athlon")
|
6933 |
|
|
(const_string "vector")
|
6934 |
|
|
(const_string "double")))
|
6935 |
|
|
(set_attr "amdfam10_decode" "double")
|
6936 |
|
|
(set_attr "bdver1_decode" "direct")
|
6937 |
|
|
(set_attr "mode" "SI")])
|
6938 |
|
|
|
6939 |
|
|
(define_insn "*mulsi3_highpart_zext"
|
6940 |
|
|
[(set (match_operand:DI 0 "register_operand" "=d")
|
6941 |
|
|
(zero_extend:DI (truncate:SI
|
6942 |
|
|
(lshiftrt:DI
|
6943 |
|
|
(mult:DI (any_extend:DI
|
6944 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "%a"))
|
6945 |
|
|
(any_extend:DI
|
6946 |
|
|
(match_operand:SI 2 "nonimmediate_operand" "rm")))
|
6947 |
|
|
(const_int 32)))))
|
6948 |
|
|
(clobber (match_scratch:SI 3 "=1"))
|
6949 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
6950 |
|
|
"TARGET_64BIT
|
6951 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
6952 |
|
|
"mul{l}\t%2"
|
6953 |
|
|
[(set_attr "type" "imul")
|
6954 |
|
|
(set_attr "length_immediate" "0")
|
6955 |
|
|
(set (attr "athlon_decode")
|
6956 |
|
|
(if_then_else (eq_attr "cpu" "athlon")
|
6957 |
|
|
(const_string "vector")
|
6958 |
|
|
(const_string "double")))
|
6959 |
|
|
(set_attr "amdfam10_decode" "double")
|
6960 |
|
|
(set_attr "bdver1_decode" "direct")
|
6961 |
|
|
(set_attr "mode" "SI")])
|
6962 |
|
|
|
6963 |
|
|
;; The patterns that match these are at the end of this file.
|
6964 |
|
|
|
6965 |
|
|
(define_expand "mulxf3"
|
6966 |
|
|
[(set (match_operand:XF 0 "register_operand" "")
|
6967 |
|
|
(mult:XF (match_operand:XF 1 "register_operand" "")
|
6968 |
|
|
(match_operand:XF 2 "register_operand" "")))]
|
6969 |
|
|
"TARGET_80387")
|
6970 |
|
|
|
6971 |
|
|
(define_expand "mul3"
|
6972 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
6973 |
|
|
(mult:MODEF (match_operand:MODEF 1 "register_operand" "")
|
6974 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "")))]
|
6975 |
|
|
"(TARGET_80387 && X87_ENABLE_ARITH (mode))
|
6976 |
|
|
|| (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)")
|
6977 |
|
|
|
6978 |
|
|
;; Divide instructions
|
6979 |
|
|
|
6980 |
|
|
;; The patterns that match these are at the end of this file.
|
6981 |
|
|
|
6982 |
|
|
(define_expand "divxf3"
|
6983 |
|
|
[(set (match_operand:XF 0 "register_operand" "")
|
6984 |
|
|
(div:XF (match_operand:XF 1 "register_operand" "")
|
6985 |
|
|
(match_operand:XF 2 "register_operand" "")))]
|
6986 |
|
|
"TARGET_80387")
|
6987 |
|
|
|
6988 |
|
|
(define_expand "divdf3"
|
6989 |
|
|
[(set (match_operand:DF 0 "register_operand" "")
|
6990 |
|
|
(div:DF (match_operand:DF 1 "register_operand" "")
|
6991 |
|
|
(match_operand:DF 2 "nonimmediate_operand" "")))]
|
6992 |
|
|
"(TARGET_80387 && X87_ENABLE_ARITH (DFmode))
|
6993 |
|
|
|| (TARGET_SSE2 && TARGET_SSE_MATH)")
|
6994 |
|
|
|
6995 |
|
|
(define_expand "divsf3"
|
6996 |
|
|
[(set (match_operand:SF 0 "register_operand" "")
|
6997 |
|
|
(div:SF (match_operand:SF 1 "register_operand" "")
|
6998 |
|
|
(match_operand:SF 2 "nonimmediate_operand" "")))]
|
6999 |
|
|
"(TARGET_80387 && X87_ENABLE_ARITH (SFmode))
|
7000 |
|
|
|| TARGET_SSE_MATH"
|
7001 |
|
|
{
|
7002 |
|
|
if (TARGET_SSE_MATH
|
7003 |
|
|
&& TARGET_RECIP_DIV
|
7004 |
|
|
&& optimize_insn_for_speed_p ()
|
7005 |
|
|
&& flag_finite_math_only && !flag_trapping_math
|
7006 |
|
|
&& flag_unsafe_math_optimizations)
|
7007 |
|
|
{
|
7008 |
|
|
ix86_emit_swdivsf (operands[0], operands[1],
|
7009 |
|
|
operands[2], SFmode);
|
7010 |
|
|
DONE;
|
7011 |
|
|
}
|
7012 |
|
|
})
|
7013 |
|
|
|
7014 |
|
|
;; Divmod instructions.
|
7015 |
|
|
|
7016 |
|
|
(define_expand "divmod4"
|
7017 |
|
|
[(parallel [(set (match_operand:SWIM248 0 "register_operand" "")
|
7018 |
|
|
(div:SWIM248
|
7019 |
|
|
(match_operand:SWIM248 1 "register_operand" "")
|
7020 |
|
|
(match_operand:SWIM248 2 "nonimmediate_operand" "")))
|
7021 |
|
|
(set (match_operand:SWIM248 3 "register_operand" "")
|
7022 |
|
|
(mod:SWIM248 (match_dup 1) (match_dup 2)))
|
7023 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
7024 |
|
|
|
7025 |
|
|
;; Split with 8bit unsigned divide:
|
7026 |
|
|
;; if (dividend an divisor are in [0-255])
|
7027 |
|
|
;; use 8bit unsigned integer divide
|
7028 |
|
|
;; else
|
7029 |
|
|
;; use original integer divide
|
7030 |
|
|
(define_split
|
7031 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
7032 |
|
|
(div:SWI48 (match_operand:SWI48 2 "register_operand" "")
|
7033 |
|
|
(match_operand:SWI48 3 "nonimmediate_operand" "")))
|
7034 |
|
|
(set (match_operand:SWI48 1 "register_operand" "")
|
7035 |
|
|
(mod:SWI48 (match_dup 2) (match_dup 3)))
|
7036 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7037 |
|
|
"TARGET_USE_8BIT_IDIV
|
7038 |
|
|
&& TARGET_QIMODE_MATH
|
7039 |
|
|
&& can_create_pseudo_p ()
|
7040 |
|
|
&& !optimize_insn_for_size_p ()"
|
7041 |
|
|
[(const_int 0)]
|
7042 |
|
|
"ix86_split_idivmod (mode, operands, true); DONE;")
|
7043 |
|
|
|
7044 |
|
|
(define_insn_and_split "divmod4_1"
|
7045 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=a")
|
7046 |
|
|
(div:SWI48 (match_operand:SWI48 2 "register_operand" "0")
|
7047 |
|
|
(match_operand:SWI48 3 "nonimmediate_operand" "rm")))
|
7048 |
|
|
(set (match_operand:SWI48 1 "register_operand" "=&d")
|
7049 |
|
|
(mod:SWI48 (match_dup 2) (match_dup 3)))
|
7050 |
|
|
(unspec [(const_int 0)] UNSPEC_DIV_ALREADY_SPLIT)
|
7051 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7052 |
|
|
""
|
7053 |
|
|
"#"
|
7054 |
|
|
"reload_completed"
|
7055 |
|
|
[(parallel [(set (match_dup 1)
|
7056 |
|
|
(ashiftrt:SWI48 (match_dup 4) (match_dup 5)))
|
7057 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
7058 |
|
|
(parallel [(set (match_dup 0)
|
7059 |
|
|
(div:SWI48 (match_dup 2) (match_dup 3)))
|
7060 |
|
|
(set (match_dup 1)
|
7061 |
|
|
(mod:SWI48 (match_dup 2) (match_dup 3)))
|
7062 |
|
|
(use (match_dup 1))
|
7063 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
7064 |
|
|
{
|
7065 |
|
|
operands[5] = GEN_INT (GET_MODE_BITSIZE (mode)-1);
|
7066 |
|
|
|
7067 |
|
|
if (optimize_function_for_size_p (cfun) || TARGET_USE_CLTD)
|
7068 |
|
|
operands[4] = operands[2];
|
7069 |
|
|
else
|
7070 |
|
|
{
|
7071 |
|
|
/* Avoid use of cltd in favor of a mov+shift. */
|
7072 |
|
|
emit_move_insn (operands[1], operands[2]);
|
7073 |
|
|
operands[4] = operands[1];
|
7074 |
|
|
}
|
7075 |
|
|
}
|
7076 |
|
|
[(set_attr "type" "multi")
|
7077 |
|
|
(set_attr "mode" "")])
|
7078 |
|
|
|
7079 |
|
|
(define_insn_and_split "*divmod4"
|
7080 |
|
|
[(set (match_operand:SWIM248 0 "register_operand" "=a")
|
7081 |
|
|
(div:SWIM248 (match_operand:SWIM248 2 "register_operand" "0")
|
7082 |
|
|
(match_operand:SWIM248 3 "nonimmediate_operand" "rm")))
|
7083 |
|
|
(set (match_operand:SWIM248 1 "register_operand" "=&d")
|
7084 |
|
|
(mod:SWIM248 (match_dup 2) (match_dup 3)))
|
7085 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7086 |
|
|
""
|
7087 |
|
|
"#"
|
7088 |
|
|
"reload_completed"
|
7089 |
|
|
[(parallel [(set (match_dup 1)
|
7090 |
|
|
(ashiftrt:SWIM248 (match_dup 4) (match_dup 5)))
|
7091 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
7092 |
|
|
(parallel [(set (match_dup 0)
|
7093 |
|
|
(div:SWIM248 (match_dup 2) (match_dup 3)))
|
7094 |
|
|
(set (match_dup 1)
|
7095 |
|
|
(mod:SWIM248 (match_dup 2) (match_dup 3)))
|
7096 |
|
|
(use (match_dup 1))
|
7097 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
7098 |
|
|
{
|
7099 |
|
|
operands[5] = GEN_INT (GET_MODE_BITSIZE (mode)-1);
|
7100 |
|
|
|
7101 |
|
|
if (mode != HImode
|
7102 |
|
|
&& (optimize_function_for_size_p (cfun) || TARGET_USE_CLTD))
|
7103 |
|
|
operands[4] = operands[2];
|
7104 |
|
|
else
|
7105 |
|
|
{
|
7106 |
|
|
/* Avoid use of cltd in favor of a mov+shift. */
|
7107 |
|
|
emit_move_insn (operands[1], operands[2]);
|
7108 |
|
|
operands[4] = operands[1];
|
7109 |
|
|
}
|
7110 |
|
|
}
|
7111 |
|
|
[(set_attr "type" "multi")
|
7112 |
|
|
(set_attr "mode" "")])
|
7113 |
|
|
|
7114 |
|
|
(define_insn "*divmod4_noext"
|
7115 |
|
|
[(set (match_operand:SWIM248 0 "register_operand" "=a")
|
7116 |
|
|
(div:SWIM248 (match_operand:SWIM248 2 "register_operand" "0")
|
7117 |
|
|
(match_operand:SWIM248 3 "nonimmediate_operand" "rm")))
|
7118 |
|
|
(set (match_operand:SWIM248 1 "register_operand" "=d")
|
7119 |
|
|
(mod:SWIM248 (match_dup 2) (match_dup 3)))
|
7120 |
|
|
(use (match_operand:SWIM248 4 "register_operand" "1"))
|
7121 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7122 |
|
|
""
|
7123 |
|
|
"idiv{}\t%3"
|
7124 |
|
|
[(set_attr "type" "idiv")
|
7125 |
|
|
(set_attr "mode" "")])
|
7126 |
|
|
|
7127 |
|
|
(define_expand "divmodqi4"
|
7128 |
|
|
[(parallel [(set (match_operand:QI 0 "register_operand" "")
|
7129 |
|
|
(div:QI
|
7130 |
|
|
(match_operand:QI 1 "register_operand" "")
|
7131 |
|
|
(match_operand:QI 2 "nonimmediate_operand" "")))
|
7132 |
|
|
(set (match_operand:QI 3 "register_operand" "")
|
7133 |
|
|
(mod:QI (match_dup 1) (match_dup 2)))
|
7134 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
7135 |
|
|
"TARGET_QIMODE_MATH"
|
7136 |
|
|
{
|
7137 |
|
|
rtx div, mod, insn;
|
7138 |
|
|
rtx tmp0, tmp1;
|
7139 |
|
|
|
7140 |
|
|
tmp0 = gen_reg_rtx (HImode);
|
7141 |
|
|
tmp1 = gen_reg_rtx (HImode);
|
7142 |
|
|
|
7143 |
|
|
/* Extend operands[1] to HImode. Generate 8bit divide. Result is
|
7144 |
|
|
in AX. */
|
7145 |
|
|
emit_insn (gen_extendqihi2 (tmp1, operands[1]));
|
7146 |
|
|
emit_insn (gen_divmodhiqi3 (tmp0, tmp1, operands[2]));
|
7147 |
|
|
|
7148 |
|
|
/* Extract remainder from AH. */
|
7149 |
|
|
tmp1 = gen_rtx_SIGN_EXTRACT (QImode, tmp0, GEN_INT (8), GEN_INT (8));
|
7150 |
|
|
insn = emit_move_insn (operands[3], tmp1);
|
7151 |
|
|
|
7152 |
|
|
mod = gen_rtx_MOD (QImode, operands[1], operands[2]);
|
7153 |
|
|
set_unique_reg_note (insn, REG_EQUAL, mod);
|
7154 |
|
|
|
7155 |
|
|
/* Extract quotient from AL. */
|
7156 |
|
|
insn = emit_move_insn (operands[0], gen_lowpart (QImode, tmp0));
|
7157 |
|
|
|
7158 |
|
|
div = gen_rtx_DIV (QImode, operands[1], operands[2]);
|
7159 |
|
|
set_unique_reg_note (insn, REG_EQUAL, div);
|
7160 |
|
|
|
7161 |
|
|
DONE;
|
7162 |
|
|
})
|
7163 |
|
|
|
7164 |
|
|
;; Divide AX by r/m8, with result stored in
|
7165 |
|
|
;; AL <- Quotient
|
7166 |
|
|
;; AH <- Remainder
|
7167 |
|
|
;; Change div/mod to HImode and extend the second argument to HImode
|
7168 |
|
|
;; so that mode of div/mod matches with mode of arguments. Otherwise
|
7169 |
|
|
;; combine may fail.
|
7170 |
|
|
(define_insn "divmodhiqi3"
|
7171 |
|
|
[(set (match_operand:HI 0 "register_operand" "=a")
|
7172 |
|
|
(ior:HI
|
7173 |
|
|
(ashift:HI
|
7174 |
|
|
(zero_extend:HI
|
7175 |
|
|
(truncate:QI
|
7176 |
|
|
(mod:HI (match_operand:HI 1 "register_operand" "0")
|
7177 |
|
|
(sign_extend:HI
|
7178 |
|
|
(match_operand:QI 2 "nonimmediate_operand" "qm")))))
|
7179 |
|
|
(const_int 8))
|
7180 |
|
|
(zero_extend:HI
|
7181 |
|
|
(truncate:QI
|
7182 |
|
|
(div:HI (match_dup 1) (sign_extend:HI (match_dup 2)))))))
|
7183 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7184 |
|
|
"TARGET_QIMODE_MATH"
|
7185 |
|
|
"idiv{b}\t%2"
|
7186 |
|
|
[(set_attr "type" "idiv")
|
7187 |
|
|
(set_attr "mode" "QI")])
|
7188 |
|
|
|
7189 |
|
|
(define_expand "udivmod4"
|
7190 |
|
|
[(parallel [(set (match_operand:SWIM248 0 "register_operand" "")
|
7191 |
|
|
(udiv:SWIM248
|
7192 |
|
|
(match_operand:SWIM248 1 "register_operand" "")
|
7193 |
|
|
(match_operand:SWIM248 2 "nonimmediate_operand" "")))
|
7194 |
|
|
(set (match_operand:SWIM248 3 "register_operand" "")
|
7195 |
|
|
(umod:SWIM248 (match_dup 1) (match_dup 2)))
|
7196 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
7197 |
|
|
|
7198 |
|
|
;; Split with 8bit unsigned divide:
|
7199 |
|
|
;; if (dividend an divisor are in [0-255])
|
7200 |
|
|
;; use 8bit unsigned integer divide
|
7201 |
|
|
;; else
|
7202 |
|
|
;; use original integer divide
|
7203 |
|
|
(define_split
|
7204 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
7205 |
|
|
(udiv:SWI48 (match_operand:SWI48 2 "register_operand" "")
|
7206 |
|
|
(match_operand:SWI48 3 "nonimmediate_operand" "")))
|
7207 |
|
|
(set (match_operand:SWI48 1 "register_operand" "")
|
7208 |
|
|
(umod:SWI48 (match_dup 2) (match_dup 3)))
|
7209 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7210 |
|
|
"TARGET_USE_8BIT_IDIV
|
7211 |
|
|
&& TARGET_QIMODE_MATH
|
7212 |
|
|
&& can_create_pseudo_p ()
|
7213 |
|
|
&& !optimize_insn_for_size_p ()"
|
7214 |
|
|
[(const_int 0)]
|
7215 |
|
|
"ix86_split_idivmod (mode, operands, false); DONE;")
|
7216 |
|
|
|
7217 |
|
|
(define_insn_and_split "udivmod4_1"
|
7218 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=a")
|
7219 |
|
|
(udiv:SWI48 (match_operand:SWI48 2 "register_operand" "0")
|
7220 |
|
|
(match_operand:SWI48 3 "nonimmediate_operand" "rm")))
|
7221 |
|
|
(set (match_operand:SWI48 1 "register_operand" "=&d")
|
7222 |
|
|
(umod:SWI48 (match_dup 2) (match_dup 3)))
|
7223 |
|
|
(unspec [(const_int 0)] UNSPEC_DIV_ALREADY_SPLIT)
|
7224 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7225 |
|
|
""
|
7226 |
|
|
"#"
|
7227 |
|
|
"reload_completed"
|
7228 |
|
|
[(set (match_dup 1) (const_int 0))
|
7229 |
|
|
(parallel [(set (match_dup 0)
|
7230 |
|
|
(udiv:SWI48 (match_dup 2) (match_dup 3)))
|
7231 |
|
|
(set (match_dup 1)
|
7232 |
|
|
(umod:SWI48 (match_dup 2) (match_dup 3)))
|
7233 |
|
|
(use (match_dup 1))
|
7234 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
7235 |
|
|
""
|
7236 |
|
|
[(set_attr "type" "multi")
|
7237 |
|
|
(set_attr "mode" "")])
|
7238 |
|
|
|
7239 |
|
|
(define_insn_and_split "*udivmod4"
|
7240 |
|
|
[(set (match_operand:SWIM248 0 "register_operand" "=a")
|
7241 |
|
|
(udiv:SWIM248 (match_operand:SWIM248 2 "register_operand" "0")
|
7242 |
|
|
(match_operand:SWIM248 3 "nonimmediate_operand" "rm")))
|
7243 |
|
|
(set (match_operand:SWIM248 1 "register_operand" "=&d")
|
7244 |
|
|
(umod:SWIM248 (match_dup 2) (match_dup 3)))
|
7245 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7246 |
|
|
""
|
7247 |
|
|
"#"
|
7248 |
|
|
"reload_completed"
|
7249 |
|
|
[(set (match_dup 1) (const_int 0))
|
7250 |
|
|
(parallel [(set (match_dup 0)
|
7251 |
|
|
(udiv:SWIM248 (match_dup 2) (match_dup 3)))
|
7252 |
|
|
(set (match_dup 1)
|
7253 |
|
|
(umod:SWIM248 (match_dup 2) (match_dup 3)))
|
7254 |
|
|
(use (match_dup 1))
|
7255 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
7256 |
|
|
""
|
7257 |
|
|
[(set_attr "type" "multi")
|
7258 |
|
|
(set_attr "mode" "")])
|
7259 |
|
|
|
7260 |
|
|
(define_insn "*udivmod4_noext"
|
7261 |
|
|
[(set (match_operand:SWIM248 0 "register_operand" "=a")
|
7262 |
|
|
(udiv:SWIM248 (match_operand:SWIM248 2 "register_operand" "0")
|
7263 |
|
|
(match_operand:SWIM248 3 "nonimmediate_operand" "rm")))
|
7264 |
|
|
(set (match_operand:SWIM248 1 "register_operand" "=d")
|
7265 |
|
|
(umod:SWIM248 (match_dup 2) (match_dup 3)))
|
7266 |
|
|
(use (match_operand:SWIM248 4 "register_operand" "1"))
|
7267 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7268 |
|
|
""
|
7269 |
|
|
"div{}\t%3"
|
7270 |
|
|
[(set_attr "type" "idiv")
|
7271 |
|
|
(set_attr "mode" "")])
|
7272 |
|
|
|
7273 |
|
|
(define_expand "udivmodqi4"
|
7274 |
|
|
[(parallel [(set (match_operand:QI 0 "register_operand" "")
|
7275 |
|
|
(udiv:QI
|
7276 |
|
|
(match_operand:QI 1 "register_operand" "")
|
7277 |
|
|
(match_operand:QI 2 "nonimmediate_operand" "")))
|
7278 |
|
|
(set (match_operand:QI 3 "register_operand" "")
|
7279 |
|
|
(umod:QI (match_dup 1) (match_dup 2)))
|
7280 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
7281 |
|
|
"TARGET_QIMODE_MATH"
|
7282 |
|
|
{
|
7283 |
|
|
rtx div, mod, insn;
|
7284 |
|
|
rtx tmp0, tmp1;
|
7285 |
|
|
|
7286 |
|
|
tmp0 = gen_reg_rtx (HImode);
|
7287 |
|
|
tmp1 = gen_reg_rtx (HImode);
|
7288 |
|
|
|
7289 |
|
|
/* Extend operands[1] to HImode. Generate 8bit divide. Result is
|
7290 |
|
|
in AX. */
|
7291 |
|
|
emit_insn (gen_zero_extendqihi2 (tmp1, operands[1]));
|
7292 |
|
|
emit_insn (gen_udivmodhiqi3 (tmp0, tmp1, operands[2]));
|
7293 |
|
|
|
7294 |
|
|
/* Extract remainder from AH. */
|
7295 |
|
|
tmp1 = gen_rtx_ZERO_EXTRACT (SImode, tmp0, GEN_INT (8), GEN_INT (8));
|
7296 |
|
|
tmp1 = simplify_gen_subreg (QImode, tmp1, SImode, 0);
|
7297 |
|
|
insn = emit_move_insn (operands[3], tmp1);
|
7298 |
|
|
|
7299 |
|
|
mod = gen_rtx_UMOD (QImode, operands[1], operands[2]);
|
7300 |
|
|
set_unique_reg_note (insn, REG_EQUAL, mod);
|
7301 |
|
|
|
7302 |
|
|
/* Extract quotient from AL. */
|
7303 |
|
|
insn = emit_move_insn (operands[0], gen_lowpart (QImode, tmp0));
|
7304 |
|
|
|
7305 |
|
|
div = gen_rtx_UDIV (QImode, operands[1], operands[2]);
|
7306 |
|
|
set_unique_reg_note (insn, REG_EQUAL, div);
|
7307 |
|
|
|
7308 |
|
|
DONE;
|
7309 |
|
|
})
|
7310 |
|
|
|
7311 |
|
|
(define_insn "udivmodhiqi3"
|
7312 |
|
|
[(set (match_operand:HI 0 "register_operand" "=a")
|
7313 |
|
|
(ior:HI
|
7314 |
|
|
(ashift:HI
|
7315 |
|
|
(zero_extend:HI
|
7316 |
|
|
(truncate:QI
|
7317 |
|
|
(mod:HI (match_operand:HI 1 "register_operand" "0")
|
7318 |
|
|
(zero_extend:HI
|
7319 |
|
|
(match_operand:QI 2 "nonimmediate_operand" "qm")))))
|
7320 |
|
|
(const_int 8))
|
7321 |
|
|
(zero_extend:HI
|
7322 |
|
|
(truncate:QI
|
7323 |
|
|
(div:HI (match_dup 1) (zero_extend:HI (match_dup 2)))))))
|
7324 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7325 |
|
|
"TARGET_QIMODE_MATH"
|
7326 |
|
|
"div{b}\t%2"
|
7327 |
|
|
[(set_attr "type" "idiv")
|
7328 |
|
|
(set_attr "mode" "QI")])
|
7329 |
|
|
|
7330 |
|
|
;; We cannot use div/idiv for double division, because it causes
|
7331 |
|
|
;; "division by zero" on the overflow and that's not what we expect
|
7332 |
|
|
;; from truncate. Because true (non truncating) double division is
|
7333 |
|
|
;; never generated, we can't create this insn anyway.
|
7334 |
|
|
;
|
7335 |
|
|
;(define_insn ""
|
7336 |
|
|
; [(set (match_operand:SI 0 "register_operand" "=a")
|
7337 |
|
|
; (truncate:SI
|
7338 |
|
|
; (udiv:DI (match_operand:DI 1 "register_operand" "A")
|
7339 |
|
|
; (zero_extend:DI
|
7340 |
|
|
; (match_operand:SI 2 "nonimmediate_operand" "rm")))))
|
7341 |
|
|
; (set (match_operand:SI 3 "register_operand" "=d")
|
7342 |
|
|
; (truncate:SI
|
7343 |
|
|
; (umod:DI (match_dup 1) (zero_extend:DI (match_dup 2)))))
|
7344 |
|
|
; (clobber (reg:CC FLAGS_REG))]
|
7345 |
|
|
; ""
|
7346 |
|
|
; "div{l}\t{%2, %0|%0, %2}"
|
7347 |
|
|
; [(set_attr "type" "idiv")])
|
7348 |
|
|
|
7349 |
|
|
;;- Logical AND instructions
|
7350 |
|
|
|
7351 |
|
|
;; On Pentium, "test imm, reg" is pairable only with eax, ax, and al.
|
7352 |
|
|
;; Note that this excludes ah.
|
7353 |
|
|
|
7354 |
|
|
(define_expand "testsi_ccno_1"
|
7355 |
|
|
[(set (reg:CCNO FLAGS_REG)
|
7356 |
|
|
(compare:CCNO
|
7357 |
|
|
(and:SI (match_operand:SI 0 "nonimmediate_operand" "")
|
7358 |
|
|
(match_operand:SI 1 "x86_64_nonmemory_operand" ""))
|
7359 |
|
|
(const_int 0)))])
|
7360 |
|
|
|
7361 |
|
|
(define_expand "testqi_ccz_1"
|
7362 |
|
|
[(set (reg:CCZ FLAGS_REG)
|
7363 |
|
|
(compare:CCZ (and:QI (match_operand:QI 0 "nonimmediate_operand" "")
|
7364 |
|
|
(match_operand:QI 1 "nonmemory_operand" ""))
|
7365 |
|
|
(const_int 0)))])
|
7366 |
|
|
|
7367 |
|
|
(define_expand "testdi_ccno_1"
|
7368 |
|
|
[(set (reg:CCNO FLAGS_REG)
|
7369 |
|
|
(compare:CCNO
|
7370 |
|
|
(and:DI (match_operand:DI 0 "nonimmediate_operand" "")
|
7371 |
|
|
(match_operand:DI 1 "x86_64_szext_general_operand" ""))
|
7372 |
|
|
(const_int 0)))]
|
7373 |
|
|
"TARGET_64BIT && !(MEM_P (operands[0]) && MEM_P (operands[1]))")
|
7374 |
|
|
|
7375 |
|
|
(define_insn "*testdi_1"
|
7376 |
|
|
[(set (reg FLAGS_REG)
|
7377 |
|
|
(compare
|
7378 |
|
|
(and:DI
|
7379 |
|
|
(match_operand:DI 0 "nonimmediate_operand" "%!*a,r,!*a,r,rm")
|
7380 |
|
|
(match_operand:DI 1 "x86_64_szext_general_operand" "Z,Z,e,e,re"))
|
7381 |
|
|
(const_int 0)))]
|
7382 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCNOmode)
|
7383 |
|
|
&& !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
7384 |
|
|
"@
|
7385 |
|
|
test{l}\t{%k1, %k0|%k0, %k1}
|
7386 |
|
|
test{l}\t{%k1, %k0|%k0, %k1}
|
7387 |
|
|
test{q}\t{%1, %0|%0, %1}
|
7388 |
|
|
test{q}\t{%1, %0|%0, %1}
|
7389 |
|
|
test{q}\t{%1, %0|%0, %1}"
|
7390 |
|
|
[(set_attr "type" "test")
|
7391 |
|
|
(set_attr "modrm" "0,1,0,1,1")
|
7392 |
|
|
(set_attr "mode" "SI,SI,DI,DI,DI")])
|
7393 |
|
|
|
7394 |
|
|
(define_insn "*testqi_1_maybe_si"
|
7395 |
|
|
[(set (reg FLAGS_REG)
|
7396 |
|
|
(compare
|
7397 |
|
|
(and:QI
|
7398 |
|
|
(match_operand:QI 0 "nonimmediate_operand" "%!*a,q,qm,r")
|
7399 |
|
|
(match_operand:QI 1 "general_operand" "n,n,qn,n"))
|
7400 |
|
|
(const_int 0)))]
|
7401 |
|
|
"!(MEM_P (operands[0]) && MEM_P (operands[1]))
|
7402 |
|
|
&& ix86_match_ccmode (insn,
|
7403 |
|
|
CONST_INT_P (operands[1])
|
7404 |
|
|
&& INTVAL (operands[1]) >= 0 ? CCNOmode : CCZmode)"
|
7405 |
|
|
{
|
7406 |
|
|
if (which_alternative == 3)
|
7407 |
|
|
{
|
7408 |
|
|
if (CONST_INT_P (operands[1]) && INTVAL (operands[1]) < 0)
|
7409 |
|
|
operands[1] = GEN_INT (INTVAL (operands[1]) & 0xff);
|
7410 |
|
|
return "test{l}\t{%1, %k0|%k0, %1}";
|
7411 |
|
|
}
|
7412 |
|
|
return "test{b}\t{%1, %0|%0, %1}";
|
7413 |
|
|
}
|
7414 |
|
|
[(set_attr "type" "test")
|
7415 |
|
|
(set_attr "modrm" "0,1,1,1")
|
7416 |
|
|
(set_attr "mode" "QI,QI,QI,SI")
|
7417 |
|
|
(set_attr "pent_pair" "uv,np,uv,np")])
|
7418 |
|
|
|
7419 |
|
|
(define_insn "*test_1"
|
7420 |
|
|
[(set (reg FLAGS_REG)
|
7421 |
|
|
(compare
|
7422 |
|
|
(and:SWI124
|
7423 |
|
|
(match_operand:SWI124 0 "nonimmediate_operand" "%!*a,,m")
|
7424 |
|
|
(match_operand:SWI124 1 "" ",,"))
|
7425 |
|
|
(const_int 0)))]
|
7426 |
|
|
"ix86_match_ccmode (insn, CCNOmode)
|
7427 |
|
|
&& !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
7428 |
|
|
"test{}\t{%1, %0|%0, %1}"
|
7429 |
|
|
[(set_attr "type" "test")
|
7430 |
|
|
(set_attr "modrm" "0,1,1")
|
7431 |
|
|
(set_attr "mode" "")
|
7432 |
|
|
(set_attr "pent_pair" "uv,np,uv")])
|
7433 |
|
|
|
7434 |
|
|
(define_expand "testqi_ext_ccno_0"
|
7435 |
|
|
[(set (reg:CCNO FLAGS_REG)
|
7436 |
|
|
(compare:CCNO
|
7437 |
|
|
(and:SI
|
7438 |
|
|
(zero_extract:SI
|
7439 |
|
|
(match_operand 0 "ext_register_operand" "")
|
7440 |
|
|
(const_int 8)
|
7441 |
|
|
(const_int 8))
|
7442 |
|
|
(match_operand 1 "const_int_operand" ""))
|
7443 |
|
|
(const_int 0)))])
|
7444 |
|
|
|
7445 |
|
|
(define_insn "*testqi_ext_0"
|
7446 |
|
|
[(set (reg FLAGS_REG)
|
7447 |
|
|
(compare
|
7448 |
|
|
(and:SI
|
7449 |
|
|
(zero_extract:SI
|
7450 |
|
|
(match_operand 0 "ext_register_operand" "Q")
|
7451 |
|
|
(const_int 8)
|
7452 |
|
|
(const_int 8))
|
7453 |
|
|
(match_operand 1 "const_int_operand" "n"))
|
7454 |
|
|
(const_int 0)))]
|
7455 |
|
|
"ix86_match_ccmode (insn, CCNOmode)"
|
7456 |
|
|
"test{b}\t{%1, %h0|%h0, %1}"
|
7457 |
|
|
[(set_attr "type" "test")
|
7458 |
|
|
(set_attr "mode" "QI")
|
7459 |
|
|
(set_attr "length_immediate" "1")
|
7460 |
|
|
(set_attr "modrm" "1")
|
7461 |
|
|
(set_attr "pent_pair" "np")])
|
7462 |
|
|
|
7463 |
|
|
(define_insn "*testqi_ext_1_rex64"
|
7464 |
|
|
[(set (reg FLAGS_REG)
|
7465 |
|
|
(compare
|
7466 |
|
|
(and:SI
|
7467 |
|
|
(zero_extract:SI
|
7468 |
|
|
(match_operand 0 "ext_register_operand" "Q")
|
7469 |
|
|
(const_int 8)
|
7470 |
|
|
(const_int 8))
|
7471 |
|
|
(zero_extend:SI
|
7472 |
|
|
(match_operand:QI 1 "register_operand" "Q")))
|
7473 |
|
|
(const_int 0)))]
|
7474 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCNOmode)"
|
7475 |
|
|
"test{b}\t{%1, %h0|%h0, %1}"
|
7476 |
|
|
[(set_attr "type" "test")
|
7477 |
|
|
(set_attr "mode" "QI")])
|
7478 |
|
|
|
7479 |
|
|
(define_insn "*testqi_ext_1"
|
7480 |
|
|
[(set (reg FLAGS_REG)
|
7481 |
|
|
(compare
|
7482 |
|
|
(and:SI
|
7483 |
|
|
(zero_extract:SI
|
7484 |
|
|
(match_operand 0 "ext_register_operand" "Q")
|
7485 |
|
|
(const_int 8)
|
7486 |
|
|
(const_int 8))
|
7487 |
|
|
(zero_extend:SI
|
7488 |
|
|
(match_operand:QI 1 "general_operand" "Qm")))
|
7489 |
|
|
(const_int 0)))]
|
7490 |
|
|
"!TARGET_64BIT && ix86_match_ccmode (insn, CCNOmode)"
|
7491 |
|
|
"test{b}\t{%1, %h0|%h0, %1}"
|
7492 |
|
|
[(set_attr "type" "test")
|
7493 |
|
|
(set_attr "mode" "QI")])
|
7494 |
|
|
|
7495 |
|
|
(define_insn "*testqi_ext_2"
|
7496 |
|
|
[(set (reg FLAGS_REG)
|
7497 |
|
|
(compare
|
7498 |
|
|
(and:SI
|
7499 |
|
|
(zero_extract:SI
|
7500 |
|
|
(match_operand 0 "ext_register_operand" "Q")
|
7501 |
|
|
(const_int 8)
|
7502 |
|
|
(const_int 8))
|
7503 |
|
|
(zero_extract:SI
|
7504 |
|
|
(match_operand 1 "ext_register_operand" "Q")
|
7505 |
|
|
(const_int 8)
|
7506 |
|
|
(const_int 8)))
|
7507 |
|
|
(const_int 0)))]
|
7508 |
|
|
"ix86_match_ccmode (insn, CCNOmode)"
|
7509 |
|
|
"test{b}\t{%h1, %h0|%h0, %h1}"
|
7510 |
|
|
[(set_attr "type" "test")
|
7511 |
|
|
(set_attr "mode" "QI")])
|
7512 |
|
|
|
7513 |
|
|
(define_insn "*testqi_ext_3_rex64"
|
7514 |
|
|
[(set (reg FLAGS_REG)
|
7515 |
|
|
(compare (zero_extract:DI
|
7516 |
|
|
(match_operand 0 "nonimmediate_operand" "rm")
|
7517 |
|
|
(match_operand:DI 1 "const_int_operand" "")
|
7518 |
|
|
(match_operand:DI 2 "const_int_operand" ""))
|
7519 |
|
|
(const_int 0)))]
|
7520 |
|
|
"TARGET_64BIT
|
7521 |
|
|
&& ix86_match_ccmode (insn, CCNOmode)
|
7522 |
|
|
&& INTVAL (operands[1]) > 0
|
7523 |
|
|
&& INTVAL (operands[2]) >= 0
|
7524 |
|
|
/* Ensure that resulting mask is zero or sign extended operand. */
|
7525 |
|
|
&& (INTVAL (operands[1]) + INTVAL (operands[2]) <= 32
|
7526 |
|
|
|| (INTVAL (operands[1]) + INTVAL (operands[2]) == 64
|
7527 |
|
|
&& INTVAL (operands[1]) > 32))
|
7528 |
|
|
&& (GET_MODE (operands[0]) == SImode
|
7529 |
|
|
|| GET_MODE (operands[0]) == DImode
|
7530 |
|
|
|| GET_MODE (operands[0]) == HImode
|
7531 |
|
|
|| GET_MODE (operands[0]) == QImode)"
|
7532 |
|
|
"#")
|
7533 |
|
|
|
7534 |
|
|
;; Combine likes to form bit extractions for some tests. Humor it.
|
7535 |
|
|
(define_insn "*testqi_ext_3"
|
7536 |
|
|
[(set (reg FLAGS_REG)
|
7537 |
|
|
(compare (zero_extract:SI
|
7538 |
|
|
(match_operand 0 "nonimmediate_operand" "rm")
|
7539 |
|
|
(match_operand:SI 1 "const_int_operand" "")
|
7540 |
|
|
(match_operand:SI 2 "const_int_operand" ""))
|
7541 |
|
|
(const_int 0)))]
|
7542 |
|
|
"ix86_match_ccmode (insn, CCNOmode)
|
7543 |
|
|
&& INTVAL (operands[1]) > 0
|
7544 |
|
|
&& INTVAL (operands[2]) >= 0
|
7545 |
|
|
&& INTVAL (operands[1]) + INTVAL (operands[2]) <= 32
|
7546 |
|
|
&& (GET_MODE (operands[0]) == SImode
|
7547 |
|
|
|| (TARGET_64BIT && GET_MODE (operands[0]) == DImode)
|
7548 |
|
|
|| GET_MODE (operands[0]) == HImode
|
7549 |
|
|
|| GET_MODE (operands[0]) == QImode)"
|
7550 |
|
|
"#")
|
7551 |
|
|
|
7552 |
|
|
(define_split
|
7553 |
|
|
[(set (match_operand 0 "flags_reg_operand" "")
|
7554 |
|
|
(match_operator 1 "compare_operator"
|
7555 |
|
|
[(zero_extract
|
7556 |
|
|
(match_operand 2 "nonimmediate_operand" "")
|
7557 |
|
|
(match_operand 3 "const_int_operand" "")
|
7558 |
|
|
(match_operand 4 "const_int_operand" ""))
|
7559 |
|
|
(const_int 0)]))]
|
7560 |
|
|
"ix86_match_ccmode (insn, CCNOmode)"
|
7561 |
|
|
[(set (match_dup 0) (match_op_dup 1 [(match_dup 2) (const_int 0)]))]
|
7562 |
|
|
{
|
7563 |
|
|
rtx val = operands[2];
|
7564 |
|
|
HOST_WIDE_INT len = INTVAL (operands[3]);
|
7565 |
|
|
HOST_WIDE_INT pos = INTVAL (operands[4]);
|
7566 |
|
|
HOST_WIDE_INT mask;
|
7567 |
|
|
enum machine_mode mode, submode;
|
7568 |
|
|
|
7569 |
|
|
mode = GET_MODE (val);
|
7570 |
|
|
if (MEM_P (val))
|
7571 |
|
|
{
|
7572 |
|
|
/* ??? Combine likes to put non-volatile mem extractions in QImode
|
7573 |
|
|
no matter the size of the test. So find a mode that works. */
|
7574 |
|
|
if (! MEM_VOLATILE_P (val))
|
7575 |
|
|
{
|
7576 |
|
|
mode = smallest_mode_for_size (pos + len, MODE_INT);
|
7577 |
|
|
val = adjust_address (val, mode, 0);
|
7578 |
|
|
}
|
7579 |
|
|
}
|
7580 |
|
|
else if (GET_CODE (val) == SUBREG
|
7581 |
|
|
&& (submode = GET_MODE (SUBREG_REG (val)),
|
7582 |
|
|
GET_MODE_BITSIZE (mode) > GET_MODE_BITSIZE (submode))
|
7583 |
|
|
&& pos + len <= GET_MODE_BITSIZE (submode)
|
7584 |
|
|
&& GET_MODE_CLASS (submode) == MODE_INT)
|
7585 |
|
|
{
|
7586 |
|
|
/* Narrow a paradoxical subreg to prevent partial register stalls. */
|
7587 |
|
|
mode = submode;
|
7588 |
|
|
val = SUBREG_REG (val);
|
7589 |
|
|
}
|
7590 |
|
|
else if (mode == HImode && pos + len <= 8)
|
7591 |
|
|
{
|
7592 |
|
|
/* Small HImode tests can be converted to QImode. */
|
7593 |
|
|
mode = QImode;
|
7594 |
|
|
val = gen_lowpart (QImode, val);
|
7595 |
|
|
}
|
7596 |
|
|
|
7597 |
|
|
if (len == HOST_BITS_PER_WIDE_INT)
|
7598 |
|
|
mask = -1;
|
7599 |
|
|
else
|
7600 |
|
|
mask = ((HOST_WIDE_INT)1 << len) - 1;
|
7601 |
|
|
mask <<= pos;
|
7602 |
|
|
|
7603 |
|
|
operands[2] = gen_rtx_AND (mode, val, gen_int_mode (mask, mode));
|
7604 |
|
|
})
|
7605 |
|
|
|
7606 |
|
|
;; Convert HImode/SImode test instructions with immediate to QImode ones.
|
7607 |
|
|
;; i386 does not allow to encode test with 8bit sign extended immediate, so
|
7608 |
|
|
;; this is relatively important trick.
|
7609 |
|
|
;; Do the conversion only post-reload to avoid limiting of the register class
|
7610 |
|
|
;; to QI regs.
|
7611 |
|
|
(define_split
|
7612 |
|
|
[(set (match_operand 0 "flags_reg_operand" "")
|
7613 |
|
|
(match_operator 1 "compare_operator"
|
7614 |
|
|
[(and (match_operand 2 "register_operand" "")
|
7615 |
|
|
(match_operand 3 "const_int_operand" ""))
|
7616 |
|
|
(const_int 0)]))]
|
7617 |
|
|
"reload_completed
|
7618 |
|
|
&& QI_REG_P (operands[2])
|
7619 |
|
|
&& GET_MODE (operands[2]) != QImode
|
7620 |
|
|
&& ((ix86_match_ccmode (insn, CCZmode)
|
7621 |
|
|
&& !(INTVAL (operands[3]) & ~(255 << 8)))
|
7622 |
|
|
|| (ix86_match_ccmode (insn, CCNOmode)
|
7623 |
|
|
&& !(INTVAL (operands[3]) & ~(127 << 8))))"
|
7624 |
|
|
[(set (match_dup 0)
|
7625 |
|
|
(match_op_dup 1
|
7626 |
|
|
[(and:SI (zero_extract:SI (match_dup 2) (const_int 8) (const_int 8))
|
7627 |
|
|
(match_dup 3))
|
7628 |
|
|
(const_int 0)]))]
|
7629 |
|
|
{
|
7630 |
|
|
operands[2] = gen_lowpart (SImode, operands[2]);
|
7631 |
|
|
operands[3] = gen_int_mode (INTVAL (operands[3]) >> 8, SImode);
|
7632 |
|
|
})
|
7633 |
|
|
|
7634 |
|
|
(define_split
|
7635 |
|
|
[(set (match_operand 0 "flags_reg_operand" "")
|
7636 |
|
|
(match_operator 1 "compare_operator"
|
7637 |
|
|
[(and (match_operand 2 "nonimmediate_operand" "")
|
7638 |
|
|
(match_operand 3 "const_int_operand" ""))
|
7639 |
|
|
(const_int 0)]))]
|
7640 |
|
|
"reload_completed
|
7641 |
|
|
&& GET_MODE (operands[2]) != QImode
|
7642 |
|
|
&& (!REG_P (operands[2]) || ANY_QI_REG_P (operands[2]))
|
7643 |
|
|
&& ((ix86_match_ccmode (insn, CCZmode)
|
7644 |
|
|
&& !(INTVAL (operands[3]) & ~255))
|
7645 |
|
|
|| (ix86_match_ccmode (insn, CCNOmode)
|
7646 |
|
|
&& !(INTVAL (operands[3]) & ~127)))"
|
7647 |
|
|
[(set (match_dup 0)
|
7648 |
|
|
(match_op_dup 1 [(and:QI (match_dup 2) (match_dup 3))
|
7649 |
|
|
(const_int 0)]))]
|
7650 |
|
|
{
|
7651 |
|
|
operands[2] = gen_lowpart (QImode, operands[2]);
|
7652 |
|
|
operands[3] = gen_lowpart (QImode, operands[3]);
|
7653 |
|
|
})
|
7654 |
|
|
|
7655 |
|
|
;; %%% This used to optimize known byte-wide and operations to memory,
|
7656 |
|
|
;; and sometimes to QImode registers. If this is considered useful,
|
7657 |
|
|
;; it should be done with splitters.
|
7658 |
|
|
|
7659 |
|
|
(define_expand "and3"
|
7660 |
|
|
[(set (match_operand:SWIM 0 "nonimmediate_operand" "")
|
7661 |
|
|
(and:SWIM (match_operand:SWIM 1 "nonimmediate_operand" "")
|
7662 |
|
|
(match_operand:SWIM 2 "" "")))]
|
7663 |
|
|
""
|
7664 |
|
|
"ix86_expand_binary_operator (AND, mode, operands); DONE;")
|
7665 |
|
|
|
7666 |
|
|
(define_insn "*anddi_1"
|
7667 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "=r,rm,r,r")
|
7668 |
|
|
(and:DI
|
7669 |
|
|
(match_operand:DI 1 "nonimmediate_operand" "%0,0,0,qm")
|
7670 |
|
|
(match_operand:DI 2 "x86_64_szext_general_operand" "Z,re,rm,L")))
|
7671 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7672 |
|
|
"TARGET_64BIT && ix86_binary_operator_ok (AND, DImode, operands)"
|
7673 |
|
|
{
|
7674 |
|
|
switch (get_attr_type (insn))
|
7675 |
|
|
{
|
7676 |
|
|
case TYPE_IMOVX:
|
7677 |
|
|
{
|
7678 |
|
|
enum machine_mode mode;
|
7679 |
|
|
|
7680 |
|
|
gcc_assert (CONST_INT_P (operands[2]));
|
7681 |
|
|
if (INTVAL (operands[2]) == (HOST_WIDE_INT) 0xffffffff)
|
7682 |
|
|
mode = SImode;
|
7683 |
|
|
else if (INTVAL (operands[2]) == 0xffff)
|
7684 |
|
|
mode = HImode;
|
7685 |
|
|
else
|
7686 |
|
|
{
|
7687 |
|
|
gcc_assert (INTVAL (operands[2]) == 0xff);
|
7688 |
|
|
mode = QImode;
|
7689 |
|
|
}
|
7690 |
|
|
|
7691 |
|
|
operands[1] = gen_lowpart (mode, operands[1]);
|
7692 |
|
|
if (mode == SImode)
|
7693 |
|
|
return "mov{l}\t{%1, %k0|%k0, %1}";
|
7694 |
|
|
else if (mode == HImode)
|
7695 |
|
|
return "movz{wl|x}\t{%1, %k0|%k0, %1}";
|
7696 |
|
|
else
|
7697 |
|
|
return "movz{bl|x}\t{%1, %k0|%k0, %1}";
|
7698 |
|
|
}
|
7699 |
|
|
|
7700 |
|
|
default:
|
7701 |
|
|
gcc_assert (rtx_equal_p (operands[0], operands[1]));
|
7702 |
|
|
if (get_attr_mode (insn) == MODE_SI)
|
7703 |
|
|
return "and{l}\t{%k2, %k0|%k0, %k2}";
|
7704 |
|
|
else
|
7705 |
|
|
return "and{q}\t{%2, %0|%0, %2}";
|
7706 |
|
|
}
|
7707 |
|
|
}
|
7708 |
|
|
[(set_attr "type" "alu,alu,alu,imovx")
|
7709 |
|
|
(set_attr "length_immediate" "*,*,*,0")
|
7710 |
|
|
(set (attr "prefix_rex")
|
7711 |
|
|
(if_then_else
|
7712 |
|
|
(and (eq_attr "type" "imovx")
|
7713 |
|
|
(and (match_test "INTVAL (operands[2]) == 0xff")
|
7714 |
|
|
(match_operand 1 "ext_QIreg_operand" "")))
|
7715 |
|
|
(const_string "1")
|
7716 |
|
|
(const_string "*")))
|
7717 |
|
|
(set_attr "mode" "SI,DI,DI,SI")])
|
7718 |
|
|
|
7719 |
|
|
(define_insn "*andsi_1"
|
7720 |
|
|
[(set (match_operand:SI 0 "nonimmediate_operand" "=rm,r,r")
|
7721 |
|
|
(and:SI (match_operand:SI 1 "nonimmediate_operand" "%0,0,qm")
|
7722 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "re,rm,L")))
|
7723 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7724 |
|
|
"ix86_binary_operator_ok (AND, SImode, operands)"
|
7725 |
|
|
{
|
7726 |
|
|
switch (get_attr_type (insn))
|
7727 |
|
|
{
|
7728 |
|
|
case TYPE_IMOVX:
|
7729 |
|
|
{
|
7730 |
|
|
enum machine_mode mode;
|
7731 |
|
|
|
7732 |
|
|
gcc_assert (CONST_INT_P (operands[2]));
|
7733 |
|
|
if (INTVAL (operands[2]) == 0xffff)
|
7734 |
|
|
mode = HImode;
|
7735 |
|
|
else
|
7736 |
|
|
{
|
7737 |
|
|
gcc_assert (INTVAL (operands[2]) == 0xff);
|
7738 |
|
|
mode = QImode;
|
7739 |
|
|
}
|
7740 |
|
|
|
7741 |
|
|
operands[1] = gen_lowpart (mode, operands[1]);
|
7742 |
|
|
if (mode == HImode)
|
7743 |
|
|
return "movz{wl|x}\t{%1, %0|%0, %1}";
|
7744 |
|
|
else
|
7745 |
|
|
return "movz{bl|x}\t{%1, %0|%0, %1}";
|
7746 |
|
|
}
|
7747 |
|
|
|
7748 |
|
|
default:
|
7749 |
|
|
gcc_assert (rtx_equal_p (operands[0], operands[1]));
|
7750 |
|
|
return "and{l}\t{%2, %0|%0, %2}";
|
7751 |
|
|
}
|
7752 |
|
|
}
|
7753 |
|
|
[(set_attr "type" "alu,alu,imovx")
|
7754 |
|
|
(set (attr "prefix_rex")
|
7755 |
|
|
(if_then_else
|
7756 |
|
|
(and (eq_attr "type" "imovx")
|
7757 |
|
|
(and (match_test "INTVAL (operands[2]) == 0xff")
|
7758 |
|
|
(match_operand 1 "ext_QIreg_operand" "")))
|
7759 |
|
|
(const_string "1")
|
7760 |
|
|
(const_string "*")))
|
7761 |
|
|
(set_attr "length_immediate" "*,*,0")
|
7762 |
|
|
(set_attr "mode" "SI")])
|
7763 |
|
|
|
7764 |
|
|
;; See comment for addsi_1_zext why we do use nonimmediate_operand
|
7765 |
|
|
(define_insn "*andsi_1_zext"
|
7766 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
7767 |
|
|
(zero_extend:DI
|
7768 |
|
|
(and:SI (match_operand:SI 1 "nonimmediate_operand" "%0")
|
7769 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "rme"))))
|
7770 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7771 |
|
|
"TARGET_64BIT && ix86_binary_operator_ok (AND, SImode, operands)"
|
7772 |
|
|
"and{l}\t{%2, %k0|%k0, %2}"
|
7773 |
|
|
[(set_attr "type" "alu")
|
7774 |
|
|
(set_attr "mode" "SI")])
|
7775 |
|
|
|
7776 |
|
|
(define_insn "*andhi_1"
|
7777 |
|
|
[(set (match_operand:HI 0 "nonimmediate_operand" "=rm,r,r")
|
7778 |
|
|
(and:HI (match_operand:HI 1 "nonimmediate_operand" "%0,0,qm")
|
7779 |
|
|
(match_operand:HI 2 "general_operand" "rn,rm,L")))
|
7780 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7781 |
|
|
"ix86_binary_operator_ok (AND, HImode, operands)"
|
7782 |
|
|
{
|
7783 |
|
|
switch (get_attr_type (insn))
|
7784 |
|
|
{
|
7785 |
|
|
case TYPE_IMOVX:
|
7786 |
|
|
gcc_assert (CONST_INT_P (operands[2]));
|
7787 |
|
|
gcc_assert (INTVAL (operands[2]) == 0xff);
|
7788 |
|
|
return "movz{bl|x}\t{%b1, %k0|%k0, %b1}";
|
7789 |
|
|
|
7790 |
|
|
default:
|
7791 |
|
|
gcc_assert (rtx_equal_p (operands[0], operands[1]));
|
7792 |
|
|
|
7793 |
|
|
return "and{w}\t{%2, %0|%0, %2}";
|
7794 |
|
|
}
|
7795 |
|
|
}
|
7796 |
|
|
[(set_attr "type" "alu,alu,imovx")
|
7797 |
|
|
(set_attr "length_immediate" "*,*,0")
|
7798 |
|
|
(set (attr "prefix_rex")
|
7799 |
|
|
(if_then_else
|
7800 |
|
|
(and (eq_attr "type" "imovx")
|
7801 |
|
|
(match_operand 1 "ext_QIreg_operand" ""))
|
7802 |
|
|
(const_string "1")
|
7803 |
|
|
(const_string "*")))
|
7804 |
|
|
(set_attr "mode" "HI,HI,SI")])
|
7805 |
|
|
|
7806 |
|
|
;; %%% Potential partial reg stall on alternative 2. What to do?
|
7807 |
|
|
(define_insn "*andqi_1"
|
7808 |
|
|
[(set (match_operand:QI 0 "nonimmediate_operand" "=qm,q,r")
|
7809 |
|
|
(and:QI (match_operand:QI 1 "nonimmediate_operand" "%0,0,0")
|
7810 |
|
|
(match_operand:QI 2 "general_operand" "qn,qmn,rn")))
|
7811 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7812 |
|
|
"ix86_binary_operator_ok (AND, QImode, operands)"
|
7813 |
|
|
"@
|
7814 |
|
|
and{b}\t{%2, %0|%0, %2}
|
7815 |
|
|
and{b}\t{%2, %0|%0, %2}
|
7816 |
|
|
and{l}\t{%k2, %k0|%k0, %k2}"
|
7817 |
|
|
[(set_attr "type" "alu")
|
7818 |
|
|
(set_attr "mode" "QI,QI,SI")])
|
7819 |
|
|
|
7820 |
|
|
(define_insn "*andqi_1_slp"
|
7821 |
|
|
[(set (strict_low_part (match_operand:QI 0 "nonimmediate_operand" "+qm,q"))
|
7822 |
|
|
(and:QI (match_dup 0)
|
7823 |
|
|
(match_operand:QI 1 "general_operand" "qn,qmn")))
|
7824 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7825 |
|
|
"(!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
7826 |
|
|
&& !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
7827 |
|
|
"and{b}\t{%1, %0|%0, %1}"
|
7828 |
|
|
[(set_attr "type" "alu1")
|
7829 |
|
|
(set_attr "mode" "QI")])
|
7830 |
|
|
|
7831 |
|
|
(define_split
|
7832 |
|
|
[(set (match_operand 0 "register_operand" "")
|
7833 |
|
|
(and (match_dup 0)
|
7834 |
|
|
(const_int -65536)))
|
7835 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7836 |
|
|
"(TARGET_FAST_PREFIX && !TARGET_PARTIAL_REG_STALL)
|
7837 |
|
|
|| optimize_function_for_size_p (cfun)"
|
7838 |
|
|
[(set (strict_low_part (match_dup 1)) (const_int 0))]
|
7839 |
|
|
"operands[1] = gen_lowpart (HImode, operands[0]);")
|
7840 |
|
|
|
7841 |
|
|
(define_split
|
7842 |
|
|
[(set (match_operand 0 "ext_register_operand" "")
|
7843 |
|
|
(and (match_dup 0)
|
7844 |
|
|
(const_int -256)))
|
7845 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7846 |
|
|
"(!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
7847 |
|
|
&& reload_completed"
|
7848 |
|
|
[(set (strict_low_part (match_dup 1)) (const_int 0))]
|
7849 |
|
|
"operands[1] = gen_lowpart (QImode, operands[0]);")
|
7850 |
|
|
|
7851 |
|
|
(define_split
|
7852 |
|
|
[(set (match_operand 0 "ext_register_operand" "")
|
7853 |
|
|
(and (match_dup 0)
|
7854 |
|
|
(const_int -65281)))
|
7855 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7856 |
|
|
"(!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
7857 |
|
|
&& reload_completed"
|
7858 |
|
|
[(parallel [(set (zero_extract:SI (match_dup 0)
|
7859 |
|
|
(const_int 8)
|
7860 |
|
|
(const_int 8))
|
7861 |
|
|
(xor:SI
|
7862 |
|
|
(zero_extract:SI (match_dup 0)
|
7863 |
|
|
(const_int 8)
|
7864 |
|
|
(const_int 8))
|
7865 |
|
|
(zero_extract:SI (match_dup 0)
|
7866 |
|
|
(const_int 8)
|
7867 |
|
|
(const_int 8))))
|
7868 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
7869 |
|
|
"operands[0] = gen_lowpart (SImode, operands[0]);")
|
7870 |
|
|
|
7871 |
|
|
(define_insn "*anddi_2"
|
7872 |
|
|
[(set (reg FLAGS_REG)
|
7873 |
|
|
(compare
|
7874 |
|
|
(and:DI
|
7875 |
|
|
(match_operand:DI 1 "nonimmediate_operand" "%0,0,0")
|
7876 |
|
|
(match_operand:DI 2 "x86_64_szext_general_operand" "Z,rem,re"))
|
7877 |
|
|
(const_int 0)))
|
7878 |
|
|
(set (match_operand:DI 0 "nonimmediate_operand" "=r,r,rm")
|
7879 |
|
|
(and:DI (match_dup 1) (match_dup 2)))]
|
7880 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCNOmode)
|
7881 |
|
|
&& ix86_binary_operator_ok (AND, DImode, operands)"
|
7882 |
|
|
"@
|
7883 |
|
|
and{l}\t{%k2, %k0|%k0, %k2}
|
7884 |
|
|
and{q}\t{%2, %0|%0, %2}
|
7885 |
|
|
and{q}\t{%2, %0|%0, %2}"
|
7886 |
|
|
[(set_attr "type" "alu")
|
7887 |
|
|
(set_attr "mode" "SI,DI,DI")])
|
7888 |
|
|
|
7889 |
|
|
(define_insn "*andqi_2_maybe_si"
|
7890 |
|
|
[(set (reg FLAGS_REG)
|
7891 |
|
|
(compare (and:QI
|
7892 |
|
|
(match_operand:QI 1 "nonimmediate_operand" "%0,0,0")
|
7893 |
|
|
(match_operand:QI 2 "general_operand" "qmn,qn,n"))
|
7894 |
|
|
(const_int 0)))
|
7895 |
|
|
(set (match_operand:QI 0 "nonimmediate_operand" "=q,qm,*r")
|
7896 |
|
|
(and:QI (match_dup 1) (match_dup 2)))]
|
7897 |
|
|
"ix86_binary_operator_ok (AND, QImode, operands)
|
7898 |
|
|
&& ix86_match_ccmode (insn,
|
7899 |
|
|
CONST_INT_P (operands[2])
|
7900 |
|
|
&& INTVAL (operands[2]) >= 0 ? CCNOmode : CCZmode)"
|
7901 |
|
|
{
|
7902 |
|
|
if (which_alternative == 2)
|
7903 |
|
|
{
|
7904 |
|
|
if (CONST_INT_P (operands[2]) && INTVAL (operands[2]) < 0)
|
7905 |
|
|
operands[2] = GEN_INT (INTVAL (operands[2]) & 0xff);
|
7906 |
|
|
return "and{l}\t{%2, %k0|%k0, %2}";
|
7907 |
|
|
}
|
7908 |
|
|
return "and{b}\t{%2, %0|%0, %2}";
|
7909 |
|
|
}
|
7910 |
|
|
[(set_attr "type" "alu")
|
7911 |
|
|
(set_attr "mode" "QI,QI,SI")])
|
7912 |
|
|
|
7913 |
|
|
(define_insn "*and_2"
|
7914 |
|
|
[(set (reg FLAGS_REG)
|
7915 |
|
|
(compare (and:SWI124
|
7916 |
|
|
(match_operand:SWI124 1 "nonimmediate_operand" "%0,0")
|
7917 |
|
|
(match_operand:SWI124 2 "" ","))
|
7918 |
|
|
(const_int 0)))
|
7919 |
|
|
(set (match_operand:SWI124 0 "nonimmediate_operand" "=,m")
|
7920 |
|
|
(and:SWI124 (match_dup 1) (match_dup 2)))]
|
7921 |
|
|
"ix86_match_ccmode (insn, CCNOmode)
|
7922 |
|
|
&& ix86_binary_operator_ok (AND, mode, operands)"
|
7923 |
|
|
"and{}\t{%2, %0|%0, %2}"
|
7924 |
|
|
[(set_attr "type" "alu")
|
7925 |
|
|
(set_attr "mode" "")])
|
7926 |
|
|
|
7927 |
|
|
;; See comment for addsi_1_zext why we do use nonimmediate_operand
|
7928 |
|
|
(define_insn "*andsi_2_zext"
|
7929 |
|
|
[(set (reg FLAGS_REG)
|
7930 |
|
|
(compare (and:SI
|
7931 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "%0")
|
7932 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "rme"))
|
7933 |
|
|
(const_int 0)))
|
7934 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
7935 |
|
|
(zero_extend:DI (and:SI (match_dup 1) (match_dup 2))))]
|
7936 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCNOmode)
|
7937 |
|
|
&& ix86_binary_operator_ok (AND, SImode, operands)"
|
7938 |
|
|
"and{l}\t{%2, %k0|%k0, %2}"
|
7939 |
|
|
[(set_attr "type" "alu")
|
7940 |
|
|
(set_attr "mode" "SI")])
|
7941 |
|
|
|
7942 |
|
|
(define_insn "*andqi_2_slp"
|
7943 |
|
|
[(set (reg FLAGS_REG)
|
7944 |
|
|
(compare (and:QI
|
7945 |
|
|
(match_operand:QI 0 "nonimmediate_operand" "+q,qm")
|
7946 |
|
|
(match_operand:QI 1 "nonimmediate_operand" "qmn,qn"))
|
7947 |
|
|
(const_int 0)))
|
7948 |
|
|
(set (strict_low_part (match_dup 0))
|
7949 |
|
|
(and:QI (match_dup 0) (match_dup 1)))]
|
7950 |
|
|
"(!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
7951 |
|
|
&& ix86_match_ccmode (insn, CCNOmode)
|
7952 |
|
|
&& !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
7953 |
|
|
"and{b}\t{%1, %0|%0, %1}"
|
7954 |
|
|
[(set_attr "type" "alu1")
|
7955 |
|
|
(set_attr "mode" "QI")])
|
7956 |
|
|
|
7957 |
|
|
;; ??? A bug in recog prevents it from recognizing a const_int as an
|
7958 |
|
|
;; operand to zero_extend in andqi_ext_1. It was checking explicitly
|
7959 |
|
|
;; for a QImode operand, which of course failed.
|
7960 |
|
|
(define_insn "andqi_ext_0"
|
7961 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
7962 |
|
|
(const_int 8)
|
7963 |
|
|
(const_int 8))
|
7964 |
|
|
(and:SI
|
7965 |
|
|
(zero_extract:SI
|
7966 |
|
|
(match_operand 1 "ext_register_operand" "0")
|
7967 |
|
|
(const_int 8)
|
7968 |
|
|
(const_int 8))
|
7969 |
|
|
(match_operand 2 "const_int_operand" "n")))
|
7970 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
7971 |
|
|
""
|
7972 |
|
|
"and{b}\t{%2, %h0|%h0, %2}"
|
7973 |
|
|
[(set_attr "type" "alu")
|
7974 |
|
|
(set_attr "length_immediate" "1")
|
7975 |
|
|
(set_attr "modrm" "1")
|
7976 |
|
|
(set_attr "mode" "QI")])
|
7977 |
|
|
|
7978 |
|
|
;; Generated by peephole translating test to and. This shows up
|
7979 |
|
|
;; often in fp comparisons.
|
7980 |
|
|
(define_insn "*andqi_ext_0_cc"
|
7981 |
|
|
[(set (reg FLAGS_REG)
|
7982 |
|
|
(compare
|
7983 |
|
|
(and:SI
|
7984 |
|
|
(zero_extract:SI
|
7985 |
|
|
(match_operand 1 "ext_register_operand" "0")
|
7986 |
|
|
(const_int 8)
|
7987 |
|
|
(const_int 8))
|
7988 |
|
|
(match_operand 2 "const_int_operand" "n"))
|
7989 |
|
|
(const_int 0)))
|
7990 |
|
|
(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
7991 |
|
|
(const_int 8)
|
7992 |
|
|
(const_int 8))
|
7993 |
|
|
(and:SI
|
7994 |
|
|
(zero_extract:SI
|
7995 |
|
|
(match_dup 1)
|
7996 |
|
|
(const_int 8)
|
7997 |
|
|
(const_int 8))
|
7998 |
|
|
(match_dup 2)))]
|
7999 |
|
|
"ix86_match_ccmode (insn, CCNOmode)"
|
8000 |
|
|
"and{b}\t{%2, %h0|%h0, %2}"
|
8001 |
|
|
[(set_attr "type" "alu")
|
8002 |
|
|
(set_attr "length_immediate" "1")
|
8003 |
|
|
(set_attr "modrm" "1")
|
8004 |
|
|
(set_attr "mode" "QI")])
|
8005 |
|
|
|
8006 |
|
|
(define_insn "*andqi_ext_1_rex64"
|
8007 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
8008 |
|
|
(const_int 8)
|
8009 |
|
|
(const_int 8))
|
8010 |
|
|
(and:SI
|
8011 |
|
|
(zero_extract:SI
|
8012 |
|
|
(match_operand 1 "ext_register_operand" "0")
|
8013 |
|
|
(const_int 8)
|
8014 |
|
|
(const_int 8))
|
8015 |
|
|
(zero_extend:SI
|
8016 |
|
|
(match_operand 2 "ext_register_operand" "Q"))))
|
8017 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8018 |
|
|
"TARGET_64BIT"
|
8019 |
|
|
"and{b}\t{%2, %h0|%h0, %2}"
|
8020 |
|
|
[(set_attr "type" "alu")
|
8021 |
|
|
(set_attr "length_immediate" "0")
|
8022 |
|
|
(set_attr "mode" "QI")])
|
8023 |
|
|
|
8024 |
|
|
(define_insn "*andqi_ext_1"
|
8025 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
8026 |
|
|
(const_int 8)
|
8027 |
|
|
(const_int 8))
|
8028 |
|
|
(and:SI
|
8029 |
|
|
(zero_extract:SI
|
8030 |
|
|
(match_operand 1 "ext_register_operand" "0")
|
8031 |
|
|
(const_int 8)
|
8032 |
|
|
(const_int 8))
|
8033 |
|
|
(zero_extend:SI
|
8034 |
|
|
(match_operand:QI 2 "general_operand" "Qm"))))
|
8035 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8036 |
|
|
"!TARGET_64BIT"
|
8037 |
|
|
"and{b}\t{%2, %h0|%h0, %2}"
|
8038 |
|
|
[(set_attr "type" "alu")
|
8039 |
|
|
(set_attr "length_immediate" "0")
|
8040 |
|
|
(set_attr "mode" "QI")])
|
8041 |
|
|
|
8042 |
|
|
(define_insn "*andqi_ext_2"
|
8043 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
8044 |
|
|
(const_int 8)
|
8045 |
|
|
(const_int 8))
|
8046 |
|
|
(and:SI
|
8047 |
|
|
(zero_extract:SI
|
8048 |
|
|
(match_operand 1 "ext_register_operand" "%0")
|
8049 |
|
|
(const_int 8)
|
8050 |
|
|
(const_int 8))
|
8051 |
|
|
(zero_extract:SI
|
8052 |
|
|
(match_operand 2 "ext_register_operand" "Q")
|
8053 |
|
|
(const_int 8)
|
8054 |
|
|
(const_int 8))))
|
8055 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8056 |
|
|
""
|
8057 |
|
|
"and{b}\t{%h2, %h0|%h0, %h2}"
|
8058 |
|
|
[(set_attr "type" "alu")
|
8059 |
|
|
(set_attr "length_immediate" "0")
|
8060 |
|
|
(set_attr "mode" "QI")])
|
8061 |
|
|
|
8062 |
|
|
;; Convert wide AND instructions with immediate operand to shorter QImode
|
8063 |
|
|
;; equivalents when possible.
|
8064 |
|
|
;; Don't do the splitting with memory operands, since it introduces risk
|
8065 |
|
|
;; of memory mismatch stalls. We may want to do the splitting for optimizing
|
8066 |
|
|
;; for size, but that can (should?) be handled by generic code instead.
|
8067 |
|
|
(define_split
|
8068 |
|
|
[(set (match_operand 0 "register_operand" "")
|
8069 |
|
|
(and (match_operand 1 "register_operand" "")
|
8070 |
|
|
(match_operand 2 "const_int_operand" "")))
|
8071 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8072 |
|
|
"reload_completed
|
8073 |
|
|
&& QI_REG_P (operands[0])
|
8074 |
|
|
&& (!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
8075 |
|
|
&& !(~INTVAL (operands[2]) & ~(255 << 8))
|
8076 |
|
|
&& GET_MODE (operands[0]) != QImode"
|
8077 |
|
|
[(parallel [(set (zero_extract:SI (match_dup 0) (const_int 8) (const_int 8))
|
8078 |
|
|
(and:SI (zero_extract:SI (match_dup 1)
|
8079 |
|
|
(const_int 8) (const_int 8))
|
8080 |
|
|
(match_dup 2)))
|
8081 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
8082 |
|
|
{
|
8083 |
|
|
operands[0] = gen_lowpart (SImode, operands[0]);
|
8084 |
|
|
operands[1] = gen_lowpart (SImode, operands[1]);
|
8085 |
|
|
operands[2] = gen_int_mode ((INTVAL (operands[2]) >> 8) & 0xff, SImode);
|
8086 |
|
|
})
|
8087 |
|
|
|
8088 |
|
|
;; Since AND can be encoded with sign extended immediate, this is only
|
8089 |
|
|
;; profitable when 7th bit is not set.
|
8090 |
|
|
(define_split
|
8091 |
|
|
[(set (match_operand 0 "register_operand" "")
|
8092 |
|
|
(and (match_operand 1 "general_operand" "")
|
8093 |
|
|
(match_operand 2 "const_int_operand" "")))
|
8094 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8095 |
|
|
"reload_completed
|
8096 |
|
|
&& ANY_QI_REG_P (operands[0])
|
8097 |
|
|
&& (!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
8098 |
|
|
&& !(~INTVAL (operands[2]) & ~255)
|
8099 |
|
|
&& !(INTVAL (operands[2]) & 128)
|
8100 |
|
|
&& GET_MODE (operands[0]) != QImode"
|
8101 |
|
|
[(parallel [(set (strict_low_part (match_dup 0))
|
8102 |
|
|
(and:QI (match_dup 1)
|
8103 |
|
|
(match_dup 2)))
|
8104 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
8105 |
|
|
{
|
8106 |
|
|
operands[0] = gen_lowpart (QImode, operands[0]);
|
8107 |
|
|
operands[1] = gen_lowpart (QImode, operands[1]);
|
8108 |
|
|
operands[2] = gen_lowpart (QImode, operands[2]);
|
8109 |
|
|
})
|
8110 |
|
|
|
8111 |
|
|
;; Logical inclusive and exclusive OR instructions
|
8112 |
|
|
|
8113 |
|
|
;; %%% This used to optimize known byte-wide and operations to memory.
|
8114 |
|
|
;; If this is considered useful, it should be done with splitters.
|
8115 |
|
|
|
8116 |
|
|
(define_expand "3"
|
8117 |
|
|
[(set (match_operand:SWIM 0 "nonimmediate_operand" "")
|
8118 |
|
|
(any_or:SWIM (match_operand:SWIM 1 "nonimmediate_operand" "")
|
8119 |
|
|
(match_operand:SWIM 2 "" "")))]
|
8120 |
|
|
""
|
8121 |
|
|
"ix86_expand_binary_operator (, mode, operands); DONE;")
|
8122 |
|
|
|
8123 |
|
|
(define_insn "*_1"
|
8124 |
|
|
[(set (match_operand:SWI248 0 "nonimmediate_operand" "=r,rm")
|
8125 |
|
|
(any_or:SWI248
|
8126 |
|
|
(match_operand:SWI248 1 "nonimmediate_operand" "%0,0")
|
8127 |
|
|
(match_operand:SWI248 2 "" ",r")))
|
8128 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8129 |
|
|
"ix86_binary_operator_ok (, mode, operands)"
|
8130 |
|
|
"{}\t{%2, %0|%0, %2}"
|
8131 |
|
|
[(set_attr "type" "alu")
|
8132 |
|
|
(set_attr "mode" "")])
|
8133 |
|
|
|
8134 |
|
|
;; %%% Potential partial reg stall on alternative 2. What to do?
|
8135 |
|
|
(define_insn "*qi_1"
|
8136 |
|
|
[(set (match_operand:QI 0 "nonimmediate_operand" "=q,m,r")
|
8137 |
|
|
(any_or:QI (match_operand:QI 1 "nonimmediate_operand" "%0,0,0")
|
8138 |
|
|
(match_operand:QI 2 "general_operand" "qmn,qn,rn")))
|
8139 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8140 |
|
|
"ix86_binary_operator_ok (, QImode, operands)"
|
8141 |
|
|
"@
|
8142 |
|
|
{b}\t{%2, %0|%0, %2}
|
8143 |
|
|
{b}\t{%2, %0|%0, %2}
|
8144 |
|
|
{l}\t{%k2, %k0|%k0, %k2}"
|
8145 |
|
|
[(set_attr "type" "alu")
|
8146 |
|
|
(set_attr "mode" "QI,QI,SI")])
|
8147 |
|
|
|
8148 |
|
|
;; See comment for addsi_1_zext why we do use nonimmediate_operand
|
8149 |
|
|
(define_insn "*si_1_zext"
|
8150 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
8151 |
|
|
(zero_extend:DI
|
8152 |
|
|
(any_or:SI (match_operand:SI 1 "nonimmediate_operand" "%0")
|
8153 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "rme"))))
|
8154 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8155 |
|
|
"TARGET_64BIT && ix86_binary_operator_ok (, SImode, operands)"
|
8156 |
|
|
"{l}\t{%2, %k0|%k0, %2}"
|
8157 |
|
|
[(set_attr "type" "alu")
|
8158 |
|
|
(set_attr "mode" "SI")])
|
8159 |
|
|
|
8160 |
|
|
(define_insn "*si_1_zext_imm"
|
8161 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
8162 |
|
|
(any_or:DI
|
8163 |
|
|
(zero_extend:DI (match_operand:SI 1 "register_operand" "%0"))
|
8164 |
|
|
(match_operand:DI 2 "x86_64_zext_immediate_operand" "Z")))
|
8165 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8166 |
|
|
"TARGET_64BIT && ix86_binary_operator_ok (, SImode, operands)"
|
8167 |
|
|
"{l}\t{%2, %k0|%k0, %2}"
|
8168 |
|
|
[(set_attr "type" "alu")
|
8169 |
|
|
(set_attr "mode" "SI")])
|
8170 |
|
|
|
8171 |
|
|
(define_insn "*qi_1_slp"
|
8172 |
|
|
[(set (strict_low_part (match_operand:QI 0 "nonimmediate_operand" "+q,m"))
|
8173 |
|
|
(any_or:QI (match_dup 0)
|
8174 |
|
|
(match_operand:QI 1 "general_operand" "qmn,qn")))
|
8175 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8176 |
|
|
"(!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
8177 |
|
|
&& !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
8178 |
|
|
"{b}\t{%1, %0|%0, %1}"
|
8179 |
|
|
[(set_attr "type" "alu1")
|
8180 |
|
|
(set_attr "mode" "QI")])
|
8181 |
|
|
|
8182 |
|
|
(define_insn "*_2"
|
8183 |
|
|
[(set (reg FLAGS_REG)
|
8184 |
|
|
(compare (any_or:SWI
|
8185 |
|
|
(match_operand:SWI 1 "nonimmediate_operand" "%0,0")
|
8186 |
|
|
(match_operand:SWI 2 "" ","))
|
8187 |
|
|
(const_int 0)))
|
8188 |
|
|
(set (match_operand:SWI 0 "nonimmediate_operand" "=,m")
|
8189 |
|
|
(any_or:SWI (match_dup 1) (match_dup 2)))]
|
8190 |
|
|
"ix86_match_ccmode (insn, CCNOmode)
|
8191 |
|
|
&& ix86_binary_operator_ok (, mode, operands)"
|
8192 |
|
|
"{}\t{%2, %0|%0, %2}"
|
8193 |
|
|
[(set_attr "type" "alu")
|
8194 |
|
|
(set_attr "mode" "")])
|
8195 |
|
|
|
8196 |
|
|
;; See comment for addsi_1_zext why we do use nonimmediate_operand
|
8197 |
|
|
;; ??? Special case for immediate operand is missing - it is tricky.
|
8198 |
|
|
(define_insn "*si_2_zext"
|
8199 |
|
|
[(set (reg FLAGS_REG)
|
8200 |
|
|
(compare (any_or:SI (match_operand:SI 1 "nonimmediate_operand" "%0")
|
8201 |
|
|
(match_operand:SI 2 "x86_64_general_operand" "rme"))
|
8202 |
|
|
(const_int 0)))
|
8203 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
8204 |
|
|
(zero_extend:DI (any_or:SI (match_dup 1) (match_dup 2))))]
|
8205 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCNOmode)
|
8206 |
|
|
&& ix86_binary_operator_ok (, SImode, operands)"
|
8207 |
|
|
"{l}\t{%2, %k0|%k0, %2}"
|
8208 |
|
|
[(set_attr "type" "alu")
|
8209 |
|
|
(set_attr "mode" "SI")])
|
8210 |
|
|
|
8211 |
|
|
(define_insn "*si_2_zext_imm"
|
8212 |
|
|
[(set (reg FLAGS_REG)
|
8213 |
|
|
(compare (any_or:SI
|
8214 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "%0")
|
8215 |
|
|
(match_operand:SI 2 "x86_64_zext_immediate_operand" "Z"))
|
8216 |
|
|
(const_int 0)))
|
8217 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
8218 |
|
|
(any_or:DI (zero_extend:DI (match_dup 1)) (match_dup 2)))]
|
8219 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCNOmode)
|
8220 |
|
|
&& ix86_binary_operator_ok (, SImode, operands)"
|
8221 |
|
|
"{l}\t{%2, %k0|%k0, %2}"
|
8222 |
|
|
[(set_attr "type" "alu")
|
8223 |
|
|
(set_attr "mode" "SI")])
|
8224 |
|
|
|
8225 |
|
|
(define_insn "*qi_2_slp"
|
8226 |
|
|
[(set (reg FLAGS_REG)
|
8227 |
|
|
(compare (any_or:QI (match_operand:QI 0 "nonimmediate_operand" "+q,qm")
|
8228 |
|
|
(match_operand:QI 1 "general_operand" "qmn,qn"))
|
8229 |
|
|
(const_int 0)))
|
8230 |
|
|
(set (strict_low_part (match_dup 0))
|
8231 |
|
|
(any_or:QI (match_dup 0) (match_dup 1)))]
|
8232 |
|
|
"(!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
8233 |
|
|
&& ix86_match_ccmode (insn, CCNOmode)
|
8234 |
|
|
&& !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
8235 |
|
|
"{b}\t{%1, %0|%0, %1}"
|
8236 |
|
|
[(set_attr "type" "alu1")
|
8237 |
|
|
(set_attr "mode" "QI")])
|
8238 |
|
|
|
8239 |
|
|
(define_insn "*_3"
|
8240 |
|
|
[(set (reg FLAGS_REG)
|
8241 |
|
|
(compare (any_or:SWI
|
8242 |
|
|
(match_operand:SWI 1 "nonimmediate_operand" "%0")
|
8243 |
|
|
(match_operand:SWI 2 "" ""))
|
8244 |
|
|
(const_int 0)))
|
8245 |
|
|
(clobber (match_scratch:SWI 0 "="))]
|
8246 |
|
|
"ix86_match_ccmode (insn, CCNOmode)
|
8247 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
8248 |
|
|
"{}\t{%2, %0|%0, %2}"
|
8249 |
|
|
[(set_attr "type" "alu")
|
8250 |
|
|
(set_attr "mode" "")])
|
8251 |
|
|
|
8252 |
|
|
(define_insn "*qi_ext_0"
|
8253 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
8254 |
|
|
(const_int 8)
|
8255 |
|
|
(const_int 8))
|
8256 |
|
|
(any_or:SI
|
8257 |
|
|
(zero_extract:SI
|
8258 |
|
|
(match_operand 1 "ext_register_operand" "0")
|
8259 |
|
|
(const_int 8)
|
8260 |
|
|
(const_int 8))
|
8261 |
|
|
(match_operand 2 "const_int_operand" "n")))
|
8262 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8263 |
|
|
"!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun)"
|
8264 |
|
|
"{b}\t{%2, %h0|%h0, %2}"
|
8265 |
|
|
[(set_attr "type" "alu")
|
8266 |
|
|
(set_attr "length_immediate" "1")
|
8267 |
|
|
(set_attr "modrm" "1")
|
8268 |
|
|
(set_attr "mode" "QI")])
|
8269 |
|
|
|
8270 |
|
|
(define_insn "*qi_ext_1_rex64"
|
8271 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
8272 |
|
|
(const_int 8)
|
8273 |
|
|
(const_int 8))
|
8274 |
|
|
(any_or:SI
|
8275 |
|
|
(zero_extract:SI
|
8276 |
|
|
(match_operand 1 "ext_register_operand" "0")
|
8277 |
|
|
(const_int 8)
|
8278 |
|
|
(const_int 8))
|
8279 |
|
|
(zero_extend:SI
|
8280 |
|
|
(match_operand 2 "ext_register_operand" "Q"))))
|
8281 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8282 |
|
|
"TARGET_64BIT
|
8283 |
|
|
&& (!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))"
|
8284 |
|
|
"{b}\t{%2, %h0|%h0, %2}"
|
8285 |
|
|
[(set_attr "type" "alu")
|
8286 |
|
|
(set_attr "length_immediate" "0")
|
8287 |
|
|
(set_attr "mode" "QI")])
|
8288 |
|
|
|
8289 |
|
|
(define_insn "*qi_ext_1"
|
8290 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
8291 |
|
|
(const_int 8)
|
8292 |
|
|
(const_int 8))
|
8293 |
|
|
(any_or:SI
|
8294 |
|
|
(zero_extract:SI
|
8295 |
|
|
(match_operand 1 "ext_register_operand" "0")
|
8296 |
|
|
(const_int 8)
|
8297 |
|
|
(const_int 8))
|
8298 |
|
|
(zero_extend:SI
|
8299 |
|
|
(match_operand:QI 2 "general_operand" "Qm"))))
|
8300 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8301 |
|
|
"!TARGET_64BIT
|
8302 |
|
|
&& (!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))"
|
8303 |
|
|
"{b}\t{%2, %h0|%h0, %2}"
|
8304 |
|
|
[(set_attr "type" "alu")
|
8305 |
|
|
(set_attr "length_immediate" "0")
|
8306 |
|
|
(set_attr "mode" "QI")])
|
8307 |
|
|
|
8308 |
|
|
(define_insn "*qi_ext_2"
|
8309 |
|
|
[(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
8310 |
|
|
(const_int 8)
|
8311 |
|
|
(const_int 8))
|
8312 |
|
|
(any_or:SI
|
8313 |
|
|
(zero_extract:SI (match_operand 1 "ext_register_operand" "0")
|
8314 |
|
|
(const_int 8)
|
8315 |
|
|
(const_int 8))
|
8316 |
|
|
(zero_extract:SI (match_operand 2 "ext_register_operand" "Q")
|
8317 |
|
|
(const_int 8)
|
8318 |
|
|
(const_int 8))))
|
8319 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8320 |
|
|
"!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun)"
|
8321 |
|
|
"{b}\t{%h2, %h0|%h0, %h2}"
|
8322 |
|
|
[(set_attr "type" "alu")
|
8323 |
|
|
(set_attr "length_immediate" "0")
|
8324 |
|
|
(set_attr "mode" "QI")])
|
8325 |
|
|
|
8326 |
|
|
(define_split
|
8327 |
|
|
[(set (match_operand 0 "register_operand" "")
|
8328 |
|
|
(any_or (match_operand 1 "register_operand" "")
|
8329 |
|
|
(match_operand 2 "const_int_operand" "")))
|
8330 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8331 |
|
|
"reload_completed
|
8332 |
|
|
&& QI_REG_P (operands[0])
|
8333 |
|
|
&& (!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
8334 |
|
|
&& !(INTVAL (operands[2]) & ~(255 << 8))
|
8335 |
|
|
&& GET_MODE (operands[0]) != QImode"
|
8336 |
|
|
[(parallel [(set (zero_extract:SI (match_dup 0) (const_int 8) (const_int 8))
|
8337 |
|
|
(any_or:SI (zero_extract:SI (match_dup 1)
|
8338 |
|
|
(const_int 8) (const_int 8))
|
8339 |
|
|
(match_dup 2)))
|
8340 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
8341 |
|
|
{
|
8342 |
|
|
operands[0] = gen_lowpart (SImode, operands[0]);
|
8343 |
|
|
operands[1] = gen_lowpart (SImode, operands[1]);
|
8344 |
|
|
operands[2] = gen_int_mode ((INTVAL (operands[2]) >> 8) & 0xff, SImode);
|
8345 |
|
|
})
|
8346 |
|
|
|
8347 |
|
|
;; Since OR can be encoded with sign extended immediate, this is only
|
8348 |
|
|
;; profitable when 7th bit is set.
|
8349 |
|
|
(define_split
|
8350 |
|
|
[(set (match_operand 0 "register_operand" "")
|
8351 |
|
|
(any_or (match_operand 1 "general_operand" "")
|
8352 |
|
|
(match_operand 2 "const_int_operand" "")))
|
8353 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8354 |
|
|
"reload_completed
|
8355 |
|
|
&& ANY_QI_REG_P (operands[0])
|
8356 |
|
|
&& (!TARGET_PARTIAL_REG_STALL || optimize_function_for_size_p (cfun))
|
8357 |
|
|
&& !(INTVAL (operands[2]) & ~255)
|
8358 |
|
|
&& (INTVAL (operands[2]) & 128)
|
8359 |
|
|
&& GET_MODE (operands[0]) != QImode"
|
8360 |
|
|
[(parallel [(set (strict_low_part (match_dup 0))
|
8361 |
|
|
(any_or:QI (match_dup 1)
|
8362 |
|
|
(match_dup 2)))
|
8363 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
8364 |
|
|
{
|
8365 |
|
|
operands[0] = gen_lowpart (QImode, operands[0]);
|
8366 |
|
|
operands[1] = gen_lowpart (QImode, operands[1]);
|
8367 |
|
|
operands[2] = gen_lowpart (QImode, operands[2]);
|
8368 |
|
|
})
|
8369 |
|
|
|
8370 |
|
|
(define_expand "xorqi_cc_ext_1"
|
8371 |
|
|
[(parallel [
|
8372 |
|
|
(set (reg:CCNO FLAGS_REG)
|
8373 |
|
|
(compare:CCNO
|
8374 |
|
|
(xor:SI
|
8375 |
|
|
(zero_extract:SI
|
8376 |
|
|
(match_operand 1 "ext_register_operand" "")
|
8377 |
|
|
(const_int 8)
|
8378 |
|
|
(const_int 8))
|
8379 |
|
|
(match_operand:QI 2 "general_operand" ""))
|
8380 |
|
|
(const_int 0)))
|
8381 |
|
|
(set (zero_extract:SI (match_operand 0 "ext_register_operand" "")
|
8382 |
|
|
(const_int 8)
|
8383 |
|
|
(const_int 8))
|
8384 |
|
|
(xor:SI
|
8385 |
|
|
(zero_extract:SI
|
8386 |
|
|
(match_dup 1)
|
8387 |
|
|
(const_int 8)
|
8388 |
|
|
(const_int 8))
|
8389 |
|
|
(match_dup 2)))])])
|
8390 |
|
|
|
8391 |
|
|
(define_insn "*xorqi_cc_ext_1_rex64"
|
8392 |
|
|
[(set (reg FLAGS_REG)
|
8393 |
|
|
(compare
|
8394 |
|
|
(xor:SI
|
8395 |
|
|
(zero_extract:SI
|
8396 |
|
|
(match_operand 1 "ext_register_operand" "0")
|
8397 |
|
|
(const_int 8)
|
8398 |
|
|
(const_int 8))
|
8399 |
|
|
(match_operand:QI 2 "nonmemory_operand" "Qn"))
|
8400 |
|
|
(const_int 0)))
|
8401 |
|
|
(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=Q")
|
8402 |
|
|
(const_int 8)
|
8403 |
|
|
(const_int 8))
|
8404 |
|
|
(xor:SI
|
8405 |
|
|
(zero_extract:SI
|
8406 |
|
|
(match_dup 1)
|
8407 |
|
|
(const_int 8)
|
8408 |
|
|
(const_int 8))
|
8409 |
|
|
(match_dup 2)))]
|
8410 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCNOmode)"
|
8411 |
|
|
"xor{b}\t{%2, %h0|%h0, %2}"
|
8412 |
|
|
[(set_attr "type" "alu")
|
8413 |
|
|
(set_attr "modrm" "1")
|
8414 |
|
|
(set_attr "mode" "QI")])
|
8415 |
|
|
|
8416 |
|
|
(define_insn "*xorqi_cc_ext_1"
|
8417 |
|
|
[(set (reg FLAGS_REG)
|
8418 |
|
|
(compare
|
8419 |
|
|
(xor:SI
|
8420 |
|
|
(zero_extract:SI
|
8421 |
|
|
(match_operand 1 "ext_register_operand" "0")
|
8422 |
|
|
(const_int 8)
|
8423 |
|
|
(const_int 8))
|
8424 |
|
|
(match_operand:QI 2 "general_operand" "qmn"))
|
8425 |
|
|
(const_int 0)))
|
8426 |
|
|
(set (zero_extract:SI (match_operand 0 "ext_register_operand" "=q")
|
8427 |
|
|
(const_int 8)
|
8428 |
|
|
(const_int 8))
|
8429 |
|
|
(xor:SI
|
8430 |
|
|
(zero_extract:SI
|
8431 |
|
|
(match_dup 1)
|
8432 |
|
|
(const_int 8)
|
8433 |
|
|
(const_int 8))
|
8434 |
|
|
(match_dup 2)))]
|
8435 |
|
|
"!TARGET_64BIT && ix86_match_ccmode (insn, CCNOmode)"
|
8436 |
|
|
"xor{b}\t{%2, %h0|%h0, %2}"
|
8437 |
|
|
[(set_attr "type" "alu")
|
8438 |
|
|
(set_attr "modrm" "1")
|
8439 |
|
|
(set_attr "mode" "QI")])
|
8440 |
|
|
|
8441 |
|
|
;; Negation instructions
|
8442 |
|
|
|
8443 |
|
|
(define_expand "neg2"
|
8444 |
|
|
[(set (match_operand:SDWIM 0 "nonimmediate_operand" "")
|
8445 |
|
|
(neg:SDWIM (match_operand:SDWIM 1 "nonimmediate_operand" "")))]
|
8446 |
|
|
""
|
8447 |
|
|
"ix86_expand_unary_operator (NEG, mode, operands); DONE;")
|
8448 |
|
|
|
8449 |
|
|
(define_insn_and_split "*neg2_doubleword"
|
8450 |
|
|
[(set (match_operand: 0 "nonimmediate_operand" "=ro")
|
8451 |
|
|
(neg: (match_operand: 1 "nonimmediate_operand" "0")))
|
8452 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8453 |
|
|
"ix86_unary_operator_ok (NEG, mode, operands)"
|
8454 |
|
|
"#"
|
8455 |
|
|
"reload_completed"
|
8456 |
|
|
[(parallel
|
8457 |
|
|
[(set (reg:CCZ FLAGS_REG)
|
8458 |
|
|
(compare:CCZ (neg:DWIH (match_dup 1)) (const_int 0)))
|
8459 |
|
|
(set (match_dup 0) (neg:DWIH (match_dup 1)))])
|
8460 |
|
|
(parallel
|
8461 |
|
|
[(set (match_dup 2)
|
8462 |
|
|
(plus:DWIH (match_dup 3)
|
8463 |
|
|
(plus:DWIH (ltu:DWIH (reg:CC FLAGS_REG) (const_int 0))
|
8464 |
|
|
(const_int 0))))
|
8465 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
8466 |
|
|
(parallel
|
8467 |
|
|
[(set (match_dup 2)
|
8468 |
|
|
(neg:DWIH (match_dup 2)))
|
8469 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
8470 |
|
|
"split_double_mode (mode, &operands[0], 2, &operands[0], &operands[2]);")
|
8471 |
|
|
|
8472 |
|
|
(define_insn "*neg2_1"
|
8473 |
|
|
[(set (match_operand:SWI 0 "nonimmediate_operand" "=m")
|
8474 |
|
|
(neg:SWI (match_operand:SWI 1 "nonimmediate_operand" "0")))
|
8475 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8476 |
|
|
"ix86_unary_operator_ok (NEG, mode, operands)"
|
8477 |
|
|
"neg{}\t%0"
|
8478 |
|
|
[(set_attr "type" "negnot")
|
8479 |
|
|
(set_attr "mode" "")])
|
8480 |
|
|
|
8481 |
|
|
;; Combine is quite creative about this pattern.
|
8482 |
|
|
(define_insn "*negsi2_1_zext"
|
8483 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
8484 |
|
|
(lshiftrt:DI
|
8485 |
|
|
(neg:DI (ashift:DI (match_operand:DI 1 "register_operand" "0")
|
8486 |
|
|
(const_int 32)))
|
8487 |
|
|
(const_int 32)))
|
8488 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8489 |
|
|
"TARGET_64BIT && ix86_unary_operator_ok (NEG, SImode, operands)"
|
8490 |
|
|
"neg{l}\t%k0"
|
8491 |
|
|
[(set_attr "type" "negnot")
|
8492 |
|
|
(set_attr "mode" "SI")])
|
8493 |
|
|
|
8494 |
|
|
;; The problem with neg is that it does not perform (compare x 0),
|
8495 |
|
|
;; it really performs (compare 0 x), which leaves us with the zero
|
8496 |
|
|
;; flag being the only useful item.
|
8497 |
|
|
|
8498 |
|
|
(define_insn "*neg2_cmpz"
|
8499 |
|
|
[(set (reg:CCZ FLAGS_REG)
|
8500 |
|
|
(compare:CCZ
|
8501 |
|
|
(neg:SWI (match_operand:SWI 1 "nonimmediate_operand" "0"))
|
8502 |
|
|
(const_int 0)))
|
8503 |
|
|
(set (match_operand:SWI 0 "nonimmediate_operand" "=m")
|
8504 |
|
|
(neg:SWI (match_dup 1)))]
|
8505 |
|
|
"ix86_unary_operator_ok (NEG, mode, operands)"
|
8506 |
|
|
"neg{}\t%0"
|
8507 |
|
|
[(set_attr "type" "negnot")
|
8508 |
|
|
(set_attr "mode" "")])
|
8509 |
|
|
|
8510 |
|
|
(define_insn "*negsi2_cmpz_zext"
|
8511 |
|
|
[(set (reg:CCZ FLAGS_REG)
|
8512 |
|
|
(compare:CCZ
|
8513 |
|
|
(lshiftrt:DI
|
8514 |
|
|
(neg:DI (ashift:DI
|
8515 |
|
|
(match_operand:DI 1 "register_operand" "0")
|
8516 |
|
|
(const_int 32)))
|
8517 |
|
|
(const_int 32))
|
8518 |
|
|
(const_int 0)))
|
8519 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
8520 |
|
|
(lshiftrt:DI (neg:DI (ashift:DI (match_dup 1)
|
8521 |
|
|
(const_int 32)))
|
8522 |
|
|
(const_int 32)))]
|
8523 |
|
|
"TARGET_64BIT && ix86_unary_operator_ok (NEG, SImode, operands)"
|
8524 |
|
|
"neg{l}\t%k0"
|
8525 |
|
|
[(set_attr "type" "negnot")
|
8526 |
|
|
(set_attr "mode" "SI")])
|
8527 |
|
|
|
8528 |
|
|
;; Changing of sign for FP values is doable using integer unit too.
|
8529 |
|
|
|
8530 |
|
|
(define_expand "2"
|
8531 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "")
|
8532 |
|
|
(absneg:X87MODEF (match_operand:X87MODEF 1 "register_operand" "")))]
|
8533 |
|
|
"TARGET_80387 || (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)"
|
8534 |
|
|
"ix86_expand_fp_absneg_operator (, mode, operands); DONE;")
|
8535 |
|
|
|
8536 |
|
|
(define_insn "*absneg2_mixed"
|
8537 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x,x,f,!r")
|
8538 |
|
|
(match_operator:MODEF 3 "absneg_operator"
|
8539 |
|
|
[(match_operand:MODEF 1 "register_operand" "0,x,0,0")]))
|
8540 |
|
|
(use (match_operand: 2 "nonimmediate_operand" "xm,0,X,X"))
|
8541 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8542 |
|
|
"TARGET_MIX_SSE_I387 && SSE_FLOAT_MODE_P (mode)"
|
8543 |
|
|
"#")
|
8544 |
|
|
|
8545 |
|
|
(define_insn "*absneg2_sse"
|
8546 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x,x,!r")
|
8547 |
|
|
(match_operator:MODEF 3 "absneg_operator"
|
8548 |
|
|
[(match_operand:MODEF 1 "register_operand" "0 ,x,0")]))
|
8549 |
|
|
(use (match_operand: 2 "register_operand" "xm,0,X"))
|
8550 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8551 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH"
|
8552 |
|
|
"#")
|
8553 |
|
|
|
8554 |
|
|
(define_insn "*absneg2_i387"
|
8555 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "=f,!r")
|
8556 |
|
|
(match_operator:X87MODEF 3 "absneg_operator"
|
8557 |
|
|
[(match_operand:X87MODEF 1 "register_operand" "0,0")]))
|
8558 |
|
|
(use (match_operand 2 "" ""))
|
8559 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8560 |
|
|
"TARGET_80387 && !(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)"
|
8561 |
|
|
"#")
|
8562 |
|
|
|
8563 |
|
|
(define_expand "tf2"
|
8564 |
|
|
[(set (match_operand:TF 0 "register_operand" "")
|
8565 |
|
|
(absneg:TF (match_operand:TF 1 "register_operand" "")))]
|
8566 |
|
|
"TARGET_SSE2"
|
8567 |
|
|
"ix86_expand_fp_absneg_operator (, TFmode, operands); DONE;")
|
8568 |
|
|
|
8569 |
|
|
(define_insn "*absnegtf2_sse"
|
8570 |
|
|
[(set (match_operand:TF 0 "register_operand" "=x,x")
|
8571 |
|
|
(match_operator:TF 3 "absneg_operator"
|
8572 |
|
|
[(match_operand:TF 1 "register_operand" "0,x")]))
|
8573 |
|
|
(use (match_operand:TF 2 "nonimmediate_operand" "xm,0"))
|
8574 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8575 |
|
|
"TARGET_SSE2"
|
8576 |
|
|
"#")
|
8577 |
|
|
|
8578 |
|
|
;; Splitters for fp abs and neg.
|
8579 |
|
|
|
8580 |
|
|
(define_split
|
8581 |
|
|
[(set (match_operand 0 "fp_register_operand" "")
|
8582 |
|
|
(match_operator 1 "absneg_operator" [(match_dup 0)]))
|
8583 |
|
|
(use (match_operand 2 "" ""))
|
8584 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8585 |
|
|
"reload_completed"
|
8586 |
|
|
[(set (match_dup 0) (match_op_dup 1 [(match_dup 0)]))])
|
8587 |
|
|
|
8588 |
|
|
(define_split
|
8589 |
|
|
[(set (match_operand 0 "register_operand" "")
|
8590 |
|
|
(match_operator 3 "absneg_operator"
|
8591 |
|
|
[(match_operand 1 "register_operand" "")]))
|
8592 |
|
|
(use (match_operand 2 "nonimmediate_operand" ""))
|
8593 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8594 |
|
|
"reload_completed && SSE_REG_P (operands[0])"
|
8595 |
|
|
[(set (match_dup 0) (match_dup 3))]
|
8596 |
|
|
{
|
8597 |
|
|
enum machine_mode mode = GET_MODE (operands[0]);
|
8598 |
|
|
enum machine_mode vmode = GET_MODE (operands[2]);
|
8599 |
|
|
rtx tmp;
|
8600 |
|
|
|
8601 |
|
|
operands[0] = simplify_gen_subreg (vmode, operands[0], mode, 0);
|
8602 |
|
|
operands[1] = simplify_gen_subreg (vmode, operands[1], mode, 0);
|
8603 |
|
|
if (operands_match_p (operands[0], operands[2]))
|
8604 |
|
|
{
|
8605 |
|
|
tmp = operands[1];
|
8606 |
|
|
operands[1] = operands[2];
|
8607 |
|
|
operands[2] = tmp;
|
8608 |
|
|
}
|
8609 |
|
|
if (GET_CODE (operands[3]) == ABS)
|
8610 |
|
|
tmp = gen_rtx_AND (vmode, operands[1], operands[2]);
|
8611 |
|
|
else
|
8612 |
|
|
tmp = gen_rtx_XOR (vmode, operands[1], operands[2]);
|
8613 |
|
|
operands[3] = tmp;
|
8614 |
|
|
})
|
8615 |
|
|
|
8616 |
|
|
(define_split
|
8617 |
|
|
[(set (match_operand:SF 0 "register_operand" "")
|
8618 |
|
|
(match_operator:SF 1 "absneg_operator" [(match_dup 0)]))
|
8619 |
|
|
(use (match_operand:V4SF 2 "" ""))
|
8620 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8621 |
|
|
"reload_completed"
|
8622 |
|
|
[(parallel [(set (match_dup 0) (match_dup 1))
|
8623 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
8624 |
|
|
{
|
8625 |
|
|
rtx tmp;
|
8626 |
|
|
operands[0] = gen_lowpart (SImode, operands[0]);
|
8627 |
|
|
if (GET_CODE (operands[1]) == ABS)
|
8628 |
|
|
{
|
8629 |
|
|
tmp = gen_int_mode (0x7fffffff, SImode);
|
8630 |
|
|
tmp = gen_rtx_AND (SImode, operands[0], tmp);
|
8631 |
|
|
}
|
8632 |
|
|
else
|
8633 |
|
|
{
|
8634 |
|
|
tmp = gen_int_mode (0x80000000, SImode);
|
8635 |
|
|
tmp = gen_rtx_XOR (SImode, operands[0], tmp);
|
8636 |
|
|
}
|
8637 |
|
|
operands[1] = tmp;
|
8638 |
|
|
})
|
8639 |
|
|
|
8640 |
|
|
(define_split
|
8641 |
|
|
[(set (match_operand:DF 0 "register_operand" "")
|
8642 |
|
|
(match_operator:DF 1 "absneg_operator" [(match_dup 0)]))
|
8643 |
|
|
(use (match_operand 2 "" ""))
|
8644 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8645 |
|
|
"reload_completed"
|
8646 |
|
|
[(parallel [(set (match_dup 0) (match_dup 1))
|
8647 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
8648 |
|
|
{
|
8649 |
|
|
rtx tmp;
|
8650 |
|
|
if (TARGET_64BIT)
|
8651 |
|
|
{
|
8652 |
|
|
tmp = gen_lowpart (DImode, operands[0]);
|
8653 |
|
|
tmp = gen_rtx_ZERO_EXTRACT (DImode, tmp, const1_rtx, GEN_INT (63));
|
8654 |
|
|
operands[0] = tmp;
|
8655 |
|
|
|
8656 |
|
|
if (GET_CODE (operands[1]) == ABS)
|
8657 |
|
|
tmp = const0_rtx;
|
8658 |
|
|
else
|
8659 |
|
|
tmp = gen_rtx_NOT (DImode, tmp);
|
8660 |
|
|
}
|
8661 |
|
|
else
|
8662 |
|
|
{
|
8663 |
|
|
operands[0] = gen_highpart (SImode, operands[0]);
|
8664 |
|
|
if (GET_CODE (operands[1]) == ABS)
|
8665 |
|
|
{
|
8666 |
|
|
tmp = gen_int_mode (0x7fffffff, SImode);
|
8667 |
|
|
tmp = gen_rtx_AND (SImode, operands[0], tmp);
|
8668 |
|
|
}
|
8669 |
|
|
else
|
8670 |
|
|
{
|
8671 |
|
|
tmp = gen_int_mode (0x80000000, SImode);
|
8672 |
|
|
tmp = gen_rtx_XOR (SImode, operands[0], tmp);
|
8673 |
|
|
}
|
8674 |
|
|
}
|
8675 |
|
|
operands[1] = tmp;
|
8676 |
|
|
})
|
8677 |
|
|
|
8678 |
|
|
(define_split
|
8679 |
|
|
[(set (match_operand:XF 0 "register_operand" "")
|
8680 |
|
|
(match_operator:XF 1 "absneg_operator" [(match_dup 0)]))
|
8681 |
|
|
(use (match_operand 2 "" ""))
|
8682 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8683 |
|
|
"reload_completed"
|
8684 |
|
|
[(parallel [(set (match_dup 0) (match_dup 1))
|
8685 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
8686 |
|
|
{
|
8687 |
|
|
rtx tmp;
|
8688 |
|
|
operands[0] = gen_rtx_REG (SImode,
|
8689 |
|
|
true_regnum (operands[0])
|
8690 |
|
|
+ (TARGET_64BIT ? 1 : 2));
|
8691 |
|
|
if (GET_CODE (operands[1]) == ABS)
|
8692 |
|
|
{
|
8693 |
|
|
tmp = GEN_INT (0x7fff);
|
8694 |
|
|
tmp = gen_rtx_AND (SImode, operands[0], tmp);
|
8695 |
|
|
}
|
8696 |
|
|
else
|
8697 |
|
|
{
|
8698 |
|
|
tmp = GEN_INT (0x8000);
|
8699 |
|
|
tmp = gen_rtx_XOR (SImode, operands[0], tmp);
|
8700 |
|
|
}
|
8701 |
|
|
operands[1] = tmp;
|
8702 |
|
|
})
|
8703 |
|
|
|
8704 |
|
|
;; Conditionalize these after reload. If they match before reload, we
|
8705 |
|
|
;; lose the clobber and ability to use integer instructions.
|
8706 |
|
|
|
8707 |
|
|
(define_insn "*2_1"
|
8708 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "=f")
|
8709 |
|
|
(absneg:X87MODEF (match_operand:X87MODEF 1 "register_operand" "0")))]
|
8710 |
|
|
"TARGET_80387
|
8711 |
|
|
&& (reload_completed
|
8712 |
|
|
|| !(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH))"
|
8713 |
|
|
"f"
|
8714 |
|
|
[(set_attr "type" "fsgn")
|
8715 |
|
|
(set_attr "mode" "")])
|
8716 |
|
|
|
8717 |
|
|
(define_insn "*extendsfdf2"
|
8718 |
|
|
[(set (match_operand:DF 0 "register_operand" "=f")
|
8719 |
|
|
(absneg:DF (float_extend:DF
|
8720 |
|
|
(match_operand:SF 1 "register_operand" "0"))))]
|
8721 |
|
|
"TARGET_80387 && (!TARGET_SSE_MATH || TARGET_MIX_SSE_I387)"
|
8722 |
|
|
"f"
|
8723 |
|
|
[(set_attr "type" "fsgn")
|
8724 |
|
|
(set_attr "mode" "DF")])
|
8725 |
|
|
|
8726 |
|
|
(define_insn "*extendsfxf2"
|
8727 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
8728 |
|
|
(absneg:XF (float_extend:XF
|
8729 |
|
|
(match_operand:SF 1 "register_operand" "0"))))]
|
8730 |
|
|
"TARGET_80387"
|
8731 |
|
|
"f"
|
8732 |
|
|
[(set_attr "type" "fsgn")
|
8733 |
|
|
(set_attr "mode" "XF")])
|
8734 |
|
|
|
8735 |
|
|
(define_insn "*extenddfxf2"
|
8736 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
8737 |
|
|
(absneg:XF (float_extend:XF
|
8738 |
|
|
(match_operand:DF 1 "register_operand" "0"))))]
|
8739 |
|
|
"TARGET_80387"
|
8740 |
|
|
"f"
|
8741 |
|
|
[(set_attr "type" "fsgn")
|
8742 |
|
|
(set_attr "mode" "XF")])
|
8743 |
|
|
|
8744 |
|
|
;; Copysign instructions
|
8745 |
|
|
|
8746 |
|
|
(define_mode_iterator CSGNMODE [SF DF TF])
|
8747 |
|
|
(define_mode_attr CSGNVMODE [(SF "V4SF") (DF "V2DF") (TF "TF")])
|
8748 |
|
|
|
8749 |
|
|
(define_expand "copysign3"
|
8750 |
|
|
[(match_operand:CSGNMODE 0 "register_operand" "")
|
8751 |
|
|
(match_operand:CSGNMODE 1 "nonmemory_operand" "")
|
8752 |
|
|
(match_operand:CSGNMODE 2 "register_operand" "")]
|
8753 |
|
|
"(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
8754 |
|
|
|| (TARGET_SSE2 && (mode == TFmode))"
|
8755 |
|
|
"ix86_expand_copysign (operands); DONE;")
|
8756 |
|
|
|
8757 |
|
|
(define_insn_and_split "copysign3_const"
|
8758 |
|
|
[(set (match_operand:CSGNMODE 0 "register_operand" "=x")
|
8759 |
|
|
(unspec:CSGNMODE
|
8760 |
|
|
[(match_operand: 1 "vector_move_operand" "xmC")
|
8761 |
|
|
(match_operand:CSGNMODE 2 "register_operand" "0")
|
8762 |
|
|
(match_operand: 3 "nonimmediate_operand" "xm")]
|
8763 |
|
|
UNSPEC_COPYSIGN))]
|
8764 |
|
|
"(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
8765 |
|
|
|| (TARGET_SSE2 && (mode == TFmode))"
|
8766 |
|
|
"#"
|
8767 |
|
|
"&& reload_completed"
|
8768 |
|
|
[(const_int 0)]
|
8769 |
|
|
"ix86_split_copysign_const (operands); DONE;")
|
8770 |
|
|
|
8771 |
|
|
(define_insn "copysign3_var"
|
8772 |
|
|
[(set (match_operand:CSGNMODE 0 "register_operand" "=x,x,x,x,x")
|
8773 |
|
|
(unspec:CSGNMODE
|
8774 |
|
|
[(match_operand:CSGNMODE 2 "register_operand" "x,0,0,x,x")
|
8775 |
|
|
(match_operand:CSGNMODE 3 "register_operand" "1,1,x,1,x")
|
8776 |
|
|
(match_operand: 4 "nonimmediate_operand" "X,xm,xm,0,0")
|
8777 |
|
|
(match_operand: 5 "nonimmediate_operand" "0,xm,1,xm,1")]
|
8778 |
|
|
UNSPEC_COPYSIGN))
|
8779 |
|
|
(clobber (match_scratch: 1 "=x,x,x,x,x"))]
|
8780 |
|
|
"(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
8781 |
|
|
|| (TARGET_SSE2 && (mode == TFmode))"
|
8782 |
|
|
"#")
|
8783 |
|
|
|
8784 |
|
|
(define_split
|
8785 |
|
|
[(set (match_operand:CSGNMODE 0 "register_operand" "")
|
8786 |
|
|
(unspec:CSGNMODE
|
8787 |
|
|
[(match_operand:CSGNMODE 2 "register_operand" "")
|
8788 |
|
|
(match_operand:CSGNMODE 3 "register_operand" "")
|
8789 |
|
|
(match_operand: 4 "" "")
|
8790 |
|
|
(match_operand: 5 "" "")]
|
8791 |
|
|
UNSPEC_COPYSIGN))
|
8792 |
|
|
(clobber (match_scratch: 1 ""))]
|
8793 |
|
|
"((SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
8794 |
|
|
|| (TARGET_SSE2 && (mode == TFmode)))
|
8795 |
|
|
&& reload_completed"
|
8796 |
|
|
[(const_int 0)]
|
8797 |
|
|
"ix86_split_copysign_var (operands); DONE;")
|
8798 |
|
|
|
8799 |
|
|
;; One complement instructions
|
8800 |
|
|
|
8801 |
|
|
(define_expand "one_cmpl2"
|
8802 |
|
|
[(set (match_operand:SWIM 0 "nonimmediate_operand" "")
|
8803 |
|
|
(not:SWIM (match_operand:SWIM 1 "nonimmediate_operand" "")))]
|
8804 |
|
|
""
|
8805 |
|
|
"ix86_expand_unary_operator (NOT, mode, operands); DONE;")
|
8806 |
|
|
|
8807 |
|
|
(define_insn "*one_cmpl2_1"
|
8808 |
|
|
[(set (match_operand:SWI248 0 "nonimmediate_operand" "=rm")
|
8809 |
|
|
(not:SWI248 (match_operand:SWI248 1 "nonimmediate_operand" "0")))]
|
8810 |
|
|
"ix86_unary_operator_ok (NOT, mode, operands)"
|
8811 |
|
|
"not{}\t%0"
|
8812 |
|
|
[(set_attr "type" "negnot")
|
8813 |
|
|
(set_attr "mode" "")])
|
8814 |
|
|
|
8815 |
|
|
;; %%% Potential partial reg stall on alternative 1. What to do?
|
8816 |
|
|
(define_insn "*one_cmplqi2_1"
|
8817 |
|
|
[(set (match_operand:QI 0 "nonimmediate_operand" "=qm,r")
|
8818 |
|
|
(not:QI (match_operand:QI 1 "nonimmediate_operand" "0,0")))]
|
8819 |
|
|
"ix86_unary_operator_ok (NOT, QImode, operands)"
|
8820 |
|
|
"@
|
8821 |
|
|
not{b}\t%0
|
8822 |
|
|
not{l}\t%k0"
|
8823 |
|
|
[(set_attr "type" "negnot")
|
8824 |
|
|
(set_attr "mode" "QI,SI")])
|
8825 |
|
|
|
8826 |
|
|
;; ??? Currently never generated - xor is used instead.
|
8827 |
|
|
(define_insn "*one_cmplsi2_1_zext"
|
8828 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
8829 |
|
|
(zero_extend:DI
|
8830 |
|
|
(not:SI (match_operand:SI 1 "register_operand" "0"))))]
|
8831 |
|
|
"TARGET_64BIT && ix86_unary_operator_ok (NOT, SImode, operands)"
|
8832 |
|
|
"not{l}\t%k0"
|
8833 |
|
|
[(set_attr "type" "negnot")
|
8834 |
|
|
(set_attr "mode" "SI")])
|
8835 |
|
|
|
8836 |
|
|
(define_insn "*one_cmpl2_2"
|
8837 |
|
|
[(set (reg FLAGS_REG)
|
8838 |
|
|
(compare (not:SWI (match_operand:SWI 1 "nonimmediate_operand" "0"))
|
8839 |
|
|
(const_int 0)))
|
8840 |
|
|
(set (match_operand:SWI 0 "nonimmediate_operand" "=m")
|
8841 |
|
|
(not:SWI (match_dup 1)))]
|
8842 |
|
|
"ix86_match_ccmode (insn, CCNOmode)
|
8843 |
|
|
&& ix86_unary_operator_ok (NOT, mode, operands)"
|
8844 |
|
|
"#"
|
8845 |
|
|
[(set_attr "type" "alu1")
|
8846 |
|
|
(set_attr "mode" "")])
|
8847 |
|
|
|
8848 |
|
|
(define_split
|
8849 |
|
|
[(set (match_operand 0 "flags_reg_operand" "")
|
8850 |
|
|
(match_operator 2 "compare_operator"
|
8851 |
|
|
[(not:SWI (match_operand:SWI 3 "nonimmediate_operand" ""))
|
8852 |
|
|
(const_int 0)]))
|
8853 |
|
|
(set (match_operand:SWI 1 "nonimmediate_operand" "")
|
8854 |
|
|
(not:SWI (match_dup 3)))]
|
8855 |
|
|
"ix86_match_ccmode (insn, CCNOmode)"
|
8856 |
|
|
[(parallel [(set (match_dup 0)
|
8857 |
|
|
(match_op_dup 2 [(xor:SWI (match_dup 3) (const_int -1))
|
8858 |
|
|
(const_int 0)]))
|
8859 |
|
|
(set (match_dup 1)
|
8860 |
|
|
(xor:SWI (match_dup 3) (const_int -1)))])])
|
8861 |
|
|
|
8862 |
|
|
;; ??? Currently never generated - xor is used instead.
|
8863 |
|
|
(define_insn "*one_cmplsi2_2_zext"
|
8864 |
|
|
[(set (reg FLAGS_REG)
|
8865 |
|
|
(compare (not:SI (match_operand:SI 1 "register_operand" "0"))
|
8866 |
|
|
(const_int 0)))
|
8867 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
8868 |
|
|
(zero_extend:DI (not:SI (match_dup 1))))]
|
8869 |
|
|
"TARGET_64BIT && ix86_match_ccmode (insn, CCNOmode)
|
8870 |
|
|
&& ix86_unary_operator_ok (NOT, SImode, operands)"
|
8871 |
|
|
"#"
|
8872 |
|
|
[(set_attr "type" "alu1")
|
8873 |
|
|
(set_attr "mode" "SI")])
|
8874 |
|
|
|
8875 |
|
|
(define_split
|
8876 |
|
|
[(set (match_operand 0 "flags_reg_operand" "")
|
8877 |
|
|
(match_operator 2 "compare_operator"
|
8878 |
|
|
[(not:SI (match_operand:SI 3 "register_operand" ""))
|
8879 |
|
|
(const_int 0)]))
|
8880 |
|
|
(set (match_operand:DI 1 "register_operand" "")
|
8881 |
|
|
(zero_extend:DI (not:SI (match_dup 3))))]
|
8882 |
|
|
"ix86_match_ccmode (insn, CCNOmode)"
|
8883 |
|
|
[(parallel [(set (match_dup 0)
|
8884 |
|
|
(match_op_dup 2 [(xor:SI (match_dup 3) (const_int -1))
|
8885 |
|
|
(const_int 0)]))
|
8886 |
|
|
(set (match_dup 1)
|
8887 |
|
|
(zero_extend:DI (xor:SI (match_dup 3) (const_int -1))))])])
|
8888 |
|
|
|
8889 |
|
|
;; Shift instructions
|
8890 |
|
|
|
8891 |
|
|
;; DImode shifts are implemented using the i386 "shift double" opcode,
|
8892 |
|
|
;; which is written as "sh[lr]d[lw] imm,reg,reg/mem". If the shift count
|
8893 |
|
|
;; is variable, then the count is in %cl and the "imm" operand is dropped
|
8894 |
|
|
;; from the assembler input.
|
8895 |
|
|
;;
|
8896 |
|
|
;; This instruction shifts the target reg/mem as usual, but instead of
|
8897 |
|
|
;; shifting in zeros, bits are shifted in from reg operand. If the insn
|
8898 |
|
|
;; is a left shift double, bits are taken from the high order bits of
|
8899 |
|
|
;; reg, else if the insn is a shift right double, bits are taken from the
|
8900 |
|
|
;; low order bits of reg. So if %eax is "1234" and %edx is "5678",
|
8901 |
|
|
;; "shldl $8,%edx,%eax" leaves %edx unchanged and sets %eax to "2345".
|
8902 |
|
|
;;
|
8903 |
|
|
;; Since sh[lr]d does not change the `reg' operand, that is done
|
8904 |
|
|
;; separately, making all shifts emit pairs of shift double and normal
|
8905 |
|
|
;; shift. Since sh[lr]d does not shift more than 31 bits, and we wish to
|
8906 |
|
|
;; support a 63 bit shift, each shift where the count is in a reg expands
|
8907 |
|
|
;; to a pair of shifts, a branch, a shift by 32 and a label.
|
8908 |
|
|
;;
|
8909 |
|
|
;; If the shift count is a constant, we need never emit more than one
|
8910 |
|
|
;; shift pair, instead using moves and sign extension for counts greater
|
8911 |
|
|
;; than 31.
|
8912 |
|
|
|
8913 |
|
|
(define_expand "ashl3"
|
8914 |
|
|
[(set (match_operand:SDWIM 0 "" "")
|
8915 |
|
|
(ashift:SDWIM (match_operand:SDWIM 1 "" "")
|
8916 |
|
|
(match_operand:QI 2 "nonmemory_operand" "")))]
|
8917 |
|
|
""
|
8918 |
|
|
"ix86_expand_binary_operator (ASHIFT, mode, operands); DONE;")
|
8919 |
|
|
|
8920 |
|
|
(define_insn "*ashl3_doubleword"
|
8921 |
|
|
[(set (match_operand:DWI 0 "register_operand" "=&r,r")
|
8922 |
|
|
(ashift:DWI (match_operand:DWI 1 "reg_or_pm1_operand" "n,0")
|
8923 |
|
|
(match_operand:QI 2 "nonmemory_operand" "c,c")))
|
8924 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8925 |
|
|
""
|
8926 |
|
|
"#"
|
8927 |
|
|
[(set_attr "type" "multi")])
|
8928 |
|
|
|
8929 |
|
|
(define_split
|
8930 |
|
|
[(set (match_operand:DWI 0 "register_operand" "")
|
8931 |
|
|
(ashift:DWI (match_operand:DWI 1 "nonmemory_operand" "")
|
8932 |
|
|
(match_operand:QI 2 "nonmemory_operand" "")))
|
8933 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8934 |
|
|
"(optimize && flag_peephole2) ? epilogue_completed : reload_completed"
|
8935 |
|
|
[(const_int 0)]
|
8936 |
|
|
"ix86_split_ashl (operands, NULL_RTX, mode); DONE;")
|
8937 |
|
|
|
8938 |
|
|
;; By default we don't ask for a scratch register, because when DWImode
|
8939 |
|
|
;; values are manipulated, registers are already at a premium. But if
|
8940 |
|
|
;; we have one handy, we won't turn it away.
|
8941 |
|
|
|
8942 |
|
|
(define_peephole2
|
8943 |
|
|
[(match_scratch:DWIH 3 "r")
|
8944 |
|
|
(parallel [(set (match_operand: 0 "register_operand" "")
|
8945 |
|
|
(ashift:
|
8946 |
|
|
(match_operand: 1 "nonmemory_operand" "")
|
8947 |
|
|
(match_operand:QI 2 "nonmemory_operand" "")))
|
8948 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
8949 |
|
|
(match_dup 3)]
|
8950 |
|
|
"TARGET_CMOVE"
|
8951 |
|
|
[(const_int 0)]
|
8952 |
|
|
"ix86_split_ashl (operands, operands[3], mode); DONE;")
|
8953 |
|
|
|
8954 |
|
|
(define_insn "x86_64_shld"
|
8955 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "+r*m")
|
8956 |
|
|
(ior:DI (ashift:DI (match_dup 0)
|
8957 |
|
|
(match_operand:QI 2 "nonmemory_operand" "Jc"))
|
8958 |
|
|
(lshiftrt:DI (match_operand:DI 1 "register_operand" "r")
|
8959 |
|
|
(minus:QI (const_int 64) (match_dup 2)))))
|
8960 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8961 |
|
|
"TARGET_64BIT"
|
8962 |
|
|
"shld{q}\t{%s2%1, %0|%0, %1, %2}"
|
8963 |
|
|
[(set_attr "type" "ishift")
|
8964 |
|
|
(set_attr "prefix_0f" "1")
|
8965 |
|
|
(set_attr "mode" "DI")
|
8966 |
|
|
(set_attr "athlon_decode" "vector")
|
8967 |
|
|
(set_attr "amdfam10_decode" "vector")
|
8968 |
|
|
(set_attr "bdver1_decode" "vector")])
|
8969 |
|
|
|
8970 |
|
|
(define_insn "x86_shld"
|
8971 |
|
|
[(set (match_operand:SI 0 "nonimmediate_operand" "+r*m")
|
8972 |
|
|
(ior:SI (ashift:SI (match_dup 0)
|
8973 |
|
|
(match_operand:QI 2 "nonmemory_operand" "Ic"))
|
8974 |
|
|
(lshiftrt:SI (match_operand:SI 1 "register_operand" "r")
|
8975 |
|
|
(minus:QI (const_int 32) (match_dup 2)))))
|
8976 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
8977 |
|
|
""
|
8978 |
|
|
"shld{l}\t{%s2%1, %0|%0, %1, %2}"
|
8979 |
|
|
[(set_attr "type" "ishift")
|
8980 |
|
|
(set_attr "prefix_0f" "1")
|
8981 |
|
|
(set_attr "mode" "SI")
|
8982 |
|
|
(set_attr "pent_pair" "np")
|
8983 |
|
|
(set_attr "athlon_decode" "vector")
|
8984 |
|
|
(set_attr "amdfam10_decode" "vector")
|
8985 |
|
|
(set_attr "bdver1_decode" "vector")])
|
8986 |
|
|
|
8987 |
|
|
(define_expand "x86_shift_adj_1"
|
8988 |
|
|
[(set (reg:CCZ FLAGS_REG)
|
8989 |
|
|
(compare:CCZ (and:QI (match_operand:QI 2 "register_operand" "")
|
8990 |
|
|
(match_dup 4))
|
8991 |
|
|
(const_int 0)))
|
8992 |
|
|
(set (match_operand:SWI48 0 "register_operand" "")
|
8993 |
|
|
(if_then_else:SWI48 (ne (reg:CCZ FLAGS_REG) (const_int 0))
|
8994 |
|
|
(match_operand:SWI48 1 "register_operand" "")
|
8995 |
|
|
(match_dup 0)))
|
8996 |
|
|
(set (match_dup 1)
|
8997 |
|
|
(if_then_else:SWI48 (ne (reg:CCZ FLAGS_REG) (const_int 0))
|
8998 |
|
|
(match_operand:SWI48 3 "register_operand" "")
|
8999 |
|
|
(match_dup 1)))]
|
9000 |
|
|
"TARGET_CMOVE"
|
9001 |
|
|
"operands[4] = GEN_INT (GET_MODE_BITSIZE (mode));")
|
9002 |
|
|
|
9003 |
|
|
(define_expand "x86_shift_adj_2"
|
9004 |
|
|
[(use (match_operand:SWI48 0 "register_operand" ""))
|
9005 |
|
|
(use (match_operand:SWI48 1 "register_operand" ""))
|
9006 |
|
|
(use (match_operand:QI 2 "register_operand" ""))]
|
9007 |
|
|
""
|
9008 |
|
|
{
|
9009 |
|
|
rtx label = gen_label_rtx ();
|
9010 |
|
|
rtx tmp;
|
9011 |
|
|
|
9012 |
|
|
emit_insn (gen_testqi_ccz_1 (operands[2],
|
9013 |
|
|
GEN_INT (GET_MODE_BITSIZE (mode))));
|
9014 |
|
|
|
9015 |
|
|
tmp = gen_rtx_REG (CCZmode, FLAGS_REG);
|
9016 |
|
|
tmp = gen_rtx_EQ (VOIDmode, tmp, const0_rtx);
|
9017 |
|
|
tmp = gen_rtx_IF_THEN_ELSE (VOIDmode, tmp,
|
9018 |
|
|
gen_rtx_LABEL_REF (VOIDmode, label),
|
9019 |
|
|
pc_rtx);
|
9020 |
|
|
tmp = emit_jump_insn (gen_rtx_SET (VOIDmode, pc_rtx, tmp));
|
9021 |
|
|
JUMP_LABEL (tmp) = label;
|
9022 |
|
|
|
9023 |
|
|
emit_move_insn (operands[0], operands[1]);
|
9024 |
|
|
ix86_expand_clear (operands[1]);
|
9025 |
|
|
|
9026 |
|
|
emit_label (label);
|
9027 |
|
|
LABEL_NUSES (label) = 1;
|
9028 |
|
|
|
9029 |
|
|
DONE;
|
9030 |
|
|
})
|
9031 |
|
|
|
9032 |
|
|
;; Avoid useless masking of count operand.
|
9033 |
|
|
(define_insn_and_split "*ashl3_mask"
|
9034 |
|
|
[(set (match_operand:SWI48 0 "nonimmediate_operand" "=rm")
|
9035 |
|
|
(ashift:SWI48
|
9036 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "0")
|
9037 |
|
|
(subreg:QI
|
9038 |
|
|
(and:SI
|
9039 |
|
|
(match_operand:SI 2 "nonimmediate_operand" "c")
|
9040 |
|
|
(match_operand:SI 3 "const_int_operand" "n")) 0)))
|
9041 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9042 |
|
|
"ix86_binary_operator_ok (ASHIFT, mode, operands)
|
9043 |
|
|
&& (INTVAL (operands[3]) & (GET_MODE_BITSIZE (mode)-1))
|
9044 |
|
|
== GET_MODE_BITSIZE (mode)-1"
|
9045 |
|
|
"#"
|
9046 |
|
|
"&& 1"
|
9047 |
|
|
[(parallel [(set (match_dup 0)
|
9048 |
|
|
(ashift:SWI48 (match_dup 1) (match_dup 2)))
|
9049 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
9050 |
|
|
{
|
9051 |
|
|
if (can_create_pseudo_p ())
|
9052 |
|
|
operands [2] = force_reg (SImode, operands[2]);
|
9053 |
|
|
|
9054 |
|
|
operands[2] = simplify_gen_subreg (QImode, operands[2], SImode, 0);
|
9055 |
|
|
}
|
9056 |
|
|
[(set_attr "type" "ishift")
|
9057 |
|
|
(set_attr "mode" "")])
|
9058 |
|
|
|
9059 |
|
|
(define_insn "*bmi2_ashl3_1"
|
9060 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
9061 |
|
|
(ashift:SWI48 (match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
9062 |
|
|
(match_operand:SWI48 2 "register_operand" "r")))]
|
9063 |
|
|
"TARGET_BMI2"
|
9064 |
|
|
"shlx\t{%2, %1, %0|%0, %1, %2}"
|
9065 |
|
|
[(set_attr "type" "ishiftx")
|
9066 |
|
|
(set_attr "mode" "")])
|
9067 |
|
|
|
9068 |
|
|
(define_insn "*ashl3_1"
|
9069 |
|
|
[(set (match_operand:SWI48 0 "nonimmediate_operand" "=rm,r,r")
|
9070 |
|
|
(ashift:SWI48 (match_operand:SWI48 1 "nonimmediate_operand" "0,l,rm")
|
9071 |
|
|
(match_operand:QI 2 "nonmemory_operand" "c,M,r")))
|
9072 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9073 |
|
|
"ix86_binary_operator_ok (ASHIFT, mode, operands)"
|
9074 |
|
|
{
|
9075 |
|
|
switch (get_attr_type (insn))
|
9076 |
|
|
{
|
9077 |
|
|
case TYPE_LEA:
|
9078 |
|
|
case TYPE_ISHIFTX:
|
9079 |
|
|
return "#";
|
9080 |
|
|
|
9081 |
|
|
case TYPE_ALU:
|
9082 |
|
|
gcc_assert (operands[2] == const1_rtx);
|
9083 |
|
|
gcc_assert (rtx_equal_p (operands[0], operands[1]));
|
9084 |
|
|
return "add{}\t%0, %0";
|
9085 |
|
|
|
9086 |
|
|
default:
|
9087 |
|
|
if (operands[2] == const1_rtx
|
9088 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9089 |
|
|
return "sal{}\t%0";
|
9090 |
|
|
else
|
9091 |
|
|
return "sal{}\t{%2, %0|%0, %2}";
|
9092 |
|
|
}
|
9093 |
|
|
}
|
9094 |
|
|
[(set_attr "isa" "*,*,bmi2")
|
9095 |
|
|
(set (attr "type")
|
9096 |
|
|
(cond [(eq_attr "alternative" "1")
|
9097 |
|
|
(const_string "lea")
|
9098 |
|
|
(eq_attr "alternative" "2")
|
9099 |
|
|
(const_string "ishiftx")
|
9100 |
|
|
(and (and (match_test "TARGET_DOUBLE_WITH_ADD")
|
9101 |
|
|
(match_operand 0 "register_operand" ""))
|
9102 |
|
|
(match_operand 2 "const1_operand" ""))
|
9103 |
|
|
(const_string "alu")
|
9104 |
|
|
]
|
9105 |
|
|
(const_string "ishift")))
|
9106 |
|
|
(set (attr "length_immediate")
|
9107 |
|
|
(if_then_else
|
9108 |
|
|
(ior (eq_attr "type" "alu")
|
9109 |
|
|
(and (eq_attr "type" "ishift")
|
9110 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9111 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9112 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))))
|
9113 |
|
|
(const_string "0")
|
9114 |
|
|
(const_string "*")))
|
9115 |
|
|
(set_attr "mode" "")])
|
9116 |
|
|
|
9117 |
|
|
;; Convert shift to the shiftx pattern to avoid flags dependency.
|
9118 |
|
|
(define_split
|
9119 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
9120 |
|
|
(ashift:SWI48 (match_operand:SWI48 1 "nonimmediate_operand" "")
|
9121 |
|
|
(match_operand:QI 2 "register_operand" "")))
|
9122 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9123 |
|
|
"TARGET_BMI2 && reload_completed"
|
9124 |
|
|
[(set (match_dup 0)
|
9125 |
|
|
(ashift:SWI48 (match_dup 1) (match_dup 2)))]
|
9126 |
|
|
"operands[2] = gen_lowpart (mode, operands[2]);")
|
9127 |
|
|
|
9128 |
|
|
(define_insn "*bmi2_ashlsi3_1_zext"
|
9129 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
9130 |
|
|
(zero_extend:DI
|
9131 |
|
|
(ashift:SI (match_operand:SI 1 "nonimmediate_operand" "rm")
|
9132 |
|
|
(match_operand:SI 2 "register_operand" "r"))))]
|
9133 |
|
|
"TARGET_64BIT && TARGET_BMI2"
|
9134 |
|
|
"shlx\t{%2, %1, %k0|%k0, %1, %2}"
|
9135 |
|
|
[(set_attr "type" "ishiftx")
|
9136 |
|
|
(set_attr "mode" "SI")])
|
9137 |
|
|
|
9138 |
|
|
(define_insn "*ashlsi3_1_zext"
|
9139 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r,r,r")
|
9140 |
|
|
(zero_extend:DI
|
9141 |
|
|
(ashift:SI (match_operand:SI 1 "nonimmediate_operand" "0,l,rm")
|
9142 |
|
|
(match_operand:QI 2 "nonmemory_operand" "cI,M,r"))))
|
9143 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9144 |
|
|
"TARGET_64BIT && ix86_binary_operator_ok (ASHIFT, SImode, operands)"
|
9145 |
|
|
{
|
9146 |
|
|
switch (get_attr_type (insn))
|
9147 |
|
|
{
|
9148 |
|
|
case TYPE_LEA:
|
9149 |
|
|
case TYPE_ISHIFTX:
|
9150 |
|
|
return "#";
|
9151 |
|
|
|
9152 |
|
|
case TYPE_ALU:
|
9153 |
|
|
gcc_assert (operands[2] == const1_rtx);
|
9154 |
|
|
return "add{l}\t%k0, %k0";
|
9155 |
|
|
|
9156 |
|
|
default:
|
9157 |
|
|
if (operands[2] == const1_rtx
|
9158 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9159 |
|
|
return "sal{l}\t%k0";
|
9160 |
|
|
else
|
9161 |
|
|
return "sal{l}\t{%2, %k0|%k0, %2}";
|
9162 |
|
|
}
|
9163 |
|
|
}
|
9164 |
|
|
[(set_attr "isa" "*,*,bmi2")
|
9165 |
|
|
(set (attr "type")
|
9166 |
|
|
(cond [(eq_attr "alternative" "1")
|
9167 |
|
|
(const_string "lea")
|
9168 |
|
|
(eq_attr "alternative" "2")
|
9169 |
|
|
(const_string "ishiftx")
|
9170 |
|
|
(and (match_test "TARGET_DOUBLE_WITH_ADD")
|
9171 |
|
|
(match_operand 2 "const1_operand" ""))
|
9172 |
|
|
(const_string "alu")
|
9173 |
|
|
]
|
9174 |
|
|
(const_string "ishift")))
|
9175 |
|
|
(set (attr "length_immediate")
|
9176 |
|
|
(if_then_else
|
9177 |
|
|
(ior (eq_attr "type" "alu")
|
9178 |
|
|
(and (eq_attr "type" "ishift")
|
9179 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9180 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9181 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))))
|
9182 |
|
|
(const_string "0")
|
9183 |
|
|
(const_string "*")))
|
9184 |
|
|
(set_attr "mode" "SI")])
|
9185 |
|
|
|
9186 |
|
|
;; Convert shift to the shiftx pattern to avoid flags dependency.
|
9187 |
|
|
(define_split
|
9188 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
9189 |
|
|
(zero_extend:DI
|
9190 |
|
|
(ashift:SI (match_operand:SI 1 "nonimmediate_operand" "")
|
9191 |
|
|
(match_operand:QI 2 "register_operand" ""))))
|
9192 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9193 |
|
|
"TARGET_64BIT && TARGET_BMI2 && reload_completed"
|
9194 |
|
|
[(set (match_dup 0)
|
9195 |
|
|
(zero_extend:DI (ashift:SI (match_dup 1) (match_dup 2))))]
|
9196 |
|
|
"operands[2] = gen_lowpart (SImode, operands[2]);")
|
9197 |
|
|
|
9198 |
|
|
(define_insn "*ashlhi3_1"
|
9199 |
|
|
[(set (match_operand:HI 0 "nonimmediate_operand" "=rm,Yp")
|
9200 |
|
|
(ashift:HI (match_operand:HI 1 "nonimmediate_operand" "0,l")
|
9201 |
|
|
(match_operand:QI 2 "nonmemory_operand" "cI,M")))
|
9202 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9203 |
|
|
"ix86_binary_operator_ok (ASHIFT, HImode, operands)"
|
9204 |
|
|
{
|
9205 |
|
|
switch (get_attr_type (insn))
|
9206 |
|
|
{
|
9207 |
|
|
case TYPE_LEA:
|
9208 |
|
|
return "#";
|
9209 |
|
|
|
9210 |
|
|
case TYPE_ALU:
|
9211 |
|
|
gcc_assert (operands[2] == const1_rtx);
|
9212 |
|
|
return "add{w}\t%0, %0";
|
9213 |
|
|
|
9214 |
|
|
default:
|
9215 |
|
|
if (operands[2] == const1_rtx
|
9216 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9217 |
|
|
return "sal{w}\t%0";
|
9218 |
|
|
else
|
9219 |
|
|
return "sal{w}\t{%2, %0|%0, %2}";
|
9220 |
|
|
}
|
9221 |
|
|
}
|
9222 |
|
|
[(set (attr "type")
|
9223 |
|
|
(cond [(eq_attr "alternative" "1")
|
9224 |
|
|
(const_string "lea")
|
9225 |
|
|
(and (and (match_test "TARGET_DOUBLE_WITH_ADD")
|
9226 |
|
|
(match_operand 0 "register_operand" ""))
|
9227 |
|
|
(match_operand 2 "const1_operand" ""))
|
9228 |
|
|
(const_string "alu")
|
9229 |
|
|
]
|
9230 |
|
|
(const_string "ishift")))
|
9231 |
|
|
(set (attr "length_immediate")
|
9232 |
|
|
(if_then_else
|
9233 |
|
|
(ior (eq_attr "type" "alu")
|
9234 |
|
|
(and (eq_attr "type" "ishift")
|
9235 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9236 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9237 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))))
|
9238 |
|
|
(const_string "0")
|
9239 |
|
|
(const_string "*")))
|
9240 |
|
|
(set_attr "mode" "HI,SI")])
|
9241 |
|
|
|
9242 |
|
|
;; %%% Potential partial reg stall on alternative 1. What to do?
|
9243 |
|
|
(define_insn "*ashlqi3_1"
|
9244 |
|
|
[(set (match_operand:QI 0 "nonimmediate_operand" "=qm,r,Yp")
|
9245 |
|
|
(ashift:QI (match_operand:QI 1 "nonimmediate_operand" "0,0,l")
|
9246 |
|
|
(match_operand:QI 2 "nonmemory_operand" "cI,cI,M")))
|
9247 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9248 |
|
|
"ix86_binary_operator_ok (ASHIFT, QImode, operands)"
|
9249 |
|
|
{
|
9250 |
|
|
switch (get_attr_type (insn))
|
9251 |
|
|
{
|
9252 |
|
|
case TYPE_LEA:
|
9253 |
|
|
return "#";
|
9254 |
|
|
|
9255 |
|
|
case TYPE_ALU:
|
9256 |
|
|
gcc_assert (operands[2] == const1_rtx);
|
9257 |
|
|
if (REG_P (operands[1]) && !ANY_QI_REG_P (operands[1]))
|
9258 |
|
|
return "add{l}\t%k0, %k0";
|
9259 |
|
|
else
|
9260 |
|
|
return "add{b}\t%0, %0";
|
9261 |
|
|
|
9262 |
|
|
default:
|
9263 |
|
|
if (operands[2] == const1_rtx
|
9264 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9265 |
|
|
{
|
9266 |
|
|
if (get_attr_mode (insn) == MODE_SI)
|
9267 |
|
|
return "sal{l}\t%k0";
|
9268 |
|
|
else
|
9269 |
|
|
return "sal{b}\t%0";
|
9270 |
|
|
}
|
9271 |
|
|
else
|
9272 |
|
|
{
|
9273 |
|
|
if (get_attr_mode (insn) == MODE_SI)
|
9274 |
|
|
return "sal{l}\t{%2, %k0|%k0, %2}";
|
9275 |
|
|
else
|
9276 |
|
|
return "sal{b}\t{%2, %0|%0, %2}";
|
9277 |
|
|
}
|
9278 |
|
|
}
|
9279 |
|
|
}
|
9280 |
|
|
[(set (attr "type")
|
9281 |
|
|
(cond [(eq_attr "alternative" "2")
|
9282 |
|
|
(const_string "lea")
|
9283 |
|
|
(and (and (match_test "TARGET_DOUBLE_WITH_ADD")
|
9284 |
|
|
(match_operand 0 "register_operand" ""))
|
9285 |
|
|
(match_operand 2 "const1_operand" ""))
|
9286 |
|
|
(const_string "alu")
|
9287 |
|
|
]
|
9288 |
|
|
(const_string "ishift")))
|
9289 |
|
|
(set (attr "length_immediate")
|
9290 |
|
|
(if_then_else
|
9291 |
|
|
(ior (eq_attr "type" "alu")
|
9292 |
|
|
(and (eq_attr "type" "ishift")
|
9293 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9294 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9295 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))))
|
9296 |
|
|
(const_string "0")
|
9297 |
|
|
(const_string "*")))
|
9298 |
|
|
(set_attr "mode" "QI,SI,SI")])
|
9299 |
|
|
|
9300 |
|
|
(define_insn "*ashlqi3_1_slp"
|
9301 |
|
|
[(set (strict_low_part (match_operand:QI 0 "nonimmediate_operand" "+qm"))
|
9302 |
|
|
(ashift:QI (match_dup 0)
|
9303 |
|
|
(match_operand:QI 1 "nonmemory_operand" "cI")))
|
9304 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9305 |
|
|
"(optimize_function_for_size_p (cfun)
|
9306 |
|
|
|| !TARGET_PARTIAL_FLAG_REG_STALL
|
9307 |
|
|
|| (operands[1] == const1_rtx
|
9308 |
|
|
&& (TARGET_SHIFT1
|
9309 |
|
|
|| (TARGET_DOUBLE_WITH_ADD && REG_P (operands[0])))))"
|
9310 |
|
|
{
|
9311 |
|
|
switch (get_attr_type (insn))
|
9312 |
|
|
{
|
9313 |
|
|
case TYPE_ALU:
|
9314 |
|
|
gcc_assert (operands[1] == const1_rtx);
|
9315 |
|
|
return "add{b}\t%0, %0";
|
9316 |
|
|
|
9317 |
|
|
default:
|
9318 |
|
|
if (operands[1] == const1_rtx
|
9319 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9320 |
|
|
return "sal{b}\t%0";
|
9321 |
|
|
else
|
9322 |
|
|
return "sal{b}\t{%1, %0|%0, %1}";
|
9323 |
|
|
}
|
9324 |
|
|
}
|
9325 |
|
|
[(set (attr "type")
|
9326 |
|
|
(cond [(and (and (match_test "TARGET_DOUBLE_WITH_ADD")
|
9327 |
|
|
(match_operand 0 "register_operand" ""))
|
9328 |
|
|
(match_operand 1 "const1_operand" ""))
|
9329 |
|
|
(const_string "alu")
|
9330 |
|
|
]
|
9331 |
|
|
(const_string "ishift1")))
|
9332 |
|
|
(set (attr "length_immediate")
|
9333 |
|
|
(if_then_else
|
9334 |
|
|
(ior (eq_attr "type" "alu")
|
9335 |
|
|
(and (eq_attr "type" "ishift1")
|
9336 |
|
|
(and (match_operand 1 "const1_operand" "")
|
9337 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9338 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))))
|
9339 |
|
|
(const_string "0")
|
9340 |
|
|
(const_string "*")))
|
9341 |
|
|
(set_attr "mode" "QI")])
|
9342 |
|
|
|
9343 |
|
|
;; Convert ashift to the lea pattern to avoid flags dependency.
|
9344 |
|
|
(define_split
|
9345 |
|
|
[(set (match_operand 0 "register_operand" "")
|
9346 |
|
|
(ashift (match_operand 1 "index_register_operand" "")
|
9347 |
|
|
(match_operand:QI 2 "const_int_operand" "")))
|
9348 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9349 |
|
|
"GET_MODE (operands[0]) == GET_MODE (operands[1])
|
9350 |
|
|
&& reload_completed
|
9351 |
|
|
&& true_regnum (operands[0]) != true_regnum (operands[1])"
|
9352 |
|
|
[(const_int 0)]
|
9353 |
|
|
{
|
9354 |
|
|
enum machine_mode mode = GET_MODE (operands[0]);
|
9355 |
|
|
rtx pat;
|
9356 |
|
|
|
9357 |
|
|
if (GET_MODE_SIZE (mode) < GET_MODE_SIZE (SImode))
|
9358 |
|
|
{
|
9359 |
|
|
mode = SImode;
|
9360 |
|
|
operands[0] = gen_lowpart (mode, operands[0]);
|
9361 |
|
|
operands[1] = gen_lowpart (mode, operands[1]);
|
9362 |
|
|
}
|
9363 |
|
|
|
9364 |
|
|
operands[2] = gen_int_mode (1 << INTVAL (operands[2]), mode);
|
9365 |
|
|
|
9366 |
|
|
pat = gen_rtx_MULT (mode, operands[1], operands[2]);
|
9367 |
|
|
|
9368 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0], pat));
|
9369 |
|
|
DONE;
|
9370 |
|
|
})
|
9371 |
|
|
|
9372 |
|
|
;; Convert ashift to the lea pattern to avoid flags dependency.
|
9373 |
|
|
(define_split
|
9374 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
9375 |
|
|
(zero_extend:DI
|
9376 |
|
|
(ashift:SI (match_operand:SI 1 "index_register_operand" "")
|
9377 |
|
|
(match_operand:QI 2 "const_int_operand" ""))))
|
9378 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9379 |
|
|
"TARGET_64BIT && reload_completed
|
9380 |
|
|
&& true_regnum (operands[0]) != true_regnum (operands[1])"
|
9381 |
|
|
[(set (match_dup 0)
|
9382 |
|
|
(zero_extend:DI (subreg:SI (mult:DI (match_dup 1) (match_dup 2)) 0)))]
|
9383 |
|
|
{
|
9384 |
|
|
operands[1] = gen_lowpart (DImode, operands[1]);
|
9385 |
|
|
operands[2] = gen_int_mode (1 << INTVAL (operands[2]), DImode);
|
9386 |
|
|
})
|
9387 |
|
|
|
9388 |
|
|
;; This pattern can't accept a variable shift count, since shifts by
|
9389 |
|
|
;; zero don't affect the flags. We assume that shifts by constant
|
9390 |
|
|
;; zero are optimized away.
|
9391 |
|
|
(define_insn "*ashl3_cmp"
|
9392 |
|
|
[(set (reg FLAGS_REG)
|
9393 |
|
|
(compare
|
9394 |
|
|
(ashift:SWI (match_operand:SWI 1 "nonimmediate_operand" "0")
|
9395 |
|
|
(match_operand:QI 2 "" ""))
|
9396 |
|
|
(const_int 0)))
|
9397 |
|
|
(set (match_operand:SWI 0 "nonimmediate_operand" "=m")
|
9398 |
|
|
(ashift:SWI (match_dup 1) (match_dup 2)))]
|
9399 |
|
|
"(optimize_function_for_size_p (cfun)
|
9400 |
|
|
|| !TARGET_PARTIAL_FLAG_REG_STALL
|
9401 |
|
|
|| (operands[2] == const1_rtx
|
9402 |
|
|
&& (TARGET_SHIFT1
|
9403 |
|
|
|| (TARGET_DOUBLE_WITH_ADD && REG_P (operands[0])))))
|
9404 |
|
|
&& ix86_match_ccmode (insn, CCGOCmode)
|
9405 |
|
|
&& ix86_binary_operator_ok (ASHIFT, mode, operands)"
|
9406 |
|
|
{
|
9407 |
|
|
switch (get_attr_type (insn))
|
9408 |
|
|
{
|
9409 |
|
|
case TYPE_ALU:
|
9410 |
|
|
gcc_assert (operands[2] == const1_rtx);
|
9411 |
|
|
return "add{}\t%0, %0";
|
9412 |
|
|
|
9413 |
|
|
default:
|
9414 |
|
|
if (operands[2] == const1_rtx
|
9415 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9416 |
|
|
return "sal{}\t%0";
|
9417 |
|
|
else
|
9418 |
|
|
return "sal{}\t{%2, %0|%0, %2}";
|
9419 |
|
|
}
|
9420 |
|
|
}
|
9421 |
|
|
[(set (attr "type")
|
9422 |
|
|
(cond [(and (and (match_test "TARGET_DOUBLE_WITH_ADD")
|
9423 |
|
|
(match_operand 0 "register_operand" ""))
|
9424 |
|
|
(match_operand 2 "const1_operand" ""))
|
9425 |
|
|
(const_string "alu")
|
9426 |
|
|
]
|
9427 |
|
|
(const_string "ishift")))
|
9428 |
|
|
(set (attr "length_immediate")
|
9429 |
|
|
(if_then_else
|
9430 |
|
|
(ior (eq_attr "type" "alu")
|
9431 |
|
|
(and (eq_attr "type" "ishift")
|
9432 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9433 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9434 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))))
|
9435 |
|
|
(const_string "0")
|
9436 |
|
|
(const_string "*")))
|
9437 |
|
|
(set_attr "mode" "")])
|
9438 |
|
|
|
9439 |
|
|
(define_insn "*ashlsi3_cmp_zext"
|
9440 |
|
|
[(set (reg FLAGS_REG)
|
9441 |
|
|
(compare
|
9442 |
|
|
(ashift:SI (match_operand:SI 1 "register_operand" "0")
|
9443 |
|
|
(match_operand:QI 2 "const_1_to_31_operand" "I"))
|
9444 |
|
|
(const_int 0)))
|
9445 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
9446 |
|
|
(zero_extend:DI (ashift:SI (match_dup 1) (match_dup 2))))]
|
9447 |
|
|
"TARGET_64BIT
|
9448 |
|
|
&& (optimize_function_for_size_p (cfun)
|
9449 |
|
|
|| !TARGET_PARTIAL_FLAG_REG_STALL
|
9450 |
|
|
|| (operands[2] == const1_rtx
|
9451 |
|
|
&& (TARGET_SHIFT1
|
9452 |
|
|
|| TARGET_DOUBLE_WITH_ADD)))
|
9453 |
|
|
&& ix86_match_ccmode (insn, CCGOCmode)
|
9454 |
|
|
&& ix86_binary_operator_ok (ASHIFT, SImode, operands)"
|
9455 |
|
|
{
|
9456 |
|
|
switch (get_attr_type (insn))
|
9457 |
|
|
{
|
9458 |
|
|
case TYPE_ALU:
|
9459 |
|
|
gcc_assert (operands[2] == const1_rtx);
|
9460 |
|
|
return "add{l}\t%k0, %k0";
|
9461 |
|
|
|
9462 |
|
|
default:
|
9463 |
|
|
if (operands[2] == const1_rtx
|
9464 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9465 |
|
|
return "sal{l}\t%k0";
|
9466 |
|
|
else
|
9467 |
|
|
return "sal{l}\t{%2, %k0|%k0, %2}";
|
9468 |
|
|
}
|
9469 |
|
|
}
|
9470 |
|
|
[(set (attr "type")
|
9471 |
|
|
(cond [(and (match_test "TARGET_DOUBLE_WITH_ADD")
|
9472 |
|
|
(match_operand 2 "const1_operand" ""))
|
9473 |
|
|
(const_string "alu")
|
9474 |
|
|
]
|
9475 |
|
|
(const_string "ishift")))
|
9476 |
|
|
(set (attr "length_immediate")
|
9477 |
|
|
(if_then_else
|
9478 |
|
|
(ior (eq_attr "type" "alu")
|
9479 |
|
|
(and (eq_attr "type" "ishift")
|
9480 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9481 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9482 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))))
|
9483 |
|
|
(const_string "0")
|
9484 |
|
|
(const_string "*")))
|
9485 |
|
|
(set_attr "mode" "SI")])
|
9486 |
|
|
|
9487 |
|
|
(define_insn "*ashl3_cconly"
|
9488 |
|
|
[(set (reg FLAGS_REG)
|
9489 |
|
|
(compare
|
9490 |
|
|
(ashift:SWI (match_operand:SWI 1 "register_operand" "0")
|
9491 |
|
|
(match_operand:QI 2 "" ""))
|
9492 |
|
|
(const_int 0)))
|
9493 |
|
|
(clobber (match_scratch:SWI 0 "="))]
|
9494 |
|
|
"(optimize_function_for_size_p (cfun)
|
9495 |
|
|
|| !TARGET_PARTIAL_FLAG_REG_STALL
|
9496 |
|
|
|| (operands[2] == const1_rtx
|
9497 |
|
|
&& (TARGET_SHIFT1
|
9498 |
|
|
|| TARGET_DOUBLE_WITH_ADD)))
|
9499 |
|
|
&& ix86_match_ccmode (insn, CCGOCmode)"
|
9500 |
|
|
{
|
9501 |
|
|
switch (get_attr_type (insn))
|
9502 |
|
|
{
|
9503 |
|
|
case TYPE_ALU:
|
9504 |
|
|
gcc_assert (operands[2] == const1_rtx);
|
9505 |
|
|
return "add{}\t%0, %0";
|
9506 |
|
|
|
9507 |
|
|
default:
|
9508 |
|
|
if (operands[2] == const1_rtx
|
9509 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9510 |
|
|
return "sal{}\t%0";
|
9511 |
|
|
else
|
9512 |
|
|
return "sal{}\t{%2, %0|%0, %2}";
|
9513 |
|
|
}
|
9514 |
|
|
}
|
9515 |
|
|
[(set (attr "type")
|
9516 |
|
|
(cond [(and (and (match_test "TARGET_DOUBLE_WITH_ADD")
|
9517 |
|
|
(match_operand 0 "register_operand" ""))
|
9518 |
|
|
(match_operand 2 "const1_operand" ""))
|
9519 |
|
|
(const_string "alu")
|
9520 |
|
|
]
|
9521 |
|
|
(const_string "ishift")))
|
9522 |
|
|
(set (attr "length_immediate")
|
9523 |
|
|
(if_then_else
|
9524 |
|
|
(ior (eq_attr "type" "alu")
|
9525 |
|
|
(and (eq_attr "type" "ishift")
|
9526 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9527 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9528 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))))
|
9529 |
|
|
(const_string "0")
|
9530 |
|
|
(const_string "*")))
|
9531 |
|
|
(set_attr "mode" "")])
|
9532 |
|
|
|
9533 |
|
|
;; See comment above `ashl3' about how this works.
|
9534 |
|
|
|
9535 |
|
|
(define_expand "3"
|
9536 |
|
|
[(set (match_operand:SDWIM 0 "" "")
|
9537 |
|
|
(any_shiftrt:SDWIM (match_operand:SDWIM 1 "" "")
|
9538 |
|
|
(match_operand:QI 2 "nonmemory_operand" "")))]
|
9539 |
|
|
""
|
9540 |
|
|
"ix86_expand_binary_operator (, mode, operands); DONE;")
|
9541 |
|
|
|
9542 |
|
|
;; Avoid useless masking of count operand.
|
9543 |
|
|
(define_insn_and_split "*3_mask"
|
9544 |
|
|
[(set (match_operand:SWI48 0 "nonimmediate_operand" "=rm")
|
9545 |
|
|
(any_shiftrt:SWI48
|
9546 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "0")
|
9547 |
|
|
(subreg:QI
|
9548 |
|
|
(and:SI
|
9549 |
|
|
(match_operand:SI 2 "nonimmediate_operand" "c")
|
9550 |
|
|
(match_operand:SI 3 "const_int_operand" "n")) 0)))
|
9551 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9552 |
|
|
"ix86_binary_operator_ok (, mode, operands)
|
9553 |
|
|
&& (INTVAL (operands[3]) & (GET_MODE_BITSIZE (mode)-1))
|
9554 |
|
|
== GET_MODE_BITSIZE (mode)-1"
|
9555 |
|
|
"#"
|
9556 |
|
|
"&& 1"
|
9557 |
|
|
[(parallel [(set (match_dup 0)
|
9558 |
|
|
(any_shiftrt:SWI48 (match_dup 1) (match_dup 2)))
|
9559 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
9560 |
|
|
{
|
9561 |
|
|
if (can_create_pseudo_p ())
|
9562 |
|
|
operands [2] = force_reg (SImode, operands[2]);
|
9563 |
|
|
|
9564 |
|
|
operands[2] = simplify_gen_subreg (QImode, operands[2], SImode, 0);
|
9565 |
|
|
}
|
9566 |
|
|
[(set_attr "type" "ishift")
|
9567 |
|
|
(set_attr "mode" "")])
|
9568 |
|
|
|
9569 |
|
|
(define_insn_and_split "*3_doubleword"
|
9570 |
|
|
[(set (match_operand:DWI 0 "register_operand" "=r")
|
9571 |
|
|
(any_shiftrt:DWI (match_operand:DWI 1 "register_operand" "0")
|
9572 |
|
|
(match_operand:QI 2 "nonmemory_operand" "c")))
|
9573 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9574 |
|
|
""
|
9575 |
|
|
"#"
|
9576 |
|
|
"(optimize && flag_peephole2) ? epilogue_completed : reload_completed"
|
9577 |
|
|
[(const_int 0)]
|
9578 |
|
|
"ix86_split_ (operands, NULL_RTX, mode); DONE;"
|
9579 |
|
|
[(set_attr "type" "multi")])
|
9580 |
|
|
|
9581 |
|
|
;; By default we don't ask for a scratch register, because when DWImode
|
9582 |
|
|
;; values are manipulated, registers are already at a premium. But if
|
9583 |
|
|
;; we have one handy, we won't turn it away.
|
9584 |
|
|
|
9585 |
|
|
(define_peephole2
|
9586 |
|
|
[(match_scratch:DWIH 3 "r")
|
9587 |
|
|
(parallel [(set (match_operand: 0 "register_operand" "")
|
9588 |
|
|
(any_shiftrt:
|
9589 |
|
|
(match_operand: 1 "register_operand" "")
|
9590 |
|
|
(match_operand:QI 2 "nonmemory_operand" "")))
|
9591 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
9592 |
|
|
(match_dup 3)]
|
9593 |
|
|
"TARGET_CMOVE"
|
9594 |
|
|
[(const_int 0)]
|
9595 |
|
|
"ix86_split_ (operands, operands[3], mode); DONE;")
|
9596 |
|
|
|
9597 |
|
|
(define_insn "x86_64_shrd"
|
9598 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "+r*m")
|
9599 |
|
|
(ior:DI (ashiftrt:DI (match_dup 0)
|
9600 |
|
|
(match_operand:QI 2 "nonmemory_operand" "Jc"))
|
9601 |
|
|
(ashift:DI (match_operand:DI 1 "register_operand" "r")
|
9602 |
|
|
(minus:QI (const_int 64) (match_dup 2)))))
|
9603 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9604 |
|
|
"TARGET_64BIT"
|
9605 |
|
|
"shrd{q}\t{%s2%1, %0|%0, %1, %2}"
|
9606 |
|
|
[(set_attr "type" "ishift")
|
9607 |
|
|
(set_attr "prefix_0f" "1")
|
9608 |
|
|
(set_attr "mode" "DI")
|
9609 |
|
|
(set_attr "athlon_decode" "vector")
|
9610 |
|
|
(set_attr "amdfam10_decode" "vector")
|
9611 |
|
|
(set_attr "bdver1_decode" "vector")])
|
9612 |
|
|
|
9613 |
|
|
(define_insn "x86_shrd"
|
9614 |
|
|
[(set (match_operand:SI 0 "nonimmediate_operand" "+r*m")
|
9615 |
|
|
(ior:SI (ashiftrt:SI (match_dup 0)
|
9616 |
|
|
(match_operand:QI 2 "nonmemory_operand" "Ic"))
|
9617 |
|
|
(ashift:SI (match_operand:SI 1 "register_operand" "r")
|
9618 |
|
|
(minus:QI (const_int 32) (match_dup 2)))))
|
9619 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9620 |
|
|
""
|
9621 |
|
|
"shrd{l}\t{%s2%1, %0|%0, %1, %2}"
|
9622 |
|
|
[(set_attr "type" "ishift")
|
9623 |
|
|
(set_attr "prefix_0f" "1")
|
9624 |
|
|
(set_attr "mode" "SI")
|
9625 |
|
|
(set_attr "pent_pair" "np")
|
9626 |
|
|
(set_attr "athlon_decode" "vector")
|
9627 |
|
|
(set_attr "amdfam10_decode" "vector")
|
9628 |
|
|
(set_attr "bdver1_decode" "vector")])
|
9629 |
|
|
|
9630 |
|
|
(define_insn "ashrdi3_cvt"
|
9631 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "=*d,rm")
|
9632 |
|
|
(ashiftrt:DI (match_operand:DI 1 "nonimmediate_operand" "*a,0")
|
9633 |
|
|
(match_operand:QI 2 "const_int_operand" "")))
|
9634 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9635 |
|
|
"TARGET_64BIT && INTVAL (operands[2]) == 63
|
9636 |
|
|
&& (TARGET_USE_CLTD || optimize_function_for_size_p (cfun))
|
9637 |
|
|
&& ix86_binary_operator_ok (ASHIFTRT, DImode, operands)"
|
9638 |
|
|
"@
|
9639 |
|
|
{cqto|cqo}
|
9640 |
|
|
sar{q}\t{%2, %0|%0, %2}"
|
9641 |
|
|
[(set_attr "type" "imovx,ishift")
|
9642 |
|
|
(set_attr "prefix_0f" "0,*")
|
9643 |
|
|
(set_attr "length_immediate" "0,*")
|
9644 |
|
|
(set_attr "modrm" "0,1")
|
9645 |
|
|
(set_attr "mode" "DI")])
|
9646 |
|
|
|
9647 |
|
|
(define_insn "ashrsi3_cvt"
|
9648 |
|
|
[(set (match_operand:SI 0 "nonimmediate_operand" "=*d,rm")
|
9649 |
|
|
(ashiftrt:SI (match_operand:SI 1 "nonimmediate_operand" "*a,0")
|
9650 |
|
|
(match_operand:QI 2 "const_int_operand" "")))
|
9651 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9652 |
|
|
"INTVAL (operands[2]) == 31
|
9653 |
|
|
&& (TARGET_USE_CLTD || optimize_function_for_size_p (cfun))
|
9654 |
|
|
&& ix86_binary_operator_ok (ASHIFTRT, SImode, operands)"
|
9655 |
|
|
"@
|
9656 |
|
|
{cltd|cdq}
|
9657 |
|
|
sar{l}\t{%2, %0|%0, %2}"
|
9658 |
|
|
[(set_attr "type" "imovx,ishift")
|
9659 |
|
|
(set_attr "prefix_0f" "0,*")
|
9660 |
|
|
(set_attr "length_immediate" "0,*")
|
9661 |
|
|
(set_attr "modrm" "0,1")
|
9662 |
|
|
(set_attr "mode" "SI")])
|
9663 |
|
|
|
9664 |
|
|
(define_insn "*ashrsi3_cvt_zext"
|
9665 |
|
|
[(set (match_operand:DI 0 "register_operand" "=*d,r")
|
9666 |
|
|
(zero_extend:DI
|
9667 |
|
|
(ashiftrt:SI (match_operand:SI 1 "register_operand" "*a,0")
|
9668 |
|
|
(match_operand:QI 2 "const_int_operand" ""))))
|
9669 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9670 |
|
|
"TARGET_64BIT && INTVAL (operands[2]) == 31
|
9671 |
|
|
&& (TARGET_USE_CLTD || optimize_function_for_size_p (cfun))
|
9672 |
|
|
&& ix86_binary_operator_ok (ASHIFTRT, SImode, operands)"
|
9673 |
|
|
"@
|
9674 |
|
|
{cltd|cdq}
|
9675 |
|
|
sar{l}\t{%2, %k0|%k0, %2}"
|
9676 |
|
|
[(set_attr "type" "imovx,ishift")
|
9677 |
|
|
(set_attr "prefix_0f" "0,*")
|
9678 |
|
|
(set_attr "length_immediate" "0,*")
|
9679 |
|
|
(set_attr "modrm" "0,1")
|
9680 |
|
|
(set_attr "mode" "SI")])
|
9681 |
|
|
|
9682 |
|
|
(define_expand "x86_shift_adj_3"
|
9683 |
|
|
[(use (match_operand:SWI48 0 "register_operand" ""))
|
9684 |
|
|
(use (match_operand:SWI48 1 "register_operand" ""))
|
9685 |
|
|
(use (match_operand:QI 2 "register_operand" ""))]
|
9686 |
|
|
""
|
9687 |
|
|
{
|
9688 |
|
|
rtx label = gen_label_rtx ();
|
9689 |
|
|
rtx tmp;
|
9690 |
|
|
|
9691 |
|
|
emit_insn (gen_testqi_ccz_1 (operands[2],
|
9692 |
|
|
GEN_INT (GET_MODE_BITSIZE (mode))));
|
9693 |
|
|
|
9694 |
|
|
tmp = gen_rtx_REG (CCZmode, FLAGS_REG);
|
9695 |
|
|
tmp = gen_rtx_EQ (VOIDmode, tmp, const0_rtx);
|
9696 |
|
|
tmp = gen_rtx_IF_THEN_ELSE (VOIDmode, tmp,
|
9697 |
|
|
gen_rtx_LABEL_REF (VOIDmode, label),
|
9698 |
|
|
pc_rtx);
|
9699 |
|
|
tmp = emit_jump_insn (gen_rtx_SET (VOIDmode, pc_rtx, tmp));
|
9700 |
|
|
JUMP_LABEL (tmp) = label;
|
9701 |
|
|
|
9702 |
|
|
emit_move_insn (operands[0], operands[1]);
|
9703 |
|
|
emit_insn (gen_ashr3_cvt (operands[1], operands[1],
|
9704 |
|
|
GEN_INT (GET_MODE_BITSIZE (mode)-1)));
|
9705 |
|
|
emit_label (label);
|
9706 |
|
|
LABEL_NUSES (label) = 1;
|
9707 |
|
|
|
9708 |
|
|
DONE;
|
9709 |
|
|
})
|
9710 |
|
|
|
9711 |
|
|
(define_insn "*bmi2_3_1"
|
9712 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
9713 |
|
|
(any_shiftrt:SWI48 (match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
9714 |
|
|
(match_operand:SWI48 2 "register_operand" "r")))]
|
9715 |
|
|
"TARGET_BMI2"
|
9716 |
|
|
"x\t{%2, %1, %0|%0, %1, %2}"
|
9717 |
|
|
[(set_attr "type" "ishiftx")
|
9718 |
|
|
(set_attr "mode" "")])
|
9719 |
|
|
|
9720 |
|
|
(define_insn "*3_1"
|
9721 |
|
|
[(set (match_operand:SWI48 0 "nonimmediate_operand" "=rm,r")
|
9722 |
|
|
(any_shiftrt:SWI48
|
9723 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "0,rm")
|
9724 |
|
|
(match_operand:QI 2 "nonmemory_operand" "c,r")))
|
9725 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9726 |
|
|
"ix86_binary_operator_ok (, mode, operands)"
|
9727 |
|
|
{
|
9728 |
|
|
switch (get_attr_type (insn))
|
9729 |
|
|
{
|
9730 |
|
|
case TYPE_ISHIFTX:
|
9731 |
|
|
return "#";
|
9732 |
|
|
|
9733 |
|
|
default:
|
9734 |
|
|
if (operands[2] == const1_rtx
|
9735 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9736 |
|
|
return "{}\t%0";
|
9737 |
|
|
else
|
9738 |
|
|
return "{}\t{%2, %0|%0, %2}";
|
9739 |
|
|
}
|
9740 |
|
|
}
|
9741 |
|
|
[(set_attr "isa" "*,bmi2")
|
9742 |
|
|
(set_attr "type" "ishift,ishiftx")
|
9743 |
|
|
(set (attr "length_immediate")
|
9744 |
|
|
(if_then_else
|
9745 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9746 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9747 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))
|
9748 |
|
|
(const_string "0")
|
9749 |
|
|
(const_string "*")))
|
9750 |
|
|
(set_attr "mode" "")])
|
9751 |
|
|
|
9752 |
|
|
;; Convert shift to the shiftx pattern to avoid flags dependency.
|
9753 |
|
|
(define_split
|
9754 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
9755 |
|
|
(any_shiftrt:SWI48 (match_operand:SWI48 1 "nonimmediate_operand" "")
|
9756 |
|
|
(match_operand:QI 2 "register_operand" "")))
|
9757 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9758 |
|
|
"TARGET_BMI2 && reload_completed"
|
9759 |
|
|
[(set (match_dup 0)
|
9760 |
|
|
(any_shiftrt:SWI48 (match_dup 1) (match_dup 2)))]
|
9761 |
|
|
"operands[2] = gen_lowpart (mode, operands[2]);")
|
9762 |
|
|
|
9763 |
|
|
(define_insn "*bmi2_si3_1_zext"
|
9764 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
9765 |
|
|
(zero_extend:DI
|
9766 |
|
|
(any_shiftrt:SI (match_operand:SI 1 "nonimmediate_operand" "rm")
|
9767 |
|
|
(match_operand:SI 2 "register_operand" "r"))))]
|
9768 |
|
|
"TARGET_64BIT && TARGET_BMI2"
|
9769 |
|
|
"x\t{%2, %1, %k0|%k0, %1, %2}"
|
9770 |
|
|
[(set_attr "type" "ishiftx")
|
9771 |
|
|
(set_attr "mode" "SI")])
|
9772 |
|
|
|
9773 |
|
|
(define_insn "*si3_1_zext"
|
9774 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r,r")
|
9775 |
|
|
(zero_extend:DI
|
9776 |
|
|
(any_shiftrt:SI (match_operand:SI 1 "nonimmediate_operand" "0,rm")
|
9777 |
|
|
(match_operand:QI 2 "nonmemory_operand" "cI,r"))))
|
9778 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9779 |
|
|
"TARGET_64BIT && ix86_binary_operator_ok (, SImode, operands)"
|
9780 |
|
|
{
|
9781 |
|
|
switch (get_attr_type (insn))
|
9782 |
|
|
{
|
9783 |
|
|
case TYPE_ISHIFTX:
|
9784 |
|
|
return "#";
|
9785 |
|
|
|
9786 |
|
|
default:
|
9787 |
|
|
if (operands[2] == const1_rtx
|
9788 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9789 |
|
|
return "{l}\t%k0";
|
9790 |
|
|
else
|
9791 |
|
|
return "{l}\t{%2, %k0|%k0, %2}";
|
9792 |
|
|
}
|
9793 |
|
|
}
|
9794 |
|
|
[(set_attr "isa" "*,bmi2")
|
9795 |
|
|
(set_attr "type" "ishift,ishiftx")
|
9796 |
|
|
(set (attr "length_immediate")
|
9797 |
|
|
(if_then_else
|
9798 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9799 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9800 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))
|
9801 |
|
|
(const_string "0")
|
9802 |
|
|
(const_string "*")))
|
9803 |
|
|
(set_attr "mode" "SI")])
|
9804 |
|
|
|
9805 |
|
|
;; Convert shift to the shiftx pattern to avoid flags dependency.
|
9806 |
|
|
(define_split
|
9807 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
9808 |
|
|
(zero_extend:DI
|
9809 |
|
|
(any_shiftrt:SI (match_operand:SI 1 "nonimmediate_operand" "")
|
9810 |
|
|
(match_operand:QI 2 "register_operand" ""))))
|
9811 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9812 |
|
|
"TARGET_64BIT && TARGET_BMI2 && reload_completed"
|
9813 |
|
|
[(set (match_dup 0)
|
9814 |
|
|
(zero_extend:DI (any_shiftrt:SI (match_dup 1) (match_dup 2))))]
|
9815 |
|
|
"operands[2] = gen_lowpart (SImode, operands[2]);")
|
9816 |
|
|
|
9817 |
|
|
(define_insn "*3_1"
|
9818 |
|
|
[(set (match_operand:SWI12 0 "nonimmediate_operand" "=m")
|
9819 |
|
|
(any_shiftrt:SWI12
|
9820 |
|
|
(match_operand:SWI12 1 "nonimmediate_operand" "0")
|
9821 |
|
|
(match_operand:QI 2 "nonmemory_operand" "c")))
|
9822 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9823 |
|
|
"ix86_binary_operator_ok (, mode, operands)"
|
9824 |
|
|
{
|
9825 |
|
|
if (operands[2] == const1_rtx
|
9826 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9827 |
|
|
return "{}\t%0";
|
9828 |
|
|
else
|
9829 |
|
|
return "{}\t{%2, %0|%0, %2}";
|
9830 |
|
|
}
|
9831 |
|
|
[(set_attr "type" "ishift")
|
9832 |
|
|
(set (attr "length_immediate")
|
9833 |
|
|
(if_then_else
|
9834 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9835 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9836 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))
|
9837 |
|
|
(const_string "0")
|
9838 |
|
|
(const_string "*")))
|
9839 |
|
|
(set_attr "mode" "")])
|
9840 |
|
|
|
9841 |
|
|
(define_insn "*qi3_1_slp"
|
9842 |
|
|
[(set (strict_low_part (match_operand:QI 0 "nonimmediate_operand" "+qm"))
|
9843 |
|
|
(any_shiftrt:QI (match_dup 0)
|
9844 |
|
|
(match_operand:QI 1 "nonmemory_operand" "cI")))
|
9845 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
9846 |
|
|
"(optimize_function_for_size_p (cfun)
|
9847 |
|
|
|| !TARGET_PARTIAL_REG_STALL
|
9848 |
|
|
|| (operands[1] == const1_rtx
|
9849 |
|
|
&& TARGET_SHIFT1))"
|
9850 |
|
|
{
|
9851 |
|
|
if (operands[1] == const1_rtx
|
9852 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9853 |
|
|
return "{b}\t%0";
|
9854 |
|
|
else
|
9855 |
|
|
return "{b}\t{%1, %0|%0, %1}";
|
9856 |
|
|
}
|
9857 |
|
|
[(set_attr "type" "ishift1")
|
9858 |
|
|
(set (attr "length_immediate")
|
9859 |
|
|
(if_then_else
|
9860 |
|
|
(and (match_operand 1 "const1_operand" "")
|
9861 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9862 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))
|
9863 |
|
|
(const_string "0")
|
9864 |
|
|
(const_string "*")))
|
9865 |
|
|
(set_attr "mode" "QI")])
|
9866 |
|
|
|
9867 |
|
|
;; This pattern can't accept a variable shift count, since shifts by
|
9868 |
|
|
;; zero don't affect the flags. We assume that shifts by constant
|
9869 |
|
|
;; zero are optimized away.
|
9870 |
|
|
(define_insn "*3_cmp"
|
9871 |
|
|
[(set (reg FLAGS_REG)
|
9872 |
|
|
(compare
|
9873 |
|
|
(any_shiftrt:SWI
|
9874 |
|
|
(match_operand:SWI 1 "nonimmediate_operand" "0")
|
9875 |
|
|
(match_operand:QI 2 "" ""))
|
9876 |
|
|
(const_int 0)))
|
9877 |
|
|
(set (match_operand:SWI 0 "nonimmediate_operand" "=m")
|
9878 |
|
|
(any_shiftrt:SWI (match_dup 1) (match_dup 2)))]
|
9879 |
|
|
"(optimize_function_for_size_p (cfun)
|
9880 |
|
|
|| !TARGET_PARTIAL_FLAG_REG_STALL
|
9881 |
|
|
|| (operands[2] == const1_rtx
|
9882 |
|
|
&& TARGET_SHIFT1))
|
9883 |
|
|
&& ix86_match_ccmode (insn, CCGOCmode)
|
9884 |
|
|
&& ix86_binary_operator_ok (, mode, operands)"
|
9885 |
|
|
{
|
9886 |
|
|
if (operands[2] == const1_rtx
|
9887 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9888 |
|
|
return "{}\t%0";
|
9889 |
|
|
else
|
9890 |
|
|
return "{}\t{%2, %0|%0, %2}";
|
9891 |
|
|
}
|
9892 |
|
|
[(set_attr "type" "ishift")
|
9893 |
|
|
(set (attr "length_immediate")
|
9894 |
|
|
(if_then_else
|
9895 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9896 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9897 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))
|
9898 |
|
|
(const_string "0")
|
9899 |
|
|
(const_string "*")))
|
9900 |
|
|
(set_attr "mode" "")])
|
9901 |
|
|
|
9902 |
|
|
(define_insn "*si3_cmp_zext"
|
9903 |
|
|
[(set (reg FLAGS_REG)
|
9904 |
|
|
(compare
|
9905 |
|
|
(any_shiftrt:SI (match_operand:SI 1 "register_operand" "0")
|
9906 |
|
|
(match_operand:QI 2 "const_1_to_31_operand" "I"))
|
9907 |
|
|
(const_int 0)))
|
9908 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
9909 |
|
|
(zero_extend:DI (any_shiftrt:SI (match_dup 1) (match_dup 2))))]
|
9910 |
|
|
"TARGET_64BIT
|
9911 |
|
|
&& (optimize_function_for_size_p (cfun)
|
9912 |
|
|
|| !TARGET_PARTIAL_FLAG_REG_STALL
|
9913 |
|
|
|| (operands[2] == const1_rtx
|
9914 |
|
|
&& TARGET_SHIFT1))
|
9915 |
|
|
&& ix86_match_ccmode (insn, CCGOCmode)
|
9916 |
|
|
&& ix86_binary_operator_ok (, SImode, operands)"
|
9917 |
|
|
{
|
9918 |
|
|
if (operands[2] == const1_rtx
|
9919 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9920 |
|
|
return "{l}\t%k0";
|
9921 |
|
|
else
|
9922 |
|
|
return "{l}\t{%2, %k0|%k0, %2}";
|
9923 |
|
|
}
|
9924 |
|
|
[(set_attr "type" "ishift")
|
9925 |
|
|
(set (attr "length_immediate")
|
9926 |
|
|
(if_then_else
|
9927 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9928 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9929 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))
|
9930 |
|
|
(const_string "0")
|
9931 |
|
|
(const_string "*")))
|
9932 |
|
|
(set_attr "mode" "SI")])
|
9933 |
|
|
|
9934 |
|
|
(define_insn "*3_cconly"
|
9935 |
|
|
[(set (reg FLAGS_REG)
|
9936 |
|
|
(compare
|
9937 |
|
|
(any_shiftrt:SWI
|
9938 |
|
|
(match_operand:SWI 1 "register_operand" "0")
|
9939 |
|
|
(match_operand:QI 2 "" ""))
|
9940 |
|
|
(const_int 0)))
|
9941 |
|
|
(clobber (match_scratch:SWI 0 "="))]
|
9942 |
|
|
"(optimize_function_for_size_p (cfun)
|
9943 |
|
|
|| !TARGET_PARTIAL_FLAG_REG_STALL
|
9944 |
|
|
|| (operands[2] == const1_rtx
|
9945 |
|
|
&& TARGET_SHIFT1))
|
9946 |
|
|
&& ix86_match_ccmode (insn, CCGOCmode)"
|
9947 |
|
|
{
|
9948 |
|
|
if (operands[2] == const1_rtx
|
9949 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
9950 |
|
|
return "{}\t%0";
|
9951 |
|
|
else
|
9952 |
|
|
return "{}\t{%2, %0|%0, %2}";
|
9953 |
|
|
}
|
9954 |
|
|
[(set_attr "type" "ishift")
|
9955 |
|
|
(set (attr "length_immediate")
|
9956 |
|
|
(if_then_else
|
9957 |
|
|
(and (match_operand 2 "const1_operand" "")
|
9958 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
9959 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))
|
9960 |
|
|
(const_string "0")
|
9961 |
|
|
(const_string "*")))
|
9962 |
|
|
(set_attr "mode" "")])
|
9963 |
|
|
|
9964 |
|
|
;; Rotate instructions
|
9965 |
|
|
|
9966 |
|
|
(define_expand "ti3"
|
9967 |
|
|
[(set (match_operand:TI 0 "register_operand" "")
|
9968 |
|
|
(any_rotate:TI (match_operand:TI 1 "register_operand" "")
|
9969 |
|
|
(match_operand:QI 2 "nonmemory_operand" "")))]
|
9970 |
|
|
"TARGET_64BIT"
|
9971 |
|
|
{
|
9972 |
|
|
if (const_1_to_63_operand (operands[2], VOIDmode))
|
9973 |
|
|
emit_insn (gen_ix86_ti3_doubleword
|
9974 |
|
|
(operands[0], operands[1], operands[2]));
|
9975 |
|
|
else
|
9976 |
|
|
FAIL;
|
9977 |
|
|
|
9978 |
|
|
DONE;
|
9979 |
|
|
})
|
9980 |
|
|
|
9981 |
|
|
(define_expand "di3"
|
9982 |
|
|
[(set (match_operand:DI 0 "shiftdi_operand" "")
|
9983 |
|
|
(any_rotate:DI (match_operand:DI 1 "shiftdi_operand" "")
|
9984 |
|
|
(match_operand:QI 2 "nonmemory_operand" "")))]
|
9985 |
|
|
""
|
9986 |
|
|
{
|
9987 |
|
|
if (TARGET_64BIT)
|
9988 |
|
|
ix86_expand_binary_operator (, DImode, operands);
|
9989 |
|
|
else if (const_1_to_31_operand (operands[2], VOIDmode))
|
9990 |
|
|
emit_insn (gen_ix86_di3_doubleword
|
9991 |
|
|
(operands[0], operands[1], operands[2]));
|
9992 |
|
|
else
|
9993 |
|
|
FAIL;
|
9994 |
|
|
|
9995 |
|
|
DONE;
|
9996 |
|
|
})
|
9997 |
|
|
|
9998 |
|
|
(define_expand "3"
|
9999 |
|
|
[(set (match_operand:SWIM124 0 "nonimmediate_operand" "")
|
10000 |
|
|
(any_rotate:SWIM124 (match_operand:SWIM124 1 "nonimmediate_operand" "")
|
10001 |
|
|
(match_operand:QI 2 "nonmemory_operand" "")))]
|
10002 |
|
|
""
|
10003 |
|
|
"ix86_expand_binary_operator (, mode, operands); DONE;")
|
10004 |
|
|
|
10005 |
|
|
;; Avoid useless masking of count operand.
|
10006 |
|
|
(define_insn_and_split "*3_mask"
|
10007 |
|
|
[(set (match_operand:SWI48 0 "nonimmediate_operand" "=rm")
|
10008 |
|
|
(any_rotate:SWI48
|
10009 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "0")
|
10010 |
|
|
(subreg:QI
|
10011 |
|
|
(and:SI
|
10012 |
|
|
(match_operand:SI 2 "nonimmediate_operand" "c")
|
10013 |
|
|
(match_operand:SI 3 "const_int_operand" "n")) 0)))
|
10014 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10015 |
|
|
"ix86_binary_operator_ok (, mode, operands)
|
10016 |
|
|
&& (INTVAL (operands[3]) & (GET_MODE_BITSIZE (mode)-1))
|
10017 |
|
|
== GET_MODE_BITSIZE (mode)-1"
|
10018 |
|
|
"#"
|
10019 |
|
|
"&& 1"
|
10020 |
|
|
[(parallel [(set (match_dup 0)
|
10021 |
|
|
(any_rotate:SWI48 (match_dup 1) (match_dup 2)))
|
10022 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
10023 |
|
|
{
|
10024 |
|
|
if (can_create_pseudo_p ())
|
10025 |
|
|
operands [2] = force_reg (SImode, operands[2]);
|
10026 |
|
|
|
10027 |
|
|
operands[2] = simplify_gen_subreg (QImode, operands[2], SImode, 0);
|
10028 |
|
|
}
|
10029 |
|
|
[(set_attr "type" "rotate")
|
10030 |
|
|
(set_attr "mode" "")])
|
10031 |
|
|
|
10032 |
|
|
;; Implement rotation using two double-precision
|
10033 |
|
|
;; shift instructions and a scratch register.
|
10034 |
|
|
|
10035 |
|
|
(define_insn_and_split "ix86_rotl3_doubleword"
|
10036 |
|
|
[(set (match_operand: 0 "register_operand" "=r")
|
10037 |
|
|
(rotate: (match_operand: 1 "register_operand" "0")
|
10038 |
|
|
(match_operand:QI 2 "" "")))
|
10039 |
|
|
(clobber (reg:CC FLAGS_REG))
|
10040 |
|
|
(clobber (match_scratch:DWIH 3 "=&r"))]
|
10041 |
|
|
""
|
10042 |
|
|
"#"
|
10043 |
|
|
"reload_completed"
|
10044 |
|
|
[(set (match_dup 3) (match_dup 4))
|
10045 |
|
|
(parallel
|
10046 |
|
|
[(set (match_dup 4)
|
10047 |
|
|
(ior:DWIH (ashift:DWIH (match_dup 4) (match_dup 2))
|
10048 |
|
|
(lshiftrt:DWIH (match_dup 5)
|
10049 |
|
|
(minus:QI (match_dup 6) (match_dup 2)))))
|
10050 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
10051 |
|
|
(parallel
|
10052 |
|
|
[(set (match_dup 5)
|
10053 |
|
|
(ior:DWIH (ashift:DWIH (match_dup 5) (match_dup 2))
|
10054 |
|
|
(lshiftrt:DWIH (match_dup 3)
|
10055 |
|
|
(minus:QI (match_dup 6) (match_dup 2)))))
|
10056 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
10057 |
|
|
{
|
10058 |
|
|
operands[6] = GEN_INT (GET_MODE_BITSIZE (mode));
|
10059 |
|
|
|
10060 |
|
|
split_double_mode (mode, &operands[0], 1, &operands[4], &operands[5]);
|
10061 |
|
|
})
|
10062 |
|
|
|
10063 |
|
|
(define_insn_and_split "ix86_rotr3_doubleword"
|
10064 |
|
|
[(set (match_operand: 0 "register_operand" "=r")
|
10065 |
|
|
(rotatert: (match_operand: 1 "register_operand" "0")
|
10066 |
|
|
(match_operand:QI 2 "" "")))
|
10067 |
|
|
(clobber (reg:CC FLAGS_REG))
|
10068 |
|
|
(clobber (match_scratch:DWIH 3 "=&r"))]
|
10069 |
|
|
""
|
10070 |
|
|
"#"
|
10071 |
|
|
"reload_completed"
|
10072 |
|
|
[(set (match_dup 3) (match_dup 4))
|
10073 |
|
|
(parallel
|
10074 |
|
|
[(set (match_dup 4)
|
10075 |
|
|
(ior:DWIH (ashiftrt:DWIH (match_dup 4) (match_dup 2))
|
10076 |
|
|
(ashift:DWIH (match_dup 5)
|
10077 |
|
|
(minus:QI (match_dup 6) (match_dup 2)))))
|
10078 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
10079 |
|
|
(parallel
|
10080 |
|
|
[(set (match_dup 5)
|
10081 |
|
|
(ior:DWIH (ashiftrt:DWIH (match_dup 5) (match_dup 2))
|
10082 |
|
|
(ashift:DWIH (match_dup 3)
|
10083 |
|
|
(minus:QI (match_dup 6) (match_dup 2)))))
|
10084 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
10085 |
|
|
{
|
10086 |
|
|
operands[6] = GEN_INT (GET_MODE_BITSIZE (mode));
|
10087 |
|
|
|
10088 |
|
|
split_double_mode (mode, &operands[0], 1, &operands[4], &operands[5]);
|
10089 |
|
|
})
|
10090 |
|
|
|
10091 |
|
|
(define_insn "*bmi2_rorx3_1"
|
10092 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
10093 |
|
|
(rotatert:SWI48 (match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
10094 |
|
|
(match_operand:QI 2 "immediate_operand" "")))]
|
10095 |
|
|
"TARGET_BMI2"
|
10096 |
|
|
"rorx\t{%2, %1, %0|%0, %1, %2}"
|
10097 |
|
|
[(set_attr "type" "rotatex")
|
10098 |
|
|
(set_attr "mode" "")])
|
10099 |
|
|
|
10100 |
|
|
(define_insn "*3_1"
|
10101 |
|
|
[(set (match_operand:SWI48 0 "nonimmediate_operand" "=rm,r")
|
10102 |
|
|
(any_rotate:SWI48
|
10103 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "0,rm")
|
10104 |
|
|
(match_operand:QI 2 "nonmemory_operand" "c,")))
|
10105 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10106 |
|
|
"ix86_binary_operator_ok (, mode, operands)"
|
10107 |
|
|
{
|
10108 |
|
|
switch (get_attr_type (insn))
|
10109 |
|
|
{
|
10110 |
|
|
case TYPE_ROTATEX:
|
10111 |
|
|
return "#";
|
10112 |
|
|
|
10113 |
|
|
default:
|
10114 |
|
|
if (operands[2] == const1_rtx
|
10115 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
10116 |
|
|
return "{}\t%0";
|
10117 |
|
|
else
|
10118 |
|
|
return "{}\t{%2, %0|%0, %2}";
|
10119 |
|
|
}
|
10120 |
|
|
}
|
10121 |
|
|
[(set_attr "isa" "*,bmi2")
|
10122 |
|
|
(set_attr "type" "rotate,rotatex")
|
10123 |
|
|
(set (attr "length_immediate")
|
10124 |
|
|
(if_then_else
|
10125 |
|
|
(and (eq_attr "type" "rotate")
|
10126 |
|
|
(and (match_operand 2 "const1_operand" "")
|
10127 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
10128 |
|
|
(match_test "optimize_function_for_size_p (cfun)"))))
|
10129 |
|
|
(const_string "0")
|
10130 |
|
|
(const_string "*")))
|
10131 |
|
|
(set_attr "mode" "")])
|
10132 |
|
|
|
10133 |
|
|
;; Convert rotate to the rotatex pattern to avoid flags dependency.
|
10134 |
|
|
(define_split
|
10135 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
10136 |
|
|
(rotate:SWI48 (match_operand:SWI48 1 "nonimmediate_operand" "")
|
10137 |
|
|
(match_operand:QI 2 "immediate_operand" "")))
|
10138 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10139 |
|
|
"TARGET_BMI2 && reload_completed"
|
10140 |
|
|
[(set (match_dup 0)
|
10141 |
|
|
(rotatert:SWI48 (match_dup 1) (match_dup 2)))]
|
10142 |
|
|
{
|
10143 |
|
|
operands[2]
|
10144 |
|
|
= GEN_INT (GET_MODE_BITSIZE (mode) - INTVAL (operands[2]));
|
10145 |
|
|
})
|
10146 |
|
|
|
10147 |
|
|
(define_split
|
10148 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
10149 |
|
|
(rotatert:SWI48 (match_operand:SWI48 1 "nonimmediate_operand" "")
|
10150 |
|
|
(match_operand:QI 2 "immediate_operand" "")))
|
10151 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10152 |
|
|
"TARGET_BMI2 && reload_completed"
|
10153 |
|
|
[(set (match_dup 0)
|
10154 |
|
|
(rotatert:SWI48 (match_dup 1) (match_dup 2)))])
|
10155 |
|
|
|
10156 |
|
|
(define_insn "*bmi2_rorxsi3_1_zext"
|
10157 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
10158 |
|
|
(zero_extend:DI
|
10159 |
|
|
(rotatert:SI (match_operand:SI 1 "nonimmediate_operand" "rm")
|
10160 |
|
|
(match_operand:QI 2 "immediate_operand" "I"))))]
|
10161 |
|
|
"TARGET_64BIT && TARGET_BMI2"
|
10162 |
|
|
"rorx\t{%2, %1, %k0|%k0, %1, %2}"
|
10163 |
|
|
[(set_attr "type" "rotatex")
|
10164 |
|
|
(set_attr "mode" "SI")])
|
10165 |
|
|
|
10166 |
|
|
(define_insn "*si3_1_zext"
|
10167 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r,r")
|
10168 |
|
|
(zero_extend:DI
|
10169 |
|
|
(any_rotate:SI (match_operand:SI 1 "nonimmediate_operand" "0,rm")
|
10170 |
|
|
(match_operand:QI 2 "nonmemory_operand" "cI,I"))))
|
10171 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10172 |
|
|
"TARGET_64BIT && ix86_binary_operator_ok (, SImode, operands)"
|
10173 |
|
|
{
|
10174 |
|
|
switch (get_attr_type (insn))
|
10175 |
|
|
{
|
10176 |
|
|
case TYPE_ROTATEX:
|
10177 |
|
|
return "#";
|
10178 |
|
|
|
10179 |
|
|
default:
|
10180 |
|
|
if (operands[2] == const1_rtx
|
10181 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
10182 |
|
|
return "{l}\t%k0";
|
10183 |
|
|
else
|
10184 |
|
|
return "{l}\t{%2, %k0|%k0, %2}";
|
10185 |
|
|
}
|
10186 |
|
|
}
|
10187 |
|
|
[(set_attr "isa" "*,bmi2")
|
10188 |
|
|
(set_attr "type" "rotate,rotatex")
|
10189 |
|
|
(set (attr "length_immediate")
|
10190 |
|
|
(if_then_else
|
10191 |
|
|
(and (eq_attr "type" "rotate")
|
10192 |
|
|
(and (match_operand 2 "const1_operand" "")
|
10193 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
10194 |
|
|
(match_test "optimize_function_for_size_p (cfun)"))))
|
10195 |
|
|
(const_string "0")
|
10196 |
|
|
(const_string "*")))
|
10197 |
|
|
(set_attr "mode" "SI")])
|
10198 |
|
|
|
10199 |
|
|
;; Convert rotate to the rotatex pattern to avoid flags dependency.
|
10200 |
|
|
(define_split
|
10201 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
10202 |
|
|
(zero_extend:DI
|
10203 |
|
|
(rotate:SI (match_operand:SI 1 "nonimmediate_operand" "")
|
10204 |
|
|
(match_operand:QI 2 "immediate_operand" ""))))
|
10205 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10206 |
|
|
"TARGET_64BIT && TARGET_BMI2 && reload_completed"
|
10207 |
|
|
[(set (match_dup 0)
|
10208 |
|
|
(zero_extend:DI (rotatert:SI (match_dup 1) (match_dup 2))))]
|
10209 |
|
|
{
|
10210 |
|
|
operands[2]
|
10211 |
|
|
= GEN_INT (GET_MODE_BITSIZE (SImode) - INTVAL (operands[2]));
|
10212 |
|
|
})
|
10213 |
|
|
|
10214 |
|
|
(define_split
|
10215 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
10216 |
|
|
(zero_extend:DI
|
10217 |
|
|
(rotatert:SI (match_operand:SI 1 "nonimmediate_operand" "")
|
10218 |
|
|
(match_operand:QI 2 "immediate_operand" ""))))
|
10219 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10220 |
|
|
"TARGET_64BIT && TARGET_BMI2 && reload_completed"
|
10221 |
|
|
[(set (match_dup 0)
|
10222 |
|
|
(zero_extend:DI (rotatert:SI (match_dup 1) (match_dup 2))))])
|
10223 |
|
|
|
10224 |
|
|
(define_insn "*3_1"
|
10225 |
|
|
[(set (match_operand:SWI12 0 "nonimmediate_operand" "=m")
|
10226 |
|
|
(any_rotate:SWI12 (match_operand:SWI12 1 "nonimmediate_operand" "0")
|
10227 |
|
|
(match_operand:QI 2 "nonmemory_operand" "c")))
|
10228 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10229 |
|
|
"ix86_binary_operator_ok (, mode, operands)"
|
10230 |
|
|
{
|
10231 |
|
|
if (operands[2] == const1_rtx
|
10232 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
10233 |
|
|
return "{}\t%0";
|
10234 |
|
|
else
|
10235 |
|
|
return "{}\t{%2, %0|%0, %2}";
|
10236 |
|
|
}
|
10237 |
|
|
[(set_attr "type" "rotate")
|
10238 |
|
|
(set (attr "length_immediate")
|
10239 |
|
|
(if_then_else
|
10240 |
|
|
(and (match_operand 2 "const1_operand" "")
|
10241 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
10242 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))
|
10243 |
|
|
(const_string "0")
|
10244 |
|
|
(const_string "*")))
|
10245 |
|
|
(set_attr "mode" "")])
|
10246 |
|
|
|
10247 |
|
|
(define_insn "*qi3_1_slp"
|
10248 |
|
|
[(set (strict_low_part (match_operand:QI 0 "nonimmediate_operand" "+qm"))
|
10249 |
|
|
(any_rotate:QI (match_dup 0)
|
10250 |
|
|
(match_operand:QI 1 "nonmemory_operand" "cI")))
|
10251 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10252 |
|
|
"(optimize_function_for_size_p (cfun)
|
10253 |
|
|
|| !TARGET_PARTIAL_REG_STALL
|
10254 |
|
|
|| (operands[1] == const1_rtx
|
10255 |
|
|
&& TARGET_SHIFT1))"
|
10256 |
|
|
{
|
10257 |
|
|
if (operands[1] == const1_rtx
|
10258 |
|
|
&& (TARGET_SHIFT1 || optimize_function_for_size_p (cfun)))
|
10259 |
|
|
return "{b}\t%0";
|
10260 |
|
|
else
|
10261 |
|
|
return "{b}\t{%1, %0|%0, %1}";
|
10262 |
|
|
}
|
10263 |
|
|
[(set_attr "type" "rotate1")
|
10264 |
|
|
(set (attr "length_immediate")
|
10265 |
|
|
(if_then_else
|
10266 |
|
|
(and (match_operand 1 "const1_operand" "")
|
10267 |
|
|
(ior (match_test "TARGET_SHIFT1")
|
10268 |
|
|
(match_test "optimize_function_for_size_p (cfun)")))
|
10269 |
|
|
(const_string "0")
|
10270 |
|
|
(const_string "*")))
|
10271 |
|
|
(set_attr "mode" "QI")])
|
10272 |
|
|
|
10273 |
|
|
(define_split
|
10274 |
|
|
[(set (match_operand:HI 0 "register_operand" "")
|
10275 |
|
|
(any_rotate:HI (match_dup 0) (const_int 8)))
|
10276 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10277 |
|
|
"reload_completed
|
10278 |
|
|
&& (TARGET_USE_XCHGB || optimize_function_for_size_p (cfun))"
|
10279 |
|
|
[(parallel [(set (strict_low_part (match_dup 0))
|
10280 |
|
|
(bswap:HI (match_dup 0)))
|
10281 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
10282 |
|
|
|
10283 |
|
|
;; Bit set / bit test instructions
|
10284 |
|
|
|
10285 |
|
|
(define_expand "extv"
|
10286 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
10287 |
|
|
(sign_extract:SI (match_operand:SI 1 "register_operand" "")
|
10288 |
|
|
(match_operand:SI 2 "const8_operand" "")
|
10289 |
|
|
(match_operand:SI 3 "const8_operand" "")))]
|
10290 |
|
|
""
|
10291 |
|
|
{
|
10292 |
|
|
/* Handle extractions from %ah et al. */
|
10293 |
|
|
if (INTVAL (operands[2]) != 8 || INTVAL (operands[3]) != 8)
|
10294 |
|
|
FAIL;
|
10295 |
|
|
|
10296 |
|
|
/* From mips.md: extract_bit_field doesn't verify that our source
|
10297 |
|
|
matches the predicate, so check it again here. */
|
10298 |
|
|
if (! ext_register_operand (operands[1], VOIDmode))
|
10299 |
|
|
FAIL;
|
10300 |
|
|
})
|
10301 |
|
|
|
10302 |
|
|
(define_expand "extzv"
|
10303 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
10304 |
|
|
(zero_extract:SI (match_operand 1 "ext_register_operand" "")
|
10305 |
|
|
(match_operand:SI 2 "const8_operand" "")
|
10306 |
|
|
(match_operand:SI 3 "const8_operand" "")))]
|
10307 |
|
|
""
|
10308 |
|
|
{
|
10309 |
|
|
/* Handle extractions from %ah et al. */
|
10310 |
|
|
if (INTVAL (operands[2]) != 8 || INTVAL (operands[3]) != 8)
|
10311 |
|
|
FAIL;
|
10312 |
|
|
|
10313 |
|
|
/* From mips.md: extract_bit_field doesn't verify that our source
|
10314 |
|
|
matches the predicate, so check it again here. */
|
10315 |
|
|
if (! ext_register_operand (operands[1], VOIDmode))
|
10316 |
|
|
FAIL;
|
10317 |
|
|
})
|
10318 |
|
|
|
10319 |
|
|
(define_expand "insv"
|
10320 |
|
|
[(set (zero_extract (match_operand 0 "register_operand" "")
|
10321 |
|
|
(match_operand 1 "const_int_operand" "")
|
10322 |
|
|
(match_operand 2 "const_int_operand" ""))
|
10323 |
|
|
(match_operand 3 "register_operand" ""))]
|
10324 |
|
|
""
|
10325 |
|
|
{
|
10326 |
|
|
rtx (*gen_mov_insv_1) (rtx, rtx);
|
10327 |
|
|
|
10328 |
|
|
if (ix86_expand_pinsr (operands))
|
10329 |
|
|
DONE;
|
10330 |
|
|
|
10331 |
|
|
/* Handle insertions to %ah et al. */
|
10332 |
|
|
if (INTVAL (operands[1]) != 8 || INTVAL (operands[2]) != 8)
|
10333 |
|
|
FAIL;
|
10334 |
|
|
|
10335 |
|
|
/* From mips.md: insert_bit_field doesn't verify that our source
|
10336 |
|
|
matches the predicate, so check it again here. */
|
10337 |
|
|
if (! ext_register_operand (operands[0], VOIDmode))
|
10338 |
|
|
FAIL;
|
10339 |
|
|
|
10340 |
|
|
gen_mov_insv_1 = (TARGET_64BIT
|
10341 |
|
|
? gen_movdi_insv_1 : gen_movsi_insv_1);
|
10342 |
|
|
|
10343 |
|
|
emit_insn (gen_mov_insv_1 (operands[0], operands[3]));
|
10344 |
|
|
DONE;
|
10345 |
|
|
})
|
10346 |
|
|
|
10347 |
|
|
;; %%% bts, btr, btc, bt.
|
10348 |
|
|
;; In general these instructions are *slow* when applied to memory,
|
10349 |
|
|
;; since they enforce atomic operation. When applied to registers,
|
10350 |
|
|
;; it depends on the cpu implementation. They're never faster than
|
10351 |
|
|
;; the corresponding and/ior/xor operations, so with 32-bit there's
|
10352 |
|
|
;; no point. But in 64-bit, we can't hold the relevant immediates
|
10353 |
|
|
;; within the instruction itself, so operating on bits in the high
|
10354 |
|
|
;; 32-bits of a register becomes easier.
|
10355 |
|
|
;;
|
10356 |
|
|
;; These are slow on Nocona, but fast on Athlon64. We do require the use
|
10357 |
|
|
;; of btrq and btcq for corner cases of post-reload expansion of absdf and
|
10358 |
|
|
;; negdf respectively, so they can never be disabled entirely.
|
10359 |
|
|
|
10360 |
|
|
(define_insn "*btsq"
|
10361 |
|
|
[(set (zero_extract:DI (match_operand:DI 0 "register_operand" "+r")
|
10362 |
|
|
(const_int 1)
|
10363 |
|
|
(match_operand:DI 1 "const_0_to_63_operand" ""))
|
10364 |
|
|
(const_int 1))
|
10365 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10366 |
|
|
"TARGET_64BIT && (TARGET_USE_BT || reload_completed)"
|
10367 |
|
|
"bts{q}\t{%1, %0|%0, %1}"
|
10368 |
|
|
[(set_attr "type" "alu1")
|
10369 |
|
|
(set_attr "prefix_0f" "1")
|
10370 |
|
|
(set_attr "mode" "DI")])
|
10371 |
|
|
|
10372 |
|
|
(define_insn "*btrq"
|
10373 |
|
|
[(set (zero_extract:DI (match_operand:DI 0 "register_operand" "+r")
|
10374 |
|
|
(const_int 1)
|
10375 |
|
|
(match_operand:DI 1 "const_0_to_63_operand" ""))
|
10376 |
|
|
(const_int 0))
|
10377 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10378 |
|
|
"TARGET_64BIT && (TARGET_USE_BT || reload_completed)"
|
10379 |
|
|
"btr{q}\t{%1, %0|%0, %1}"
|
10380 |
|
|
[(set_attr "type" "alu1")
|
10381 |
|
|
(set_attr "prefix_0f" "1")
|
10382 |
|
|
(set_attr "mode" "DI")])
|
10383 |
|
|
|
10384 |
|
|
(define_insn "*btcq"
|
10385 |
|
|
[(set (zero_extract:DI (match_operand:DI 0 "register_operand" "+r")
|
10386 |
|
|
(const_int 1)
|
10387 |
|
|
(match_operand:DI 1 "const_0_to_63_operand" ""))
|
10388 |
|
|
(not:DI (zero_extract:DI (match_dup 0) (const_int 1) (match_dup 1))))
|
10389 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10390 |
|
|
"TARGET_64BIT && (TARGET_USE_BT || reload_completed)"
|
10391 |
|
|
"btc{q}\t{%1, %0|%0, %1}"
|
10392 |
|
|
[(set_attr "type" "alu1")
|
10393 |
|
|
(set_attr "prefix_0f" "1")
|
10394 |
|
|
(set_attr "mode" "DI")])
|
10395 |
|
|
|
10396 |
|
|
;; Allow Nocona to avoid these instructions if a register is available.
|
10397 |
|
|
|
10398 |
|
|
(define_peephole2
|
10399 |
|
|
[(match_scratch:DI 2 "r")
|
10400 |
|
|
(parallel [(set (zero_extract:DI
|
10401 |
|
|
(match_operand:DI 0 "register_operand" "")
|
10402 |
|
|
(const_int 1)
|
10403 |
|
|
(match_operand:DI 1 "const_0_to_63_operand" ""))
|
10404 |
|
|
(const_int 1))
|
10405 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
10406 |
|
|
"TARGET_64BIT && !TARGET_USE_BT"
|
10407 |
|
|
[(const_int 0)]
|
10408 |
|
|
{
|
10409 |
|
|
HOST_WIDE_INT i = INTVAL (operands[1]), hi, lo;
|
10410 |
|
|
rtx op1;
|
10411 |
|
|
|
10412 |
|
|
if (HOST_BITS_PER_WIDE_INT >= 64)
|
10413 |
|
|
lo = (HOST_WIDE_INT)1 << i, hi = 0;
|
10414 |
|
|
else if (i < HOST_BITS_PER_WIDE_INT)
|
10415 |
|
|
lo = (HOST_WIDE_INT)1 << i, hi = 0;
|
10416 |
|
|
else
|
10417 |
|
|
lo = 0, hi = (HOST_WIDE_INT)1 << (i - HOST_BITS_PER_WIDE_INT);
|
10418 |
|
|
|
10419 |
|
|
op1 = immed_double_const (lo, hi, DImode);
|
10420 |
|
|
if (i >= 31)
|
10421 |
|
|
{
|
10422 |
|
|
emit_move_insn (operands[2], op1);
|
10423 |
|
|
op1 = operands[2];
|
10424 |
|
|
}
|
10425 |
|
|
|
10426 |
|
|
emit_insn (gen_iordi3 (operands[0], operands[0], op1));
|
10427 |
|
|
DONE;
|
10428 |
|
|
})
|
10429 |
|
|
|
10430 |
|
|
(define_peephole2
|
10431 |
|
|
[(match_scratch:DI 2 "r")
|
10432 |
|
|
(parallel [(set (zero_extract:DI
|
10433 |
|
|
(match_operand:DI 0 "register_operand" "")
|
10434 |
|
|
(const_int 1)
|
10435 |
|
|
(match_operand:DI 1 "const_0_to_63_operand" ""))
|
10436 |
|
|
(const_int 0))
|
10437 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
10438 |
|
|
"TARGET_64BIT && !TARGET_USE_BT"
|
10439 |
|
|
[(const_int 0)]
|
10440 |
|
|
{
|
10441 |
|
|
HOST_WIDE_INT i = INTVAL (operands[1]), hi, lo;
|
10442 |
|
|
rtx op1;
|
10443 |
|
|
|
10444 |
|
|
if (HOST_BITS_PER_WIDE_INT >= 64)
|
10445 |
|
|
lo = (HOST_WIDE_INT)1 << i, hi = 0;
|
10446 |
|
|
else if (i < HOST_BITS_PER_WIDE_INT)
|
10447 |
|
|
lo = (HOST_WIDE_INT)1 << i, hi = 0;
|
10448 |
|
|
else
|
10449 |
|
|
lo = 0, hi = (HOST_WIDE_INT)1 << (i - HOST_BITS_PER_WIDE_INT);
|
10450 |
|
|
|
10451 |
|
|
op1 = immed_double_const (~lo, ~hi, DImode);
|
10452 |
|
|
if (i >= 32)
|
10453 |
|
|
{
|
10454 |
|
|
emit_move_insn (operands[2], op1);
|
10455 |
|
|
op1 = operands[2];
|
10456 |
|
|
}
|
10457 |
|
|
|
10458 |
|
|
emit_insn (gen_anddi3 (operands[0], operands[0], op1));
|
10459 |
|
|
DONE;
|
10460 |
|
|
})
|
10461 |
|
|
|
10462 |
|
|
(define_peephole2
|
10463 |
|
|
[(match_scratch:DI 2 "r")
|
10464 |
|
|
(parallel [(set (zero_extract:DI
|
10465 |
|
|
(match_operand:DI 0 "register_operand" "")
|
10466 |
|
|
(const_int 1)
|
10467 |
|
|
(match_operand:DI 1 "const_0_to_63_operand" ""))
|
10468 |
|
|
(not:DI (zero_extract:DI
|
10469 |
|
|
(match_dup 0) (const_int 1) (match_dup 1))))
|
10470 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
10471 |
|
|
"TARGET_64BIT && !TARGET_USE_BT"
|
10472 |
|
|
[(const_int 0)]
|
10473 |
|
|
{
|
10474 |
|
|
HOST_WIDE_INT i = INTVAL (operands[1]), hi, lo;
|
10475 |
|
|
rtx op1;
|
10476 |
|
|
|
10477 |
|
|
if (HOST_BITS_PER_WIDE_INT >= 64)
|
10478 |
|
|
lo = (HOST_WIDE_INT)1 << i, hi = 0;
|
10479 |
|
|
else if (i < HOST_BITS_PER_WIDE_INT)
|
10480 |
|
|
lo = (HOST_WIDE_INT)1 << i, hi = 0;
|
10481 |
|
|
else
|
10482 |
|
|
lo = 0, hi = (HOST_WIDE_INT)1 << (i - HOST_BITS_PER_WIDE_INT);
|
10483 |
|
|
|
10484 |
|
|
op1 = immed_double_const (lo, hi, DImode);
|
10485 |
|
|
if (i >= 31)
|
10486 |
|
|
{
|
10487 |
|
|
emit_move_insn (operands[2], op1);
|
10488 |
|
|
op1 = operands[2];
|
10489 |
|
|
}
|
10490 |
|
|
|
10491 |
|
|
emit_insn (gen_xordi3 (operands[0], operands[0], op1));
|
10492 |
|
|
DONE;
|
10493 |
|
|
})
|
10494 |
|
|
|
10495 |
|
|
(define_insn "*bt"
|
10496 |
|
|
[(set (reg:CCC FLAGS_REG)
|
10497 |
|
|
(compare:CCC
|
10498 |
|
|
(zero_extract:SWI48
|
10499 |
|
|
(match_operand:SWI48 0 "register_operand" "r")
|
10500 |
|
|
(const_int 1)
|
10501 |
|
|
(match_operand:SWI48 1 "x86_64_nonmemory_operand" "rN"))
|
10502 |
|
|
(const_int 0)))]
|
10503 |
|
|
"TARGET_USE_BT || optimize_function_for_size_p (cfun)"
|
10504 |
|
|
"bt{}\t{%1, %0|%0, %1}"
|
10505 |
|
|
[(set_attr "type" "alu1")
|
10506 |
|
|
(set_attr "prefix_0f" "1")
|
10507 |
|
|
(set_attr "mode" "")])
|
10508 |
|
|
|
10509 |
|
|
;; Store-flag instructions.
|
10510 |
|
|
|
10511 |
|
|
;; For all sCOND expanders, also expand the compare or test insn that
|
10512 |
|
|
;; generates cc0. Generate an equality comparison if `seq' or `sne'.
|
10513 |
|
|
|
10514 |
|
|
(define_insn_and_split "*setcc_di_1"
|
10515 |
|
|
[(set (match_operand:DI 0 "register_operand" "=q")
|
10516 |
|
|
(match_operator:DI 1 "ix86_comparison_operator"
|
10517 |
|
|
[(reg FLAGS_REG) (const_int 0)]))]
|
10518 |
|
|
"TARGET_64BIT && !TARGET_PARTIAL_REG_STALL"
|
10519 |
|
|
"#"
|
10520 |
|
|
"&& reload_completed"
|
10521 |
|
|
[(set (match_dup 2) (match_dup 1))
|
10522 |
|
|
(set (match_dup 0) (zero_extend:DI (match_dup 2)))]
|
10523 |
|
|
{
|
10524 |
|
|
PUT_MODE (operands[1], QImode);
|
10525 |
|
|
operands[2] = gen_lowpart (QImode, operands[0]);
|
10526 |
|
|
})
|
10527 |
|
|
|
10528 |
|
|
(define_insn_and_split "*setcc_si_1_and"
|
10529 |
|
|
[(set (match_operand:SI 0 "register_operand" "=q")
|
10530 |
|
|
(match_operator:SI 1 "ix86_comparison_operator"
|
10531 |
|
|
[(reg FLAGS_REG) (const_int 0)]))
|
10532 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10533 |
|
|
"!TARGET_PARTIAL_REG_STALL
|
10534 |
|
|
&& TARGET_ZERO_EXTEND_WITH_AND && optimize_function_for_speed_p (cfun)"
|
10535 |
|
|
"#"
|
10536 |
|
|
"&& reload_completed"
|
10537 |
|
|
[(set (match_dup 2) (match_dup 1))
|
10538 |
|
|
(parallel [(set (match_dup 0) (zero_extend:SI (match_dup 2)))
|
10539 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
10540 |
|
|
{
|
10541 |
|
|
PUT_MODE (operands[1], QImode);
|
10542 |
|
|
operands[2] = gen_lowpart (QImode, operands[0]);
|
10543 |
|
|
})
|
10544 |
|
|
|
10545 |
|
|
(define_insn_and_split "*setcc_si_1_movzbl"
|
10546 |
|
|
[(set (match_operand:SI 0 "register_operand" "=q")
|
10547 |
|
|
(match_operator:SI 1 "ix86_comparison_operator"
|
10548 |
|
|
[(reg FLAGS_REG) (const_int 0)]))]
|
10549 |
|
|
"!TARGET_PARTIAL_REG_STALL
|
10550 |
|
|
&& (!TARGET_ZERO_EXTEND_WITH_AND || optimize_function_for_size_p (cfun))"
|
10551 |
|
|
"#"
|
10552 |
|
|
"&& reload_completed"
|
10553 |
|
|
[(set (match_dup 2) (match_dup 1))
|
10554 |
|
|
(set (match_dup 0) (zero_extend:SI (match_dup 2)))]
|
10555 |
|
|
{
|
10556 |
|
|
PUT_MODE (operands[1], QImode);
|
10557 |
|
|
operands[2] = gen_lowpart (QImode, operands[0]);
|
10558 |
|
|
})
|
10559 |
|
|
|
10560 |
|
|
(define_insn "*setcc_qi"
|
10561 |
|
|
[(set (match_operand:QI 0 "nonimmediate_operand" "=qm")
|
10562 |
|
|
(match_operator:QI 1 "ix86_comparison_operator"
|
10563 |
|
|
[(reg FLAGS_REG) (const_int 0)]))]
|
10564 |
|
|
""
|
10565 |
|
|
"set%C1\t%0"
|
10566 |
|
|
[(set_attr "type" "setcc")
|
10567 |
|
|
(set_attr "mode" "QI")])
|
10568 |
|
|
|
10569 |
|
|
(define_insn "*setcc_qi_slp"
|
10570 |
|
|
[(set (strict_low_part (match_operand:QI 0 "nonimmediate_operand" "+qm"))
|
10571 |
|
|
(match_operator:QI 1 "ix86_comparison_operator"
|
10572 |
|
|
[(reg FLAGS_REG) (const_int 0)]))]
|
10573 |
|
|
""
|
10574 |
|
|
"set%C1\t%0"
|
10575 |
|
|
[(set_attr "type" "setcc")
|
10576 |
|
|
(set_attr "mode" "QI")])
|
10577 |
|
|
|
10578 |
|
|
;; In general it is not safe to assume too much about CCmode registers,
|
10579 |
|
|
;; so simplify-rtx stops when it sees a second one. Under certain
|
10580 |
|
|
;; conditions this is safe on x86, so help combine not create
|
10581 |
|
|
;;
|
10582 |
|
|
;; seta %al
|
10583 |
|
|
;; testb %al, %al
|
10584 |
|
|
;; sete %al
|
10585 |
|
|
|
10586 |
|
|
(define_split
|
10587 |
|
|
[(set (match_operand:QI 0 "nonimmediate_operand" "")
|
10588 |
|
|
(ne:QI (match_operator 1 "ix86_comparison_operator"
|
10589 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
10590 |
|
|
(const_int 0)))]
|
10591 |
|
|
""
|
10592 |
|
|
[(set (match_dup 0) (match_dup 1))]
|
10593 |
|
|
"PUT_MODE (operands[1], QImode);")
|
10594 |
|
|
|
10595 |
|
|
(define_split
|
10596 |
|
|
[(set (strict_low_part (match_operand:QI 0 "nonimmediate_operand" ""))
|
10597 |
|
|
(ne:QI (match_operator 1 "ix86_comparison_operator"
|
10598 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
10599 |
|
|
(const_int 0)))]
|
10600 |
|
|
""
|
10601 |
|
|
[(set (match_dup 0) (match_dup 1))]
|
10602 |
|
|
"PUT_MODE (operands[1], QImode);")
|
10603 |
|
|
|
10604 |
|
|
(define_split
|
10605 |
|
|
[(set (match_operand:QI 0 "nonimmediate_operand" "")
|
10606 |
|
|
(eq:QI (match_operator 1 "ix86_comparison_operator"
|
10607 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
10608 |
|
|
(const_int 0)))]
|
10609 |
|
|
""
|
10610 |
|
|
[(set (match_dup 0) (match_dup 1))]
|
10611 |
|
|
{
|
10612 |
|
|
rtx new_op1 = copy_rtx (operands[1]);
|
10613 |
|
|
operands[1] = new_op1;
|
10614 |
|
|
PUT_MODE (new_op1, QImode);
|
10615 |
|
|
PUT_CODE (new_op1, ix86_reverse_condition (GET_CODE (new_op1),
|
10616 |
|
|
GET_MODE (XEXP (new_op1, 0))));
|
10617 |
|
|
|
10618 |
|
|
/* Make sure that (a) the CCmode we have for the flags is strong
|
10619 |
|
|
enough for the reversed compare or (b) we have a valid FP compare. */
|
10620 |
|
|
if (! ix86_comparison_operator (new_op1, VOIDmode))
|
10621 |
|
|
FAIL;
|
10622 |
|
|
})
|
10623 |
|
|
|
10624 |
|
|
(define_split
|
10625 |
|
|
[(set (strict_low_part (match_operand:QI 0 "nonimmediate_operand" ""))
|
10626 |
|
|
(eq:QI (match_operator 1 "ix86_comparison_operator"
|
10627 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
10628 |
|
|
(const_int 0)))]
|
10629 |
|
|
""
|
10630 |
|
|
[(set (match_dup 0) (match_dup 1))]
|
10631 |
|
|
{
|
10632 |
|
|
rtx new_op1 = copy_rtx (operands[1]);
|
10633 |
|
|
operands[1] = new_op1;
|
10634 |
|
|
PUT_MODE (new_op1, QImode);
|
10635 |
|
|
PUT_CODE (new_op1, ix86_reverse_condition (GET_CODE (new_op1),
|
10636 |
|
|
GET_MODE (XEXP (new_op1, 0))));
|
10637 |
|
|
|
10638 |
|
|
/* Make sure that (a) the CCmode we have for the flags is strong
|
10639 |
|
|
enough for the reversed compare or (b) we have a valid FP compare. */
|
10640 |
|
|
if (! ix86_comparison_operator (new_op1, VOIDmode))
|
10641 |
|
|
FAIL;
|
10642 |
|
|
})
|
10643 |
|
|
|
10644 |
|
|
;; The SSE store flag instructions saves 0 or 0xffffffff to the result.
|
10645 |
|
|
;; subsequent logical operations are used to imitate conditional moves.
|
10646 |
|
|
;; 0xffffffff is NaN, but not in normalized form, so we can't represent
|
10647 |
|
|
;; it directly.
|
10648 |
|
|
|
10649 |
|
|
(define_insn "setcc__sse"
|
10650 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x,x")
|
10651 |
|
|
(match_operator:MODEF 3 "sse_comparison_operator"
|
10652 |
|
|
[(match_operand:MODEF 1 "register_operand" "0,x")
|
10653 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "xm,xm")]))]
|
10654 |
|
|
"SSE_FLOAT_MODE_P (mode)"
|
10655 |
|
|
"@
|
10656 |
|
|
cmp%D3\t{%2, %0|%0, %2}
|
10657 |
|
|
vcmp%D3\t{%2, %1, %0|%0, %1, %2}"
|
10658 |
|
|
[(set_attr "isa" "noavx,avx")
|
10659 |
|
|
(set_attr "type" "ssecmp")
|
10660 |
|
|
(set_attr "length_immediate" "1")
|
10661 |
|
|
(set_attr "prefix" "orig,vex")
|
10662 |
|
|
(set_attr "mode" "")])
|
10663 |
|
|
|
10664 |
|
|
;; Basic conditional jump instructions.
|
10665 |
|
|
;; We ignore the overflow flag for signed branch instructions.
|
10666 |
|
|
|
10667 |
|
|
(define_insn "*jcc_1"
|
10668 |
|
|
[(set (pc)
|
10669 |
|
|
(if_then_else (match_operator 1 "ix86_comparison_operator"
|
10670 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
10671 |
|
|
(label_ref (match_operand 0 "" ""))
|
10672 |
|
|
(pc)))]
|
10673 |
|
|
""
|
10674 |
|
|
"%+j%C1\t%l0"
|
10675 |
|
|
[(set_attr "type" "ibr")
|
10676 |
|
|
(set_attr "modrm" "0")
|
10677 |
|
|
(set (attr "length")
|
10678 |
|
|
(if_then_else (and (ge (minus (match_dup 0) (pc))
|
10679 |
|
|
(const_int -126))
|
10680 |
|
|
(lt (minus (match_dup 0) (pc))
|
10681 |
|
|
(const_int 128)))
|
10682 |
|
|
(const_int 2)
|
10683 |
|
|
(const_int 6)))])
|
10684 |
|
|
|
10685 |
|
|
(define_insn "*jcc_2"
|
10686 |
|
|
[(set (pc)
|
10687 |
|
|
(if_then_else (match_operator 1 "ix86_comparison_operator"
|
10688 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
10689 |
|
|
(pc)
|
10690 |
|
|
(label_ref (match_operand 0 "" ""))))]
|
10691 |
|
|
""
|
10692 |
|
|
"%+j%c1\t%l0"
|
10693 |
|
|
[(set_attr "type" "ibr")
|
10694 |
|
|
(set_attr "modrm" "0")
|
10695 |
|
|
(set (attr "length")
|
10696 |
|
|
(if_then_else (and (ge (minus (match_dup 0) (pc))
|
10697 |
|
|
(const_int -126))
|
10698 |
|
|
(lt (minus (match_dup 0) (pc))
|
10699 |
|
|
(const_int 128)))
|
10700 |
|
|
(const_int 2)
|
10701 |
|
|
(const_int 6)))])
|
10702 |
|
|
|
10703 |
|
|
;; In general it is not safe to assume too much about CCmode registers,
|
10704 |
|
|
;; so simplify-rtx stops when it sees a second one. Under certain
|
10705 |
|
|
;; conditions this is safe on x86, so help combine not create
|
10706 |
|
|
;;
|
10707 |
|
|
;; seta %al
|
10708 |
|
|
;; testb %al, %al
|
10709 |
|
|
;; je Lfoo
|
10710 |
|
|
|
10711 |
|
|
(define_split
|
10712 |
|
|
[(set (pc)
|
10713 |
|
|
(if_then_else (ne (match_operator 0 "ix86_comparison_operator"
|
10714 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
10715 |
|
|
(const_int 0))
|
10716 |
|
|
(label_ref (match_operand 1 "" ""))
|
10717 |
|
|
(pc)))]
|
10718 |
|
|
""
|
10719 |
|
|
[(set (pc)
|
10720 |
|
|
(if_then_else (match_dup 0)
|
10721 |
|
|
(label_ref (match_dup 1))
|
10722 |
|
|
(pc)))]
|
10723 |
|
|
"PUT_MODE (operands[0], VOIDmode);")
|
10724 |
|
|
|
10725 |
|
|
(define_split
|
10726 |
|
|
[(set (pc)
|
10727 |
|
|
(if_then_else (eq (match_operator 0 "ix86_comparison_operator"
|
10728 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
10729 |
|
|
(const_int 0))
|
10730 |
|
|
(label_ref (match_operand 1 "" ""))
|
10731 |
|
|
(pc)))]
|
10732 |
|
|
""
|
10733 |
|
|
[(set (pc)
|
10734 |
|
|
(if_then_else (match_dup 0)
|
10735 |
|
|
(label_ref (match_dup 1))
|
10736 |
|
|
(pc)))]
|
10737 |
|
|
{
|
10738 |
|
|
rtx new_op0 = copy_rtx (operands[0]);
|
10739 |
|
|
operands[0] = new_op0;
|
10740 |
|
|
PUT_MODE (new_op0, VOIDmode);
|
10741 |
|
|
PUT_CODE (new_op0, ix86_reverse_condition (GET_CODE (new_op0),
|
10742 |
|
|
GET_MODE (XEXP (new_op0, 0))));
|
10743 |
|
|
|
10744 |
|
|
/* Make sure that (a) the CCmode we have for the flags is strong
|
10745 |
|
|
enough for the reversed compare or (b) we have a valid FP compare. */
|
10746 |
|
|
if (! ix86_comparison_operator (new_op0, VOIDmode))
|
10747 |
|
|
FAIL;
|
10748 |
|
|
})
|
10749 |
|
|
|
10750 |
|
|
;; zero_extend in SImode is correct also for DImode, since this is what combine
|
10751 |
|
|
;; pass generates from shift insn with QImode operand. Actually, the mode
|
10752 |
|
|
;; of operand 2 (bit offset operand) doesn't matter since bt insn takes
|
10753 |
|
|
;; appropriate modulo of the bit offset value.
|
10754 |
|
|
|
10755 |
|
|
(define_insn_and_split "*jcc_bt"
|
10756 |
|
|
[(set (pc)
|
10757 |
|
|
(if_then_else (match_operator 0 "bt_comparison_operator"
|
10758 |
|
|
[(zero_extract:SWI48
|
10759 |
|
|
(match_operand:SWI48 1 "register_operand" "r")
|
10760 |
|
|
(const_int 1)
|
10761 |
|
|
(zero_extend:SI
|
10762 |
|
|
(match_operand:QI 2 "register_operand" "r")))
|
10763 |
|
|
(const_int 0)])
|
10764 |
|
|
(label_ref (match_operand 3 "" ""))
|
10765 |
|
|
(pc)))
|
10766 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10767 |
|
|
"TARGET_USE_BT || optimize_function_for_size_p (cfun)"
|
10768 |
|
|
"#"
|
10769 |
|
|
"&& 1"
|
10770 |
|
|
[(set (reg:CCC FLAGS_REG)
|
10771 |
|
|
(compare:CCC
|
10772 |
|
|
(zero_extract:SWI48
|
10773 |
|
|
(match_dup 1)
|
10774 |
|
|
(const_int 1)
|
10775 |
|
|
(match_dup 2))
|
10776 |
|
|
(const_int 0)))
|
10777 |
|
|
(set (pc)
|
10778 |
|
|
(if_then_else (match_op_dup 0 [(reg:CCC FLAGS_REG) (const_int 0)])
|
10779 |
|
|
(label_ref (match_dup 3))
|
10780 |
|
|
(pc)))]
|
10781 |
|
|
{
|
10782 |
|
|
operands[2] = simplify_gen_subreg (mode, operands[2], QImode, 0);
|
10783 |
|
|
|
10784 |
|
|
PUT_CODE (operands[0], reverse_condition (GET_CODE (operands[0])));
|
10785 |
|
|
})
|
10786 |
|
|
|
10787 |
|
|
;; Avoid useless masking of bit offset operand. "and" in SImode is correct
|
10788 |
|
|
;; also for DImode, this is what combine produces.
|
10789 |
|
|
(define_insn_and_split "*jcc_bt_mask"
|
10790 |
|
|
[(set (pc)
|
10791 |
|
|
(if_then_else (match_operator 0 "bt_comparison_operator"
|
10792 |
|
|
[(zero_extract:SWI48
|
10793 |
|
|
(match_operand:SWI48 1 "register_operand" "r")
|
10794 |
|
|
(const_int 1)
|
10795 |
|
|
(and:SI
|
10796 |
|
|
(match_operand:SI 2 "register_operand" "r")
|
10797 |
|
|
(match_operand:SI 3 "const_int_operand" "n")))])
|
10798 |
|
|
(label_ref (match_operand 4 "" ""))
|
10799 |
|
|
(pc)))
|
10800 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10801 |
|
|
"(TARGET_USE_BT || optimize_function_for_size_p (cfun))
|
10802 |
|
|
&& (INTVAL (operands[3]) & (GET_MODE_BITSIZE (mode)-1))
|
10803 |
|
|
== GET_MODE_BITSIZE (mode)-1"
|
10804 |
|
|
"#"
|
10805 |
|
|
"&& 1"
|
10806 |
|
|
[(set (reg:CCC FLAGS_REG)
|
10807 |
|
|
(compare:CCC
|
10808 |
|
|
(zero_extract:SWI48
|
10809 |
|
|
(match_dup 1)
|
10810 |
|
|
(const_int 1)
|
10811 |
|
|
(match_dup 2))
|
10812 |
|
|
(const_int 0)))
|
10813 |
|
|
(set (pc)
|
10814 |
|
|
(if_then_else (match_op_dup 0 [(reg:CCC FLAGS_REG) (const_int 0)])
|
10815 |
|
|
(label_ref (match_dup 4))
|
10816 |
|
|
(pc)))]
|
10817 |
|
|
{
|
10818 |
|
|
operands[2] = simplify_gen_subreg (mode, operands[2], SImode, 0);
|
10819 |
|
|
|
10820 |
|
|
PUT_CODE (operands[0], reverse_condition (GET_CODE (operands[0])));
|
10821 |
|
|
})
|
10822 |
|
|
|
10823 |
|
|
(define_insn_and_split "*jcc_btsi_1"
|
10824 |
|
|
[(set (pc)
|
10825 |
|
|
(if_then_else (match_operator 0 "bt_comparison_operator"
|
10826 |
|
|
[(and:SI
|
10827 |
|
|
(lshiftrt:SI
|
10828 |
|
|
(match_operand:SI 1 "register_operand" "r")
|
10829 |
|
|
(match_operand:QI 2 "register_operand" "r"))
|
10830 |
|
|
(const_int 1))
|
10831 |
|
|
(const_int 0)])
|
10832 |
|
|
(label_ref (match_operand 3 "" ""))
|
10833 |
|
|
(pc)))
|
10834 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10835 |
|
|
"TARGET_USE_BT || optimize_function_for_size_p (cfun)"
|
10836 |
|
|
"#"
|
10837 |
|
|
"&& 1"
|
10838 |
|
|
[(set (reg:CCC FLAGS_REG)
|
10839 |
|
|
(compare:CCC
|
10840 |
|
|
(zero_extract:SI
|
10841 |
|
|
(match_dup 1)
|
10842 |
|
|
(const_int 1)
|
10843 |
|
|
(match_dup 2))
|
10844 |
|
|
(const_int 0)))
|
10845 |
|
|
(set (pc)
|
10846 |
|
|
(if_then_else (match_op_dup 0 [(reg:CCC FLAGS_REG) (const_int 0)])
|
10847 |
|
|
(label_ref (match_dup 3))
|
10848 |
|
|
(pc)))]
|
10849 |
|
|
{
|
10850 |
|
|
operands[2] = simplify_gen_subreg (SImode, operands[2], QImode, 0);
|
10851 |
|
|
|
10852 |
|
|
PUT_CODE (operands[0], reverse_condition (GET_CODE (operands[0])));
|
10853 |
|
|
})
|
10854 |
|
|
|
10855 |
|
|
;; avoid useless masking of bit offset operand
|
10856 |
|
|
(define_insn_and_split "*jcc_btsi_mask_1"
|
10857 |
|
|
[(set (pc)
|
10858 |
|
|
(if_then_else
|
10859 |
|
|
(match_operator 0 "bt_comparison_operator"
|
10860 |
|
|
[(and:SI
|
10861 |
|
|
(lshiftrt:SI
|
10862 |
|
|
(match_operand:SI 1 "register_operand" "r")
|
10863 |
|
|
(subreg:QI
|
10864 |
|
|
(and:SI
|
10865 |
|
|
(match_operand:SI 2 "register_operand" "r")
|
10866 |
|
|
(match_operand:SI 3 "const_int_operand" "n")) 0))
|
10867 |
|
|
(const_int 1))
|
10868 |
|
|
(const_int 0)])
|
10869 |
|
|
(label_ref (match_operand 4 "" ""))
|
10870 |
|
|
(pc)))
|
10871 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
10872 |
|
|
"(TARGET_USE_BT || optimize_function_for_size_p (cfun))
|
10873 |
|
|
&& (INTVAL (operands[3]) & 0x1f) == 0x1f"
|
10874 |
|
|
"#"
|
10875 |
|
|
"&& 1"
|
10876 |
|
|
[(set (reg:CCC FLAGS_REG)
|
10877 |
|
|
(compare:CCC
|
10878 |
|
|
(zero_extract:SI
|
10879 |
|
|
(match_dup 1)
|
10880 |
|
|
(const_int 1)
|
10881 |
|
|
(match_dup 2))
|
10882 |
|
|
(const_int 0)))
|
10883 |
|
|
(set (pc)
|
10884 |
|
|
(if_then_else (match_op_dup 0 [(reg:CCC FLAGS_REG) (const_int 0)])
|
10885 |
|
|
(label_ref (match_dup 4))
|
10886 |
|
|
(pc)))]
|
10887 |
|
|
"PUT_CODE (operands[0], reverse_condition (GET_CODE (operands[0])));")
|
10888 |
|
|
|
10889 |
|
|
;; Define combination compare-and-branch fp compare instructions to help
|
10890 |
|
|
;; combine.
|
10891 |
|
|
|
10892 |
|
|
(define_insn "*fp_jcc_1_387"
|
10893 |
|
|
[(set (pc)
|
10894 |
|
|
(if_then_else (match_operator 0 "ix86_fp_comparison_operator"
|
10895 |
|
|
[(match_operand 1 "register_operand" "f")
|
10896 |
|
|
(match_operand 2 "nonimmediate_operand" "fm")])
|
10897 |
|
|
(label_ref (match_operand 3 "" ""))
|
10898 |
|
|
(pc)))
|
10899 |
|
|
(clobber (reg:CCFP FPSR_REG))
|
10900 |
|
|
(clobber (reg:CCFP FLAGS_REG))
|
10901 |
|
|
(clobber (match_scratch:HI 4 "=a"))]
|
10902 |
|
|
"TARGET_80387
|
10903 |
|
|
&& (GET_MODE (operands[1]) == SFmode || GET_MODE (operands[1]) == DFmode)
|
10904 |
|
|
&& GET_MODE (operands[1]) == GET_MODE (operands[2])
|
10905 |
|
|
&& SELECT_CC_MODE (GET_CODE (operands[0]),
|
10906 |
|
|
operands[1], operands[2]) == CCFPmode
|
10907 |
|
|
&& !TARGET_CMOVE"
|
10908 |
|
|
"#")
|
10909 |
|
|
|
10910 |
|
|
(define_insn "*fp_jcc_1r_387"
|
10911 |
|
|
[(set (pc)
|
10912 |
|
|
(if_then_else (match_operator 0 "ix86_fp_comparison_operator"
|
10913 |
|
|
[(match_operand 1 "register_operand" "f")
|
10914 |
|
|
(match_operand 2 "nonimmediate_operand" "fm")])
|
10915 |
|
|
(pc)
|
10916 |
|
|
(label_ref (match_operand 3 "" ""))))
|
10917 |
|
|
(clobber (reg:CCFP FPSR_REG))
|
10918 |
|
|
(clobber (reg:CCFP FLAGS_REG))
|
10919 |
|
|
(clobber (match_scratch:HI 4 "=a"))]
|
10920 |
|
|
"TARGET_80387
|
10921 |
|
|
&& (GET_MODE (operands[1]) == SFmode || GET_MODE (operands[1]) == DFmode)
|
10922 |
|
|
&& GET_MODE (operands[1]) == GET_MODE (operands[2])
|
10923 |
|
|
&& SELECT_CC_MODE (GET_CODE (operands[0]),
|
10924 |
|
|
operands[1], operands[2]) == CCFPmode
|
10925 |
|
|
&& !TARGET_CMOVE"
|
10926 |
|
|
"#")
|
10927 |
|
|
|
10928 |
|
|
(define_insn "*fp_jcc_2_387"
|
10929 |
|
|
[(set (pc)
|
10930 |
|
|
(if_then_else (match_operator 0 "ix86_fp_comparison_operator"
|
10931 |
|
|
[(match_operand 1 "register_operand" "f")
|
10932 |
|
|
(match_operand 2 "register_operand" "f")])
|
10933 |
|
|
(label_ref (match_operand 3 "" ""))
|
10934 |
|
|
(pc)))
|
10935 |
|
|
(clobber (reg:CCFP FPSR_REG))
|
10936 |
|
|
(clobber (reg:CCFP FLAGS_REG))
|
10937 |
|
|
(clobber (match_scratch:HI 4 "=a"))]
|
10938 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
10939 |
|
|
&& GET_MODE (operands[1]) == GET_MODE (operands[2])
|
10940 |
|
|
&& !TARGET_CMOVE"
|
10941 |
|
|
"#")
|
10942 |
|
|
|
10943 |
|
|
(define_insn "*fp_jcc_2r_387"
|
10944 |
|
|
[(set (pc)
|
10945 |
|
|
(if_then_else (match_operator 0 "ix86_fp_comparison_operator"
|
10946 |
|
|
[(match_operand 1 "register_operand" "f")
|
10947 |
|
|
(match_operand 2 "register_operand" "f")])
|
10948 |
|
|
(pc)
|
10949 |
|
|
(label_ref (match_operand 3 "" ""))))
|
10950 |
|
|
(clobber (reg:CCFP FPSR_REG))
|
10951 |
|
|
(clobber (reg:CCFP FLAGS_REG))
|
10952 |
|
|
(clobber (match_scratch:HI 4 "=a"))]
|
10953 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
10954 |
|
|
&& GET_MODE (operands[1]) == GET_MODE (operands[2])
|
10955 |
|
|
&& !TARGET_CMOVE"
|
10956 |
|
|
"#")
|
10957 |
|
|
|
10958 |
|
|
(define_insn "*fp_jcc_3_387"
|
10959 |
|
|
[(set (pc)
|
10960 |
|
|
(if_then_else (match_operator 0 "ix86_fp_comparison_operator"
|
10961 |
|
|
[(match_operand 1 "register_operand" "f")
|
10962 |
|
|
(match_operand 2 "const0_operand" "")])
|
10963 |
|
|
(label_ref (match_operand 3 "" ""))
|
10964 |
|
|
(pc)))
|
10965 |
|
|
(clobber (reg:CCFP FPSR_REG))
|
10966 |
|
|
(clobber (reg:CCFP FLAGS_REG))
|
10967 |
|
|
(clobber (match_scratch:HI 4 "=a"))]
|
10968 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[1]))
|
10969 |
|
|
&& GET_MODE (operands[1]) == GET_MODE (operands[2])
|
10970 |
|
|
&& SELECT_CC_MODE (GET_CODE (operands[0]),
|
10971 |
|
|
operands[1], operands[2]) == CCFPmode
|
10972 |
|
|
&& !TARGET_CMOVE"
|
10973 |
|
|
"#")
|
10974 |
|
|
|
10975 |
|
|
(define_split
|
10976 |
|
|
[(set (pc)
|
10977 |
|
|
(if_then_else (match_operator 0 "ix86_fp_comparison_operator"
|
10978 |
|
|
[(match_operand 1 "register_operand" "")
|
10979 |
|
|
(match_operand 2 "nonimmediate_operand" "")])
|
10980 |
|
|
(match_operand 3 "" "")
|
10981 |
|
|
(match_operand 4 "" "")))
|
10982 |
|
|
(clobber (reg:CCFP FPSR_REG))
|
10983 |
|
|
(clobber (reg:CCFP FLAGS_REG))]
|
10984 |
|
|
"reload_completed"
|
10985 |
|
|
[(const_int 0)]
|
10986 |
|
|
{
|
10987 |
|
|
ix86_split_fp_branch (GET_CODE (operands[0]), operands[1], operands[2],
|
10988 |
|
|
operands[3], operands[4], NULL_RTX, NULL_RTX);
|
10989 |
|
|
DONE;
|
10990 |
|
|
})
|
10991 |
|
|
|
10992 |
|
|
(define_split
|
10993 |
|
|
[(set (pc)
|
10994 |
|
|
(if_then_else (match_operator 0 "ix86_fp_comparison_operator"
|
10995 |
|
|
[(match_operand 1 "register_operand" "")
|
10996 |
|
|
(match_operand 2 "general_operand" "")])
|
10997 |
|
|
(match_operand 3 "" "")
|
10998 |
|
|
(match_operand 4 "" "")))
|
10999 |
|
|
(clobber (reg:CCFP FPSR_REG))
|
11000 |
|
|
(clobber (reg:CCFP FLAGS_REG))
|
11001 |
|
|
(clobber (match_scratch:HI 5 "=a"))]
|
11002 |
|
|
"reload_completed"
|
11003 |
|
|
[(const_int 0)]
|
11004 |
|
|
{
|
11005 |
|
|
ix86_split_fp_branch (GET_CODE (operands[0]), operands[1], operands[2],
|
11006 |
|
|
operands[3], operands[4], operands[5], NULL_RTX);
|
11007 |
|
|
DONE;
|
11008 |
|
|
})
|
11009 |
|
|
|
11010 |
|
|
;; The order of operands in *fp_jcc_4_387 is forced by combine in
|
11011 |
|
|
;; simplify_comparison () function. Float operator is treated as RTX_OBJ
|
11012 |
|
|
;; with a precedence over other operators and is always put in the first
|
11013 |
|
|
;; place. Swap condition and operands to match ficom instruction.
|
11014 |
|
|
|
11015 |
|
|
(define_insn "*fp_jcc_4__387"
|
11016 |
|
|
[(set (pc)
|
11017 |
|
|
(if_then_else
|
11018 |
|
|
(match_operator 0 "ix86_swapped_fp_comparison_operator"
|
11019 |
|
|
[(match_operator 1 "float_operator"
|
11020 |
|
|
[(match_operand:SWI24 2 "nonimmediate_operand" "m,?r")])
|
11021 |
|
|
(match_operand 3 "register_operand" "f,f")])
|
11022 |
|
|
(label_ref (match_operand 4 "" ""))
|
11023 |
|
|
(pc)))
|
11024 |
|
|
(clobber (reg:CCFP FPSR_REG))
|
11025 |
|
|
(clobber (reg:CCFP FLAGS_REG))
|
11026 |
|
|
(clobber (match_scratch:HI 5 "=a,a"))]
|
11027 |
|
|
"X87_FLOAT_MODE_P (GET_MODE (operands[3]))
|
11028 |
|
|
&& (TARGET_USE_MODE_FIOP || optimize_function_for_size_p (cfun))
|
11029 |
|
|
&& GET_MODE (operands[1]) == GET_MODE (operands[3])
|
11030 |
|
|
&& ix86_fp_compare_mode (swap_condition (GET_CODE (operands[0]))) == CCFPmode
|
11031 |
|
|
&& !TARGET_CMOVE"
|
11032 |
|
|
"#")
|
11033 |
|
|
|
11034 |
|
|
(define_split
|
11035 |
|
|
[(set (pc)
|
11036 |
|
|
(if_then_else
|
11037 |
|
|
(match_operator 0 "ix86_swapped_fp_comparison_operator"
|
11038 |
|
|
[(match_operator 1 "float_operator"
|
11039 |
|
|
[(match_operand:SWI24 2 "memory_operand" "")])
|
11040 |
|
|
(match_operand 3 "register_operand" "")])
|
11041 |
|
|
(match_operand 4 "" "")
|
11042 |
|
|
(match_operand 5 "" "")))
|
11043 |
|
|
(clobber (reg:CCFP FPSR_REG))
|
11044 |
|
|
(clobber (reg:CCFP FLAGS_REG))
|
11045 |
|
|
(clobber (match_scratch:HI 6 "=a"))]
|
11046 |
|
|
"reload_completed"
|
11047 |
|
|
[(const_int 0)]
|
11048 |
|
|
{
|
11049 |
|
|
operands[7] = gen_rtx_FLOAT (GET_MODE (operands[1]), operands[2]);
|
11050 |
|
|
|
11051 |
|
|
ix86_split_fp_branch (swap_condition (GET_CODE (operands[0])),
|
11052 |
|
|
operands[3], operands[7],
|
11053 |
|
|
operands[4], operands[5], operands[6], NULL_RTX);
|
11054 |
|
|
DONE;
|
11055 |
|
|
})
|
11056 |
|
|
|
11057 |
|
|
;; %%% Kill this when reload knows how to do it.
|
11058 |
|
|
(define_split
|
11059 |
|
|
[(set (pc)
|
11060 |
|
|
(if_then_else
|
11061 |
|
|
(match_operator 0 "ix86_swapped_fp_comparison_operator"
|
11062 |
|
|
[(match_operator 1 "float_operator"
|
11063 |
|
|
[(match_operand:SWI24 2 "register_operand" "")])
|
11064 |
|
|
(match_operand 3 "register_operand" "")])
|
11065 |
|
|
(match_operand 4 "" "")
|
11066 |
|
|
(match_operand 5 "" "")))
|
11067 |
|
|
(clobber (reg:CCFP FPSR_REG))
|
11068 |
|
|
(clobber (reg:CCFP FLAGS_REG))
|
11069 |
|
|
(clobber (match_scratch:HI 6 "=a"))]
|
11070 |
|
|
"reload_completed"
|
11071 |
|
|
[(const_int 0)]
|
11072 |
|
|
{
|
11073 |
|
|
operands[7] = ix86_force_to_memory (GET_MODE (operands[2]), operands[2]);
|
11074 |
|
|
operands[7] = gen_rtx_FLOAT (GET_MODE (operands[1]), operands[7]);
|
11075 |
|
|
|
11076 |
|
|
ix86_split_fp_branch (swap_condition (GET_CODE (operands[0])),
|
11077 |
|
|
operands[3], operands[7],
|
11078 |
|
|
operands[4], operands[5], operands[6], operands[2]);
|
11079 |
|
|
DONE;
|
11080 |
|
|
})
|
11081 |
|
|
|
11082 |
|
|
;; Unconditional and other jump instructions
|
11083 |
|
|
|
11084 |
|
|
(define_insn "jump"
|
11085 |
|
|
[(set (pc)
|
11086 |
|
|
(label_ref (match_operand 0 "" "")))]
|
11087 |
|
|
""
|
11088 |
|
|
"jmp\t%l0"
|
11089 |
|
|
[(set_attr "type" "ibr")
|
11090 |
|
|
(set (attr "length")
|
11091 |
|
|
(if_then_else (and (ge (minus (match_dup 0) (pc))
|
11092 |
|
|
(const_int -126))
|
11093 |
|
|
(lt (minus (match_dup 0) (pc))
|
11094 |
|
|
(const_int 128)))
|
11095 |
|
|
(const_int 2)
|
11096 |
|
|
(const_int 5)))
|
11097 |
|
|
(set_attr "modrm" "0")])
|
11098 |
|
|
|
11099 |
|
|
(define_expand "indirect_jump"
|
11100 |
|
|
[(set (pc) (match_operand 0 "indirect_branch_operand" ""))])
|
11101 |
|
|
|
11102 |
|
|
(define_insn "*indirect_jump"
|
11103 |
|
|
[(set (pc) (match_operand:P 0 "indirect_branch_operand" "rw"))]
|
11104 |
|
|
""
|
11105 |
|
|
"jmp\t%A0"
|
11106 |
|
|
[(set_attr "type" "ibr")
|
11107 |
|
|
(set_attr "length_immediate" "0")])
|
11108 |
|
|
|
11109 |
|
|
(define_expand "tablejump"
|
11110 |
|
|
[(parallel [(set (pc) (match_operand 0 "indirect_branch_operand" ""))
|
11111 |
|
|
(use (label_ref (match_operand 1 "" "")))])]
|
11112 |
|
|
""
|
11113 |
|
|
{
|
11114 |
|
|
/* In PIC mode, the table entries are stored GOT (32-bit) or PC (64-bit)
|
11115 |
|
|
relative. Convert the relative address to an absolute address. */
|
11116 |
|
|
if (flag_pic)
|
11117 |
|
|
{
|
11118 |
|
|
rtx op0, op1;
|
11119 |
|
|
enum rtx_code code;
|
11120 |
|
|
|
11121 |
|
|
/* We can't use @GOTOFF for text labels on VxWorks;
|
11122 |
|
|
see gotoff_operand. */
|
11123 |
|
|
if (TARGET_64BIT || TARGET_VXWORKS_RTP)
|
11124 |
|
|
{
|
11125 |
|
|
code = PLUS;
|
11126 |
|
|
op0 = operands[0];
|
11127 |
|
|
op1 = gen_rtx_LABEL_REF (Pmode, operands[1]);
|
11128 |
|
|
}
|
11129 |
|
|
else if (TARGET_MACHO || HAVE_AS_GOTOFF_IN_DATA)
|
11130 |
|
|
{
|
11131 |
|
|
code = PLUS;
|
11132 |
|
|
op0 = operands[0];
|
11133 |
|
|
op1 = pic_offset_table_rtx;
|
11134 |
|
|
}
|
11135 |
|
|
else
|
11136 |
|
|
{
|
11137 |
|
|
code = MINUS;
|
11138 |
|
|
op0 = pic_offset_table_rtx;
|
11139 |
|
|
op1 = operands[0];
|
11140 |
|
|
}
|
11141 |
|
|
|
11142 |
|
|
operands[0] = expand_simple_binop (Pmode, code, op0, op1, NULL_RTX, 0,
|
11143 |
|
|
OPTAB_DIRECT);
|
11144 |
|
|
}
|
11145 |
|
|
else if (TARGET_X32)
|
11146 |
|
|
operands[0] = convert_memory_address (Pmode, operands[0]);
|
11147 |
|
|
})
|
11148 |
|
|
|
11149 |
|
|
(define_insn "*tablejump_1"
|
11150 |
|
|
[(set (pc) (match_operand:P 0 "indirect_branch_operand" "rw"))
|
11151 |
|
|
(use (label_ref (match_operand 1 "" "")))]
|
11152 |
|
|
""
|
11153 |
|
|
"jmp\t%A0"
|
11154 |
|
|
[(set_attr "type" "ibr")
|
11155 |
|
|
(set_attr "length_immediate" "0")])
|
11156 |
|
|
|
11157 |
|
|
;; Convert setcc + movzbl to xor + setcc if operands don't overlap.
|
11158 |
|
|
|
11159 |
|
|
(define_peephole2
|
11160 |
|
|
[(set (reg FLAGS_REG) (match_operand 0 "" ""))
|
11161 |
|
|
(set (match_operand:QI 1 "register_operand" "")
|
11162 |
|
|
(match_operator:QI 2 "ix86_comparison_operator"
|
11163 |
|
|
[(reg FLAGS_REG) (const_int 0)]))
|
11164 |
|
|
(set (match_operand 3 "q_regs_operand" "")
|
11165 |
|
|
(zero_extend (match_dup 1)))]
|
11166 |
|
|
"(peep2_reg_dead_p (3, operands[1])
|
11167 |
|
|
|| operands_match_p (operands[1], operands[3]))
|
11168 |
|
|
&& ! reg_overlap_mentioned_p (operands[3], operands[0])"
|
11169 |
|
|
[(set (match_dup 4) (match_dup 0))
|
11170 |
|
|
(set (strict_low_part (match_dup 5))
|
11171 |
|
|
(match_dup 2))]
|
11172 |
|
|
{
|
11173 |
|
|
operands[4] = gen_rtx_REG (GET_MODE (operands[0]), FLAGS_REG);
|
11174 |
|
|
operands[5] = gen_lowpart (QImode, operands[3]);
|
11175 |
|
|
ix86_expand_clear (operands[3]);
|
11176 |
|
|
})
|
11177 |
|
|
|
11178 |
|
|
;; Similar, but match zero_extendhisi2_and, which adds a clobber.
|
11179 |
|
|
|
11180 |
|
|
(define_peephole2
|
11181 |
|
|
[(set (reg FLAGS_REG) (match_operand 0 "" ""))
|
11182 |
|
|
(set (match_operand:QI 1 "register_operand" "")
|
11183 |
|
|
(match_operator:QI 2 "ix86_comparison_operator"
|
11184 |
|
|
[(reg FLAGS_REG) (const_int 0)]))
|
11185 |
|
|
(parallel [(set (match_operand 3 "q_regs_operand" "")
|
11186 |
|
|
(zero_extend (match_dup 1)))
|
11187 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
11188 |
|
|
"(peep2_reg_dead_p (3, operands[1])
|
11189 |
|
|
|| operands_match_p (operands[1], operands[3]))
|
11190 |
|
|
&& ! reg_overlap_mentioned_p (operands[3], operands[0])"
|
11191 |
|
|
[(set (match_dup 4) (match_dup 0))
|
11192 |
|
|
(set (strict_low_part (match_dup 5))
|
11193 |
|
|
(match_dup 2))]
|
11194 |
|
|
{
|
11195 |
|
|
operands[4] = gen_rtx_REG (GET_MODE (operands[0]), FLAGS_REG);
|
11196 |
|
|
operands[5] = gen_lowpart (QImode, operands[3]);
|
11197 |
|
|
ix86_expand_clear (operands[3]);
|
11198 |
|
|
})
|
11199 |
|
|
|
11200 |
|
|
;; Call instructions.
|
11201 |
|
|
|
11202 |
|
|
;; The predicates normally associated with named expanders are not properly
|
11203 |
|
|
;; checked for calls. This is a bug in the generic code, but it isn't that
|
11204 |
|
|
;; easy to fix. Ignore it for now and be prepared to fix things up.
|
11205 |
|
|
|
11206 |
|
|
;; P6 processors will jump to the address after the decrement when %esp
|
11207 |
|
|
;; is used as a call operand, so they will execute return address as a code.
|
11208 |
|
|
;; See Pentium Pro errata 70, Pentium 2 errata A33 and Pentium 3 errata E17.
|
11209 |
|
|
|
11210 |
|
|
;; Register constraint for call instruction.
|
11211 |
|
|
(define_mode_attr c [(SI "l") (DI "r")])
|
11212 |
|
|
|
11213 |
|
|
;; Call subroutine returning no value.
|
11214 |
|
|
|
11215 |
|
|
(define_expand "call"
|
11216 |
|
|
[(call (match_operand:QI 0 "" "")
|
11217 |
|
|
(match_operand 1 "" ""))
|
11218 |
|
|
(use (match_operand 2 "" ""))]
|
11219 |
|
|
""
|
11220 |
|
|
{
|
11221 |
|
|
ix86_expand_call (NULL, operands[0], operands[1],
|
11222 |
|
|
operands[2], NULL, false);
|
11223 |
|
|
DONE;
|
11224 |
|
|
})
|
11225 |
|
|
|
11226 |
|
|
(define_expand "sibcall"
|
11227 |
|
|
[(call (match_operand:QI 0 "" "")
|
11228 |
|
|
(match_operand 1 "" ""))
|
11229 |
|
|
(use (match_operand 2 "" ""))]
|
11230 |
|
|
""
|
11231 |
|
|
{
|
11232 |
|
|
ix86_expand_call (NULL, operands[0], operands[1],
|
11233 |
|
|
operands[2], NULL, true);
|
11234 |
|
|
DONE;
|
11235 |
|
|
})
|
11236 |
|
|
|
11237 |
|
|
(define_insn_and_split "*call_vzeroupper"
|
11238 |
|
|
[(call (mem:QI (match_operand:P 0 "call_insn_operand" "zw"))
|
11239 |
|
|
(match_operand 1 "" ""))
|
11240 |
|
|
(unspec [(match_operand 2 "const_int_operand" "")]
|
11241 |
|
|
UNSPEC_CALL_NEEDS_VZEROUPPER)]
|
11242 |
|
|
"TARGET_VZEROUPPER && !SIBLING_CALL_P (insn)"
|
11243 |
|
|
"#"
|
11244 |
|
|
"&& reload_completed"
|
11245 |
|
|
[(const_int 0)]
|
11246 |
|
|
"ix86_split_call_vzeroupper (curr_insn, operands[2]); DONE;"
|
11247 |
|
|
[(set_attr "type" "call")])
|
11248 |
|
|
|
11249 |
|
|
(define_insn "*call"
|
11250 |
|
|
[(call (mem:QI (match_operand:P 0 "call_insn_operand" "zw"))
|
11251 |
|
|
(match_operand 1 "" ""))]
|
11252 |
|
|
"!SIBLING_CALL_P (insn)"
|
11253 |
|
|
"* return ix86_output_call_insn (insn, operands[0]);"
|
11254 |
|
|
[(set_attr "type" "call")])
|
11255 |
|
|
|
11256 |
|
|
(define_insn_and_split "*call_rex64_ms_sysv_vzeroupper"
|
11257 |
|
|
[(call (mem:QI (match_operand:DI 0 "call_insn_operand" "rzw"))
|
11258 |
|
|
(match_operand 1 "" ""))
|
11259 |
|
|
(unspec [(const_int 0)] UNSPEC_MS_TO_SYSV_CALL)
|
11260 |
|
|
(clobber (reg:TI XMM6_REG))
|
11261 |
|
|
(clobber (reg:TI XMM7_REG))
|
11262 |
|
|
(clobber (reg:TI XMM8_REG))
|
11263 |
|
|
(clobber (reg:TI XMM9_REG))
|
11264 |
|
|
(clobber (reg:TI XMM10_REG))
|
11265 |
|
|
(clobber (reg:TI XMM11_REG))
|
11266 |
|
|
(clobber (reg:TI XMM12_REG))
|
11267 |
|
|
(clobber (reg:TI XMM13_REG))
|
11268 |
|
|
(clobber (reg:TI XMM14_REG))
|
11269 |
|
|
(clobber (reg:TI XMM15_REG))
|
11270 |
|
|
(clobber (reg:DI SI_REG))
|
11271 |
|
|
(clobber (reg:DI DI_REG))
|
11272 |
|
|
(unspec [(match_operand 2 "const_int_operand" "")]
|
11273 |
|
|
UNSPEC_CALL_NEEDS_VZEROUPPER)]
|
11274 |
|
|
"TARGET_VZEROUPPER && TARGET_64BIT && !SIBLING_CALL_P (insn)"
|
11275 |
|
|
"#"
|
11276 |
|
|
"&& reload_completed"
|
11277 |
|
|
[(const_int 0)]
|
11278 |
|
|
"ix86_split_call_vzeroupper (curr_insn, operands[2]); DONE;"
|
11279 |
|
|
[(set_attr "type" "call")])
|
11280 |
|
|
|
11281 |
|
|
(define_insn "*call_rex64_ms_sysv"
|
11282 |
|
|
[(call (mem:QI (match_operand:DI 0 "call_insn_operand" "rzw"))
|
11283 |
|
|
(match_operand 1 "" ""))
|
11284 |
|
|
(unspec [(const_int 0)] UNSPEC_MS_TO_SYSV_CALL)
|
11285 |
|
|
(clobber (reg:TI XMM6_REG))
|
11286 |
|
|
(clobber (reg:TI XMM7_REG))
|
11287 |
|
|
(clobber (reg:TI XMM8_REG))
|
11288 |
|
|
(clobber (reg:TI XMM9_REG))
|
11289 |
|
|
(clobber (reg:TI XMM10_REG))
|
11290 |
|
|
(clobber (reg:TI XMM11_REG))
|
11291 |
|
|
(clobber (reg:TI XMM12_REG))
|
11292 |
|
|
(clobber (reg:TI XMM13_REG))
|
11293 |
|
|
(clobber (reg:TI XMM14_REG))
|
11294 |
|
|
(clobber (reg:TI XMM15_REG))
|
11295 |
|
|
(clobber (reg:DI SI_REG))
|
11296 |
|
|
(clobber (reg:DI DI_REG))]
|
11297 |
|
|
"TARGET_64BIT && !SIBLING_CALL_P (insn)"
|
11298 |
|
|
"* return ix86_output_call_insn (insn, operands[0]);"
|
11299 |
|
|
[(set_attr "type" "call")])
|
11300 |
|
|
|
11301 |
|
|
(define_insn_and_split "*sibcall_vzeroupper"
|
11302 |
|
|
[(call (mem:QI (match_operand:P 0 "sibcall_insn_operand" "Uz"))
|
11303 |
|
|
(match_operand 1 "" ""))
|
11304 |
|
|
(unspec [(match_operand 2 "const_int_operand" "")]
|
11305 |
|
|
UNSPEC_CALL_NEEDS_VZEROUPPER)]
|
11306 |
|
|
"TARGET_VZEROUPPER && SIBLING_CALL_P (insn)"
|
11307 |
|
|
"#"
|
11308 |
|
|
"&& reload_completed"
|
11309 |
|
|
[(const_int 0)]
|
11310 |
|
|
"ix86_split_call_vzeroupper (curr_insn, operands[2]); DONE;"
|
11311 |
|
|
[(set_attr "type" "call")])
|
11312 |
|
|
|
11313 |
|
|
(define_insn "*sibcall"
|
11314 |
|
|
[(call (mem:QI (match_operand:P 0 "sibcall_insn_operand" "Uz"))
|
11315 |
|
|
(match_operand 1 "" ""))]
|
11316 |
|
|
"SIBLING_CALL_P (insn)"
|
11317 |
|
|
"* return ix86_output_call_insn (insn, operands[0]);"
|
11318 |
|
|
[(set_attr "type" "call")])
|
11319 |
|
|
|
11320 |
|
|
(define_expand "call_pop"
|
11321 |
|
|
[(parallel [(call (match_operand:QI 0 "" "")
|
11322 |
|
|
(match_operand:SI 1 "" ""))
|
11323 |
|
|
(set (reg:SI SP_REG)
|
11324 |
|
|
(plus:SI (reg:SI SP_REG)
|
11325 |
|
|
(match_operand:SI 3 "" "")))])]
|
11326 |
|
|
"!TARGET_64BIT"
|
11327 |
|
|
{
|
11328 |
|
|
ix86_expand_call (NULL, operands[0], operands[1],
|
11329 |
|
|
operands[2], operands[3], false);
|
11330 |
|
|
DONE;
|
11331 |
|
|
})
|
11332 |
|
|
|
11333 |
|
|
(define_insn_and_split "*call_pop_vzeroupper"
|
11334 |
|
|
[(call (mem:QI (match_operand:SI 0 "call_insn_operand" "lzm"))
|
11335 |
|
|
(match_operand:SI 1 "" ""))
|
11336 |
|
|
(set (reg:SI SP_REG)
|
11337 |
|
|
(plus:SI (reg:SI SP_REG)
|
11338 |
|
|
(match_operand:SI 2 "immediate_operand" "i")))
|
11339 |
|
|
(unspec [(match_operand 3 "const_int_operand" "")]
|
11340 |
|
|
UNSPEC_CALL_NEEDS_VZEROUPPER)]
|
11341 |
|
|
"TARGET_VZEROUPPER && !TARGET_64BIT && !SIBLING_CALL_P (insn)"
|
11342 |
|
|
"#"
|
11343 |
|
|
"&& reload_completed"
|
11344 |
|
|
[(const_int 0)]
|
11345 |
|
|
"ix86_split_call_vzeroupper (curr_insn, operands[3]); DONE;"
|
11346 |
|
|
[(set_attr "type" "call")])
|
11347 |
|
|
|
11348 |
|
|
(define_insn "*call_pop"
|
11349 |
|
|
[(call (mem:QI (match_operand:SI 0 "call_insn_operand" "lzm"))
|
11350 |
|
|
(match_operand 1 "" ""))
|
11351 |
|
|
(set (reg:SI SP_REG)
|
11352 |
|
|
(plus:SI (reg:SI SP_REG)
|
11353 |
|
|
(match_operand:SI 2 "immediate_operand" "i")))]
|
11354 |
|
|
"!TARGET_64BIT && !SIBLING_CALL_P (insn)"
|
11355 |
|
|
"* return ix86_output_call_insn (insn, operands[0]);"
|
11356 |
|
|
[(set_attr "type" "call")])
|
11357 |
|
|
|
11358 |
|
|
(define_insn_and_split "*sibcall_pop_vzeroupper"
|
11359 |
|
|
[(call (mem:QI (match_operand:SI 0 "sibcall_insn_operand" "Uz"))
|
11360 |
|
|
(match_operand 1 "" ""))
|
11361 |
|
|
(set (reg:SI SP_REG)
|
11362 |
|
|
(plus:SI (reg:SI SP_REG)
|
11363 |
|
|
(match_operand:SI 2 "immediate_operand" "i")))
|
11364 |
|
|
(unspec [(match_operand 3 "const_int_operand" "")]
|
11365 |
|
|
UNSPEC_CALL_NEEDS_VZEROUPPER)]
|
11366 |
|
|
"TARGET_VZEROUPPER && !TARGET_64BIT && SIBLING_CALL_P (insn)"
|
11367 |
|
|
"#"
|
11368 |
|
|
"&& reload_completed"
|
11369 |
|
|
[(const_int 0)]
|
11370 |
|
|
"ix86_split_call_vzeroupper (curr_insn, operands[3]); DONE;"
|
11371 |
|
|
[(set_attr "type" "call")])
|
11372 |
|
|
|
11373 |
|
|
(define_insn "*sibcall_pop"
|
11374 |
|
|
[(call (mem:QI (match_operand:SI 0 "sibcall_insn_operand" "Uz"))
|
11375 |
|
|
(match_operand 1 "" ""))
|
11376 |
|
|
(set (reg:SI SP_REG)
|
11377 |
|
|
(plus:SI (reg:SI SP_REG)
|
11378 |
|
|
(match_operand:SI 2 "immediate_operand" "i")))]
|
11379 |
|
|
"!TARGET_64BIT && SIBLING_CALL_P (insn)"
|
11380 |
|
|
"* return ix86_output_call_insn (insn, operands[0]);"
|
11381 |
|
|
[(set_attr "type" "call")])
|
11382 |
|
|
|
11383 |
|
|
;; Call subroutine, returning value in operand 0
|
11384 |
|
|
|
11385 |
|
|
(define_expand "call_value"
|
11386 |
|
|
[(set (match_operand 0 "" "")
|
11387 |
|
|
(call (match_operand:QI 1 "" "")
|
11388 |
|
|
(match_operand 2 "" "")))
|
11389 |
|
|
(use (match_operand 3 "" ""))]
|
11390 |
|
|
""
|
11391 |
|
|
{
|
11392 |
|
|
ix86_expand_call (operands[0], operands[1], operands[2],
|
11393 |
|
|
operands[3], NULL, false);
|
11394 |
|
|
DONE;
|
11395 |
|
|
})
|
11396 |
|
|
|
11397 |
|
|
(define_expand "sibcall_value"
|
11398 |
|
|
[(set (match_operand 0 "" "")
|
11399 |
|
|
(call (match_operand:QI 1 "" "")
|
11400 |
|
|
(match_operand 2 "" "")))
|
11401 |
|
|
(use (match_operand 3 "" ""))]
|
11402 |
|
|
""
|
11403 |
|
|
{
|
11404 |
|
|
ix86_expand_call (operands[0], operands[1], operands[2],
|
11405 |
|
|
operands[3], NULL, true);
|
11406 |
|
|
DONE;
|
11407 |
|
|
})
|
11408 |
|
|
|
11409 |
|
|
(define_insn_and_split "*call_value_vzeroupper"
|
11410 |
|
|
[(set (match_operand 0 "" "")
|
11411 |
|
|
(call (mem:QI (match_operand:P 1 "call_insn_operand" "zw"))
|
11412 |
|
|
(match_operand 2 "" "")))
|
11413 |
|
|
(unspec [(match_operand 3 "const_int_operand" "")]
|
11414 |
|
|
UNSPEC_CALL_NEEDS_VZEROUPPER)]
|
11415 |
|
|
"TARGET_VZEROUPPER && !SIBLING_CALL_P (insn)"
|
11416 |
|
|
"#"
|
11417 |
|
|
"&& reload_completed"
|
11418 |
|
|
[(const_int 0)]
|
11419 |
|
|
"ix86_split_call_vzeroupper (curr_insn, operands[3]); DONE;"
|
11420 |
|
|
[(set_attr "type" "callv")])
|
11421 |
|
|
|
11422 |
|
|
(define_insn "*call_value"
|
11423 |
|
|
[(set (match_operand 0 "" "")
|
11424 |
|
|
(call (mem:QI (match_operand:P 1 "call_insn_operand" "zw"))
|
11425 |
|
|
(match_operand 2 "" "")))]
|
11426 |
|
|
"!SIBLING_CALL_P (insn)"
|
11427 |
|
|
"* return ix86_output_call_insn (insn, operands[1]);"
|
11428 |
|
|
[(set_attr "type" "callv")])
|
11429 |
|
|
|
11430 |
|
|
(define_insn_and_split "*sibcall_value_vzeroupper"
|
11431 |
|
|
[(set (match_operand 0 "" "")
|
11432 |
|
|
(call (mem:QI (match_operand:P 1 "sibcall_insn_operand" "Uz"))
|
11433 |
|
|
(match_operand 2 "" "")))
|
11434 |
|
|
(unspec [(match_operand 3 "const_int_operand" "")]
|
11435 |
|
|
UNSPEC_CALL_NEEDS_VZEROUPPER)]
|
11436 |
|
|
"TARGET_VZEROUPPER && SIBLING_CALL_P (insn)"
|
11437 |
|
|
"#"
|
11438 |
|
|
"&& reload_completed"
|
11439 |
|
|
[(const_int 0)]
|
11440 |
|
|
"ix86_split_call_vzeroupper (curr_insn, operands[3]); DONE;"
|
11441 |
|
|
[(set_attr "type" "callv")])
|
11442 |
|
|
|
11443 |
|
|
(define_insn "*sibcall_value"
|
11444 |
|
|
[(set (match_operand 0 "" "")
|
11445 |
|
|
(call (mem:QI (match_operand:P 1 "sibcall_insn_operand" "Uz"))
|
11446 |
|
|
(match_operand 2 "" "")))]
|
11447 |
|
|
"SIBLING_CALL_P (insn)"
|
11448 |
|
|
"* return ix86_output_call_insn (insn, operands[1]);"
|
11449 |
|
|
[(set_attr "type" "callv")])
|
11450 |
|
|
|
11451 |
|
|
(define_insn_and_split "*call_value_rex64_ms_sysv_vzeroupper"
|
11452 |
|
|
[(set (match_operand 0 "" "")
|
11453 |
|
|
(call (mem:QI (match_operand:DI 1 "call_insn_operand" "rzw"))
|
11454 |
|
|
(match_operand 2 "" "")))
|
11455 |
|
|
(unspec [(const_int 0)] UNSPEC_MS_TO_SYSV_CALL)
|
11456 |
|
|
(clobber (reg:TI XMM6_REG))
|
11457 |
|
|
(clobber (reg:TI XMM7_REG))
|
11458 |
|
|
(clobber (reg:TI XMM8_REG))
|
11459 |
|
|
(clobber (reg:TI XMM9_REG))
|
11460 |
|
|
(clobber (reg:TI XMM10_REG))
|
11461 |
|
|
(clobber (reg:TI XMM11_REG))
|
11462 |
|
|
(clobber (reg:TI XMM12_REG))
|
11463 |
|
|
(clobber (reg:TI XMM13_REG))
|
11464 |
|
|
(clobber (reg:TI XMM14_REG))
|
11465 |
|
|
(clobber (reg:TI XMM15_REG))
|
11466 |
|
|
(clobber (reg:DI SI_REG))
|
11467 |
|
|
(clobber (reg:DI DI_REG))
|
11468 |
|
|
(unspec [(match_operand 3 "const_int_operand" "")]
|
11469 |
|
|
UNSPEC_CALL_NEEDS_VZEROUPPER)]
|
11470 |
|
|
"TARGET_VZEROUPPER && TARGET_64BIT && !SIBLING_CALL_P (insn)"
|
11471 |
|
|
"#"
|
11472 |
|
|
"&& reload_completed"
|
11473 |
|
|
[(const_int 0)]
|
11474 |
|
|
"ix86_split_call_vzeroupper (curr_insn, operands[3]); DONE;"
|
11475 |
|
|
[(set_attr "type" "callv")])
|
11476 |
|
|
|
11477 |
|
|
(define_insn "*call_value_rex64_ms_sysv"
|
11478 |
|
|
[(set (match_operand 0 "" "")
|
11479 |
|
|
(call (mem:QI (match_operand:DI 1 "call_insn_operand" "rzw"))
|
11480 |
|
|
(match_operand 2 "" "")))
|
11481 |
|
|
(unspec [(const_int 0)] UNSPEC_MS_TO_SYSV_CALL)
|
11482 |
|
|
(clobber (reg:TI XMM6_REG))
|
11483 |
|
|
(clobber (reg:TI XMM7_REG))
|
11484 |
|
|
(clobber (reg:TI XMM8_REG))
|
11485 |
|
|
(clobber (reg:TI XMM9_REG))
|
11486 |
|
|
(clobber (reg:TI XMM10_REG))
|
11487 |
|
|
(clobber (reg:TI XMM11_REG))
|
11488 |
|
|
(clobber (reg:TI XMM12_REG))
|
11489 |
|
|
(clobber (reg:TI XMM13_REG))
|
11490 |
|
|
(clobber (reg:TI XMM14_REG))
|
11491 |
|
|
(clobber (reg:TI XMM15_REG))
|
11492 |
|
|
(clobber (reg:DI SI_REG))
|
11493 |
|
|
(clobber (reg:DI DI_REG))]
|
11494 |
|
|
"TARGET_64BIT && !SIBLING_CALL_P (insn)"
|
11495 |
|
|
"* return ix86_output_call_insn (insn, operands[1]);"
|
11496 |
|
|
[(set_attr "type" "callv")])
|
11497 |
|
|
|
11498 |
|
|
(define_expand "call_value_pop"
|
11499 |
|
|
[(parallel [(set (match_operand 0 "" "")
|
11500 |
|
|
(call (match_operand:QI 1 "" "")
|
11501 |
|
|
(match_operand:SI 2 "" "")))
|
11502 |
|
|
(set (reg:SI SP_REG)
|
11503 |
|
|
(plus:SI (reg:SI SP_REG)
|
11504 |
|
|
(match_operand:SI 4 "" "")))])]
|
11505 |
|
|
"!TARGET_64BIT"
|
11506 |
|
|
{
|
11507 |
|
|
ix86_expand_call (operands[0], operands[1], operands[2],
|
11508 |
|
|
operands[3], operands[4], false);
|
11509 |
|
|
DONE;
|
11510 |
|
|
})
|
11511 |
|
|
|
11512 |
|
|
(define_insn_and_split "*call_value_pop_vzeroupper"
|
11513 |
|
|
[(set (match_operand 0 "" "")
|
11514 |
|
|
(call (mem:QI (match_operand:SI 1 "call_insn_operand" "lzm"))
|
11515 |
|
|
(match_operand 2 "" "")))
|
11516 |
|
|
(set (reg:SI SP_REG)
|
11517 |
|
|
(plus:SI (reg:SI SP_REG)
|
11518 |
|
|
(match_operand:SI 3 "immediate_operand" "i")))
|
11519 |
|
|
(unspec [(match_operand 4 "const_int_operand" "")]
|
11520 |
|
|
UNSPEC_CALL_NEEDS_VZEROUPPER)]
|
11521 |
|
|
"TARGET_VZEROUPPER && !TARGET_64BIT && !SIBLING_CALL_P (insn)"
|
11522 |
|
|
"#"
|
11523 |
|
|
"&& reload_completed"
|
11524 |
|
|
[(const_int 0)]
|
11525 |
|
|
"ix86_split_call_vzeroupper (curr_insn, operands[4]); DONE;"
|
11526 |
|
|
[(set_attr "type" "callv")])
|
11527 |
|
|
|
11528 |
|
|
(define_insn "*call_value_pop"
|
11529 |
|
|
[(set (match_operand 0 "" "")
|
11530 |
|
|
(call (mem:QI (match_operand:SI 1 "call_insn_operand" "lzm"))
|
11531 |
|
|
(match_operand 2 "" "")))
|
11532 |
|
|
(set (reg:SI SP_REG)
|
11533 |
|
|
(plus:SI (reg:SI SP_REG)
|
11534 |
|
|
(match_operand:SI 3 "immediate_operand" "i")))]
|
11535 |
|
|
"!TARGET_64BIT && !SIBLING_CALL_P (insn)"
|
11536 |
|
|
"* return ix86_output_call_insn (insn, operands[1]);"
|
11537 |
|
|
[(set_attr "type" "callv")])
|
11538 |
|
|
|
11539 |
|
|
(define_insn_and_split "*sibcall_value_pop_vzeroupper"
|
11540 |
|
|
[(set (match_operand 0 "" "")
|
11541 |
|
|
(call (mem:QI (match_operand:SI 1 "sibcall_insn_operand" "Uz"))
|
11542 |
|
|
(match_operand 2 "" "")))
|
11543 |
|
|
(set (reg:SI SP_REG)
|
11544 |
|
|
(plus:SI (reg:SI SP_REG)
|
11545 |
|
|
(match_operand:SI 3 "immediate_operand" "i")))
|
11546 |
|
|
(unspec [(match_operand 4 "const_int_operand" "")]
|
11547 |
|
|
UNSPEC_CALL_NEEDS_VZEROUPPER)]
|
11548 |
|
|
"TARGET_VZEROUPPER && !TARGET_64BIT && SIBLING_CALL_P (insn)"
|
11549 |
|
|
"#"
|
11550 |
|
|
"&& reload_completed"
|
11551 |
|
|
[(const_int 0)]
|
11552 |
|
|
"ix86_split_call_vzeroupper (curr_insn, operands[4]); DONE;"
|
11553 |
|
|
[(set_attr "type" "callv")])
|
11554 |
|
|
|
11555 |
|
|
(define_insn "*sibcall_value_pop"
|
11556 |
|
|
[(set (match_operand 0 "" "")
|
11557 |
|
|
(call (mem:QI (match_operand:SI 1 "sibcall_insn_operand" "Uz"))
|
11558 |
|
|
(match_operand 2 "" "")))
|
11559 |
|
|
(set (reg:SI SP_REG)
|
11560 |
|
|
(plus:SI (reg:SI SP_REG)
|
11561 |
|
|
(match_operand:SI 3 "immediate_operand" "i")))]
|
11562 |
|
|
"!TARGET_64BIT && SIBLING_CALL_P (insn)"
|
11563 |
|
|
"* return ix86_output_call_insn (insn, operands[1]);"
|
11564 |
|
|
[(set_attr "type" "callv")])
|
11565 |
|
|
|
11566 |
|
|
;; Call subroutine returning any type.
|
11567 |
|
|
|
11568 |
|
|
(define_expand "untyped_call"
|
11569 |
|
|
[(parallel [(call (match_operand 0 "" "")
|
11570 |
|
|
(const_int 0))
|
11571 |
|
|
(match_operand 1 "" "")
|
11572 |
|
|
(match_operand 2 "" "")])]
|
11573 |
|
|
""
|
11574 |
|
|
{
|
11575 |
|
|
int i;
|
11576 |
|
|
|
11577 |
|
|
/* In order to give reg-stack an easier job in validating two
|
11578 |
|
|
coprocessor registers as containing a possible return value,
|
11579 |
|
|
simply pretend the untyped call returns a complex long double
|
11580 |
|
|
value.
|
11581 |
|
|
|
11582 |
|
|
We can't use SSE_REGPARM_MAX here since callee is unprototyped
|
11583 |
|
|
and should have the default ABI. */
|
11584 |
|
|
|
11585 |
|
|
ix86_expand_call ((TARGET_FLOAT_RETURNS_IN_80387
|
11586 |
|
|
? gen_rtx_REG (XCmode, FIRST_FLOAT_REG) : NULL),
|
11587 |
|
|
operands[0], const0_rtx,
|
11588 |
|
|
GEN_INT ((TARGET_64BIT
|
11589 |
|
|
? (ix86_abi == SYSV_ABI
|
11590 |
|
|
? X86_64_SSE_REGPARM_MAX
|
11591 |
|
|
: X86_64_MS_SSE_REGPARM_MAX)
|
11592 |
|
|
: X86_32_SSE_REGPARM_MAX)
|
11593 |
|
|
- 1),
|
11594 |
|
|
NULL, false);
|
11595 |
|
|
|
11596 |
|
|
for (i = 0; i < XVECLEN (operands[2], 0); i++)
|
11597 |
|
|
{
|
11598 |
|
|
rtx set = XVECEXP (operands[2], 0, i);
|
11599 |
|
|
emit_move_insn (SET_DEST (set), SET_SRC (set));
|
11600 |
|
|
}
|
11601 |
|
|
|
11602 |
|
|
/* The optimizer does not know that the call sets the function value
|
11603 |
|
|
registers we stored in the result block. We avoid problems by
|
11604 |
|
|
claiming that all hard registers are used and clobbered at this
|
11605 |
|
|
point. */
|
11606 |
|
|
emit_insn (gen_blockage ());
|
11607 |
|
|
|
11608 |
|
|
DONE;
|
11609 |
|
|
})
|
11610 |
|
|
|
11611 |
|
|
;; Prologue and epilogue instructions
|
11612 |
|
|
|
11613 |
|
|
;; UNSPEC_VOLATILE is considered to use and clobber all hard registers and
|
11614 |
|
|
;; all of memory. This blocks insns from being moved across this point.
|
11615 |
|
|
|
11616 |
|
|
(define_insn "blockage"
|
11617 |
|
|
[(unspec_volatile [(const_int 0)] UNSPECV_BLOCKAGE)]
|
11618 |
|
|
""
|
11619 |
|
|
""
|
11620 |
|
|
[(set_attr "length" "0")])
|
11621 |
|
|
|
11622 |
|
|
;; Do not schedule instructions accessing memory across this point.
|
11623 |
|
|
|
11624 |
|
|
(define_expand "memory_blockage"
|
11625 |
|
|
[(set (match_dup 0)
|
11626 |
|
|
(unspec:BLK [(match_dup 0)] UNSPEC_MEMORY_BLOCKAGE))]
|
11627 |
|
|
""
|
11628 |
|
|
{
|
11629 |
|
|
operands[0] = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (Pmode));
|
11630 |
|
|
MEM_VOLATILE_P (operands[0]) = 1;
|
11631 |
|
|
})
|
11632 |
|
|
|
11633 |
|
|
(define_insn "*memory_blockage"
|
11634 |
|
|
[(set (match_operand:BLK 0 "" "")
|
11635 |
|
|
(unspec:BLK [(match_dup 0)] UNSPEC_MEMORY_BLOCKAGE))]
|
11636 |
|
|
""
|
11637 |
|
|
""
|
11638 |
|
|
[(set_attr "length" "0")])
|
11639 |
|
|
|
11640 |
|
|
;; As USE insns aren't meaningful after reload, this is used instead
|
11641 |
|
|
;; to prevent deleting instructions setting registers for PIC code
|
11642 |
|
|
(define_insn "prologue_use"
|
11643 |
|
|
[(unspec_volatile [(match_operand 0 "" "")] UNSPECV_PROLOGUE_USE)]
|
11644 |
|
|
""
|
11645 |
|
|
""
|
11646 |
|
|
[(set_attr "length" "0")])
|
11647 |
|
|
|
11648 |
|
|
;; Insn emitted into the body of a function to return from a function.
|
11649 |
|
|
;; This is only done if the function's epilogue is known to be simple.
|
11650 |
|
|
;; See comments for ix86_can_use_return_insn_p in i386.c.
|
11651 |
|
|
|
11652 |
|
|
(define_expand "return"
|
11653 |
|
|
[(simple_return)]
|
11654 |
|
|
"ix86_can_use_return_insn_p ()"
|
11655 |
|
|
{
|
11656 |
|
|
ix86_maybe_emit_epilogue_vzeroupper ();
|
11657 |
|
|
if (crtl->args.pops_args)
|
11658 |
|
|
{
|
11659 |
|
|
rtx popc = GEN_INT (crtl->args.pops_args);
|
11660 |
|
|
emit_jump_insn (gen_simple_return_pop_internal (popc));
|
11661 |
|
|
DONE;
|
11662 |
|
|
}
|
11663 |
|
|
})
|
11664 |
|
|
|
11665 |
|
|
;; We need to disable this for TARGET_SEH, as otherwise
|
11666 |
|
|
;; shrink-wrapped prologue gets enabled too. This might exceed
|
11667 |
|
|
;; the maximum size of prologue in unwind information.
|
11668 |
|
|
|
11669 |
|
|
(define_expand "simple_return"
|
11670 |
|
|
[(simple_return)]
|
11671 |
|
|
"!TARGET_SEH"
|
11672 |
|
|
{
|
11673 |
|
|
ix86_maybe_emit_epilogue_vzeroupper ();
|
11674 |
|
|
if (crtl->args.pops_args)
|
11675 |
|
|
{
|
11676 |
|
|
rtx popc = GEN_INT (crtl->args.pops_args);
|
11677 |
|
|
emit_jump_insn (gen_simple_return_pop_internal (popc));
|
11678 |
|
|
DONE;
|
11679 |
|
|
}
|
11680 |
|
|
})
|
11681 |
|
|
|
11682 |
|
|
(define_insn "simple_return_internal"
|
11683 |
|
|
[(simple_return)]
|
11684 |
|
|
"reload_completed"
|
11685 |
|
|
"ret"
|
11686 |
|
|
[(set_attr "length" "1")
|
11687 |
|
|
(set_attr "atom_unit" "jeu")
|
11688 |
|
|
(set_attr "length_immediate" "0")
|
11689 |
|
|
(set_attr "modrm" "0")])
|
11690 |
|
|
|
11691 |
|
|
;; Used by x86_machine_dependent_reorg to avoid penalty on single byte RET
|
11692 |
|
|
;; instruction Athlon and K8 have.
|
11693 |
|
|
|
11694 |
|
|
(define_insn "simple_return_internal_long"
|
11695 |
|
|
[(simple_return)
|
11696 |
|
|
(unspec [(const_int 0)] UNSPEC_REP)]
|
11697 |
|
|
"reload_completed"
|
11698 |
|
|
"rep\;ret"
|
11699 |
|
|
[(set_attr "length" "2")
|
11700 |
|
|
(set_attr "atom_unit" "jeu")
|
11701 |
|
|
(set_attr "length_immediate" "0")
|
11702 |
|
|
(set_attr "prefix_rep" "1")
|
11703 |
|
|
(set_attr "modrm" "0")])
|
11704 |
|
|
|
11705 |
|
|
(define_insn "simple_return_pop_internal"
|
11706 |
|
|
[(simple_return)
|
11707 |
|
|
(use (match_operand:SI 0 "const_int_operand" ""))]
|
11708 |
|
|
"reload_completed"
|
11709 |
|
|
"ret\t%0"
|
11710 |
|
|
[(set_attr "length" "3")
|
11711 |
|
|
(set_attr "atom_unit" "jeu")
|
11712 |
|
|
(set_attr "length_immediate" "2")
|
11713 |
|
|
(set_attr "modrm" "0")])
|
11714 |
|
|
|
11715 |
|
|
(define_insn "simple_return_indirect_internal"
|
11716 |
|
|
[(simple_return)
|
11717 |
|
|
(use (match_operand:SI 0 "register_operand" "r"))]
|
11718 |
|
|
"reload_completed"
|
11719 |
|
|
"jmp\t%A0"
|
11720 |
|
|
[(set_attr "type" "ibr")
|
11721 |
|
|
(set_attr "length_immediate" "0")])
|
11722 |
|
|
|
11723 |
|
|
(define_insn "nop"
|
11724 |
|
|
[(const_int 0)]
|
11725 |
|
|
""
|
11726 |
|
|
"nop"
|
11727 |
|
|
[(set_attr "length" "1")
|
11728 |
|
|
(set_attr "length_immediate" "0")
|
11729 |
|
|
(set_attr "modrm" "0")])
|
11730 |
|
|
|
11731 |
|
|
;; Generate nops. Operand 0 is the number of nops, up to 8.
|
11732 |
|
|
(define_insn "nops"
|
11733 |
|
|
[(unspec_volatile [(match_operand 0 "const_int_operand" "")]
|
11734 |
|
|
UNSPECV_NOPS)]
|
11735 |
|
|
"reload_completed"
|
11736 |
|
|
{
|
11737 |
|
|
int num = INTVAL (operands[0]);
|
11738 |
|
|
|
11739 |
|
|
gcc_assert (num >= 1 && num <= 8);
|
11740 |
|
|
|
11741 |
|
|
while (num--)
|
11742 |
|
|
fputs ("\tnop\n", asm_out_file);
|
11743 |
|
|
|
11744 |
|
|
return "";
|
11745 |
|
|
}
|
11746 |
|
|
[(set (attr "length") (symbol_ref "INTVAL (operands[0])"))
|
11747 |
|
|
(set_attr "length_immediate" "0")
|
11748 |
|
|
(set_attr "modrm" "0")])
|
11749 |
|
|
|
11750 |
|
|
;; Pad to 16-byte boundary, max skip in op0. Used to avoid
|
11751 |
|
|
;; branch prediction penalty for the third jump in a 16-byte
|
11752 |
|
|
;; block on K8.
|
11753 |
|
|
|
11754 |
|
|
(define_insn "pad"
|
11755 |
|
|
[(unspec_volatile [(match_operand 0 "" "")] UNSPECV_ALIGN)]
|
11756 |
|
|
""
|
11757 |
|
|
{
|
11758 |
|
|
#ifdef ASM_OUTPUT_MAX_SKIP_PAD
|
11759 |
|
|
ASM_OUTPUT_MAX_SKIP_PAD (asm_out_file, 4, (int)INTVAL (operands[0]));
|
11760 |
|
|
#else
|
11761 |
|
|
/* It is tempting to use ASM_OUTPUT_ALIGN here, but we don't want to do that.
|
11762 |
|
|
The align insn is used to avoid 3 jump instructions in the row to improve
|
11763 |
|
|
branch prediction and the benefits hardly outweigh the cost of extra 8
|
11764 |
|
|
nops on the average inserted by full alignment pseudo operation. */
|
11765 |
|
|
#endif
|
11766 |
|
|
return "";
|
11767 |
|
|
}
|
11768 |
|
|
[(set_attr "length" "16")])
|
11769 |
|
|
|
11770 |
|
|
(define_expand "prologue"
|
11771 |
|
|
[(const_int 0)]
|
11772 |
|
|
""
|
11773 |
|
|
"ix86_expand_prologue (); DONE;")
|
11774 |
|
|
|
11775 |
|
|
(define_insn "set_got"
|
11776 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
11777 |
|
|
(unspec:SI [(const_int 0)] UNSPEC_SET_GOT))
|
11778 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
11779 |
|
|
"!TARGET_64BIT"
|
11780 |
|
|
"* return output_set_got (operands[0], NULL_RTX);"
|
11781 |
|
|
[(set_attr "type" "multi")
|
11782 |
|
|
(set_attr "length" "12")])
|
11783 |
|
|
|
11784 |
|
|
(define_insn "set_got_labelled"
|
11785 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
11786 |
|
|
(unspec:SI [(label_ref (match_operand 1 "" ""))]
|
11787 |
|
|
UNSPEC_SET_GOT))
|
11788 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
11789 |
|
|
"!TARGET_64BIT"
|
11790 |
|
|
"* return output_set_got (operands[0], operands[1]);"
|
11791 |
|
|
[(set_attr "type" "multi")
|
11792 |
|
|
(set_attr "length" "12")])
|
11793 |
|
|
|
11794 |
|
|
(define_insn "set_got_rex64"
|
11795 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
11796 |
|
|
(unspec:DI [(const_int 0)] UNSPEC_SET_GOT))]
|
11797 |
|
|
"TARGET_64BIT"
|
11798 |
|
|
"lea{q}\t{_GLOBAL_OFFSET_TABLE_(%%rip), %0|%0, _GLOBAL_OFFSET_TABLE_[rip]}"
|
11799 |
|
|
[(set_attr "type" "lea")
|
11800 |
|
|
(set_attr "length_address" "4")
|
11801 |
|
|
(set_attr "mode" "DI")])
|
11802 |
|
|
|
11803 |
|
|
(define_insn "set_rip_rex64"
|
11804 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
11805 |
|
|
(unspec:DI [(label_ref (match_operand 1 "" ""))] UNSPEC_SET_RIP))]
|
11806 |
|
|
"TARGET_64BIT"
|
11807 |
|
|
"lea{q}\t{%l1(%%rip), %0|%0, %l1[rip]}"
|
11808 |
|
|
[(set_attr "type" "lea")
|
11809 |
|
|
(set_attr "length_address" "4")
|
11810 |
|
|
(set_attr "mode" "DI")])
|
11811 |
|
|
|
11812 |
|
|
(define_insn "set_got_offset_rex64"
|
11813 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
11814 |
|
|
(unspec:DI
|
11815 |
|
|
[(label_ref (match_operand 1 "" ""))]
|
11816 |
|
|
UNSPEC_SET_GOT_OFFSET))]
|
11817 |
|
|
"TARGET_LP64"
|
11818 |
|
|
"movabs{q}\t{$_GLOBAL_OFFSET_TABLE_-%l1, %0|%0, OFFSET FLAT:_GLOBAL_OFFSET_TABLE_-%l1}"
|
11819 |
|
|
[(set_attr "type" "imov")
|
11820 |
|
|
(set_attr "length_immediate" "0")
|
11821 |
|
|
(set_attr "length_address" "8")
|
11822 |
|
|
(set_attr "mode" "DI")])
|
11823 |
|
|
|
11824 |
|
|
(define_expand "epilogue"
|
11825 |
|
|
[(const_int 0)]
|
11826 |
|
|
""
|
11827 |
|
|
"ix86_expand_epilogue (1); DONE;")
|
11828 |
|
|
|
11829 |
|
|
(define_expand "sibcall_epilogue"
|
11830 |
|
|
[(const_int 0)]
|
11831 |
|
|
""
|
11832 |
|
|
"ix86_expand_epilogue (0); DONE;")
|
11833 |
|
|
|
11834 |
|
|
(define_expand "eh_return"
|
11835 |
|
|
[(use (match_operand 0 "register_operand" ""))]
|
11836 |
|
|
""
|
11837 |
|
|
{
|
11838 |
|
|
rtx tmp, sa = EH_RETURN_STACKADJ_RTX, ra = operands[0];
|
11839 |
|
|
|
11840 |
|
|
/* Tricky bit: we write the address of the handler to which we will
|
11841 |
|
|
be returning into someone else's stack frame, one word below the
|
11842 |
|
|
stack address we wish to restore. */
|
11843 |
|
|
tmp = gen_rtx_PLUS (Pmode, arg_pointer_rtx, sa);
|
11844 |
|
|
tmp = plus_constant (tmp, -UNITS_PER_WORD);
|
11845 |
|
|
tmp = gen_rtx_MEM (Pmode, tmp);
|
11846 |
|
|
emit_move_insn (tmp, ra);
|
11847 |
|
|
|
11848 |
|
|
emit_jump_insn (gen_eh_return_internal ());
|
11849 |
|
|
emit_barrier ();
|
11850 |
|
|
DONE;
|
11851 |
|
|
})
|
11852 |
|
|
|
11853 |
|
|
(define_insn_and_split "eh_return_internal"
|
11854 |
|
|
[(eh_return)]
|
11855 |
|
|
""
|
11856 |
|
|
"#"
|
11857 |
|
|
"epilogue_completed"
|
11858 |
|
|
[(const_int 0)]
|
11859 |
|
|
"ix86_expand_epilogue (2); DONE;")
|
11860 |
|
|
|
11861 |
|
|
(define_insn "leave"
|
11862 |
|
|
[(set (reg:SI SP_REG) (plus:SI (reg:SI BP_REG) (const_int 4)))
|
11863 |
|
|
(set (reg:SI BP_REG) (mem:SI (reg:SI BP_REG)))
|
11864 |
|
|
(clobber (mem:BLK (scratch)))]
|
11865 |
|
|
"!TARGET_64BIT"
|
11866 |
|
|
"leave"
|
11867 |
|
|
[(set_attr "type" "leave")])
|
11868 |
|
|
|
11869 |
|
|
(define_insn "leave_rex64"
|
11870 |
|
|
[(set (reg:DI SP_REG) (plus:DI (reg:DI BP_REG) (const_int 8)))
|
11871 |
|
|
(set (reg:DI BP_REG) (mem:DI (reg:DI BP_REG)))
|
11872 |
|
|
(clobber (mem:BLK (scratch)))]
|
11873 |
|
|
"TARGET_64BIT"
|
11874 |
|
|
"leave"
|
11875 |
|
|
[(set_attr "type" "leave")])
|
11876 |
|
|
|
11877 |
|
|
;; Handle -fsplit-stack.
|
11878 |
|
|
|
11879 |
|
|
(define_expand "split_stack_prologue"
|
11880 |
|
|
[(const_int 0)]
|
11881 |
|
|
""
|
11882 |
|
|
{
|
11883 |
|
|
ix86_expand_split_stack_prologue ();
|
11884 |
|
|
DONE;
|
11885 |
|
|
})
|
11886 |
|
|
|
11887 |
|
|
;; In order to support the call/return predictor, we use a return
|
11888 |
|
|
;; instruction which the middle-end doesn't see.
|
11889 |
|
|
(define_insn "split_stack_return"
|
11890 |
|
|
[(unspec_volatile [(match_operand:SI 0 "const_int_operand" "")]
|
11891 |
|
|
UNSPECV_SPLIT_STACK_RETURN)]
|
11892 |
|
|
""
|
11893 |
|
|
{
|
11894 |
|
|
if (operands[0] == const0_rtx)
|
11895 |
|
|
return "ret";
|
11896 |
|
|
else
|
11897 |
|
|
return "ret\t%0";
|
11898 |
|
|
}
|
11899 |
|
|
[(set_attr "atom_unit" "jeu")
|
11900 |
|
|
(set_attr "modrm" "0")
|
11901 |
|
|
(set (attr "length")
|
11902 |
|
|
(if_then_else (match_operand:SI 0 "const0_operand" "")
|
11903 |
|
|
(const_int 1)
|
11904 |
|
|
(const_int 3)))
|
11905 |
|
|
(set (attr "length_immediate")
|
11906 |
|
|
(if_then_else (match_operand:SI 0 "const0_operand" "")
|
11907 |
|
|
(const_int 0)
|
11908 |
|
|
(const_int 2)))])
|
11909 |
|
|
|
11910 |
|
|
;; If there are operand 0 bytes available on the stack, jump to
|
11911 |
|
|
;; operand 1.
|
11912 |
|
|
|
11913 |
|
|
(define_expand "split_stack_space_check"
|
11914 |
|
|
[(set (pc) (if_then_else
|
11915 |
|
|
(ltu (minus (reg SP_REG)
|
11916 |
|
|
(match_operand 0 "register_operand" ""))
|
11917 |
|
|
(unspec [(const_int 0)] UNSPEC_STACK_CHECK))
|
11918 |
|
|
(label_ref (match_operand 1 "" ""))
|
11919 |
|
|
(pc)))]
|
11920 |
|
|
""
|
11921 |
|
|
{
|
11922 |
|
|
rtx reg, size, limit;
|
11923 |
|
|
|
11924 |
|
|
reg = gen_reg_rtx (Pmode);
|
11925 |
|
|
size = force_reg (Pmode, operands[0]);
|
11926 |
|
|
emit_insn (gen_sub3_insn (reg, stack_pointer_rtx, size));
|
11927 |
|
|
limit = gen_rtx_UNSPEC (Pmode, gen_rtvec (1, const0_rtx),
|
11928 |
|
|
UNSPEC_STACK_CHECK);
|
11929 |
|
|
limit = gen_rtx_MEM (Pmode, gen_rtx_CONST (Pmode, limit));
|
11930 |
|
|
ix86_expand_branch (GEU, reg, limit, operands[1]);
|
11931 |
|
|
|
11932 |
|
|
DONE;
|
11933 |
|
|
})
|
11934 |
|
|
|
11935 |
|
|
;; Bit manipulation instructions.
|
11936 |
|
|
|
11937 |
|
|
(define_expand "ffs2"
|
11938 |
|
|
[(set (match_dup 2) (const_int -1))
|
11939 |
|
|
(parallel [(set (reg:CCZ FLAGS_REG)
|
11940 |
|
|
(compare:CCZ
|
11941 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "")
|
11942 |
|
|
(const_int 0)))
|
11943 |
|
|
(set (match_operand:SWI48 0 "register_operand" "")
|
11944 |
|
|
(ctz:SWI48 (match_dup 1)))])
|
11945 |
|
|
(set (match_dup 0) (if_then_else:SWI48
|
11946 |
|
|
(eq (reg:CCZ FLAGS_REG) (const_int 0))
|
11947 |
|
|
(match_dup 2)
|
11948 |
|
|
(match_dup 0)))
|
11949 |
|
|
(parallel [(set (match_dup 0) (plus:SWI48 (match_dup 0) (const_int 1)))
|
11950 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
11951 |
|
|
""
|
11952 |
|
|
{
|
11953 |
|
|
if (mode == SImode && !TARGET_CMOVE)
|
11954 |
|
|
{
|
11955 |
|
|
emit_insn (gen_ffssi2_no_cmove (operands[0], operands [1]));
|
11956 |
|
|
DONE;
|
11957 |
|
|
}
|
11958 |
|
|
operands[2] = gen_reg_rtx (mode);
|
11959 |
|
|
})
|
11960 |
|
|
|
11961 |
|
|
(define_insn_and_split "ffssi2_no_cmove"
|
11962 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
11963 |
|
|
(ffs:SI (match_operand:SI 1 "nonimmediate_operand" "rm")))
|
11964 |
|
|
(clobber (match_scratch:SI 2 "=&q"))
|
11965 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
11966 |
|
|
"!TARGET_CMOVE"
|
11967 |
|
|
"#"
|
11968 |
|
|
"&& reload_completed"
|
11969 |
|
|
[(parallel [(set (reg:CCZ FLAGS_REG)
|
11970 |
|
|
(compare:CCZ (match_dup 1) (const_int 0)))
|
11971 |
|
|
(set (match_dup 0) (ctz:SI (match_dup 1)))])
|
11972 |
|
|
(set (strict_low_part (match_dup 3))
|
11973 |
|
|
(eq:QI (reg:CCZ FLAGS_REG) (const_int 0)))
|
11974 |
|
|
(parallel [(set (match_dup 2) (neg:SI (match_dup 2)))
|
11975 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
11976 |
|
|
(parallel [(set (match_dup 0) (ior:SI (match_dup 0) (match_dup 2)))
|
11977 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
11978 |
|
|
(parallel [(set (match_dup 0) (plus:SI (match_dup 0) (const_int 1)))
|
11979 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
11980 |
|
|
{
|
11981 |
|
|
operands[3] = gen_lowpart (QImode, operands[2]);
|
11982 |
|
|
ix86_expand_clear (operands[2]);
|
11983 |
|
|
})
|
11984 |
|
|
|
11985 |
|
|
(define_insn "*ffs_1"
|
11986 |
|
|
[(set (reg:CCZ FLAGS_REG)
|
11987 |
|
|
(compare:CCZ (match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
11988 |
|
|
(const_int 0)))
|
11989 |
|
|
(set (match_operand:SWI48 0 "register_operand" "=r")
|
11990 |
|
|
(ctz:SWI48 (match_dup 1)))]
|
11991 |
|
|
""
|
11992 |
|
|
"bsf{}\t{%1, %0|%0, %1}"
|
11993 |
|
|
[(set_attr "type" "alu1")
|
11994 |
|
|
(set_attr "prefix_0f" "1")
|
11995 |
|
|
(set_attr "mode" "")])
|
11996 |
|
|
|
11997 |
|
|
(define_insn "ctz2"
|
11998 |
|
|
[(set (match_operand:SWI248 0 "register_operand" "=r")
|
11999 |
|
|
(ctz:SWI248 (match_operand:SWI248 1 "nonimmediate_operand" "rm")))
|
12000 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12001 |
|
|
""
|
12002 |
|
|
{
|
12003 |
|
|
if (TARGET_BMI)
|
12004 |
|
|
return "tzcnt{}\t{%1, %0|%0, %1}";
|
12005 |
|
|
else
|
12006 |
|
|
return "bsf{}\t{%1, %0|%0, %1}";
|
12007 |
|
|
}
|
12008 |
|
|
[(set_attr "type" "alu1")
|
12009 |
|
|
(set_attr "prefix_0f" "1")
|
12010 |
|
|
(set (attr "prefix_rep") (symbol_ref "TARGET_BMI"))
|
12011 |
|
|
(set_attr "mode" "")])
|
12012 |
|
|
|
12013 |
|
|
(define_expand "clz2"
|
12014 |
|
|
[(parallel
|
12015 |
|
|
[(set (match_operand:SWI248 0 "register_operand" "")
|
12016 |
|
|
(minus:SWI248
|
12017 |
|
|
(match_dup 2)
|
12018 |
|
|
(clz:SWI248 (match_operand:SWI248 1 "nonimmediate_operand" ""))))
|
12019 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
12020 |
|
|
(parallel
|
12021 |
|
|
[(set (match_dup 0) (xor:SWI248 (match_dup 0) (match_dup 2)))
|
12022 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
12023 |
|
|
""
|
12024 |
|
|
{
|
12025 |
|
|
if (TARGET_LZCNT)
|
12026 |
|
|
{
|
12027 |
|
|
emit_insn (gen_clz2_lzcnt (operands[0], operands[1]));
|
12028 |
|
|
DONE;
|
12029 |
|
|
}
|
12030 |
|
|
operands[2] = GEN_INT (GET_MODE_BITSIZE (mode)-1);
|
12031 |
|
|
})
|
12032 |
|
|
|
12033 |
|
|
(define_insn "clz2_lzcnt"
|
12034 |
|
|
[(set (match_operand:SWI248 0 "register_operand" "=r")
|
12035 |
|
|
(clz:SWI248 (match_operand:SWI248 1 "nonimmediate_operand" "rm")))
|
12036 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12037 |
|
|
"TARGET_LZCNT"
|
12038 |
|
|
"lzcnt{}\t{%1, %0|%0, %1}"
|
12039 |
|
|
[(set_attr "prefix_rep" "1")
|
12040 |
|
|
(set_attr "type" "bitmanip")
|
12041 |
|
|
(set_attr "mode" "")])
|
12042 |
|
|
|
12043 |
|
|
;; BMI instructions.
|
12044 |
|
|
(define_insn "*bmi_andn_"
|
12045 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12046 |
|
|
(and:SWI48
|
12047 |
|
|
(not:SWI48
|
12048 |
|
|
(match_operand:SWI48 1 "register_operand" "r"))
|
12049 |
|
|
(match_operand:SWI48 2 "nonimmediate_operand" "rm")))
|
12050 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12051 |
|
|
"TARGET_BMI"
|
12052 |
|
|
"andn\t{%2, %1, %0|%0, %1, %2}"
|
12053 |
|
|
[(set_attr "type" "bitmanip")
|
12054 |
|
|
(set_attr "mode" "")])
|
12055 |
|
|
|
12056 |
|
|
(define_insn "bmi_bextr_"
|
12057 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12058 |
|
|
(unspec:SWI48 [(match_operand:SWI48 1 "register_operand" "r")
|
12059 |
|
|
(match_operand:SWI48 2 "nonimmediate_operand" "rm")]
|
12060 |
|
|
UNSPEC_BEXTR))
|
12061 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12062 |
|
|
"TARGET_BMI"
|
12063 |
|
|
"bextr\t{%2, %1, %0|%0, %1, %2}"
|
12064 |
|
|
[(set_attr "type" "bitmanip")
|
12065 |
|
|
(set_attr "mode" "")])
|
12066 |
|
|
|
12067 |
|
|
(define_insn "*bmi_blsi_"
|
12068 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12069 |
|
|
(and:SWI48
|
12070 |
|
|
(neg:SWI48
|
12071 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm"))
|
12072 |
|
|
(match_dup 1)))
|
12073 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12074 |
|
|
"TARGET_BMI"
|
12075 |
|
|
"blsi\t{%1, %0|%0, %1}"
|
12076 |
|
|
[(set_attr "type" "bitmanip")
|
12077 |
|
|
(set_attr "mode" "")])
|
12078 |
|
|
|
12079 |
|
|
(define_insn "*bmi_blsmsk_"
|
12080 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12081 |
|
|
(xor:SWI48
|
12082 |
|
|
(plus:SWI48
|
12083 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
12084 |
|
|
(const_int -1))
|
12085 |
|
|
(match_dup 1)))
|
12086 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12087 |
|
|
"TARGET_BMI"
|
12088 |
|
|
"blsmsk\t{%1, %0|%0, %1}"
|
12089 |
|
|
[(set_attr "type" "bitmanip")
|
12090 |
|
|
(set_attr "mode" "")])
|
12091 |
|
|
|
12092 |
|
|
(define_insn "*bmi_blsr_"
|
12093 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12094 |
|
|
(and:SWI48
|
12095 |
|
|
(plus:SWI48
|
12096 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
12097 |
|
|
(const_int -1))
|
12098 |
|
|
(match_dup 1)))
|
12099 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12100 |
|
|
"TARGET_BMI"
|
12101 |
|
|
"blsr\t{%1, %0|%0, %1}"
|
12102 |
|
|
[(set_attr "type" "bitmanip")
|
12103 |
|
|
(set_attr "mode" "")])
|
12104 |
|
|
|
12105 |
|
|
;; BMI2 instructions.
|
12106 |
|
|
(define_insn "bmi2_bzhi_3"
|
12107 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12108 |
|
|
(and:SWI48 (match_operand:SWI48 1 "register_operand" "r")
|
12109 |
|
|
(lshiftrt:SWI48 (const_int -1)
|
12110 |
|
|
(match_operand:SWI48 2 "nonimmediate_operand" "rm"))))
|
12111 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12112 |
|
|
"TARGET_BMI2"
|
12113 |
|
|
"bzhi\t{%2, %1, %0|%0, %1, %2}"
|
12114 |
|
|
[(set_attr "type" "bitmanip")
|
12115 |
|
|
(set_attr "prefix" "vex")
|
12116 |
|
|
(set_attr "mode" "")])
|
12117 |
|
|
|
12118 |
|
|
(define_insn "bmi2_pdep_3"
|
12119 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12120 |
|
|
(unspec:SWI48 [(match_operand:SWI48 1 "register_operand" "r")
|
12121 |
|
|
(match_operand:SWI48 2 "nonimmediate_operand" "rm")]
|
12122 |
|
|
UNSPEC_PDEP))]
|
12123 |
|
|
"TARGET_BMI2"
|
12124 |
|
|
"pdep\t{%2, %1, %0|%0, %1, %2}"
|
12125 |
|
|
[(set_attr "type" "bitmanip")
|
12126 |
|
|
(set_attr "prefix" "vex")
|
12127 |
|
|
(set_attr "mode" "")])
|
12128 |
|
|
|
12129 |
|
|
(define_insn "bmi2_pext_3"
|
12130 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12131 |
|
|
(unspec:SWI48 [(match_operand:SWI48 1 "register_operand" "r")
|
12132 |
|
|
(match_operand:SWI48 2 "nonimmediate_operand" "rm")]
|
12133 |
|
|
UNSPEC_PEXT))]
|
12134 |
|
|
"TARGET_BMI2"
|
12135 |
|
|
"pext\t{%2, %1, %0|%0, %1, %2}"
|
12136 |
|
|
[(set_attr "type" "bitmanip")
|
12137 |
|
|
(set_attr "prefix" "vex")
|
12138 |
|
|
(set_attr "mode" "")])
|
12139 |
|
|
|
12140 |
|
|
;; TBM instructions.
|
12141 |
|
|
(define_insn "tbm_bextri_"
|
12142 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12143 |
|
|
(zero_extract:SWI48
|
12144 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
12145 |
|
|
(match_operand:SWI48 2 "const_0_to_255_operand" "n")
|
12146 |
|
|
(match_operand:SWI48 3 "const_0_to_255_operand" "n")))
|
12147 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12148 |
|
|
"TARGET_TBM"
|
12149 |
|
|
{
|
12150 |
|
|
operands[2] = GEN_INT (INTVAL (operands[2]) << 8 | INTVAL (operands[3]));
|
12151 |
|
|
return "bextr\t{%2, %1, %0|%0, %1, %2}";
|
12152 |
|
|
}
|
12153 |
|
|
[(set_attr "type" "bitmanip")
|
12154 |
|
|
(set_attr "mode" "")])
|
12155 |
|
|
|
12156 |
|
|
(define_insn "*tbm_blcfill_"
|
12157 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12158 |
|
|
(and:SWI48
|
12159 |
|
|
(plus:SWI48
|
12160 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
12161 |
|
|
(const_int 1))
|
12162 |
|
|
(match_dup 1)))
|
12163 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12164 |
|
|
"TARGET_TBM"
|
12165 |
|
|
"blcfill\t{%1, %0|%0, %1}"
|
12166 |
|
|
[(set_attr "type" "bitmanip")
|
12167 |
|
|
(set_attr "mode" "")])
|
12168 |
|
|
|
12169 |
|
|
(define_insn "*tbm_blci_"
|
12170 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12171 |
|
|
(ior:SWI48
|
12172 |
|
|
(not:SWI48
|
12173 |
|
|
(plus:SWI48
|
12174 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
12175 |
|
|
(const_int 1)))
|
12176 |
|
|
(match_dup 1)))
|
12177 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12178 |
|
|
"TARGET_TBM"
|
12179 |
|
|
"blci\t{%1, %0|%0, %1}"
|
12180 |
|
|
[(set_attr "type" "bitmanip")
|
12181 |
|
|
(set_attr "mode" "")])
|
12182 |
|
|
|
12183 |
|
|
(define_insn "*tbm_blcic_"
|
12184 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12185 |
|
|
(and:SWI48
|
12186 |
|
|
(plus:SWI48
|
12187 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
12188 |
|
|
(const_int 1))
|
12189 |
|
|
(not:SWI48
|
12190 |
|
|
(match_dup 1))))
|
12191 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12192 |
|
|
"TARGET_TBM"
|
12193 |
|
|
"blcic\t{%1, %0|%0, %1}"
|
12194 |
|
|
[(set_attr "type" "bitmanip")
|
12195 |
|
|
(set_attr "mode" "")])
|
12196 |
|
|
|
12197 |
|
|
(define_insn "*tbm_blcmsk_"
|
12198 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12199 |
|
|
(xor:SWI48
|
12200 |
|
|
(plus:SWI48
|
12201 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
12202 |
|
|
(const_int 1))
|
12203 |
|
|
(match_dup 1)))
|
12204 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12205 |
|
|
"TARGET_TBM"
|
12206 |
|
|
"blcmsk\t{%1, %0|%0, %1}"
|
12207 |
|
|
[(set_attr "type" "bitmanip")
|
12208 |
|
|
(set_attr "mode" "")])
|
12209 |
|
|
|
12210 |
|
|
(define_insn "*tbm_blcs_"
|
12211 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12212 |
|
|
(ior:SWI48
|
12213 |
|
|
(plus:SWI48
|
12214 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
12215 |
|
|
(const_int 1))
|
12216 |
|
|
(match_dup 1)))
|
12217 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12218 |
|
|
"TARGET_TBM"
|
12219 |
|
|
"blcs\t{%1, %0|%0, %1}"
|
12220 |
|
|
[(set_attr "type" "bitmanip")
|
12221 |
|
|
(set_attr "mode" "")])
|
12222 |
|
|
|
12223 |
|
|
(define_insn "*tbm_blsfill_"
|
12224 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12225 |
|
|
(ior:SWI48
|
12226 |
|
|
(plus:SWI48
|
12227 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
12228 |
|
|
(const_int -1))
|
12229 |
|
|
(match_dup 1)))
|
12230 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12231 |
|
|
"TARGET_TBM"
|
12232 |
|
|
"blsfill\t{%1, %0|%0, %1}"
|
12233 |
|
|
[(set_attr "type" "bitmanip")
|
12234 |
|
|
(set_attr "mode" "")])
|
12235 |
|
|
|
12236 |
|
|
(define_insn "*tbm_blsic_"
|
12237 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12238 |
|
|
(ior:SWI48
|
12239 |
|
|
(plus:SWI48
|
12240 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
12241 |
|
|
(const_int -1))
|
12242 |
|
|
(not:SWI48
|
12243 |
|
|
(match_dup 1))))
|
12244 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12245 |
|
|
"TARGET_TBM"
|
12246 |
|
|
"blsic\t{%1, %0|%0, %1}"
|
12247 |
|
|
[(set_attr "type" "bitmanip")
|
12248 |
|
|
(set_attr "mode" "")])
|
12249 |
|
|
|
12250 |
|
|
(define_insn "*tbm_t1mskc_"
|
12251 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12252 |
|
|
(ior:SWI48
|
12253 |
|
|
(plus:SWI48
|
12254 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
12255 |
|
|
(const_int 1))
|
12256 |
|
|
(not:SWI48
|
12257 |
|
|
(match_dup 1))))
|
12258 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12259 |
|
|
"TARGET_TBM"
|
12260 |
|
|
"t1mskc\t{%1, %0|%0, %1}"
|
12261 |
|
|
[(set_attr "type" "bitmanip")
|
12262 |
|
|
(set_attr "mode" "")])
|
12263 |
|
|
|
12264 |
|
|
(define_insn "*tbm_tzmsk_"
|
12265 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12266 |
|
|
(and:SWI48
|
12267 |
|
|
(plus:SWI48
|
12268 |
|
|
(match_operand:SWI48 1 "nonimmediate_operand" "rm")
|
12269 |
|
|
(const_int -1))
|
12270 |
|
|
(not:SWI48
|
12271 |
|
|
(match_dup 1))))
|
12272 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12273 |
|
|
"TARGET_TBM"
|
12274 |
|
|
"tzmsk\t{%1, %0|%0, %1}"
|
12275 |
|
|
[(set_attr "type" "bitmanip")
|
12276 |
|
|
(set_attr "mode" "")])
|
12277 |
|
|
|
12278 |
|
|
(define_insn "bsr_rex64"
|
12279 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
12280 |
|
|
(minus:DI (const_int 63)
|
12281 |
|
|
(clz:DI (match_operand:DI 1 "nonimmediate_operand" "rm"))))
|
12282 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12283 |
|
|
"TARGET_64BIT"
|
12284 |
|
|
"bsr{q}\t{%1, %0|%0, %1}"
|
12285 |
|
|
[(set_attr "type" "alu1")
|
12286 |
|
|
(set_attr "prefix_0f" "1")
|
12287 |
|
|
(set_attr "mode" "DI")])
|
12288 |
|
|
|
12289 |
|
|
(define_insn "bsr"
|
12290 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
12291 |
|
|
(minus:SI (const_int 31)
|
12292 |
|
|
(clz:SI (match_operand:SI 1 "nonimmediate_operand" "rm"))))
|
12293 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12294 |
|
|
""
|
12295 |
|
|
"bsr{l}\t{%1, %0|%0, %1}"
|
12296 |
|
|
[(set_attr "type" "alu1")
|
12297 |
|
|
(set_attr "prefix_0f" "1")
|
12298 |
|
|
(set_attr "mode" "SI")])
|
12299 |
|
|
|
12300 |
|
|
(define_insn "*bsrhi"
|
12301 |
|
|
[(set (match_operand:HI 0 "register_operand" "=r")
|
12302 |
|
|
(minus:HI (const_int 15)
|
12303 |
|
|
(clz:HI (match_operand:HI 1 "nonimmediate_operand" "rm"))))
|
12304 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12305 |
|
|
""
|
12306 |
|
|
"bsr{w}\t{%1, %0|%0, %1}"
|
12307 |
|
|
[(set_attr "type" "alu1")
|
12308 |
|
|
(set_attr "prefix_0f" "1")
|
12309 |
|
|
(set_attr "mode" "HI")])
|
12310 |
|
|
|
12311 |
|
|
(define_insn "popcount2"
|
12312 |
|
|
[(set (match_operand:SWI248 0 "register_operand" "=r")
|
12313 |
|
|
(popcount:SWI248
|
12314 |
|
|
(match_operand:SWI248 1 "nonimmediate_operand" "rm")))
|
12315 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12316 |
|
|
"TARGET_POPCNT"
|
12317 |
|
|
{
|
12318 |
|
|
#if TARGET_MACHO
|
12319 |
|
|
return "popcnt\t{%1, %0|%0, %1}";
|
12320 |
|
|
#else
|
12321 |
|
|
return "popcnt{}\t{%1, %0|%0, %1}";
|
12322 |
|
|
#endif
|
12323 |
|
|
}
|
12324 |
|
|
[(set_attr "prefix_rep" "1")
|
12325 |
|
|
(set_attr "type" "bitmanip")
|
12326 |
|
|
(set_attr "mode" "")])
|
12327 |
|
|
|
12328 |
|
|
(define_insn "*popcount2_cmp"
|
12329 |
|
|
[(set (reg FLAGS_REG)
|
12330 |
|
|
(compare
|
12331 |
|
|
(popcount:SWI248
|
12332 |
|
|
(match_operand:SWI248 1 "nonimmediate_operand" "rm"))
|
12333 |
|
|
(const_int 0)))
|
12334 |
|
|
(set (match_operand:SWI248 0 "register_operand" "=r")
|
12335 |
|
|
(popcount:SWI248 (match_dup 1)))]
|
12336 |
|
|
"TARGET_POPCNT && ix86_match_ccmode (insn, CCZmode)"
|
12337 |
|
|
{
|
12338 |
|
|
#if TARGET_MACHO
|
12339 |
|
|
return "popcnt\t{%1, %0|%0, %1}";
|
12340 |
|
|
#else
|
12341 |
|
|
return "popcnt{}\t{%1, %0|%0, %1}";
|
12342 |
|
|
#endif
|
12343 |
|
|
}
|
12344 |
|
|
[(set_attr "prefix_rep" "1")
|
12345 |
|
|
(set_attr "type" "bitmanip")
|
12346 |
|
|
(set_attr "mode" "")])
|
12347 |
|
|
|
12348 |
|
|
(define_insn "*popcountsi2_cmp_zext"
|
12349 |
|
|
[(set (reg FLAGS_REG)
|
12350 |
|
|
(compare
|
12351 |
|
|
(popcount:SI (match_operand:SI 1 "nonimmediate_operand" "rm"))
|
12352 |
|
|
(const_int 0)))
|
12353 |
|
|
(set (match_operand:DI 0 "register_operand" "=r")
|
12354 |
|
|
(zero_extend:DI(popcount:SI (match_dup 1))))]
|
12355 |
|
|
"TARGET_64BIT && TARGET_POPCNT && ix86_match_ccmode (insn, CCZmode)"
|
12356 |
|
|
{
|
12357 |
|
|
#if TARGET_MACHO
|
12358 |
|
|
return "popcnt\t{%1, %0|%0, %1}";
|
12359 |
|
|
#else
|
12360 |
|
|
return "popcnt{l}\t{%1, %0|%0, %1}";
|
12361 |
|
|
#endif
|
12362 |
|
|
}
|
12363 |
|
|
[(set_attr "prefix_rep" "1")
|
12364 |
|
|
(set_attr "type" "bitmanip")
|
12365 |
|
|
(set_attr "mode" "SI")])
|
12366 |
|
|
|
12367 |
|
|
(define_expand "bswap2"
|
12368 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
12369 |
|
|
(bswap:SWI48 (match_operand:SWI48 1 "register_operand" "")))]
|
12370 |
|
|
""
|
12371 |
|
|
{
|
12372 |
|
|
if (mode == SImode && !(TARGET_BSWAP || TARGET_MOVBE))
|
12373 |
|
|
{
|
12374 |
|
|
rtx x = operands[0];
|
12375 |
|
|
|
12376 |
|
|
emit_move_insn (x, operands[1]);
|
12377 |
|
|
emit_insn (gen_bswaphi_lowpart (gen_lowpart (HImode, x)));
|
12378 |
|
|
emit_insn (gen_rotlsi3 (x, x, GEN_INT (16)));
|
12379 |
|
|
emit_insn (gen_bswaphi_lowpart (gen_lowpart (HImode, x)));
|
12380 |
|
|
DONE;
|
12381 |
|
|
}
|
12382 |
|
|
})
|
12383 |
|
|
|
12384 |
|
|
(define_insn "*bswap2_movbe"
|
12385 |
|
|
[(set (match_operand:SWI48 0 "nonimmediate_operand" "=r,r,m")
|
12386 |
|
|
(bswap:SWI48 (match_operand:SWI48 1 "nonimmediate_operand" "0,m,r")))]
|
12387 |
|
|
"TARGET_MOVBE
|
12388 |
|
|
&& !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
12389 |
|
|
"@
|
12390 |
|
|
bswap\t%0
|
12391 |
|
|
movbe\t{%1, %0|%0, %1}
|
12392 |
|
|
movbe\t{%1, %0|%0, %1}"
|
12393 |
|
|
[(set_attr "type" "bitmanip,imov,imov")
|
12394 |
|
|
(set_attr "modrm" "0,1,1")
|
12395 |
|
|
(set_attr "prefix_0f" "*,1,1")
|
12396 |
|
|
(set_attr "prefix_extra" "*,1,1")
|
12397 |
|
|
(set_attr "mode" "")])
|
12398 |
|
|
|
12399 |
|
|
(define_insn "*bswap2_1"
|
12400 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
12401 |
|
|
(bswap:SWI48 (match_operand:SWI48 1 "register_operand" "0")))]
|
12402 |
|
|
"TARGET_BSWAP"
|
12403 |
|
|
"bswap\t%0"
|
12404 |
|
|
[(set_attr "type" "bitmanip")
|
12405 |
|
|
(set_attr "modrm" "0")
|
12406 |
|
|
(set_attr "mode" "")])
|
12407 |
|
|
|
12408 |
|
|
(define_insn "*bswaphi_lowpart_1"
|
12409 |
|
|
[(set (strict_low_part (match_operand:HI 0 "register_operand" "+Q,r"))
|
12410 |
|
|
(bswap:HI (match_dup 0)))
|
12411 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12412 |
|
|
"TARGET_USE_XCHGB || optimize_function_for_size_p (cfun)"
|
12413 |
|
|
"@
|
12414 |
|
|
xchg{b}\t{%h0, %b0|%b0, %h0}
|
12415 |
|
|
rol{w}\t{$8, %0|%0, 8}"
|
12416 |
|
|
[(set_attr "length" "2,4")
|
12417 |
|
|
(set_attr "mode" "QI,HI")])
|
12418 |
|
|
|
12419 |
|
|
(define_insn "bswaphi_lowpart"
|
12420 |
|
|
[(set (strict_low_part (match_operand:HI 0 "register_operand" "+r"))
|
12421 |
|
|
(bswap:HI (match_dup 0)))
|
12422 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12423 |
|
|
""
|
12424 |
|
|
"rol{w}\t{$8, %0|%0, 8}"
|
12425 |
|
|
[(set_attr "length" "4")
|
12426 |
|
|
(set_attr "mode" "HI")])
|
12427 |
|
|
|
12428 |
|
|
(define_expand "paritydi2"
|
12429 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
12430 |
|
|
(parity:DI (match_operand:DI 1 "register_operand" "")))]
|
12431 |
|
|
"! TARGET_POPCNT"
|
12432 |
|
|
{
|
12433 |
|
|
rtx scratch = gen_reg_rtx (QImode);
|
12434 |
|
|
rtx cond;
|
12435 |
|
|
|
12436 |
|
|
emit_insn (gen_paritydi2_cmp (NULL_RTX, NULL_RTX,
|
12437 |
|
|
NULL_RTX, operands[1]));
|
12438 |
|
|
|
12439 |
|
|
cond = gen_rtx_fmt_ee (ORDERED, QImode,
|
12440 |
|
|
gen_rtx_REG (CCmode, FLAGS_REG),
|
12441 |
|
|
const0_rtx);
|
12442 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, scratch, cond));
|
12443 |
|
|
|
12444 |
|
|
if (TARGET_64BIT)
|
12445 |
|
|
emit_insn (gen_zero_extendqidi2 (operands[0], scratch));
|
12446 |
|
|
else
|
12447 |
|
|
{
|
12448 |
|
|
rtx tmp = gen_reg_rtx (SImode);
|
12449 |
|
|
|
12450 |
|
|
emit_insn (gen_zero_extendqisi2 (tmp, scratch));
|
12451 |
|
|
emit_insn (gen_zero_extendsidi2 (operands[0], tmp));
|
12452 |
|
|
}
|
12453 |
|
|
DONE;
|
12454 |
|
|
})
|
12455 |
|
|
|
12456 |
|
|
(define_expand "paritysi2"
|
12457 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
12458 |
|
|
(parity:SI (match_operand:SI 1 "register_operand" "")))]
|
12459 |
|
|
"! TARGET_POPCNT"
|
12460 |
|
|
{
|
12461 |
|
|
rtx scratch = gen_reg_rtx (QImode);
|
12462 |
|
|
rtx cond;
|
12463 |
|
|
|
12464 |
|
|
emit_insn (gen_paritysi2_cmp (NULL_RTX, NULL_RTX, operands[1]));
|
12465 |
|
|
|
12466 |
|
|
cond = gen_rtx_fmt_ee (ORDERED, QImode,
|
12467 |
|
|
gen_rtx_REG (CCmode, FLAGS_REG),
|
12468 |
|
|
const0_rtx);
|
12469 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, scratch, cond));
|
12470 |
|
|
|
12471 |
|
|
emit_insn (gen_zero_extendqisi2 (operands[0], scratch));
|
12472 |
|
|
DONE;
|
12473 |
|
|
})
|
12474 |
|
|
|
12475 |
|
|
(define_insn_and_split "paritydi2_cmp"
|
12476 |
|
|
[(set (reg:CC FLAGS_REG)
|
12477 |
|
|
(unspec:CC [(match_operand:DI 3 "register_operand" "0")]
|
12478 |
|
|
UNSPEC_PARITY))
|
12479 |
|
|
(clobber (match_scratch:DI 0 "=r"))
|
12480 |
|
|
(clobber (match_scratch:SI 1 "=&r"))
|
12481 |
|
|
(clobber (match_scratch:HI 2 "=Q"))]
|
12482 |
|
|
"! TARGET_POPCNT"
|
12483 |
|
|
"#"
|
12484 |
|
|
"&& reload_completed"
|
12485 |
|
|
[(parallel
|
12486 |
|
|
[(set (match_dup 1)
|
12487 |
|
|
(xor:SI (match_dup 1) (match_dup 4)))
|
12488 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
12489 |
|
|
(parallel
|
12490 |
|
|
[(set (reg:CC FLAGS_REG)
|
12491 |
|
|
(unspec:CC [(match_dup 1)] UNSPEC_PARITY))
|
12492 |
|
|
(clobber (match_dup 1))
|
12493 |
|
|
(clobber (match_dup 2))])]
|
12494 |
|
|
{
|
12495 |
|
|
operands[4] = gen_lowpart (SImode, operands[3]);
|
12496 |
|
|
|
12497 |
|
|
if (TARGET_64BIT)
|
12498 |
|
|
{
|
12499 |
|
|
emit_move_insn (operands[1], gen_lowpart (SImode, operands[3]));
|
12500 |
|
|
emit_insn (gen_lshrdi3 (operands[3], operands[3], GEN_INT (32)));
|
12501 |
|
|
}
|
12502 |
|
|
else
|
12503 |
|
|
operands[1] = gen_highpart (SImode, operands[3]);
|
12504 |
|
|
})
|
12505 |
|
|
|
12506 |
|
|
(define_insn_and_split "paritysi2_cmp"
|
12507 |
|
|
[(set (reg:CC FLAGS_REG)
|
12508 |
|
|
(unspec:CC [(match_operand:SI 2 "register_operand" "0")]
|
12509 |
|
|
UNSPEC_PARITY))
|
12510 |
|
|
(clobber (match_scratch:SI 0 "=r"))
|
12511 |
|
|
(clobber (match_scratch:HI 1 "=&Q"))]
|
12512 |
|
|
"! TARGET_POPCNT"
|
12513 |
|
|
"#"
|
12514 |
|
|
"&& reload_completed"
|
12515 |
|
|
[(parallel
|
12516 |
|
|
[(set (match_dup 1)
|
12517 |
|
|
(xor:HI (match_dup 1) (match_dup 3)))
|
12518 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
12519 |
|
|
(parallel
|
12520 |
|
|
[(set (reg:CC FLAGS_REG)
|
12521 |
|
|
(unspec:CC [(match_dup 1)] UNSPEC_PARITY))
|
12522 |
|
|
(clobber (match_dup 1))])]
|
12523 |
|
|
{
|
12524 |
|
|
operands[3] = gen_lowpart (HImode, operands[2]);
|
12525 |
|
|
|
12526 |
|
|
emit_move_insn (operands[1], gen_lowpart (HImode, operands[2]));
|
12527 |
|
|
emit_insn (gen_lshrsi3 (operands[2], operands[2], GEN_INT (16)));
|
12528 |
|
|
})
|
12529 |
|
|
|
12530 |
|
|
(define_insn "*parityhi2_cmp"
|
12531 |
|
|
[(set (reg:CC FLAGS_REG)
|
12532 |
|
|
(unspec:CC [(match_operand:HI 1 "register_operand" "0")]
|
12533 |
|
|
UNSPEC_PARITY))
|
12534 |
|
|
(clobber (match_scratch:HI 0 "=Q"))]
|
12535 |
|
|
"! TARGET_POPCNT"
|
12536 |
|
|
"xor{b}\t{%h0, %b0|%b0, %h0}"
|
12537 |
|
|
[(set_attr "length" "2")
|
12538 |
|
|
(set_attr "mode" "HI")])
|
12539 |
|
|
|
12540 |
|
|
|
12541 |
|
|
;; Thread-local storage patterns for ELF.
|
12542 |
|
|
;;
|
12543 |
|
|
;; Note that these code sequences must appear exactly as shown
|
12544 |
|
|
;; in order to allow linker relaxation.
|
12545 |
|
|
|
12546 |
|
|
(define_insn "*tls_global_dynamic_32_gnu"
|
12547 |
|
|
[(set (match_operand:SI 0 "register_operand" "=a")
|
12548 |
|
|
(unspec:SI
|
12549 |
|
|
[(match_operand:SI 1 "register_operand" "b")
|
12550 |
|
|
(match_operand:SI 2 "tls_symbolic_operand" "")
|
12551 |
|
|
(match_operand:SI 3 "constant_call_address_operand" "z")]
|
12552 |
|
|
UNSPEC_TLS_GD))
|
12553 |
|
|
(clobber (match_scratch:SI 4 "=d"))
|
12554 |
|
|
(clobber (match_scratch:SI 5 "=c"))
|
12555 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12556 |
|
|
"!TARGET_64BIT && TARGET_GNU_TLS"
|
12557 |
|
|
{
|
12558 |
|
|
output_asm_insn
|
12559 |
|
|
("lea{l}\t{%a2@tlsgd(,%1,1), %0|%0, %a2@tlsgd[%1*1]}", operands);
|
12560 |
|
|
if (TARGET_SUN_TLS)
|
12561 |
|
|
#ifdef HAVE_AS_IX86_TLSGDPLT
|
12562 |
|
|
return "call\t%a2@tlsgdplt";
|
12563 |
|
|
#else
|
12564 |
|
|
return "call\t%p3@plt";
|
12565 |
|
|
#endif
|
12566 |
|
|
return "call\t%P3";
|
12567 |
|
|
}
|
12568 |
|
|
[(set_attr "type" "multi")
|
12569 |
|
|
(set_attr "length" "12")])
|
12570 |
|
|
|
12571 |
|
|
(define_expand "tls_global_dynamic_32"
|
12572 |
|
|
[(parallel
|
12573 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
12574 |
|
|
(unspec:SI [(match_operand:SI 2 "register_operand" "")
|
12575 |
|
|
(match_operand:SI 1 "tls_symbolic_operand" "")
|
12576 |
|
|
(match_operand:SI 3 "constant_call_address_operand" "")]
|
12577 |
|
|
UNSPEC_TLS_GD))
|
12578 |
|
|
(clobber (match_scratch:SI 4 ""))
|
12579 |
|
|
(clobber (match_scratch:SI 5 ""))
|
12580 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
12581 |
|
|
|
12582 |
|
|
(define_insn "*tls_global_dynamic_64"
|
12583 |
|
|
[(set (match_operand:DI 0 "register_operand" "=a")
|
12584 |
|
|
(call:DI
|
12585 |
|
|
(mem:QI (match_operand:DI 2 "constant_call_address_operand" "z"))
|
12586 |
|
|
(match_operand:DI 3 "" "")))
|
12587 |
|
|
(unspec:DI [(match_operand 1 "tls_symbolic_operand" "")]
|
12588 |
|
|
UNSPEC_TLS_GD)]
|
12589 |
|
|
"TARGET_64BIT"
|
12590 |
|
|
{
|
12591 |
|
|
if (!TARGET_X32)
|
12592 |
|
|
fputs (ASM_BYTE "0x66\n", asm_out_file);
|
12593 |
|
|
output_asm_insn
|
12594 |
|
|
("lea{q}\t{%a1@tlsgd(%%rip), %%rdi|rdi, %a1@tlsgd[rip]}", operands);
|
12595 |
|
|
fputs (ASM_SHORT "0x6666\n", asm_out_file);
|
12596 |
|
|
fputs ("\trex64\n", asm_out_file);
|
12597 |
|
|
if (TARGET_SUN_TLS)
|
12598 |
|
|
return "call\t%p2@plt";
|
12599 |
|
|
return "call\t%P2";
|
12600 |
|
|
}
|
12601 |
|
|
[(set_attr "type" "multi")
|
12602 |
|
|
(set (attr "length")
|
12603 |
|
|
(symbol_ref "TARGET_X32 ? 15 : 16"))])
|
12604 |
|
|
|
12605 |
|
|
(define_expand "tls_global_dynamic_64"
|
12606 |
|
|
[(parallel
|
12607 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
12608 |
|
|
(call:DI
|
12609 |
|
|
(mem:QI (match_operand:DI 2 "constant_call_address_operand" ""))
|
12610 |
|
|
(const_int 0)))
|
12611 |
|
|
(unspec:DI [(match_operand 1 "tls_symbolic_operand" "")]
|
12612 |
|
|
UNSPEC_TLS_GD)])])
|
12613 |
|
|
|
12614 |
|
|
(define_insn "*tls_local_dynamic_base_32_gnu"
|
12615 |
|
|
[(set (match_operand:SI 0 "register_operand" "=a")
|
12616 |
|
|
(unspec:SI
|
12617 |
|
|
[(match_operand:SI 1 "register_operand" "b")
|
12618 |
|
|
(match_operand:SI 2 "constant_call_address_operand" "z")]
|
12619 |
|
|
UNSPEC_TLS_LD_BASE))
|
12620 |
|
|
(clobber (match_scratch:SI 3 "=d"))
|
12621 |
|
|
(clobber (match_scratch:SI 4 "=c"))
|
12622 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12623 |
|
|
"!TARGET_64BIT && TARGET_GNU_TLS"
|
12624 |
|
|
{
|
12625 |
|
|
output_asm_insn
|
12626 |
|
|
("lea{l}\t{%&@tlsldm(%1), %0|%0, %&@tlsldm[%1]}", operands);
|
12627 |
|
|
if (TARGET_SUN_TLS)
|
12628 |
|
|
#ifdef HAVE_AS_IX86_TLSLDMPLT
|
12629 |
|
|
return "call\t%&@tlsldmplt";
|
12630 |
|
|
#else
|
12631 |
|
|
return "call\t%p2@plt";
|
12632 |
|
|
#endif
|
12633 |
|
|
return "call\t%P2";
|
12634 |
|
|
}
|
12635 |
|
|
[(set_attr "type" "multi")
|
12636 |
|
|
(set_attr "length" "11")])
|
12637 |
|
|
|
12638 |
|
|
(define_expand "tls_local_dynamic_base_32"
|
12639 |
|
|
[(parallel
|
12640 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
12641 |
|
|
(unspec:SI
|
12642 |
|
|
[(match_operand:SI 1 "register_operand" "")
|
12643 |
|
|
(match_operand:SI 2 "constant_call_address_operand" "")]
|
12644 |
|
|
UNSPEC_TLS_LD_BASE))
|
12645 |
|
|
(clobber (match_scratch:SI 3 ""))
|
12646 |
|
|
(clobber (match_scratch:SI 4 ""))
|
12647 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
12648 |
|
|
|
12649 |
|
|
(define_insn "*tls_local_dynamic_base_64"
|
12650 |
|
|
[(set (match_operand:DI 0 "register_operand" "=a")
|
12651 |
|
|
(call:DI
|
12652 |
|
|
(mem:QI (match_operand:DI 1 "constant_call_address_operand" "z"))
|
12653 |
|
|
(match_operand:DI 2 "" "")))
|
12654 |
|
|
(unspec:DI [(const_int 0)] UNSPEC_TLS_LD_BASE)]
|
12655 |
|
|
"TARGET_64BIT"
|
12656 |
|
|
{
|
12657 |
|
|
output_asm_insn
|
12658 |
|
|
("lea{q}\t{%&@tlsld(%%rip), %%rdi|rdi, %&@tlsld[rip]}", operands);
|
12659 |
|
|
if (TARGET_SUN_TLS)
|
12660 |
|
|
return "call\t%p1@plt";
|
12661 |
|
|
return "call\t%P1";
|
12662 |
|
|
}
|
12663 |
|
|
[(set_attr "type" "multi")
|
12664 |
|
|
(set_attr "length" "12")])
|
12665 |
|
|
|
12666 |
|
|
(define_expand "tls_local_dynamic_base_64"
|
12667 |
|
|
[(parallel
|
12668 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
12669 |
|
|
(call:DI
|
12670 |
|
|
(mem:QI (match_operand:DI 1 "constant_call_address_operand" ""))
|
12671 |
|
|
(const_int 0)))
|
12672 |
|
|
(unspec:DI [(const_int 0)] UNSPEC_TLS_LD_BASE)])])
|
12673 |
|
|
|
12674 |
|
|
;; Local dynamic of a single variable is a lose. Show combine how
|
12675 |
|
|
;; to convert that back to global dynamic.
|
12676 |
|
|
|
12677 |
|
|
(define_insn_and_split "*tls_local_dynamic_32_once"
|
12678 |
|
|
[(set (match_operand:SI 0 "register_operand" "=a")
|
12679 |
|
|
(plus:SI
|
12680 |
|
|
(unspec:SI [(match_operand:SI 1 "register_operand" "b")
|
12681 |
|
|
(match_operand:SI 2 "constant_call_address_operand" "z")]
|
12682 |
|
|
UNSPEC_TLS_LD_BASE)
|
12683 |
|
|
(const:SI (unspec:SI
|
12684 |
|
|
[(match_operand:SI 3 "tls_symbolic_operand" "")]
|
12685 |
|
|
UNSPEC_DTPOFF))))
|
12686 |
|
|
(clobber (match_scratch:SI 4 "=d"))
|
12687 |
|
|
(clobber (match_scratch:SI 5 "=c"))
|
12688 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12689 |
|
|
""
|
12690 |
|
|
"#"
|
12691 |
|
|
""
|
12692 |
|
|
[(parallel
|
12693 |
|
|
[(set (match_dup 0)
|
12694 |
|
|
(unspec:SI [(match_dup 1) (match_dup 3) (match_dup 2)]
|
12695 |
|
|
UNSPEC_TLS_GD))
|
12696 |
|
|
(clobber (match_dup 4))
|
12697 |
|
|
(clobber (match_dup 5))
|
12698 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
12699 |
|
|
|
12700 |
|
|
;; Segment register for the thread base ptr load
|
12701 |
|
|
(define_mode_attr tp_seg [(SI "gs") (DI "fs")])
|
12702 |
|
|
|
12703 |
|
|
;; Load and add the thread base pointer from %:0.
|
12704 |
|
|
(define_insn "*load_tp_x32"
|
12705 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
12706 |
|
|
(unspec:SI [(const_int 0)] UNSPEC_TP))]
|
12707 |
|
|
"TARGET_X32"
|
12708 |
|
|
"mov{l}\t{%%fs:0, %0|%0, DWORD PTR fs:0}"
|
12709 |
|
|
[(set_attr "type" "imov")
|
12710 |
|
|
(set_attr "modrm" "0")
|
12711 |
|
|
(set_attr "length" "7")
|
12712 |
|
|
(set_attr "memory" "load")
|
12713 |
|
|
(set_attr "imm_disp" "false")])
|
12714 |
|
|
|
12715 |
|
|
(define_insn "*load_tp_x32_zext"
|
12716 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
12717 |
|
|
(zero_extend:DI (unspec:SI [(const_int 0)] UNSPEC_TP)))]
|
12718 |
|
|
"TARGET_X32"
|
12719 |
|
|
"mov{l}\t{%%fs:0, %k0|%k0, DWORD PTR fs:0}"
|
12720 |
|
|
[(set_attr "type" "imov")
|
12721 |
|
|
(set_attr "modrm" "0")
|
12722 |
|
|
(set_attr "length" "7")
|
12723 |
|
|
(set_attr "memory" "load")
|
12724 |
|
|
(set_attr "imm_disp" "false")])
|
12725 |
|
|
|
12726 |
|
|
(define_insn "*load_tp_"
|
12727 |
|
|
[(set (match_operand:P 0 "register_operand" "=r")
|
12728 |
|
|
(unspec:P [(const_int 0)] UNSPEC_TP))]
|
12729 |
|
|
"!TARGET_X32"
|
12730 |
|
|
"mov{}\t{%%:0, %0|%0, PTR :0}"
|
12731 |
|
|
[(set_attr "type" "imov")
|
12732 |
|
|
(set_attr "modrm" "0")
|
12733 |
|
|
(set_attr "length" "7")
|
12734 |
|
|
(set_attr "memory" "load")
|
12735 |
|
|
(set_attr "imm_disp" "false")])
|
12736 |
|
|
|
12737 |
|
|
(define_insn "*add_tp_x32"
|
12738 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
12739 |
|
|
(plus:SI (unspec:SI [(const_int 0)] UNSPEC_TP)
|
12740 |
|
|
(match_operand:SI 1 "register_operand" "0")))
|
12741 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12742 |
|
|
"TARGET_X32"
|
12743 |
|
|
"add{l}\t{%%fs:0, %0|%0, DWORD PTR fs:0}"
|
12744 |
|
|
[(set_attr "type" "alu")
|
12745 |
|
|
(set_attr "modrm" "0")
|
12746 |
|
|
(set_attr "length" "7")
|
12747 |
|
|
(set_attr "memory" "load")
|
12748 |
|
|
(set_attr "imm_disp" "false")])
|
12749 |
|
|
|
12750 |
|
|
(define_insn "*add_tp_x32_zext"
|
12751 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
12752 |
|
|
(zero_extend:DI
|
12753 |
|
|
(plus:SI (unspec:SI [(const_int 0)] UNSPEC_TP)
|
12754 |
|
|
(match_operand:SI 1 "register_operand" "0"))))
|
12755 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12756 |
|
|
"TARGET_X32"
|
12757 |
|
|
"add{l}\t{%%fs:0, %k0|%k0, DWORD PTR fs:0}"
|
12758 |
|
|
[(set_attr "type" "alu")
|
12759 |
|
|
(set_attr "modrm" "0")
|
12760 |
|
|
(set_attr "length" "7")
|
12761 |
|
|
(set_attr "memory" "load")
|
12762 |
|
|
(set_attr "imm_disp" "false")])
|
12763 |
|
|
|
12764 |
|
|
(define_insn "*add_tp_"
|
12765 |
|
|
[(set (match_operand:P 0 "register_operand" "=r")
|
12766 |
|
|
(plus:P (unspec:P [(const_int 0)] UNSPEC_TP)
|
12767 |
|
|
(match_operand:P 1 "register_operand" "0")))
|
12768 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12769 |
|
|
"!TARGET_X32"
|
12770 |
|
|
"add{}\t{%%:0, %0|%0, PTR :0}"
|
12771 |
|
|
[(set_attr "type" "alu")
|
12772 |
|
|
(set_attr "modrm" "0")
|
12773 |
|
|
(set_attr "length" "7")
|
12774 |
|
|
(set_attr "memory" "load")
|
12775 |
|
|
(set_attr "imm_disp" "false")])
|
12776 |
|
|
|
12777 |
|
|
;; The Sun linker took the AMD64 TLS spec literally and can only handle
|
12778 |
|
|
;; %rax as destination of the initial executable code sequence.
|
12779 |
|
|
(define_insn "tls_initial_exec_64_sun"
|
12780 |
|
|
[(set (match_operand:DI 0 "register_operand" "=a")
|
12781 |
|
|
(unspec:DI
|
12782 |
|
|
[(match_operand:DI 1 "tls_symbolic_operand" "")]
|
12783 |
|
|
UNSPEC_TLS_IE_SUN))
|
12784 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12785 |
|
|
"TARGET_64BIT && TARGET_SUN_TLS"
|
12786 |
|
|
{
|
12787 |
|
|
output_asm_insn
|
12788 |
|
|
("mov{q}\t{%%fs:0, %0|%0, QWORD PTR fs:0}", operands);
|
12789 |
|
|
return "add{q}\t{%a1@gottpoff(%%rip), %0|%0, %a1@gottpoff[rip]}";
|
12790 |
|
|
}
|
12791 |
|
|
[(set_attr "type" "multi")])
|
12792 |
|
|
|
12793 |
|
|
;; GNU2 TLS patterns can be split.
|
12794 |
|
|
|
12795 |
|
|
(define_expand "tls_dynamic_gnu2_32"
|
12796 |
|
|
[(set (match_dup 3)
|
12797 |
|
|
(plus:SI (match_operand:SI 2 "register_operand" "")
|
12798 |
|
|
(const:SI
|
12799 |
|
|
(unspec:SI [(match_operand:SI 1 "tls_symbolic_operand" "")]
|
12800 |
|
|
UNSPEC_TLSDESC))))
|
12801 |
|
|
(parallel
|
12802 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
12803 |
|
|
(unspec:SI [(match_dup 1) (match_dup 3)
|
12804 |
|
|
(match_dup 2) (reg:SI SP_REG)]
|
12805 |
|
|
UNSPEC_TLSDESC))
|
12806 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
12807 |
|
|
"!TARGET_64BIT && TARGET_GNU2_TLS"
|
12808 |
|
|
{
|
12809 |
|
|
operands[3] = can_create_pseudo_p () ? gen_reg_rtx (Pmode) : operands[0];
|
12810 |
|
|
ix86_tls_descriptor_calls_expanded_in_cfun = true;
|
12811 |
|
|
})
|
12812 |
|
|
|
12813 |
|
|
(define_insn "*tls_dynamic_gnu2_lea_32"
|
12814 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
12815 |
|
|
(plus:SI (match_operand:SI 1 "register_operand" "b")
|
12816 |
|
|
(const:SI
|
12817 |
|
|
(unspec:SI [(match_operand:SI 2 "tls_symbolic_operand" "")]
|
12818 |
|
|
UNSPEC_TLSDESC))))]
|
12819 |
|
|
"!TARGET_64BIT && TARGET_GNU2_TLS"
|
12820 |
|
|
"lea{l}\t{%a2@TLSDESC(%1), %0|%0, %a2@TLSDESC[%1]}"
|
12821 |
|
|
[(set_attr "type" "lea")
|
12822 |
|
|
(set_attr "mode" "SI")
|
12823 |
|
|
(set_attr "length" "6")
|
12824 |
|
|
(set_attr "length_address" "4")])
|
12825 |
|
|
|
12826 |
|
|
(define_insn "*tls_dynamic_gnu2_call_32"
|
12827 |
|
|
[(set (match_operand:SI 0 "register_operand" "=a")
|
12828 |
|
|
(unspec:SI [(match_operand:SI 1 "tls_symbolic_operand" "")
|
12829 |
|
|
(match_operand:SI 2 "register_operand" "0")
|
12830 |
|
|
;; we have to make sure %ebx still points to the GOT
|
12831 |
|
|
(match_operand:SI 3 "register_operand" "b")
|
12832 |
|
|
(reg:SI SP_REG)]
|
12833 |
|
|
UNSPEC_TLSDESC))
|
12834 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12835 |
|
|
"!TARGET_64BIT && TARGET_GNU2_TLS"
|
12836 |
|
|
"call\t{*%a1@TLSCALL(%2)|[DWORD PTR [%2+%a1@TLSCALL]]}"
|
12837 |
|
|
[(set_attr "type" "call")
|
12838 |
|
|
(set_attr "length" "2")
|
12839 |
|
|
(set_attr "length_address" "0")])
|
12840 |
|
|
|
12841 |
|
|
(define_insn_and_split "*tls_dynamic_gnu2_combine_32"
|
12842 |
|
|
[(set (match_operand:SI 0 "register_operand" "=&a")
|
12843 |
|
|
(plus:SI
|
12844 |
|
|
(unspec:SI [(match_operand:SI 3 "tls_modbase_operand" "")
|
12845 |
|
|
(match_operand:SI 4 "" "")
|
12846 |
|
|
(match_operand:SI 2 "register_operand" "b")
|
12847 |
|
|
(reg:SI SP_REG)]
|
12848 |
|
|
UNSPEC_TLSDESC)
|
12849 |
|
|
(const:SI (unspec:SI
|
12850 |
|
|
[(match_operand:SI 1 "tls_symbolic_operand" "")]
|
12851 |
|
|
UNSPEC_DTPOFF))))
|
12852 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12853 |
|
|
"!TARGET_64BIT && TARGET_GNU2_TLS"
|
12854 |
|
|
"#"
|
12855 |
|
|
""
|
12856 |
|
|
[(set (match_dup 0) (match_dup 5))]
|
12857 |
|
|
{
|
12858 |
|
|
operands[5] = can_create_pseudo_p () ? gen_reg_rtx (Pmode) : operands[0];
|
12859 |
|
|
emit_insn (gen_tls_dynamic_gnu2_32 (operands[5], operands[1], operands[2]));
|
12860 |
|
|
})
|
12861 |
|
|
|
12862 |
|
|
(define_expand "tls_dynamic_gnu2_64"
|
12863 |
|
|
[(set (match_dup 2)
|
12864 |
|
|
(unspec:DI [(match_operand 1 "tls_symbolic_operand" "")]
|
12865 |
|
|
UNSPEC_TLSDESC))
|
12866 |
|
|
(parallel
|
12867 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
12868 |
|
|
(unspec:DI [(match_dup 1) (match_dup 2) (reg:DI SP_REG)]
|
12869 |
|
|
UNSPEC_TLSDESC))
|
12870 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
12871 |
|
|
"TARGET_64BIT && TARGET_GNU2_TLS"
|
12872 |
|
|
{
|
12873 |
|
|
operands[2] = can_create_pseudo_p () ? gen_reg_rtx (Pmode) : operands[0];
|
12874 |
|
|
ix86_tls_descriptor_calls_expanded_in_cfun = true;
|
12875 |
|
|
})
|
12876 |
|
|
|
12877 |
|
|
(define_insn "*tls_dynamic_gnu2_lea_64"
|
12878 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
12879 |
|
|
(unspec:DI [(match_operand 1 "tls_symbolic_operand" "")]
|
12880 |
|
|
UNSPEC_TLSDESC))]
|
12881 |
|
|
"TARGET_64BIT && TARGET_GNU2_TLS"
|
12882 |
|
|
"lea{q}\t{%a1@TLSDESC(%%rip), %0|%0, %a1@TLSDESC[rip]}"
|
12883 |
|
|
[(set_attr "type" "lea")
|
12884 |
|
|
(set_attr "mode" "DI")
|
12885 |
|
|
(set_attr "length" "7")
|
12886 |
|
|
(set_attr "length_address" "4")])
|
12887 |
|
|
|
12888 |
|
|
(define_insn "*tls_dynamic_gnu2_call_64"
|
12889 |
|
|
[(set (match_operand:DI 0 "register_operand" "=a")
|
12890 |
|
|
(unspec:DI [(match_operand 1 "tls_symbolic_operand" "")
|
12891 |
|
|
(match_operand:DI 2 "register_operand" "0")
|
12892 |
|
|
(reg:DI SP_REG)]
|
12893 |
|
|
UNSPEC_TLSDESC))
|
12894 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12895 |
|
|
"TARGET_64BIT && TARGET_GNU2_TLS"
|
12896 |
|
|
"call\t{*%a1@TLSCALL(%2)|[QWORD PTR [%2+%a1@TLSCALL]]}"
|
12897 |
|
|
[(set_attr "type" "call")
|
12898 |
|
|
(set_attr "length" "2")
|
12899 |
|
|
(set_attr "length_address" "0")])
|
12900 |
|
|
|
12901 |
|
|
(define_insn_and_split "*tls_dynamic_gnu2_combine_64"
|
12902 |
|
|
[(set (match_operand:DI 0 "register_operand" "=&a")
|
12903 |
|
|
(plus:DI
|
12904 |
|
|
(unspec:DI [(match_operand:DI 2 "tls_modbase_operand" "")
|
12905 |
|
|
(match_operand:DI 3 "" "")
|
12906 |
|
|
(reg:DI SP_REG)]
|
12907 |
|
|
UNSPEC_TLSDESC)
|
12908 |
|
|
(const:DI (unspec:DI
|
12909 |
|
|
[(match_operand 1 "tls_symbolic_operand" "")]
|
12910 |
|
|
UNSPEC_DTPOFF))))
|
12911 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
12912 |
|
|
"TARGET_64BIT && TARGET_GNU2_TLS"
|
12913 |
|
|
"#"
|
12914 |
|
|
""
|
12915 |
|
|
[(set (match_dup 0) (match_dup 4))]
|
12916 |
|
|
{
|
12917 |
|
|
operands[4] = can_create_pseudo_p () ? gen_reg_rtx (Pmode) : operands[0];
|
12918 |
|
|
emit_insn (gen_tls_dynamic_gnu2_64 (operands[4], operands[1]));
|
12919 |
|
|
})
|
12920 |
|
|
|
12921 |
|
|
;; These patterns match the binary 387 instructions for addM3, subM3,
|
12922 |
|
|
;; mulM3 and divM3. There are three patterns for each of DFmode and
|
12923 |
|
|
;; SFmode. The first is the normal insn, the second the same insn but
|
12924 |
|
|
;; with one operand a conversion, and the third the same insn but with
|
12925 |
|
|
;; the other operand a conversion. The conversion may be SFmode or
|
12926 |
|
|
;; SImode if the target mode DFmode, but only SImode if the target mode
|
12927 |
|
|
;; is SFmode.
|
12928 |
|
|
|
12929 |
|
|
;; Gcc is slightly more smart about handling normal two address instructions
|
12930 |
|
|
;; so use special patterns for add and mull.
|
12931 |
|
|
|
12932 |
|
|
(define_insn "*fop__comm_mixed"
|
12933 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f,x,x")
|
12934 |
|
|
(match_operator:MODEF 3 "binary_fp_operator"
|
12935 |
|
|
[(match_operand:MODEF 1 "nonimmediate_operand" "%0,0,x")
|
12936 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "fm,xm,xm")]))]
|
12937 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_MIX_SSE_I387
|
12938 |
|
|
&& COMMUTATIVE_ARITH_P (operands[3])
|
12939 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
12940 |
|
|
"* return output_387_binary_op (insn, operands);"
|
12941 |
|
|
[(set (attr "type")
|
12942 |
|
|
(if_then_else (eq_attr "alternative" "1,2")
|
12943 |
|
|
(if_then_else (match_operand:MODEF 3 "mult_operator" "")
|
12944 |
|
|
(const_string "ssemul")
|
12945 |
|
|
(const_string "sseadd"))
|
12946 |
|
|
(if_then_else (match_operand:MODEF 3 "mult_operator" "")
|
12947 |
|
|
(const_string "fmul")
|
12948 |
|
|
(const_string "fop"))))
|
12949 |
|
|
(set_attr "isa" "*,noavx,avx")
|
12950 |
|
|
(set_attr "prefix" "orig,orig,vex")
|
12951 |
|
|
(set_attr "mode" "")])
|
12952 |
|
|
|
12953 |
|
|
(define_insn "*fop__comm_sse"
|
12954 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x,x")
|
12955 |
|
|
(match_operator:MODEF 3 "binary_fp_operator"
|
12956 |
|
|
[(match_operand:MODEF 1 "nonimmediate_operand" "%0,x")
|
12957 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "xm,xm")]))]
|
12958 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
12959 |
|
|
&& COMMUTATIVE_ARITH_P (operands[3])
|
12960 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
12961 |
|
|
"* return output_387_binary_op (insn, operands);"
|
12962 |
|
|
[(set (attr "type")
|
12963 |
|
|
(if_then_else (match_operand:MODEF 3 "mult_operator" "")
|
12964 |
|
|
(const_string "ssemul")
|
12965 |
|
|
(const_string "sseadd")))
|
12966 |
|
|
(set_attr "isa" "noavx,avx")
|
12967 |
|
|
(set_attr "prefix" "orig,vex")
|
12968 |
|
|
(set_attr "mode" "")])
|
12969 |
|
|
|
12970 |
|
|
(define_insn "*fop__comm_i387"
|
12971 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f")
|
12972 |
|
|
(match_operator:MODEF 3 "binary_fp_operator"
|
12973 |
|
|
[(match_operand:MODEF 1 "nonimmediate_operand" "%0")
|
12974 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "fm")]))]
|
12975 |
|
|
"TARGET_80387 && X87_ENABLE_ARITH (mode)
|
12976 |
|
|
&& COMMUTATIVE_ARITH_P (operands[3])
|
12977 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
12978 |
|
|
"* return output_387_binary_op (insn, operands);"
|
12979 |
|
|
[(set (attr "type")
|
12980 |
|
|
(if_then_else (match_operand:MODEF 3 "mult_operator" "")
|
12981 |
|
|
(const_string "fmul")
|
12982 |
|
|
(const_string "fop")))
|
12983 |
|
|
(set_attr "mode" "")])
|
12984 |
|
|
|
12985 |
|
|
(define_insn "*fop__1_mixed"
|
12986 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f,f,x,x")
|
12987 |
|
|
(match_operator:MODEF 3 "binary_fp_operator"
|
12988 |
|
|
[(match_operand:MODEF 1 "nonimmediate_operand" "0,fm,0,x")
|
12989 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "fm,0,xm,xm")]))]
|
12990 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_MIX_SSE_I387
|
12991 |
|
|
&& !COMMUTATIVE_ARITH_P (operands[3])
|
12992 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
12993 |
|
|
"* return output_387_binary_op (insn, operands);"
|
12994 |
|
|
[(set (attr "type")
|
12995 |
|
|
(cond [(and (eq_attr "alternative" "2,3")
|
12996 |
|
|
(match_operand:MODEF 3 "mult_operator" ""))
|
12997 |
|
|
(const_string "ssemul")
|
12998 |
|
|
(and (eq_attr "alternative" "2,3")
|
12999 |
|
|
(match_operand:MODEF 3 "div_operator" ""))
|
13000 |
|
|
(const_string "ssediv")
|
13001 |
|
|
(eq_attr "alternative" "2,3")
|
13002 |
|
|
(const_string "sseadd")
|
13003 |
|
|
(match_operand:MODEF 3 "mult_operator" "")
|
13004 |
|
|
(const_string "fmul")
|
13005 |
|
|
(match_operand:MODEF 3 "div_operator" "")
|
13006 |
|
|
(const_string "fdiv")
|
13007 |
|
|
]
|
13008 |
|
|
(const_string "fop")))
|
13009 |
|
|
(set_attr "isa" "*,*,noavx,avx")
|
13010 |
|
|
(set_attr "prefix" "orig,orig,orig,vex")
|
13011 |
|
|
(set_attr "mode" "")])
|
13012 |
|
|
|
13013 |
|
|
(define_insn "*rcpsf2_sse"
|
13014 |
|
|
[(set (match_operand:SF 0 "register_operand" "=x")
|
13015 |
|
|
(unspec:SF [(match_operand:SF 1 "nonimmediate_operand" "xm")]
|
13016 |
|
|
UNSPEC_RCP))]
|
13017 |
|
|
"TARGET_SSE_MATH"
|
13018 |
|
|
"%vrcpss\t{%1, %d0|%d0, %1}"
|
13019 |
|
|
[(set_attr "type" "sse")
|
13020 |
|
|
(set_attr "atom_sse_attr" "rcp")
|
13021 |
|
|
(set_attr "prefix" "maybe_vex")
|
13022 |
|
|
(set_attr "mode" "SF")])
|
13023 |
|
|
|
13024 |
|
|
(define_insn "*fop__1_sse"
|
13025 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x,x")
|
13026 |
|
|
(match_operator:MODEF 3 "binary_fp_operator"
|
13027 |
|
|
[(match_operand:MODEF 1 "register_operand" "0,x")
|
13028 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "xm,xm")]))]
|
13029 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
13030 |
|
|
&& !COMMUTATIVE_ARITH_P (operands[3])"
|
13031 |
|
|
"* return output_387_binary_op (insn, operands);"
|
13032 |
|
|
[(set (attr "type")
|
13033 |
|
|
(cond [(match_operand:MODEF 3 "mult_operator" "")
|
13034 |
|
|
(const_string "ssemul")
|
13035 |
|
|
(match_operand:MODEF 3 "div_operator" "")
|
13036 |
|
|
(const_string "ssediv")
|
13037 |
|
|
]
|
13038 |
|
|
(const_string "sseadd")))
|
13039 |
|
|
(set_attr "isa" "noavx,avx")
|
13040 |
|
|
(set_attr "prefix" "orig,vex")
|
13041 |
|
|
(set_attr "mode" "")])
|
13042 |
|
|
|
13043 |
|
|
;; This pattern is not fully shadowed by the pattern above.
|
13044 |
|
|
(define_insn "*fop__1_i387"
|
13045 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f,f")
|
13046 |
|
|
(match_operator:MODEF 3 "binary_fp_operator"
|
13047 |
|
|
[(match_operand:MODEF 1 "nonimmediate_operand" "0,fm")
|
13048 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "fm,0")]))]
|
13049 |
|
|
"TARGET_80387 && X87_ENABLE_ARITH (mode)
|
13050 |
|
|
&& !(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13051 |
|
|
&& !COMMUTATIVE_ARITH_P (operands[3])
|
13052 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
13053 |
|
|
"* return output_387_binary_op (insn, operands);"
|
13054 |
|
|
[(set (attr "type")
|
13055 |
|
|
(cond [(match_operand:MODEF 3 "mult_operator" "")
|
13056 |
|
|
(const_string "fmul")
|
13057 |
|
|
(match_operand:MODEF 3 "div_operator" "")
|
13058 |
|
|
(const_string "fdiv")
|
13059 |
|
|
]
|
13060 |
|
|
(const_string "fop")))
|
13061 |
|
|
(set_attr "mode" "")])
|
13062 |
|
|
|
13063 |
|
|
;; ??? Add SSE splitters for these!
|
13064 |
|
|
(define_insn "*fop__2_i387"
|
13065 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f,f")
|
13066 |
|
|
(match_operator:MODEF 3 "binary_fp_operator"
|
13067 |
|
|
[(float:MODEF
|
13068 |
|
|
(match_operand:SWI24 1 "nonimmediate_operand" "m,?r"))
|
13069 |
|
|
(match_operand:MODEF 2 "register_operand" "0,0")]))]
|
13070 |
|
|
"TARGET_80387 && X87_ENABLE_FLOAT (mode, mode)
|
13071 |
|
|
&& !(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13072 |
|
|
&& (TARGET_USE_MODE_FIOP || optimize_function_for_size_p (cfun))"
|
13073 |
|
|
"* return which_alternative ? \"#\" : output_387_binary_op (insn, operands);"
|
13074 |
|
|
[(set (attr "type")
|
13075 |
|
|
(cond [(match_operand:MODEF 3 "mult_operator" "")
|
13076 |
|
|
(const_string "fmul")
|
13077 |
|
|
(match_operand:MODEF 3 "div_operator" "")
|
13078 |
|
|
(const_string "fdiv")
|
13079 |
|
|
]
|
13080 |
|
|
(const_string "fop")))
|
13081 |
|
|
(set_attr "fp_int_src" "true")
|
13082 |
|
|
(set_attr "mode" "")])
|
13083 |
|
|
|
13084 |
|
|
(define_insn "*fop__3_i387"
|
13085 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f,f")
|
13086 |
|
|
(match_operator:MODEF 3 "binary_fp_operator"
|
13087 |
|
|
[(match_operand:MODEF 1 "register_operand" "0,0")
|
13088 |
|
|
(float:MODEF
|
13089 |
|
|
(match_operand:SWI24 2 "nonimmediate_operand" "m,?r"))]))]
|
13090 |
|
|
"TARGET_80387 && X87_ENABLE_FLOAT (mode, mode)
|
13091 |
|
|
&& !(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13092 |
|
|
&& (TARGET_USE_MODE_FIOP || optimize_function_for_size_p (cfun))"
|
13093 |
|
|
"* return which_alternative ? \"#\" : output_387_binary_op (insn, operands);"
|
13094 |
|
|
[(set (attr "type")
|
13095 |
|
|
(cond [(match_operand:MODEF 3 "mult_operator" "")
|
13096 |
|
|
(const_string "fmul")
|
13097 |
|
|
(match_operand:MODEF 3 "div_operator" "")
|
13098 |
|
|
(const_string "fdiv")
|
13099 |
|
|
]
|
13100 |
|
|
(const_string "fop")))
|
13101 |
|
|
(set_attr "fp_int_src" "true")
|
13102 |
|
|
(set_attr "mode" "")])
|
13103 |
|
|
|
13104 |
|
|
(define_insn "*fop_df_4_i387"
|
13105 |
|
|
[(set (match_operand:DF 0 "register_operand" "=f,f")
|
13106 |
|
|
(match_operator:DF 3 "binary_fp_operator"
|
13107 |
|
|
[(float_extend:DF
|
13108 |
|
|
(match_operand:SF 1 "nonimmediate_operand" "fm,0"))
|
13109 |
|
|
(match_operand:DF 2 "register_operand" "0,f")]))]
|
13110 |
|
|
"TARGET_80387 && X87_ENABLE_ARITH (DFmode)
|
13111 |
|
|
&& !(TARGET_SSE2 && TARGET_SSE_MATH)
|
13112 |
|
|
&& !(MEM_P (operands[1]) && MEM_P (operands[2]))"
|
13113 |
|
|
"* return output_387_binary_op (insn, operands);"
|
13114 |
|
|
[(set (attr "type")
|
13115 |
|
|
(cond [(match_operand:DF 3 "mult_operator" "")
|
13116 |
|
|
(const_string "fmul")
|
13117 |
|
|
(match_operand:DF 3 "div_operator" "")
|
13118 |
|
|
(const_string "fdiv")
|
13119 |
|
|
]
|
13120 |
|
|
(const_string "fop")))
|
13121 |
|
|
(set_attr "mode" "SF")])
|
13122 |
|
|
|
13123 |
|
|
(define_insn "*fop_df_5_i387"
|
13124 |
|
|
[(set (match_operand:DF 0 "register_operand" "=f,f")
|
13125 |
|
|
(match_operator:DF 3 "binary_fp_operator"
|
13126 |
|
|
[(match_operand:DF 1 "register_operand" "0,f")
|
13127 |
|
|
(float_extend:DF
|
13128 |
|
|
(match_operand:SF 2 "nonimmediate_operand" "fm,0"))]))]
|
13129 |
|
|
"TARGET_80387 && X87_ENABLE_ARITH (DFmode)
|
13130 |
|
|
&& !(TARGET_SSE2 && TARGET_SSE_MATH)"
|
13131 |
|
|
"* return output_387_binary_op (insn, operands);"
|
13132 |
|
|
[(set (attr "type")
|
13133 |
|
|
(cond [(match_operand:DF 3 "mult_operator" "")
|
13134 |
|
|
(const_string "fmul")
|
13135 |
|
|
(match_operand:DF 3 "div_operator" "")
|
13136 |
|
|
(const_string "fdiv")
|
13137 |
|
|
]
|
13138 |
|
|
(const_string "fop")))
|
13139 |
|
|
(set_attr "mode" "SF")])
|
13140 |
|
|
|
13141 |
|
|
(define_insn "*fop_df_6_i387"
|
13142 |
|
|
[(set (match_operand:DF 0 "register_operand" "=f,f")
|
13143 |
|
|
(match_operator:DF 3 "binary_fp_operator"
|
13144 |
|
|
[(float_extend:DF
|
13145 |
|
|
(match_operand:SF 1 "register_operand" "0,f"))
|
13146 |
|
|
(float_extend:DF
|
13147 |
|
|
(match_operand:SF 2 "nonimmediate_operand" "fm,0"))]))]
|
13148 |
|
|
"TARGET_80387 && X87_ENABLE_ARITH (DFmode)
|
13149 |
|
|
&& !(TARGET_SSE2 && TARGET_SSE_MATH)"
|
13150 |
|
|
"* return output_387_binary_op (insn, operands);"
|
13151 |
|
|
[(set (attr "type")
|
13152 |
|
|
(cond [(match_operand:DF 3 "mult_operator" "")
|
13153 |
|
|
(const_string "fmul")
|
13154 |
|
|
(match_operand:DF 3 "div_operator" "")
|
13155 |
|
|
(const_string "fdiv")
|
13156 |
|
|
]
|
13157 |
|
|
(const_string "fop")))
|
13158 |
|
|
(set_attr "mode" "SF")])
|
13159 |
|
|
|
13160 |
|
|
(define_insn "*fop_xf_comm_i387"
|
13161 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13162 |
|
|
(match_operator:XF 3 "binary_fp_operator"
|
13163 |
|
|
[(match_operand:XF 1 "register_operand" "%0")
|
13164 |
|
|
(match_operand:XF 2 "register_operand" "f")]))]
|
13165 |
|
|
"TARGET_80387
|
13166 |
|
|
&& COMMUTATIVE_ARITH_P (operands[3])"
|
13167 |
|
|
"* return output_387_binary_op (insn, operands);"
|
13168 |
|
|
[(set (attr "type")
|
13169 |
|
|
(if_then_else (match_operand:XF 3 "mult_operator" "")
|
13170 |
|
|
(const_string "fmul")
|
13171 |
|
|
(const_string "fop")))
|
13172 |
|
|
(set_attr "mode" "XF")])
|
13173 |
|
|
|
13174 |
|
|
(define_insn "*fop_xf_1_i387"
|
13175 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f,f")
|
13176 |
|
|
(match_operator:XF 3 "binary_fp_operator"
|
13177 |
|
|
[(match_operand:XF 1 "register_operand" "0,f")
|
13178 |
|
|
(match_operand:XF 2 "register_operand" "f,0")]))]
|
13179 |
|
|
"TARGET_80387
|
13180 |
|
|
&& !COMMUTATIVE_ARITH_P (operands[3])"
|
13181 |
|
|
"* return output_387_binary_op (insn, operands);"
|
13182 |
|
|
[(set (attr "type")
|
13183 |
|
|
(cond [(match_operand:XF 3 "mult_operator" "")
|
13184 |
|
|
(const_string "fmul")
|
13185 |
|
|
(match_operand:XF 3 "div_operator" "")
|
13186 |
|
|
(const_string "fdiv")
|
13187 |
|
|
]
|
13188 |
|
|
(const_string "fop")))
|
13189 |
|
|
(set_attr "mode" "XF")])
|
13190 |
|
|
|
13191 |
|
|
(define_insn "*fop_xf_2_i387"
|
13192 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f,f")
|
13193 |
|
|
(match_operator:XF 3 "binary_fp_operator"
|
13194 |
|
|
[(float:XF
|
13195 |
|
|
(match_operand:SWI24 1 "nonimmediate_operand" "m,?r"))
|
13196 |
|
|
(match_operand:XF 2 "register_operand" "0,0")]))]
|
13197 |
|
|
"TARGET_80387 && (TARGET_USE_MODE_FIOP || optimize_function_for_size_p (cfun))"
|
13198 |
|
|
"* return which_alternative ? \"#\" : output_387_binary_op (insn, operands);"
|
13199 |
|
|
[(set (attr "type")
|
13200 |
|
|
(cond [(match_operand:XF 3 "mult_operator" "")
|
13201 |
|
|
(const_string "fmul")
|
13202 |
|
|
(match_operand:XF 3 "div_operator" "")
|
13203 |
|
|
(const_string "fdiv")
|
13204 |
|
|
]
|
13205 |
|
|
(const_string "fop")))
|
13206 |
|
|
(set_attr "fp_int_src" "true")
|
13207 |
|
|
(set_attr "mode" "")])
|
13208 |
|
|
|
13209 |
|
|
(define_insn "*fop_xf_3_i387"
|
13210 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f,f")
|
13211 |
|
|
(match_operator:XF 3 "binary_fp_operator"
|
13212 |
|
|
[(match_operand:XF 1 "register_operand" "0,0")
|
13213 |
|
|
(float:XF
|
13214 |
|
|
(match_operand:SWI24 2 "nonimmediate_operand" "m,?r"))]))]
|
13215 |
|
|
"TARGET_80387 && (TARGET_USE_MODE_FIOP || optimize_function_for_size_p (cfun))"
|
13216 |
|
|
"* return which_alternative ? \"#\" : output_387_binary_op (insn, operands);"
|
13217 |
|
|
[(set (attr "type")
|
13218 |
|
|
(cond [(match_operand:XF 3 "mult_operator" "")
|
13219 |
|
|
(const_string "fmul")
|
13220 |
|
|
(match_operand:XF 3 "div_operator" "")
|
13221 |
|
|
(const_string "fdiv")
|
13222 |
|
|
]
|
13223 |
|
|
(const_string "fop")))
|
13224 |
|
|
(set_attr "fp_int_src" "true")
|
13225 |
|
|
(set_attr "mode" "")])
|
13226 |
|
|
|
13227 |
|
|
(define_insn "*fop_xf_4_i387"
|
13228 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f,f")
|
13229 |
|
|
(match_operator:XF 3 "binary_fp_operator"
|
13230 |
|
|
[(float_extend:XF
|
13231 |
|
|
(match_operand:MODEF 1 "nonimmediate_operand" "fm,0"))
|
13232 |
|
|
(match_operand:XF 2 "register_operand" "0,f")]))]
|
13233 |
|
|
"TARGET_80387"
|
13234 |
|
|
"* return output_387_binary_op (insn, operands);"
|
13235 |
|
|
[(set (attr "type")
|
13236 |
|
|
(cond [(match_operand:XF 3 "mult_operator" "")
|
13237 |
|
|
(const_string "fmul")
|
13238 |
|
|
(match_operand:XF 3 "div_operator" "")
|
13239 |
|
|
(const_string "fdiv")
|
13240 |
|
|
]
|
13241 |
|
|
(const_string "fop")))
|
13242 |
|
|
(set_attr "mode" "")])
|
13243 |
|
|
|
13244 |
|
|
(define_insn "*fop_xf_5_i387"
|
13245 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f,f")
|
13246 |
|
|
(match_operator:XF 3 "binary_fp_operator"
|
13247 |
|
|
[(match_operand:XF 1 "register_operand" "0,f")
|
13248 |
|
|
(float_extend:XF
|
13249 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "fm,0"))]))]
|
13250 |
|
|
"TARGET_80387"
|
13251 |
|
|
"* return output_387_binary_op (insn, operands);"
|
13252 |
|
|
[(set (attr "type")
|
13253 |
|
|
(cond [(match_operand:XF 3 "mult_operator" "")
|
13254 |
|
|
(const_string "fmul")
|
13255 |
|
|
(match_operand:XF 3 "div_operator" "")
|
13256 |
|
|
(const_string "fdiv")
|
13257 |
|
|
]
|
13258 |
|
|
(const_string "fop")))
|
13259 |
|
|
(set_attr "mode" "")])
|
13260 |
|
|
|
13261 |
|
|
(define_insn "*fop_xf_6_i387"
|
13262 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f,f")
|
13263 |
|
|
(match_operator:XF 3 "binary_fp_operator"
|
13264 |
|
|
[(float_extend:XF
|
13265 |
|
|
(match_operand:MODEF 1 "register_operand" "0,f"))
|
13266 |
|
|
(float_extend:XF
|
13267 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "fm,0"))]))]
|
13268 |
|
|
"TARGET_80387"
|
13269 |
|
|
"* return output_387_binary_op (insn, operands);"
|
13270 |
|
|
[(set (attr "type")
|
13271 |
|
|
(cond [(match_operand:XF 3 "mult_operator" "")
|
13272 |
|
|
(const_string "fmul")
|
13273 |
|
|
(match_operand:XF 3 "div_operator" "")
|
13274 |
|
|
(const_string "fdiv")
|
13275 |
|
|
]
|
13276 |
|
|
(const_string "fop")))
|
13277 |
|
|
(set_attr "mode" "")])
|
13278 |
|
|
|
13279 |
|
|
(define_split
|
13280 |
|
|
[(set (match_operand 0 "register_operand" "")
|
13281 |
|
|
(match_operator 3 "binary_fp_operator"
|
13282 |
|
|
[(float (match_operand:SWI24 1 "register_operand" ""))
|
13283 |
|
|
(match_operand 2 "register_operand" "")]))]
|
13284 |
|
|
"reload_completed
|
13285 |
|
|
&& X87_FLOAT_MODE_P (GET_MODE (operands[0]))
|
13286 |
|
|
&& X87_ENABLE_FLOAT (GET_MODE (operands[0]), GET_MODE (operands[1]))"
|
13287 |
|
|
[(const_int 0)]
|
13288 |
|
|
{
|
13289 |
|
|
operands[4] = ix86_force_to_memory (GET_MODE (operands[1]), operands[1]);
|
13290 |
|
|
operands[4] = gen_rtx_FLOAT (GET_MODE (operands[0]), operands[4]);
|
13291 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0],
|
13292 |
|
|
gen_rtx_fmt_ee (GET_CODE (operands[3]),
|
13293 |
|
|
GET_MODE (operands[3]),
|
13294 |
|
|
operands[4],
|
13295 |
|
|
operands[2])));
|
13296 |
|
|
ix86_free_from_memory (GET_MODE (operands[1]));
|
13297 |
|
|
DONE;
|
13298 |
|
|
})
|
13299 |
|
|
|
13300 |
|
|
(define_split
|
13301 |
|
|
[(set (match_operand 0 "register_operand" "")
|
13302 |
|
|
(match_operator 3 "binary_fp_operator"
|
13303 |
|
|
[(match_operand 1 "register_operand" "")
|
13304 |
|
|
(float (match_operand:SWI24 2 "register_operand" ""))]))]
|
13305 |
|
|
"reload_completed
|
13306 |
|
|
&& X87_FLOAT_MODE_P (GET_MODE (operands[0]))
|
13307 |
|
|
&& X87_ENABLE_FLOAT (GET_MODE (operands[0]), GET_MODE (operands[2]))"
|
13308 |
|
|
[(const_int 0)]
|
13309 |
|
|
{
|
13310 |
|
|
operands[4] = ix86_force_to_memory (GET_MODE (operands[2]), operands[2]);
|
13311 |
|
|
operands[4] = gen_rtx_FLOAT (GET_MODE (operands[0]), operands[4]);
|
13312 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0],
|
13313 |
|
|
gen_rtx_fmt_ee (GET_CODE (operands[3]),
|
13314 |
|
|
GET_MODE (operands[3]),
|
13315 |
|
|
operands[1],
|
13316 |
|
|
operands[4])));
|
13317 |
|
|
ix86_free_from_memory (GET_MODE (operands[2]));
|
13318 |
|
|
DONE;
|
13319 |
|
|
})
|
13320 |
|
|
|
13321 |
|
|
;; FPU special functions.
|
13322 |
|
|
|
13323 |
|
|
;; This pattern implements a no-op XFmode truncation for
|
13324 |
|
|
;; all fancy i386 XFmode math functions.
|
13325 |
|
|
|
13326 |
|
|
(define_insn "truncxf2_i387_noop_unspec"
|
13327 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f")
|
13328 |
|
|
(unspec:MODEF [(match_operand:XF 1 "register_operand" "f")]
|
13329 |
|
|
UNSPEC_TRUNC_NOOP))]
|
13330 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
13331 |
|
|
"* return output_387_reg_move (insn, operands);"
|
13332 |
|
|
[(set_attr "type" "fmov")
|
13333 |
|
|
(set_attr "mode" "")])
|
13334 |
|
|
|
13335 |
|
|
(define_insn "sqrtxf2"
|
13336 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13337 |
|
|
(sqrt:XF (match_operand:XF 1 "register_operand" "0")))]
|
13338 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
13339 |
|
|
"fsqrt"
|
13340 |
|
|
[(set_attr "type" "fpspc")
|
13341 |
|
|
(set_attr "mode" "XF")
|
13342 |
|
|
(set_attr "athlon_decode" "direct")
|
13343 |
|
|
(set_attr "amdfam10_decode" "direct")
|
13344 |
|
|
(set_attr "bdver1_decode" "direct")])
|
13345 |
|
|
|
13346 |
|
|
(define_insn "sqrt_extendxf2_i387"
|
13347 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13348 |
|
|
(sqrt:XF
|
13349 |
|
|
(float_extend:XF
|
13350 |
|
|
(match_operand:MODEF 1 "register_operand" "0"))))]
|
13351 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
13352 |
|
|
"fsqrt"
|
13353 |
|
|
[(set_attr "type" "fpspc")
|
13354 |
|
|
(set_attr "mode" "XF")
|
13355 |
|
|
(set_attr "athlon_decode" "direct")
|
13356 |
|
|
(set_attr "amdfam10_decode" "direct")
|
13357 |
|
|
(set_attr "bdver1_decode" "direct")])
|
13358 |
|
|
|
13359 |
|
|
(define_insn "*rsqrtsf2_sse"
|
13360 |
|
|
[(set (match_operand:SF 0 "register_operand" "=x")
|
13361 |
|
|
(unspec:SF [(match_operand:SF 1 "nonimmediate_operand" "xm")]
|
13362 |
|
|
UNSPEC_RSQRT))]
|
13363 |
|
|
"TARGET_SSE_MATH"
|
13364 |
|
|
"%vrsqrtss\t{%1, %d0|%d0, %1}"
|
13365 |
|
|
[(set_attr "type" "sse")
|
13366 |
|
|
(set_attr "atom_sse_attr" "rcp")
|
13367 |
|
|
(set_attr "prefix" "maybe_vex")
|
13368 |
|
|
(set_attr "mode" "SF")])
|
13369 |
|
|
|
13370 |
|
|
(define_expand "rsqrtsf2"
|
13371 |
|
|
[(set (match_operand:SF 0 "register_operand" "")
|
13372 |
|
|
(unspec:SF [(match_operand:SF 1 "nonimmediate_operand" "")]
|
13373 |
|
|
UNSPEC_RSQRT))]
|
13374 |
|
|
"TARGET_SSE_MATH"
|
13375 |
|
|
{
|
13376 |
|
|
ix86_emit_swsqrtsf (operands[0], operands[1], SFmode, 1);
|
13377 |
|
|
DONE;
|
13378 |
|
|
})
|
13379 |
|
|
|
13380 |
|
|
(define_insn "*sqrt2_sse"
|
13381 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x")
|
13382 |
|
|
(sqrt:MODEF
|
13383 |
|
|
(match_operand:MODEF 1 "nonimmediate_operand" "xm")))]
|
13384 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH"
|
13385 |
|
|
"%vsqrt\t{%1, %d0|%d0, %1}"
|
13386 |
|
|
[(set_attr "type" "sse")
|
13387 |
|
|
(set_attr "atom_sse_attr" "sqrt")
|
13388 |
|
|
(set_attr "prefix" "maybe_vex")
|
13389 |
|
|
(set_attr "mode" "")
|
13390 |
|
|
(set_attr "athlon_decode" "*")
|
13391 |
|
|
(set_attr "amdfam10_decode" "*")
|
13392 |
|
|
(set_attr "bdver1_decode" "*")])
|
13393 |
|
|
|
13394 |
|
|
(define_expand "sqrt2"
|
13395 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "")
|
13396 |
|
|
(sqrt:MODEF
|
13397 |
|
|
(match_operand:MODEF 1 "nonimmediate_operand" "")))]
|
13398 |
|
|
"(TARGET_USE_FANCY_MATH_387 && X87_ENABLE_ARITH (mode))
|
13399 |
|
|
|| (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)"
|
13400 |
|
|
{
|
13401 |
|
|
if (mode == SFmode
|
13402 |
|
|
&& TARGET_SSE_MATH
|
13403 |
|
|
&& TARGET_RECIP_SQRT
|
13404 |
|
|
&& !optimize_function_for_size_p (cfun)
|
13405 |
|
|
&& flag_finite_math_only && !flag_trapping_math
|
13406 |
|
|
&& flag_unsafe_math_optimizations)
|
13407 |
|
|
{
|
13408 |
|
|
ix86_emit_swsqrtsf (operands[0], operands[1], SFmode, 0);
|
13409 |
|
|
DONE;
|
13410 |
|
|
}
|
13411 |
|
|
|
13412 |
|
|
if (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH))
|
13413 |
|
|
{
|
13414 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
13415 |
|
|
rtx op1 = force_reg (mode, operands[1]);
|
13416 |
|
|
|
13417 |
|
|
emit_insn (gen_sqrt_extendxf2_i387 (op0, op1));
|
13418 |
|
|
emit_insn (gen_truncxf2_i387_noop_unspec (operands[0], op0));
|
13419 |
|
|
DONE;
|
13420 |
|
|
}
|
13421 |
|
|
})
|
13422 |
|
|
|
13423 |
|
|
(define_insn "fpremxf4_i387"
|
13424 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13425 |
|
|
(unspec:XF [(match_operand:XF 2 "register_operand" "0")
|
13426 |
|
|
(match_operand:XF 3 "register_operand" "1")]
|
13427 |
|
|
UNSPEC_FPREM_F))
|
13428 |
|
|
(set (match_operand:XF 1 "register_operand" "=u")
|
13429 |
|
|
(unspec:XF [(match_dup 2) (match_dup 3)]
|
13430 |
|
|
UNSPEC_FPREM_U))
|
13431 |
|
|
(set (reg:CCFP FPSR_REG)
|
13432 |
|
|
(unspec:CCFP [(match_dup 2) (match_dup 3)]
|
13433 |
|
|
UNSPEC_C2_FLAG))]
|
13434 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
13435 |
|
|
"fprem"
|
13436 |
|
|
[(set_attr "type" "fpspc")
|
13437 |
|
|
(set_attr "mode" "XF")])
|
13438 |
|
|
|
13439 |
|
|
(define_expand "fmodxf3"
|
13440 |
|
|
[(use (match_operand:XF 0 "register_operand" ""))
|
13441 |
|
|
(use (match_operand:XF 1 "general_operand" ""))
|
13442 |
|
|
(use (match_operand:XF 2 "general_operand" ""))]
|
13443 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
13444 |
|
|
{
|
13445 |
|
|
rtx label = gen_label_rtx ();
|
13446 |
|
|
|
13447 |
|
|
rtx op1 = gen_reg_rtx (XFmode);
|
13448 |
|
|
rtx op2 = gen_reg_rtx (XFmode);
|
13449 |
|
|
|
13450 |
|
|
emit_move_insn (op2, operands[2]);
|
13451 |
|
|
emit_move_insn (op1, operands[1]);
|
13452 |
|
|
|
13453 |
|
|
emit_label (label);
|
13454 |
|
|
emit_insn (gen_fpremxf4_i387 (op1, op2, op1, op2));
|
13455 |
|
|
ix86_emit_fp_unordered_jump (label);
|
13456 |
|
|
LABEL_NUSES (label) = 1;
|
13457 |
|
|
|
13458 |
|
|
emit_move_insn (operands[0], op1);
|
13459 |
|
|
DONE;
|
13460 |
|
|
})
|
13461 |
|
|
|
13462 |
|
|
(define_expand "fmod3"
|
13463 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
13464 |
|
|
(use (match_operand:MODEF 1 "general_operand" ""))
|
13465 |
|
|
(use (match_operand:MODEF 2 "general_operand" ""))]
|
13466 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
13467 |
|
|
{
|
13468 |
|
|
rtx (*gen_truncxf) (rtx, rtx);
|
13469 |
|
|
|
13470 |
|
|
rtx label = gen_label_rtx ();
|
13471 |
|
|
|
13472 |
|
|
rtx op1 = gen_reg_rtx (XFmode);
|
13473 |
|
|
rtx op2 = gen_reg_rtx (XFmode);
|
13474 |
|
|
|
13475 |
|
|
emit_insn (gen_extendxf2 (op2, operands[2]));
|
13476 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
13477 |
|
|
|
13478 |
|
|
emit_label (label);
|
13479 |
|
|
emit_insn (gen_fpremxf4_i387 (op1, op2, op1, op2));
|
13480 |
|
|
ix86_emit_fp_unordered_jump (label);
|
13481 |
|
|
LABEL_NUSES (label) = 1;
|
13482 |
|
|
|
13483 |
|
|
/* Truncate the result properly for strict SSE math. */
|
13484 |
|
|
if (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
13485 |
|
|
&& !TARGET_MIX_SSE_I387)
|
13486 |
|
|
gen_truncxf = gen_truncxf2;
|
13487 |
|
|
else
|
13488 |
|
|
gen_truncxf = gen_truncxf2_i387_noop_unspec;
|
13489 |
|
|
|
13490 |
|
|
emit_insn (gen_truncxf (operands[0], op1));
|
13491 |
|
|
DONE;
|
13492 |
|
|
})
|
13493 |
|
|
|
13494 |
|
|
(define_insn "fprem1xf4_i387"
|
13495 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13496 |
|
|
(unspec:XF [(match_operand:XF 2 "register_operand" "0")
|
13497 |
|
|
(match_operand:XF 3 "register_operand" "1")]
|
13498 |
|
|
UNSPEC_FPREM1_F))
|
13499 |
|
|
(set (match_operand:XF 1 "register_operand" "=u")
|
13500 |
|
|
(unspec:XF [(match_dup 2) (match_dup 3)]
|
13501 |
|
|
UNSPEC_FPREM1_U))
|
13502 |
|
|
(set (reg:CCFP FPSR_REG)
|
13503 |
|
|
(unspec:CCFP [(match_dup 2) (match_dup 3)]
|
13504 |
|
|
UNSPEC_C2_FLAG))]
|
13505 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
13506 |
|
|
"fprem1"
|
13507 |
|
|
[(set_attr "type" "fpspc")
|
13508 |
|
|
(set_attr "mode" "XF")])
|
13509 |
|
|
|
13510 |
|
|
(define_expand "remainderxf3"
|
13511 |
|
|
[(use (match_operand:XF 0 "register_operand" ""))
|
13512 |
|
|
(use (match_operand:XF 1 "general_operand" ""))
|
13513 |
|
|
(use (match_operand:XF 2 "general_operand" ""))]
|
13514 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
13515 |
|
|
{
|
13516 |
|
|
rtx label = gen_label_rtx ();
|
13517 |
|
|
|
13518 |
|
|
rtx op1 = gen_reg_rtx (XFmode);
|
13519 |
|
|
rtx op2 = gen_reg_rtx (XFmode);
|
13520 |
|
|
|
13521 |
|
|
emit_move_insn (op2, operands[2]);
|
13522 |
|
|
emit_move_insn (op1, operands[1]);
|
13523 |
|
|
|
13524 |
|
|
emit_label (label);
|
13525 |
|
|
emit_insn (gen_fprem1xf4_i387 (op1, op2, op1, op2));
|
13526 |
|
|
ix86_emit_fp_unordered_jump (label);
|
13527 |
|
|
LABEL_NUSES (label) = 1;
|
13528 |
|
|
|
13529 |
|
|
emit_move_insn (operands[0], op1);
|
13530 |
|
|
DONE;
|
13531 |
|
|
})
|
13532 |
|
|
|
13533 |
|
|
(define_expand "remainder3"
|
13534 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
13535 |
|
|
(use (match_operand:MODEF 1 "general_operand" ""))
|
13536 |
|
|
(use (match_operand:MODEF 2 "general_operand" ""))]
|
13537 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
13538 |
|
|
{
|
13539 |
|
|
rtx (*gen_truncxf) (rtx, rtx);
|
13540 |
|
|
|
13541 |
|
|
rtx label = gen_label_rtx ();
|
13542 |
|
|
|
13543 |
|
|
rtx op1 = gen_reg_rtx (XFmode);
|
13544 |
|
|
rtx op2 = gen_reg_rtx (XFmode);
|
13545 |
|
|
|
13546 |
|
|
emit_insn (gen_extendxf2 (op2, operands[2]));
|
13547 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
13548 |
|
|
|
13549 |
|
|
emit_label (label);
|
13550 |
|
|
|
13551 |
|
|
emit_insn (gen_fprem1xf4_i387 (op1, op2, op1, op2));
|
13552 |
|
|
ix86_emit_fp_unordered_jump (label);
|
13553 |
|
|
LABEL_NUSES (label) = 1;
|
13554 |
|
|
|
13555 |
|
|
/* Truncate the result properly for strict SSE math. */
|
13556 |
|
|
if (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
13557 |
|
|
&& !TARGET_MIX_SSE_I387)
|
13558 |
|
|
gen_truncxf = gen_truncxf2;
|
13559 |
|
|
else
|
13560 |
|
|
gen_truncxf = gen_truncxf2_i387_noop_unspec;
|
13561 |
|
|
|
13562 |
|
|
emit_insn (gen_truncxf (operands[0], op1));
|
13563 |
|
|
DONE;
|
13564 |
|
|
})
|
13565 |
|
|
|
13566 |
|
|
(define_insn "*sinxf2_i387"
|
13567 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13568 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "0")] UNSPEC_SIN))]
|
13569 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13570 |
|
|
&& flag_unsafe_math_optimizations"
|
13571 |
|
|
"fsin"
|
13572 |
|
|
[(set_attr "type" "fpspc")
|
13573 |
|
|
(set_attr "mode" "XF")])
|
13574 |
|
|
|
13575 |
|
|
(define_insn "*sin_extendxf2_i387"
|
13576 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13577 |
|
|
(unspec:XF [(float_extend:XF
|
13578 |
|
|
(match_operand:MODEF 1 "register_operand" "0"))]
|
13579 |
|
|
UNSPEC_SIN))]
|
13580 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13581 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13582 |
|
|
|| TARGET_MIX_SSE_I387)
|
13583 |
|
|
&& flag_unsafe_math_optimizations"
|
13584 |
|
|
"fsin"
|
13585 |
|
|
[(set_attr "type" "fpspc")
|
13586 |
|
|
(set_attr "mode" "XF")])
|
13587 |
|
|
|
13588 |
|
|
(define_insn "*cosxf2_i387"
|
13589 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13590 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "0")] UNSPEC_COS))]
|
13591 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13592 |
|
|
&& flag_unsafe_math_optimizations"
|
13593 |
|
|
"fcos"
|
13594 |
|
|
[(set_attr "type" "fpspc")
|
13595 |
|
|
(set_attr "mode" "XF")])
|
13596 |
|
|
|
13597 |
|
|
(define_insn "*cos_extendxf2_i387"
|
13598 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13599 |
|
|
(unspec:XF [(float_extend:XF
|
13600 |
|
|
(match_operand:MODEF 1 "register_operand" "0"))]
|
13601 |
|
|
UNSPEC_COS))]
|
13602 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13603 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13604 |
|
|
|| TARGET_MIX_SSE_I387)
|
13605 |
|
|
&& flag_unsafe_math_optimizations"
|
13606 |
|
|
"fcos"
|
13607 |
|
|
[(set_attr "type" "fpspc")
|
13608 |
|
|
(set_attr "mode" "XF")])
|
13609 |
|
|
|
13610 |
|
|
;; When sincos pattern is defined, sin and cos builtin functions will be
|
13611 |
|
|
;; expanded to sincos pattern with one of its outputs left unused.
|
13612 |
|
|
;; CSE pass will figure out if two sincos patterns can be combined,
|
13613 |
|
|
;; otherwise sincos pattern will be split back to sin or cos pattern,
|
13614 |
|
|
;; depending on the unused output.
|
13615 |
|
|
|
13616 |
|
|
(define_insn "sincosxf3"
|
13617 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13618 |
|
|
(unspec:XF [(match_operand:XF 2 "register_operand" "0")]
|
13619 |
|
|
UNSPEC_SINCOS_COS))
|
13620 |
|
|
(set (match_operand:XF 1 "register_operand" "=u")
|
13621 |
|
|
(unspec:XF [(match_dup 2)] UNSPEC_SINCOS_SIN))]
|
13622 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13623 |
|
|
&& flag_unsafe_math_optimizations"
|
13624 |
|
|
"fsincos"
|
13625 |
|
|
[(set_attr "type" "fpspc")
|
13626 |
|
|
(set_attr "mode" "XF")])
|
13627 |
|
|
|
13628 |
|
|
(define_split
|
13629 |
|
|
[(set (match_operand:XF 0 "register_operand" "")
|
13630 |
|
|
(unspec:XF [(match_operand:XF 2 "register_operand" "")]
|
13631 |
|
|
UNSPEC_SINCOS_COS))
|
13632 |
|
|
(set (match_operand:XF 1 "register_operand" "")
|
13633 |
|
|
(unspec:XF [(match_dup 2)] UNSPEC_SINCOS_SIN))]
|
13634 |
|
|
"find_regno_note (insn, REG_UNUSED, REGNO (operands[0]))
|
13635 |
|
|
&& can_create_pseudo_p ()"
|
13636 |
|
|
[(set (match_dup 1) (unspec:XF [(match_dup 2)] UNSPEC_SIN))])
|
13637 |
|
|
|
13638 |
|
|
(define_split
|
13639 |
|
|
[(set (match_operand:XF 0 "register_operand" "")
|
13640 |
|
|
(unspec:XF [(match_operand:XF 2 "register_operand" "")]
|
13641 |
|
|
UNSPEC_SINCOS_COS))
|
13642 |
|
|
(set (match_operand:XF 1 "register_operand" "")
|
13643 |
|
|
(unspec:XF [(match_dup 2)] UNSPEC_SINCOS_SIN))]
|
13644 |
|
|
"find_regno_note (insn, REG_UNUSED, REGNO (operands[1]))
|
13645 |
|
|
&& can_create_pseudo_p ()"
|
13646 |
|
|
[(set (match_dup 0) (unspec:XF [(match_dup 2)] UNSPEC_COS))])
|
13647 |
|
|
|
13648 |
|
|
(define_insn "sincos_extendxf3_i387"
|
13649 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13650 |
|
|
(unspec:XF [(float_extend:XF
|
13651 |
|
|
(match_operand:MODEF 2 "register_operand" "0"))]
|
13652 |
|
|
UNSPEC_SINCOS_COS))
|
13653 |
|
|
(set (match_operand:XF 1 "register_operand" "=u")
|
13654 |
|
|
(unspec:XF [(float_extend:XF (match_dup 2))] UNSPEC_SINCOS_SIN))]
|
13655 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13656 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13657 |
|
|
|| TARGET_MIX_SSE_I387)
|
13658 |
|
|
&& flag_unsafe_math_optimizations"
|
13659 |
|
|
"fsincos"
|
13660 |
|
|
[(set_attr "type" "fpspc")
|
13661 |
|
|
(set_attr "mode" "XF")])
|
13662 |
|
|
|
13663 |
|
|
(define_split
|
13664 |
|
|
[(set (match_operand:XF 0 "register_operand" "")
|
13665 |
|
|
(unspec:XF [(float_extend:XF
|
13666 |
|
|
(match_operand:MODEF 2 "register_operand" ""))]
|
13667 |
|
|
UNSPEC_SINCOS_COS))
|
13668 |
|
|
(set (match_operand:XF 1 "register_operand" "")
|
13669 |
|
|
(unspec:XF [(float_extend:XF (match_dup 2))] UNSPEC_SINCOS_SIN))]
|
13670 |
|
|
"find_regno_note (insn, REG_UNUSED, REGNO (operands[0]))
|
13671 |
|
|
&& can_create_pseudo_p ()"
|
13672 |
|
|
[(set (match_dup 1)
|
13673 |
|
|
(unspec:XF [(float_extend:XF (match_dup 2))] UNSPEC_SIN))])
|
13674 |
|
|
|
13675 |
|
|
(define_split
|
13676 |
|
|
[(set (match_operand:XF 0 "register_operand" "")
|
13677 |
|
|
(unspec:XF [(float_extend:XF
|
13678 |
|
|
(match_operand:MODEF 2 "register_operand" ""))]
|
13679 |
|
|
UNSPEC_SINCOS_COS))
|
13680 |
|
|
(set (match_operand:XF 1 "register_operand" "")
|
13681 |
|
|
(unspec:XF [(float_extend:XF (match_dup 2))] UNSPEC_SINCOS_SIN))]
|
13682 |
|
|
"find_regno_note (insn, REG_UNUSED, REGNO (operands[1]))
|
13683 |
|
|
&& can_create_pseudo_p ()"
|
13684 |
|
|
[(set (match_dup 0)
|
13685 |
|
|
(unspec:XF [(float_extend:XF (match_dup 2))] UNSPEC_COS))])
|
13686 |
|
|
|
13687 |
|
|
(define_expand "sincos3"
|
13688 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
13689 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))
|
13690 |
|
|
(use (match_operand:MODEF 2 "register_operand" ""))]
|
13691 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13692 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13693 |
|
|
|| TARGET_MIX_SSE_I387)
|
13694 |
|
|
&& flag_unsafe_math_optimizations"
|
13695 |
|
|
{
|
13696 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
13697 |
|
|
rtx op1 = gen_reg_rtx (XFmode);
|
13698 |
|
|
|
13699 |
|
|
emit_insn (gen_sincos_extendxf3_i387 (op0, op1, operands[2]));
|
13700 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
13701 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[1], op1));
|
13702 |
|
|
DONE;
|
13703 |
|
|
})
|
13704 |
|
|
|
13705 |
|
|
(define_insn "fptanxf4_i387"
|
13706 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13707 |
|
|
(match_operand:XF 3 "const_double_operand" "F"))
|
13708 |
|
|
(set (match_operand:XF 1 "register_operand" "=u")
|
13709 |
|
|
(unspec:XF [(match_operand:XF 2 "register_operand" "0")]
|
13710 |
|
|
UNSPEC_TAN))]
|
13711 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13712 |
|
|
&& flag_unsafe_math_optimizations
|
13713 |
|
|
&& standard_80387_constant_p (operands[3]) == 2"
|
13714 |
|
|
"fptan"
|
13715 |
|
|
[(set_attr "type" "fpspc")
|
13716 |
|
|
(set_attr "mode" "XF")])
|
13717 |
|
|
|
13718 |
|
|
(define_insn "fptan_extendxf4_i387"
|
13719 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=f")
|
13720 |
|
|
(match_operand:MODEF 3 "const_double_operand" "F"))
|
13721 |
|
|
(set (match_operand:XF 1 "register_operand" "=u")
|
13722 |
|
|
(unspec:XF [(float_extend:XF
|
13723 |
|
|
(match_operand:MODEF 2 "register_operand" "0"))]
|
13724 |
|
|
UNSPEC_TAN))]
|
13725 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13726 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13727 |
|
|
|| TARGET_MIX_SSE_I387)
|
13728 |
|
|
&& flag_unsafe_math_optimizations
|
13729 |
|
|
&& standard_80387_constant_p (operands[3]) == 2"
|
13730 |
|
|
"fptan"
|
13731 |
|
|
[(set_attr "type" "fpspc")
|
13732 |
|
|
(set_attr "mode" "XF")])
|
13733 |
|
|
|
13734 |
|
|
(define_expand "tanxf2"
|
13735 |
|
|
[(use (match_operand:XF 0 "register_operand" ""))
|
13736 |
|
|
(use (match_operand:XF 1 "register_operand" ""))]
|
13737 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13738 |
|
|
&& flag_unsafe_math_optimizations"
|
13739 |
|
|
{
|
13740 |
|
|
rtx one = gen_reg_rtx (XFmode);
|
13741 |
|
|
rtx op2 = CONST1_RTX (XFmode); /* fld1 */
|
13742 |
|
|
|
13743 |
|
|
emit_insn (gen_fptanxf4_i387 (one, operands[0], operands[1], op2));
|
13744 |
|
|
DONE;
|
13745 |
|
|
})
|
13746 |
|
|
|
13747 |
|
|
(define_expand "tan2"
|
13748 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
13749 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
13750 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13751 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13752 |
|
|
|| TARGET_MIX_SSE_I387)
|
13753 |
|
|
&& flag_unsafe_math_optimizations"
|
13754 |
|
|
{
|
13755 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
13756 |
|
|
|
13757 |
|
|
rtx one = gen_reg_rtx (mode);
|
13758 |
|
|
rtx op2 = CONST1_RTX (mode); /* fld1 */
|
13759 |
|
|
|
13760 |
|
|
emit_insn (gen_fptan_extendxf4_i387 (one, op0,
|
13761 |
|
|
operands[1], op2));
|
13762 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
13763 |
|
|
DONE;
|
13764 |
|
|
})
|
13765 |
|
|
|
13766 |
|
|
(define_insn "*fpatanxf3_i387"
|
13767 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13768 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "0")
|
13769 |
|
|
(match_operand:XF 2 "register_operand" "u")]
|
13770 |
|
|
UNSPEC_FPATAN))
|
13771 |
|
|
(clobber (match_scratch:XF 3 "=2"))]
|
13772 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13773 |
|
|
&& flag_unsafe_math_optimizations"
|
13774 |
|
|
"fpatan"
|
13775 |
|
|
[(set_attr "type" "fpspc")
|
13776 |
|
|
(set_attr "mode" "XF")])
|
13777 |
|
|
|
13778 |
|
|
(define_insn "fpatan_extendxf3_i387"
|
13779 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13780 |
|
|
(unspec:XF [(float_extend:XF
|
13781 |
|
|
(match_operand:MODEF 1 "register_operand" "0"))
|
13782 |
|
|
(float_extend:XF
|
13783 |
|
|
(match_operand:MODEF 2 "register_operand" "u"))]
|
13784 |
|
|
UNSPEC_FPATAN))
|
13785 |
|
|
(clobber (match_scratch:XF 3 "=2"))]
|
13786 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13787 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13788 |
|
|
|| TARGET_MIX_SSE_I387)
|
13789 |
|
|
&& flag_unsafe_math_optimizations"
|
13790 |
|
|
"fpatan"
|
13791 |
|
|
[(set_attr "type" "fpspc")
|
13792 |
|
|
(set_attr "mode" "XF")])
|
13793 |
|
|
|
13794 |
|
|
(define_expand "atan2xf3"
|
13795 |
|
|
[(parallel [(set (match_operand:XF 0 "register_operand" "")
|
13796 |
|
|
(unspec:XF [(match_operand:XF 2 "register_operand" "")
|
13797 |
|
|
(match_operand:XF 1 "register_operand" "")]
|
13798 |
|
|
UNSPEC_FPATAN))
|
13799 |
|
|
(clobber (match_scratch:XF 3 ""))])]
|
13800 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13801 |
|
|
&& flag_unsafe_math_optimizations")
|
13802 |
|
|
|
13803 |
|
|
(define_expand "atan23"
|
13804 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
13805 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))
|
13806 |
|
|
(use (match_operand:MODEF 2 "register_operand" ""))]
|
13807 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13808 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13809 |
|
|
|| TARGET_MIX_SSE_I387)
|
13810 |
|
|
&& flag_unsafe_math_optimizations"
|
13811 |
|
|
{
|
13812 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
13813 |
|
|
|
13814 |
|
|
emit_insn (gen_fpatan_extendxf3_i387 (op0, operands[2], operands[1]));
|
13815 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
13816 |
|
|
DONE;
|
13817 |
|
|
})
|
13818 |
|
|
|
13819 |
|
|
(define_expand "atanxf2"
|
13820 |
|
|
[(parallel [(set (match_operand:XF 0 "register_operand" "")
|
13821 |
|
|
(unspec:XF [(match_dup 2)
|
13822 |
|
|
(match_operand:XF 1 "register_operand" "")]
|
13823 |
|
|
UNSPEC_FPATAN))
|
13824 |
|
|
(clobber (match_scratch:XF 3 ""))])]
|
13825 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13826 |
|
|
&& flag_unsafe_math_optimizations"
|
13827 |
|
|
{
|
13828 |
|
|
operands[2] = gen_reg_rtx (XFmode);
|
13829 |
|
|
emit_move_insn (operands[2], CONST1_RTX (XFmode)); /* fld1 */
|
13830 |
|
|
})
|
13831 |
|
|
|
13832 |
|
|
(define_expand "atan2"
|
13833 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
13834 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
13835 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13836 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13837 |
|
|
|| TARGET_MIX_SSE_I387)
|
13838 |
|
|
&& flag_unsafe_math_optimizations"
|
13839 |
|
|
{
|
13840 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
13841 |
|
|
|
13842 |
|
|
rtx op2 = gen_reg_rtx (mode);
|
13843 |
|
|
emit_move_insn (op2, CONST1_RTX (mode)); /* fld1 */
|
13844 |
|
|
|
13845 |
|
|
emit_insn (gen_fpatan_extendxf3_i387 (op0, op2, operands[1]));
|
13846 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
13847 |
|
|
DONE;
|
13848 |
|
|
})
|
13849 |
|
|
|
13850 |
|
|
(define_expand "asinxf2"
|
13851 |
|
|
[(set (match_dup 2)
|
13852 |
|
|
(mult:XF (match_operand:XF 1 "register_operand" "")
|
13853 |
|
|
(match_dup 1)))
|
13854 |
|
|
(set (match_dup 4) (minus:XF (match_dup 3) (match_dup 2)))
|
13855 |
|
|
(set (match_dup 5) (sqrt:XF (match_dup 4)))
|
13856 |
|
|
(parallel [(set (match_operand:XF 0 "register_operand" "")
|
13857 |
|
|
(unspec:XF [(match_dup 5) (match_dup 1)]
|
13858 |
|
|
UNSPEC_FPATAN))
|
13859 |
|
|
(clobber (match_scratch:XF 6 ""))])]
|
13860 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13861 |
|
|
&& flag_unsafe_math_optimizations"
|
13862 |
|
|
{
|
13863 |
|
|
int i;
|
13864 |
|
|
|
13865 |
|
|
if (optimize_insn_for_size_p ())
|
13866 |
|
|
FAIL;
|
13867 |
|
|
|
13868 |
|
|
for (i = 2; i < 6; i++)
|
13869 |
|
|
operands[i] = gen_reg_rtx (XFmode);
|
13870 |
|
|
|
13871 |
|
|
emit_move_insn (operands[3], CONST1_RTX (XFmode)); /* fld1 */
|
13872 |
|
|
})
|
13873 |
|
|
|
13874 |
|
|
(define_expand "asin2"
|
13875 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
13876 |
|
|
(use (match_operand:MODEF 1 "general_operand" ""))]
|
13877 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13878 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13879 |
|
|
|| TARGET_MIX_SSE_I387)
|
13880 |
|
|
&& flag_unsafe_math_optimizations"
|
13881 |
|
|
{
|
13882 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
13883 |
|
|
rtx op1 = gen_reg_rtx (XFmode);
|
13884 |
|
|
|
13885 |
|
|
if (optimize_insn_for_size_p ())
|
13886 |
|
|
FAIL;
|
13887 |
|
|
|
13888 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
13889 |
|
|
emit_insn (gen_asinxf2 (op0, op1));
|
13890 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
13891 |
|
|
DONE;
|
13892 |
|
|
})
|
13893 |
|
|
|
13894 |
|
|
(define_expand "acosxf2"
|
13895 |
|
|
[(set (match_dup 2)
|
13896 |
|
|
(mult:XF (match_operand:XF 1 "register_operand" "")
|
13897 |
|
|
(match_dup 1)))
|
13898 |
|
|
(set (match_dup 4) (minus:XF (match_dup 3) (match_dup 2)))
|
13899 |
|
|
(set (match_dup 5) (sqrt:XF (match_dup 4)))
|
13900 |
|
|
(parallel [(set (match_operand:XF 0 "register_operand" "")
|
13901 |
|
|
(unspec:XF [(match_dup 1) (match_dup 5)]
|
13902 |
|
|
UNSPEC_FPATAN))
|
13903 |
|
|
(clobber (match_scratch:XF 6 ""))])]
|
13904 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13905 |
|
|
&& flag_unsafe_math_optimizations"
|
13906 |
|
|
{
|
13907 |
|
|
int i;
|
13908 |
|
|
|
13909 |
|
|
if (optimize_insn_for_size_p ())
|
13910 |
|
|
FAIL;
|
13911 |
|
|
|
13912 |
|
|
for (i = 2; i < 6; i++)
|
13913 |
|
|
operands[i] = gen_reg_rtx (XFmode);
|
13914 |
|
|
|
13915 |
|
|
emit_move_insn (operands[3], CONST1_RTX (XFmode)); /* fld1 */
|
13916 |
|
|
})
|
13917 |
|
|
|
13918 |
|
|
(define_expand "acos2"
|
13919 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
13920 |
|
|
(use (match_operand:MODEF 1 "general_operand" ""))]
|
13921 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13922 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13923 |
|
|
|| TARGET_MIX_SSE_I387)
|
13924 |
|
|
&& flag_unsafe_math_optimizations"
|
13925 |
|
|
{
|
13926 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
13927 |
|
|
rtx op1 = gen_reg_rtx (XFmode);
|
13928 |
|
|
|
13929 |
|
|
if (optimize_insn_for_size_p ())
|
13930 |
|
|
FAIL;
|
13931 |
|
|
|
13932 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
13933 |
|
|
emit_insn (gen_acosxf2 (op0, op1));
|
13934 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
13935 |
|
|
DONE;
|
13936 |
|
|
})
|
13937 |
|
|
|
13938 |
|
|
(define_insn "fyl2xxf3_i387"
|
13939 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13940 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "0")
|
13941 |
|
|
(match_operand:XF 2 "register_operand" "u")]
|
13942 |
|
|
UNSPEC_FYL2X))
|
13943 |
|
|
(clobber (match_scratch:XF 3 "=2"))]
|
13944 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13945 |
|
|
&& flag_unsafe_math_optimizations"
|
13946 |
|
|
"fyl2x"
|
13947 |
|
|
[(set_attr "type" "fpspc")
|
13948 |
|
|
(set_attr "mode" "XF")])
|
13949 |
|
|
|
13950 |
|
|
(define_insn "fyl2x_extendxf3_i387"
|
13951 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
13952 |
|
|
(unspec:XF [(float_extend:XF
|
13953 |
|
|
(match_operand:MODEF 1 "register_operand" "0"))
|
13954 |
|
|
(match_operand:XF 2 "register_operand" "u")]
|
13955 |
|
|
UNSPEC_FYL2X))
|
13956 |
|
|
(clobber (match_scratch:XF 3 "=2"))]
|
13957 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13958 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13959 |
|
|
|| TARGET_MIX_SSE_I387)
|
13960 |
|
|
&& flag_unsafe_math_optimizations"
|
13961 |
|
|
"fyl2x"
|
13962 |
|
|
[(set_attr "type" "fpspc")
|
13963 |
|
|
(set_attr "mode" "XF")])
|
13964 |
|
|
|
13965 |
|
|
(define_expand "logxf2"
|
13966 |
|
|
[(parallel [(set (match_operand:XF 0 "register_operand" "")
|
13967 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "")
|
13968 |
|
|
(match_dup 2)] UNSPEC_FYL2X))
|
13969 |
|
|
(clobber (match_scratch:XF 3 ""))])]
|
13970 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13971 |
|
|
&& flag_unsafe_math_optimizations"
|
13972 |
|
|
{
|
13973 |
|
|
operands[2] = gen_reg_rtx (XFmode);
|
13974 |
|
|
emit_move_insn (operands[2], standard_80387_constant_rtx (4)); /* fldln2 */
|
13975 |
|
|
})
|
13976 |
|
|
|
13977 |
|
|
(define_expand "log2"
|
13978 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
13979 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
13980 |
|
|
"TARGET_USE_FANCY_MATH_387
|
13981 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
13982 |
|
|
|| TARGET_MIX_SSE_I387)
|
13983 |
|
|
&& flag_unsafe_math_optimizations"
|
13984 |
|
|
{
|
13985 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
13986 |
|
|
|
13987 |
|
|
rtx op2 = gen_reg_rtx (XFmode);
|
13988 |
|
|
emit_move_insn (op2, standard_80387_constant_rtx (4)); /* fldln2 */
|
13989 |
|
|
|
13990 |
|
|
emit_insn (gen_fyl2x_extendxf3_i387 (op0, operands[1], op2));
|
13991 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
13992 |
|
|
DONE;
|
13993 |
|
|
})
|
13994 |
|
|
|
13995 |
|
|
(define_expand "log10xf2"
|
13996 |
|
|
[(parallel [(set (match_operand:XF 0 "register_operand" "")
|
13997 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "")
|
13998 |
|
|
(match_dup 2)] UNSPEC_FYL2X))
|
13999 |
|
|
(clobber (match_scratch:XF 3 ""))])]
|
14000 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14001 |
|
|
&& flag_unsafe_math_optimizations"
|
14002 |
|
|
{
|
14003 |
|
|
operands[2] = gen_reg_rtx (XFmode);
|
14004 |
|
|
emit_move_insn (operands[2], standard_80387_constant_rtx (3)); /* fldlg2 */
|
14005 |
|
|
})
|
14006 |
|
|
|
14007 |
|
|
(define_expand "log102"
|
14008 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14009 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
14010 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14011 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14012 |
|
|
|| TARGET_MIX_SSE_I387)
|
14013 |
|
|
&& flag_unsafe_math_optimizations"
|
14014 |
|
|
{
|
14015 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
14016 |
|
|
|
14017 |
|
|
rtx op2 = gen_reg_rtx (XFmode);
|
14018 |
|
|
emit_move_insn (op2, standard_80387_constant_rtx (3)); /* fldlg2 */
|
14019 |
|
|
|
14020 |
|
|
emit_insn (gen_fyl2x_extendxf3_i387 (op0, operands[1], op2));
|
14021 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
14022 |
|
|
DONE;
|
14023 |
|
|
})
|
14024 |
|
|
|
14025 |
|
|
(define_expand "log2xf2"
|
14026 |
|
|
[(parallel [(set (match_operand:XF 0 "register_operand" "")
|
14027 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "")
|
14028 |
|
|
(match_dup 2)] UNSPEC_FYL2X))
|
14029 |
|
|
(clobber (match_scratch:XF 3 ""))])]
|
14030 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14031 |
|
|
&& flag_unsafe_math_optimizations"
|
14032 |
|
|
{
|
14033 |
|
|
operands[2] = gen_reg_rtx (XFmode);
|
14034 |
|
|
emit_move_insn (operands[2], CONST1_RTX (XFmode)); /* fld1 */
|
14035 |
|
|
})
|
14036 |
|
|
|
14037 |
|
|
(define_expand "log22"
|
14038 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14039 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
14040 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14041 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14042 |
|
|
|| TARGET_MIX_SSE_I387)
|
14043 |
|
|
&& flag_unsafe_math_optimizations"
|
14044 |
|
|
{
|
14045 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
14046 |
|
|
|
14047 |
|
|
rtx op2 = gen_reg_rtx (XFmode);
|
14048 |
|
|
emit_move_insn (op2, CONST1_RTX (XFmode)); /* fld1 */
|
14049 |
|
|
|
14050 |
|
|
emit_insn (gen_fyl2x_extendxf3_i387 (op0, operands[1], op2));
|
14051 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
14052 |
|
|
DONE;
|
14053 |
|
|
})
|
14054 |
|
|
|
14055 |
|
|
(define_insn "fyl2xp1xf3_i387"
|
14056 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
14057 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "0")
|
14058 |
|
|
(match_operand:XF 2 "register_operand" "u")]
|
14059 |
|
|
UNSPEC_FYL2XP1))
|
14060 |
|
|
(clobber (match_scratch:XF 3 "=2"))]
|
14061 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14062 |
|
|
&& flag_unsafe_math_optimizations"
|
14063 |
|
|
"fyl2xp1"
|
14064 |
|
|
[(set_attr "type" "fpspc")
|
14065 |
|
|
(set_attr "mode" "XF")])
|
14066 |
|
|
|
14067 |
|
|
(define_insn "fyl2xp1_extendxf3_i387"
|
14068 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
14069 |
|
|
(unspec:XF [(float_extend:XF
|
14070 |
|
|
(match_operand:MODEF 1 "register_operand" "0"))
|
14071 |
|
|
(match_operand:XF 2 "register_operand" "u")]
|
14072 |
|
|
UNSPEC_FYL2XP1))
|
14073 |
|
|
(clobber (match_scratch:XF 3 "=2"))]
|
14074 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14075 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14076 |
|
|
|| TARGET_MIX_SSE_I387)
|
14077 |
|
|
&& flag_unsafe_math_optimizations"
|
14078 |
|
|
"fyl2xp1"
|
14079 |
|
|
[(set_attr "type" "fpspc")
|
14080 |
|
|
(set_attr "mode" "XF")])
|
14081 |
|
|
|
14082 |
|
|
(define_expand "log1pxf2"
|
14083 |
|
|
[(use (match_operand:XF 0 "register_operand" ""))
|
14084 |
|
|
(use (match_operand:XF 1 "register_operand" ""))]
|
14085 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14086 |
|
|
&& flag_unsafe_math_optimizations"
|
14087 |
|
|
{
|
14088 |
|
|
if (optimize_insn_for_size_p ())
|
14089 |
|
|
FAIL;
|
14090 |
|
|
|
14091 |
|
|
ix86_emit_i387_log1p (operands[0], operands[1]);
|
14092 |
|
|
DONE;
|
14093 |
|
|
})
|
14094 |
|
|
|
14095 |
|
|
(define_expand "log1p2"
|
14096 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14097 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
14098 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14099 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14100 |
|
|
|| TARGET_MIX_SSE_I387)
|
14101 |
|
|
&& flag_unsafe_math_optimizations"
|
14102 |
|
|
{
|
14103 |
|
|
rtx op0;
|
14104 |
|
|
|
14105 |
|
|
if (optimize_insn_for_size_p ())
|
14106 |
|
|
FAIL;
|
14107 |
|
|
|
14108 |
|
|
op0 = gen_reg_rtx (XFmode);
|
14109 |
|
|
|
14110 |
|
|
operands[1] = gen_rtx_FLOAT_EXTEND (XFmode, operands[1]);
|
14111 |
|
|
|
14112 |
|
|
ix86_emit_i387_log1p (op0, operands[1]);
|
14113 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
14114 |
|
|
DONE;
|
14115 |
|
|
})
|
14116 |
|
|
|
14117 |
|
|
(define_insn "fxtractxf3_i387"
|
14118 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
14119 |
|
|
(unspec:XF [(match_operand:XF 2 "register_operand" "0")]
|
14120 |
|
|
UNSPEC_XTRACT_FRACT))
|
14121 |
|
|
(set (match_operand:XF 1 "register_operand" "=u")
|
14122 |
|
|
(unspec:XF [(match_dup 2)] UNSPEC_XTRACT_EXP))]
|
14123 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14124 |
|
|
&& flag_unsafe_math_optimizations"
|
14125 |
|
|
"fxtract"
|
14126 |
|
|
[(set_attr "type" "fpspc")
|
14127 |
|
|
(set_attr "mode" "XF")])
|
14128 |
|
|
|
14129 |
|
|
(define_insn "fxtract_extendxf3_i387"
|
14130 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
14131 |
|
|
(unspec:XF [(float_extend:XF
|
14132 |
|
|
(match_operand:MODEF 2 "register_operand" "0"))]
|
14133 |
|
|
UNSPEC_XTRACT_FRACT))
|
14134 |
|
|
(set (match_operand:XF 1 "register_operand" "=u")
|
14135 |
|
|
(unspec:XF [(float_extend:XF (match_dup 2))] UNSPEC_XTRACT_EXP))]
|
14136 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14137 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14138 |
|
|
|| TARGET_MIX_SSE_I387)
|
14139 |
|
|
&& flag_unsafe_math_optimizations"
|
14140 |
|
|
"fxtract"
|
14141 |
|
|
[(set_attr "type" "fpspc")
|
14142 |
|
|
(set_attr "mode" "XF")])
|
14143 |
|
|
|
14144 |
|
|
(define_expand "logbxf2"
|
14145 |
|
|
[(parallel [(set (match_dup 2)
|
14146 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "")]
|
14147 |
|
|
UNSPEC_XTRACT_FRACT))
|
14148 |
|
|
(set (match_operand:XF 0 "register_operand" "")
|
14149 |
|
|
(unspec:XF [(match_dup 1)] UNSPEC_XTRACT_EXP))])]
|
14150 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14151 |
|
|
&& flag_unsafe_math_optimizations"
|
14152 |
|
|
"operands[2] = gen_reg_rtx (XFmode);")
|
14153 |
|
|
|
14154 |
|
|
(define_expand "logb2"
|
14155 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14156 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
14157 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14158 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14159 |
|
|
|| TARGET_MIX_SSE_I387)
|
14160 |
|
|
&& flag_unsafe_math_optimizations"
|
14161 |
|
|
{
|
14162 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
14163 |
|
|
rtx op1 = gen_reg_rtx (XFmode);
|
14164 |
|
|
|
14165 |
|
|
emit_insn (gen_fxtract_extendxf3_i387 (op0, op1, operands[1]));
|
14166 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op1));
|
14167 |
|
|
DONE;
|
14168 |
|
|
})
|
14169 |
|
|
|
14170 |
|
|
(define_expand "ilogbxf2"
|
14171 |
|
|
[(use (match_operand:SI 0 "register_operand" ""))
|
14172 |
|
|
(use (match_operand:XF 1 "register_operand" ""))]
|
14173 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14174 |
|
|
&& flag_unsafe_math_optimizations"
|
14175 |
|
|
{
|
14176 |
|
|
rtx op0, op1;
|
14177 |
|
|
|
14178 |
|
|
if (optimize_insn_for_size_p ())
|
14179 |
|
|
FAIL;
|
14180 |
|
|
|
14181 |
|
|
op0 = gen_reg_rtx (XFmode);
|
14182 |
|
|
op1 = gen_reg_rtx (XFmode);
|
14183 |
|
|
|
14184 |
|
|
emit_insn (gen_fxtractxf3_i387 (op0, op1, operands[1]));
|
14185 |
|
|
emit_insn (gen_fix_truncxfsi2 (operands[0], op1));
|
14186 |
|
|
DONE;
|
14187 |
|
|
})
|
14188 |
|
|
|
14189 |
|
|
(define_expand "ilogb2"
|
14190 |
|
|
[(use (match_operand:SI 0 "register_operand" ""))
|
14191 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
14192 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14193 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14194 |
|
|
|| TARGET_MIX_SSE_I387)
|
14195 |
|
|
&& flag_unsafe_math_optimizations"
|
14196 |
|
|
{
|
14197 |
|
|
rtx op0, op1;
|
14198 |
|
|
|
14199 |
|
|
if (optimize_insn_for_size_p ())
|
14200 |
|
|
FAIL;
|
14201 |
|
|
|
14202 |
|
|
op0 = gen_reg_rtx (XFmode);
|
14203 |
|
|
op1 = gen_reg_rtx (XFmode);
|
14204 |
|
|
|
14205 |
|
|
emit_insn (gen_fxtract_extendxf3_i387 (op0, op1, operands[1]));
|
14206 |
|
|
emit_insn (gen_fix_truncxfsi2 (operands[0], op1));
|
14207 |
|
|
DONE;
|
14208 |
|
|
})
|
14209 |
|
|
|
14210 |
|
|
(define_insn "*f2xm1xf2_i387"
|
14211 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
14212 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "0")]
|
14213 |
|
|
UNSPEC_F2XM1))]
|
14214 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14215 |
|
|
&& flag_unsafe_math_optimizations"
|
14216 |
|
|
"f2xm1"
|
14217 |
|
|
[(set_attr "type" "fpspc")
|
14218 |
|
|
(set_attr "mode" "XF")])
|
14219 |
|
|
|
14220 |
|
|
(define_insn "*fscalexf4_i387"
|
14221 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
14222 |
|
|
(unspec:XF [(match_operand:XF 2 "register_operand" "0")
|
14223 |
|
|
(match_operand:XF 3 "register_operand" "1")]
|
14224 |
|
|
UNSPEC_FSCALE_FRACT))
|
14225 |
|
|
(set (match_operand:XF 1 "register_operand" "=u")
|
14226 |
|
|
(unspec:XF [(match_dup 2) (match_dup 3)]
|
14227 |
|
|
UNSPEC_FSCALE_EXP))]
|
14228 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14229 |
|
|
&& flag_unsafe_math_optimizations"
|
14230 |
|
|
"fscale"
|
14231 |
|
|
[(set_attr "type" "fpspc")
|
14232 |
|
|
(set_attr "mode" "XF")])
|
14233 |
|
|
|
14234 |
|
|
(define_expand "expNcorexf3"
|
14235 |
|
|
[(set (match_dup 3) (mult:XF (match_operand:XF 1 "register_operand" "")
|
14236 |
|
|
(match_operand:XF 2 "register_operand" "")))
|
14237 |
|
|
(set (match_dup 4) (unspec:XF [(match_dup 3)] UNSPEC_FRNDINT))
|
14238 |
|
|
(set (match_dup 5) (minus:XF (match_dup 3) (match_dup 4)))
|
14239 |
|
|
(set (match_dup 6) (unspec:XF [(match_dup 5)] UNSPEC_F2XM1))
|
14240 |
|
|
(set (match_dup 8) (plus:XF (match_dup 6) (match_dup 7)))
|
14241 |
|
|
(parallel [(set (match_operand:XF 0 "register_operand" "")
|
14242 |
|
|
(unspec:XF [(match_dup 8) (match_dup 4)]
|
14243 |
|
|
UNSPEC_FSCALE_FRACT))
|
14244 |
|
|
(set (match_dup 9)
|
14245 |
|
|
(unspec:XF [(match_dup 8) (match_dup 4)]
|
14246 |
|
|
UNSPEC_FSCALE_EXP))])]
|
14247 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14248 |
|
|
&& flag_unsafe_math_optimizations"
|
14249 |
|
|
{
|
14250 |
|
|
int i;
|
14251 |
|
|
|
14252 |
|
|
if (optimize_insn_for_size_p ())
|
14253 |
|
|
FAIL;
|
14254 |
|
|
|
14255 |
|
|
for (i = 3; i < 10; i++)
|
14256 |
|
|
operands[i] = gen_reg_rtx (XFmode);
|
14257 |
|
|
|
14258 |
|
|
emit_move_insn (operands[7], CONST1_RTX (XFmode)); /* fld1 */
|
14259 |
|
|
})
|
14260 |
|
|
|
14261 |
|
|
(define_expand "expxf2"
|
14262 |
|
|
[(use (match_operand:XF 0 "register_operand" ""))
|
14263 |
|
|
(use (match_operand:XF 1 "register_operand" ""))]
|
14264 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14265 |
|
|
&& flag_unsafe_math_optimizations"
|
14266 |
|
|
{
|
14267 |
|
|
rtx op2;
|
14268 |
|
|
|
14269 |
|
|
if (optimize_insn_for_size_p ())
|
14270 |
|
|
FAIL;
|
14271 |
|
|
|
14272 |
|
|
op2 = gen_reg_rtx (XFmode);
|
14273 |
|
|
emit_move_insn (op2, standard_80387_constant_rtx (5)); /* fldl2e */
|
14274 |
|
|
|
14275 |
|
|
emit_insn (gen_expNcorexf3 (operands[0], operands[1], op2));
|
14276 |
|
|
DONE;
|
14277 |
|
|
})
|
14278 |
|
|
|
14279 |
|
|
(define_expand "exp2"
|
14280 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14281 |
|
|
(use (match_operand:MODEF 1 "general_operand" ""))]
|
14282 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14283 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14284 |
|
|
|| TARGET_MIX_SSE_I387)
|
14285 |
|
|
&& flag_unsafe_math_optimizations"
|
14286 |
|
|
{
|
14287 |
|
|
rtx op0, op1;
|
14288 |
|
|
|
14289 |
|
|
if (optimize_insn_for_size_p ())
|
14290 |
|
|
FAIL;
|
14291 |
|
|
|
14292 |
|
|
op0 = gen_reg_rtx (XFmode);
|
14293 |
|
|
op1 = gen_reg_rtx (XFmode);
|
14294 |
|
|
|
14295 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
14296 |
|
|
emit_insn (gen_expxf2 (op0, op1));
|
14297 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
14298 |
|
|
DONE;
|
14299 |
|
|
})
|
14300 |
|
|
|
14301 |
|
|
(define_expand "exp10xf2"
|
14302 |
|
|
[(use (match_operand:XF 0 "register_operand" ""))
|
14303 |
|
|
(use (match_operand:XF 1 "register_operand" ""))]
|
14304 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14305 |
|
|
&& flag_unsafe_math_optimizations"
|
14306 |
|
|
{
|
14307 |
|
|
rtx op2;
|
14308 |
|
|
|
14309 |
|
|
if (optimize_insn_for_size_p ())
|
14310 |
|
|
FAIL;
|
14311 |
|
|
|
14312 |
|
|
op2 = gen_reg_rtx (XFmode);
|
14313 |
|
|
emit_move_insn (op2, standard_80387_constant_rtx (6)); /* fldl2t */
|
14314 |
|
|
|
14315 |
|
|
emit_insn (gen_expNcorexf3 (operands[0], operands[1], op2));
|
14316 |
|
|
DONE;
|
14317 |
|
|
})
|
14318 |
|
|
|
14319 |
|
|
(define_expand "exp102"
|
14320 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14321 |
|
|
(use (match_operand:MODEF 1 "general_operand" ""))]
|
14322 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14323 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14324 |
|
|
|| TARGET_MIX_SSE_I387)
|
14325 |
|
|
&& flag_unsafe_math_optimizations"
|
14326 |
|
|
{
|
14327 |
|
|
rtx op0, op1;
|
14328 |
|
|
|
14329 |
|
|
if (optimize_insn_for_size_p ())
|
14330 |
|
|
FAIL;
|
14331 |
|
|
|
14332 |
|
|
op0 = gen_reg_rtx (XFmode);
|
14333 |
|
|
op1 = gen_reg_rtx (XFmode);
|
14334 |
|
|
|
14335 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
14336 |
|
|
emit_insn (gen_exp10xf2 (op0, op1));
|
14337 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
14338 |
|
|
DONE;
|
14339 |
|
|
})
|
14340 |
|
|
|
14341 |
|
|
(define_expand "exp2xf2"
|
14342 |
|
|
[(use (match_operand:XF 0 "register_operand" ""))
|
14343 |
|
|
(use (match_operand:XF 1 "register_operand" ""))]
|
14344 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14345 |
|
|
&& flag_unsafe_math_optimizations"
|
14346 |
|
|
{
|
14347 |
|
|
rtx op2;
|
14348 |
|
|
|
14349 |
|
|
if (optimize_insn_for_size_p ())
|
14350 |
|
|
FAIL;
|
14351 |
|
|
|
14352 |
|
|
op2 = gen_reg_rtx (XFmode);
|
14353 |
|
|
emit_move_insn (op2, CONST1_RTX (XFmode)); /* fld1 */
|
14354 |
|
|
|
14355 |
|
|
emit_insn (gen_expNcorexf3 (operands[0], operands[1], op2));
|
14356 |
|
|
DONE;
|
14357 |
|
|
})
|
14358 |
|
|
|
14359 |
|
|
(define_expand "exp22"
|
14360 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14361 |
|
|
(use (match_operand:MODEF 1 "general_operand" ""))]
|
14362 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14363 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14364 |
|
|
|| TARGET_MIX_SSE_I387)
|
14365 |
|
|
&& flag_unsafe_math_optimizations"
|
14366 |
|
|
{
|
14367 |
|
|
rtx op0, op1;
|
14368 |
|
|
|
14369 |
|
|
if (optimize_insn_for_size_p ())
|
14370 |
|
|
FAIL;
|
14371 |
|
|
|
14372 |
|
|
op0 = gen_reg_rtx (XFmode);
|
14373 |
|
|
op1 = gen_reg_rtx (XFmode);
|
14374 |
|
|
|
14375 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
14376 |
|
|
emit_insn (gen_exp2xf2 (op0, op1));
|
14377 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
14378 |
|
|
DONE;
|
14379 |
|
|
})
|
14380 |
|
|
|
14381 |
|
|
(define_expand "expm1xf2"
|
14382 |
|
|
[(set (match_dup 3) (mult:XF (match_operand:XF 1 "register_operand" "")
|
14383 |
|
|
(match_dup 2)))
|
14384 |
|
|
(set (match_dup 4) (unspec:XF [(match_dup 3)] UNSPEC_FRNDINT))
|
14385 |
|
|
(set (match_dup 5) (minus:XF (match_dup 3) (match_dup 4)))
|
14386 |
|
|
(set (match_dup 9) (float_extend:XF (match_dup 13)))
|
14387 |
|
|
(set (match_dup 6) (unspec:XF [(match_dup 5)] UNSPEC_F2XM1))
|
14388 |
|
|
(parallel [(set (match_dup 7)
|
14389 |
|
|
(unspec:XF [(match_dup 6) (match_dup 4)]
|
14390 |
|
|
UNSPEC_FSCALE_FRACT))
|
14391 |
|
|
(set (match_dup 8)
|
14392 |
|
|
(unspec:XF [(match_dup 6) (match_dup 4)]
|
14393 |
|
|
UNSPEC_FSCALE_EXP))])
|
14394 |
|
|
(parallel [(set (match_dup 10)
|
14395 |
|
|
(unspec:XF [(match_dup 9) (match_dup 8)]
|
14396 |
|
|
UNSPEC_FSCALE_FRACT))
|
14397 |
|
|
(set (match_dup 11)
|
14398 |
|
|
(unspec:XF [(match_dup 9) (match_dup 8)]
|
14399 |
|
|
UNSPEC_FSCALE_EXP))])
|
14400 |
|
|
(set (match_dup 12) (minus:XF (match_dup 10)
|
14401 |
|
|
(float_extend:XF (match_dup 13))))
|
14402 |
|
|
(set (match_operand:XF 0 "register_operand" "")
|
14403 |
|
|
(plus:XF (match_dup 12) (match_dup 7)))]
|
14404 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14405 |
|
|
&& flag_unsafe_math_optimizations"
|
14406 |
|
|
{
|
14407 |
|
|
int i;
|
14408 |
|
|
|
14409 |
|
|
if (optimize_insn_for_size_p ())
|
14410 |
|
|
FAIL;
|
14411 |
|
|
|
14412 |
|
|
for (i = 2; i < 13; i++)
|
14413 |
|
|
operands[i] = gen_reg_rtx (XFmode);
|
14414 |
|
|
|
14415 |
|
|
operands[13]
|
14416 |
|
|
= validize_mem (force_const_mem (SFmode, CONST1_RTX (SFmode))); /* fld1 */
|
14417 |
|
|
|
14418 |
|
|
emit_move_insn (operands[2], standard_80387_constant_rtx (5)); /* fldl2e */
|
14419 |
|
|
})
|
14420 |
|
|
|
14421 |
|
|
(define_expand "expm12"
|
14422 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14423 |
|
|
(use (match_operand:MODEF 1 "general_operand" ""))]
|
14424 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14425 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14426 |
|
|
|| TARGET_MIX_SSE_I387)
|
14427 |
|
|
&& flag_unsafe_math_optimizations"
|
14428 |
|
|
{
|
14429 |
|
|
rtx op0, op1;
|
14430 |
|
|
|
14431 |
|
|
if (optimize_insn_for_size_p ())
|
14432 |
|
|
FAIL;
|
14433 |
|
|
|
14434 |
|
|
op0 = gen_reg_rtx (XFmode);
|
14435 |
|
|
op1 = gen_reg_rtx (XFmode);
|
14436 |
|
|
|
14437 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
14438 |
|
|
emit_insn (gen_expm1xf2 (op0, op1));
|
14439 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
14440 |
|
|
DONE;
|
14441 |
|
|
})
|
14442 |
|
|
|
14443 |
|
|
(define_expand "ldexpxf3"
|
14444 |
|
|
[(set (match_dup 3)
|
14445 |
|
|
(float:XF (match_operand:SI 2 "register_operand" "")))
|
14446 |
|
|
(parallel [(set (match_operand:XF 0 " register_operand" "")
|
14447 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "")
|
14448 |
|
|
(match_dup 3)]
|
14449 |
|
|
UNSPEC_FSCALE_FRACT))
|
14450 |
|
|
(set (match_dup 4)
|
14451 |
|
|
(unspec:XF [(match_dup 1) (match_dup 3)]
|
14452 |
|
|
UNSPEC_FSCALE_EXP))])]
|
14453 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14454 |
|
|
&& flag_unsafe_math_optimizations"
|
14455 |
|
|
{
|
14456 |
|
|
if (optimize_insn_for_size_p ())
|
14457 |
|
|
FAIL;
|
14458 |
|
|
|
14459 |
|
|
operands[3] = gen_reg_rtx (XFmode);
|
14460 |
|
|
operands[4] = gen_reg_rtx (XFmode);
|
14461 |
|
|
})
|
14462 |
|
|
|
14463 |
|
|
(define_expand "ldexp3"
|
14464 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14465 |
|
|
(use (match_operand:MODEF 1 "general_operand" ""))
|
14466 |
|
|
(use (match_operand:SI 2 "register_operand" ""))]
|
14467 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14468 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14469 |
|
|
|| TARGET_MIX_SSE_I387)
|
14470 |
|
|
&& flag_unsafe_math_optimizations"
|
14471 |
|
|
{
|
14472 |
|
|
rtx op0, op1;
|
14473 |
|
|
|
14474 |
|
|
if (optimize_insn_for_size_p ())
|
14475 |
|
|
FAIL;
|
14476 |
|
|
|
14477 |
|
|
op0 = gen_reg_rtx (XFmode);
|
14478 |
|
|
op1 = gen_reg_rtx (XFmode);
|
14479 |
|
|
|
14480 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
14481 |
|
|
emit_insn (gen_ldexpxf3 (op0, op1, operands[2]));
|
14482 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
14483 |
|
|
DONE;
|
14484 |
|
|
})
|
14485 |
|
|
|
14486 |
|
|
(define_expand "scalbxf3"
|
14487 |
|
|
[(parallel [(set (match_operand:XF 0 " register_operand" "")
|
14488 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "")
|
14489 |
|
|
(match_operand:XF 2 "register_operand" "")]
|
14490 |
|
|
UNSPEC_FSCALE_FRACT))
|
14491 |
|
|
(set (match_dup 3)
|
14492 |
|
|
(unspec:XF [(match_dup 1) (match_dup 2)]
|
14493 |
|
|
UNSPEC_FSCALE_EXP))])]
|
14494 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14495 |
|
|
&& flag_unsafe_math_optimizations"
|
14496 |
|
|
{
|
14497 |
|
|
if (optimize_insn_for_size_p ())
|
14498 |
|
|
FAIL;
|
14499 |
|
|
|
14500 |
|
|
operands[3] = gen_reg_rtx (XFmode);
|
14501 |
|
|
})
|
14502 |
|
|
|
14503 |
|
|
(define_expand "scalb3"
|
14504 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14505 |
|
|
(use (match_operand:MODEF 1 "general_operand" ""))
|
14506 |
|
|
(use (match_operand:MODEF 2 "general_operand" ""))]
|
14507 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14508 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14509 |
|
|
|| TARGET_MIX_SSE_I387)
|
14510 |
|
|
&& flag_unsafe_math_optimizations"
|
14511 |
|
|
{
|
14512 |
|
|
rtx op0, op1, op2;
|
14513 |
|
|
|
14514 |
|
|
if (optimize_insn_for_size_p ())
|
14515 |
|
|
FAIL;
|
14516 |
|
|
|
14517 |
|
|
op0 = gen_reg_rtx (XFmode);
|
14518 |
|
|
op1 = gen_reg_rtx (XFmode);
|
14519 |
|
|
op2 = gen_reg_rtx (XFmode);
|
14520 |
|
|
|
14521 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
14522 |
|
|
emit_insn (gen_extendxf2 (op2, operands[2]));
|
14523 |
|
|
emit_insn (gen_scalbxf3 (op0, op1, op2));
|
14524 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
14525 |
|
|
DONE;
|
14526 |
|
|
})
|
14527 |
|
|
|
14528 |
|
|
(define_expand "significandxf2"
|
14529 |
|
|
[(parallel [(set (match_operand:XF 0 "register_operand" "")
|
14530 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "")]
|
14531 |
|
|
UNSPEC_XTRACT_FRACT))
|
14532 |
|
|
(set (match_dup 2)
|
14533 |
|
|
(unspec:XF [(match_dup 1)] UNSPEC_XTRACT_EXP))])]
|
14534 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14535 |
|
|
&& flag_unsafe_math_optimizations"
|
14536 |
|
|
"operands[2] = gen_reg_rtx (XFmode);")
|
14537 |
|
|
|
14538 |
|
|
(define_expand "significand2"
|
14539 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14540 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
14541 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14542 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14543 |
|
|
|| TARGET_MIX_SSE_I387)
|
14544 |
|
|
&& flag_unsafe_math_optimizations"
|
14545 |
|
|
{
|
14546 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
14547 |
|
|
rtx op1 = gen_reg_rtx (XFmode);
|
14548 |
|
|
|
14549 |
|
|
emit_insn (gen_fxtract_extendxf3_i387 (op0, op1, operands[1]));
|
14550 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
14551 |
|
|
DONE;
|
14552 |
|
|
})
|
14553 |
|
|
|
14554 |
|
|
|
14555 |
|
|
(define_insn "sse4_1_round2"
|
14556 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x")
|
14557 |
|
|
(unspec:MODEF [(match_operand:MODEF 1 "register_operand" "x")
|
14558 |
|
|
(match_operand:SI 2 "const_0_to_15_operand" "n")]
|
14559 |
|
|
UNSPEC_ROUND))]
|
14560 |
|
|
"TARGET_ROUND"
|
14561 |
|
|
"%vround\t{%2, %1, %d0|%d0, %1, %2}"
|
14562 |
|
|
[(set_attr "type" "ssecvt")
|
14563 |
|
|
(set_attr "prefix_extra" "1")
|
14564 |
|
|
(set_attr "prefix" "maybe_vex")
|
14565 |
|
|
(set_attr "mode" "")])
|
14566 |
|
|
|
14567 |
|
|
(define_insn "rintxf2"
|
14568 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
14569 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "0")]
|
14570 |
|
|
UNSPEC_FRNDINT))]
|
14571 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14572 |
|
|
&& flag_unsafe_math_optimizations"
|
14573 |
|
|
"frndint"
|
14574 |
|
|
[(set_attr "type" "fpspc")
|
14575 |
|
|
(set_attr "mode" "XF")])
|
14576 |
|
|
|
14577 |
|
|
(define_expand "rint2"
|
14578 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14579 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
14580 |
|
|
"(TARGET_USE_FANCY_MATH_387
|
14581 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14582 |
|
|
|| TARGET_MIX_SSE_I387)
|
14583 |
|
|
&& flag_unsafe_math_optimizations)
|
14584 |
|
|
|| (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
14585 |
|
|
&& !flag_trapping_math)"
|
14586 |
|
|
{
|
14587 |
|
|
if (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
14588 |
|
|
&& !flag_trapping_math)
|
14589 |
|
|
{
|
14590 |
|
|
if (TARGET_ROUND)
|
14591 |
|
|
emit_insn (gen_sse4_1_round2
|
14592 |
|
|
(operands[0], operands[1], GEN_INT (ROUND_MXCSR)));
|
14593 |
|
|
else if (optimize_insn_for_size_p ())
|
14594 |
|
|
FAIL;
|
14595 |
|
|
else
|
14596 |
|
|
ix86_expand_rint (operands[0], operands[1]);
|
14597 |
|
|
}
|
14598 |
|
|
else
|
14599 |
|
|
{
|
14600 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
14601 |
|
|
rtx op1 = gen_reg_rtx (XFmode);
|
14602 |
|
|
|
14603 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
14604 |
|
|
emit_insn (gen_rintxf2 (op0, op1));
|
14605 |
|
|
|
14606 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
14607 |
|
|
}
|
14608 |
|
|
DONE;
|
14609 |
|
|
})
|
14610 |
|
|
|
14611 |
|
|
(define_expand "round2"
|
14612 |
|
|
[(match_operand:X87MODEF 0 "register_operand" "")
|
14613 |
|
|
(match_operand:X87MODEF 1 "nonimmediate_operand" "")]
|
14614 |
|
|
"(TARGET_USE_FANCY_MATH_387
|
14615 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14616 |
|
|
|| TARGET_MIX_SSE_I387)
|
14617 |
|
|
&& flag_unsafe_math_optimizations)
|
14618 |
|
|
|| (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
14619 |
|
|
&& !flag_trapping_math && !flag_rounding_math)"
|
14620 |
|
|
{
|
14621 |
|
|
if (optimize_insn_for_size_p ())
|
14622 |
|
|
FAIL;
|
14623 |
|
|
|
14624 |
|
|
if (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
14625 |
|
|
&& !flag_trapping_math && !flag_rounding_math)
|
14626 |
|
|
{
|
14627 |
|
|
if (TARGET_ROUND)
|
14628 |
|
|
{
|
14629 |
|
|
operands[1] = force_reg (mode, operands[1]);
|
14630 |
|
|
ix86_expand_round_sse4 (operands[0], operands[1]);
|
14631 |
|
|
}
|
14632 |
|
|
else if (TARGET_64BIT || (mode != DFmode))
|
14633 |
|
|
ix86_expand_round (operands[0], operands[1]);
|
14634 |
|
|
else
|
14635 |
|
|
ix86_expand_rounddf_32 (operands[0], operands[1]);
|
14636 |
|
|
}
|
14637 |
|
|
else
|
14638 |
|
|
{
|
14639 |
|
|
operands[1] = force_reg (mode, operands[1]);
|
14640 |
|
|
ix86_emit_i387_round (operands[0], operands[1]);
|
14641 |
|
|
}
|
14642 |
|
|
DONE;
|
14643 |
|
|
})
|
14644 |
|
|
|
14645 |
|
|
(define_insn_and_split "*fistdi2_1"
|
14646 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "")
|
14647 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "")]
|
14648 |
|
|
UNSPEC_FIST))]
|
14649 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14650 |
|
|
&& can_create_pseudo_p ()"
|
14651 |
|
|
"#"
|
14652 |
|
|
"&& 1"
|
14653 |
|
|
[(const_int 0)]
|
14654 |
|
|
{
|
14655 |
|
|
if (memory_operand (operands[0], VOIDmode))
|
14656 |
|
|
emit_insn (gen_fistdi2 (operands[0], operands[1]));
|
14657 |
|
|
else
|
14658 |
|
|
{
|
14659 |
|
|
operands[2] = assign_386_stack_local (DImode, SLOT_TEMP);
|
14660 |
|
|
emit_insn (gen_fistdi2_with_temp (operands[0], operands[1],
|
14661 |
|
|
operands[2]));
|
14662 |
|
|
}
|
14663 |
|
|
DONE;
|
14664 |
|
|
}
|
14665 |
|
|
[(set_attr "type" "fpspc")
|
14666 |
|
|
(set_attr "mode" "DI")])
|
14667 |
|
|
|
14668 |
|
|
(define_insn "fistdi2"
|
14669 |
|
|
[(set (match_operand:DI 0 "memory_operand" "=m")
|
14670 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "f")]
|
14671 |
|
|
UNSPEC_FIST))
|
14672 |
|
|
(clobber (match_scratch:XF 2 "=&1f"))]
|
14673 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
14674 |
|
|
"* return output_fix_trunc (insn, operands, false);"
|
14675 |
|
|
[(set_attr "type" "fpspc")
|
14676 |
|
|
(set_attr "mode" "DI")])
|
14677 |
|
|
|
14678 |
|
|
(define_insn "fistdi2_with_temp"
|
14679 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "=m,?r")
|
14680 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "f,f")]
|
14681 |
|
|
UNSPEC_FIST))
|
14682 |
|
|
(clobber (match_operand:DI 2 "memory_operand" "=X,m"))
|
14683 |
|
|
(clobber (match_scratch:XF 3 "=&1f,&1f"))]
|
14684 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
14685 |
|
|
"#"
|
14686 |
|
|
[(set_attr "type" "fpspc")
|
14687 |
|
|
(set_attr "mode" "DI")])
|
14688 |
|
|
|
14689 |
|
|
(define_split
|
14690 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
14691 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "")]
|
14692 |
|
|
UNSPEC_FIST))
|
14693 |
|
|
(clobber (match_operand:DI 2 "memory_operand" ""))
|
14694 |
|
|
(clobber (match_scratch 3 ""))]
|
14695 |
|
|
"reload_completed"
|
14696 |
|
|
[(parallel [(set (match_dup 2) (unspec:DI [(match_dup 1)] UNSPEC_FIST))
|
14697 |
|
|
(clobber (match_dup 3))])
|
14698 |
|
|
(set (match_dup 0) (match_dup 2))])
|
14699 |
|
|
|
14700 |
|
|
(define_split
|
14701 |
|
|
[(set (match_operand:DI 0 "memory_operand" "")
|
14702 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "")]
|
14703 |
|
|
UNSPEC_FIST))
|
14704 |
|
|
(clobber (match_operand:DI 2 "memory_operand" ""))
|
14705 |
|
|
(clobber (match_scratch 3 ""))]
|
14706 |
|
|
"reload_completed"
|
14707 |
|
|
[(parallel [(set (match_dup 0) (unspec:DI [(match_dup 1)] UNSPEC_FIST))
|
14708 |
|
|
(clobber (match_dup 3))])])
|
14709 |
|
|
|
14710 |
|
|
(define_insn_and_split "*fist2_1"
|
14711 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "")
|
14712 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "")]
|
14713 |
|
|
UNSPEC_FIST))]
|
14714 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14715 |
|
|
&& can_create_pseudo_p ()"
|
14716 |
|
|
"#"
|
14717 |
|
|
"&& 1"
|
14718 |
|
|
[(const_int 0)]
|
14719 |
|
|
{
|
14720 |
|
|
operands[2] = assign_386_stack_local (mode, SLOT_TEMP);
|
14721 |
|
|
emit_insn (gen_fist2_with_temp (operands[0], operands[1],
|
14722 |
|
|
operands[2]));
|
14723 |
|
|
DONE;
|
14724 |
|
|
}
|
14725 |
|
|
[(set_attr "type" "fpspc")
|
14726 |
|
|
(set_attr "mode" "")])
|
14727 |
|
|
|
14728 |
|
|
(define_insn "fist2"
|
14729 |
|
|
[(set (match_operand:SWI24 0 "memory_operand" "=m")
|
14730 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "f")]
|
14731 |
|
|
UNSPEC_FIST))]
|
14732 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
14733 |
|
|
"* return output_fix_trunc (insn, operands, false);"
|
14734 |
|
|
[(set_attr "type" "fpspc")
|
14735 |
|
|
(set_attr "mode" "")])
|
14736 |
|
|
|
14737 |
|
|
(define_insn "fist2_with_temp"
|
14738 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "=r")
|
14739 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "f")]
|
14740 |
|
|
UNSPEC_FIST))
|
14741 |
|
|
(clobber (match_operand:SWI24 2 "memory_operand" "=m"))]
|
14742 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
14743 |
|
|
"#"
|
14744 |
|
|
[(set_attr "type" "fpspc")
|
14745 |
|
|
(set_attr "mode" "")])
|
14746 |
|
|
|
14747 |
|
|
(define_split
|
14748 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "")
|
14749 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "")]
|
14750 |
|
|
UNSPEC_FIST))
|
14751 |
|
|
(clobber (match_operand:SWI24 2 "memory_operand" ""))]
|
14752 |
|
|
"reload_completed"
|
14753 |
|
|
[(set (match_dup 2) (unspec:SWI24 [(match_dup 1)] UNSPEC_FIST))
|
14754 |
|
|
(set (match_dup 0) (match_dup 2))])
|
14755 |
|
|
|
14756 |
|
|
(define_split
|
14757 |
|
|
[(set (match_operand:SWI24 0 "memory_operand" "")
|
14758 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "")]
|
14759 |
|
|
UNSPEC_FIST))
|
14760 |
|
|
(clobber (match_operand:SWI24 2 "memory_operand" ""))]
|
14761 |
|
|
"reload_completed"
|
14762 |
|
|
[(set (match_dup 0) (unspec:SWI24 [(match_dup 1)] UNSPEC_FIST))])
|
14763 |
|
|
|
14764 |
|
|
(define_expand "lrintxf2"
|
14765 |
|
|
[(set (match_operand:SWI248x 0 "nonimmediate_operand" "")
|
14766 |
|
|
(unspec:SWI248x [(match_operand:XF 1 "register_operand" "")]
|
14767 |
|
|
UNSPEC_FIST))]
|
14768 |
|
|
"TARGET_USE_FANCY_MATH_387")
|
14769 |
|
|
|
14770 |
|
|
(define_expand "lrint2"
|
14771 |
|
|
[(set (match_operand:SWI48x 0 "nonimmediate_operand" "")
|
14772 |
|
|
(unspec:SWI48x [(match_operand:MODEF 1 "register_operand" "")]
|
14773 |
|
|
UNSPEC_FIX_NOTRUNC))]
|
14774 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
14775 |
|
|
&& ((mode != DImode) || TARGET_64BIT)")
|
14776 |
|
|
|
14777 |
|
|
(define_expand "lround2"
|
14778 |
|
|
[(match_operand:SWI248x 0 "nonimmediate_operand" "")
|
14779 |
|
|
(match_operand:X87MODEF 1 "register_operand" "")]
|
14780 |
|
|
"(TARGET_USE_FANCY_MATH_387
|
14781 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14782 |
|
|
|| TARGET_MIX_SSE_I387)
|
14783 |
|
|
&& flag_unsafe_math_optimizations)
|
14784 |
|
|
|| (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
14785 |
|
|
&& mode != HImode
|
14786 |
|
|
&& ((mode != DImode) || TARGET_64BIT)
|
14787 |
|
|
&& !flag_trapping_math && !flag_rounding_math)"
|
14788 |
|
|
{
|
14789 |
|
|
if (optimize_insn_for_size_p ())
|
14790 |
|
|
FAIL;
|
14791 |
|
|
|
14792 |
|
|
if (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
14793 |
|
|
&& mode != HImode
|
14794 |
|
|
&& ((mode != DImode) || TARGET_64BIT)
|
14795 |
|
|
&& !flag_trapping_math && !flag_rounding_math)
|
14796 |
|
|
ix86_expand_lround (operands[0], operands[1]);
|
14797 |
|
|
else
|
14798 |
|
|
ix86_emit_i387_round (operands[0], operands[1]);
|
14799 |
|
|
DONE;
|
14800 |
|
|
})
|
14801 |
|
|
|
14802 |
|
|
;; Rounding mode control word calculation could clobber FLAGS_REG.
|
14803 |
|
|
(define_insn_and_split "frndintxf2_floor"
|
14804 |
|
|
[(set (match_operand:XF 0 "register_operand" "")
|
14805 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "")]
|
14806 |
|
|
UNSPEC_FRNDINT_FLOOR))
|
14807 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
14808 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14809 |
|
|
&& flag_unsafe_math_optimizations
|
14810 |
|
|
&& can_create_pseudo_p ()"
|
14811 |
|
|
"#"
|
14812 |
|
|
"&& 1"
|
14813 |
|
|
[(const_int 0)]
|
14814 |
|
|
{
|
14815 |
|
|
ix86_optimize_mode_switching[I387_FLOOR] = 1;
|
14816 |
|
|
|
14817 |
|
|
operands[2] = assign_386_stack_local (HImode, SLOT_CW_STORED);
|
14818 |
|
|
operands[3] = assign_386_stack_local (HImode, SLOT_CW_FLOOR);
|
14819 |
|
|
|
14820 |
|
|
emit_insn (gen_frndintxf2_floor_i387 (operands[0], operands[1],
|
14821 |
|
|
operands[2], operands[3]));
|
14822 |
|
|
DONE;
|
14823 |
|
|
}
|
14824 |
|
|
[(set_attr "type" "frndint")
|
14825 |
|
|
(set_attr "i387_cw" "floor")
|
14826 |
|
|
(set_attr "mode" "XF")])
|
14827 |
|
|
|
14828 |
|
|
(define_insn "frndintxf2_floor_i387"
|
14829 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
14830 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "0")]
|
14831 |
|
|
UNSPEC_FRNDINT_FLOOR))
|
14832 |
|
|
(use (match_operand:HI 2 "memory_operand" "m"))
|
14833 |
|
|
(use (match_operand:HI 3 "memory_operand" "m"))]
|
14834 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14835 |
|
|
&& flag_unsafe_math_optimizations"
|
14836 |
|
|
"fldcw\t%3\n\tfrndint\n\tfldcw\t%2"
|
14837 |
|
|
[(set_attr "type" "frndint")
|
14838 |
|
|
(set_attr "i387_cw" "floor")
|
14839 |
|
|
(set_attr "mode" "XF")])
|
14840 |
|
|
|
14841 |
|
|
(define_expand "floorxf2"
|
14842 |
|
|
[(use (match_operand:XF 0 "register_operand" ""))
|
14843 |
|
|
(use (match_operand:XF 1 "register_operand" ""))]
|
14844 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14845 |
|
|
&& flag_unsafe_math_optimizations"
|
14846 |
|
|
{
|
14847 |
|
|
if (optimize_insn_for_size_p ())
|
14848 |
|
|
FAIL;
|
14849 |
|
|
emit_insn (gen_frndintxf2_floor (operands[0], operands[1]));
|
14850 |
|
|
DONE;
|
14851 |
|
|
})
|
14852 |
|
|
|
14853 |
|
|
(define_expand "floor2"
|
14854 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
14855 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
14856 |
|
|
"(TARGET_USE_FANCY_MATH_387
|
14857 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
14858 |
|
|
|| TARGET_MIX_SSE_I387)
|
14859 |
|
|
&& flag_unsafe_math_optimizations)
|
14860 |
|
|
|| (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
14861 |
|
|
&& !flag_trapping_math)"
|
14862 |
|
|
{
|
14863 |
|
|
if (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
14864 |
|
|
&& !flag_trapping_math)
|
14865 |
|
|
{
|
14866 |
|
|
if (TARGET_ROUND)
|
14867 |
|
|
emit_insn (gen_sse4_1_round2
|
14868 |
|
|
(operands[0], operands[1], GEN_INT (ROUND_FLOOR)));
|
14869 |
|
|
else if (optimize_insn_for_size_p ())
|
14870 |
|
|
FAIL;
|
14871 |
|
|
else if (TARGET_64BIT || (mode != DFmode))
|
14872 |
|
|
ix86_expand_floorceil (operands[0], operands[1], true);
|
14873 |
|
|
else
|
14874 |
|
|
ix86_expand_floorceildf_32 (operands[0], operands[1], true);
|
14875 |
|
|
}
|
14876 |
|
|
else
|
14877 |
|
|
{
|
14878 |
|
|
rtx op0, op1;
|
14879 |
|
|
|
14880 |
|
|
if (optimize_insn_for_size_p ())
|
14881 |
|
|
FAIL;
|
14882 |
|
|
|
14883 |
|
|
op0 = gen_reg_rtx (XFmode);
|
14884 |
|
|
op1 = gen_reg_rtx (XFmode);
|
14885 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
14886 |
|
|
emit_insn (gen_frndintxf2_floor (op0, op1));
|
14887 |
|
|
|
14888 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
14889 |
|
|
}
|
14890 |
|
|
DONE;
|
14891 |
|
|
})
|
14892 |
|
|
|
14893 |
|
|
(define_insn_and_split "*fist2_floor_1"
|
14894 |
|
|
[(set (match_operand:SWI248x 0 "nonimmediate_operand" "")
|
14895 |
|
|
(unspec:SWI248x [(match_operand:XF 1 "register_operand" "")]
|
14896 |
|
|
UNSPEC_FIST_FLOOR))
|
14897 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
14898 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14899 |
|
|
&& flag_unsafe_math_optimizations
|
14900 |
|
|
&& can_create_pseudo_p ()"
|
14901 |
|
|
"#"
|
14902 |
|
|
"&& 1"
|
14903 |
|
|
[(const_int 0)]
|
14904 |
|
|
{
|
14905 |
|
|
ix86_optimize_mode_switching[I387_FLOOR] = 1;
|
14906 |
|
|
|
14907 |
|
|
operands[2] = assign_386_stack_local (HImode, SLOT_CW_STORED);
|
14908 |
|
|
operands[3] = assign_386_stack_local (HImode, SLOT_CW_FLOOR);
|
14909 |
|
|
if (memory_operand (operands[0], VOIDmode))
|
14910 |
|
|
emit_insn (gen_fist2_floor (operands[0], operands[1],
|
14911 |
|
|
operands[2], operands[3]));
|
14912 |
|
|
else
|
14913 |
|
|
{
|
14914 |
|
|
operands[4] = assign_386_stack_local (mode, SLOT_TEMP);
|
14915 |
|
|
emit_insn (gen_fist2_floor_with_temp (operands[0], operands[1],
|
14916 |
|
|
operands[2], operands[3],
|
14917 |
|
|
operands[4]));
|
14918 |
|
|
}
|
14919 |
|
|
DONE;
|
14920 |
|
|
}
|
14921 |
|
|
[(set_attr "type" "fistp")
|
14922 |
|
|
(set_attr "i387_cw" "floor")
|
14923 |
|
|
(set_attr "mode" "")])
|
14924 |
|
|
|
14925 |
|
|
(define_insn "fistdi2_floor"
|
14926 |
|
|
[(set (match_operand:DI 0 "memory_operand" "=m")
|
14927 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "f")]
|
14928 |
|
|
UNSPEC_FIST_FLOOR))
|
14929 |
|
|
(use (match_operand:HI 2 "memory_operand" "m"))
|
14930 |
|
|
(use (match_operand:HI 3 "memory_operand" "m"))
|
14931 |
|
|
(clobber (match_scratch:XF 4 "=&1f"))]
|
14932 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14933 |
|
|
&& flag_unsafe_math_optimizations"
|
14934 |
|
|
"* return output_fix_trunc (insn, operands, false);"
|
14935 |
|
|
[(set_attr "type" "fistp")
|
14936 |
|
|
(set_attr "i387_cw" "floor")
|
14937 |
|
|
(set_attr "mode" "DI")])
|
14938 |
|
|
|
14939 |
|
|
(define_insn "fistdi2_floor_with_temp"
|
14940 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "=m,?r")
|
14941 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "f,f")]
|
14942 |
|
|
UNSPEC_FIST_FLOOR))
|
14943 |
|
|
(use (match_operand:HI 2 "memory_operand" "m,m"))
|
14944 |
|
|
(use (match_operand:HI 3 "memory_operand" "m,m"))
|
14945 |
|
|
(clobber (match_operand:DI 4 "memory_operand" "=X,m"))
|
14946 |
|
|
(clobber (match_scratch:XF 5 "=&1f,&1f"))]
|
14947 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14948 |
|
|
&& flag_unsafe_math_optimizations"
|
14949 |
|
|
"#"
|
14950 |
|
|
[(set_attr "type" "fistp")
|
14951 |
|
|
(set_attr "i387_cw" "floor")
|
14952 |
|
|
(set_attr "mode" "DI")])
|
14953 |
|
|
|
14954 |
|
|
(define_split
|
14955 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
14956 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "")]
|
14957 |
|
|
UNSPEC_FIST_FLOOR))
|
14958 |
|
|
(use (match_operand:HI 2 "memory_operand" ""))
|
14959 |
|
|
(use (match_operand:HI 3 "memory_operand" ""))
|
14960 |
|
|
(clobber (match_operand:DI 4 "memory_operand" ""))
|
14961 |
|
|
(clobber (match_scratch 5 ""))]
|
14962 |
|
|
"reload_completed"
|
14963 |
|
|
[(parallel [(set (match_dup 4)
|
14964 |
|
|
(unspec:DI [(match_dup 1)] UNSPEC_FIST_FLOOR))
|
14965 |
|
|
(use (match_dup 2))
|
14966 |
|
|
(use (match_dup 3))
|
14967 |
|
|
(clobber (match_dup 5))])
|
14968 |
|
|
(set (match_dup 0) (match_dup 4))])
|
14969 |
|
|
|
14970 |
|
|
(define_split
|
14971 |
|
|
[(set (match_operand:DI 0 "memory_operand" "")
|
14972 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "")]
|
14973 |
|
|
UNSPEC_FIST_FLOOR))
|
14974 |
|
|
(use (match_operand:HI 2 "memory_operand" ""))
|
14975 |
|
|
(use (match_operand:HI 3 "memory_operand" ""))
|
14976 |
|
|
(clobber (match_operand:DI 4 "memory_operand" ""))
|
14977 |
|
|
(clobber (match_scratch 5 ""))]
|
14978 |
|
|
"reload_completed"
|
14979 |
|
|
[(parallel [(set (match_dup 0)
|
14980 |
|
|
(unspec:DI [(match_dup 1)] UNSPEC_FIST_FLOOR))
|
14981 |
|
|
(use (match_dup 2))
|
14982 |
|
|
(use (match_dup 3))
|
14983 |
|
|
(clobber (match_dup 5))])])
|
14984 |
|
|
|
14985 |
|
|
(define_insn "fist2_floor"
|
14986 |
|
|
[(set (match_operand:SWI24 0 "memory_operand" "=m")
|
14987 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "f")]
|
14988 |
|
|
UNSPEC_FIST_FLOOR))
|
14989 |
|
|
(use (match_operand:HI 2 "memory_operand" "m"))
|
14990 |
|
|
(use (match_operand:HI 3 "memory_operand" "m"))]
|
14991 |
|
|
"TARGET_USE_FANCY_MATH_387
|
14992 |
|
|
&& flag_unsafe_math_optimizations"
|
14993 |
|
|
"* return output_fix_trunc (insn, operands, false);"
|
14994 |
|
|
[(set_attr "type" "fistp")
|
14995 |
|
|
(set_attr "i387_cw" "floor")
|
14996 |
|
|
(set_attr "mode" "")])
|
14997 |
|
|
|
14998 |
|
|
(define_insn "fist2_floor_with_temp"
|
14999 |
|
|
[(set (match_operand:SWI24 0 "nonimmediate_operand" "=m,?r")
|
15000 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "f,f")]
|
15001 |
|
|
UNSPEC_FIST_FLOOR))
|
15002 |
|
|
(use (match_operand:HI 2 "memory_operand" "m,m"))
|
15003 |
|
|
(use (match_operand:HI 3 "memory_operand" "m,m"))
|
15004 |
|
|
(clobber (match_operand:SWI24 4 "memory_operand" "=X,m"))]
|
15005 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15006 |
|
|
&& flag_unsafe_math_optimizations"
|
15007 |
|
|
"#"
|
15008 |
|
|
[(set_attr "type" "fistp")
|
15009 |
|
|
(set_attr "i387_cw" "floor")
|
15010 |
|
|
(set_attr "mode" "")])
|
15011 |
|
|
|
15012 |
|
|
(define_split
|
15013 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "")
|
15014 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "")]
|
15015 |
|
|
UNSPEC_FIST_FLOOR))
|
15016 |
|
|
(use (match_operand:HI 2 "memory_operand" ""))
|
15017 |
|
|
(use (match_operand:HI 3 "memory_operand" ""))
|
15018 |
|
|
(clobber (match_operand:SWI24 4 "memory_operand" ""))]
|
15019 |
|
|
"reload_completed"
|
15020 |
|
|
[(parallel [(set (match_dup 4)
|
15021 |
|
|
(unspec:SWI24 [(match_dup 1)] UNSPEC_FIST_FLOOR))
|
15022 |
|
|
(use (match_dup 2))
|
15023 |
|
|
(use (match_dup 3))])
|
15024 |
|
|
(set (match_dup 0) (match_dup 4))])
|
15025 |
|
|
|
15026 |
|
|
(define_split
|
15027 |
|
|
[(set (match_operand:SWI24 0 "memory_operand" "")
|
15028 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "")]
|
15029 |
|
|
UNSPEC_FIST_FLOOR))
|
15030 |
|
|
(use (match_operand:HI 2 "memory_operand" ""))
|
15031 |
|
|
(use (match_operand:HI 3 "memory_operand" ""))
|
15032 |
|
|
(clobber (match_operand:SWI24 4 "memory_operand" ""))]
|
15033 |
|
|
"reload_completed"
|
15034 |
|
|
[(parallel [(set (match_dup 0)
|
15035 |
|
|
(unspec:SWI24 [(match_dup 1)] UNSPEC_FIST_FLOOR))
|
15036 |
|
|
(use (match_dup 2))
|
15037 |
|
|
(use (match_dup 3))])])
|
15038 |
|
|
|
15039 |
|
|
(define_expand "lfloorxf2"
|
15040 |
|
|
[(parallel [(set (match_operand:SWI248x 0 "nonimmediate_operand" "")
|
15041 |
|
|
(unspec:SWI248x [(match_operand:XF 1 "register_operand" "")]
|
15042 |
|
|
UNSPEC_FIST_FLOOR))
|
15043 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
15044 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15045 |
|
|
&& (!TARGET_SSE_MATH || TARGET_MIX_SSE_I387)
|
15046 |
|
|
&& flag_unsafe_math_optimizations")
|
15047 |
|
|
|
15048 |
|
|
(define_expand "lfloor2"
|
15049 |
|
|
[(match_operand:SWI48 0 "nonimmediate_operand" "")
|
15050 |
|
|
(match_operand:MODEF 1 "register_operand" "")]
|
15051 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
15052 |
|
|
&& !flag_trapping_math"
|
15053 |
|
|
{
|
15054 |
|
|
if (TARGET_64BIT && optimize_insn_for_size_p ())
|
15055 |
|
|
FAIL;
|
15056 |
|
|
ix86_expand_lfloorceil (operands[0], operands[1], true);
|
15057 |
|
|
DONE;
|
15058 |
|
|
})
|
15059 |
|
|
|
15060 |
|
|
;; Rounding mode control word calculation could clobber FLAGS_REG.
|
15061 |
|
|
(define_insn_and_split "frndintxf2_ceil"
|
15062 |
|
|
[(set (match_operand:XF 0 "register_operand" "")
|
15063 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "")]
|
15064 |
|
|
UNSPEC_FRNDINT_CEIL))
|
15065 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
15066 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15067 |
|
|
&& flag_unsafe_math_optimizations
|
15068 |
|
|
&& can_create_pseudo_p ()"
|
15069 |
|
|
"#"
|
15070 |
|
|
"&& 1"
|
15071 |
|
|
[(const_int 0)]
|
15072 |
|
|
{
|
15073 |
|
|
ix86_optimize_mode_switching[I387_CEIL] = 1;
|
15074 |
|
|
|
15075 |
|
|
operands[2] = assign_386_stack_local (HImode, SLOT_CW_STORED);
|
15076 |
|
|
operands[3] = assign_386_stack_local (HImode, SLOT_CW_CEIL);
|
15077 |
|
|
|
15078 |
|
|
emit_insn (gen_frndintxf2_ceil_i387 (operands[0], operands[1],
|
15079 |
|
|
operands[2], operands[3]));
|
15080 |
|
|
DONE;
|
15081 |
|
|
}
|
15082 |
|
|
[(set_attr "type" "frndint")
|
15083 |
|
|
(set_attr "i387_cw" "ceil")
|
15084 |
|
|
(set_attr "mode" "XF")])
|
15085 |
|
|
|
15086 |
|
|
(define_insn "frndintxf2_ceil_i387"
|
15087 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
15088 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "0")]
|
15089 |
|
|
UNSPEC_FRNDINT_CEIL))
|
15090 |
|
|
(use (match_operand:HI 2 "memory_operand" "m"))
|
15091 |
|
|
(use (match_operand:HI 3 "memory_operand" "m"))]
|
15092 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15093 |
|
|
&& flag_unsafe_math_optimizations"
|
15094 |
|
|
"fldcw\t%3\n\tfrndint\n\tfldcw\t%2"
|
15095 |
|
|
[(set_attr "type" "frndint")
|
15096 |
|
|
(set_attr "i387_cw" "ceil")
|
15097 |
|
|
(set_attr "mode" "XF")])
|
15098 |
|
|
|
15099 |
|
|
(define_expand "ceilxf2"
|
15100 |
|
|
[(use (match_operand:XF 0 "register_operand" ""))
|
15101 |
|
|
(use (match_operand:XF 1 "register_operand" ""))]
|
15102 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15103 |
|
|
&& flag_unsafe_math_optimizations"
|
15104 |
|
|
{
|
15105 |
|
|
if (optimize_insn_for_size_p ())
|
15106 |
|
|
FAIL;
|
15107 |
|
|
emit_insn (gen_frndintxf2_ceil (operands[0], operands[1]));
|
15108 |
|
|
DONE;
|
15109 |
|
|
})
|
15110 |
|
|
|
15111 |
|
|
(define_expand "ceil2"
|
15112 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
15113 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
15114 |
|
|
"(TARGET_USE_FANCY_MATH_387
|
15115 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
15116 |
|
|
|| TARGET_MIX_SSE_I387)
|
15117 |
|
|
&& flag_unsafe_math_optimizations)
|
15118 |
|
|
|| (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
15119 |
|
|
&& !flag_trapping_math)"
|
15120 |
|
|
{
|
15121 |
|
|
if (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
15122 |
|
|
&& !flag_trapping_math)
|
15123 |
|
|
{
|
15124 |
|
|
if (TARGET_ROUND)
|
15125 |
|
|
emit_insn (gen_sse4_1_round2
|
15126 |
|
|
(operands[0], operands[1], GEN_INT (ROUND_CEIL)));
|
15127 |
|
|
else if (optimize_insn_for_size_p ())
|
15128 |
|
|
FAIL;
|
15129 |
|
|
else if (TARGET_64BIT || (mode != DFmode))
|
15130 |
|
|
ix86_expand_floorceil (operands[0], operands[1], false);
|
15131 |
|
|
else
|
15132 |
|
|
ix86_expand_floorceildf_32 (operands[0], operands[1], false);
|
15133 |
|
|
}
|
15134 |
|
|
else
|
15135 |
|
|
{
|
15136 |
|
|
rtx op0, op1;
|
15137 |
|
|
|
15138 |
|
|
if (optimize_insn_for_size_p ())
|
15139 |
|
|
FAIL;
|
15140 |
|
|
|
15141 |
|
|
op0 = gen_reg_rtx (XFmode);
|
15142 |
|
|
op1 = gen_reg_rtx (XFmode);
|
15143 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
15144 |
|
|
emit_insn (gen_frndintxf2_ceil (op0, op1));
|
15145 |
|
|
|
15146 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
15147 |
|
|
}
|
15148 |
|
|
DONE;
|
15149 |
|
|
})
|
15150 |
|
|
|
15151 |
|
|
(define_insn_and_split "*fist2_ceil_1"
|
15152 |
|
|
[(set (match_operand:SWI248x 0 "nonimmediate_operand" "")
|
15153 |
|
|
(unspec:SWI248x [(match_operand:XF 1 "register_operand" "")]
|
15154 |
|
|
UNSPEC_FIST_CEIL))
|
15155 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
15156 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15157 |
|
|
&& flag_unsafe_math_optimizations
|
15158 |
|
|
&& can_create_pseudo_p ()"
|
15159 |
|
|
"#"
|
15160 |
|
|
"&& 1"
|
15161 |
|
|
[(const_int 0)]
|
15162 |
|
|
{
|
15163 |
|
|
ix86_optimize_mode_switching[I387_CEIL] = 1;
|
15164 |
|
|
|
15165 |
|
|
operands[2] = assign_386_stack_local (HImode, SLOT_CW_STORED);
|
15166 |
|
|
operands[3] = assign_386_stack_local (HImode, SLOT_CW_CEIL);
|
15167 |
|
|
if (memory_operand (operands[0], VOIDmode))
|
15168 |
|
|
emit_insn (gen_fist2_ceil (operands[0], operands[1],
|
15169 |
|
|
operands[2], operands[3]));
|
15170 |
|
|
else
|
15171 |
|
|
{
|
15172 |
|
|
operands[4] = assign_386_stack_local (mode, SLOT_TEMP);
|
15173 |
|
|
emit_insn (gen_fist2_ceil_with_temp (operands[0], operands[1],
|
15174 |
|
|
operands[2], operands[3],
|
15175 |
|
|
operands[4]));
|
15176 |
|
|
}
|
15177 |
|
|
DONE;
|
15178 |
|
|
}
|
15179 |
|
|
[(set_attr "type" "fistp")
|
15180 |
|
|
(set_attr "i387_cw" "ceil")
|
15181 |
|
|
(set_attr "mode" "")])
|
15182 |
|
|
|
15183 |
|
|
(define_insn "fistdi2_ceil"
|
15184 |
|
|
[(set (match_operand:DI 0 "memory_operand" "=m")
|
15185 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "f")]
|
15186 |
|
|
UNSPEC_FIST_CEIL))
|
15187 |
|
|
(use (match_operand:HI 2 "memory_operand" "m"))
|
15188 |
|
|
(use (match_operand:HI 3 "memory_operand" "m"))
|
15189 |
|
|
(clobber (match_scratch:XF 4 "=&1f"))]
|
15190 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15191 |
|
|
&& flag_unsafe_math_optimizations"
|
15192 |
|
|
"* return output_fix_trunc (insn, operands, false);"
|
15193 |
|
|
[(set_attr "type" "fistp")
|
15194 |
|
|
(set_attr "i387_cw" "ceil")
|
15195 |
|
|
(set_attr "mode" "DI")])
|
15196 |
|
|
|
15197 |
|
|
(define_insn "fistdi2_ceil_with_temp"
|
15198 |
|
|
[(set (match_operand:DI 0 "nonimmediate_operand" "=m,?r")
|
15199 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "f,f")]
|
15200 |
|
|
UNSPEC_FIST_CEIL))
|
15201 |
|
|
(use (match_operand:HI 2 "memory_operand" "m,m"))
|
15202 |
|
|
(use (match_operand:HI 3 "memory_operand" "m,m"))
|
15203 |
|
|
(clobber (match_operand:DI 4 "memory_operand" "=X,m"))
|
15204 |
|
|
(clobber (match_scratch:XF 5 "=&1f,&1f"))]
|
15205 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15206 |
|
|
&& flag_unsafe_math_optimizations"
|
15207 |
|
|
"#"
|
15208 |
|
|
[(set_attr "type" "fistp")
|
15209 |
|
|
(set_attr "i387_cw" "ceil")
|
15210 |
|
|
(set_attr "mode" "DI")])
|
15211 |
|
|
|
15212 |
|
|
(define_split
|
15213 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
15214 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "")]
|
15215 |
|
|
UNSPEC_FIST_CEIL))
|
15216 |
|
|
(use (match_operand:HI 2 "memory_operand" ""))
|
15217 |
|
|
(use (match_operand:HI 3 "memory_operand" ""))
|
15218 |
|
|
(clobber (match_operand:DI 4 "memory_operand" ""))
|
15219 |
|
|
(clobber (match_scratch 5 ""))]
|
15220 |
|
|
"reload_completed"
|
15221 |
|
|
[(parallel [(set (match_dup 4)
|
15222 |
|
|
(unspec:DI [(match_dup 1)] UNSPEC_FIST_CEIL))
|
15223 |
|
|
(use (match_dup 2))
|
15224 |
|
|
(use (match_dup 3))
|
15225 |
|
|
(clobber (match_dup 5))])
|
15226 |
|
|
(set (match_dup 0) (match_dup 4))])
|
15227 |
|
|
|
15228 |
|
|
(define_split
|
15229 |
|
|
[(set (match_operand:DI 0 "memory_operand" "")
|
15230 |
|
|
(unspec:DI [(match_operand:XF 1 "register_operand" "")]
|
15231 |
|
|
UNSPEC_FIST_CEIL))
|
15232 |
|
|
(use (match_operand:HI 2 "memory_operand" ""))
|
15233 |
|
|
(use (match_operand:HI 3 "memory_operand" ""))
|
15234 |
|
|
(clobber (match_operand:DI 4 "memory_operand" ""))
|
15235 |
|
|
(clobber (match_scratch 5 ""))]
|
15236 |
|
|
"reload_completed"
|
15237 |
|
|
[(parallel [(set (match_dup 0)
|
15238 |
|
|
(unspec:DI [(match_dup 1)] UNSPEC_FIST_CEIL))
|
15239 |
|
|
(use (match_dup 2))
|
15240 |
|
|
(use (match_dup 3))
|
15241 |
|
|
(clobber (match_dup 5))])])
|
15242 |
|
|
|
15243 |
|
|
(define_insn "fist2_ceil"
|
15244 |
|
|
[(set (match_operand:SWI24 0 "memory_operand" "=m")
|
15245 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "f")]
|
15246 |
|
|
UNSPEC_FIST_CEIL))
|
15247 |
|
|
(use (match_operand:HI 2 "memory_operand" "m"))
|
15248 |
|
|
(use (match_operand:HI 3 "memory_operand" "m"))]
|
15249 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15250 |
|
|
&& flag_unsafe_math_optimizations"
|
15251 |
|
|
"* return output_fix_trunc (insn, operands, false);"
|
15252 |
|
|
[(set_attr "type" "fistp")
|
15253 |
|
|
(set_attr "i387_cw" "ceil")
|
15254 |
|
|
(set_attr "mode" "")])
|
15255 |
|
|
|
15256 |
|
|
(define_insn "fist2_ceil_with_temp"
|
15257 |
|
|
[(set (match_operand:SWI24 0 "nonimmediate_operand" "=m,?r")
|
15258 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "f,f")]
|
15259 |
|
|
UNSPEC_FIST_CEIL))
|
15260 |
|
|
(use (match_operand:HI 2 "memory_operand" "m,m"))
|
15261 |
|
|
(use (match_operand:HI 3 "memory_operand" "m,m"))
|
15262 |
|
|
(clobber (match_operand:SWI24 4 "memory_operand" "=X,m"))]
|
15263 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15264 |
|
|
&& flag_unsafe_math_optimizations"
|
15265 |
|
|
"#"
|
15266 |
|
|
[(set_attr "type" "fistp")
|
15267 |
|
|
(set_attr "i387_cw" "ceil")
|
15268 |
|
|
(set_attr "mode" "")])
|
15269 |
|
|
|
15270 |
|
|
(define_split
|
15271 |
|
|
[(set (match_operand:SWI24 0 "register_operand" "")
|
15272 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "")]
|
15273 |
|
|
UNSPEC_FIST_CEIL))
|
15274 |
|
|
(use (match_operand:HI 2 "memory_operand" ""))
|
15275 |
|
|
(use (match_operand:HI 3 "memory_operand" ""))
|
15276 |
|
|
(clobber (match_operand:SWI24 4 "memory_operand" ""))]
|
15277 |
|
|
"reload_completed"
|
15278 |
|
|
[(parallel [(set (match_dup 4)
|
15279 |
|
|
(unspec:SWI24 [(match_dup 1)] UNSPEC_FIST_CEIL))
|
15280 |
|
|
(use (match_dup 2))
|
15281 |
|
|
(use (match_dup 3))])
|
15282 |
|
|
(set (match_dup 0) (match_dup 4))])
|
15283 |
|
|
|
15284 |
|
|
(define_split
|
15285 |
|
|
[(set (match_operand:SWI24 0 "memory_operand" "")
|
15286 |
|
|
(unspec:SWI24 [(match_operand:XF 1 "register_operand" "")]
|
15287 |
|
|
UNSPEC_FIST_CEIL))
|
15288 |
|
|
(use (match_operand:HI 2 "memory_operand" ""))
|
15289 |
|
|
(use (match_operand:HI 3 "memory_operand" ""))
|
15290 |
|
|
(clobber (match_operand:SWI24 4 "memory_operand" ""))]
|
15291 |
|
|
"reload_completed"
|
15292 |
|
|
[(parallel [(set (match_dup 0)
|
15293 |
|
|
(unspec:SWI24 [(match_dup 1)] UNSPEC_FIST_CEIL))
|
15294 |
|
|
(use (match_dup 2))
|
15295 |
|
|
(use (match_dup 3))])])
|
15296 |
|
|
|
15297 |
|
|
(define_expand "lceilxf2"
|
15298 |
|
|
[(parallel [(set (match_operand:SWI248x 0 "nonimmediate_operand" "")
|
15299 |
|
|
(unspec:SWI248x [(match_operand:XF 1 "register_operand" "")]
|
15300 |
|
|
UNSPEC_FIST_CEIL))
|
15301 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
15302 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15303 |
|
|
&& (!TARGET_SSE_MATH || TARGET_MIX_SSE_I387)
|
15304 |
|
|
&& flag_unsafe_math_optimizations")
|
15305 |
|
|
|
15306 |
|
|
(define_expand "lceil2"
|
15307 |
|
|
[(match_operand:SWI48 0 "nonimmediate_operand" "")
|
15308 |
|
|
(match_operand:MODEF 1 "register_operand" "")]
|
15309 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
15310 |
|
|
&& !flag_trapping_math"
|
15311 |
|
|
{
|
15312 |
|
|
ix86_expand_lfloorceil (operands[0], operands[1], false);
|
15313 |
|
|
DONE;
|
15314 |
|
|
})
|
15315 |
|
|
|
15316 |
|
|
;; Rounding mode control word calculation could clobber FLAGS_REG.
|
15317 |
|
|
(define_insn_and_split "frndintxf2_trunc"
|
15318 |
|
|
[(set (match_operand:XF 0 "register_operand" "")
|
15319 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "")]
|
15320 |
|
|
UNSPEC_FRNDINT_TRUNC))
|
15321 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
15322 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15323 |
|
|
&& flag_unsafe_math_optimizations
|
15324 |
|
|
&& can_create_pseudo_p ()"
|
15325 |
|
|
"#"
|
15326 |
|
|
"&& 1"
|
15327 |
|
|
[(const_int 0)]
|
15328 |
|
|
{
|
15329 |
|
|
ix86_optimize_mode_switching[I387_TRUNC] = 1;
|
15330 |
|
|
|
15331 |
|
|
operands[2] = assign_386_stack_local (HImode, SLOT_CW_STORED);
|
15332 |
|
|
operands[3] = assign_386_stack_local (HImode, SLOT_CW_TRUNC);
|
15333 |
|
|
|
15334 |
|
|
emit_insn (gen_frndintxf2_trunc_i387 (operands[0], operands[1],
|
15335 |
|
|
operands[2], operands[3]));
|
15336 |
|
|
DONE;
|
15337 |
|
|
}
|
15338 |
|
|
[(set_attr "type" "frndint")
|
15339 |
|
|
(set_attr "i387_cw" "trunc")
|
15340 |
|
|
(set_attr "mode" "XF")])
|
15341 |
|
|
|
15342 |
|
|
(define_insn "frndintxf2_trunc_i387"
|
15343 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
15344 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "0")]
|
15345 |
|
|
UNSPEC_FRNDINT_TRUNC))
|
15346 |
|
|
(use (match_operand:HI 2 "memory_operand" "m"))
|
15347 |
|
|
(use (match_operand:HI 3 "memory_operand" "m"))]
|
15348 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15349 |
|
|
&& flag_unsafe_math_optimizations"
|
15350 |
|
|
"fldcw\t%3\n\tfrndint\n\tfldcw\t%2"
|
15351 |
|
|
[(set_attr "type" "frndint")
|
15352 |
|
|
(set_attr "i387_cw" "trunc")
|
15353 |
|
|
(set_attr "mode" "XF")])
|
15354 |
|
|
|
15355 |
|
|
(define_expand "btruncxf2"
|
15356 |
|
|
[(use (match_operand:XF 0 "register_operand" ""))
|
15357 |
|
|
(use (match_operand:XF 1 "register_operand" ""))]
|
15358 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15359 |
|
|
&& flag_unsafe_math_optimizations"
|
15360 |
|
|
{
|
15361 |
|
|
if (optimize_insn_for_size_p ())
|
15362 |
|
|
FAIL;
|
15363 |
|
|
emit_insn (gen_frndintxf2_trunc (operands[0], operands[1]));
|
15364 |
|
|
DONE;
|
15365 |
|
|
})
|
15366 |
|
|
|
15367 |
|
|
(define_expand "btrunc2"
|
15368 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
15369 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
15370 |
|
|
"(TARGET_USE_FANCY_MATH_387
|
15371 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
15372 |
|
|
|| TARGET_MIX_SSE_I387)
|
15373 |
|
|
&& flag_unsafe_math_optimizations)
|
15374 |
|
|
|| (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
15375 |
|
|
&& !flag_trapping_math)"
|
15376 |
|
|
{
|
15377 |
|
|
if (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH
|
15378 |
|
|
&& !flag_trapping_math)
|
15379 |
|
|
{
|
15380 |
|
|
if (TARGET_ROUND)
|
15381 |
|
|
emit_insn (gen_sse4_1_round2
|
15382 |
|
|
(operands[0], operands[1], GEN_INT (ROUND_TRUNC)));
|
15383 |
|
|
else if (optimize_insn_for_size_p ())
|
15384 |
|
|
FAIL;
|
15385 |
|
|
else if (TARGET_64BIT || (mode != DFmode))
|
15386 |
|
|
ix86_expand_trunc (operands[0], operands[1]);
|
15387 |
|
|
else
|
15388 |
|
|
ix86_expand_truncdf_32 (operands[0], operands[1]);
|
15389 |
|
|
}
|
15390 |
|
|
else
|
15391 |
|
|
{
|
15392 |
|
|
rtx op0, op1;
|
15393 |
|
|
|
15394 |
|
|
if (optimize_insn_for_size_p ())
|
15395 |
|
|
FAIL;
|
15396 |
|
|
|
15397 |
|
|
op0 = gen_reg_rtx (XFmode);
|
15398 |
|
|
op1 = gen_reg_rtx (XFmode);
|
15399 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
15400 |
|
|
emit_insn (gen_frndintxf2_trunc (op0, op1));
|
15401 |
|
|
|
15402 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
15403 |
|
|
}
|
15404 |
|
|
DONE;
|
15405 |
|
|
})
|
15406 |
|
|
|
15407 |
|
|
;; Rounding mode control word calculation could clobber FLAGS_REG.
|
15408 |
|
|
(define_insn_and_split "frndintxf2_mask_pm"
|
15409 |
|
|
[(set (match_operand:XF 0 "register_operand" "")
|
15410 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "")]
|
15411 |
|
|
UNSPEC_FRNDINT_MASK_PM))
|
15412 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
15413 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15414 |
|
|
&& flag_unsafe_math_optimizations
|
15415 |
|
|
&& can_create_pseudo_p ()"
|
15416 |
|
|
"#"
|
15417 |
|
|
"&& 1"
|
15418 |
|
|
[(const_int 0)]
|
15419 |
|
|
{
|
15420 |
|
|
ix86_optimize_mode_switching[I387_MASK_PM] = 1;
|
15421 |
|
|
|
15422 |
|
|
operands[2] = assign_386_stack_local (HImode, SLOT_CW_STORED);
|
15423 |
|
|
operands[3] = assign_386_stack_local (HImode, SLOT_CW_MASK_PM);
|
15424 |
|
|
|
15425 |
|
|
emit_insn (gen_frndintxf2_mask_pm_i387 (operands[0], operands[1],
|
15426 |
|
|
operands[2], operands[3]));
|
15427 |
|
|
DONE;
|
15428 |
|
|
}
|
15429 |
|
|
[(set_attr "type" "frndint")
|
15430 |
|
|
(set_attr "i387_cw" "mask_pm")
|
15431 |
|
|
(set_attr "mode" "XF")])
|
15432 |
|
|
|
15433 |
|
|
(define_insn "frndintxf2_mask_pm_i387"
|
15434 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f")
|
15435 |
|
|
(unspec:XF [(match_operand:XF 1 "register_operand" "0")]
|
15436 |
|
|
UNSPEC_FRNDINT_MASK_PM))
|
15437 |
|
|
(use (match_operand:HI 2 "memory_operand" "m"))
|
15438 |
|
|
(use (match_operand:HI 3 "memory_operand" "m"))]
|
15439 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15440 |
|
|
&& flag_unsafe_math_optimizations"
|
15441 |
|
|
"fldcw\t%3\n\tfrndint\n\tfclex\n\tfldcw\t%2"
|
15442 |
|
|
[(set_attr "type" "frndint")
|
15443 |
|
|
(set_attr "i387_cw" "mask_pm")
|
15444 |
|
|
(set_attr "mode" "XF")])
|
15445 |
|
|
|
15446 |
|
|
(define_expand "nearbyintxf2"
|
15447 |
|
|
[(use (match_operand:XF 0 "register_operand" ""))
|
15448 |
|
|
(use (match_operand:XF 1 "register_operand" ""))]
|
15449 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15450 |
|
|
&& flag_unsafe_math_optimizations"
|
15451 |
|
|
{
|
15452 |
|
|
emit_insn (gen_frndintxf2_mask_pm (operands[0], operands[1]));
|
15453 |
|
|
DONE;
|
15454 |
|
|
})
|
15455 |
|
|
|
15456 |
|
|
(define_expand "nearbyint2"
|
15457 |
|
|
[(use (match_operand:MODEF 0 "register_operand" ""))
|
15458 |
|
|
(use (match_operand:MODEF 1 "register_operand" ""))]
|
15459 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15460 |
|
|
&& (!(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)
|
15461 |
|
|
|| TARGET_MIX_SSE_I387)
|
15462 |
|
|
&& flag_unsafe_math_optimizations"
|
15463 |
|
|
{
|
15464 |
|
|
rtx op0 = gen_reg_rtx (XFmode);
|
15465 |
|
|
rtx op1 = gen_reg_rtx (XFmode);
|
15466 |
|
|
|
15467 |
|
|
emit_insn (gen_extendxf2 (op1, operands[1]));
|
15468 |
|
|
emit_insn (gen_frndintxf2_mask_pm (op0, op1));
|
15469 |
|
|
|
15470 |
|
|
emit_insn (gen_truncxf2_i387_noop (operands[0], op0));
|
15471 |
|
|
DONE;
|
15472 |
|
|
})
|
15473 |
|
|
|
15474 |
|
|
(define_insn "fxam2_i387"
|
15475 |
|
|
[(set (match_operand:HI 0 "register_operand" "=a")
|
15476 |
|
|
(unspec:HI
|
15477 |
|
|
[(match_operand:X87MODEF 1 "register_operand" "f")]
|
15478 |
|
|
UNSPEC_FXAM))]
|
15479 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
15480 |
|
|
"fxam\n\tfnstsw\t%0"
|
15481 |
|
|
[(set_attr "type" "multi")
|
15482 |
|
|
(set_attr "length" "4")
|
15483 |
|
|
(set_attr "unit" "i387")
|
15484 |
|
|
(set_attr "mode" "")])
|
15485 |
|
|
|
15486 |
|
|
(define_insn_and_split "fxam2_i387_with_temp"
|
15487 |
|
|
[(set (match_operand:HI 0 "register_operand" "")
|
15488 |
|
|
(unspec:HI
|
15489 |
|
|
[(match_operand:MODEF 1 "memory_operand" "")]
|
15490 |
|
|
UNSPEC_FXAM_MEM))]
|
15491 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15492 |
|
|
&& can_create_pseudo_p ()"
|
15493 |
|
|
"#"
|
15494 |
|
|
"&& 1"
|
15495 |
|
|
[(set (match_dup 2)(match_dup 1))
|
15496 |
|
|
(set (match_dup 0)
|
15497 |
|
|
(unspec:HI [(match_dup 2)] UNSPEC_FXAM))]
|
15498 |
|
|
{
|
15499 |
|
|
operands[2] = gen_reg_rtx (mode);
|
15500 |
|
|
|
15501 |
|
|
MEM_VOLATILE_P (operands[1]) = 1;
|
15502 |
|
|
}
|
15503 |
|
|
[(set_attr "type" "multi")
|
15504 |
|
|
(set_attr "unit" "i387")
|
15505 |
|
|
(set_attr "mode" "")])
|
15506 |
|
|
|
15507 |
|
|
(define_expand "isinfxf2"
|
15508 |
|
|
[(use (match_operand:SI 0 "register_operand" ""))
|
15509 |
|
|
(use (match_operand:XF 1 "register_operand" ""))]
|
15510 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15511 |
|
|
&& TARGET_C99_FUNCTIONS"
|
15512 |
|
|
{
|
15513 |
|
|
rtx mask = GEN_INT (0x45);
|
15514 |
|
|
rtx val = GEN_INT (0x05);
|
15515 |
|
|
|
15516 |
|
|
rtx cond;
|
15517 |
|
|
|
15518 |
|
|
rtx scratch = gen_reg_rtx (HImode);
|
15519 |
|
|
rtx res = gen_reg_rtx (QImode);
|
15520 |
|
|
|
15521 |
|
|
emit_insn (gen_fxamxf2_i387 (scratch, operands[1]));
|
15522 |
|
|
|
15523 |
|
|
emit_insn (gen_andqi_ext_0 (scratch, scratch, mask));
|
15524 |
|
|
emit_insn (gen_cmpqi_ext_3 (scratch, val));
|
15525 |
|
|
cond = gen_rtx_fmt_ee (EQ, QImode,
|
15526 |
|
|
gen_rtx_REG (CCmode, FLAGS_REG),
|
15527 |
|
|
const0_rtx);
|
15528 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, res, cond));
|
15529 |
|
|
emit_insn (gen_zero_extendqisi2 (operands[0], res));
|
15530 |
|
|
DONE;
|
15531 |
|
|
})
|
15532 |
|
|
|
15533 |
|
|
(define_expand "isinf2"
|
15534 |
|
|
[(use (match_operand:SI 0 "register_operand" ""))
|
15535 |
|
|
(use (match_operand:MODEF 1 "nonimmediate_operand" ""))]
|
15536 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15537 |
|
|
&& TARGET_C99_FUNCTIONS
|
15538 |
|
|
&& !(SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)"
|
15539 |
|
|
{
|
15540 |
|
|
rtx mask = GEN_INT (0x45);
|
15541 |
|
|
rtx val = GEN_INT (0x05);
|
15542 |
|
|
|
15543 |
|
|
rtx cond;
|
15544 |
|
|
|
15545 |
|
|
rtx scratch = gen_reg_rtx (HImode);
|
15546 |
|
|
rtx res = gen_reg_rtx (QImode);
|
15547 |
|
|
|
15548 |
|
|
/* Remove excess precision by forcing value through memory. */
|
15549 |
|
|
if (memory_operand (operands[1], VOIDmode))
|
15550 |
|
|
emit_insn (gen_fxam2_i387_with_temp (scratch, operands[1]));
|
15551 |
|
|
else
|
15552 |
|
|
{
|
15553 |
|
|
enum ix86_stack_slot slot = (virtuals_instantiated
|
15554 |
|
|
? SLOT_TEMP
|
15555 |
|
|
: SLOT_VIRTUAL);
|
15556 |
|
|
rtx temp = assign_386_stack_local (mode, slot);
|
15557 |
|
|
|
15558 |
|
|
emit_move_insn (temp, operands[1]);
|
15559 |
|
|
emit_insn (gen_fxam2_i387_with_temp (scratch, temp));
|
15560 |
|
|
}
|
15561 |
|
|
|
15562 |
|
|
emit_insn (gen_andqi_ext_0 (scratch, scratch, mask));
|
15563 |
|
|
emit_insn (gen_cmpqi_ext_3 (scratch, val));
|
15564 |
|
|
cond = gen_rtx_fmt_ee (EQ, QImode,
|
15565 |
|
|
gen_rtx_REG (CCmode, FLAGS_REG),
|
15566 |
|
|
const0_rtx);
|
15567 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, res, cond));
|
15568 |
|
|
emit_insn (gen_zero_extendqisi2 (operands[0], res));
|
15569 |
|
|
DONE;
|
15570 |
|
|
})
|
15571 |
|
|
|
15572 |
|
|
(define_expand "signbitxf2"
|
15573 |
|
|
[(use (match_operand:SI 0 "register_operand" ""))
|
15574 |
|
|
(use (match_operand:XF 1 "register_operand" ""))]
|
15575 |
|
|
"TARGET_USE_FANCY_MATH_387"
|
15576 |
|
|
{
|
15577 |
|
|
rtx scratch = gen_reg_rtx (HImode);
|
15578 |
|
|
|
15579 |
|
|
emit_insn (gen_fxamxf2_i387 (scratch, operands[1]));
|
15580 |
|
|
emit_insn (gen_andsi3 (operands[0],
|
15581 |
|
|
gen_lowpart (SImode, scratch), GEN_INT (0x200)));
|
15582 |
|
|
DONE;
|
15583 |
|
|
})
|
15584 |
|
|
|
15585 |
|
|
(define_insn "movmsk_df"
|
15586 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
15587 |
|
|
(unspec:SI
|
15588 |
|
|
[(match_operand:DF 1 "register_operand" "x")]
|
15589 |
|
|
UNSPEC_MOVMSK))]
|
15590 |
|
|
"SSE_FLOAT_MODE_P (DFmode) && TARGET_SSE_MATH"
|
15591 |
|
|
"%vmovmskpd\t{%1, %0|%0, %1}"
|
15592 |
|
|
[(set_attr "type" "ssemov")
|
15593 |
|
|
(set_attr "prefix" "maybe_vex")
|
15594 |
|
|
(set_attr "mode" "DF")])
|
15595 |
|
|
|
15596 |
|
|
;; Use movmskpd in SSE mode to avoid store forwarding stall
|
15597 |
|
|
;; for 32bit targets and movq+shrq sequence for 64bit targets.
|
15598 |
|
|
(define_expand "signbitdf2"
|
15599 |
|
|
[(use (match_operand:SI 0 "register_operand" ""))
|
15600 |
|
|
(use (match_operand:DF 1 "register_operand" ""))]
|
15601 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15602 |
|
|
|| (SSE_FLOAT_MODE_P (DFmode) && TARGET_SSE_MATH)"
|
15603 |
|
|
{
|
15604 |
|
|
if (SSE_FLOAT_MODE_P (DFmode) && TARGET_SSE_MATH)
|
15605 |
|
|
{
|
15606 |
|
|
emit_insn (gen_movmsk_df (operands[0], operands[1]));
|
15607 |
|
|
emit_insn (gen_andsi3 (operands[0], operands[0], const1_rtx));
|
15608 |
|
|
}
|
15609 |
|
|
else
|
15610 |
|
|
{
|
15611 |
|
|
rtx scratch = gen_reg_rtx (HImode);
|
15612 |
|
|
|
15613 |
|
|
emit_insn (gen_fxamdf2_i387 (scratch, operands[1]));
|
15614 |
|
|
emit_insn (gen_andsi3 (operands[0],
|
15615 |
|
|
gen_lowpart (SImode, scratch), GEN_INT (0x200)));
|
15616 |
|
|
}
|
15617 |
|
|
DONE;
|
15618 |
|
|
})
|
15619 |
|
|
|
15620 |
|
|
(define_expand "signbitsf2"
|
15621 |
|
|
[(use (match_operand:SI 0 "register_operand" ""))
|
15622 |
|
|
(use (match_operand:SF 1 "register_operand" ""))]
|
15623 |
|
|
"TARGET_USE_FANCY_MATH_387
|
15624 |
|
|
&& !(SSE_FLOAT_MODE_P (SFmode) && TARGET_SSE_MATH)"
|
15625 |
|
|
{
|
15626 |
|
|
rtx scratch = gen_reg_rtx (HImode);
|
15627 |
|
|
|
15628 |
|
|
emit_insn (gen_fxamsf2_i387 (scratch, operands[1]));
|
15629 |
|
|
emit_insn (gen_andsi3 (operands[0],
|
15630 |
|
|
gen_lowpart (SImode, scratch), GEN_INT (0x200)));
|
15631 |
|
|
DONE;
|
15632 |
|
|
})
|
15633 |
|
|
|
15634 |
|
|
;; Block operation instructions
|
15635 |
|
|
|
15636 |
|
|
(define_insn "cld"
|
15637 |
|
|
[(unspec_volatile [(const_int 0)] UNSPECV_CLD)]
|
15638 |
|
|
""
|
15639 |
|
|
"cld"
|
15640 |
|
|
[(set_attr "length" "1")
|
15641 |
|
|
(set_attr "length_immediate" "0")
|
15642 |
|
|
(set_attr "modrm" "0")])
|
15643 |
|
|
|
15644 |
|
|
(define_expand "movmem"
|
15645 |
|
|
[(use (match_operand:BLK 0 "memory_operand" ""))
|
15646 |
|
|
(use (match_operand:BLK 1 "memory_operand" ""))
|
15647 |
|
|
(use (match_operand:SWI48 2 "nonmemory_operand" ""))
|
15648 |
|
|
(use (match_operand:SWI48 3 "const_int_operand" ""))
|
15649 |
|
|
(use (match_operand:SI 4 "const_int_operand" ""))
|
15650 |
|
|
(use (match_operand:SI 5 "const_int_operand" ""))]
|
15651 |
|
|
""
|
15652 |
|
|
{
|
15653 |
|
|
if (ix86_expand_movmem (operands[0], operands[1], operands[2], operands[3],
|
15654 |
|
|
operands[4], operands[5]))
|
15655 |
|
|
DONE;
|
15656 |
|
|
else
|
15657 |
|
|
FAIL;
|
15658 |
|
|
})
|
15659 |
|
|
|
15660 |
|
|
;; Most CPUs don't like single string operations
|
15661 |
|
|
;; Handle this case here to simplify previous expander.
|
15662 |
|
|
|
15663 |
|
|
(define_expand "strmov"
|
15664 |
|
|
[(set (match_dup 4) (match_operand 3 "memory_operand" ""))
|
15665 |
|
|
(set (match_operand 1 "memory_operand" "") (match_dup 4))
|
15666 |
|
|
(parallel [(set (match_operand 0 "register_operand" "") (match_dup 5))
|
15667 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
15668 |
|
|
(parallel [(set (match_operand 2 "register_operand" "") (match_dup 6))
|
15669 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
15670 |
|
|
""
|
15671 |
|
|
{
|
15672 |
|
|
rtx adjust = GEN_INT (GET_MODE_SIZE (GET_MODE (operands[1])));
|
15673 |
|
|
|
15674 |
|
|
/* If .md ever supports :P for Pmode, these can be directly
|
15675 |
|
|
in the pattern above. */
|
15676 |
|
|
operands[5] = gen_rtx_PLUS (Pmode, operands[0], adjust);
|
15677 |
|
|
operands[6] = gen_rtx_PLUS (Pmode, operands[2], adjust);
|
15678 |
|
|
|
15679 |
|
|
/* Can't use this if the user has appropriated esi or edi. */
|
15680 |
|
|
if ((TARGET_SINGLE_STRINGOP || optimize_insn_for_size_p ())
|
15681 |
|
|
&& !(fixed_regs[SI_REG] || fixed_regs[DI_REG]))
|
15682 |
|
|
{
|
15683 |
|
|
emit_insn (gen_strmov_singleop (operands[0], operands[1],
|
15684 |
|
|
operands[2], operands[3],
|
15685 |
|
|
operands[5], operands[6]));
|
15686 |
|
|
DONE;
|
15687 |
|
|
}
|
15688 |
|
|
|
15689 |
|
|
operands[4] = gen_reg_rtx (GET_MODE (operands[1]));
|
15690 |
|
|
})
|
15691 |
|
|
|
15692 |
|
|
(define_expand "strmov_singleop"
|
15693 |
|
|
[(parallel [(set (match_operand 1 "memory_operand" "")
|
15694 |
|
|
(match_operand 3 "memory_operand" ""))
|
15695 |
|
|
(set (match_operand 0 "register_operand" "")
|
15696 |
|
|
(match_operand 4 "" ""))
|
15697 |
|
|
(set (match_operand 2 "register_operand" "")
|
15698 |
|
|
(match_operand 5 "" ""))])]
|
15699 |
|
|
""
|
15700 |
|
|
"ix86_current_function_needs_cld = 1;")
|
15701 |
|
|
|
15702 |
|
|
(define_insn "*strmovdi_rex_1"
|
15703 |
|
|
[(set (mem:DI (match_operand:DI 2 "register_operand" "0"))
|
15704 |
|
|
(mem:DI (match_operand:DI 3 "register_operand" "1")))
|
15705 |
|
|
(set (match_operand:DI 0 "register_operand" "=D")
|
15706 |
|
|
(plus:DI (match_dup 2)
|
15707 |
|
|
(const_int 8)))
|
15708 |
|
|
(set (match_operand:DI 1 "register_operand" "=S")
|
15709 |
|
|
(plus:DI (match_dup 3)
|
15710 |
|
|
(const_int 8)))]
|
15711 |
|
|
"TARGET_64BIT
|
15712 |
|
|
&& !(fixed_regs[SI_REG] || fixed_regs[DI_REG])"
|
15713 |
|
|
"movsq"
|
15714 |
|
|
[(set_attr "type" "str")
|
15715 |
|
|
(set_attr "memory" "both")
|
15716 |
|
|
(set_attr "mode" "DI")])
|
15717 |
|
|
|
15718 |
|
|
(define_insn "*strmovsi_1"
|
15719 |
|
|
[(set (mem:SI (match_operand:P 2 "register_operand" "0"))
|
15720 |
|
|
(mem:SI (match_operand:P 3 "register_operand" "1")))
|
15721 |
|
|
(set (match_operand:P 0 "register_operand" "=D")
|
15722 |
|
|
(plus:P (match_dup 2)
|
15723 |
|
|
(const_int 4)))
|
15724 |
|
|
(set (match_operand:P 1 "register_operand" "=S")
|
15725 |
|
|
(plus:P (match_dup 3)
|
15726 |
|
|
(const_int 4)))]
|
15727 |
|
|
"!(fixed_regs[SI_REG] || fixed_regs[DI_REG])"
|
15728 |
|
|
"movs{l|d}"
|
15729 |
|
|
[(set_attr "type" "str")
|
15730 |
|
|
(set_attr "memory" "both")
|
15731 |
|
|
(set_attr "mode" "SI")])
|
15732 |
|
|
|
15733 |
|
|
(define_insn "*strmovhi_1"
|
15734 |
|
|
[(set (mem:HI (match_operand:P 2 "register_operand" "0"))
|
15735 |
|
|
(mem:HI (match_operand:P 3 "register_operand" "1")))
|
15736 |
|
|
(set (match_operand:P 0 "register_operand" "=D")
|
15737 |
|
|
(plus:P (match_dup 2)
|
15738 |
|
|
(const_int 2)))
|
15739 |
|
|
(set (match_operand:P 1 "register_operand" "=S")
|
15740 |
|
|
(plus:P (match_dup 3)
|
15741 |
|
|
(const_int 2)))]
|
15742 |
|
|
"!(fixed_regs[SI_REG] || fixed_regs[DI_REG])"
|
15743 |
|
|
"movsw"
|
15744 |
|
|
[(set_attr "type" "str")
|
15745 |
|
|
(set_attr "memory" "both")
|
15746 |
|
|
(set_attr "mode" "HI")])
|
15747 |
|
|
|
15748 |
|
|
(define_insn "*strmovqi_1"
|
15749 |
|
|
[(set (mem:QI (match_operand:P 2 "register_operand" "0"))
|
15750 |
|
|
(mem:QI (match_operand:P 3 "register_operand" "1")))
|
15751 |
|
|
(set (match_operand:P 0 "register_operand" "=D")
|
15752 |
|
|
(plus:P (match_dup 2)
|
15753 |
|
|
(const_int 1)))
|
15754 |
|
|
(set (match_operand:P 1 "register_operand" "=S")
|
15755 |
|
|
(plus:P (match_dup 3)
|
15756 |
|
|
(const_int 1)))]
|
15757 |
|
|
"!(fixed_regs[SI_REG] || fixed_regs[DI_REG])"
|
15758 |
|
|
"movsb"
|
15759 |
|
|
[(set_attr "type" "str")
|
15760 |
|
|
(set_attr "memory" "both")
|
15761 |
|
|
(set (attr "prefix_rex")
|
15762 |
|
|
(if_then_else
|
15763 |
|
|
(match_test "mode == DImode")
|
15764 |
|
|
(const_string "0")
|
15765 |
|
|
(const_string "*")))
|
15766 |
|
|
(set_attr "mode" "QI")])
|
15767 |
|
|
|
15768 |
|
|
(define_expand "rep_mov"
|
15769 |
|
|
[(parallel [(set (match_operand 4 "register_operand" "") (const_int 0))
|
15770 |
|
|
(set (match_operand 0 "register_operand" "")
|
15771 |
|
|
(match_operand 5 "" ""))
|
15772 |
|
|
(set (match_operand 2 "register_operand" "")
|
15773 |
|
|
(match_operand 6 "" ""))
|
15774 |
|
|
(set (match_operand 1 "memory_operand" "")
|
15775 |
|
|
(match_operand 3 "memory_operand" ""))
|
15776 |
|
|
(use (match_dup 4))])]
|
15777 |
|
|
""
|
15778 |
|
|
"ix86_current_function_needs_cld = 1;")
|
15779 |
|
|
|
15780 |
|
|
(define_insn "*rep_movdi_rex64"
|
15781 |
|
|
[(set (match_operand:DI 2 "register_operand" "=c") (const_int 0))
|
15782 |
|
|
(set (match_operand:DI 0 "register_operand" "=D")
|
15783 |
|
|
(plus:DI (ashift:DI (match_operand:DI 5 "register_operand" "2")
|
15784 |
|
|
(const_int 3))
|
15785 |
|
|
(match_operand:DI 3 "register_operand" "0")))
|
15786 |
|
|
(set (match_operand:DI 1 "register_operand" "=S")
|
15787 |
|
|
(plus:DI (ashift:DI (match_dup 5) (const_int 3))
|
15788 |
|
|
(match_operand:DI 4 "register_operand" "1")))
|
15789 |
|
|
(set (mem:BLK (match_dup 3))
|
15790 |
|
|
(mem:BLK (match_dup 4)))
|
15791 |
|
|
(use (match_dup 5))]
|
15792 |
|
|
"TARGET_64BIT
|
15793 |
|
|
&& !(fixed_regs[CX_REG] || fixed_regs[SI_REG] || fixed_regs[DI_REG])"
|
15794 |
|
|
"rep{%;} movsq"
|
15795 |
|
|
[(set_attr "type" "str")
|
15796 |
|
|
(set_attr "prefix_rep" "1")
|
15797 |
|
|
(set_attr "memory" "both")
|
15798 |
|
|
(set_attr "mode" "DI")])
|
15799 |
|
|
|
15800 |
|
|
(define_insn "*rep_movsi"
|
15801 |
|
|
[(set (match_operand:P 2 "register_operand" "=c") (const_int 0))
|
15802 |
|
|
(set (match_operand:P 0 "register_operand" "=D")
|
15803 |
|
|
(plus:P (ashift:P (match_operand:P 5 "register_operand" "2")
|
15804 |
|
|
(const_int 2))
|
15805 |
|
|
(match_operand:P 3 "register_operand" "0")))
|
15806 |
|
|
(set (match_operand:P 1 "register_operand" "=S")
|
15807 |
|
|
(plus:P (ashift:P (match_dup 5) (const_int 2))
|
15808 |
|
|
(match_operand:P 4 "register_operand" "1")))
|
15809 |
|
|
(set (mem:BLK (match_dup 3))
|
15810 |
|
|
(mem:BLK (match_dup 4)))
|
15811 |
|
|
(use (match_dup 5))]
|
15812 |
|
|
"!(fixed_regs[CX_REG] || fixed_regs[SI_REG] || fixed_regs[DI_REG])"
|
15813 |
|
|
"rep{%;} movs{l|d}"
|
15814 |
|
|
[(set_attr "type" "str")
|
15815 |
|
|
(set_attr "prefix_rep" "1")
|
15816 |
|
|
(set_attr "memory" "both")
|
15817 |
|
|
(set_attr "mode" "SI")])
|
15818 |
|
|
|
15819 |
|
|
(define_insn "*rep_movqi"
|
15820 |
|
|
[(set (match_operand:P 2 "register_operand" "=c") (const_int 0))
|
15821 |
|
|
(set (match_operand:P 0 "register_operand" "=D")
|
15822 |
|
|
(plus:P (match_operand:P 3 "register_operand" "0")
|
15823 |
|
|
(match_operand:P 5 "register_operand" "2")))
|
15824 |
|
|
(set (match_operand:P 1 "register_operand" "=S")
|
15825 |
|
|
(plus:P (match_operand:P 4 "register_operand" "1") (match_dup 5)))
|
15826 |
|
|
(set (mem:BLK (match_dup 3))
|
15827 |
|
|
(mem:BLK (match_dup 4)))
|
15828 |
|
|
(use (match_dup 5))]
|
15829 |
|
|
"!(fixed_regs[CX_REG] || fixed_regs[SI_REG] || fixed_regs[DI_REG])"
|
15830 |
|
|
"rep{%;} movsb"
|
15831 |
|
|
[(set_attr "type" "str")
|
15832 |
|
|
(set_attr "prefix_rep" "1")
|
15833 |
|
|
(set_attr "memory" "both")
|
15834 |
|
|
(set_attr "mode" "QI")])
|
15835 |
|
|
|
15836 |
|
|
(define_expand "setmem"
|
15837 |
|
|
[(use (match_operand:BLK 0 "memory_operand" ""))
|
15838 |
|
|
(use (match_operand:SWI48 1 "nonmemory_operand" ""))
|
15839 |
|
|
(use (match_operand:QI 2 "nonmemory_operand" ""))
|
15840 |
|
|
(use (match_operand 3 "const_int_operand" ""))
|
15841 |
|
|
(use (match_operand:SI 4 "const_int_operand" ""))
|
15842 |
|
|
(use (match_operand:SI 5 "const_int_operand" ""))]
|
15843 |
|
|
""
|
15844 |
|
|
{
|
15845 |
|
|
if (ix86_expand_setmem (operands[0], operands[1],
|
15846 |
|
|
operands[2], operands[3],
|
15847 |
|
|
operands[4], operands[5]))
|
15848 |
|
|
DONE;
|
15849 |
|
|
else
|
15850 |
|
|
FAIL;
|
15851 |
|
|
})
|
15852 |
|
|
|
15853 |
|
|
;; Most CPUs don't like single string operations
|
15854 |
|
|
;; Handle this case here to simplify previous expander.
|
15855 |
|
|
|
15856 |
|
|
(define_expand "strset"
|
15857 |
|
|
[(set (match_operand 1 "memory_operand" "")
|
15858 |
|
|
(match_operand 2 "register_operand" ""))
|
15859 |
|
|
(parallel [(set (match_operand 0 "register_operand" "")
|
15860 |
|
|
(match_dup 3))
|
15861 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
15862 |
|
|
""
|
15863 |
|
|
{
|
15864 |
|
|
if (GET_MODE (operands[1]) != GET_MODE (operands[2]))
|
15865 |
|
|
operands[1] = adjust_address_nv (operands[1], GET_MODE (operands[2]), 0);
|
15866 |
|
|
|
15867 |
|
|
/* If .md ever supports :P for Pmode, this can be directly
|
15868 |
|
|
in the pattern above. */
|
15869 |
|
|
operands[3] = gen_rtx_PLUS (Pmode, operands[0],
|
15870 |
|
|
GEN_INT (GET_MODE_SIZE (GET_MODE
|
15871 |
|
|
(operands[2]))));
|
15872 |
|
|
/* Can't use this if the user has appropriated eax or edi. */
|
15873 |
|
|
if ((TARGET_SINGLE_STRINGOP || optimize_insn_for_size_p ())
|
15874 |
|
|
&& !(fixed_regs[AX_REG] || fixed_regs[DI_REG]))
|
15875 |
|
|
{
|
15876 |
|
|
emit_insn (gen_strset_singleop (operands[0], operands[1], operands[2],
|
15877 |
|
|
operands[3]));
|
15878 |
|
|
DONE;
|
15879 |
|
|
}
|
15880 |
|
|
})
|
15881 |
|
|
|
15882 |
|
|
(define_expand "strset_singleop"
|
15883 |
|
|
[(parallel [(set (match_operand 1 "memory_operand" "")
|
15884 |
|
|
(match_operand 2 "register_operand" ""))
|
15885 |
|
|
(set (match_operand 0 "register_operand" "")
|
15886 |
|
|
(match_operand 3 "" ""))])]
|
15887 |
|
|
""
|
15888 |
|
|
"ix86_current_function_needs_cld = 1;")
|
15889 |
|
|
|
15890 |
|
|
(define_insn "*strsetdi_rex_1"
|
15891 |
|
|
[(set (mem:DI (match_operand:DI 1 "register_operand" "0"))
|
15892 |
|
|
(match_operand:DI 2 "register_operand" "a"))
|
15893 |
|
|
(set (match_operand:DI 0 "register_operand" "=D")
|
15894 |
|
|
(plus:DI (match_dup 1)
|
15895 |
|
|
(const_int 8)))]
|
15896 |
|
|
"TARGET_64BIT
|
15897 |
|
|
&& !(fixed_regs[AX_REG] || fixed_regs[DI_REG])"
|
15898 |
|
|
"stosq"
|
15899 |
|
|
[(set_attr "type" "str")
|
15900 |
|
|
(set_attr "memory" "store")
|
15901 |
|
|
(set_attr "mode" "DI")])
|
15902 |
|
|
|
15903 |
|
|
(define_insn "*strsetsi_1"
|
15904 |
|
|
[(set (mem:SI (match_operand:P 1 "register_operand" "0"))
|
15905 |
|
|
(match_operand:SI 2 "register_operand" "a"))
|
15906 |
|
|
(set (match_operand:P 0 "register_operand" "=D")
|
15907 |
|
|
(plus:P (match_dup 1)
|
15908 |
|
|
(const_int 4)))]
|
15909 |
|
|
"!(fixed_regs[AX_REG] || fixed_regs[DI_REG])"
|
15910 |
|
|
"stos{l|d}"
|
15911 |
|
|
[(set_attr "type" "str")
|
15912 |
|
|
(set_attr "memory" "store")
|
15913 |
|
|
(set_attr "mode" "SI")])
|
15914 |
|
|
|
15915 |
|
|
(define_insn "*strsethi_1"
|
15916 |
|
|
[(set (mem:HI (match_operand:P 1 "register_operand" "0"))
|
15917 |
|
|
(match_operand:HI 2 "register_operand" "a"))
|
15918 |
|
|
(set (match_operand:P 0 "register_operand" "=D")
|
15919 |
|
|
(plus:P (match_dup 1)
|
15920 |
|
|
(const_int 2)))]
|
15921 |
|
|
"!(fixed_regs[AX_REG] || fixed_regs[DI_REG])"
|
15922 |
|
|
"stosw"
|
15923 |
|
|
[(set_attr "type" "str")
|
15924 |
|
|
(set_attr "memory" "store")
|
15925 |
|
|
(set_attr "mode" "HI")])
|
15926 |
|
|
|
15927 |
|
|
(define_insn "*strsetqi_1"
|
15928 |
|
|
[(set (mem:QI (match_operand:P 1 "register_operand" "0"))
|
15929 |
|
|
(match_operand:QI 2 "register_operand" "a"))
|
15930 |
|
|
(set (match_operand:P 0 "register_operand" "=D")
|
15931 |
|
|
(plus:P (match_dup 1)
|
15932 |
|
|
(const_int 1)))]
|
15933 |
|
|
"!(fixed_regs[AX_REG] || fixed_regs[DI_REG])"
|
15934 |
|
|
"stosb"
|
15935 |
|
|
[(set_attr "type" "str")
|
15936 |
|
|
(set_attr "memory" "store")
|
15937 |
|
|
(set (attr "prefix_rex")
|
15938 |
|
|
(if_then_else
|
15939 |
|
|
(match_test "mode == DImode")
|
15940 |
|
|
(const_string "0")
|
15941 |
|
|
(const_string "*")))
|
15942 |
|
|
(set_attr "mode" "QI")])
|
15943 |
|
|
|
15944 |
|
|
(define_expand "rep_stos"
|
15945 |
|
|
[(parallel [(set (match_operand 1 "register_operand" "") (const_int 0))
|
15946 |
|
|
(set (match_operand 0 "register_operand" "")
|
15947 |
|
|
(match_operand 4 "" ""))
|
15948 |
|
|
(set (match_operand 2 "memory_operand" "") (const_int 0))
|
15949 |
|
|
(use (match_operand 3 "register_operand" ""))
|
15950 |
|
|
(use (match_dup 1))])]
|
15951 |
|
|
""
|
15952 |
|
|
"ix86_current_function_needs_cld = 1;")
|
15953 |
|
|
|
15954 |
|
|
(define_insn "*rep_stosdi_rex64"
|
15955 |
|
|
[(set (match_operand:DI 1 "register_operand" "=c") (const_int 0))
|
15956 |
|
|
(set (match_operand:DI 0 "register_operand" "=D")
|
15957 |
|
|
(plus:DI (ashift:DI (match_operand:DI 4 "register_operand" "1")
|
15958 |
|
|
(const_int 3))
|
15959 |
|
|
(match_operand:DI 3 "register_operand" "0")))
|
15960 |
|
|
(set (mem:BLK (match_dup 3))
|
15961 |
|
|
(const_int 0))
|
15962 |
|
|
(use (match_operand:DI 2 "register_operand" "a"))
|
15963 |
|
|
(use (match_dup 4))]
|
15964 |
|
|
"TARGET_64BIT
|
15965 |
|
|
&& !(fixed_regs[AX_REG] || fixed_regs[CX_REG] || fixed_regs[DI_REG])"
|
15966 |
|
|
"rep{%;} stosq"
|
15967 |
|
|
[(set_attr "type" "str")
|
15968 |
|
|
(set_attr "prefix_rep" "1")
|
15969 |
|
|
(set_attr "memory" "store")
|
15970 |
|
|
(set_attr "mode" "DI")])
|
15971 |
|
|
|
15972 |
|
|
(define_insn "*rep_stossi"
|
15973 |
|
|
[(set (match_operand:P 1 "register_operand" "=c") (const_int 0))
|
15974 |
|
|
(set (match_operand:P 0 "register_operand" "=D")
|
15975 |
|
|
(plus:P (ashift:P (match_operand:P 4 "register_operand" "1")
|
15976 |
|
|
(const_int 2))
|
15977 |
|
|
(match_operand:P 3 "register_operand" "0")))
|
15978 |
|
|
(set (mem:BLK (match_dup 3))
|
15979 |
|
|
(const_int 0))
|
15980 |
|
|
(use (match_operand:SI 2 "register_operand" "a"))
|
15981 |
|
|
(use (match_dup 4))]
|
15982 |
|
|
"!(fixed_regs[AX_REG] || fixed_regs[CX_REG] || fixed_regs[DI_REG])"
|
15983 |
|
|
"rep{%;} stos{l|d}"
|
15984 |
|
|
[(set_attr "type" "str")
|
15985 |
|
|
(set_attr "prefix_rep" "1")
|
15986 |
|
|
(set_attr "memory" "store")
|
15987 |
|
|
(set_attr "mode" "SI")])
|
15988 |
|
|
|
15989 |
|
|
(define_insn "*rep_stosqi"
|
15990 |
|
|
[(set (match_operand:P 1 "register_operand" "=c") (const_int 0))
|
15991 |
|
|
(set (match_operand:P 0 "register_operand" "=D")
|
15992 |
|
|
(plus:P (match_operand:P 3 "register_operand" "0")
|
15993 |
|
|
(match_operand:P 4 "register_operand" "1")))
|
15994 |
|
|
(set (mem:BLK (match_dup 3))
|
15995 |
|
|
(const_int 0))
|
15996 |
|
|
(use (match_operand:QI 2 "register_operand" "a"))
|
15997 |
|
|
(use (match_dup 4))]
|
15998 |
|
|
"!(fixed_regs[AX_REG] || fixed_regs[CX_REG] || fixed_regs[DI_REG])"
|
15999 |
|
|
"rep{%;} stosb"
|
16000 |
|
|
[(set_attr "type" "str")
|
16001 |
|
|
(set_attr "prefix_rep" "1")
|
16002 |
|
|
(set_attr "memory" "store")
|
16003 |
|
|
(set (attr "prefix_rex")
|
16004 |
|
|
(if_then_else
|
16005 |
|
|
(match_test "mode == DImode")
|
16006 |
|
|
(const_string "0")
|
16007 |
|
|
(const_string "*")))
|
16008 |
|
|
(set_attr "mode" "QI")])
|
16009 |
|
|
|
16010 |
|
|
(define_expand "cmpstrnsi"
|
16011 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
16012 |
|
|
(compare:SI (match_operand:BLK 1 "general_operand" "")
|
16013 |
|
|
(match_operand:BLK 2 "general_operand" "")))
|
16014 |
|
|
(use (match_operand 3 "general_operand" ""))
|
16015 |
|
|
(use (match_operand 4 "immediate_operand" ""))]
|
16016 |
|
|
""
|
16017 |
|
|
{
|
16018 |
|
|
rtx addr1, addr2, out, outlow, count, countreg, align;
|
16019 |
|
|
|
16020 |
|
|
if (optimize_insn_for_size_p () && !TARGET_INLINE_ALL_STRINGOPS)
|
16021 |
|
|
FAIL;
|
16022 |
|
|
|
16023 |
|
|
/* Can't use this if the user has appropriated ecx, esi or edi. */
|
16024 |
|
|
if (fixed_regs[CX_REG] || fixed_regs[SI_REG] || fixed_regs[DI_REG])
|
16025 |
|
|
FAIL;
|
16026 |
|
|
|
16027 |
|
|
out = operands[0];
|
16028 |
|
|
if (!REG_P (out))
|
16029 |
|
|
out = gen_reg_rtx (SImode);
|
16030 |
|
|
|
16031 |
|
|
addr1 = copy_to_mode_reg (Pmode, XEXP (operands[1], 0));
|
16032 |
|
|
addr2 = copy_to_mode_reg (Pmode, XEXP (operands[2], 0));
|
16033 |
|
|
if (addr1 != XEXP (operands[1], 0))
|
16034 |
|
|
operands[1] = replace_equiv_address_nv (operands[1], addr1);
|
16035 |
|
|
if (addr2 != XEXP (operands[2], 0))
|
16036 |
|
|
operands[2] = replace_equiv_address_nv (operands[2], addr2);
|
16037 |
|
|
|
16038 |
|
|
count = operands[3];
|
16039 |
|
|
countreg = ix86_zero_extend_to_Pmode (count);
|
16040 |
|
|
|
16041 |
|
|
/* %%% Iff we are testing strict equality, we can use known alignment
|
16042 |
|
|
to good advantage. This may be possible with combine, particularly
|
16043 |
|
|
once cc0 is dead. */
|
16044 |
|
|
align = operands[4];
|
16045 |
|
|
|
16046 |
|
|
if (CONST_INT_P (count))
|
16047 |
|
|
{
|
16048 |
|
|
if (INTVAL (count) == 0)
|
16049 |
|
|
{
|
16050 |
|
|
emit_move_insn (operands[0], const0_rtx);
|
16051 |
|
|
DONE;
|
16052 |
|
|
}
|
16053 |
|
|
emit_insn (gen_cmpstrnqi_nz_1 (addr1, addr2, countreg, align,
|
16054 |
|
|
operands[1], operands[2]));
|
16055 |
|
|
}
|
16056 |
|
|
else
|
16057 |
|
|
{
|
16058 |
|
|
rtx (*gen_cmp) (rtx, rtx);
|
16059 |
|
|
|
16060 |
|
|
gen_cmp = (TARGET_64BIT
|
16061 |
|
|
? gen_cmpdi_1 : gen_cmpsi_1);
|
16062 |
|
|
|
16063 |
|
|
emit_insn (gen_cmp (countreg, countreg));
|
16064 |
|
|
emit_insn (gen_cmpstrnqi_1 (addr1, addr2, countreg, align,
|
16065 |
|
|
operands[1], operands[2]));
|
16066 |
|
|
}
|
16067 |
|
|
|
16068 |
|
|
outlow = gen_lowpart (QImode, out);
|
16069 |
|
|
emit_insn (gen_cmpintqi (outlow));
|
16070 |
|
|
emit_move_insn (out, gen_rtx_SIGN_EXTEND (SImode, outlow));
|
16071 |
|
|
|
16072 |
|
|
if (operands[0] != out)
|
16073 |
|
|
emit_move_insn (operands[0], out);
|
16074 |
|
|
|
16075 |
|
|
DONE;
|
16076 |
|
|
})
|
16077 |
|
|
|
16078 |
|
|
;; Produce a tri-state integer (-1, 0, 1) from condition codes.
|
16079 |
|
|
|
16080 |
|
|
(define_expand "cmpintqi"
|
16081 |
|
|
[(set (match_dup 1)
|
16082 |
|
|
(gtu:QI (reg:CC FLAGS_REG) (const_int 0)))
|
16083 |
|
|
(set (match_dup 2)
|
16084 |
|
|
(ltu:QI (reg:CC FLAGS_REG) (const_int 0)))
|
16085 |
|
|
(parallel [(set (match_operand:QI 0 "register_operand" "")
|
16086 |
|
|
(minus:QI (match_dup 1)
|
16087 |
|
|
(match_dup 2)))
|
16088 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
16089 |
|
|
""
|
16090 |
|
|
{
|
16091 |
|
|
operands[1] = gen_reg_rtx (QImode);
|
16092 |
|
|
operands[2] = gen_reg_rtx (QImode);
|
16093 |
|
|
})
|
16094 |
|
|
|
16095 |
|
|
;; memcmp recognizers. The `cmpsb' opcode does nothing if the count is
|
16096 |
|
|
;; zero. Emit extra code to make sure that a zero-length compare is EQ.
|
16097 |
|
|
|
16098 |
|
|
(define_expand "cmpstrnqi_nz_1"
|
16099 |
|
|
[(parallel [(set (reg:CC FLAGS_REG)
|
16100 |
|
|
(compare:CC (match_operand 4 "memory_operand" "")
|
16101 |
|
|
(match_operand 5 "memory_operand" "")))
|
16102 |
|
|
(use (match_operand 2 "register_operand" ""))
|
16103 |
|
|
(use (match_operand:SI 3 "immediate_operand" ""))
|
16104 |
|
|
(clobber (match_operand 0 "register_operand" ""))
|
16105 |
|
|
(clobber (match_operand 1 "register_operand" ""))
|
16106 |
|
|
(clobber (match_dup 2))])]
|
16107 |
|
|
""
|
16108 |
|
|
"ix86_current_function_needs_cld = 1;")
|
16109 |
|
|
|
16110 |
|
|
(define_insn "*cmpstrnqi_nz_1"
|
16111 |
|
|
[(set (reg:CC FLAGS_REG)
|
16112 |
|
|
(compare:CC (mem:BLK (match_operand:P 4 "register_operand" "0"))
|
16113 |
|
|
(mem:BLK (match_operand:P 5 "register_operand" "1"))))
|
16114 |
|
|
(use (match_operand:P 6 "register_operand" "2"))
|
16115 |
|
|
(use (match_operand:SI 3 "immediate_operand" "i"))
|
16116 |
|
|
(clobber (match_operand:P 0 "register_operand" "=S"))
|
16117 |
|
|
(clobber (match_operand:P 1 "register_operand" "=D"))
|
16118 |
|
|
(clobber (match_operand:P 2 "register_operand" "=c"))]
|
16119 |
|
|
"!(fixed_regs[CX_REG] || fixed_regs[SI_REG] || fixed_regs[DI_REG])"
|
16120 |
|
|
"repz{%;} cmpsb"
|
16121 |
|
|
[(set_attr "type" "str")
|
16122 |
|
|
(set_attr "mode" "QI")
|
16123 |
|
|
(set (attr "prefix_rex")
|
16124 |
|
|
(if_then_else
|
16125 |
|
|
(match_test "mode == DImode")
|
16126 |
|
|
(const_string "0")
|
16127 |
|
|
(const_string "*")))
|
16128 |
|
|
(set_attr "prefix_rep" "1")])
|
16129 |
|
|
|
16130 |
|
|
;; The same, but the count is not known to not be zero.
|
16131 |
|
|
|
16132 |
|
|
(define_expand "cmpstrnqi_1"
|
16133 |
|
|
[(parallel [(set (reg:CC FLAGS_REG)
|
16134 |
|
|
(if_then_else:CC (ne (match_operand 2 "register_operand" "")
|
16135 |
|
|
(const_int 0))
|
16136 |
|
|
(compare:CC (match_operand 4 "memory_operand" "")
|
16137 |
|
|
(match_operand 5 "memory_operand" ""))
|
16138 |
|
|
(const_int 0)))
|
16139 |
|
|
(use (match_operand:SI 3 "immediate_operand" ""))
|
16140 |
|
|
(use (reg:CC FLAGS_REG))
|
16141 |
|
|
(clobber (match_operand 0 "register_operand" ""))
|
16142 |
|
|
(clobber (match_operand 1 "register_operand" ""))
|
16143 |
|
|
(clobber (match_dup 2))])]
|
16144 |
|
|
""
|
16145 |
|
|
"ix86_current_function_needs_cld = 1;")
|
16146 |
|
|
|
16147 |
|
|
(define_insn "*cmpstrnqi_1"
|
16148 |
|
|
[(set (reg:CC FLAGS_REG)
|
16149 |
|
|
(if_then_else:CC (ne (match_operand:P 6 "register_operand" "2")
|
16150 |
|
|
(const_int 0))
|
16151 |
|
|
(compare:CC (mem:BLK (match_operand:P 4 "register_operand" "0"))
|
16152 |
|
|
(mem:BLK (match_operand:P 5 "register_operand" "1")))
|
16153 |
|
|
(const_int 0)))
|
16154 |
|
|
(use (match_operand:SI 3 "immediate_operand" "i"))
|
16155 |
|
|
(use (reg:CC FLAGS_REG))
|
16156 |
|
|
(clobber (match_operand:P 0 "register_operand" "=S"))
|
16157 |
|
|
(clobber (match_operand:P 1 "register_operand" "=D"))
|
16158 |
|
|
(clobber (match_operand:P 2 "register_operand" "=c"))]
|
16159 |
|
|
"!(fixed_regs[CX_REG] || fixed_regs[SI_REG] || fixed_regs[DI_REG])"
|
16160 |
|
|
"repz{%;} cmpsb"
|
16161 |
|
|
[(set_attr "type" "str")
|
16162 |
|
|
(set_attr "mode" "QI")
|
16163 |
|
|
(set (attr "prefix_rex")
|
16164 |
|
|
(if_then_else
|
16165 |
|
|
(match_test "mode == DImode")
|
16166 |
|
|
(const_string "0")
|
16167 |
|
|
(const_string "*")))
|
16168 |
|
|
(set_attr "prefix_rep" "1")])
|
16169 |
|
|
|
16170 |
|
|
(define_expand "strlen"
|
16171 |
|
|
[(set (match_operand:P 0 "register_operand" "")
|
16172 |
|
|
(unspec:P [(match_operand:BLK 1 "general_operand" "")
|
16173 |
|
|
(match_operand:QI 2 "immediate_operand" "")
|
16174 |
|
|
(match_operand 3 "immediate_operand" "")]
|
16175 |
|
|
UNSPEC_SCAS))]
|
16176 |
|
|
""
|
16177 |
|
|
{
|
16178 |
|
|
if (ix86_expand_strlen (operands[0], operands[1], operands[2], operands[3]))
|
16179 |
|
|
DONE;
|
16180 |
|
|
else
|
16181 |
|
|
FAIL;
|
16182 |
|
|
})
|
16183 |
|
|
|
16184 |
|
|
(define_expand "strlenqi_1"
|
16185 |
|
|
[(parallel [(set (match_operand 0 "register_operand" "")
|
16186 |
|
|
(match_operand 2 "" ""))
|
16187 |
|
|
(clobber (match_operand 1 "register_operand" ""))
|
16188 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
16189 |
|
|
""
|
16190 |
|
|
"ix86_current_function_needs_cld = 1;")
|
16191 |
|
|
|
16192 |
|
|
(define_insn "*strlenqi_1"
|
16193 |
|
|
[(set (match_operand:P 0 "register_operand" "=&c")
|
16194 |
|
|
(unspec:P [(mem:BLK (match_operand:P 5 "register_operand" "1"))
|
16195 |
|
|
(match_operand:QI 2 "register_operand" "a")
|
16196 |
|
|
(match_operand:P 3 "immediate_operand" "i")
|
16197 |
|
|
(match_operand:P 4 "register_operand" "0")] UNSPEC_SCAS))
|
16198 |
|
|
(clobber (match_operand:P 1 "register_operand" "=D"))
|
16199 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
16200 |
|
|
"!(fixed_regs[AX_REG] || fixed_regs[CX_REG] || fixed_regs[DI_REG])"
|
16201 |
|
|
"repnz{%;} scasb"
|
16202 |
|
|
[(set_attr "type" "str")
|
16203 |
|
|
(set_attr "mode" "QI")
|
16204 |
|
|
(set (attr "prefix_rex")
|
16205 |
|
|
(if_then_else
|
16206 |
|
|
(match_test "mode == DImode")
|
16207 |
|
|
(const_string "0")
|
16208 |
|
|
(const_string "*")))
|
16209 |
|
|
(set_attr "prefix_rep" "1")])
|
16210 |
|
|
|
16211 |
|
|
;; Peephole optimizations to clean up after cmpstrn*. This should be
|
16212 |
|
|
;; handled in combine, but it is not currently up to the task.
|
16213 |
|
|
;; When used for their truth value, the cmpstrn* expanders generate
|
16214 |
|
|
;; code like this:
|
16215 |
|
|
;;
|
16216 |
|
|
;; repz cmpsb
|
16217 |
|
|
;; seta %al
|
16218 |
|
|
;; setb %dl
|
16219 |
|
|
;; cmpb %al, %dl
|
16220 |
|
|
;; jcc label
|
16221 |
|
|
;;
|
16222 |
|
|
;; The intermediate three instructions are unnecessary.
|
16223 |
|
|
|
16224 |
|
|
;; This one handles cmpstrn*_nz_1...
|
16225 |
|
|
(define_peephole2
|
16226 |
|
|
[(parallel[
|
16227 |
|
|
(set (reg:CC FLAGS_REG)
|
16228 |
|
|
(compare:CC (mem:BLK (match_operand 4 "register_operand" ""))
|
16229 |
|
|
(mem:BLK (match_operand 5 "register_operand" ""))))
|
16230 |
|
|
(use (match_operand 6 "register_operand" ""))
|
16231 |
|
|
(use (match_operand:SI 3 "immediate_operand" ""))
|
16232 |
|
|
(clobber (match_operand 0 "register_operand" ""))
|
16233 |
|
|
(clobber (match_operand 1 "register_operand" ""))
|
16234 |
|
|
(clobber (match_operand 2 "register_operand" ""))])
|
16235 |
|
|
(set (match_operand:QI 7 "register_operand" "")
|
16236 |
|
|
(gtu:QI (reg:CC FLAGS_REG) (const_int 0)))
|
16237 |
|
|
(set (match_operand:QI 8 "register_operand" "")
|
16238 |
|
|
(ltu:QI (reg:CC FLAGS_REG) (const_int 0)))
|
16239 |
|
|
(set (reg FLAGS_REG)
|
16240 |
|
|
(compare (match_dup 7) (match_dup 8)))
|
16241 |
|
|
]
|
16242 |
|
|
"peep2_reg_dead_p (4, operands[7]) && peep2_reg_dead_p (4, operands[8])"
|
16243 |
|
|
[(parallel[
|
16244 |
|
|
(set (reg:CC FLAGS_REG)
|
16245 |
|
|
(compare:CC (mem:BLK (match_dup 4))
|
16246 |
|
|
(mem:BLK (match_dup 5))))
|
16247 |
|
|
(use (match_dup 6))
|
16248 |
|
|
(use (match_dup 3))
|
16249 |
|
|
(clobber (match_dup 0))
|
16250 |
|
|
(clobber (match_dup 1))
|
16251 |
|
|
(clobber (match_dup 2))])])
|
16252 |
|
|
|
16253 |
|
|
;; ...and this one handles cmpstrn*_1.
|
16254 |
|
|
(define_peephole2
|
16255 |
|
|
[(parallel[
|
16256 |
|
|
(set (reg:CC FLAGS_REG)
|
16257 |
|
|
(if_then_else:CC (ne (match_operand 6 "register_operand" "")
|
16258 |
|
|
(const_int 0))
|
16259 |
|
|
(compare:CC (mem:BLK (match_operand 4 "register_operand" ""))
|
16260 |
|
|
(mem:BLK (match_operand 5 "register_operand" "")))
|
16261 |
|
|
(const_int 0)))
|
16262 |
|
|
(use (match_operand:SI 3 "immediate_operand" ""))
|
16263 |
|
|
(use (reg:CC FLAGS_REG))
|
16264 |
|
|
(clobber (match_operand 0 "register_operand" ""))
|
16265 |
|
|
(clobber (match_operand 1 "register_operand" ""))
|
16266 |
|
|
(clobber (match_operand 2 "register_operand" ""))])
|
16267 |
|
|
(set (match_operand:QI 7 "register_operand" "")
|
16268 |
|
|
(gtu:QI (reg:CC FLAGS_REG) (const_int 0)))
|
16269 |
|
|
(set (match_operand:QI 8 "register_operand" "")
|
16270 |
|
|
(ltu:QI (reg:CC FLAGS_REG) (const_int 0)))
|
16271 |
|
|
(set (reg FLAGS_REG)
|
16272 |
|
|
(compare (match_dup 7) (match_dup 8)))
|
16273 |
|
|
]
|
16274 |
|
|
"peep2_reg_dead_p (4, operands[7]) && peep2_reg_dead_p (4, operands[8])"
|
16275 |
|
|
[(parallel[
|
16276 |
|
|
(set (reg:CC FLAGS_REG)
|
16277 |
|
|
(if_then_else:CC (ne (match_dup 6)
|
16278 |
|
|
(const_int 0))
|
16279 |
|
|
(compare:CC (mem:BLK (match_dup 4))
|
16280 |
|
|
(mem:BLK (match_dup 5)))
|
16281 |
|
|
(const_int 0)))
|
16282 |
|
|
(use (match_dup 3))
|
16283 |
|
|
(use (reg:CC FLAGS_REG))
|
16284 |
|
|
(clobber (match_dup 0))
|
16285 |
|
|
(clobber (match_dup 1))
|
16286 |
|
|
(clobber (match_dup 2))])])
|
16287 |
|
|
|
16288 |
|
|
;; Conditional move instructions.
|
16289 |
|
|
|
16290 |
|
|
(define_expand "movcc"
|
16291 |
|
|
[(set (match_operand:SWIM 0 "register_operand" "")
|
16292 |
|
|
(if_then_else:SWIM (match_operand 1 "ordered_comparison_operator" "")
|
16293 |
|
|
(match_operand:SWIM 2 "" "")
|
16294 |
|
|
(match_operand:SWIM 3 "" "")))]
|
16295 |
|
|
""
|
16296 |
|
|
"if (ix86_expand_int_movcc (operands)) DONE; else FAIL;")
|
16297 |
|
|
|
16298 |
|
|
;; Data flow gets confused by our desire for `sbbl reg,reg', and clearing
|
16299 |
|
|
;; the register first winds up with `sbbl $0,reg', which is also weird.
|
16300 |
|
|
;; So just document what we're doing explicitly.
|
16301 |
|
|
|
16302 |
|
|
(define_expand "x86_movcc_0_m1"
|
16303 |
|
|
[(parallel
|
16304 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
16305 |
|
|
(if_then_else:SWI48
|
16306 |
|
|
(match_operator:SWI48 2 "ix86_carry_flag_operator"
|
16307 |
|
|
[(match_operand 1 "flags_reg_operand" "")
|
16308 |
|
|
(const_int 0)])
|
16309 |
|
|
(const_int -1)
|
16310 |
|
|
(const_int 0)))
|
16311 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
16312 |
|
|
|
16313 |
|
|
(define_insn "*x86_movcc_0_m1"
|
16314 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
16315 |
|
|
(if_then_else:SWI48 (match_operator 1 "ix86_carry_flag_operator"
|
16316 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
16317 |
|
|
(const_int -1)
|
16318 |
|
|
(const_int 0)))
|
16319 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
16320 |
|
|
""
|
16321 |
|
|
"sbb{}\t%0, %0"
|
16322 |
|
|
; Since we don't have the proper number of operands for an alu insn,
|
16323 |
|
|
; fill in all the blanks.
|
16324 |
|
|
[(set_attr "type" "alu")
|
16325 |
|
|
(set_attr "use_carry" "1")
|
16326 |
|
|
(set_attr "pent_pair" "pu")
|
16327 |
|
|
(set_attr "memory" "none")
|
16328 |
|
|
(set_attr "imm_disp" "false")
|
16329 |
|
|
(set_attr "mode" "")
|
16330 |
|
|
(set_attr "length_immediate" "0")])
|
16331 |
|
|
|
16332 |
|
|
(define_insn "*x86_movcc_0_m1_se"
|
16333 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
16334 |
|
|
(sign_extract:SWI48 (match_operator 1 "ix86_carry_flag_operator"
|
16335 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
16336 |
|
|
(const_int 1)
|
16337 |
|
|
(const_int 0)))
|
16338 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
16339 |
|
|
""
|
16340 |
|
|
"sbb{}\t%0, %0"
|
16341 |
|
|
[(set_attr "type" "alu")
|
16342 |
|
|
(set_attr "use_carry" "1")
|
16343 |
|
|
(set_attr "pent_pair" "pu")
|
16344 |
|
|
(set_attr "memory" "none")
|
16345 |
|
|
(set_attr "imm_disp" "false")
|
16346 |
|
|
(set_attr "mode" "")
|
16347 |
|
|
(set_attr "length_immediate" "0")])
|
16348 |
|
|
|
16349 |
|
|
(define_insn "*x86_movcc_0_m1_neg"
|
16350 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
16351 |
|
|
(neg:SWI48 (match_operator 1 "ix86_carry_flag_operator"
|
16352 |
|
|
[(reg FLAGS_REG) (const_int 0)])))]
|
16353 |
|
|
""
|
16354 |
|
|
"sbb{}\t%0, %0"
|
16355 |
|
|
[(set_attr "type" "alu")
|
16356 |
|
|
(set_attr "use_carry" "1")
|
16357 |
|
|
(set_attr "pent_pair" "pu")
|
16358 |
|
|
(set_attr "memory" "none")
|
16359 |
|
|
(set_attr "imm_disp" "false")
|
16360 |
|
|
(set_attr "mode" "")
|
16361 |
|
|
(set_attr "length_immediate" "0")])
|
16362 |
|
|
|
16363 |
|
|
(define_insn "*movcc_noc"
|
16364 |
|
|
[(set (match_operand:SWI248 0 "register_operand" "=r,r")
|
16365 |
|
|
(if_then_else:SWI248 (match_operator 1 "ix86_comparison_operator"
|
16366 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
16367 |
|
|
(match_operand:SWI248 2 "nonimmediate_operand" "rm,0")
|
16368 |
|
|
(match_operand:SWI248 3 "nonimmediate_operand" "0,rm")))]
|
16369 |
|
|
"TARGET_CMOVE && !(MEM_P (operands[2]) && MEM_P (operands[3]))"
|
16370 |
|
|
"@
|
16371 |
|
|
cmov%O2%C1\t{%2, %0|%0, %2}
|
16372 |
|
|
cmov%O2%c1\t{%3, %0|%0, %3}"
|
16373 |
|
|
[(set_attr "type" "icmov")
|
16374 |
|
|
(set_attr "mode" "")])
|
16375 |
|
|
|
16376 |
|
|
(define_insn_and_split "*movqicc_noc"
|
16377 |
|
|
[(set (match_operand:QI 0 "register_operand" "=r,r")
|
16378 |
|
|
(if_then_else:QI (match_operator 1 "ix86_comparison_operator"
|
16379 |
|
|
[(match_operand 4 "flags_reg_operand" "")
|
16380 |
|
|
(const_int 0)])
|
16381 |
|
|
(match_operand:QI 2 "register_operand" "r,0")
|
16382 |
|
|
(match_operand:QI 3 "register_operand" "0,r")))]
|
16383 |
|
|
"TARGET_CMOVE && !TARGET_PARTIAL_REG_STALL"
|
16384 |
|
|
"#"
|
16385 |
|
|
"&& reload_completed"
|
16386 |
|
|
[(set (match_dup 0)
|
16387 |
|
|
(if_then_else:SI (match_op_dup 1 [(match_dup 4) (const_int 0)])
|
16388 |
|
|
(match_dup 2)
|
16389 |
|
|
(match_dup 3)))]
|
16390 |
|
|
"operands[0] = gen_lowpart (SImode, operands[0]);
|
16391 |
|
|
operands[2] = gen_lowpart (SImode, operands[2]);
|
16392 |
|
|
operands[3] = gen_lowpart (SImode, operands[3]);"
|
16393 |
|
|
[(set_attr "type" "icmov")
|
16394 |
|
|
(set_attr "mode" "SI")])
|
16395 |
|
|
|
16396 |
|
|
(define_expand "movcc"
|
16397 |
|
|
[(set (match_operand:X87MODEF 0 "register_operand" "")
|
16398 |
|
|
(if_then_else:X87MODEF
|
16399 |
|
|
(match_operand 1 "ix86_fp_comparison_operator" "")
|
16400 |
|
|
(match_operand:X87MODEF 2 "register_operand" "")
|
16401 |
|
|
(match_operand:X87MODEF 3 "register_operand" "")))]
|
16402 |
|
|
"(TARGET_80387 && TARGET_CMOVE)
|
16403 |
|
|
|| (SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH)"
|
16404 |
|
|
"if (ix86_expand_fp_movcc (operands)) DONE; else FAIL;")
|
16405 |
|
|
|
16406 |
|
|
(define_insn "*movxfcc_1"
|
16407 |
|
|
[(set (match_operand:XF 0 "register_operand" "=f,f")
|
16408 |
|
|
(if_then_else:XF (match_operator 1 "fcmov_comparison_operator"
|
16409 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
16410 |
|
|
(match_operand:XF 2 "register_operand" "f,0")
|
16411 |
|
|
(match_operand:XF 3 "register_operand" "0,f")))]
|
16412 |
|
|
"TARGET_80387 && TARGET_CMOVE"
|
16413 |
|
|
"@
|
16414 |
|
|
fcmov%F1\t{%2, %0|%0, %2}
|
16415 |
|
|
fcmov%f1\t{%3, %0|%0, %3}"
|
16416 |
|
|
[(set_attr "type" "fcmov")
|
16417 |
|
|
(set_attr "mode" "XF")])
|
16418 |
|
|
|
16419 |
|
|
(define_insn "*movdfcc_1_rex64"
|
16420 |
|
|
[(set (match_operand:DF 0 "register_operand" "=f,f,r,r")
|
16421 |
|
|
(if_then_else:DF (match_operator 1 "fcmov_comparison_operator"
|
16422 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
16423 |
|
|
(match_operand:DF 2 "nonimmediate_operand" "f,0,rm,0")
|
16424 |
|
|
(match_operand:DF 3 "nonimmediate_operand" "0,f,0,rm")))]
|
16425 |
|
|
"TARGET_64BIT && TARGET_80387 && TARGET_CMOVE
|
16426 |
|
|
&& !(MEM_P (operands[2]) && MEM_P (operands[3]))"
|
16427 |
|
|
"@
|
16428 |
|
|
fcmov%F1\t{%2, %0|%0, %2}
|
16429 |
|
|
fcmov%f1\t{%3, %0|%0, %3}
|
16430 |
|
|
cmov%O2%C1\t{%2, %0|%0, %2}
|
16431 |
|
|
cmov%O2%c1\t{%3, %0|%0, %3}"
|
16432 |
|
|
[(set_attr "type" "fcmov,fcmov,icmov,icmov")
|
16433 |
|
|
(set_attr "mode" "DF,DF,DI,DI")])
|
16434 |
|
|
|
16435 |
|
|
(define_insn "*movdfcc_1"
|
16436 |
|
|
[(set (match_operand:DF 0 "register_operand" "=f,f,&r,&r")
|
16437 |
|
|
(if_then_else:DF (match_operator 1 "fcmov_comparison_operator"
|
16438 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
16439 |
|
|
(match_operand:DF 2 "nonimmediate_operand" "f,0,rm,0")
|
16440 |
|
|
(match_operand:DF 3 "nonimmediate_operand" "0,f,0,rm")))]
|
16441 |
|
|
"!TARGET_64BIT && TARGET_80387 && TARGET_CMOVE
|
16442 |
|
|
&& !(MEM_P (operands[2]) && MEM_P (operands[3]))"
|
16443 |
|
|
"@
|
16444 |
|
|
fcmov%F1\t{%2, %0|%0, %2}
|
16445 |
|
|
fcmov%f1\t{%3, %0|%0, %3}
|
16446 |
|
|
#
|
16447 |
|
|
#"
|
16448 |
|
|
[(set_attr "type" "fcmov,fcmov,multi,multi")
|
16449 |
|
|
(set_attr "mode" "DF,DF,DI,DI")])
|
16450 |
|
|
|
16451 |
|
|
(define_split
|
16452 |
|
|
[(set (match_operand:DF 0 "register_and_not_any_fp_reg_operand" "")
|
16453 |
|
|
(if_then_else:DF (match_operator 1 "fcmov_comparison_operator"
|
16454 |
|
|
[(match_operand 4 "flags_reg_operand" "")
|
16455 |
|
|
(const_int 0)])
|
16456 |
|
|
(match_operand:DF 2 "nonimmediate_operand" "")
|
16457 |
|
|
(match_operand:DF 3 "nonimmediate_operand" "")))]
|
16458 |
|
|
"!TARGET_64BIT && reload_completed"
|
16459 |
|
|
[(set (match_dup 2)
|
16460 |
|
|
(if_then_else:SI (match_op_dup 1 [(match_dup 4) (const_int 0)])
|
16461 |
|
|
(match_dup 5)
|
16462 |
|
|
(match_dup 6)))
|
16463 |
|
|
(set (match_dup 3)
|
16464 |
|
|
(if_then_else:SI (match_op_dup 1 [(match_dup 4) (const_int 0)])
|
16465 |
|
|
(match_dup 7)
|
16466 |
|
|
(match_dup 8)))]
|
16467 |
|
|
{
|
16468 |
|
|
split_double_mode (DImode, &operands[2], 2, &operands[5], &operands[7]);
|
16469 |
|
|
split_double_mode (DImode, &operands[0], 1, &operands[2], &operands[3]);
|
16470 |
|
|
})
|
16471 |
|
|
|
16472 |
|
|
(define_insn "*movsfcc_1_387"
|
16473 |
|
|
[(set (match_operand:SF 0 "register_operand" "=f,f,r,r")
|
16474 |
|
|
(if_then_else:SF (match_operator 1 "fcmov_comparison_operator"
|
16475 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
16476 |
|
|
(match_operand:SF 2 "nonimmediate_operand" "f,0,rm,0")
|
16477 |
|
|
(match_operand:SF 3 "nonimmediate_operand" "0,f,0,rm")))]
|
16478 |
|
|
"TARGET_80387 && TARGET_CMOVE
|
16479 |
|
|
&& !(MEM_P (operands[2]) && MEM_P (operands[3]))"
|
16480 |
|
|
"@
|
16481 |
|
|
fcmov%F1\t{%2, %0|%0, %2}
|
16482 |
|
|
fcmov%f1\t{%3, %0|%0, %3}
|
16483 |
|
|
cmov%O2%C1\t{%2, %0|%0, %2}
|
16484 |
|
|
cmov%O2%c1\t{%3, %0|%0, %3}"
|
16485 |
|
|
[(set_attr "type" "fcmov,fcmov,icmov,icmov")
|
16486 |
|
|
(set_attr "mode" "SF,SF,SI,SI")])
|
16487 |
|
|
|
16488 |
|
|
;; All moves in XOP pcmov instructions are 128 bits and hence we restrict
|
16489 |
|
|
;; the scalar versions to have only XMM registers as operands.
|
16490 |
|
|
|
16491 |
|
|
;; XOP conditional move
|
16492 |
|
|
(define_insn "*xop_pcmov_"
|
16493 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x")
|
16494 |
|
|
(if_then_else:MODEF
|
16495 |
|
|
(match_operand:MODEF 1 "register_operand" "x")
|
16496 |
|
|
(match_operand:MODEF 2 "register_operand" "x")
|
16497 |
|
|
(match_operand:MODEF 3 "register_operand" "x")))]
|
16498 |
|
|
"TARGET_XOP"
|
16499 |
|
|
"vpcmov\t{%1, %3, %2, %0|%0, %2, %3, %1}"
|
16500 |
|
|
[(set_attr "type" "sse4arg")])
|
16501 |
|
|
|
16502 |
|
|
;; These versions of the min/max patterns are intentionally ignorant of
|
16503 |
|
|
;; their behavior wrt -0.0 and NaN (via the commutative operand mark).
|
16504 |
|
|
;; Since both the tree-level MAX_EXPR and the rtl-level SMAX operator
|
16505 |
|
|
;; are undefined in this condition, we're certain this is correct.
|
16506 |
|
|
|
16507 |
|
|
(define_insn "3"
|
16508 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x,x")
|
16509 |
|
|
(smaxmin:MODEF
|
16510 |
|
|
(match_operand:MODEF 1 "nonimmediate_operand" "%0,x")
|
16511 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "xm,xm")))]
|
16512 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH"
|
16513 |
|
|
"@
|
16514 |
|
|
\t{%2, %0|%0, %2}
|
16515 |
|
|
v\t{%2, %1, %0|%0, %1, %2}"
|
16516 |
|
|
[(set_attr "isa" "noavx,avx")
|
16517 |
|
|
(set_attr "prefix" "orig,vex")
|
16518 |
|
|
(set_attr "type" "sseadd")
|
16519 |
|
|
(set_attr "mode" "")])
|
16520 |
|
|
|
16521 |
|
|
;; These versions of the min/max patterns implement exactly the operations
|
16522 |
|
|
;; min = (op1 < op2 ? op1 : op2)
|
16523 |
|
|
;; max = (!(op1 < op2) ? op1 : op2)
|
16524 |
|
|
;; Their operands are not commutative, and thus they may be used in the
|
16525 |
|
|
;; presence of -0.0 and NaN.
|
16526 |
|
|
|
16527 |
|
|
(define_insn "*ieee_smin3"
|
16528 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x,x")
|
16529 |
|
|
(unspec:MODEF
|
16530 |
|
|
[(match_operand:MODEF 1 "register_operand" "0,x")
|
16531 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "xm,xm")]
|
16532 |
|
|
UNSPEC_IEEE_MIN))]
|
16533 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH"
|
16534 |
|
|
"@
|
16535 |
|
|
min\t{%2, %0|%0, %2}
|
16536 |
|
|
vmin\t{%2, %1, %0|%0, %1, %2}"
|
16537 |
|
|
[(set_attr "isa" "noavx,avx")
|
16538 |
|
|
(set_attr "prefix" "orig,vex")
|
16539 |
|
|
(set_attr "type" "sseadd")
|
16540 |
|
|
(set_attr "mode" "")])
|
16541 |
|
|
|
16542 |
|
|
(define_insn "*ieee_smax3"
|
16543 |
|
|
[(set (match_operand:MODEF 0 "register_operand" "=x,x")
|
16544 |
|
|
(unspec:MODEF
|
16545 |
|
|
[(match_operand:MODEF 1 "register_operand" "0,x")
|
16546 |
|
|
(match_operand:MODEF 2 "nonimmediate_operand" "xm,xm")]
|
16547 |
|
|
UNSPEC_IEEE_MAX))]
|
16548 |
|
|
"SSE_FLOAT_MODE_P (mode) && TARGET_SSE_MATH"
|
16549 |
|
|
"@
|
16550 |
|
|
max\t{%2, %0|%0, %2}
|
16551 |
|
|
vmax\t{%2, %1, %0|%0, %1, %2}"
|
16552 |
|
|
[(set_attr "isa" "noavx,avx")
|
16553 |
|
|
(set_attr "prefix" "orig,vex")
|
16554 |
|
|
(set_attr "type" "sseadd")
|
16555 |
|
|
(set_attr "mode" "")])
|
16556 |
|
|
|
16557 |
|
|
;; Make two stack loads independent:
|
16558 |
|
|
;; fld aa fld aa
|
16559 |
|
|
;; fld %st(0) -> fld bb
|
16560 |
|
|
;; fmul bb fmul %st(1), %st
|
16561 |
|
|
;;
|
16562 |
|
|
;; Actually we only match the last two instructions for simplicity.
|
16563 |
|
|
(define_peephole2
|
16564 |
|
|
[(set (match_operand 0 "fp_register_operand" "")
|
16565 |
|
|
(match_operand 1 "fp_register_operand" ""))
|
16566 |
|
|
(set (match_dup 0)
|
16567 |
|
|
(match_operator 2 "binary_fp_operator"
|
16568 |
|
|
[(match_dup 0)
|
16569 |
|
|
(match_operand 3 "memory_operand" "")]))]
|
16570 |
|
|
"REGNO (operands[0]) != REGNO (operands[1])"
|
16571 |
|
|
[(set (match_dup 0) (match_dup 3))
|
16572 |
|
|
(set (match_dup 0) (match_dup 4))]
|
16573 |
|
|
|
16574 |
|
|
;; The % modifier is not operational anymore in peephole2's, so we have to
|
16575 |
|
|
;; swap the operands manually in the case of addition and multiplication.
|
16576 |
|
|
{
|
16577 |
|
|
rtx op0, op1;
|
16578 |
|
|
|
16579 |
|
|
if (COMMUTATIVE_ARITH_P (operands[2]))
|
16580 |
|
|
op0 = operands[0], op1 = operands[1];
|
16581 |
|
|
else
|
16582 |
|
|
op0 = operands[1], op1 = operands[0];
|
16583 |
|
|
|
16584 |
|
|
operands[4] = gen_rtx_fmt_ee (GET_CODE (operands[2]),
|
16585 |
|
|
GET_MODE (operands[2]),
|
16586 |
|
|
op0, op1);
|
16587 |
|
|
})
|
16588 |
|
|
|
16589 |
|
|
;; Conditional addition patterns
|
16590 |
|
|
(define_expand "addcc"
|
16591 |
|
|
[(match_operand:SWI 0 "register_operand" "")
|
16592 |
|
|
(match_operand 1 "ordered_comparison_operator" "")
|
16593 |
|
|
(match_operand:SWI 2 "register_operand" "")
|
16594 |
|
|
(match_operand:SWI 3 "const_int_operand" "")]
|
16595 |
|
|
""
|
16596 |
|
|
"if (ix86_expand_int_addcc (operands)) DONE; else FAIL;")
|
16597 |
|
|
|
16598 |
|
|
;; Misc patterns (?)
|
16599 |
|
|
|
16600 |
|
|
;; This pattern exists to put a dependency on all ebp-based memory accesses.
|
16601 |
|
|
;; Otherwise there will be nothing to keep
|
16602 |
|
|
;;
|
16603 |
|
|
;; [(set (reg ebp) (reg esp))]
|
16604 |
|
|
;; [(set (reg esp) (plus (reg esp) (const_int -160000)))
|
16605 |
|
|
;; (clobber (eflags)]
|
16606 |
|
|
;; [(set (mem (plus (reg ebp) (const_int -160000))) (const_int 0))]
|
16607 |
|
|
;;
|
16608 |
|
|
;; in proper program order.
|
16609 |
|
|
|
16610 |
|
|
(define_insn "pro_epilogue_adjust_stack__add"
|
16611 |
|
|
[(set (match_operand:P 0 "register_operand" "=r,r")
|
16612 |
|
|
(plus:P (match_operand:P 1 "register_operand" "0,r")
|
16613 |
|
|
(match_operand:P 2 "" "r,l")))
|
16614 |
|
|
(clobber (reg:CC FLAGS_REG))
|
16615 |
|
|
(clobber (mem:BLK (scratch)))]
|
16616 |
|
|
""
|
16617 |
|
|
{
|
16618 |
|
|
switch (get_attr_type (insn))
|
16619 |
|
|
{
|
16620 |
|
|
case TYPE_IMOV:
|
16621 |
|
|
return "mov{}\t{%1, %0|%0, %1}";
|
16622 |
|
|
|
16623 |
|
|
case TYPE_ALU:
|
16624 |
|
|
gcc_assert (rtx_equal_p (operands[0], operands[1]));
|
16625 |
|
|
if (x86_maybe_negate_const_int (&operands[2], mode))
|
16626 |
|
|
return "sub{}\t{%2, %0|%0, %2}";
|
16627 |
|
|
|
16628 |
|
|
return "add{}\t{%2, %0|%0, %2}";
|
16629 |
|
|
|
16630 |
|
|
default:
|
16631 |
|
|
operands[2] = SET_SRC (XVECEXP (PATTERN (insn), 0, 0));
|
16632 |
|
|
return "lea{}\t{%a2, %0|%0, %a2}";
|
16633 |
|
|
}
|
16634 |
|
|
}
|
16635 |
|
|
[(set (attr "type")
|
16636 |
|
|
(cond [(and (eq_attr "alternative" "0")
|
16637 |
|
|
(not (match_test "TARGET_OPT_AGU")))
|
16638 |
|
|
(const_string "alu")
|
16639 |
|
|
(match_operand: 2 "const0_operand" "")
|
16640 |
|
|
(const_string "imov")
|
16641 |
|
|
]
|
16642 |
|
|
(const_string "lea")))
|
16643 |
|
|
(set (attr "length_immediate")
|
16644 |
|
|
(cond [(eq_attr "type" "imov")
|
16645 |
|
|
(const_string "0")
|
16646 |
|
|
(and (eq_attr "type" "alu")
|
16647 |
|
|
(match_operand 2 "const128_operand" ""))
|
16648 |
|
|
(const_string "1")
|
16649 |
|
|
]
|
16650 |
|
|
(const_string "*")))
|
16651 |
|
|
(set_attr "mode" "")])
|
16652 |
|
|
|
16653 |
|
|
(define_insn "pro_epilogue_adjust_stack__sub"
|
16654 |
|
|
[(set (match_operand:P 0 "register_operand" "=r")
|
16655 |
|
|
(minus:P (match_operand:P 1 "register_operand" "0")
|
16656 |
|
|
(match_operand:P 2 "register_operand" "r")))
|
16657 |
|
|
(clobber (reg:CC FLAGS_REG))
|
16658 |
|
|
(clobber (mem:BLK (scratch)))]
|
16659 |
|
|
""
|
16660 |
|
|
"sub{}\t{%2, %0|%0, %2}"
|
16661 |
|
|
[(set_attr "type" "alu")
|
16662 |
|
|
(set_attr "mode" "")])
|
16663 |
|
|
|
16664 |
|
|
(define_insn "allocate_stack_worker_probe_"
|
16665 |
|
|
[(set (match_operand:P 0 "register_operand" "=a")
|
16666 |
|
|
(unspec_volatile:P [(match_operand:P 1 "register_operand" "0")]
|
16667 |
|
|
UNSPECV_STACK_PROBE))
|
16668 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
16669 |
|
|
"ix86_target_stack_probe ()"
|
16670 |
|
|
"call\t___chkstk_ms"
|
16671 |
|
|
[(set_attr "type" "multi")
|
16672 |
|
|
(set_attr "length" "5")])
|
16673 |
|
|
|
16674 |
|
|
(define_expand "allocate_stack"
|
16675 |
|
|
[(match_operand 0 "register_operand" "")
|
16676 |
|
|
(match_operand 1 "general_operand" "")]
|
16677 |
|
|
"ix86_target_stack_probe ()"
|
16678 |
|
|
{
|
16679 |
|
|
rtx x;
|
16680 |
|
|
|
16681 |
|
|
#ifndef CHECK_STACK_LIMIT
|
16682 |
|
|
#define CHECK_STACK_LIMIT 0
|
16683 |
|
|
#endif
|
16684 |
|
|
|
16685 |
|
|
if (CHECK_STACK_LIMIT && CONST_INT_P (operands[1])
|
16686 |
|
|
&& INTVAL (operands[1]) < CHECK_STACK_LIMIT)
|
16687 |
|
|
{
|
16688 |
|
|
x = expand_simple_binop (Pmode, MINUS, stack_pointer_rtx, operands[1],
|
16689 |
|
|
stack_pointer_rtx, 0, OPTAB_DIRECT);
|
16690 |
|
|
if (x != stack_pointer_rtx)
|
16691 |
|
|
emit_move_insn (stack_pointer_rtx, x);
|
16692 |
|
|
}
|
16693 |
|
|
else
|
16694 |
|
|
{
|
16695 |
|
|
x = copy_to_mode_reg (Pmode, operands[1]);
|
16696 |
|
|
if (TARGET_64BIT)
|
16697 |
|
|
emit_insn (gen_allocate_stack_worker_probe_di (x, x));
|
16698 |
|
|
else
|
16699 |
|
|
emit_insn (gen_allocate_stack_worker_probe_si (x, x));
|
16700 |
|
|
x = expand_simple_binop (Pmode, MINUS, stack_pointer_rtx, x,
|
16701 |
|
|
stack_pointer_rtx, 0, OPTAB_DIRECT);
|
16702 |
|
|
if (x != stack_pointer_rtx)
|
16703 |
|
|
emit_move_insn (stack_pointer_rtx, x);
|
16704 |
|
|
}
|
16705 |
|
|
|
16706 |
|
|
emit_move_insn (operands[0], virtual_stack_dynamic_rtx);
|
16707 |
|
|
DONE;
|
16708 |
|
|
})
|
16709 |
|
|
|
16710 |
|
|
;; Use IOR for stack probes, this is shorter.
|
16711 |
|
|
(define_expand "probe_stack"
|
16712 |
|
|
[(match_operand 0 "memory_operand" "")]
|
16713 |
|
|
""
|
16714 |
|
|
{
|
16715 |
|
|
rtx (*gen_ior3) (rtx, rtx, rtx);
|
16716 |
|
|
|
16717 |
|
|
gen_ior3 = (GET_MODE (operands[0]) == DImode
|
16718 |
|
|
? gen_iordi3 : gen_iorsi3);
|
16719 |
|
|
|
16720 |
|
|
emit_insn (gen_ior3 (operands[0], operands[0], const0_rtx));
|
16721 |
|
|
DONE;
|
16722 |
|
|
})
|
16723 |
|
|
|
16724 |
|
|
(define_insn "adjust_stack_and_probe"
|
16725 |
|
|
[(set (match_operand:P 0 "register_operand" "=r")
|
16726 |
|
|
(unspec_volatile:P [(match_operand:P 1 "register_operand" "0")]
|
16727 |
|
|
UNSPECV_PROBE_STACK_RANGE))
|
16728 |
|
|
(set (reg:P SP_REG)
|
16729 |
|
|
(minus:P (reg:P SP_REG) (match_operand:P 2 "const_int_operand" "n")))
|
16730 |
|
|
(clobber (reg:CC FLAGS_REG))
|
16731 |
|
|
(clobber (mem:BLK (scratch)))]
|
16732 |
|
|
""
|
16733 |
|
|
"* return output_adjust_stack_and_probe (operands[0]);"
|
16734 |
|
|
[(set_attr "type" "multi")])
|
16735 |
|
|
|
16736 |
|
|
(define_insn "probe_stack_range"
|
16737 |
|
|
[(set (match_operand:P 0 "register_operand" "=r")
|
16738 |
|
|
(unspec_volatile:P [(match_operand:P 1 "register_operand" "0")
|
16739 |
|
|
(match_operand:P 2 "const_int_operand" "n")]
|
16740 |
|
|
UNSPECV_PROBE_STACK_RANGE))
|
16741 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
16742 |
|
|
""
|
16743 |
|
|
"* return output_probe_stack_range (operands[0], operands[2]);"
|
16744 |
|
|
[(set_attr "type" "multi")])
|
16745 |
|
|
|
16746 |
|
|
(define_expand "builtin_setjmp_receiver"
|
16747 |
|
|
[(label_ref (match_operand 0 "" ""))]
|
16748 |
|
|
"!TARGET_64BIT && flag_pic"
|
16749 |
|
|
{
|
16750 |
|
|
#if TARGET_MACHO
|
16751 |
|
|
if (TARGET_MACHO)
|
16752 |
|
|
{
|
16753 |
|
|
rtx xops[3];
|
16754 |
|
|
rtx picreg = gen_rtx_REG (Pmode, PIC_OFFSET_TABLE_REGNUM);
|
16755 |
|
|
rtx label_rtx = gen_label_rtx ();
|
16756 |
|
|
emit_insn (gen_set_got_labelled (pic_offset_table_rtx, label_rtx));
|
16757 |
|
|
xops[0] = xops[1] = picreg;
|
16758 |
|
|
xops[2] = machopic_gen_offset (gen_rtx_LABEL_REF (SImode, label_rtx));
|
16759 |
|
|
ix86_expand_binary_operator (MINUS, SImode, xops);
|
16760 |
|
|
}
|
16761 |
|
|
else
|
16762 |
|
|
#endif
|
16763 |
|
|
emit_insn (gen_set_got (pic_offset_table_rtx));
|
16764 |
|
|
DONE;
|
16765 |
|
|
})
|
16766 |
|
|
|
16767 |
|
|
;; Avoid redundant prefixes by splitting HImode arithmetic to SImode.
|
16768 |
|
|
|
16769 |
|
|
(define_split
|
16770 |
|
|
[(set (match_operand 0 "register_operand" "")
|
16771 |
|
|
(match_operator 3 "promotable_binary_operator"
|
16772 |
|
|
[(match_operand 1 "register_operand" "")
|
16773 |
|
|
(match_operand 2 "aligned_operand" "")]))
|
16774 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
16775 |
|
|
"! TARGET_PARTIAL_REG_STALL && reload_completed
|
16776 |
|
|
&& ((GET_MODE (operands[0]) == HImode
|
16777 |
|
|
&& ((optimize_function_for_speed_p (cfun) && !TARGET_FAST_PREFIX)
|
16778 |
|
|
/* ??? next two lines just !satisfies_constraint_K (...) */
|
16779 |
|
|
|| !CONST_INT_P (operands[2])
|
16780 |
|
|
|| satisfies_constraint_K (operands[2])))
|
16781 |
|
|
|| (GET_MODE (operands[0]) == QImode
|
16782 |
|
|
&& (TARGET_PROMOTE_QImode || optimize_function_for_size_p (cfun))))"
|
16783 |
|
|
[(parallel [(set (match_dup 0)
|
16784 |
|
|
(match_op_dup 3 [(match_dup 1) (match_dup 2)]))
|
16785 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
16786 |
|
|
{
|
16787 |
|
|
operands[0] = gen_lowpart (SImode, operands[0]);
|
16788 |
|
|
operands[1] = gen_lowpart (SImode, operands[1]);
|
16789 |
|
|
if (GET_CODE (operands[3]) != ASHIFT)
|
16790 |
|
|
operands[2] = gen_lowpart (SImode, operands[2]);
|
16791 |
|
|
PUT_MODE (operands[3], SImode);
|
16792 |
|
|
})
|
16793 |
|
|
|
16794 |
|
|
; Promote the QImode tests, as i386 has encoding of the AND
|
16795 |
|
|
; instruction with 32-bit sign-extended immediate and thus the
|
16796 |
|
|
; instruction size is unchanged, except in the %eax case for
|
16797 |
|
|
; which it is increased by one byte, hence the ! optimize_size.
|
16798 |
|
|
(define_split
|
16799 |
|
|
[(set (match_operand 0 "flags_reg_operand" "")
|
16800 |
|
|
(match_operator 2 "compare_operator"
|
16801 |
|
|
[(and (match_operand 3 "aligned_operand" "")
|
16802 |
|
|
(match_operand 4 "const_int_operand" ""))
|
16803 |
|
|
(const_int 0)]))
|
16804 |
|
|
(set (match_operand 1 "register_operand" "")
|
16805 |
|
|
(and (match_dup 3) (match_dup 4)))]
|
16806 |
|
|
"! TARGET_PARTIAL_REG_STALL && reload_completed
|
16807 |
|
|
&& optimize_insn_for_speed_p ()
|
16808 |
|
|
&& ((GET_MODE (operands[1]) == HImode && ! TARGET_FAST_PREFIX)
|
16809 |
|
|
|| (GET_MODE (operands[1]) == QImode && TARGET_PROMOTE_QImode))
|
16810 |
|
|
/* Ensure that the operand will remain sign-extended immediate. */
|
16811 |
|
|
&& ix86_match_ccmode (insn, INTVAL (operands[4]) >= 0 ? CCNOmode : CCZmode)"
|
16812 |
|
|
[(parallel [(set (match_dup 0)
|
16813 |
|
|
(match_op_dup 2 [(and:SI (match_dup 3) (match_dup 4))
|
16814 |
|
|
(const_int 0)]))
|
16815 |
|
|
(set (match_dup 1)
|
16816 |
|
|
(and:SI (match_dup 3) (match_dup 4)))])]
|
16817 |
|
|
{
|
16818 |
|
|
operands[4]
|
16819 |
|
|
= gen_int_mode (INTVAL (operands[4])
|
16820 |
|
|
& GET_MODE_MASK (GET_MODE (operands[1])), SImode);
|
16821 |
|
|
operands[1] = gen_lowpart (SImode, operands[1]);
|
16822 |
|
|
operands[3] = gen_lowpart (SImode, operands[3]);
|
16823 |
|
|
})
|
16824 |
|
|
|
16825 |
|
|
; Don't promote the QImode tests, as i386 doesn't have encoding of
|
16826 |
|
|
; the TEST instruction with 32-bit sign-extended immediate and thus
|
16827 |
|
|
; the instruction size would at least double, which is not what we
|
16828 |
|
|
; want even with ! optimize_size.
|
16829 |
|
|
(define_split
|
16830 |
|
|
[(set (match_operand 0 "flags_reg_operand" "")
|
16831 |
|
|
(match_operator 1 "compare_operator"
|
16832 |
|
|
[(and (match_operand:HI 2 "aligned_operand" "")
|
16833 |
|
|
(match_operand:HI 3 "const_int_operand" ""))
|
16834 |
|
|
(const_int 0)]))]
|
16835 |
|
|
"! TARGET_PARTIAL_REG_STALL && reload_completed
|
16836 |
|
|
&& ! TARGET_FAST_PREFIX
|
16837 |
|
|
&& optimize_insn_for_speed_p ()
|
16838 |
|
|
/* Ensure that the operand will remain sign-extended immediate. */
|
16839 |
|
|
&& ix86_match_ccmode (insn, INTVAL (operands[3]) >= 0 ? CCNOmode : CCZmode)"
|
16840 |
|
|
[(set (match_dup 0)
|
16841 |
|
|
(match_op_dup 1 [(and:SI (match_dup 2) (match_dup 3))
|
16842 |
|
|
(const_int 0)]))]
|
16843 |
|
|
{
|
16844 |
|
|
operands[3]
|
16845 |
|
|
= gen_int_mode (INTVAL (operands[3])
|
16846 |
|
|
& GET_MODE_MASK (GET_MODE (operands[2])), SImode);
|
16847 |
|
|
operands[2] = gen_lowpart (SImode, operands[2]);
|
16848 |
|
|
})
|
16849 |
|
|
|
16850 |
|
|
(define_split
|
16851 |
|
|
[(set (match_operand 0 "register_operand" "")
|
16852 |
|
|
(neg (match_operand 1 "register_operand" "")))
|
16853 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
16854 |
|
|
"! TARGET_PARTIAL_REG_STALL && reload_completed
|
16855 |
|
|
&& (GET_MODE (operands[0]) == HImode
|
16856 |
|
|
|| (GET_MODE (operands[0]) == QImode
|
16857 |
|
|
&& (TARGET_PROMOTE_QImode
|
16858 |
|
|
|| optimize_insn_for_size_p ())))"
|
16859 |
|
|
[(parallel [(set (match_dup 0)
|
16860 |
|
|
(neg:SI (match_dup 1)))
|
16861 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
16862 |
|
|
{
|
16863 |
|
|
operands[0] = gen_lowpart (SImode, operands[0]);
|
16864 |
|
|
operands[1] = gen_lowpart (SImode, operands[1]);
|
16865 |
|
|
})
|
16866 |
|
|
|
16867 |
|
|
(define_split
|
16868 |
|
|
[(set (match_operand 0 "register_operand" "")
|
16869 |
|
|
(not (match_operand 1 "register_operand" "")))]
|
16870 |
|
|
"! TARGET_PARTIAL_REG_STALL && reload_completed
|
16871 |
|
|
&& (GET_MODE (operands[0]) == HImode
|
16872 |
|
|
|| (GET_MODE (operands[0]) == QImode
|
16873 |
|
|
&& (TARGET_PROMOTE_QImode
|
16874 |
|
|
|| optimize_insn_for_size_p ())))"
|
16875 |
|
|
[(set (match_dup 0)
|
16876 |
|
|
(not:SI (match_dup 1)))]
|
16877 |
|
|
{
|
16878 |
|
|
operands[0] = gen_lowpart (SImode, operands[0]);
|
16879 |
|
|
operands[1] = gen_lowpart (SImode, operands[1]);
|
16880 |
|
|
})
|
16881 |
|
|
|
16882 |
|
|
(define_split
|
16883 |
|
|
[(set (match_operand 0 "register_operand" "")
|
16884 |
|
|
(if_then_else (match_operator 1 "ordered_comparison_operator"
|
16885 |
|
|
[(reg FLAGS_REG) (const_int 0)])
|
16886 |
|
|
(match_operand 2 "register_operand" "")
|
16887 |
|
|
(match_operand 3 "register_operand" "")))]
|
16888 |
|
|
"! TARGET_PARTIAL_REG_STALL && TARGET_CMOVE
|
16889 |
|
|
&& (GET_MODE (operands[0]) == HImode
|
16890 |
|
|
|| (GET_MODE (operands[0]) == QImode
|
16891 |
|
|
&& (TARGET_PROMOTE_QImode
|
16892 |
|
|
|| optimize_insn_for_size_p ())))"
|
16893 |
|
|
[(set (match_dup 0)
|
16894 |
|
|
(if_then_else:SI (match_dup 1) (match_dup 2) (match_dup 3)))]
|
16895 |
|
|
{
|
16896 |
|
|
operands[0] = gen_lowpart (SImode, operands[0]);
|
16897 |
|
|
operands[2] = gen_lowpart (SImode, operands[2]);
|
16898 |
|
|
operands[3] = gen_lowpart (SImode, operands[3]);
|
16899 |
|
|
})
|
16900 |
|
|
|
16901 |
|
|
;; RTL Peephole optimizations, run before sched2. These primarily look to
|
16902 |
|
|
;; transform a complex memory operation into two memory to register operations.
|
16903 |
|
|
|
16904 |
|
|
;; Don't push memory operands
|
16905 |
|
|
(define_peephole2
|
16906 |
|
|
[(set (match_operand:SWI 0 "push_operand" "")
|
16907 |
|
|
(match_operand:SWI 1 "memory_operand" ""))
|
16908 |
|
|
(match_scratch:SWI 2 "")]
|
16909 |
|
|
"!(TARGET_PUSH_MEMORY || optimize_insn_for_size_p ())
|
16910 |
|
|
&& !RTX_FRAME_RELATED_P (peep2_next_insn (0))"
|
16911 |
|
|
[(set (match_dup 2) (match_dup 1))
|
16912 |
|
|
(set (match_dup 0) (match_dup 2))])
|
16913 |
|
|
|
16914 |
|
|
;; We need to handle SFmode only, because DFmode and XFmode are split to
|
16915 |
|
|
;; SImode pushes.
|
16916 |
|
|
(define_peephole2
|
16917 |
|
|
[(set (match_operand:SF 0 "push_operand" "")
|
16918 |
|
|
(match_operand:SF 1 "memory_operand" ""))
|
16919 |
|
|
(match_scratch:SF 2 "r")]
|
16920 |
|
|
"!(TARGET_PUSH_MEMORY || optimize_insn_for_size_p ())
|
16921 |
|
|
&& !RTX_FRAME_RELATED_P (peep2_next_insn (0))"
|
16922 |
|
|
[(set (match_dup 2) (match_dup 1))
|
16923 |
|
|
(set (match_dup 0) (match_dup 2))])
|
16924 |
|
|
|
16925 |
|
|
;; Don't move an immediate directly to memory when the instruction
|
16926 |
|
|
;; gets too big.
|
16927 |
|
|
(define_peephole2
|
16928 |
|
|
[(match_scratch:SWI124 1 "")
|
16929 |
|
|
(set (match_operand:SWI124 0 "memory_operand" "")
|
16930 |
|
|
(const_int 0))]
|
16931 |
|
|
"optimize_insn_for_speed_p ()
|
16932 |
|
|
&& !TARGET_USE_MOV0
|
16933 |
|
|
&& TARGET_SPLIT_LONG_MOVES
|
16934 |
|
|
&& get_attr_length (insn) >= ix86_cur_cost ()->large_insn
|
16935 |
|
|
&& peep2_regno_dead_p (0, FLAGS_REG)"
|
16936 |
|
|
[(parallel [(set (match_dup 2) (const_int 0))
|
16937 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
16938 |
|
|
(set (match_dup 0) (match_dup 1))]
|
16939 |
|
|
"operands[2] = gen_lowpart (SImode, operands[1]);")
|
16940 |
|
|
|
16941 |
|
|
(define_peephole2
|
16942 |
|
|
[(match_scratch:SWI124 2 "")
|
16943 |
|
|
(set (match_operand:SWI124 0 "memory_operand" "")
|
16944 |
|
|
(match_operand:SWI124 1 "immediate_operand" ""))]
|
16945 |
|
|
"optimize_insn_for_speed_p ()
|
16946 |
|
|
&& TARGET_SPLIT_LONG_MOVES
|
16947 |
|
|
&& get_attr_length (insn) >= ix86_cur_cost ()->large_insn"
|
16948 |
|
|
[(set (match_dup 2) (match_dup 1))
|
16949 |
|
|
(set (match_dup 0) (match_dup 2))])
|
16950 |
|
|
|
16951 |
|
|
;; Don't compare memory with zero, load and use a test instead.
|
16952 |
|
|
(define_peephole2
|
16953 |
|
|
[(set (match_operand 0 "flags_reg_operand" "")
|
16954 |
|
|
(match_operator 1 "compare_operator"
|
16955 |
|
|
[(match_operand:SI 2 "memory_operand" "")
|
16956 |
|
|
(const_int 0)]))
|
16957 |
|
|
(match_scratch:SI 3 "r")]
|
16958 |
|
|
"optimize_insn_for_speed_p () && ix86_match_ccmode (insn, CCNOmode)"
|
16959 |
|
|
[(set (match_dup 3) (match_dup 2))
|
16960 |
|
|
(set (match_dup 0) (match_op_dup 1 [(match_dup 3) (const_int 0)]))])
|
16961 |
|
|
|
16962 |
|
|
;; NOT is not pairable on Pentium, while XOR is, but one byte longer.
|
16963 |
|
|
;; Don't split NOTs with a displacement operand, because resulting XOR
|
16964 |
|
|
;; will not be pairable anyway.
|
16965 |
|
|
;;
|
16966 |
|
|
;; On AMD K6, NOT is vector decoded with memory operand that cannot be
|
16967 |
|
|
;; represented using a modRM byte. The XOR replacement is long decoded,
|
16968 |
|
|
;; so this split helps here as well.
|
16969 |
|
|
;;
|
16970 |
|
|
;; Note: Can't do this as a regular split because we can't get proper
|
16971 |
|
|
;; lifetime information then.
|
16972 |
|
|
|
16973 |
|
|
(define_peephole2
|
16974 |
|
|
[(set (match_operand:SWI124 0 "nonimmediate_operand" "")
|
16975 |
|
|
(not:SWI124 (match_operand:SWI124 1 "nonimmediate_operand" "")))]
|
16976 |
|
|
"optimize_insn_for_speed_p ()
|
16977 |
|
|
&& ((TARGET_NOT_UNPAIRABLE
|
16978 |
|
|
&& (!MEM_P (operands[0])
|
16979 |
|
|
|| !memory_displacement_operand (operands[0], mode)))
|
16980 |
|
|
|| (TARGET_NOT_VECTORMODE
|
16981 |
|
|
&& long_memory_operand (operands[0], mode)))
|
16982 |
|
|
&& peep2_regno_dead_p (0, FLAGS_REG)"
|
16983 |
|
|
[(parallel [(set (match_dup 0)
|
16984 |
|
|
(xor:SWI124 (match_dup 1) (const_int -1)))
|
16985 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
16986 |
|
|
|
16987 |
|
|
;; Non pairable "test imm, reg" instructions can be translated to
|
16988 |
|
|
;; "and imm, reg" if reg dies. The "and" form is also shorter (one
|
16989 |
|
|
;; byte opcode instead of two, have a short form for byte operands),
|
16990 |
|
|
;; so do it for other CPUs as well. Given that the value was dead,
|
16991 |
|
|
;; this should not create any new dependencies. Pass on the sub-word
|
16992 |
|
|
;; versions if we're concerned about partial register stalls.
|
16993 |
|
|
|
16994 |
|
|
(define_peephole2
|
16995 |
|
|
[(set (match_operand 0 "flags_reg_operand" "")
|
16996 |
|
|
(match_operator 1 "compare_operator"
|
16997 |
|
|
[(and:SI (match_operand:SI 2 "register_operand" "")
|
16998 |
|
|
(match_operand:SI 3 "immediate_operand" ""))
|
16999 |
|
|
(const_int 0)]))]
|
17000 |
|
|
"ix86_match_ccmode (insn, CCNOmode)
|
17001 |
|
|
&& (true_regnum (operands[2]) != AX_REG
|
17002 |
|
|
|| satisfies_constraint_K (operands[3]))
|
17003 |
|
|
&& peep2_reg_dead_p (1, operands[2])"
|
17004 |
|
|
[(parallel
|
17005 |
|
|
[(set (match_dup 0)
|
17006 |
|
|
(match_op_dup 1 [(and:SI (match_dup 2) (match_dup 3))
|
17007 |
|
|
(const_int 0)]))
|
17008 |
|
|
(set (match_dup 2)
|
17009 |
|
|
(and:SI (match_dup 2) (match_dup 3)))])])
|
17010 |
|
|
|
17011 |
|
|
;; We don't need to handle HImode case, because it will be promoted to SImode
|
17012 |
|
|
;; on ! TARGET_PARTIAL_REG_STALL
|
17013 |
|
|
|
17014 |
|
|
(define_peephole2
|
17015 |
|
|
[(set (match_operand 0 "flags_reg_operand" "")
|
17016 |
|
|
(match_operator 1 "compare_operator"
|
17017 |
|
|
[(and:QI (match_operand:QI 2 "register_operand" "")
|
17018 |
|
|
(match_operand:QI 3 "immediate_operand" ""))
|
17019 |
|
|
(const_int 0)]))]
|
17020 |
|
|
"! TARGET_PARTIAL_REG_STALL
|
17021 |
|
|
&& ix86_match_ccmode (insn, CCNOmode)
|
17022 |
|
|
&& true_regnum (operands[2]) != AX_REG
|
17023 |
|
|
&& peep2_reg_dead_p (1, operands[2])"
|
17024 |
|
|
[(parallel
|
17025 |
|
|
[(set (match_dup 0)
|
17026 |
|
|
(match_op_dup 1 [(and:QI (match_dup 2) (match_dup 3))
|
17027 |
|
|
(const_int 0)]))
|
17028 |
|
|
(set (match_dup 2)
|
17029 |
|
|
(and:QI (match_dup 2) (match_dup 3)))])])
|
17030 |
|
|
|
17031 |
|
|
(define_peephole2
|
17032 |
|
|
[(set (match_operand 0 "flags_reg_operand" "")
|
17033 |
|
|
(match_operator 1 "compare_operator"
|
17034 |
|
|
[(and:SI
|
17035 |
|
|
(zero_extract:SI
|
17036 |
|
|
(match_operand 2 "ext_register_operand" "")
|
17037 |
|
|
(const_int 8)
|
17038 |
|
|
(const_int 8))
|
17039 |
|
|
(match_operand 3 "const_int_operand" ""))
|
17040 |
|
|
(const_int 0)]))]
|
17041 |
|
|
"! TARGET_PARTIAL_REG_STALL
|
17042 |
|
|
&& ix86_match_ccmode (insn, CCNOmode)
|
17043 |
|
|
&& true_regnum (operands[2]) != AX_REG
|
17044 |
|
|
&& peep2_reg_dead_p (1, operands[2])"
|
17045 |
|
|
[(parallel [(set (match_dup 0)
|
17046 |
|
|
(match_op_dup 1
|
17047 |
|
|
[(and:SI
|
17048 |
|
|
(zero_extract:SI
|
17049 |
|
|
(match_dup 2)
|
17050 |
|
|
(const_int 8)
|
17051 |
|
|
(const_int 8))
|
17052 |
|
|
(match_dup 3))
|
17053 |
|
|
(const_int 0)]))
|
17054 |
|
|
(set (zero_extract:SI (match_dup 2)
|
17055 |
|
|
(const_int 8)
|
17056 |
|
|
(const_int 8))
|
17057 |
|
|
(and:SI
|
17058 |
|
|
(zero_extract:SI
|
17059 |
|
|
(match_dup 2)
|
17060 |
|
|
(const_int 8)
|
17061 |
|
|
(const_int 8))
|
17062 |
|
|
(match_dup 3)))])])
|
17063 |
|
|
|
17064 |
|
|
;; Don't do logical operations with memory inputs.
|
17065 |
|
|
(define_peephole2
|
17066 |
|
|
[(match_scratch:SI 2 "r")
|
17067 |
|
|
(parallel [(set (match_operand:SI 0 "register_operand" "")
|
17068 |
|
|
(match_operator:SI 3 "arith_or_logical_operator"
|
17069 |
|
|
[(match_dup 0)
|
17070 |
|
|
(match_operand:SI 1 "memory_operand" "")]))
|
17071 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17072 |
|
|
"!(TARGET_READ_MODIFY || optimize_insn_for_size_p ())"
|
17073 |
|
|
[(set (match_dup 2) (match_dup 1))
|
17074 |
|
|
(parallel [(set (match_dup 0)
|
17075 |
|
|
(match_op_dup 3 [(match_dup 0) (match_dup 2)]))
|
17076 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
17077 |
|
|
|
17078 |
|
|
(define_peephole2
|
17079 |
|
|
[(match_scratch:SI 2 "r")
|
17080 |
|
|
(parallel [(set (match_operand:SI 0 "register_operand" "")
|
17081 |
|
|
(match_operator:SI 3 "arith_or_logical_operator"
|
17082 |
|
|
[(match_operand:SI 1 "memory_operand" "")
|
17083 |
|
|
(match_dup 0)]))
|
17084 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17085 |
|
|
"!(TARGET_READ_MODIFY || optimize_insn_for_size_p ())"
|
17086 |
|
|
[(set (match_dup 2) (match_dup 1))
|
17087 |
|
|
(parallel [(set (match_dup 0)
|
17088 |
|
|
(match_op_dup 3 [(match_dup 2) (match_dup 0)]))
|
17089 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
17090 |
|
|
|
17091 |
|
|
;; Prefer Load+RegOp to Mov+MemOp. Watch out for cases when the memory address
|
17092 |
|
|
;; refers to the destination of the load!
|
17093 |
|
|
|
17094 |
|
|
(define_peephole2
|
17095 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
17096 |
|
|
(match_operand:SI 1 "register_operand" ""))
|
17097 |
|
|
(parallel [(set (match_dup 0)
|
17098 |
|
|
(match_operator:SI 3 "commutative_operator"
|
17099 |
|
|
[(match_dup 0)
|
17100 |
|
|
(match_operand:SI 2 "memory_operand" "")]))
|
17101 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17102 |
|
|
"REGNO (operands[0]) != REGNO (operands[1])
|
17103 |
|
|
&& GENERAL_REGNO_P (REGNO (operands[0]))
|
17104 |
|
|
&& GENERAL_REGNO_P (REGNO (operands[1]))"
|
17105 |
|
|
[(set (match_dup 0) (match_dup 4))
|
17106 |
|
|
(parallel [(set (match_dup 0)
|
17107 |
|
|
(match_op_dup 3 [(match_dup 0) (match_dup 1)]))
|
17108 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17109 |
|
|
"operands[4] = replace_rtx (operands[2], operands[0], operands[1]);")
|
17110 |
|
|
|
17111 |
|
|
(define_peephole2
|
17112 |
|
|
[(set (match_operand 0 "register_operand" "")
|
17113 |
|
|
(match_operand 1 "register_operand" ""))
|
17114 |
|
|
(set (match_dup 0)
|
17115 |
|
|
(match_operator 3 "commutative_operator"
|
17116 |
|
|
[(match_dup 0)
|
17117 |
|
|
(match_operand 2 "memory_operand" "")]))]
|
17118 |
|
|
"REGNO (operands[0]) != REGNO (operands[1])
|
17119 |
|
|
&& ((MMX_REG_P (operands[0]) && MMX_REG_P (operands[1]))
|
17120 |
|
|
|| (SSE_REG_P (operands[0]) && SSE_REG_P (operands[1])))"
|
17121 |
|
|
[(set (match_dup 0) (match_dup 2))
|
17122 |
|
|
(set (match_dup 0)
|
17123 |
|
|
(match_op_dup 3 [(match_dup 0) (match_dup 1)]))])
|
17124 |
|
|
|
17125 |
|
|
; Don't do logical operations with memory outputs
|
17126 |
|
|
;
|
17127 |
|
|
; These two don't make sense for PPro/PII -- we're expanding a 4-uop
|
17128 |
|
|
; instruction into two 1-uop insns plus a 2-uop insn. That last has
|
17129 |
|
|
; the same decoder scheduling characteristics as the original.
|
17130 |
|
|
|
17131 |
|
|
(define_peephole2
|
17132 |
|
|
[(match_scratch:SI 2 "r")
|
17133 |
|
|
(parallel [(set (match_operand:SI 0 "memory_operand" "")
|
17134 |
|
|
(match_operator:SI 3 "arith_or_logical_operator"
|
17135 |
|
|
[(match_dup 0)
|
17136 |
|
|
(match_operand:SI 1 "nonmemory_operand" "")]))
|
17137 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17138 |
|
|
"!(TARGET_READ_MODIFY_WRITE || optimize_insn_for_size_p ())
|
17139 |
|
|
/* Do not split stack checking probes. */
|
17140 |
|
|
&& GET_CODE (operands[3]) != IOR && operands[1] != const0_rtx"
|
17141 |
|
|
[(set (match_dup 2) (match_dup 0))
|
17142 |
|
|
(parallel [(set (match_dup 2)
|
17143 |
|
|
(match_op_dup 3 [(match_dup 2) (match_dup 1)]))
|
17144 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
17145 |
|
|
(set (match_dup 0) (match_dup 2))])
|
17146 |
|
|
|
17147 |
|
|
(define_peephole2
|
17148 |
|
|
[(match_scratch:SI 2 "r")
|
17149 |
|
|
(parallel [(set (match_operand:SI 0 "memory_operand" "")
|
17150 |
|
|
(match_operator:SI 3 "arith_or_logical_operator"
|
17151 |
|
|
[(match_operand:SI 1 "nonmemory_operand" "")
|
17152 |
|
|
(match_dup 0)]))
|
17153 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17154 |
|
|
"!(TARGET_READ_MODIFY_WRITE || optimize_insn_for_size_p ())
|
17155 |
|
|
/* Do not split stack checking probes. */
|
17156 |
|
|
&& GET_CODE (operands[3]) != IOR && operands[1] != const0_rtx"
|
17157 |
|
|
[(set (match_dup 2) (match_dup 0))
|
17158 |
|
|
(parallel [(set (match_dup 2)
|
17159 |
|
|
(match_op_dup 3 [(match_dup 1) (match_dup 2)]))
|
17160 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
17161 |
|
|
(set (match_dup 0) (match_dup 2))])
|
17162 |
|
|
|
17163 |
|
|
;; Attempt to use arith or logical operations with memory outputs with
|
17164 |
|
|
;; setting of flags.
|
17165 |
|
|
(define_peephole2
|
17166 |
|
|
[(set (match_operand:SWI 0 "register_operand" "")
|
17167 |
|
|
(match_operand:SWI 1 "memory_operand" ""))
|
17168 |
|
|
(parallel [(set (match_dup 0)
|
17169 |
|
|
(match_operator:SWI 3 "plusminuslogic_operator"
|
17170 |
|
|
[(match_dup 0)
|
17171 |
|
|
(match_operand:SWI 2 "" "")]))
|
17172 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
17173 |
|
|
(set (match_dup 1) (match_dup 0))
|
17174 |
|
|
(set (reg FLAGS_REG) (compare (match_dup 0) (const_int 0)))]
|
17175 |
|
|
"(TARGET_READ_MODIFY_WRITE || optimize_insn_for_size_p ())
|
17176 |
|
|
&& peep2_reg_dead_p (4, operands[0])
|
17177 |
|
|
&& !reg_overlap_mentioned_p (operands[0], operands[1])
|
17178 |
|
|
&& ix86_match_ccmode (peep2_next_insn (3),
|
17179 |
|
|
(GET_CODE (operands[3]) == PLUS
|
17180 |
|
|
|| GET_CODE (operands[3]) == MINUS)
|
17181 |
|
|
? CCGOCmode : CCNOmode)"
|
17182 |
|
|
[(parallel [(set (match_dup 4) (match_dup 5))
|
17183 |
|
|
(set (match_dup 1) (match_op_dup 3 [(match_dup 1)
|
17184 |
|
|
(match_dup 2)]))])]
|
17185 |
|
|
{
|
17186 |
|
|
operands[4] = SET_DEST (PATTERN (peep2_next_insn (3)));
|
17187 |
|
|
operands[5] = gen_rtx_fmt_ee (GET_CODE (operands[3]), mode,
|
17188 |
|
|
copy_rtx (operands[1]),
|
17189 |
|
|
copy_rtx (operands[2]));
|
17190 |
|
|
operands[5] = gen_rtx_COMPARE (GET_MODE (operands[4]),
|
17191 |
|
|
operands[5], const0_rtx);
|
17192 |
|
|
})
|
17193 |
|
|
|
17194 |
|
|
(define_peephole2
|
17195 |
|
|
[(parallel [(set (match_operand:SWI 0 "register_operand" "")
|
17196 |
|
|
(match_operator:SWI 2 "plusminuslogic_operator"
|
17197 |
|
|
[(match_dup 0)
|
17198 |
|
|
(match_operand:SWI 1 "memory_operand" "")]))
|
17199 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
17200 |
|
|
(set (match_dup 1) (match_dup 0))
|
17201 |
|
|
(set (reg FLAGS_REG) (compare (match_dup 0) (const_int 0)))]
|
17202 |
|
|
"(TARGET_READ_MODIFY_WRITE || optimize_insn_for_size_p ())
|
17203 |
|
|
&& GET_CODE (operands[2]) != MINUS
|
17204 |
|
|
&& peep2_reg_dead_p (3, operands[0])
|
17205 |
|
|
&& !reg_overlap_mentioned_p (operands[0], operands[1])
|
17206 |
|
|
&& ix86_match_ccmode (peep2_next_insn (2),
|
17207 |
|
|
GET_CODE (operands[2]) == PLUS
|
17208 |
|
|
? CCGOCmode : CCNOmode)"
|
17209 |
|
|
[(parallel [(set (match_dup 3) (match_dup 4))
|
17210 |
|
|
(set (match_dup 1) (match_op_dup 2 [(match_dup 1)
|
17211 |
|
|
(match_dup 0)]))])]
|
17212 |
|
|
{
|
17213 |
|
|
operands[3] = SET_DEST (PATTERN (peep2_next_insn (2)));
|
17214 |
|
|
operands[4] = gen_rtx_fmt_ee (GET_CODE (operands[2]), mode,
|
17215 |
|
|
copy_rtx (operands[1]),
|
17216 |
|
|
copy_rtx (operands[0]));
|
17217 |
|
|
operands[4] = gen_rtx_COMPARE (GET_MODE (operands[3]),
|
17218 |
|
|
operands[4], const0_rtx);
|
17219 |
|
|
})
|
17220 |
|
|
|
17221 |
|
|
(define_peephole2
|
17222 |
|
|
[(set (match_operand:SWI12 0 "register_operand" "")
|
17223 |
|
|
(match_operand:SWI12 1 "memory_operand" ""))
|
17224 |
|
|
(parallel [(set (match_operand:SI 4 "register_operand" "")
|
17225 |
|
|
(match_operator:SI 3 "plusminuslogic_operator"
|
17226 |
|
|
[(match_dup 4)
|
17227 |
|
|
(match_operand:SI 2 "nonmemory_operand" "")]))
|
17228 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
17229 |
|
|
(set (match_dup 1) (match_dup 0))
|
17230 |
|
|
(set (reg FLAGS_REG) (compare (match_dup 0) (const_int 0)))]
|
17231 |
|
|
"(TARGET_READ_MODIFY_WRITE || optimize_insn_for_size_p ())
|
17232 |
|
|
&& REG_P (operands[0]) && REG_P (operands[4])
|
17233 |
|
|
&& REGNO (operands[0]) == REGNO (operands[4])
|
17234 |
|
|
&& peep2_reg_dead_p (4, operands[0])
|
17235 |
|
|
&& (mode != QImode
|
17236 |
|
|
|| immediate_operand (operands[2], SImode)
|
17237 |
|
|
|| q_regs_operand (operands[2], SImode))
|
17238 |
|
|
&& !reg_overlap_mentioned_p (operands[0], operands[1])
|
17239 |
|
|
&& ix86_match_ccmode (peep2_next_insn (3),
|
17240 |
|
|
(GET_CODE (operands[3]) == PLUS
|
17241 |
|
|
|| GET_CODE (operands[3]) == MINUS)
|
17242 |
|
|
? CCGOCmode : CCNOmode)"
|
17243 |
|
|
[(parallel [(set (match_dup 4) (match_dup 5))
|
17244 |
|
|
(set (match_dup 1) (match_dup 6))])]
|
17245 |
|
|
{
|
17246 |
|
|
operands[2] = gen_lowpart (mode, operands[2]);
|
17247 |
|
|
operands[4] = SET_DEST (PATTERN (peep2_next_insn (3)));
|
17248 |
|
|
operands[5] = gen_rtx_fmt_ee (GET_CODE (operands[3]), mode,
|
17249 |
|
|
copy_rtx (operands[1]), operands[2]);
|
17250 |
|
|
operands[5] = gen_rtx_COMPARE (GET_MODE (operands[4]),
|
17251 |
|
|
operands[5], const0_rtx);
|
17252 |
|
|
operands[6] = gen_rtx_fmt_ee (GET_CODE (operands[3]), mode,
|
17253 |
|
|
copy_rtx (operands[1]),
|
17254 |
|
|
copy_rtx (operands[2]));
|
17255 |
|
|
})
|
17256 |
|
|
|
17257 |
|
|
;; Attempt to always use XOR for zeroing registers.
|
17258 |
|
|
(define_peephole2
|
17259 |
|
|
[(set (match_operand 0 "register_operand" "")
|
17260 |
|
|
(match_operand 1 "const0_operand" ""))]
|
17261 |
|
|
"GET_MODE_SIZE (GET_MODE (operands[0])) <= UNITS_PER_WORD
|
17262 |
|
|
&& (! TARGET_USE_MOV0 || optimize_insn_for_size_p ())
|
17263 |
|
|
&& GENERAL_REG_P (operands[0])
|
17264 |
|
|
&& peep2_regno_dead_p (0, FLAGS_REG)"
|
17265 |
|
|
[(parallel [(set (match_dup 0) (const_int 0))
|
17266 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17267 |
|
|
"operands[0] = gen_lowpart (word_mode, operands[0]);")
|
17268 |
|
|
|
17269 |
|
|
(define_peephole2
|
17270 |
|
|
[(set (strict_low_part (match_operand 0 "register_operand" ""))
|
17271 |
|
|
(const_int 0))]
|
17272 |
|
|
"(GET_MODE (operands[0]) == QImode
|
17273 |
|
|
|| GET_MODE (operands[0]) == HImode)
|
17274 |
|
|
&& (! TARGET_USE_MOV0 || optimize_insn_for_size_p ())
|
17275 |
|
|
&& peep2_regno_dead_p (0, FLAGS_REG)"
|
17276 |
|
|
[(parallel [(set (strict_low_part (match_dup 0)) (const_int 0))
|
17277 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
17278 |
|
|
|
17279 |
|
|
;; For HI, SI and DI modes, or $-1,reg is smaller than mov $-1,reg.
|
17280 |
|
|
(define_peephole2
|
17281 |
|
|
[(set (match_operand:SWI248 0 "register_operand" "")
|
17282 |
|
|
(const_int -1))]
|
17283 |
|
|
"(optimize_insn_for_size_p () || TARGET_MOVE_M1_VIA_OR)
|
17284 |
|
|
&& peep2_regno_dead_p (0, FLAGS_REG)"
|
17285 |
|
|
[(parallel [(set (match_dup 0) (const_int -1))
|
17286 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17287 |
|
|
{
|
17288 |
|
|
if (GET_MODE_SIZE (mode) < GET_MODE_SIZE (SImode))
|
17289 |
|
|
operands[0] = gen_lowpart (SImode, operands[0]);
|
17290 |
|
|
})
|
17291 |
|
|
|
17292 |
|
|
;; Attempt to convert simple lea to add/shift.
|
17293 |
|
|
;; These can be created by move expanders.
|
17294 |
|
|
|
17295 |
|
|
(define_peephole2
|
17296 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
17297 |
|
|
(plus:SWI48 (match_dup 0)
|
17298 |
|
|
(match_operand:SWI48 1 "" "")))]
|
17299 |
|
|
"peep2_regno_dead_p (0, FLAGS_REG)"
|
17300 |
|
|
[(parallel [(set (match_dup 0) (plus:SWI48 (match_dup 0) (match_dup 1)))
|
17301 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
17302 |
|
|
|
17303 |
|
|
(define_peephole2
|
17304 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
17305 |
|
|
(subreg:SI (plus:DI (match_operand:DI 1 "register_operand" "")
|
17306 |
|
|
(match_operand:DI 2 "nonmemory_operand" "")) 0))]
|
17307 |
|
|
"TARGET_64BIT
|
17308 |
|
|
&& peep2_regno_dead_p (0, FLAGS_REG)
|
17309 |
|
|
&& REGNO (operands[0]) == REGNO (operands[1])"
|
17310 |
|
|
[(parallel [(set (match_dup 0) (plus:SI (match_dup 0) (match_dup 2)))
|
17311 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17312 |
|
|
"operands[2] = gen_lowpart (SImode, operands[2]);")
|
17313 |
|
|
|
17314 |
|
|
(define_peephole2
|
17315 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
17316 |
|
|
(mult:SWI48 (match_dup 0)
|
17317 |
|
|
(match_operand:SWI48 1 "const_int_operand" "")))]
|
17318 |
|
|
"exact_log2 (INTVAL (operands[1])) >= 0
|
17319 |
|
|
&& peep2_regno_dead_p (0, FLAGS_REG)"
|
17320 |
|
|
[(parallel [(set (match_dup 0) (ashift:SWI48 (match_dup 0) (match_dup 2)))
|
17321 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17322 |
|
|
"operands[2] = GEN_INT (exact_log2 (INTVAL (operands[1])));")
|
17323 |
|
|
|
17324 |
|
|
(define_peephole2
|
17325 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
17326 |
|
|
(subreg:SI (mult:DI (match_operand:DI 1 "register_operand" "")
|
17327 |
|
|
(match_operand:DI 2 "const_int_operand" "")) 0))]
|
17328 |
|
|
"TARGET_64BIT
|
17329 |
|
|
&& exact_log2 (INTVAL (operands[2])) >= 0
|
17330 |
|
|
&& REGNO (operands[0]) == REGNO (operands[1])
|
17331 |
|
|
&& peep2_regno_dead_p (0, FLAGS_REG)"
|
17332 |
|
|
[(parallel [(set (match_dup 0) (ashift:SI (match_dup 0) (match_dup 2)))
|
17333 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17334 |
|
|
"operands[2] = GEN_INT (exact_log2 (INTVAL (operands[2])));")
|
17335 |
|
|
|
17336 |
|
|
;; The ESP adjustments can be done by the push and pop instructions. Resulting
|
17337 |
|
|
;; code is shorter, since push is only 1 byte, while add imm, %esp is 3 bytes.
|
17338 |
|
|
;; On many CPUs it is also faster, since special hardware to avoid esp
|
17339 |
|
|
;; dependencies is present.
|
17340 |
|
|
|
17341 |
|
|
;; While some of these conversions may be done using splitters, we use
|
17342 |
|
|
;; peepholes in order to allow combine_stack_adjustments pass to see
|
17343 |
|
|
;; nonobfuscated RTL.
|
17344 |
|
|
|
17345 |
|
|
;; Convert prologue esp subtractions to push.
|
17346 |
|
|
;; We need register to push. In order to keep verify_flow_info happy we have
|
17347 |
|
|
;; two choices
|
17348 |
|
|
;; - use scratch and clobber it in order to avoid dependencies
|
17349 |
|
|
;; - use already live register
|
17350 |
|
|
;; We can't use the second way right now, since there is no reliable way how to
|
17351 |
|
|
;; verify that given register is live. First choice will also most likely in
|
17352 |
|
|
;; fewer dependencies. On the place of esp adjustments it is very likely that
|
17353 |
|
|
;; call clobbered registers are dead. We may want to use base pointer as an
|
17354 |
|
|
;; alternative when no register is available later.
|
17355 |
|
|
|
17356 |
|
|
(define_peephole2
|
17357 |
|
|
[(match_scratch:P 1 "r")
|
17358 |
|
|
(parallel [(set (reg:P SP_REG)
|
17359 |
|
|
(plus:P (reg:P SP_REG)
|
17360 |
|
|
(match_operand:P 0 "const_int_operand" "")))
|
17361 |
|
|
(clobber (reg:CC FLAGS_REG))
|
17362 |
|
|
(clobber (mem:BLK (scratch)))])]
|
17363 |
|
|
"(TARGET_SINGLE_PUSH || optimize_insn_for_size_p ())
|
17364 |
|
|
&& INTVAL (operands[0]) == -GET_MODE_SIZE (Pmode)"
|
17365 |
|
|
[(clobber (match_dup 1))
|
17366 |
|
|
(parallel [(set (mem:P (pre_dec:P (reg:P SP_REG))) (match_dup 1))
|
17367 |
|
|
(clobber (mem:BLK (scratch)))])])
|
17368 |
|
|
|
17369 |
|
|
(define_peephole2
|
17370 |
|
|
[(match_scratch:P 1 "r")
|
17371 |
|
|
(parallel [(set (reg:P SP_REG)
|
17372 |
|
|
(plus:P (reg:P SP_REG)
|
17373 |
|
|
(match_operand:P 0 "const_int_operand" "")))
|
17374 |
|
|
(clobber (reg:CC FLAGS_REG))
|
17375 |
|
|
(clobber (mem:BLK (scratch)))])]
|
17376 |
|
|
"(TARGET_DOUBLE_PUSH || optimize_insn_for_size_p ())
|
17377 |
|
|
&& INTVAL (operands[0]) == -2*GET_MODE_SIZE (Pmode)"
|
17378 |
|
|
[(clobber (match_dup 1))
|
17379 |
|
|
(set (mem:P (pre_dec:P (reg:P SP_REG))) (match_dup 1))
|
17380 |
|
|
(parallel [(set (mem:P (pre_dec:P (reg:P SP_REG))) (match_dup 1))
|
17381 |
|
|
(clobber (mem:BLK (scratch)))])])
|
17382 |
|
|
|
17383 |
|
|
;; Convert esp subtractions to push.
|
17384 |
|
|
(define_peephole2
|
17385 |
|
|
[(match_scratch:P 1 "r")
|
17386 |
|
|
(parallel [(set (reg:P SP_REG)
|
17387 |
|
|
(plus:P (reg:P SP_REG)
|
17388 |
|
|
(match_operand:P 0 "const_int_operand" "")))
|
17389 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17390 |
|
|
"(TARGET_SINGLE_PUSH || optimize_insn_for_size_p ())
|
17391 |
|
|
&& INTVAL (operands[0]) == -GET_MODE_SIZE (Pmode)"
|
17392 |
|
|
[(clobber (match_dup 1))
|
17393 |
|
|
(set (mem:P (pre_dec:P (reg:P SP_REG))) (match_dup 1))])
|
17394 |
|
|
|
17395 |
|
|
(define_peephole2
|
17396 |
|
|
[(match_scratch:P 1 "r")
|
17397 |
|
|
(parallel [(set (reg:P SP_REG)
|
17398 |
|
|
(plus:P (reg:P SP_REG)
|
17399 |
|
|
(match_operand:P 0 "const_int_operand" "")))
|
17400 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17401 |
|
|
"(TARGET_DOUBLE_PUSH || optimize_insn_for_size_p ())
|
17402 |
|
|
&& INTVAL (operands[0]) == -2*GET_MODE_SIZE (Pmode)"
|
17403 |
|
|
[(clobber (match_dup 1))
|
17404 |
|
|
(set (mem:P (pre_dec:P (reg:P SP_REG))) (match_dup 1))
|
17405 |
|
|
(set (mem:P (pre_dec:P (reg:P SP_REG))) (match_dup 1))])
|
17406 |
|
|
|
17407 |
|
|
;; Convert epilogue deallocator to pop.
|
17408 |
|
|
(define_peephole2
|
17409 |
|
|
[(match_scratch:P 1 "r")
|
17410 |
|
|
(parallel [(set (reg:P SP_REG)
|
17411 |
|
|
(plus:P (reg:P SP_REG)
|
17412 |
|
|
(match_operand:P 0 "const_int_operand" "")))
|
17413 |
|
|
(clobber (reg:CC FLAGS_REG))
|
17414 |
|
|
(clobber (mem:BLK (scratch)))])]
|
17415 |
|
|
"(TARGET_SINGLE_POP || optimize_insn_for_size_p ())
|
17416 |
|
|
&& INTVAL (operands[0]) == GET_MODE_SIZE (Pmode)"
|
17417 |
|
|
[(parallel [(set (match_dup 1) (mem:P (post_inc:P (reg:P SP_REG))))
|
17418 |
|
|
(clobber (mem:BLK (scratch)))])])
|
17419 |
|
|
|
17420 |
|
|
;; Two pops case is tricky, since pop causes dependency
|
17421 |
|
|
;; on destination register. We use two registers if available.
|
17422 |
|
|
(define_peephole2
|
17423 |
|
|
[(match_scratch:P 1 "r")
|
17424 |
|
|
(match_scratch:P 2 "r")
|
17425 |
|
|
(parallel [(set (reg:P SP_REG)
|
17426 |
|
|
(plus:P (reg:P SP_REG)
|
17427 |
|
|
(match_operand:P 0 "const_int_operand" "")))
|
17428 |
|
|
(clobber (reg:CC FLAGS_REG))
|
17429 |
|
|
(clobber (mem:BLK (scratch)))])]
|
17430 |
|
|
"(TARGET_DOUBLE_POP || optimize_insn_for_size_p ())
|
17431 |
|
|
&& INTVAL (operands[0]) == 2*GET_MODE_SIZE (Pmode)"
|
17432 |
|
|
[(parallel [(set (match_dup 1) (mem:P (post_inc:P (reg:P SP_REG))))
|
17433 |
|
|
(clobber (mem:BLK (scratch)))])
|
17434 |
|
|
(set (match_dup 2) (mem:P (post_inc:P (reg:P SP_REG))))])
|
17435 |
|
|
|
17436 |
|
|
(define_peephole2
|
17437 |
|
|
[(match_scratch:P 1 "r")
|
17438 |
|
|
(parallel [(set (reg:P SP_REG)
|
17439 |
|
|
(plus:P (reg:P SP_REG)
|
17440 |
|
|
(match_operand:P 0 "const_int_operand" "")))
|
17441 |
|
|
(clobber (reg:CC FLAGS_REG))
|
17442 |
|
|
(clobber (mem:BLK (scratch)))])]
|
17443 |
|
|
"optimize_insn_for_size_p ()
|
17444 |
|
|
&& INTVAL (operands[0]) == 2*GET_MODE_SIZE (Pmode)"
|
17445 |
|
|
[(parallel [(set (match_dup 1) (mem:P (post_inc:P (reg:P SP_REG))))
|
17446 |
|
|
(clobber (mem:BLK (scratch)))])
|
17447 |
|
|
(set (match_dup 1) (mem:P (post_inc:P (reg:P SP_REG))))])
|
17448 |
|
|
|
17449 |
|
|
;; Convert esp additions to pop.
|
17450 |
|
|
(define_peephole2
|
17451 |
|
|
[(match_scratch:P 1 "r")
|
17452 |
|
|
(parallel [(set (reg:P SP_REG)
|
17453 |
|
|
(plus:P (reg:P SP_REG)
|
17454 |
|
|
(match_operand:P 0 "const_int_operand" "")))
|
17455 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17456 |
|
|
"INTVAL (operands[0]) == GET_MODE_SIZE (Pmode)"
|
17457 |
|
|
[(set (match_dup 1) (mem:P (post_inc:P (reg:P SP_REG))))])
|
17458 |
|
|
|
17459 |
|
|
;; Two pops case is tricky, since pop causes dependency
|
17460 |
|
|
;; on destination register. We use two registers if available.
|
17461 |
|
|
(define_peephole2
|
17462 |
|
|
[(match_scratch:P 1 "r")
|
17463 |
|
|
(match_scratch:P 2 "r")
|
17464 |
|
|
(parallel [(set (reg:P SP_REG)
|
17465 |
|
|
(plus:P (reg:P SP_REG)
|
17466 |
|
|
(match_operand:P 0 "const_int_operand" "")))
|
17467 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17468 |
|
|
"INTVAL (operands[0]) == 2*GET_MODE_SIZE (Pmode)"
|
17469 |
|
|
[(set (match_dup 1) (mem:P (post_inc:P (reg:P SP_REG))))
|
17470 |
|
|
(set (match_dup 2) (mem:P (post_inc:P (reg:P SP_REG))))])
|
17471 |
|
|
|
17472 |
|
|
(define_peephole2
|
17473 |
|
|
[(match_scratch:P 1 "r")
|
17474 |
|
|
(parallel [(set (reg:P SP_REG)
|
17475 |
|
|
(plus:P (reg:P SP_REG)
|
17476 |
|
|
(match_operand:P 0 "const_int_operand" "")))
|
17477 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17478 |
|
|
"optimize_insn_for_size_p ()
|
17479 |
|
|
&& INTVAL (operands[0]) == 2*GET_MODE_SIZE (Pmode)"
|
17480 |
|
|
[(set (match_dup 1) (mem:P (post_inc:P (reg:P SP_REG))))
|
17481 |
|
|
(set (match_dup 1) (mem:P (post_inc:P (reg:P SP_REG))))])
|
17482 |
|
|
|
17483 |
|
|
;; Convert compares with 1 to shorter inc/dec operations when CF is not
|
17484 |
|
|
;; required and register dies. Similarly for 128 to -128.
|
17485 |
|
|
(define_peephole2
|
17486 |
|
|
[(set (match_operand 0 "flags_reg_operand" "")
|
17487 |
|
|
(match_operator 1 "compare_operator"
|
17488 |
|
|
[(match_operand 2 "register_operand" "")
|
17489 |
|
|
(match_operand 3 "const_int_operand" "")]))]
|
17490 |
|
|
"(((!TARGET_FUSE_CMP_AND_BRANCH || optimize_insn_for_size_p ())
|
17491 |
|
|
&& incdec_operand (operands[3], GET_MODE (operands[3])))
|
17492 |
|
|
|| (!TARGET_FUSE_CMP_AND_BRANCH
|
17493 |
|
|
&& INTVAL (operands[3]) == 128))
|
17494 |
|
|
&& ix86_match_ccmode (insn, CCGCmode)
|
17495 |
|
|
&& peep2_reg_dead_p (1, operands[2])"
|
17496 |
|
|
[(parallel [(set (match_dup 0)
|
17497 |
|
|
(match_op_dup 1 [(match_dup 2) (match_dup 3)]))
|
17498 |
|
|
(clobber (match_dup 2))])])
|
17499 |
|
|
|
17500 |
|
|
;; Convert imul by three, five and nine into lea
|
17501 |
|
|
(define_peephole2
|
17502 |
|
|
[(parallel
|
17503 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
17504 |
|
|
(mult:SWI48 (match_operand:SWI48 1 "register_operand" "")
|
17505 |
|
|
(match_operand:SWI48 2 "const359_operand" "")))
|
17506 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17507 |
|
|
"!TARGET_PARTIAL_REG_STALL
|
17508 |
|
|
|| mode == SImode
|
17509 |
|
|
|| optimize_function_for_size_p (cfun)"
|
17510 |
|
|
[(set (match_dup 0)
|
17511 |
|
|
(plus:SWI48 (mult:SWI48 (match_dup 1) (match_dup 2))
|
17512 |
|
|
(match_dup 1)))]
|
17513 |
|
|
"operands[2] = GEN_INT (INTVAL (operands[2]) - 1);")
|
17514 |
|
|
|
17515 |
|
|
(define_peephole2
|
17516 |
|
|
[(parallel
|
17517 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "")
|
17518 |
|
|
(mult:SWI48 (match_operand:SWI48 1 "nonimmediate_operand" "")
|
17519 |
|
|
(match_operand:SWI48 2 "const359_operand" "")))
|
17520 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17521 |
|
|
"optimize_insn_for_speed_p ()
|
17522 |
|
|
&& (!TARGET_PARTIAL_REG_STALL || mode == SImode)"
|
17523 |
|
|
[(set (match_dup 0) (match_dup 1))
|
17524 |
|
|
(set (match_dup 0)
|
17525 |
|
|
(plus:SWI48 (mult:SWI48 (match_dup 0) (match_dup 2))
|
17526 |
|
|
(match_dup 0)))]
|
17527 |
|
|
"operands[2] = GEN_INT (INTVAL (operands[2]) - 1);")
|
17528 |
|
|
|
17529 |
|
|
;; imul $32bit_imm, mem, reg is vector decoded, while
|
17530 |
|
|
;; imul $32bit_imm, reg, reg is direct decoded.
|
17531 |
|
|
(define_peephole2
|
17532 |
|
|
[(match_scratch:SWI48 3 "r")
|
17533 |
|
|
(parallel [(set (match_operand:SWI48 0 "register_operand" "")
|
17534 |
|
|
(mult:SWI48 (match_operand:SWI48 1 "memory_operand" "")
|
17535 |
|
|
(match_operand:SWI48 2 "immediate_operand" "")))
|
17536 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17537 |
|
|
"TARGET_SLOW_IMUL_IMM32_MEM && optimize_insn_for_speed_p ()
|
17538 |
|
|
&& !satisfies_constraint_K (operands[2])"
|
17539 |
|
|
[(set (match_dup 3) (match_dup 1))
|
17540 |
|
|
(parallel [(set (match_dup 0) (mult:SWI48 (match_dup 3) (match_dup 2)))
|
17541 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
17542 |
|
|
|
17543 |
|
|
(define_peephole2
|
17544 |
|
|
[(match_scratch:SI 3 "r")
|
17545 |
|
|
(parallel [(set (match_operand:DI 0 "register_operand" "")
|
17546 |
|
|
(zero_extend:DI
|
17547 |
|
|
(mult:SI (match_operand:SI 1 "memory_operand" "")
|
17548 |
|
|
(match_operand:SI 2 "immediate_operand" ""))))
|
17549 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17550 |
|
|
"TARGET_64BIT
|
17551 |
|
|
&& TARGET_SLOW_IMUL_IMM32_MEM && optimize_insn_for_speed_p ()
|
17552 |
|
|
&& !satisfies_constraint_K (operands[2])"
|
17553 |
|
|
[(set (match_dup 3) (match_dup 1))
|
17554 |
|
|
(parallel [(set (match_dup 0)
|
17555 |
|
|
(zero_extend:DI (mult:SI (match_dup 3) (match_dup 2))))
|
17556 |
|
|
(clobber (reg:CC FLAGS_REG))])])
|
17557 |
|
|
|
17558 |
|
|
;; imul $8/16bit_imm, regmem, reg is vector decoded.
|
17559 |
|
|
;; Convert it into imul reg, reg
|
17560 |
|
|
;; It would be better to force assembler to encode instruction using long
|
17561 |
|
|
;; immediate, but there is apparently no way to do so.
|
17562 |
|
|
(define_peephole2
|
17563 |
|
|
[(parallel [(set (match_operand:SWI248 0 "register_operand" "")
|
17564 |
|
|
(mult:SWI248
|
17565 |
|
|
(match_operand:SWI248 1 "nonimmediate_operand" "")
|
17566 |
|
|
(match_operand:SWI248 2 "const_int_operand" "")))
|
17567 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
17568 |
|
|
(match_scratch:SWI248 3 "r")]
|
17569 |
|
|
"TARGET_SLOW_IMUL_IMM8 && optimize_insn_for_speed_p ()
|
17570 |
|
|
&& satisfies_constraint_K (operands[2])"
|
17571 |
|
|
[(set (match_dup 3) (match_dup 2))
|
17572 |
|
|
(parallel [(set (match_dup 0) (mult:SWI248 (match_dup 0) (match_dup 3)))
|
17573 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17574 |
|
|
{
|
17575 |
|
|
if (!rtx_equal_p (operands[0], operands[1]))
|
17576 |
|
|
emit_move_insn (operands[0], operands[1]);
|
17577 |
|
|
})
|
17578 |
|
|
|
17579 |
|
|
;; After splitting up read-modify operations, array accesses with memory
|
17580 |
|
|
;; operands might end up in form:
|
17581 |
|
|
;; sall $2, %eax
|
17582 |
|
|
;; movl 4(%esp), %edx
|
17583 |
|
|
;; addl %edx, %eax
|
17584 |
|
|
;; instead of pre-splitting:
|
17585 |
|
|
;; sall $2, %eax
|
17586 |
|
|
;; addl 4(%esp), %eax
|
17587 |
|
|
;; Turn it into:
|
17588 |
|
|
;; movl 4(%esp), %edx
|
17589 |
|
|
;; leal (%edx,%eax,4), %eax
|
17590 |
|
|
|
17591 |
|
|
(define_peephole2
|
17592 |
|
|
[(match_scratch:P 5 "r")
|
17593 |
|
|
(parallel [(set (match_operand 0 "register_operand" "")
|
17594 |
|
|
(ashift (match_operand 1 "register_operand" "")
|
17595 |
|
|
(match_operand 2 "const_int_operand" "")))
|
17596 |
|
|
(clobber (reg:CC FLAGS_REG))])
|
17597 |
|
|
(parallel [(set (match_operand 3 "register_operand" "")
|
17598 |
|
|
(plus (match_dup 0)
|
17599 |
|
|
(match_operand 4 "x86_64_general_operand" "")))
|
17600 |
|
|
(clobber (reg:CC FLAGS_REG))])]
|
17601 |
|
|
"IN_RANGE (INTVAL (operands[2]), 1, 3)
|
17602 |
|
|
/* Validate MODE for lea. */
|
17603 |
|
|
&& ((!TARGET_PARTIAL_REG_STALL
|
17604 |
|
|
&& (GET_MODE (operands[0]) == QImode
|
17605 |
|
|
|| GET_MODE (operands[0]) == HImode))
|
17606 |
|
|
|| GET_MODE (operands[0]) == SImode
|
17607 |
|
|
|| (TARGET_64BIT && GET_MODE (operands[0]) == DImode))
|
17608 |
|
|
&& (rtx_equal_p (operands[0], operands[3])
|
17609 |
|
|
|| peep2_reg_dead_p (2, operands[0]))
|
17610 |
|
|
/* We reorder load and the shift. */
|
17611 |
|
|
&& !reg_overlap_mentioned_p (operands[0], operands[4])"
|
17612 |
|
|
[(set (match_dup 5) (match_dup 4))
|
17613 |
|
|
(set (match_dup 0) (match_dup 1))]
|
17614 |
|
|
{
|
17615 |
|
|
enum machine_mode op1mode = GET_MODE (operands[1]);
|
17616 |
|
|
enum machine_mode mode = op1mode == DImode ? DImode : SImode;
|
17617 |
|
|
int scale = 1 << INTVAL (operands[2]);
|
17618 |
|
|
rtx index = gen_lowpart (Pmode, operands[1]);
|
17619 |
|
|
rtx base = gen_lowpart (Pmode, operands[5]);
|
17620 |
|
|
rtx dest = gen_lowpart (mode, operands[3]);
|
17621 |
|
|
|
17622 |
|
|
operands[1] = gen_rtx_PLUS (Pmode, base,
|
17623 |
|
|
gen_rtx_MULT (Pmode, index, GEN_INT (scale)));
|
17624 |
|
|
operands[5] = base;
|
17625 |
|
|
if (mode != Pmode)
|
17626 |
|
|
operands[1] = gen_rtx_SUBREG (mode, operands[1], 0);
|
17627 |
|
|
if (op1mode != Pmode)
|
17628 |
|
|
operands[5] = gen_rtx_SUBREG (op1mode, operands[5], 0);
|
17629 |
|
|
operands[0] = dest;
|
17630 |
|
|
})
|
17631 |
|
|
|
17632 |
|
|
;; We used to use "int $5", in honor of #BR which maps to interrupt vector 5.
|
17633 |
|
|
;; That, however, is usually mapped by the OS to SIGSEGV, which is often
|
17634 |
|
|
;; caught for use by garbage collectors and the like. Using an insn that
|
17635 |
|
|
;; maps to SIGILL makes it more likely the program will rightfully die.
|
17636 |
|
|
;; Keeping with tradition, "6" is in honor of #UD.
|
17637 |
|
|
(define_insn "trap"
|
17638 |
|
|
[(trap_if (const_int 1) (const_int 6))]
|
17639 |
|
|
""
|
17640 |
|
|
{ return ASM_SHORT "0x0b0f"; }
|
17641 |
|
|
[(set_attr "length" "2")])
|
17642 |
|
|
|
17643 |
|
|
(define_expand "prefetch"
|
17644 |
|
|
[(prefetch (match_operand 0 "address_operand" "")
|
17645 |
|
|
(match_operand:SI 1 "const_int_operand" "")
|
17646 |
|
|
(match_operand:SI 2 "const_int_operand" ""))]
|
17647 |
|
|
"TARGET_PREFETCH_SSE || TARGET_3DNOW"
|
17648 |
|
|
{
|
17649 |
|
|
int rw = INTVAL (operands[1]);
|
17650 |
|
|
int locality = INTVAL (operands[2]);
|
17651 |
|
|
|
17652 |
|
|
gcc_assert (rw == 0 || rw == 1);
|
17653 |
|
|
gcc_assert (locality >= 0 && locality <= 3);
|
17654 |
|
|
gcc_assert (GET_MODE (operands[0]) == Pmode
|
17655 |
|
|
|| GET_MODE (operands[0]) == VOIDmode);
|
17656 |
|
|
|
17657 |
|
|
/* Use 3dNOW prefetch in case we are asking for write prefetch not
|
17658 |
|
|
supported by SSE counterpart or the SSE prefetch is not available
|
17659 |
|
|
(K6 machines). Otherwise use SSE prefetch as it allows specifying
|
17660 |
|
|
of locality. */
|
17661 |
|
|
if (TARGET_3DNOW && (!TARGET_PREFETCH_SSE || rw))
|
17662 |
|
|
operands[2] = GEN_INT (3);
|
17663 |
|
|
else
|
17664 |
|
|
operands[1] = const0_rtx;
|
17665 |
|
|
})
|
17666 |
|
|
|
17667 |
|
|
(define_insn "*prefetch_sse_"
|
17668 |
|
|
[(prefetch (match_operand:P 0 "address_operand" "p")
|
17669 |
|
|
(const_int 0)
|
17670 |
|
|
(match_operand:SI 1 "const_int_operand" ""))]
|
17671 |
|
|
"TARGET_PREFETCH_SSE"
|
17672 |
|
|
{
|
17673 |
|
|
static const char * const patterns[4] = {
|
17674 |
|
|
"prefetchnta\t%a0", "prefetcht2\t%a0", "prefetcht1\t%a0", "prefetcht0\t%a0"
|
17675 |
|
|
};
|
17676 |
|
|
|
17677 |
|
|
int locality = INTVAL (operands[1]);
|
17678 |
|
|
gcc_assert (locality >= 0 && locality <= 3);
|
17679 |
|
|
|
17680 |
|
|
return patterns[locality];
|
17681 |
|
|
}
|
17682 |
|
|
[(set_attr "type" "sse")
|
17683 |
|
|
(set_attr "atom_sse_attr" "prefetch")
|
17684 |
|
|
(set (attr "length_address")
|
17685 |
|
|
(symbol_ref "memory_address_length (operands[0])"))
|
17686 |
|
|
(set_attr "memory" "none")])
|
17687 |
|
|
|
17688 |
|
|
(define_insn "*prefetch_3dnow_"
|
17689 |
|
|
[(prefetch (match_operand:P 0 "address_operand" "p")
|
17690 |
|
|
(match_operand:SI 1 "const_int_operand" "n")
|
17691 |
|
|
(const_int 3))]
|
17692 |
|
|
"TARGET_3DNOW"
|
17693 |
|
|
{
|
17694 |
|
|
if (INTVAL (operands[1]) == 0)
|
17695 |
|
|
return "prefetch\t%a0";
|
17696 |
|
|
else
|
17697 |
|
|
return "prefetchw\t%a0";
|
17698 |
|
|
}
|
17699 |
|
|
[(set_attr "type" "mmx")
|
17700 |
|
|
(set (attr "length_address")
|
17701 |
|
|
(symbol_ref "memory_address_length (operands[0])"))
|
17702 |
|
|
(set_attr "memory" "none")])
|
17703 |
|
|
|
17704 |
|
|
(define_expand "stack_protect_set"
|
17705 |
|
|
[(match_operand 0 "memory_operand" "")
|
17706 |
|
|
(match_operand 1 "memory_operand" "")]
|
17707 |
|
|
""
|
17708 |
|
|
{
|
17709 |
|
|
rtx (*insn)(rtx, rtx);
|
17710 |
|
|
|
17711 |
|
|
#ifdef TARGET_THREAD_SSP_OFFSET
|
17712 |
|
|
operands[1] = GEN_INT (TARGET_THREAD_SSP_OFFSET);
|
17713 |
|
|
insn = (TARGET_LP64
|
17714 |
|
|
? gen_stack_tls_protect_set_di
|
17715 |
|
|
: gen_stack_tls_protect_set_si);
|
17716 |
|
|
#else
|
17717 |
|
|
insn = (TARGET_LP64
|
17718 |
|
|
? gen_stack_protect_set_di
|
17719 |
|
|
: gen_stack_protect_set_si);
|
17720 |
|
|
#endif
|
17721 |
|
|
|
17722 |
|
|
emit_insn (insn (operands[0], operands[1]));
|
17723 |
|
|
DONE;
|
17724 |
|
|
})
|
17725 |
|
|
|
17726 |
|
|
(define_insn "stack_protect_set_"
|
17727 |
|
|
[(set (match_operand:PTR 0 "memory_operand" "=m")
|
17728 |
|
|
(unspec:PTR [(match_operand:PTR 1 "memory_operand" "m")]
|
17729 |
|
|
UNSPEC_SP_SET))
|
17730 |
|
|
(set (match_scratch:PTR 2 "=&r") (const_int 0))
|
17731 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
17732 |
|
|
""
|
17733 |
|
|
"mov{}\t{%1, %2|%2, %1}\;mov{}\t{%2, %0|%0, %2}\;xor{l}\t%k2, %k2"
|
17734 |
|
|
[(set_attr "type" "multi")])
|
17735 |
|
|
|
17736 |
|
|
(define_insn "stack_tls_protect_set_"
|
17737 |
|
|
[(set (match_operand:PTR 0 "memory_operand" "=m")
|
17738 |
|
|
(unspec:PTR [(match_operand:PTR 1 "const_int_operand" "i")]
|
17739 |
|
|
UNSPEC_SP_TLS_SET))
|
17740 |
|
|
(set (match_scratch:PTR 2 "=&r") (const_int 0))
|
17741 |
|
|
(clobber (reg:CC FLAGS_REG))]
|
17742 |
|
|
""
|
17743 |
|
|
"mov{}\t{%@:%P1, %2|%2, PTR %@:%P1}\;mov{}\t{%2, %0|%0, %2}\;xor{l}\t%k2, %k2"
|
17744 |
|
|
[(set_attr "type" "multi")])
|
17745 |
|
|
|
17746 |
|
|
(define_expand "stack_protect_test"
|
17747 |
|
|
[(match_operand 0 "memory_operand" "")
|
17748 |
|
|
(match_operand 1 "memory_operand" "")
|
17749 |
|
|
(match_operand 2 "" "")]
|
17750 |
|
|
""
|
17751 |
|
|
{
|
17752 |
|
|
rtx flags = gen_rtx_REG (CCZmode, FLAGS_REG);
|
17753 |
|
|
|
17754 |
|
|
rtx (*insn)(rtx, rtx, rtx);
|
17755 |
|
|
|
17756 |
|
|
#ifdef TARGET_THREAD_SSP_OFFSET
|
17757 |
|
|
operands[1] = GEN_INT (TARGET_THREAD_SSP_OFFSET);
|
17758 |
|
|
insn = (TARGET_LP64
|
17759 |
|
|
? gen_stack_tls_protect_test_di
|
17760 |
|
|
: gen_stack_tls_protect_test_si);
|
17761 |
|
|
#else
|
17762 |
|
|
insn = (TARGET_LP64
|
17763 |
|
|
? gen_stack_protect_test_di
|
17764 |
|
|
: gen_stack_protect_test_si);
|
17765 |
|
|
#endif
|
17766 |
|
|
|
17767 |
|
|
emit_insn (insn (flags, operands[0], operands[1]));
|
17768 |
|
|
|
17769 |
|
|
emit_jump_insn (gen_cbranchcc4 (gen_rtx_EQ (VOIDmode, flags, const0_rtx),
|
17770 |
|
|
flags, const0_rtx, operands[2]));
|
17771 |
|
|
DONE;
|
17772 |
|
|
})
|
17773 |
|
|
|
17774 |
|
|
(define_insn "stack_protect_test_"
|
17775 |
|
|
[(set (match_operand:CCZ 0 "flags_reg_operand" "")
|
17776 |
|
|
(unspec:CCZ [(match_operand:PTR 1 "memory_operand" "m")
|
17777 |
|
|
(match_operand:PTR 2 "memory_operand" "m")]
|
17778 |
|
|
UNSPEC_SP_TEST))
|
17779 |
|
|
(clobber (match_scratch:PTR 3 "=&r"))]
|
17780 |
|
|
""
|
17781 |
|
|
"mov{}\t{%1, %3|%3, %1}\;xor{}\t{%2, %3|%3, %2}"
|
17782 |
|
|
[(set_attr "type" "multi")])
|
17783 |
|
|
|
17784 |
|
|
(define_insn "stack_tls_protect_test_"
|
17785 |
|
|
[(set (match_operand:CCZ 0 "flags_reg_operand" "")
|
17786 |
|
|
(unspec:CCZ [(match_operand:PTR 1 "memory_operand" "m")
|
17787 |
|
|
(match_operand:PTR 2 "const_int_operand" "i")]
|
17788 |
|
|
UNSPEC_SP_TLS_TEST))
|
17789 |
|
|
(clobber (match_scratch:PTR 3 "=r"))]
|
17790 |
|
|
""
|
17791 |
|
|
"mov{}\t{%1, %3|%3, %1}\;xor{}\t{%@:%P2, %3|%3, PTR %@:%P2}"
|
17792 |
|
|
[(set_attr "type" "multi")])
|
17793 |
|
|
|
17794 |
|
|
(define_insn "sse4_2_crc32"
|
17795 |
|
|
[(set (match_operand:SI 0 "register_operand" "=r")
|
17796 |
|
|
(unspec:SI
|
17797 |
|
|
[(match_operand:SI 1 "register_operand" "0")
|
17798 |
|
|
(match_operand:SWI124 2 "nonimmediate_operand" "m")]
|
17799 |
|
|
UNSPEC_CRC32))]
|
17800 |
|
|
"TARGET_SSE4_2 || TARGET_CRC32"
|
17801 |
|
|
"crc32{}\t{%2, %0|%0, %2}"
|
17802 |
|
|
[(set_attr "type" "sselog1")
|
17803 |
|
|
(set_attr "prefix_rep" "1")
|
17804 |
|
|
(set_attr "prefix_extra" "1")
|
17805 |
|
|
(set (attr "prefix_data16")
|
17806 |
|
|
(if_then_else (match_operand:HI 2 "" "")
|
17807 |
|
|
(const_string "1")
|
17808 |
|
|
(const_string "*")))
|
17809 |
|
|
(set (attr "prefix_rex")
|
17810 |
|
|
(if_then_else (match_operand:QI 2 "ext_QIreg_operand" "")
|
17811 |
|
|
(const_string "1")
|
17812 |
|
|
(const_string "*")))
|
17813 |
|
|
(set_attr "mode" "SI")])
|
17814 |
|
|
|
17815 |
|
|
(define_insn "sse4_2_crc32di"
|
17816 |
|
|
[(set (match_operand:DI 0 "register_operand" "=r")
|
17817 |
|
|
(unspec:DI
|
17818 |
|
|
[(match_operand:DI 1 "register_operand" "0")
|
17819 |
|
|
(match_operand:DI 2 "nonimmediate_operand" "rm")]
|
17820 |
|
|
UNSPEC_CRC32))]
|
17821 |
|
|
"TARGET_64BIT && (TARGET_SSE4_2 || TARGET_CRC32)"
|
17822 |
|
|
"crc32{q}\t{%2, %0|%0, %2}"
|
17823 |
|
|
[(set_attr "type" "sselog1")
|
17824 |
|
|
(set_attr "prefix_rep" "1")
|
17825 |
|
|
(set_attr "prefix_extra" "1")
|
17826 |
|
|
(set_attr "mode" "DI")])
|
17827 |
|
|
|
17828 |
|
|
(define_expand "rdpmc"
|
17829 |
|
|
[(match_operand:DI 0 "register_operand" "")
|
17830 |
|
|
(match_operand:SI 1 "register_operand" "")]
|
17831 |
|
|
""
|
17832 |
|
|
{
|
17833 |
|
|
rtx reg = gen_reg_rtx (DImode);
|
17834 |
|
|
rtx si;
|
17835 |
|
|
|
17836 |
|
|
/* Force operand 1 into ECX. */
|
17837 |
|
|
rtx ecx = gen_rtx_REG (SImode, CX_REG);
|
17838 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, ecx, operands[1]));
|
17839 |
|
|
si = gen_rtx_UNSPEC_VOLATILE (DImode, gen_rtvec (1, ecx),
|
17840 |
|
|
UNSPECV_RDPMC);
|
17841 |
|
|
|
17842 |
|
|
if (TARGET_64BIT)
|
17843 |
|
|
{
|
17844 |
|
|
rtvec vec = rtvec_alloc (2);
|
17845 |
|
|
rtx load = gen_rtx_PARALLEL (VOIDmode, vec);
|
17846 |
|
|
rtx upper = gen_reg_rtx (DImode);
|
17847 |
|
|
rtx di = gen_rtx_UNSPEC_VOLATILE (DImode,
|
17848 |
|
|
gen_rtvec (1, const0_rtx),
|
17849 |
|
|
UNSPECV_RDPMC);
|
17850 |
|
|
RTVEC_ELT (vec, 0) = gen_rtx_SET (VOIDmode, reg, si);
|
17851 |
|
|
RTVEC_ELT (vec, 1) = gen_rtx_SET (VOIDmode, upper, di);
|
17852 |
|
|
emit_insn (load);
|
17853 |
|
|
upper = expand_simple_binop (DImode, ASHIFT, upper, GEN_INT (32),
|
17854 |
|
|
NULL, 1, OPTAB_DIRECT);
|
17855 |
|
|
reg = expand_simple_binop (DImode, IOR, reg, upper, reg, 1,
|
17856 |
|
|
OPTAB_DIRECT);
|
17857 |
|
|
}
|
17858 |
|
|
else
|
17859 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, reg, si));
|
17860 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0], reg));
|
17861 |
|
|
DONE;
|
17862 |
|
|
})
|
17863 |
|
|
|
17864 |
|
|
(define_insn "*rdpmc"
|
17865 |
|
|
[(set (match_operand:DI 0 "register_operand" "=A")
|
17866 |
|
|
(unspec_volatile:DI [(match_operand:SI 1 "register_operand" "c")]
|
17867 |
|
|
UNSPECV_RDPMC))]
|
17868 |
|
|
"!TARGET_64BIT"
|
17869 |
|
|
"rdpmc"
|
17870 |
|
|
[(set_attr "type" "other")
|
17871 |
|
|
(set_attr "length" "2")])
|
17872 |
|
|
|
17873 |
|
|
(define_insn "*rdpmc_rex64"
|
17874 |
|
|
[(set (match_operand:DI 0 "register_operand" "=a")
|
17875 |
|
|
(unspec_volatile:DI [(match_operand:SI 2 "register_operand" "c")]
|
17876 |
|
|
UNSPECV_RDPMC))
|
17877 |
|
|
(set (match_operand:DI 1 "register_operand" "=d")
|
17878 |
|
|
(unspec_volatile:DI [(const_int 0)] UNSPECV_RDPMC))]
|
17879 |
|
|
"TARGET_64BIT"
|
17880 |
|
|
"rdpmc"
|
17881 |
|
|
[(set_attr "type" "other")
|
17882 |
|
|
(set_attr "length" "2")])
|
17883 |
|
|
|
17884 |
|
|
(define_expand "rdtsc"
|
17885 |
|
|
[(set (match_operand:DI 0 "register_operand" "")
|
17886 |
|
|
(unspec_volatile:DI [(const_int 0)] UNSPECV_RDTSC))]
|
17887 |
|
|
""
|
17888 |
|
|
{
|
17889 |
|
|
if (TARGET_64BIT)
|
17890 |
|
|
{
|
17891 |
|
|
rtvec vec = rtvec_alloc (2);
|
17892 |
|
|
rtx load = gen_rtx_PARALLEL (VOIDmode, vec);
|
17893 |
|
|
rtx upper = gen_reg_rtx (DImode);
|
17894 |
|
|
rtx lower = gen_reg_rtx (DImode);
|
17895 |
|
|
rtx src = gen_rtx_UNSPEC_VOLATILE (DImode,
|
17896 |
|
|
gen_rtvec (1, const0_rtx),
|
17897 |
|
|
UNSPECV_RDTSC);
|
17898 |
|
|
RTVEC_ELT (vec, 0) = gen_rtx_SET (VOIDmode, lower, src);
|
17899 |
|
|
RTVEC_ELT (vec, 1) = gen_rtx_SET (VOIDmode, upper, src);
|
17900 |
|
|
emit_insn (load);
|
17901 |
|
|
upper = expand_simple_binop (DImode, ASHIFT, upper, GEN_INT (32),
|
17902 |
|
|
NULL, 1, OPTAB_DIRECT);
|
17903 |
|
|
lower = expand_simple_binop (DImode, IOR, lower, upper, lower, 1,
|
17904 |
|
|
OPTAB_DIRECT);
|
17905 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0], lower));
|
17906 |
|
|
DONE;
|
17907 |
|
|
}
|
17908 |
|
|
})
|
17909 |
|
|
|
17910 |
|
|
(define_insn "*rdtsc"
|
17911 |
|
|
[(set (match_operand:DI 0 "register_operand" "=A")
|
17912 |
|
|
(unspec_volatile:DI [(const_int 0)] UNSPECV_RDTSC))]
|
17913 |
|
|
"!TARGET_64BIT"
|
17914 |
|
|
"rdtsc"
|
17915 |
|
|
[(set_attr "type" "other")
|
17916 |
|
|
(set_attr "length" "2")])
|
17917 |
|
|
|
17918 |
|
|
(define_insn "*rdtsc_rex64"
|
17919 |
|
|
[(set (match_operand:DI 0 "register_operand" "=a")
|
17920 |
|
|
(unspec_volatile:DI [(const_int 0)] UNSPECV_RDTSC))
|
17921 |
|
|
(set (match_operand:DI 1 "register_operand" "=d")
|
17922 |
|
|
(unspec_volatile:DI [(const_int 0)] UNSPECV_RDTSC))]
|
17923 |
|
|
"TARGET_64BIT"
|
17924 |
|
|
"rdtsc"
|
17925 |
|
|
[(set_attr "type" "other")
|
17926 |
|
|
(set_attr "length" "2")])
|
17927 |
|
|
|
17928 |
|
|
(define_expand "rdtscp"
|
17929 |
|
|
[(match_operand:DI 0 "register_operand" "")
|
17930 |
|
|
(match_operand:SI 1 "memory_operand" "")]
|
17931 |
|
|
""
|
17932 |
|
|
{
|
17933 |
|
|
rtx di = gen_rtx_UNSPEC_VOLATILE (DImode,
|
17934 |
|
|
gen_rtvec (1, const0_rtx),
|
17935 |
|
|
UNSPECV_RDTSCP);
|
17936 |
|
|
rtx si = gen_rtx_UNSPEC_VOLATILE (SImode,
|
17937 |
|
|
gen_rtvec (1, const0_rtx),
|
17938 |
|
|
UNSPECV_RDTSCP);
|
17939 |
|
|
rtx reg = gen_reg_rtx (DImode);
|
17940 |
|
|
rtx tmp = gen_reg_rtx (SImode);
|
17941 |
|
|
|
17942 |
|
|
if (TARGET_64BIT)
|
17943 |
|
|
{
|
17944 |
|
|
rtvec vec = rtvec_alloc (3);
|
17945 |
|
|
rtx load = gen_rtx_PARALLEL (VOIDmode, vec);
|
17946 |
|
|
rtx upper = gen_reg_rtx (DImode);
|
17947 |
|
|
RTVEC_ELT (vec, 0) = gen_rtx_SET (VOIDmode, reg, di);
|
17948 |
|
|
RTVEC_ELT (vec, 1) = gen_rtx_SET (VOIDmode, upper, di);
|
17949 |
|
|
RTVEC_ELT (vec, 2) = gen_rtx_SET (VOIDmode, tmp, si);
|
17950 |
|
|
emit_insn (load);
|
17951 |
|
|
upper = expand_simple_binop (DImode, ASHIFT, upper, GEN_INT (32),
|
17952 |
|
|
NULL, 1, OPTAB_DIRECT);
|
17953 |
|
|
reg = expand_simple_binop (DImode, IOR, reg, upper, reg, 1,
|
17954 |
|
|
OPTAB_DIRECT);
|
17955 |
|
|
}
|
17956 |
|
|
else
|
17957 |
|
|
{
|
17958 |
|
|
rtvec vec = rtvec_alloc (2);
|
17959 |
|
|
rtx load = gen_rtx_PARALLEL (VOIDmode, vec);
|
17960 |
|
|
RTVEC_ELT (vec, 0) = gen_rtx_SET (VOIDmode, reg, di);
|
17961 |
|
|
RTVEC_ELT (vec, 1) = gen_rtx_SET (VOIDmode, tmp, si);
|
17962 |
|
|
emit_insn (load);
|
17963 |
|
|
}
|
17964 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0], reg));
|
17965 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[1], tmp));
|
17966 |
|
|
DONE;
|
17967 |
|
|
})
|
17968 |
|
|
|
17969 |
|
|
(define_insn "*rdtscp"
|
17970 |
|
|
[(set (match_operand:DI 0 "register_operand" "=A")
|
17971 |
|
|
(unspec_volatile:DI [(const_int 0)] UNSPECV_RDTSCP))
|
17972 |
|
|
(set (match_operand:SI 1 "register_operand" "=c")
|
17973 |
|
|
(unspec_volatile:SI [(const_int 0)] UNSPECV_RDTSCP))]
|
17974 |
|
|
"!TARGET_64BIT"
|
17975 |
|
|
"rdtscp"
|
17976 |
|
|
[(set_attr "type" "other")
|
17977 |
|
|
(set_attr "length" "3")])
|
17978 |
|
|
|
17979 |
|
|
(define_insn "*rdtscp_rex64"
|
17980 |
|
|
[(set (match_operand:DI 0 "register_operand" "=a")
|
17981 |
|
|
(unspec_volatile:DI [(const_int 0)] UNSPECV_RDTSCP))
|
17982 |
|
|
(set (match_operand:DI 1 "register_operand" "=d")
|
17983 |
|
|
(unspec_volatile:DI [(const_int 0)] UNSPECV_RDTSCP))
|
17984 |
|
|
(set (match_operand:SI 2 "register_operand" "=c")
|
17985 |
|
|
(unspec_volatile:SI [(const_int 0)] UNSPECV_RDTSCP))]
|
17986 |
|
|
"TARGET_64BIT"
|
17987 |
|
|
"rdtscp"
|
17988 |
|
|
[(set_attr "type" "other")
|
17989 |
|
|
(set_attr "length" "3")])
|
17990 |
|
|
|
17991 |
|
|
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
17992 |
|
|
;;
|
17993 |
|
|
;; LWP instructions
|
17994 |
|
|
;;
|
17995 |
|
|
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
17996 |
|
|
|
17997 |
|
|
(define_expand "lwp_llwpcb"
|
17998 |
|
|
[(unspec_volatile [(match_operand 0 "register_operand" "r")]
|
17999 |
|
|
UNSPECV_LLWP_INTRINSIC)]
|
18000 |
|
|
"TARGET_LWP")
|
18001 |
|
|
|
18002 |
|
|
(define_insn "*lwp_llwpcb1"
|
18003 |
|
|
[(unspec_volatile [(match_operand:P 0 "register_operand" "r")]
|
18004 |
|
|
UNSPECV_LLWP_INTRINSIC)]
|
18005 |
|
|
"TARGET_LWP"
|
18006 |
|
|
"llwpcb\t%0"
|
18007 |
|
|
[(set_attr "type" "lwp")
|
18008 |
|
|
(set_attr "mode" "")
|
18009 |
|
|
(set_attr "length" "5")])
|
18010 |
|
|
|
18011 |
|
|
(define_expand "lwp_slwpcb"
|
18012 |
|
|
[(set (match_operand 0 "register_operand" "=r")
|
18013 |
|
|
(unspec_volatile [(const_int 0)] UNSPECV_SLWP_INTRINSIC))]
|
18014 |
|
|
"TARGET_LWP"
|
18015 |
|
|
{
|
18016 |
|
|
rtx (*insn)(rtx);
|
18017 |
|
|
|
18018 |
|
|
insn = (TARGET_64BIT
|
18019 |
|
|
? gen_lwp_slwpcbdi
|
18020 |
|
|
: gen_lwp_slwpcbsi);
|
18021 |
|
|
|
18022 |
|
|
emit_insn (insn (operands[0]));
|
18023 |
|
|
DONE;
|
18024 |
|
|
})
|
18025 |
|
|
|
18026 |
|
|
(define_insn "lwp_slwpcb"
|
18027 |
|
|
[(set (match_operand:P 0 "register_operand" "=r")
|
18028 |
|
|
(unspec_volatile:P [(const_int 0)] UNSPECV_SLWP_INTRINSIC))]
|
18029 |
|
|
"TARGET_LWP"
|
18030 |
|
|
"slwpcb\t%0"
|
18031 |
|
|
[(set_attr "type" "lwp")
|
18032 |
|
|
(set_attr "mode" "")
|
18033 |
|
|
(set_attr "length" "5")])
|
18034 |
|
|
|
18035 |
|
|
(define_expand "lwp_lwpval3"
|
18036 |
|
|
[(unspec_volatile [(match_operand:SWI48 1 "register_operand" "r")
|
18037 |
|
|
(match_operand:SI 2 "nonimmediate_operand" "rm")
|
18038 |
|
|
(match_operand:SI 3 "const_int_operand" "i")]
|
18039 |
|
|
UNSPECV_LWPVAL_INTRINSIC)]
|
18040 |
|
|
"TARGET_LWP"
|
18041 |
|
|
;; Avoid unused variable warning.
|
18042 |
|
|
"(void) operands[0];")
|
18043 |
|
|
|
18044 |
|
|
(define_insn "*lwp_lwpval3_1"
|
18045 |
|
|
[(unspec_volatile [(match_operand:SWI48 0 "register_operand" "r")
|
18046 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "rm")
|
18047 |
|
|
(match_operand:SI 2 "const_int_operand" "i")]
|
18048 |
|
|
UNSPECV_LWPVAL_INTRINSIC)]
|
18049 |
|
|
"TARGET_LWP"
|
18050 |
|
|
"lwpval\t{%2, %1, %0|%0, %1, %2}"
|
18051 |
|
|
[(set_attr "type" "lwp")
|
18052 |
|
|
(set_attr "mode" "")
|
18053 |
|
|
(set (attr "length")
|
18054 |
|
|
(symbol_ref "ix86_attr_length_address_default (insn) + 9"))])
|
18055 |
|
|
|
18056 |
|
|
(define_expand "lwp_lwpins3"
|
18057 |
|
|
[(set (reg:CCC FLAGS_REG)
|
18058 |
|
|
(unspec_volatile:CCC [(match_operand:SWI48 1 "register_operand" "r")
|
18059 |
|
|
(match_operand:SI 2 "nonimmediate_operand" "rm")
|
18060 |
|
|
(match_operand:SI 3 "const_int_operand" "i")]
|
18061 |
|
|
UNSPECV_LWPINS_INTRINSIC))
|
18062 |
|
|
(set (match_operand:QI 0 "nonimmediate_operand" "=qm")
|
18063 |
|
|
(eq:QI (reg:CCC FLAGS_REG) (const_int 0)))]
|
18064 |
|
|
"TARGET_LWP")
|
18065 |
|
|
|
18066 |
|
|
(define_insn "*lwp_lwpins3_1"
|
18067 |
|
|
[(set (reg:CCC FLAGS_REG)
|
18068 |
|
|
(unspec_volatile:CCC [(match_operand:SWI48 0 "register_operand" "r")
|
18069 |
|
|
(match_operand:SI 1 "nonimmediate_operand" "rm")
|
18070 |
|
|
(match_operand:SI 2 "const_int_operand" "i")]
|
18071 |
|
|
UNSPECV_LWPINS_INTRINSIC))]
|
18072 |
|
|
"TARGET_LWP"
|
18073 |
|
|
"lwpins\t{%2, %1, %0|%0, %1, %2}"
|
18074 |
|
|
[(set_attr "type" "lwp")
|
18075 |
|
|
(set_attr "mode" "")
|
18076 |
|
|
(set (attr "length")
|
18077 |
|
|
(symbol_ref "ix86_attr_length_address_default (insn) + 9"))])
|
18078 |
|
|
|
18079 |
|
|
(define_insn "rdfsbase"
|
18080 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
18081 |
|
|
(unspec_volatile:SWI48 [(const_int 0)] UNSPECV_RDFSBASE))]
|
18082 |
|
|
"TARGET_64BIT && TARGET_FSGSBASE"
|
18083 |
|
|
"rdfsbase %0"
|
18084 |
|
|
[(set_attr "type" "other")
|
18085 |
|
|
(set_attr "prefix_extra" "2")])
|
18086 |
|
|
|
18087 |
|
|
(define_insn "rdgsbase"
|
18088 |
|
|
[(set (match_operand:SWI48 0 "register_operand" "=r")
|
18089 |
|
|
(unspec_volatile:SWI48 [(const_int 0)] UNSPECV_RDGSBASE))]
|
18090 |
|
|
"TARGET_64BIT && TARGET_FSGSBASE"
|
18091 |
|
|
"rdgsbase %0"
|
18092 |
|
|
[(set_attr "type" "other")
|
18093 |
|
|
(set_attr "prefix_extra" "2")])
|
18094 |
|
|
|
18095 |
|
|
(define_insn "wrfsbase"
|
18096 |
|
|
[(unspec_volatile [(match_operand:SWI48 0 "register_operand" "r")]
|
18097 |
|
|
UNSPECV_WRFSBASE)]
|
18098 |
|
|
"TARGET_64BIT && TARGET_FSGSBASE"
|
18099 |
|
|
"wrfsbase %0"
|
18100 |
|
|
[(set_attr "type" "other")
|
18101 |
|
|
(set_attr "prefix_extra" "2")])
|
18102 |
|
|
|
18103 |
|
|
(define_insn "wrgsbase"
|
18104 |
|
|
[(unspec_volatile [(match_operand:SWI48 0 "register_operand" "r")]
|
18105 |
|
|
UNSPECV_WRGSBASE)]
|
18106 |
|
|
"TARGET_64BIT && TARGET_FSGSBASE"
|
18107 |
|
|
"wrgsbase %0"
|
18108 |
|
|
[(set_attr "type" "other")
|
18109 |
|
|
(set_attr "prefix_extra" "2")])
|
18110 |
|
|
|
18111 |
|
|
(define_insn "rdrand_1"
|
18112 |
|
|
[(set (match_operand:SWI248 0 "register_operand" "=r")
|
18113 |
|
|
(unspec:SWI248 [(const_int 0)] UNSPEC_RDRAND))
|
18114 |
|
|
(set (reg:CCC FLAGS_REG)
|
18115 |
|
|
(unspec:CCC [(const_int 0)] UNSPEC_RDRAND))]
|
18116 |
|
|
"TARGET_RDRND"
|
18117 |
|
|
"rdrand\t%0"
|
18118 |
|
|
[(set_attr "type" "other")
|
18119 |
|
|
(set_attr "prefix_extra" "1")])
|
18120 |
|
|
|
18121 |
|
|
(define_expand "pause"
|
18122 |
|
|
[(set (match_dup 0)
|
18123 |
|
|
(unspec:BLK [(match_dup 0)] UNSPEC_PAUSE))]
|
18124 |
|
|
""
|
18125 |
|
|
{
|
18126 |
|
|
operands[0] = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (Pmode));
|
18127 |
|
|
MEM_VOLATILE_P (operands[0]) = 1;
|
18128 |
|
|
})
|
18129 |
|
|
|
18130 |
|
|
;; Use "rep; nop", instead of "pause", to support older assemblers.
|
18131 |
|
|
;; They have the same encoding.
|
18132 |
|
|
(define_insn "*pause"
|
18133 |
|
|
[(set (match_operand:BLK 0 "" "")
|
18134 |
|
|
(unspec:BLK [(match_dup 0)] UNSPEC_PAUSE))]
|
18135 |
|
|
""
|
18136 |
|
|
"rep; nop"
|
18137 |
|
|
[(set_attr "length" "2")
|
18138 |
|
|
(set_attr "memory" "unknown")])
|
18139 |
|
|
|
18140 |
|
|
(include "mmx.md")
|
18141 |
|
|
(include "sse.md")
|
18142 |
|
|
(include "sync.md")
|