1 |
282 |
jeremybenn |
;; Copyright (C) 2006, 2007, 2008, 2009 Free Software Foundation, Inc.
|
2 |
|
|
|
3 |
|
|
;; This file is free software; you can redistribute it and/or modify it under
|
4 |
|
|
;; the terms of the GNU General Public License as published by the Free
|
5 |
|
|
;; Software Foundation; either version 3 of the License, or (at your option)
|
6 |
|
|
;; any later version.
|
7 |
|
|
|
8 |
|
|
;; This file is distributed in the hope that it will be useful, but WITHOUT
|
9 |
|
|
;; ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
10 |
|
|
;; FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
11 |
|
|
;; for more details.
|
12 |
|
|
|
13 |
|
|
;; You should have received a copy of the GNU General Public License
|
14 |
|
|
;; along with GCC; see the file COPYING3. If not see
|
15 |
|
|
;; .
|
16 |
|
|
|
17 |
|
|
;;- See file "rtl.def" for documentation on define_insn, match_*, et. al.
|
18 |
|
|
|
19 |
|
|
|
20 |
|
|
;; Define an insn type attribute. This is used in function unit delay
|
21 |
|
|
;; computations.
|
22 |
|
|
;; multi0 is a multiple insn rtl whose first insn is in pipe0
|
23 |
|
|
;; multi1 is a multiple insn rtl whose first insn is in pipe1
|
24 |
|
|
(define_attr "type" "fx2,shuf,fx3,load,store,br,spr,lnop,nop,fxb,fp6,fp7,fpd,iprefetch,multi0,multi1,hbr,convert"
|
25 |
|
|
(const_string "fx2"))
|
26 |
|
|
|
27 |
|
|
;; Length (in bytes).
|
28 |
|
|
(define_attr "length" ""
|
29 |
|
|
(const_int 4))
|
30 |
|
|
|
31 |
|
|
(define_attr "tune" "cell,celledp" (const (symbol_ref "spu_tune")))
|
32 |
|
|
;; Processor type -- this attribute must exactly match the processor_type
|
33 |
|
|
;; enumeration in spu.h.
|
34 |
|
|
|
35 |
|
|
(define_attr "cpu" "spu"
|
36 |
|
|
(const (symbol_ref "spu_cpu_attr")))
|
37 |
|
|
|
38 |
|
|
; (define_function_unit NAME MULTIPLICITY SIMULTANEITY
|
39 |
|
|
; TEST READY-DELAY ISSUE-DELAY [CONFLICT-LIST])
|
40 |
|
|
|
41 |
|
|
(define_cpu_unit "pipe0,pipe1,fp,ls")
|
42 |
|
|
|
43 |
|
|
(define_insn_reservation "NOP" 1 (eq_attr "type" "nop")
|
44 |
|
|
"pipe0")
|
45 |
|
|
|
46 |
|
|
(define_insn_reservation "FX2" 2 (eq_attr "type" "fx2")
|
47 |
|
|
"pipe0, nothing")
|
48 |
|
|
|
49 |
|
|
(define_insn_reservation "FX3" 4 (eq_attr "type" "fx3,fxb")
|
50 |
|
|
"pipe0, nothing*3")
|
51 |
|
|
|
52 |
|
|
(define_insn_reservation "FP6" 6 (eq_attr "type" "fp6")
|
53 |
|
|
"pipe0 + fp, nothing*5")
|
54 |
|
|
|
55 |
|
|
(define_insn_reservation "FP7" 7 (eq_attr "type" "fp7")
|
56 |
|
|
"pipe0, fp, nothing*5")
|
57 |
|
|
|
58 |
|
|
;; The behavior of the double precision is that both pipes stall
|
59 |
|
|
;; for 6 cycles and the rest of the operation pipelines for
|
60 |
|
|
;; 7 cycles. The simplest way to model this is to simply ignore
|
61 |
|
|
;; the 6 cyle stall.
|
62 |
|
|
(define_insn_reservation "FPD" 7
|
63 |
|
|
(and (eq_attr "tune" "cell")
|
64 |
|
|
(eq_attr "type" "fpd"))
|
65 |
|
|
"pipe0 + pipe1, fp, nothing*5")
|
66 |
|
|
|
67 |
|
|
;; Tune for CELLEDP, 9 cycles, dual-issuable, fully pipelined
|
68 |
|
|
(define_insn_reservation "FPD_CELLEDP" 9
|
69 |
|
|
(and (eq_attr "tune" "celledp")
|
70 |
|
|
(eq_attr "type" "fpd"))
|
71 |
|
|
"pipe0 + fp, nothing*8")
|
72 |
|
|
|
73 |
|
|
(define_insn_reservation "LNOP" 1 (eq_attr "type" "lnop")
|
74 |
|
|
"pipe1")
|
75 |
|
|
|
76 |
|
|
(define_insn_reservation "STORE" 1 (eq_attr "type" "store")
|
77 |
|
|
"pipe1 + ls")
|
78 |
|
|
|
79 |
|
|
(define_insn_reservation "IPREFETCH" 1 (eq_attr "type" "iprefetch")
|
80 |
|
|
"pipe1 + ls")
|
81 |
|
|
|
82 |
|
|
(define_insn_reservation "SHUF" 4 (eq_attr "type" "shuf,br,spr")
|
83 |
|
|
"pipe1, nothing*3")
|
84 |
|
|
|
85 |
|
|
(define_insn_reservation "LOAD" 6 (eq_attr "type" "load")
|
86 |
|
|
"pipe1 + ls, nothing*5")
|
87 |
|
|
|
88 |
|
|
(define_insn_reservation "HBR" 18 (eq_attr "type" "hbr")
|
89 |
|
|
"pipe1, nothing*15")
|
90 |
|
|
|
91 |
|
|
(define_insn_reservation "MULTI0" 4 (eq_attr "type" "multi0")
|
92 |
|
|
"pipe0+pipe1, nothing*3")
|
93 |
|
|
|
94 |
|
|
(define_insn_reservation "MULTI1" 4 (eq_attr "type" "multi1")
|
95 |
|
|
"pipe1, nothing*3")
|
96 |
|
|
|
97 |
|
|
(define_insn_reservation "CONVERT" 0 (eq_attr "type" "convert")
|
98 |
|
|
"nothing")
|
99 |
|
|
|
100 |
|
|
;; Force pipe0 to occur before pipe 1 in a cycle.
|
101 |
|
|
(absence_set "pipe0" "pipe1")
|
102 |
|
|
|
103 |
|
|
|
104 |
|
|
(define_constants [
|
105 |
|
|
(UNSPEC_BLOCKAGE 0)
|
106 |
|
|
(UNSPEC_IPREFETCH 1)
|
107 |
|
|
(UNSPEC_FREST 2)
|
108 |
|
|
(UNSPEC_FRSQEST 3)
|
109 |
|
|
(UNSPEC_FI 4)
|
110 |
|
|
(UNSPEC_EXTEND_CMP 5)
|
111 |
|
|
(UNSPEC_CG 6)
|
112 |
|
|
(UNSPEC_CGX 7)
|
113 |
|
|
(UNSPEC_ADDX 8)
|
114 |
|
|
(UNSPEC_BG 9)
|
115 |
|
|
(UNSPEC_BGX 10)
|
116 |
|
|
(UNSPEC_SFX 11)
|
117 |
|
|
(UNSPEC_FSM 12)
|
118 |
|
|
(UNSPEC_HBR 13)
|
119 |
|
|
(UNSPEC_LNOP 14)
|
120 |
|
|
(UNSPEC_NOP 15)
|
121 |
|
|
(UNSPEC_CONVERT 16)
|
122 |
|
|
(UNSPEC_SELB 17)
|
123 |
|
|
(UNSPEC_SHUFB 18)
|
124 |
|
|
(UNSPEC_CPAT 19)
|
125 |
|
|
(UNSPEC_SYNC 20)
|
126 |
|
|
(UNSPEC_CNTB 21)
|
127 |
|
|
(UNSPEC_SUMB 22)
|
128 |
|
|
(UNSPEC_FSMB 23)
|
129 |
|
|
(UNSPEC_FSMH 24)
|
130 |
|
|
(UNSPEC_GBB 25)
|
131 |
|
|
(UNSPEC_GBH 26)
|
132 |
|
|
(UNSPEC_GB 27)
|
133 |
|
|
(UNSPEC_AVGB 28)
|
134 |
|
|
(UNSPEC_ABSDB 29)
|
135 |
|
|
(UNSPEC_ORX 30)
|
136 |
|
|
(UNSPEC_HEQ 31)
|
137 |
|
|
(UNSPEC_HGT 32)
|
138 |
|
|
(UNSPEC_HLGT 33)
|
139 |
|
|
(UNSPEC_STOP 38)
|
140 |
|
|
(UNSPEC_STOPD 39)
|
141 |
|
|
(UNSPEC_SET_INTR 40)
|
142 |
|
|
(UNSPEC_FSCRRD 42)
|
143 |
|
|
(UNSPEC_FSCRWR 43)
|
144 |
|
|
(UNSPEC_MFSPR 44)
|
145 |
|
|
(UNSPEC_MTSPR 45)
|
146 |
|
|
(UNSPEC_RDCH 46)
|
147 |
|
|
(UNSPEC_RCHCNT 47)
|
148 |
|
|
(UNSPEC_WRCH 48)
|
149 |
|
|
(UNSPEC_SPU_REALIGN_LOAD 49)
|
150 |
|
|
(UNSPEC_SPU_MASK_FOR_LOAD 50)
|
151 |
|
|
(UNSPEC_DFTSV 51)
|
152 |
|
|
(UNSPEC_FLOAT_EXTEND 52)
|
153 |
|
|
(UNSPEC_FLOAT_TRUNCATE 53)
|
154 |
|
|
(UNSPEC_SP_SET 54)
|
155 |
|
|
(UNSPEC_SP_TEST 55)
|
156 |
|
|
])
|
157 |
|
|
|
158 |
|
|
(include "predicates.md")
|
159 |
|
|
(include "constraints.md")
|
160 |
|
|
|
161 |
|
|
|
162 |
|
|
;; Mode iterators
|
163 |
|
|
|
164 |
|
|
(define_mode_iterator ALL [QI V16QI
|
165 |
|
|
HI V8HI
|
166 |
|
|
SI V4SI
|
167 |
|
|
DI V2DI
|
168 |
|
|
TI
|
169 |
|
|
SF V4SF
|
170 |
|
|
DF V2DF])
|
171 |
|
|
|
172 |
|
|
; Everything except DI and TI which are handled separately because
|
173 |
|
|
; they need different constraints to correctly test VOIDmode constants
|
174 |
|
|
(define_mode_iterator MOV [QI V16QI
|
175 |
|
|
HI V8HI
|
176 |
|
|
SI V4SI
|
177 |
|
|
V2DI
|
178 |
|
|
SF V4SF
|
179 |
|
|
DF V2DF])
|
180 |
|
|
|
181 |
|
|
(define_mode_iterator QHSI [QI HI SI])
|
182 |
|
|
(define_mode_iterator QHSDI [QI HI SI DI])
|
183 |
|
|
(define_mode_iterator DTI [DI TI])
|
184 |
|
|
|
185 |
|
|
(define_mode_iterator VINT [QI V16QI
|
186 |
|
|
HI V8HI
|
187 |
|
|
SI V4SI
|
188 |
|
|
DI V2DI
|
189 |
|
|
TI])
|
190 |
|
|
|
191 |
|
|
(define_mode_iterator VQHSI [QI V16QI
|
192 |
|
|
HI V8HI
|
193 |
|
|
SI V4SI])
|
194 |
|
|
|
195 |
|
|
(define_mode_iterator VHSI [HI V8HI
|
196 |
|
|
SI V4SI])
|
197 |
|
|
|
198 |
|
|
(define_mode_iterator VSDF [SF V4SF
|
199 |
|
|
DF V2DF])
|
200 |
|
|
|
201 |
|
|
(define_mode_iterator VSI [SI V4SI])
|
202 |
|
|
(define_mode_iterator VDI [DI V2DI])
|
203 |
|
|
(define_mode_iterator VSF [SF V4SF])
|
204 |
|
|
(define_mode_iterator VDF [DF V2DF])
|
205 |
|
|
|
206 |
|
|
(define_mode_iterator VCMP [V16QI
|
207 |
|
|
V8HI
|
208 |
|
|
V4SI
|
209 |
|
|
V4SF
|
210 |
|
|
V2DF])
|
211 |
|
|
|
212 |
|
|
(define_mode_iterator VCMPU [V16QI
|
213 |
|
|
V8HI
|
214 |
|
|
V4SI])
|
215 |
|
|
|
216 |
|
|
(define_mode_attr v [(V8HI "v") (V4SI "v")
|
217 |
|
|
(HI "") (SI "")])
|
218 |
|
|
|
219 |
|
|
(define_mode_attr bh [(QI "b") (V16QI "b")
|
220 |
|
|
(HI "h") (V8HI "h")
|
221 |
|
|
(SI "") (V4SI "")])
|
222 |
|
|
|
223 |
|
|
(define_mode_attr d [(SF "") (V4SF "")
|
224 |
|
|
(DF "d") (V2DF "d")])
|
225 |
|
|
(define_mode_attr d6 [(SF "6") (V4SF "6")
|
226 |
|
|
(DF "d") (V2DF "d")])
|
227 |
|
|
|
228 |
|
|
(define_mode_attr f2i [(SF "si") (V4SF "v4si")
|
229 |
|
|
(DF "di") (V2DF "v2di")])
|
230 |
|
|
(define_mode_attr F2I [(SF "SI") (V4SF "V4SI")
|
231 |
|
|
(DF "DI") (V2DF "V2DI")])
|
232 |
|
|
(define_mode_attr i2f [(SI "sf") (V4SI "v4sf")
|
233 |
|
|
(DI "df") (V2DI "v2df")])
|
234 |
|
|
(define_mode_attr I2F [(SI "SF") (V4SI "V4SF")
|
235 |
|
|
(DI "DF") (V2DI "V2DF")])
|
236 |
|
|
|
237 |
|
|
(define_mode_attr DF2I [(DF "SI") (V2DF "V2DI")])
|
238 |
|
|
|
239 |
|
|
(define_mode_attr umask [(HI "f") (V8HI "f")
|
240 |
|
|
(SI "g") (V4SI "g")])
|
241 |
|
|
(define_mode_attr nmask [(HI "F") (V8HI "F")
|
242 |
|
|
(SI "G") (V4SI "G")])
|
243 |
|
|
|
244 |
|
|
;; Used for carry and borrow instructions.
|
245 |
|
|
(define_mode_iterator CBOP [SI DI V4SI V2DI])
|
246 |
|
|
|
247 |
|
|
;; Used in vec_set and vec_extract
|
248 |
|
|
(define_mode_iterator V [V2DI V4SI V8HI V16QI V2DF V4SF])
|
249 |
|
|
(define_mode_attr inner [(V16QI "QI")
|
250 |
|
|
(V8HI "HI")
|
251 |
|
|
(V4SI "SI")
|
252 |
|
|
(V2DI "DI")
|
253 |
|
|
(V4SF "SF")
|
254 |
|
|
(V2DF "DF")])
|
255 |
|
|
(define_mode_attr vmult [(V16QI "1")
|
256 |
|
|
(V8HI "2")
|
257 |
|
|
(V4SI "4")
|
258 |
|
|
(V2DI "8")
|
259 |
|
|
(V4SF "4")
|
260 |
|
|
(V2DF "8")])
|
261 |
|
|
(define_mode_attr voff [(V16QI "13")
|
262 |
|
|
(V8HI "14")
|
263 |
|
|
(V4SI "0")
|
264 |
|
|
(V2DI "0")
|
265 |
|
|
(V4SF "0")
|
266 |
|
|
(V2DF "0")])
|
267 |
|
|
|
268 |
|
|
|
269 |
|
|
;; mov
|
270 |
|
|
|
271 |
|
|
(define_expand "mov"
|
272 |
|
|
[(set (match_operand:ALL 0 "spu_nonimm_operand" "=r,r,r,m")
|
273 |
|
|
(match_operand:ALL 1 "general_operand" "r,i,m,r"))]
|
274 |
|
|
""
|
275 |
|
|
{
|
276 |
|
|
if (spu_expand_mov(operands, mode))
|
277 |
|
|
DONE;
|
278 |
|
|
})
|
279 |
|
|
|
280 |
|
|
(define_split
|
281 |
|
|
[(set (match_operand 0 "spu_reg_operand")
|
282 |
|
|
(match_operand 1 "immediate_operand"))]
|
283 |
|
|
|
284 |
|
|
""
|
285 |
|
|
[(set (match_dup 0)
|
286 |
|
|
(high (match_dup 1)))
|
287 |
|
|
(set (match_dup 0)
|
288 |
|
|
(lo_sum (match_dup 0)
|
289 |
|
|
(match_dup 1)))]
|
290 |
|
|
{
|
291 |
|
|
if (spu_split_immediate (operands))
|
292 |
|
|
DONE;
|
293 |
|
|
FAIL;
|
294 |
|
|
})
|
295 |
|
|
|
296 |
|
|
(define_insn "pic"
|
297 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
298 |
|
|
(match_operand:SI 1 "immediate_operand" "s"))
|
299 |
|
|
(use (const_int 0))]
|
300 |
|
|
"flag_pic"
|
301 |
|
|
"ila\t%0,%%pic(%1)")
|
302 |
|
|
|
303 |
|
|
;; Whenever a function generates the 'pic' pattern above we need to
|
304 |
|
|
;; load the pic_offset_table register.
|
305 |
|
|
;; GCC doesn't deal well with labels in the middle of a block so we
|
306 |
|
|
;; hardcode the offsets in the asm here.
|
307 |
|
|
(define_insn "load_pic_offset"
|
308 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
309 |
|
|
(unspec:SI [(const_int 0)] 0))
|
310 |
|
|
(set (match_operand:SI 1 "spu_reg_operand" "=r")
|
311 |
|
|
(unspec:SI [(const_int 0)] 0))]
|
312 |
|
|
"flag_pic"
|
313 |
|
|
"ila\t%1,.+8\;brsl\t%0,4"
|
314 |
|
|
[(set_attr "length" "8")
|
315 |
|
|
(set_attr "type" "multi0")])
|
316 |
|
|
|
317 |
|
|
|
318 |
|
|
;; move internal
|
319 |
|
|
|
320 |
|
|
(define_insn "_mov"
|
321 |
|
|
[(set (match_operand:MOV 0 "spu_dest_operand" "=r,r,r,r,r,m")
|
322 |
|
|
(match_operand:MOV 1 "spu_mov_operand" "r,A,f,j,m,r"))]
|
323 |
|
|
"register_operand(operands[0], mode)
|
324 |
|
|
|| register_operand(operands[1], mode)"
|
325 |
|
|
"@
|
326 |
|
|
ori\t%0,%1,0
|
327 |
|
|
il%s1\t%0,%S1
|
328 |
|
|
fsmbi\t%0,%S1
|
329 |
|
|
c%s1d\t%0,%S1($sp)
|
330 |
|
|
lq%p1\t%0,%1
|
331 |
|
|
stq%p0\t%1,%0"
|
332 |
|
|
[(set_attr "type" "fx2,fx2,shuf,shuf,load,store")])
|
333 |
|
|
|
334 |
|
|
(define_insn "low_"
|
335 |
|
|
[(set (match_operand:VSI 0 "spu_reg_operand" "=r")
|
336 |
|
|
(lo_sum:VSI (match_operand:VSI 1 "spu_reg_operand" "0")
|
337 |
|
|
(match_operand:VSI 2 "immediate_operand" "i")))]
|
338 |
|
|
""
|
339 |
|
|
"iohl\t%0,%2@l")
|
340 |
|
|
|
341 |
|
|
(define_insn "_movdi"
|
342 |
|
|
[(set (match_operand:DI 0 "spu_dest_operand" "=r,r,r,r,r,m")
|
343 |
|
|
(match_operand:DI 1 "spu_mov_operand" "r,a,f,k,m,r"))]
|
344 |
|
|
"register_operand(operands[0], DImode)
|
345 |
|
|
|| register_operand(operands[1], DImode)"
|
346 |
|
|
"@
|
347 |
|
|
ori\t%0,%1,0
|
348 |
|
|
il%d1\t%0,%D1
|
349 |
|
|
fsmbi\t%0,%D1
|
350 |
|
|
c%d1d\t%0,%D1($sp)
|
351 |
|
|
lq%p1\t%0,%1
|
352 |
|
|
stq%p0\t%1,%0"
|
353 |
|
|
[(set_attr "type" "fx2,fx2,shuf,shuf,load,store")])
|
354 |
|
|
|
355 |
|
|
(define_insn "_movti"
|
356 |
|
|
[(set (match_operand:TI 0 "spu_dest_operand" "=r,r,r,r,r,m")
|
357 |
|
|
(match_operand:TI 1 "spu_mov_operand" "r,U,f,l,m,r"))]
|
358 |
|
|
"register_operand(operands[0], TImode)
|
359 |
|
|
|| register_operand(operands[1], TImode)"
|
360 |
|
|
"@
|
361 |
|
|
ori\t%0,%1,0
|
362 |
|
|
il%t1\t%0,%T1
|
363 |
|
|
fsmbi\t%0,%T1
|
364 |
|
|
c%t1d\t%0,%T1($sp)
|
365 |
|
|
lq%p1\t%0,%1
|
366 |
|
|
stq%p0\t%1,%0"
|
367 |
|
|
[(set_attr "type" "fx2,fx2,shuf,shuf,load,store")])
|
368 |
|
|
|
369 |
|
|
(define_split
|
370 |
|
|
[(set (match_operand 0 "spu_reg_operand")
|
371 |
|
|
(match_operand 1 "memory_operand"))]
|
372 |
|
|
"GET_MODE_SIZE (GET_MODE (operands[0])) < 16
|
373 |
|
|
&& GET_MODE(operands[0]) == GET_MODE(operands[1])
|
374 |
|
|
&& !reload_in_progress && !reload_completed"
|
375 |
|
|
[(set (match_dup 0)
|
376 |
|
|
(match_dup 1))]
|
377 |
|
|
{ if (spu_split_load(operands))
|
378 |
|
|
DONE;
|
379 |
|
|
})
|
380 |
|
|
|
381 |
|
|
(define_split
|
382 |
|
|
[(set (match_operand 0 "memory_operand")
|
383 |
|
|
(match_operand 1 "spu_reg_operand"))]
|
384 |
|
|
"GET_MODE_SIZE (GET_MODE (operands[0])) < 16
|
385 |
|
|
&& GET_MODE(operands[0]) == GET_MODE(operands[1])
|
386 |
|
|
&& !reload_in_progress && !reload_completed"
|
387 |
|
|
[(set (match_dup 0)
|
388 |
|
|
(match_dup 1))]
|
389 |
|
|
{ if (spu_split_store(operands))
|
390 |
|
|
DONE;
|
391 |
|
|
})
|
392 |
|
|
;; Operand 3 is the number of bytes. 1:b 2:h 4:w 8:d
|
393 |
|
|
|
394 |
|
|
(define_expand "cpat"
|
395 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r")
|
396 |
|
|
(unspec:TI [(match_operand:SI 1 "spu_reg_operand" "r,r")
|
397 |
|
|
(match_operand:SI 2 "spu_nonmem_operand" "r,n")
|
398 |
|
|
(match_operand:SI 3 "immediate_operand" "i,i")] UNSPEC_CPAT))]
|
399 |
|
|
""
|
400 |
|
|
{
|
401 |
|
|
rtx x = gen_cpat_const (operands);
|
402 |
|
|
if (x)
|
403 |
|
|
{
|
404 |
|
|
emit_move_insn (operands[0], x);
|
405 |
|
|
DONE;
|
406 |
|
|
}
|
407 |
|
|
})
|
408 |
|
|
|
409 |
|
|
(define_insn "_cpat"
|
410 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r")
|
411 |
|
|
(unspec:TI [(match_operand:SI 1 "spu_reg_operand" "r,r")
|
412 |
|
|
(match_operand:SI 2 "spu_nonmem_operand" "r,n")
|
413 |
|
|
(match_operand:SI 3 "immediate_operand" "i,i")] UNSPEC_CPAT))]
|
414 |
|
|
""
|
415 |
|
|
"@
|
416 |
|
|
c%M3x\t%0,%1,%2
|
417 |
|
|
c%M3d\t%0,%C2(%1)"
|
418 |
|
|
[(set_attr "type" "shuf")])
|
419 |
|
|
|
420 |
|
|
(define_split
|
421 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand")
|
422 |
|
|
(unspec:TI [(match_operand:SI 1 "spu_nonmem_operand")
|
423 |
|
|
(match_operand:SI 2 "immediate_operand")
|
424 |
|
|
(match_operand:SI 3 "immediate_operand")] UNSPEC_CPAT))]
|
425 |
|
|
""
|
426 |
|
|
[(set (match_dup:TI 0)
|
427 |
|
|
(match_dup:TI 4))]
|
428 |
|
|
{
|
429 |
|
|
operands[4] = gen_cpat_const (operands);
|
430 |
|
|
if (!operands[4])
|
431 |
|
|
FAIL;
|
432 |
|
|
})
|
433 |
|
|
|
434 |
|
|
;; extend
|
435 |
|
|
|
436 |
|
|
(define_insn "extendqihi2"
|
437 |
|
|
[(set (match_operand:HI 0 "spu_reg_operand" "=r")
|
438 |
|
|
(sign_extend:HI (match_operand:QI 1 "spu_reg_operand" "r")))]
|
439 |
|
|
""
|
440 |
|
|
"xsbh\t%0,%1")
|
441 |
|
|
|
442 |
|
|
(define_insn "extendhisi2"
|
443 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
444 |
|
|
(sign_extend:SI (match_operand:HI 1 "spu_reg_operand" "r")))]
|
445 |
|
|
""
|
446 |
|
|
"xshw\t%0,%1")
|
447 |
|
|
|
448 |
|
|
(define_expand "extendsidi2"
|
449 |
|
|
[(set (match_dup:DI 2)
|
450 |
|
|
(zero_extend:DI (match_operand:SI 1 "spu_reg_operand" "")))
|
451 |
|
|
(set (match_operand:DI 0 "spu_reg_operand" "")
|
452 |
|
|
(sign_extend:DI (vec_select:SI (match_dup:V2SI 3)
|
453 |
|
|
(parallel [(const_int 1)]))))]
|
454 |
|
|
""
|
455 |
|
|
{
|
456 |
|
|
operands[2] = gen_reg_rtx (DImode);
|
457 |
|
|
operands[3] = spu_gen_subreg (V2SImode, operands[2]);
|
458 |
|
|
})
|
459 |
|
|
|
460 |
|
|
(define_insn "xswd"
|
461 |
|
|
[(set (match_operand:DI 0 "spu_reg_operand" "=r")
|
462 |
|
|
(sign_extend:DI
|
463 |
|
|
(vec_select:SI
|
464 |
|
|
(match_operand:V2SI 1 "spu_reg_operand" "r")
|
465 |
|
|
(parallel [(const_int 1) ]))))]
|
466 |
|
|
""
|
467 |
|
|
"xswd\t%0,%1");
|
468 |
|
|
|
469 |
|
|
;; By splitting this late we don't allow much opportunity for sharing of
|
470 |
|
|
;; constants. That's ok because this should really be optimized away.
|
471 |
|
|
(define_insn_and_split "extendti2"
|
472 |
|
|
[(set (match_operand:TI 0 "register_operand" "")
|
473 |
|
|
(sign_extend:TI (match_operand:QHSDI 1 "register_operand" "")))]
|
474 |
|
|
""
|
475 |
|
|
"#"
|
476 |
|
|
""
|
477 |
|
|
[(set (match_dup:TI 0)
|
478 |
|
|
(sign_extend:TI (match_dup:QHSDI 1)))]
|
479 |
|
|
{
|
480 |
|
|
spu_expand_sign_extend(operands);
|
481 |
|
|
DONE;
|
482 |
|
|
})
|
483 |
|
|
|
484 |
|
|
|
485 |
|
|
;; zero_extend
|
486 |
|
|
|
487 |
|
|
(define_insn "zero_extendqihi2"
|
488 |
|
|
[(set (match_operand:HI 0 "spu_reg_operand" "=r")
|
489 |
|
|
(zero_extend:HI (match_operand:QI 1 "spu_reg_operand" "r")))]
|
490 |
|
|
""
|
491 |
|
|
"andi\t%0,%1,0x00ff")
|
492 |
|
|
|
493 |
|
|
(define_insn "zero_extendqisi2"
|
494 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
495 |
|
|
(zero_extend:SI (match_operand:QI 1 "spu_reg_operand" "r")))]
|
496 |
|
|
""
|
497 |
|
|
"andi\t%0,%1,0x00ff")
|
498 |
|
|
|
499 |
|
|
(define_expand "zero_extendhisi2"
|
500 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
501 |
|
|
(zero_extend:SI (match_operand:HI 1 "spu_reg_operand" "r")))
|
502 |
|
|
(clobber (match_scratch:SI 2 "=&r"))]
|
503 |
|
|
""
|
504 |
|
|
{
|
505 |
|
|
rtx mask = gen_reg_rtx (SImode);
|
506 |
|
|
rtx op1 = simplify_gen_subreg (SImode, operands[1], HImode, 0);
|
507 |
|
|
emit_move_insn (mask, GEN_INT (0xffff));
|
508 |
|
|
emit_insn (gen_andsi3(operands[0], op1, mask));
|
509 |
|
|
DONE;
|
510 |
|
|
})
|
511 |
|
|
|
512 |
|
|
(define_insn "zero_extendsidi2"
|
513 |
|
|
[(set (match_operand:DI 0 "spu_reg_operand" "=r")
|
514 |
|
|
(zero_extend:DI (match_operand:SI 1 "spu_reg_operand" "r")))]
|
515 |
|
|
""
|
516 |
|
|
"rotqmbyi\t%0,%1,-4"
|
517 |
|
|
[(set_attr "type" "shuf")])
|
518 |
|
|
|
519 |
|
|
(define_insn "zero_extendqiti2"
|
520 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r")
|
521 |
|
|
(zero_extend:TI (match_operand:QI 1 "spu_reg_operand" "r")))]
|
522 |
|
|
""
|
523 |
|
|
"andi\t%0,%1,0x00ff\;rotqmbyi\t%0,%0,-12"
|
524 |
|
|
[(set_attr "type" "multi0")
|
525 |
|
|
(set_attr "length" "8")])
|
526 |
|
|
|
527 |
|
|
(define_insn "zero_extendhiti2"
|
528 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r")
|
529 |
|
|
(zero_extend:TI (match_operand:HI 1 "spu_reg_operand" "r")))]
|
530 |
|
|
""
|
531 |
|
|
"shli\t%0,%1,16\;rotqmbyi\t%0,%0,-14"
|
532 |
|
|
[(set_attr "type" "multi1")
|
533 |
|
|
(set_attr "length" "8")])
|
534 |
|
|
|
535 |
|
|
(define_insn "zero_extendsiti2"
|
536 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r")
|
537 |
|
|
(zero_extend:TI (match_operand:SI 1 "spu_reg_operand" "r")))]
|
538 |
|
|
""
|
539 |
|
|
"rotqmbyi\t%0,%1,-12"
|
540 |
|
|
[(set_attr "type" "shuf")])
|
541 |
|
|
|
542 |
|
|
(define_insn "zero_extendditi2"
|
543 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r")
|
544 |
|
|
(zero_extend:TI (match_operand:DI 1 "spu_reg_operand" "r")))]
|
545 |
|
|
""
|
546 |
|
|
"rotqmbyi\t%0,%1,-8"
|
547 |
|
|
[(set_attr "type" "shuf")])
|
548 |
|
|
|
549 |
|
|
|
550 |
|
|
;; trunc
|
551 |
|
|
|
552 |
|
|
(define_insn "truncdiqi2"
|
553 |
|
|
[(set (match_operand:QI 0 "spu_reg_operand" "=r")
|
554 |
|
|
(truncate:QI (match_operand:DI 1 "spu_reg_operand" "r")))]
|
555 |
|
|
""
|
556 |
|
|
"shlqbyi\t%0,%1,4"
|
557 |
|
|
[(set_attr "type" "shuf")])
|
558 |
|
|
|
559 |
|
|
(define_insn "truncdihi2"
|
560 |
|
|
[(set (match_operand:HI 0 "spu_reg_operand" "=r")
|
561 |
|
|
(truncate:HI (match_operand:DI 1 "spu_reg_operand" "r")))]
|
562 |
|
|
""
|
563 |
|
|
"shlqbyi\t%0,%1,4"
|
564 |
|
|
[(set_attr "type" "shuf")])
|
565 |
|
|
|
566 |
|
|
(define_insn "truncdisi2"
|
567 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
568 |
|
|
(truncate:SI (match_operand:DI 1 "spu_reg_operand" "r")))]
|
569 |
|
|
""
|
570 |
|
|
"shlqbyi\t%0,%1,4"
|
571 |
|
|
[(set_attr "type" "shuf")])
|
572 |
|
|
|
573 |
|
|
(define_insn "trunctiqi2"
|
574 |
|
|
[(set (match_operand:QI 0 "spu_reg_operand" "=r")
|
575 |
|
|
(truncate:QI (match_operand:TI 1 "spu_reg_operand" "r")))]
|
576 |
|
|
""
|
577 |
|
|
"shlqbyi\t%0,%1,12"
|
578 |
|
|
[(set_attr "type" "shuf")])
|
579 |
|
|
|
580 |
|
|
(define_insn "trunctihi2"
|
581 |
|
|
[(set (match_operand:HI 0 "spu_reg_operand" "=r")
|
582 |
|
|
(truncate:HI (match_operand:TI 1 "spu_reg_operand" "r")))]
|
583 |
|
|
""
|
584 |
|
|
"shlqbyi\t%0,%1,12"
|
585 |
|
|
[(set_attr "type" "shuf")])
|
586 |
|
|
|
587 |
|
|
(define_insn "trunctisi2"
|
588 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
589 |
|
|
(truncate:SI (match_operand:TI 1 "spu_reg_operand" "r")))]
|
590 |
|
|
""
|
591 |
|
|
"shlqbyi\t%0,%1,12"
|
592 |
|
|
[(set_attr "type" "shuf")])
|
593 |
|
|
|
594 |
|
|
(define_insn "trunctidi2"
|
595 |
|
|
[(set (match_operand:DI 0 "spu_reg_operand" "=r")
|
596 |
|
|
(truncate:DI (match_operand:TI 1 "spu_reg_operand" "r")))]
|
597 |
|
|
""
|
598 |
|
|
"shlqbyi\t%0,%1,8"
|
599 |
|
|
[(set_attr "type" "shuf")])
|
600 |
|
|
|
601 |
|
|
|
602 |
|
|
;; float conversions
|
603 |
|
|
|
604 |
|
|
(define_insn "float2"
|
605 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
606 |
|
|
(float: (match_operand:VSI 1 "spu_reg_operand" "r")))]
|
607 |
|
|
""
|
608 |
|
|
"csflt\t%0,%1,0"
|
609 |
|
|
[(set_attr "type" "fp7")])
|
610 |
|
|
|
611 |
|
|
(define_insn "fix_trunc2"
|
612 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
613 |
|
|
(fix: (match_operand:VSF 1 "spu_reg_operand" "r")))]
|
614 |
|
|
""
|
615 |
|
|
"cflts\t%0,%1,0"
|
616 |
|
|
[(set_attr "type" "fp7")])
|
617 |
|
|
|
618 |
|
|
(define_insn "floatuns2"
|
619 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
620 |
|
|
(unsigned_float: (match_operand:VSI 1 "spu_reg_operand" "r")))]
|
621 |
|
|
""
|
622 |
|
|
"cuflt\t%0,%1,0"
|
623 |
|
|
[(set_attr "type" "fp7")])
|
624 |
|
|
|
625 |
|
|
(define_insn "fixuns_trunc2"
|
626 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
627 |
|
|
(unsigned_fix: (match_operand:VSF 1 "spu_reg_operand" "r")))]
|
628 |
|
|
""
|
629 |
|
|
"cfltu\t%0,%1,0"
|
630 |
|
|
[(set_attr "type" "fp7")])
|
631 |
|
|
|
632 |
|
|
(define_insn "float2_mul"
|
633 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
634 |
|
|
(mult: (float: (match_operand:VSI 1 "spu_reg_operand" "r"))
|
635 |
|
|
(match_operand: 2 "spu_inv_exp2_operand" "w")))]
|
636 |
|
|
""
|
637 |
|
|
"csflt\t%0,%1,%w2"
|
638 |
|
|
[(set_attr "type" "fp7")])
|
639 |
|
|
|
640 |
|
|
(define_insn "float2_div"
|
641 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
642 |
|
|
(div: (float: (match_operand:VSI 1 "spu_reg_operand" "r"))
|
643 |
|
|
(match_operand: 2 "spu_exp2_operand" "v")))]
|
644 |
|
|
""
|
645 |
|
|
"csflt\t%0,%1,%v2"
|
646 |
|
|
[(set_attr "type" "fp7")])
|
647 |
|
|
|
648 |
|
|
|
649 |
|
|
(define_insn "fix_trunc2_mul"
|
650 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
651 |
|
|
(fix: (mult:VSF (match_operand:VSF 1 "spu_reg_operand" "r")
|
652 |
|
|
(match_operand:VSF 2 "spu_exp2_operand" "v"))))]
|
653 |
|
|
""
|
654 |
|
|
"cflts\t%0,%1,%v2"
|
655 |
|
|
[(set_attr "type" "fp7")])
|
656 |
|
|
|
657 |
|
|
(define_insn "floatuns2_mul"
|
658 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
659 |
|
|
(mult: (unsigned_float: (match_operand:VSI 1 "spu_reg_operand" "r"))
|
660 |
|
|
(match_operand: 2 "spu_inv_exp2_operand" "w")))]
|
661 |
|
|
""
|
662 |
|
|
"cuflt\t%0,%1,%w2"
|
663 |
|
|
[(set_attr "type" "fp7")])
|
664 |
|
|
|
665 |
|
|
(define_insn "floatuns2_div"
|
666 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
667 |
|
|
(div: (unsigned_float: (match_operand:VSI 1 "spu_reg_operand" "r"))
|
668 |
|
|
(match_operand: 2 "spu_exp2_operand" "v")))]
|
669 |
|
|
""
|
670 |
|
|
"cuflt\t%0,%1,%v2"
|
671 |
|
|
[(set_attr "type" "fp7")])
|
672 |
|
|
|
673 |
|
|
(define_insn "fixuns_trunc2_mul"
|
674 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
675 |
|
|
(unsigned_fix: (mult:VSF (match_operand:VSF 1 "spu_reg_operand" "r")
|
676 |
|
|
(match_operand:VSF 2 "spu_exp2_operand" "v"))))]
|
677 |
|
|
""
|
678 |
|
|
"cfltu\t%0,%1,%v2"
|
679 |
|
|
[(set_attr "type" "fp7")])
|
680 |
|
|
|
681 |
|
|
(define_insn "extendsfdf2"
|
682 |
|
|
[(set (match_operand:DF 0 "spu_reg_operand" "=r")
|
683 |
|
|
(unspec:DF [(match_operand:SF 1 "spu_reg_operand" "r")]
|
684 |
|
|
UNSPEC_FLOAT_EXTEND))]
|
685 |
|
|
""
|
686 |
|
|
"fesd\t%0,%1"
|
687 |
|
|
[(set_attr "type" "fpd")])
|
688 |
|
|
|
689 |
|
|
(define_insn "truncdfsf2"
|
690 |
|
|
[(set (match_operand:SF 0 "spu_reg_operand" "=r")
|
691 |
|
|
(unspec:SF [(match_operand:DF 1 "spu_reg_operand" "r")]
|
692 |
|
|
UNSPEC_FLOAT_TRUNCATE))]
|
693 |
|
|
""
|
694 |
|
|
"frds\t%0,%1"
|
695 |
|
|
[(set_attr "type" "fpd")])
|
696 |
|
|
|
697 |
|
|
(define_expand "floatdisf2"
|
698 |
|
|
[(set (match_operand:SF 0 "register_operand" "")
|
699 |
|
|
(float:SF (match_operand:DI 1 "register_operand" "")))]
|
700 |
|
|
""
|
701 |
|
|
{
|
702 |
|
|
rtx c0 = gen_reg_rtx (SImode);
|
703 |
|
|
rtx r0 = gen_reg_rtx (DImode);
|
704 |
|
|
rtx r1 = gen_reg_rtx (SFmode);
|
705 |
|
|
rtx r2 = gen_reg_rtx (SImode);
|
706 |
|
|
rtx setneg = gen_reg_rtx (SImode);
|
707 |
|
|
rtx isneg = gen_reg_rtx (SImode);
|
708 |
|
|
rtx neg = gen_reg_rtx (DImode);
|
709 |
|
|
rtx mask = gen_reg_rtx (DImode);
|
710 |
|
|
|
711 |
|
|
emit_move_insn (c0, GEN_INT (-0x80000000ll));
|
712 |
|
|
|
713 |
|
|
emit_insn (gen_negdi2 (neg, operands[1]));
|
714 |
|
|
emit_insn (gen_cgt_di_m1 (isneg, operands[1]));
|
715 |
|
|
emit_insn (gen_extend_compare (mask, isneg));
|
716 |
|
|
emit_insn (gen_selb (r0, neg, operands[1], mask));
|
717 |
|
|
emit_insn (gen_andc_si (setneg, c0, isneg));
|
718 |
|
|
|
719 |
|
|
emit_insn (gen_floatunsdisf2 (r1, r0));
|
720 |
|
|
|
721 |
|
|
emit_insn (gen_iorsi3 (r2, gen_rtx_SUBREG (SImode, r1, 0), setneg));
|
722 |
|
|
emit_move_insn (operands[0], gen_rtx_SUBREG (SFmode, r2, 0));
|
723 |
|
|
DONE;
|
724 |
|
|
})
|
725 |
|
|
|
726 |
|
|
(define_insn_and_split "floatunsdisf2"
|
727 |
|
|
[(set (match_operand:SF 0 "register_operand" "=r")
|
728 |
|
|
(unsigned_float:SF (match_operand:DI 1 "register_operand" "r")))
|
729 |
|
|
(clobber (match_scratch:SF 2 "=r"))
|
730 |
|
|
(clobber (match_scratch:SF 3 "=r"))
|
731 |
|
|
(clobber (match_scratch:SF 4 "=r"))]
|
732 |
|
|
""
|
733 |
|
|
"#"
|
734 |
|
|
"reload_completed"
|
735 |
|
|
[(set (match_dup:SF 0)
|
736 |
|
|
(unsigned_float:SF (match_dup:DI 1)))]
|
737 |
|
|
{
|
738 |
|
|
rtx op1_v4si = gen_rtx_REG (V4SImode, REGNO (operands[1]));
|
739 |
|
|
rtx op2_v4sf = gen_rtx_REG (V4SFmode, REGNO (operands[2]));
|
740 |
|
|
rtx op2_ti = gen_rtx_REG (TImode, REGNO (operands[2]));
|
741 |
|
|
rtx op3_ti = gen_rtx_REG (TImode, REGNO (operands[3]));
|
742 |
|
|
|
743 |
|
|
REAL_VALUE_TYPE scale;
|
744 |
|
|
real_2expN (&scale, 32, SFmode);
|
745 |
|
|
|
746 |
|
|
emit_insn (gen_floatunsv4siv4sf2 (op2_v4sf, op1_v4si));
|
747 |
|
|
emit_insn (gen_shlqby_ti (op3_ti, op2_ti, GEN_INT (4)));
|
748 |
|
|
|
749 |
|
|
emit_move_insn (operands[4],
|
750 |
|
|
CONST_DOUBLE_FROM_REAL_VALUE (scale, SFmode));
|
751 |
|
|
emit_insn (gen_fma_sf (operands[0],
|
752 |
|
|
operands[2], operands[4], operands[3]));
|
753 |
|
|
DONE;
|
754 |
|
|
})
|
755 |
|
|
|
756 |
|
|
;; Do (double)(operands[1]+0x80000000u)-(double)0x80000000
|
757 |
|
|
(define_expand "floatsidf2"
|
758 |
|
|
[(set (match_operand:DF 0 "register_operand" "")
|
759 |
|
|
(float:DF (match_operand:SI 1 "register_operand" "")))]
|
760 |
|
|
""
|
761 |
|
|
{
|
762 |
|
|
rtx c0 = gen_reg_rtx (SImode);
|
763 |
|
|
rtx c1 = gen_reg_rtx (DFmode);
|
764 |
|
|
rtx r0 = gen_reg_rtx (SImode);
|
765 |
|
|
rtx r1 = gen_reg_rtx (DFmode);
|
766 |
|
|
|
767 |
|
|
emit_move_insn (c0, GEN_INT (-0x80000000ll));
|
768 |
|
|
emit_move_insn (c1, spu_float_const ("2147483648", DFmode));
|
769 |
|
|
emit_insn (gen_xorsi3 (r0, operands[1], c0));
|
770 |
|
|
emit_insn (gen_floatunssidf2 (r1, r0));
|
771 |
|
|
emit_insn (gen_subdf3 (operands[0], r1, c1));
|
772 |
|
|
DONE;
|
773 |
|
|
})
|
774 |
|
|
|
775 |
|
|
(define_expand "floatunssidf2"
|
776 |
|
|
[(set (match_operand:DF 0 "register_operand" "=r")
|
777 |
|
|
(unsigned_float:DF (match_operand:SI 1 "register_operand" "r")))]
|
778 |
|
|
""
|
779 |
|
|
"{
|
780 |
|
|
rtx value, insns;
|
781 |
|
|
rtx c0 = spu_const_from_ints (V16QImode, 0x02031011, 0x12138080,
|
782 |
|
|
0x06071415, 0x16178080);
|
783 |
|
|
rtx r0 = gen_reg_rtx (V16QImode);
|
784 |
|
|
|
785 |
|
|
if (optimize_size)
|
786 |
|
|
{
|
787 |
|
|
start_sequence ();
|
788 |
|
|
value =
|
789 |
|
|
emit_library_call_value (convert_optab_libfunc (ufloat_optab,
|
790 |
|
|
DFmode, SImode),
|
791 |
|
|
NULL_RTX, LCT_NORMAL, DFmode, 1, operands[1], SImode);
|
792 |
|
|
insns = get_insns ();
|
793 |
|
|
end_sequence ();
|
794 |
|
|
emit_libcall_block (insns, operands[0], value,
|
795 |
|
|
gen_rtx_UNSIGNED_FLOAT (DFmode, operands[1]));
|
796 |
|
|
}
|
797 |
|
|
else
|
798 |
|
|
{
|
799 |
|
|
emit_move_insn (r0, c0);
|
800 |
|
|
emit_insn (gen_floatunssidf2_internal (operands[0], operands[1], r0));
|
801 |
|
|
}
|
802 |
|
|
DONE;
|
803 |
|
|
}")
|
804 |
|
|
|
805 |
|
|
(define_insn_and_split "floatunssidf2_internal"
|
806 |
|
|
[(set (match_operand:DF 0 "register_operand" "=r")
|
807 |
|
|
(unsigned_float:DF (match_operand:SI 1 "register_operand" "r")))
|
808 |
|
|
(use (match_operand:V16QI 2 "register_operand" "r"))
|
809 |
|
|
(clobber (match_scratch:V4SI 3 "=&r"))
|
810 |
|
|
(clobber (match_scratch:V4SI 4 "=&r"))
|
811 |
|
|
(clobber (match_scratch:V4SI 5 "=&r"))
|
812 |
|
|
(clobber (match_scratch:V4SI 6 "=&r"))]
|
813 |
|
|
""
|
814 |
|
|
"clz\t%3,%1\;il\t%6,1023+31\;shl\t%4,%1,%3\;ceqi\t%5,%3,32\;sf\t%6,%3,%6\;a\t%4,%4,%4\;andc\t%6,%6,%5\;shufb\t%6,%6,%4,%2\;shlqbii\t%0,%6,4"
|
815 |
|
|
"reload_completed"
|
816 |
|
|
[(set (match_dup:DF 0)
|
817 |
|
|
(unsigned_float:DF (match_dup:SI 1)))]
|
818 |
|
|
"{
|
819 |
|
|
rtx *ops = operands;
|
820 |
|
|
rtx op1_v4si = gen_rtx_REG(V4SImode, REGNO(ops[1]));
|
821 |
|
|
rtx op0_ti = gen_rtx_REG (TImode, REGNO (ops[0]));
|
822 |
|
|
rtx op2_ti = gen_rtx_REG (TImode, REGNO (ops[2]));
|
823 |
|
|
rtx op6_ti = gen_rtx_REG (TImode, REGNO (ops[6]));
|
824 |
|
|
emit_insn (gen_clzv4si2 (ops[3],op1_v4si));
|
825 |
|
|
emit_move_insn (ops[6], spu_const (V4SImode, 1023+31));
|
826 |
|
|
emit_insn (gen_vashlv4si3 (ops[4],op1_v4si,ops[3]));
|
827 |
|
|
emit_insn (gen_ceq_v4si (ops[5],ops[3],spu_const (V4SImode, 32)));
|
828 |
|
|
emit_insn (gen_subv4si3 (ops[6],ops[6],ops[3]));
|
829 |
|
|
emit_insn (gen_addv4si3 (ops[4],ops[4],ops[4]));
|
830 |
|
|
emit_insn (gen_andc_v4si (ops[6],ops[6],ops[5]));
|
831 |
|
|
emit_insn (gen_shufb (ops[6],ops[6],ops[4],op2_ti));
|
832 |
|
|
emit_insn (gen_shlqbi_ti (op0_ti,op6_ti,GEN_INT(4)));
|
833 |
|
|
DONE;
|
834 |
|
|
}"
|
835 |
|
|
[(set_attr "length" "32")])
|
836 |
|
|
|
837 |
|
|
(define_expand "floatdidf2"
|
838 |
|
|
[(set (match_operand:DF 0 "register_operand" "")
|
839 |
|
|
(float:DF (match_operand:DI 1 "register_operand" "")))]
|
840 |
|
|
""
|
841 |
|
|
{
|
842 |
|
|
rtx c0 = gen_reg_rtx (DImode);
|
843 |
|
|
rtx r0 = gen_reg_rtx (DImode);
|
844 |
|
|
rtx r1 = gen_reg_rtx (DFmode);
|
845 |
|
|
rtx r2 = gen_reg_rtx (DImode);
|
846 |
|
|
rtx setneg = gen_reg_rtx (DImode);
|
847 |
|
|
rtx isneg = gen_reg_rtx (SImode);
|
848 |
|
|
rtx neg = gen_reg_rtx (DImode);
|
849 |
|
|
rtx mask = gen_reg_rtx (DImode);
|
850 |
|
|
|
851 |
|
|
emit_move_insn (c0, GEN_INT (0x8000000000000000ull));
|
852 |
|
|
|
853 |
|
|
emit_insn (gen_negdi2 (neg, operands[1]));
|
854 |
|
|
emit_insn (gen_cgt_di_m1 (isneg, operands[1]));
|
855 |
|
|
emit_insn (gen_extend_compare (mask, isneg));
|
856 |
|
|
emit_insn (gen_selb (r0, neg, operands[1], mask));
|
857 |
|
|
emit_insn (gen_andc_di (setneg, c0, mask));
|
858 |
|
|
|
859 |
|
|
emit_insn (gen_floatunsdidf2 (r1, r0));
|
860 |
|
|
|
861 |
|
|
emit_insn (gen_iordi3 (r2, gen_rtx_SUBREG (DImode, r1, 0), setneg));
|
862 |
|
|
emit_move_insn (operands[0], gen_rtx_SUBREG (DFmode, r2, 0));
|
863 |
|
|
DONE;
|
864 |
|
|
})
|
865 |
|
|
|
866 |
|
|
(define_expand "floatunsdidf2"
|
867 |
|
|
[(set (match_operand:DF 0 "register_operand" "=r")
|
868 |
|
|
(unsigned_float:DF (match_operand:DI 1 "register_operand" "r")))]
|
869 |
|
|
""
|
870 |
|
|
"{
|
871 |
|
|
rtx value, insns;
|
872 |
|
|
rtx c0 = spu_const_from_ints (V16QImode, 0x02031011, 0x12138080,
|
873 |
|
|
0x06071415, 0x16178080);
|
874 |
|
|
rtx c1 = spu_const_from_ints (V4SImode, 1023+63, 1023+31, 0, 0);
|
875 |
|
|
rtx r0 = gen_reg_rtx (V16QImode);
|
876 |
|
|
rtx r1 = gen_reg_rtx (V4SImode);
|
877 |
|
|
|
878 |
|
|
if (optimize_size)
|
879 |
|
|
{
|
880 |
|
|
start_sequence ();
|
881 |
|
|
value =
|
882 |
|
|
emit_library_call_value (convert_optab_libfunc (ufloat_optab,
|
883 |
|
|
DFmode, DImode),
|
884 |
|
|
NULL_RTX, LCT_NORMAL, DFmode, 1, operands[1], DImode);
|
885 |
|
|
insns = get_insns ();
|
886 |
|
|
end_sequence ();
|
887 |
|
|
emit_libcall_block (insns, operands[0], value,
|
888 |
|
|
gen_rtx_UNSIGNED_FLOAT (DFmode, operands[1]));
|
889 |
|
|
}
|
890 |
|
|
else
|
891 |
|
|
{
|
892 |
|
|
emit_move_insn (r1, c1);
|
893 |
|
|
emit_move_insn (r0, c0);
|
894 |
|
|
emit_insn (gen_floatunsdidf2_internal (operands[0], operands[1], r0, r1));
|
895 |
|
|
}
|
896 |
|
|
DONE;
|
897 |
|
|
}")
|
898 |
|
|
|
899 |
|
|
(define_insn_and_split "floatunsdidf2_internal"
|
900 |
|
|
[(set (match_operand:DF 0 "register_operand" "=r")
|
901 |
|
|
(unsigned_float:DF (match_operand:DI 1 "register_operand" "r")))
|
902 |
|
|
(use (match_operand:V16QI 2 "register_operand" "r"))
|
903 |
|
|
(use (match_operand:V4SI 3 "register_operand" "r"))
|
904 |
|
|
(clobber (match_scratch:V4SI 4 "=&r"))
|
905 |
|
|
(clobber (match_scratch:V4SI 5 "=&r"))
|
906 |
|
|
(clobber (match_scratch:V4SI 6 "=&r"))]
|
907 |
|
|
""
|
908 |
|
|
"clz\t%4,%1\;shl\t%5,%1,%4\;ceqi\t%6,%4,32\;sf\t%4,%4,%3\;a\t%5,%5,%5\;andc\t%4,%4,%6\;shufb\t%4,%4,%5,%2\;shlqbii\t%4,%4,4\;shlqbyi\t%5,%4,8\;dfa\t%0,%4,%5"
|
909 |
|
|
"reload_completed"
|
910 |
|
|
[(set (match_operand:DF 0 "register_operand" "=r")
|
911 |
|
|
(unsigned_float:DF (match_operand:DI 1 "register_operand" "r")))]
|
912 |
|
|
"{
|
913 |
|
|
rtx *ops = operands;
|
914 |
|
|
rtx op1_v4si = gen_rtx_REG (V4SImode, REGNO(ops[1]));
|
915 |
|
|
rtx op2_ti = gen_rtx_REG (TImode, REGNO(ops[2]));
|
916 |
|
|
rtx op4_ti = gen_rtx_REG (TImode, REGNO(ops[4]));
|
917 |
|
|
rtx op5_ti = gen_rtx_REG (TImode, REGNO(ops[5]));
|
918 |
|
|
rtx op4_df = gen_rtx_REG (DFmode, REGNO(ops[4]));
|
919 |
|
|
rtx op5_df = gen_rtx_REG (DFmode, REGNO(ops[5]));
|
920 |
|
|
emit_insn (gen_clzv4si2 (ops[4],op1_v4si));
|
921 |
|
|
emit_insn (gen_vashlv4si3 (ops[5],op1_v4si,ops[4]));
|
922 |
|
|
emit_insn (gen_ceq_v4si (ops[6],ops[4],spu_const (V4SImode, 32)));
|
923 |
|
|
emit_insn (gen_subv4si3 (ops[4],ops[3],ops[4]));
|
924 |
|
|
emit_insn (gen_addv4si3 (ops[5],ops[5],ops[5]));
|
925 |
|
|
emit_insn (gen_andc_v4si (ops[4],ops[4],ops[6]));
|
926 |
|
|
emit_insn (gen_shufb (ops[4],ops[4],ops[5],op2_ti));
|
927 |
|
|
emit_insn (gen_shlqbi_ti (op4_ti,op4_ti,GEN_INT(4)));
|
928 |
|
|
emit_insn (gen_shlqby_ti (op5_ti,op4_ti,GEN_INT(8)));
|
929 |
|
|
emit_insn (gen_adddf3 (ops[0],op4_df,op5_df));
|
930 |
|
|
DONE;
|
931 |
|
|
}"
|
932 |
|
|
[(set_attr "length" "40")])
|
933 |
|
|
|
934 |
|
|
|
935 |
|
|
;; add
|
936 |
|
|
|
937 |
|
|
(define_expand "addv16qi3"
|
938 |
|
|
[(set (match_operand:V16QI 0 "spu_reg_operand" "=r")
|
939 |
|
|
(plus:V16QI (match_operand:V16QI 1 "spu_reg_operand" "r")
|
940 |
|
|
(match_operand:V16QI 2 "spu_reg_operand" "r")))]
|
941 |
|
|
""
|
942 |
|
|
"{
|
943 |
|
|
rtx res_short = simplify_gen_subreg (V8HImode, operands[0], V16QImode, 0);
|
944 |
|
|
rtx lhs_short = simplify_gen_subreg (V8HImode, operands[1], V16QImode, 0);
|
945 |
|
|
rtx rhs_short = simplify_gen_subreg (V8HImode, operands[2], V16QImode, 0);
|
946 |
|
|
rtx rhs_and = gen_reg_rtx (V8HImode);
|
947 |
|
|
rtx hi_char = gen_reg_rtx (V8HImode);
|
948 |
|
|
rtx lo_char = gen_reg_rtx (V8HImode);
|
949 |
|
|
rtx mask = gen_reg_rtx (V8HImode);
|
950 |
|
|
|
951 |
|
|
emit_move_insn (mask, spu_const (V8HImode, 0x00ff));
|
952 |
|
|
emit_insn (gen_andv8hi3 (rhs_and, rhs_short, spu_const (V8HImode, 0xff00)));
|
953 |
|
|
emit_insn (gen_addv8hi3 (hi_char, lhs_short, rhs_and));
|
954 |
|
|
emit_insn (gen_addv8hi3 (lo_char, lhs_short, rhs_short));
|
955 |
|
|
emit_insn (gen_selb (res_short, hi_char, lo_char, mask));
|
956 |
|
|
DONE;
|
957 |
|
|
}")
|
958 |
|
|
|
959 |
|
|
(define_insn "add3"
|
960 |
|
|
[(set (match_operand:VHSI 0 "spu_reg_operand" "=r,r")
|
961 |
|
|
(plus:VHSI (match_operand:VHSI 1 "spu_reg_operand" "r,r")
|
962 |
|
|
(match_operand:VHSI 2 "spu_arith_operand" "r,B")))]
|
963 |
|
|
""
|
964 |
|
|
"@
|
965 |
|
|
a\t%0,%1,%2
|
966 |
|
|
ai\t%0,%1,%2")
|
967 |
|
|
|
968 |
|
|
(define_expand "add3"
|
969 |
|
|
[(set (match_dup:VDI 3)
|
970 |
|
|
(unspec:VDI [(match_operand:VDI 1 "spu_reg_operand" "")
|
971 |
|
|
(match_operand:VDI 2 "spu_reg_operand" "")] UNSPEC_CG))
|
972 |
|
|
(set (match_dup:VDI 5)
|
973 |
|
|
(unspec:VDI [(match_dup 3)
|
974 |
|
|
(match_dup 3)
|
975 |
|
|
(match_dup:TI 4)] UNSPEC_SHUFB))
|
976 |
|
|
(set (match_operand:VDI 0 "spu_reg_operand" "")
|
977 |
|
|
(unspec:VDI [(match_dup 1)
|
978 |
|
|
(match_dup 2)
|
979 |
|
|
(match_dup 5)] UNSPEC_ADDX))]
|
980 |
|
|
""
|
981 |
|
|
{
|
982 |
|
|
unsigned char pat[16] = {
|
983 |
|
|
0x04, 0x05, 0x06, 0x07,
|
984 |
|
|
0x80, 0x80, 0x80, 0x80,
|
985 |
|
|
0x0c, 0x0d, 0x0e, 0x0f,
|
986 |
|
|
0x80, 0x80, 0x80, 0x80
|
987 |
|
|
};
|
988 |
|
|
operands[3] = gen_reg_rtx (mode);
|
989 |
|
|
operands[4] = gen_reg_rtx (TImode);
|
990 |
|
|
operands[5] = gen_reg_rtx (mode);
|
991 |
|
|
emit_move_insn (operands[4], array_to_constant (TImode, pat));
|
992 |
|
|
})
|
993 |
|
|
|
994 |
|
|
(define_insn "cg_"
|
995 |
|
|
[(set (match_operand:CBOP 0 "spu_reg_operand" "=r")
|
996 |
|
|
(unspec:CBOP [(match_operand 1 "spu_reg_operand" "r")
|
997 |
|
|
(match_operand 2 "spu_reg_operand" "r")] UNSPEC_CG))]
|
998 |
|
|
"operands"
|
999 |
|
|
"cg\t%0,%1,%2")
|
1000 |
|
|
|
1001 |
|
|
(define_insn "cgx_"
|
1002 |
|
|
[(set (match_operand:CBOP 0 "spu_reg_operand" "=r")
|
1003 |
|
|
(unspec:CBOP [(match_operand 1 "spu_reg_operand" "r")
|
1004 |
|
|
(match_operand 2 "spu_reg_operand" "r")
|
1005 |
|
|
(match_operand 3 "spu_reg_operand" "0")] UNSPEC_CGX))]
|
1006 |
|
|
"operands"
|
1007 |
|
|
"cgx\t%0,%1,%2")
|
1008 |
|
|
|
1009 |
|
|
(define_insn "addx_"
|
1010 |
|
|
[(set (match_operand:CBOP 0 "spu_reg_operand" "=r")
|
1011 |
|
|
(unspec:CBOP [(match_operand 1 "spu_reg_operand" "r")
|
1012 |
|
|
(match_operand 2 "spu_reg_operand" "r")
|
1013 |
|
|
(match_operand 3 "spu_reg_operand" "0")] UNSPEC_ADDX))]
|
1014 |
|
|
"operands"
|
1015 |
|
|
"addx\t%0,%1,%2")
|
1016 |
|
|
|
1017 |
|
|
|
1018 |
|
|
;; This is not the most efficient implementation of addti3.
|
1019 |
|
|
;; We include this here because 1) the compiler needs it to be
|
1020 |
|
|
;; defined as the word size is 128-bit and 2) sometimes gcc
|
1021 |
|
|
;; substitutes an add for a constant left-shift. 2) is unlikely
|
1022 |
|
|
;; because we also give addti3 a high cost. In case gcc does
|
1023 |
|
|
;; generate TImode add, here is the code to do it.
|
1024 |
|
|
;; operand 2 is a nonmemory because the compiler requires it.
|
1025 |
|
|
(define_insn "addti3"
|
1026 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=&r")
|
1027 |
|
|
(plus:TI (match_operand:TI 1 "spu_reg_operand" "r")
|
1028 |
|
|
(match_operand:TI 2 "spu_nonmem_operand" "r")))
|
1029 |
|
|
(clobber (match_scratch:TI 3 "=&r"))]
|
1030 |
|
|
""
|
1031 |
|
|
"cg\t%3,%1,%2\n\\
|
1032 |
|
|
shlqbyi\t%3,%3,4\n\\
|
1033 |
|
|
cgx\t%3,%1,%2\n\\
|
1034 |
|
|
shlqbyi\t%3,%3,4\n\\
|
1035 |
|
|
cgx\t%3,%1,%2\n\\
|
1036 |
|
|
shlqbyi\t%0,%3,4\n\\
|
1037 |
|
|
addx\t%0,%1,%2"
|
1038 |
|
|
[(set_attr "type" "multi0")
|
1039 |
|
|
(set_attr "length" "28")])
|
1040 |
|
|
|
1041 |
|
|
(define_insn "add3"
|
1042 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "=r")
|
1043 |
|
|
(plus:VSF (match_operand:VSF 1 "spu_reg_operand" "r")
|
1044 |
|
|
(match_operand:VSF 2 "spu_reg_operand" "r")))]
|
1045 |
|
|
""
|
1046 |
|
|
"fa\t%0,%1,%2"
|
1047 |
|
|
[(set_attr "type" "fp6")])
|
1048 |
|
|
|
1049 |
|
|
(define_insn "add3"
|
1050 |
|
|
[(set (match_operand:VDF 0 "spu_reg_operand" "=r")
|
1051 |
|
|
(plus:VDF (match_operand:VDF 1 "spu_reg_operand" "r")
|
1052 |
|
|
(match_operand:VDF 2 "spu_reg_operand" "r")))]
|
1053 |
|
|
""
|
1054 |
|
|
"dfa\t%0,%1,%2"
|
1055 |
|
|
[(set_attr "type" "fpd")])
|
1056 |
|
|
|
1057 |
|
|
|
1058 |
|
|
;; sub
|
1059 |
|
|
|
1060 |
|
|
(define_expand "subv16qi3"
|
1061 |
|
|
[(set (match_operand:V16QI 0 "spu_reg_operand" "=r")
|
1062 |
|
|
(minus:V16QI (match_operand:V16QI 1 "spu_reg_operand" "r")
|
1063 |
|
|
(match_operand:V16QI 2 "spu_reg_operand" "r")))]
|
1064 |
|
|
""
|
1065 |
|
|
"{
|
1066 |
|
|
rtx res_short = simplify_gen_subreg (V8HImode, operands[0], V16QImode, 0);
|
1067 |
|
|
rtx lhs_short = simplify_gen_subreg (V8HImode, operands[1], V16QImode, 0);
|
1068 |
|
|
rtx rhs_short = simplify_gen_subreg (V8HImode, operands[2], V16QImode, 0);
|
1069 |
|
|
rtx rhs_and = gen_reg_rtx (V8HImode);
|
1070 |
|
|
rtx hi_char = gen_reg_rtx (V8HImode);
|
1071 |
|
|
rtx lo_char = gen_reg_rtx (V8HImode);
|
1072 |
|
|
rtx mask = gen_reg_rtx (V8HImode);
|
1073 |
|
|
|
1074 |
|
|
emit_move_insn (mask, spu_const (V8HImode, 0x00ff));
|
1075 |
|
|
emit_insn (gen_andv8hi3 (rhs_and, rhs_short, spu_const (V8HImode, 0xff00)));
|
1076 |
|
|
emit_insn (gen_subv8hi3 (hi_char, lhs_short, rhs_and));
|
1077 |
|
|
emit_insn (gen_subv8hi3 (lo_char, lhs_short, rhs_short));
|
1078 |
|
|
emit_insn (gen_selb (res_short, hi_char, lo_char, mask));
|
1079 |
|
|
DONE;
|
1080 |
|
|
}")
|
1081 |
|
|
|
1082 |
|
|
(define_insn "sub3"
|
1083 |
|
|
[(set (match_operand:VHSI 0 "spu_reg_operand" "=r,r")
|
1084 |
|
|
(minus:VHSI (match_operand:VHSI 1 "spu_arith_operand" "r,B")
|
1085 |
|
|
(match_operand:VHSI 2 "spu_reg_operand" "r,r")))]
|
1086 |
|
|
""
|
1087 |
|
|
"@
|
1088 |
|
|
sf\t%0,%2,%1
|
1089 |
|
|
sfi\t%0,%2,%1")
|
1090 |
|
|
|
1091 |
|
|
(define_expand "sub3"
|
1092 |
|
|
[(set (match_dup:VDI 3)
|
1093 |
|
|
(unspec:VDI [(match_operand:VDI 1 "spu_reg_operand" "")
|
1094 |
|
|
(match_operand:VDI 2 "spu_reg_operand" "")] UNSPEC_BG))
|
1095 |
|
|
(set (match_dup:VDI 5)
|
1096 |
|
|
(unspec:VDI [(match_dup 3)
|
1097 |
|
|
(match_dup 3)
|
1098 |
|
|
(match_dup:TI 4)] UNSPEC_SHUFB))
|
1099 |
|
|
(set (match_operand:VDI 0 "spu_reg_operand" "")
|
1100 |
|
|
(unspec:VDI [(match_dup 1)
|
1101 |
|
|
(match_dup 2)
|
1102 |
|
|
(match_dup 5)] UNSPEC_SFX))]
|
1103 |
|
|
""
|
1104 |
|
|
{
|
1105 |
|
|
unsigned char pat[16] = {
|
1106 |
|
|
0x04, 0x05, 0x06, 0x07,
|
1107 |
|
|
0xc0, 0xc0, 0xc0, 0xc0,
|
1108 |
|
|
0x0c, 0x0d, 0x0e, 0x0f,
|
1109 |
|
|
0xc0, 0xc0, 0xc0, 0xc0
|
1110 |
|
|
};
|
1111 |
|
|
operands[3] = gen_reg_rtx (mode);
|
1112 |
|
|
operands[4] = gen_reg_rtx (TImode);
|
1113 |
|
|
operands[5] = gen_reg_rtx (mode);
|
1114 |
|
|
emit_move_insn (operands[4], array_to_constant (TImode, pat));
|
1115 |
|
|
})
|
1116 |
|
|
|
1117 |
|
|
(define_insn "bg_"
|
1118 |
|
|
[(set (match_operand:CBOP 0 "spu_reg_operand" "=r")
|
1119 |
|
|
(unspec:CBOP [(match_operand 1 "spu_reg_operand" "r")
|
1120 |
|
|
(match_operand 2 "spu_reg_operand" "r")] UNSPEC_BG))]
|
1121 |
|
|
"operands"
|
1122 |
|
|
"bg\t%0,%2,%1")
|
1123 |
|
|
|
1124 |
|
|
(define_insn "bgx_"
|
1125 |
|
|
[(set (match_operand:CBOP 0 "spu_reg_operand" "=r")
|
1126 |
|
|
(unspec:CBOP [(match_operand 1 "spu_reg_operand" "r")
|
1127 |
|
|
(match_operand 2 "spu_reg_operand" "r")
|
1128 |
|
|
(match_operand 3 "spu_reg_operand" "0")] UNSPEC_BGX))]
|
1129 |
|
|
"operands"
|
1130 |
|
|
"bgx\t%0,%2,%1")
|
1131 |
|
|
|
1132 |
|
|
(define_insn "sfx_"
|
1133 |
|
|
[(set (match_operand:CBOP 0 "spu_reg_operand" "=r")
|
1134 |
|
|
(unspec:CBOP [(match_operand 1 "spu_reg_operand" "r")
|
1135 |
|
|
(match_operand 2 "spu_reg_operand" "r")
|
1136 |
|
|
(match_operand 3 "spu_reg_operand" "0")] UNSPEC_SFX))]
|
1137 |
|
|
"operands"
|
1138 |
|
|
"sfx\t%0,%2,%1")
|
1139 |
|
|
|
1140 |
|
|
(define_insn "subti3"
|
1141 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r")
|
1142 |
|
|
(minus:TI (match_operand:TI 1 "spu_reg_operand" "r")
|
1143 |
|
|
(match_operand:TI 2 "spu_reg_operand" "r")))
|
1144 |
|
|
(clobber (match_scratch:TI 3 "=&r"))
|
1145 |
|
|
(clobber (match_scratch:TI 4 "=&r"))
|
1146 |
|
|
(clobber (match_scratch:TI 5 "=&r"))
|
1147 |
|
|
(clobber (match_scratch:TI 6 "=&r"))]
|
1148 |
|
|
""
|
1149 |
|
|
"il\t%6,1\n\\
|
1150 |
|
|
bg\t%3,%2,%1\n\\
|
1151 |
|
|
xor\t%3,%3,%6\n\\
|
1152 |
|
|
sf\t%4,%2,%1\n\\
|
1153 |
|
|
shlqbyi\t%5,%3,4\n\\
|
1154 |
|
|
bg\t%3,%5,%4\n\\
|
1155 |
|
|
xor\t%3,%3,%6\n\\
|
1156 |
|
|
sf\t%4,%5,%4\n\\
|
1157 |
|
|
shlqbyi\t%5,%3,4\n\\
|
1158 |
|
|
bg\t%3,%5,%4\n\\
|
1159 |
|
|
xor\t%3,%3,%6\n\\
|
1160 |
|
|
sf\t%4,%5,%4\n\\
|
1161 |
|
|
shlqbyi\t%5,%3,4\n\\
|
1162 |
|
|
sf\t%0,%5,%4"
|
1163 |
|
|
[(set_attr "type" "multi0")
|
1164 |
|
|
(set_attr "length" "56")])
|
1165 |
|
|
|
1166 |
|
|
(define_insn "sub3"
|
1167 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "=r")
|
1168 |
|
|
(minus:VSF (match_operand:VSF 1 "spu_reg_operand" "r")
|
1169 |
|
|
(match_operand:VSF 2 "spu_reg_operand" "r")))]
|
1170 |
|
|
""
|
1171 |
|
|
"fs\t%0,%1,%2"
|
1172 |
|
|
[(set_attr "type" "fp6")])
|
1173 |
|
|
|
1174 |
|
|
(define_insn "sub3"
|
1175 |
|
|
[(set (match_operand:VDF 0 "spu_reg_operand" "=r")
|
1176 |
|
|
(minus:VDF (match_operand:VDF 1 "spu_reg_operand" "r")
|
1177 |
|
|
(match_operand:VDF 2 "spu_reg_operand" "r")))]
|
1178 |
|
|
""
|
1179 |
|
|
"dfs\t%0,%1,%2"
|
1180 |
|
|
[(set_attr "type" "fpd")])
|
1181 |
|
|
|
1182 |
|
|
|
1183 |
|
|
;; neg
|
1184 |
|
|
|
1185 |
|
|
(define_expand "negv16qi2"
|
1186 |
|
|
[(set (match_operand:V16QI 0 "spu_reg_operand" "=r")
|
1187 |
|
|
(neg:V16QI (match_operand:V16QI 1 "spu_reg_operand" "r")))]
|
1188 |
|
|
""
|
1189 |
|
|
"{
|
1190 |
|
|
rtx zero = gen_reg_rtx (V16QImode);
|
1191 |
|
|
emit_move_insn (zero, CONST0_RTX (V16QImode));
|
1192 |
|
|
emit_insn (gen_subv16qi3 (operands[0], zero, operands[1]));
|
1193 |
|
|
DONE;
|
1194 |
|
|
}")
|
1195 |
|
|
|
1196 |
|
|
(define_insn "neg2"
|
1197 |
|
|
[(set (match_operand:VHSI 0 "spu_reg_operand" "=r")
|
1198 |
|
|
(neg:VHSI (match_operand:VHSI 1 "spu_reg_operand" "r")))]
|
1199 |
|
|
""
|
1200 |
|
|
"sfi\t%0,%1,0")
|
1201 |
|
|
|
1202 |
|
|
(define_expand "negdi2"
|
1203 |
|
|
[(set (match_operand:DI 0 "spu_reg_operand" "")
|
1204 |
|
|
(neg:DI (match_operand:DI 1 "spu_reg_operand" "")))]
|
1205 |
|
|
""
|
1206 |
|
|
{
|
1207 |
|
|
rtx zero = gen_reg_rtx(DImode);
|
1208 |
|
|
emit_move_insn(zero, GEN_INT(0));
|
1209 |
|
|
emit_insn (gen_subdi3(operands[0], zero, operands[1]));
|
1210 |
|
|
DONE;
|
1211 |
|
|
})
|
1212 |
|
|
|
1213 |
|
|
(define_expand "negti2"
|
1214 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "")
|
1215 |
|
|
(neg:TI (match_operand:TI 1 "spu_reg_operand" "")))]
|
1216 |
|
|
""
|
1217 |
|
|
{
|
1218 |
|
|
rtx zero = gen_reg_rtx(TImode);
|
1219 |
|
|
emit_move_insn(zero, GEN_INT(0));
|
1220 |
|
|
emit_insn (gen_subti3(operands[0], zero, operands[1]));
|
1221 |
|
|
DONE;
|
1222 |
|
|
})
|
1223 |
|
|
|
1224 |
|
|
(define_expand "neg2"
|
1225 |
|
|
[(parallel
|
1226 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "")
|
1227 |
|
|
(neg:VSF (match_operand:VSF 1 "spu_reg_operand" "")))
|
1228 |
|
|
(use (match_dup 2))])]
|
1229 |
|
|
""
|
1230 |
|
|
"operands[2] = gen_reg_rtx (mode);
|
1231 |
|
|
emit_move_insn (operands[2], spu_const (mode, -0x80000000ull));")
|
1232 |
|
|
|
1233 |
|
|
(define_expand "neg2"
|
1234 |
|
|
[(parallel
|
1235 |
|
|
[(set (match_operand:VDF 0 "spu_reg_operand" "")
|
1236 |
|
|
(neg:VDF (match_operand:VDF 1 "spu_reg_operand" "")))
|
1237 |
|
|
(use (match_dup 2))])]
|
1238 |
|
|
""
|
1239 |
|
|
"operands[2] = gen_reg_rtx (mode);
|
1240 |
|
|
emit_move_insn (operands[2], spu_const (mode, -0x8000000000000000ull));")
|
1241 |
|
|
|
1242 |
|
|
(define_insn_and_split "_neg2"
|
1243 |
|
|
[(set (match_operand:VSDF 0 "spu_reg_operand" "=r")
|
1244 |
|
|
(neg:VSDF (match_operand:VSDF 1 "spu_reg_operand" "r")))
|
1245 |
|
|
(use (match_operand: 2 "spu_reg_operand" "r"))]
|
1246 |
|
|
""
|
1247 |
|
|
"#"
|
1248 |
|
|
""
|
1249 |
|
|
[(set (match_dup: 3)
|
1250 |
|
|
(xor: (match_dup: 4)
|
1251 |
|
|
(match_dup: 2)))]
|
1252 |
|
|
{
|
1253 |
|
|
operands[3] = spu_gen_subreg (mode, operands[0]);
|
1254 |
|
|
operands[4] = spu_gen_subreg (mode, operands[1]);
|
1255 |
|
|
})
|
1256 |
|
|
|
1257 |
|
|
|
1258 |
|
|
;; abs
|
1259 |
|
|
|
1260 |
|
|
(define_expand "abs2"
|
1261 |
|
|
[(parallel
|
1262 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "")
|
1263 |
|
|
(abs:VSF (match_operand:VSF 1 "spu_reg_operand" "")))
|
1264 |
|
|
(use (match_dup 2))])]
|
1265 |
|
|
""
|
1266 |
|
|
"operands[2] = gen_reg_rtx (mode);
|
1267 |
|
|
emit_move_insn (operands[2], spu_const (mode, 0x7fffffffull));")
|
1268 |
|
|
|
1269 |
|
|
(define_expand "abs2"
|
1270 |
|
|
[(parallel
|
1271 |
|
|
[(set (match_operand:VDF 0 "spu_reg_operand" "")
|
1272 |
|
|
(abs:VDF (match_operand:VDF 1 "spu_reg_operand" "")))
|
1273 |
|
|
(use (match_dup 2))])]
|
1274 |
|
|
""
|
1275 |
|
|
"operands[2] = gen_reg_rtx (mode);
|
1276 |
|
|
emit_move_insn (operands[2], spu_const (mode, 0x7fffffffffffffffull));")
|
1277 |
|
|
|
1278 |
|
|
(define_insn_and_split "_abs2"
|
1279 |
|
|
[(set (match_operand:VSDF 0 "spu_reg_operand" "=r")
|
1280 |
|
|
(abs:VSDF (match_operand:VSDF 1 "spu_reg_operand" "r")))
|
1281 |
|
|
(use (match_operand: 2 "spu_reg_operand" "r"))]
|
1282 |
|
|
""
|
1283 |
|
|
"#"
|
1284 |
|
|
""
|
1285 |
|
|
[(set (match_dup: 3)
|
1286 |
|
|
(and: (match_dup: 4)
|
1287 |
|
|
(match_dup: 2)))]
|
1288 |
|
|
{
|
1289 |
|
|
operands[3] = spu_gen_subreg (mode, operands[0]);
|
1290 |
|
|
operands[4] = spu_gen_subreg (mode, operands[1]);
|
1291 |
|
|
})
|
1292 |
|
|
|
1293 |
|
|
|
1294 |
|
|
;; mul
|
1295 |
|
|
|
1296 |
|
|
(define_insn "mulhi3"
|
1297 |
|
|
[(set (match_operand:HI 0 "spu_reg_operand" "=r,r")
|
1298 |
|
|
(mult:HI (match_operand:HI 1 "spu_reg_operand" "r,r")
|
1299 |
|
|
(match_operand:HI 2 "spu_arith_operand" "r,B")))]
|
1300 |
|
|
""
|
1301 |
|
|
"@
|
1302 |
|
|
mpy\t%0,%1,%2
|
1303 |
|
|
mpyi\t%0,%1,%2"
|
1304 |
|
|
[(set_attr "type" "fp7")])
|
1305 |
|
|
|
1306 |
|
|
(define_expand "mulv8hi3"
|
1307 |
|
|
[(set (match_operand:V8HI 0 "spu_reg_operand" "")
|
1308 |
|
|
(mult:V8HI (match_operand:V8HI 1 "spu_reg_operand" "")
|
1309 |
|
|
(match_operand:V8HI 2 "spu_reg_operand" "")))]
|
1310 |
|
|
""
|
1311 |
|
|
"{
|
1312 |
|
|
rtx result = simplify_gen_subreg (V4SImode, operands[0], V8HImode, 0);
|
1313 |
|
|
rtx low = gen_reg_rtx (V4SImode);
|
1314 |
|
|
rtx high = gen_reg_rtx (V4SImode);
|
1315 |
|
|
rtx shift = gen_reg_rtx (V4SImode);
|
1316 |
|
|
rtx mask = gen_reg_rtx (V4SImode);
|
1317 |
|
|
|
1318 |
|
|
emit_move_insn (mask, spu_const (V4SImode, 0x0000ffff));
|
1319 |
|
|
emit_insn (gen_spu_mpyhh (high, operands[1], operands[2]));
|
1320 |
|
|
emit_insn (gen_spu_mpy (low, operands[1], operands[2]));
|
1321 |
|
|
emit_insn (gen_vashlv4si3 (shift, high, spu_const(V4SImode, 16)));
|
1322 |
|
|
emit_insn (gen_selb (result, shift, low, mask));
|
1323 |
|
|
DONE;
|
1324 |
|
|
}")
|
1325 |
|
|
|
1326 |
|
|
(define_expand "mul3"
|
1327 |
|
|
[(parallel
|
1328 |
|
|
[(set (match_operand:VSI 0 "spu_reg_operand" "")
|
1329 |
|
|
(mult:VSI (match_operand:VSI 1 "spu_reg_operand" "")
|
1330 |
|
|
(match_operand:VSI 2 "spu_reg_operand" "")))
|
1331 |
|
|
(clobber (match_dup:VSI 3))
|
1332 |
|
|
(clobber (match_dup:VSI 4))
|
1333 |
|
|
(clobber (match_dup:VSI 5))
|
1334 |
|
|
(clobber (match_dup:VSI 6))])]
|
1335 |
|
|
""
|
1336 |
|
|
{
|
1337 |
|
|
operands[3] = gen_reg_rtx(mode);
|
1338 |
|
|
operands[4] = gen_reg_rtx(mode);
|
1339 |
|
|
operands[5] = gen_reg_rtx(mode);
|
1340 |
|
|
operands[6] = gen_reg_rtx(mode);
|
1341 |
|
|
})
|
1342 |
|
|
|
1343 |
|
|
(define_insn_and_split "_mulsi3"
|
1344 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
1345 |
|
|
(mult:SI (match_operand:SI 1 "spu_reg_operand" "r")
|
1346 |
|
|
(match_operand:SI 2 "spu_arith_operand" "rK")))
|
1347 |
|
|
(clobber (match_operand:SI 3 "spu_reg_operand" "=&r"))
|
1348 |
|
|
(clobber (match_operand:SI 4 "spu_reg_operand" "=&r"))
|
1349 |
|
|
(clobber (match_operand:SI 5 "spu_reg_operand" "=&r"))
|
1350 |
|
|
(clobber (match_operand:SI 6 "spu_reg_operand" "=&r"))]
|
1351 |
|
|
""
|
1352 |
|
|
"#"
|
1353 |
|
|
""
|
1354 |
|
|
[(set (match_dup:SI 0)
|
1355 |
|
|
(mult:SI (match_dup:SI 1)
|
1356 |
|
|
(match_dup:SI 2)))]
|
1357 |
|
|
{
|
1358 |
|
|
HOST_WIDE_INT val = 0;
|
1359 |
|
|
rtx a = operands[3];
|
1360 |
|
|
rtx b = operands[4];
|
1361 |
|
|
rtx c = operands[5];
|
1362 |
|
|
rtx d = operands[6];
|
1363 |
|
|
if (GET_CODE(operands[2]) == CONST_INT)
|
1364 |
|
|
{
|
1365 |
|
|
val = INTVAL(operands[2]);
|
1366 |
|
|
emit_move_insn(d, operands[2]);
|
1367 |
|
|
operands[2] = d;
|
1368 |
|
|
}
|
1369 |
|
|
if (val && (val & 0xffff) == 0)
|
1370 |
|
|
{
|
1371 |
|
|
emit_insn (gen_mpyh_si(operands[0], operands[2], operands[1]));
|
1372 |
|
|
}
|
1373 |
|
|
else if (val > 0 && val < 0x10000)
|
1374 |
|
|
{
|
1375 |
|
|
rtx cst = satisfies_constraint_K (GEN_INT (val)) ? GEN_INT(val) : d;
|
1376 |
|
|
emit_insn (gen_mpyh_si(a, operands[1], operands[2]));
|
1377 |
|
|
emit_insn (gen_mpyu_si(c, operands[1], cst));
|
1378 |
|
|
emit_insn (gen_addsi3(operands[0], a, c));
|
1379 |
|
|
}
|
1380 |
|
|
else
|
1381 |
|
|
{
|
1382 |
|
|
emit_insn (gen_mpyh_si(a, operands[1], operands[2]));
|
1383 |
|
|
emit_insn (gen_mpyh_si(b, operands[2], operands[1]));
|
1384 |
|
|
emit_insn (gen_mpyu_si(c, operands[1], operands[2]));
|
1385 |
|
|
emit_insn (gen_addsi3(d, a, b));
|
1386 |
|
|
emit_insn (gen_addsi3(operands[0], d, c));
|
1387 |
|
|
}
|
1388 |
|
|
DONE;
|
1389 |
|
|
})
|
1390 |
|
|
|
1391 |
|
|
(define_insn_and_split "_mulv4si3"
|
1392 |
|
|
[(set (match_operand:V4SI 0 "spu_reg_operand" "=r")
|
1393 |
|
|
(mult:V4SI (match_operand:V4SI 1 "spu_reg_operand" "r")
|
1394 |
|
|
(match_operand:V4SI 2 "spu_reg_operand" "r")))
|
1395 |
|
|
(clobber (match_operand:V4SI 3 "spu_reg_operand" "=&r"))
|
1396 |
|
|
(clobber (match_operand:V4SI 4 "spu_reg_operand" "=&r"))
|
1397 |
|
|
(clobber (match_operand:V4SI 5 "spu_reg_operand" "=&r"))
|
1398 |
|
|
(clobber (match_operand:V4SI 6 "spu_reg_operand" "=&r"))]
|
1399 |
|
|
""
|
1400 |
|
|
"#"
|
1401 |
|
|
""
|
1402 |
|
|
[(set (match_dup:V4SI 0)
|
1403 |
|
|
(mult:V4SI (match_dup:V4SI 1)
|
1404 |
|
|
(match_dup:V4SI 2)))]
|
1405 |
|
|
{
|
1406 |
|
|
rtx a = operands[3];
|
1407 |
|
|
rtx b = operands[4];
|
1408 |
|
|
rtx c = operands[5];
|
1409 |
|
|
rtx d = operands[6];
|
1410 |
|
|
rtx op1 = simplify_gen_subreg (V8HImode, operands[1], V4SImode, 0);
|
1411 |
|
|
rtx op2 = simplify_gen_subreg (V8HImode, operands[2], V4SImode, 0);
|
1412 |
|
|
emit_insn (gen_spu_mpyh(a, op1, op2));
|
1413 |
|
|
emit_insn (gen_spu_mpyh(b, op2, op1));
|
1414 |
|
|
emit_insn (gen_spu_mpyu(c, op1, op2));
|
1415 |
|
|
emit_insn (gen_addv4si3(d, a, b));
|
1416 |
|
|
emit_insn (gen_addv4si3(operands[0], d, c));
|
1417 |
|
|
DONE;
|
1418 |
|
|
})
|
1419 |
|
|
|
1420 |
|
|
(define_insn "mulhisi3"
|
1421 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
1422 |
|
|
(mult:SI (sign_extend:SI (match_operand:HI 1 "spu_reg_operand" "r"))
|
1423 |
|
|
(sign_extend:SI (match_operand:HI 2 "spu_reg_operand" "r"))))]
|
1424 |
|
|
""
|
1425 |
|
|
"mpy\t%0,%1,%2"
|
1426 |
|
|
[(set_attr "type" "fp7")])
|
1427 |
|
|
|
1428 |
|
|
(define_insn "mulhisi3_imm"
|
1429 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
1430 |
|
|
(mult:SI (sign_extend:SI (match_operand:HI 1 "spu_reg_operand" "r"))
|
1431 |
|
|
(match_operand:SI 2 "imm_K_operand" "K")))]
|
1432 |
|
|
""
|
1433 |
|
|
"mpyi\t%0,%1,%2"
|
1434 |
|
|
[(set_attr "type" "fp7")])
|
1435 |
|
|
|
1436 |
|
|
(define_insn "umulhisi3"
|
1437 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
1438 |
|
|
(mult:SI (zero_extend:SI (match_operand:HI 1 "spu_reg_operand" "r"))
|
1439 |
|
|
(zero_extend:SI (match_operand:HI 2 "spu_reg_operand" "r"))))]
|
1440 |
|
|
""
|
1441 |
|
|
"mpyu\t%0,%1,%2"
|
1442 |
|
|
[(set_attr "type" "fp7")])
|
1443 |
|
|
|
1444 |
|
|
(define_insn "umulhisi3_imm"
|
1445 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
1446 |
|
|
(mult:SI (zero_extend:SI (match_operand:HI 1 "spu_reg_operand" "r"))
|
1447 |
|
|
(and:SI (match_operand:SI 2 "imm_K_operand" "K") (const_int 65535))))]
|
1448 |
|
|
""
|
1449 |
|
|
"mpyui\t%0,%1,%2"
|
1450 |
|
|
[(set_attr "type" "fp7")])
|
1451 |
|
|
|
1452 |
|
|
(define_insn "mpyu_si"
|
1453 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r,r")
|
1454 |
|
|
(mult:SI (and:SI (match_operand:SI 1 "spu_reg_operand" "r,r")
|
1455 |
|
|
(const_int 65535))
|
1456 |
|
|
(and:SI (match_operand:SI 2 "spu_arith_operand" "r,K")
|
1457 |
|
|
(const_int 65535))))]
|
1458 |
|
|
""
|
1459 |
|
|
"@
|
1460 |
|
|
mpyu\t%0,%1,%2
|
1461 |
|
|
mpyui\t%0,%1,%2"
|
1462 |
|
|
[(set_attr "type" "fp7")])
|
1463 |
|
|
|
1464 |
|
|
;; This isn't always profitable to use. Consider r = a * b + c * d.
|
1465 |
|
|
;; It's faster to do the multiplies in parallel then add them. If we
|
1466 |
|
|
;; merge a multiply and add it prevents the multiplies from happening in
|
1467 |
|
|
;; parallel.
|
1468 |
|
|
(define_insn "mpya_si"
|
1469 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
1470 |
|
|
(plus:SI (mult:SI (sign_extend:SI (match_operand:HI 1 "spu_reg_operand" "r"))
|
1471 |
|
|
(sign_extend:SI (match_operand:HI 2 "spu_reg_operand" "r")))
|
1472 |
|
|
(match_operand:SI 3 "spu_reg_operand" "r")))]
|
1473 |
|
|
"0"
|
1474 |
|
|
"mpya\t%0,%1,%2,%3"
|
1475 |
|
|
[(set_attr "type" "fp7")])
|
1476 |
|
|
|
1477 |
|
|
(define_insn "mpyh_si"
|
1478 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
1479 |
|
|
(mult:SI (and:SI (match_operand:SI 1 "spu_reg_operand" "r")
|
1480 |
|
|
(const_int -65536))
|
1481 |
|
|
(and:SI (match_operand:SI 2 "spu_reg_operand" "r")
|
1482 |
|
|
(const_int 65535))))]
|
1483 |
|
|
""
|
1484 |
|
|
"mpyh\t%0,%1,%2"
|
1485 |
|
|
[(set_attr "type" "fp7")])
|
1486 |
|
|
|
1487 |
|
|
(define_insn "mpys_si"
|
1488 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
1489 |
|
|
(ashiftrt:SI
|
1490 |
|
|
(mult:SI (sign_extend:SI (match_operand:HI 1 "spu_reg_operand" "r"))
|
1491 |
|
|
(sign_extend:SI (match_operand:HI 2 "spu_reg_operand" "r")))
|
1492 |
|
|
(const_int 16)))]
|
1493 |
|
|
""
|
1494 |
|
|
"mpys\t%0,%1,%2"
|
1495 |
|
|
[(set_attr "type" "fp7")])
|
1496 |
|
|
|
1497 |
|
|
(define_insn "mpyhh_si"
|
1498 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
1499 |
|
|
(mult:SI (ashiftrt:SI (match_operand:SI 1 "spu_reg_operand" "r")
|
1500 |
|
|
(const_int 16))
|
1501 |
|
|
(ashiftrt:SI (match_operand:SI 2 "spu_reg_operand" "r")
|
1502 |
|
|
(const_int 16))))]
|
1503 |
|
|
""
|
1504 |
|
|
"mpyhh\t%0,%1,%2"
|
1505 |
|
|
[(set_attr "type" "fp7")])
|
1506 |
|
|
|
1507 |
|
|
(define_insn "mpyhhu_si"
|
1508 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
1509 |
|
|
(mult:SI (lshiftrt:SI (match_operand:SI 1 "spu_reg_operand" "r")
|
1510 |
|
|
(const_int 16))
|
1511 |
|
|
(lshiftrt:SI (match_operand:SI 2 "spu_reg_operand" "r")
|
1512 |
|
|
(const_int 16))))]
|
1513 |
|
|
""
|
1514 |
|
|
"mpyhhu\t%0,%1,%2"
|
1515 |
|
|
[(set_attr "type" "fp7")])
|
1516 |
|
|
|
1517 |
|
|
(define_insn "mpyhha_si"
|
1518 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
1519 |
|
|
(plus:SI (mult:SI (ashiftrt:SI (match_operand:SI 1 "spu_reg_operand" "r")
|
1520 |
|
|
(const_int 16))
|
1521 |
|
|
(ashiftrt:SI (match_operand:SI 2 "spu_reg_operand" "r")
|
1522 |
|
|
(const_int 16)))
|
1523 |
|
|
(match_operand:SI 3 "spu_reg_operand" "0")))]
|
1524 |
|
|
"0"
|
1525 |
|
|
"mpyhha\t%0,%1,%2"
|
1526 |
|
|
[(set_attr "type" "fp7")])
|
1527 |
|
|
|
1528 |
|
|
(define_insn "mul3"
|
1529 |
|
|
[(set (match_operand:VSDF 0 "spu_reg_operand" "=r")
|
1530 |
|
|
(mult:VSDF (match_operand:VSDF 1 "spu_reg_operand" "r")
|
1531 |
|
|
(match_operand:VSDF 2 "spu_reg_operand" "r")))]
|
1532 |
|
|
""
|
1533 |
|
|
"fm\t%0,%1,%2"
|
1534 |
|
|
[(set_attr "type" "fp")])
|
1535 |
|
|
|
1536 |
|
|
(define_insn "fma_"
|
1537 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "=r")
|
1538 |
|
|
(plus:VSF (mult:VSF (match_operand:VSF 1 "spu_reg_operand" "r")
|
1539 |
|
|
(match_operand:VSF 2 "spu_reg_operand" "r"))
|
1540 |
|
|
(match_operand:VSF 3 "spu_reg_operand" "r")))]
|
1541 |
|
|
""
|
1542 |
|
|
"fma\t%0,%1,%2,%3"
|
1543 |
|
|
[(set_attr "type" "fp6")])
|
1544 |
|
|
|
1545 |
|
|
(define_insn "fnms_"
|
1546 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "=r")
|
1547 |
|
|
(minus:VSF (match_operand:VSF 3 "spu_reg_operand" "r")
|
1548 |
|
|
(mult:VSF (match_operand:VSF 1 "spu_reg_operand" "r")
|
1549 |
|
|
(match_operand:VSF 2 "spu_reg_operand" "r"))))]
|
1550 |
|
|
""
|
1551 |
|
|
"fnms\t%0,%1,%2,%3"
|
1552 |
|
|
[(set_attr "type" "fp6")])
|
1553 |
|
|
|
1554 |
|
|
(define_insn "fms_"
|
1555 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "=r")
|
1556 |
|
|
(minus:VSF (mult:VSF (match_operand:VSF 1 "spu_reg_operand" "r")
|
1557 |
|
|
(match_operand:VSF 2 "spu_reg_operand" "r"))
|
1558 |
|
|
(match_operand:VSF 3 "spu_reg_operand" "r")))]
|
1559 |
|
|
""
|
1560 |
|
|
"fms\t%0,%1,%2,%3"
|
1561 |
|
|
[(set_attr "type" "fp6")])
|
1562 |
|
|
|
1563 |
|
|
(define_insn "fma_"
|
1564 |
|
|
[(set (match_operand:VDF 0 "spu_reg_operand" "=r")
|
1565 |
|
|
(plus:VDF (mult:VDF (match_operand:VDF 1 "spu_reg_operand" "r")
|
1566 |
|
|
(match_operand:VDF 2 "spu_reg_operand" "r"))
|
1567 |
|
|
(match_operand:VDF 3 "spu_reg_operand" "0")))]
|
1568 |
|
|
""
|
1569 |
|
|
"dfma\t%0,%1,%2"
|
1570 |
|
|
[(set_attr "type" "fpd")])
|
1571 |
|
|
|
1572 |
|
|
(define_insn "fnma_"
|
1573 |
|
|
[(set (match_operand:VDF 0 "spu_reg_operand" "=r")
|
1574 |
|
|
(neg:VDF (plus:VDF (mult:VDF (match_operand:VDF 1 "spu_reg_operand" "r")
|
1575 |
|
|
(match_operand:VDF 2 "spu_reg_operand" "r"))
|
1576 |
|
|
(match_operand:VDF 3 "spu_reg_operand" "0"))))]
|
1577 |
|
|
""
|
1578 |
|
|
"dfnma\t%0,%1,%2"
|
1579 |
|
|
[(set_attr "type" "fpd")])
|
1580 |
|
|
|
1581 |
|
|
(define_insn "fnms_"
|
1582 |
|
|
[(set (match_operand:VDF 0 "spu_reg_operand" "=r")
|
1583 |
|
|
(minus:VDF (match_operand:VDF 3 "spu_reg_operand" "0")
|
1584 |
|
|
(mult:VDF (match_operand:VDF 1 "spu_reg_operand" "r")
|
1585 |
|
|
(match_operand:VDF 2 "spu_reg_operand" "r"))))]
|
1586 |
|
|
""
|
1587 |
|
|
"dfnms\t%0,%1,%2"
|
1588 |
|
|
[(set_attr "type" "fpd")])
|
1589 |
|
|
|
1590 |
|
|
(define_insn "fms_"
|
1591 |
|
|
[(set (match_operand:VDF 0 "spu_reg_operand" "=r")
|
1592 |
|
|
(minus:VDF (mult:VDF (match_operand:VDF 1 "spu_reg_operand" "r")
|
1593 |
|
|
(match_operand:VDF 2 "spu_reg_operand" "r"))
|
1594 |
|
|
(match_operand:VDF 3 "spu_reg_operand" "0")))]
|
1595 |
|
|
""
|
1596 |
|
|
"dfms\t%0,%1,%2"
|
1597 |
|
|
[(set_attr "type" "fpd")])
|
1598 |
|
|
|
1599 |
|
|
|
1600 |
|
|
;; mul highpart, used for divide by constant optimizations.
|
1601 |
|
|
|
1602 |
|
|
(define_expand "smulsi3_highpart"
|
1603 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
1604 |
|
|
(truncate:SI
|
1605 |
|
|
(ashiftrt:DI
|
1606 |
|
|
(mult:DI (sign_extend:DI (match_operand:SI 1 "register_operand" ""))
|
1607 |
|
|
(sign_extend:DI (match_operand:SI 2 "register_operand" "")))
|
1608 |
|
|
(const_int 32))))]
|
1609 |
|
|
""
|
1610 |
|
|
{
|
1611 |
|
|
rtx t0 = gen_reg_rtx (SImode);
|
1612 |
|
|
rtx t1 = gen_reg_rtx (SImode);
|
1613 |
|
|
rtx t2 = gen_reg_rtx (SImode);
|
1614 |
|
|
rtx t3 = gen_reg_rtx (SImode);
|
1615 |
|
|
rtx t4 = gen_reg_rtx (SImode);
|
1616 |
|
|
rtx t5 = gen_reg_rtx (SImode);
|
1617 |
|
|
rtx t6 = gen_reg_rtx (SImode);
|
1618 |
|
|
rtx t7 = gen_reg_rtx (SImode);
|
1619 |
|
|
rtx t8 = gen_reg_rtx (SImode);
|
1620 |
|
|
rtx t9 = gen_reg_rtx (SImode);
|
1621 |
|
|
rtx t11 = gen_reg_rtx (SImode);
|
1622 |
|
|
rtx t12 = gen_reg_rtx (SImode);
|
1623 |
|
|
rtx t14 = gen_reg_rtx (SImode);
|
1624 |
|
|
rtx t15 = gen_reg_rtx (HImode);
|
1625 |
|
|
rtx t16 = gen_reg_rtx (HImode);
|
1626 |
|
|
rtx t17 = gen_reg_rtx (HImode);
|
1627 |
|
|
rtx t18 = gen_reg_rtx (HImode);
|
1628 |
|
|
rtx t19 = gen_reg_rtx (SImode);
|
1629 |
|
|
rtx t20 = gen_reg_rtx (SImode);
|
1630 |
|
|
rtx t21 = gen_reg_rtx (SImode);
|
1631 |
|
|
rtx op1_hi = gen_rtx_SUBREG (HImode, operands[1], 2);
|
1632 |
|
|
rtx op2_hi = gen_rtx_SUBREG (HImode, operands[2], 2);
|
1633 |
|
|
rtx t0_hi = gen_rtx_SUBREG (HImode, t0, 2);
|
1634 |
|
|
rtx t1_hi = gen_rtx_SUBREG (HImode, t1, 2);
|
1635 |
|
|
|
1636 |
|
|
rtx insn = emit_insn (gen_lshrsi3 (t0, operands[1], GEN_INT (16)));
|
1637 |
|
|
emit_insn (gen_lshrsi3 (t1, operands[2], GEN_INT (16)));
|
1638 |
|
|
emit_insn (gen_umulhisi3 (t2, op1_hi, op2_hi));
|
1639 |
|
|
emit_insn (gen_mpyh_si (t3, operands[1], operands[2]));
|
1640 |
|
|
emit_insn (gen_mpyh_si (t4, operands[2], operands[1]));
|
1641 |
|
|
emit_insn (gen_mpyhh_si (t5, operands[1], operands[2]));
|
1642 |
|
|
emit_insn (gen_mpys_si (t6, t0_hi, op2_hi));
|
1643 |
|
|
emit_insn (gen_mpys_si (t7, t1_hi, op1_hi));
|
1644 |
|
|
|
1645 |
|
|
/* Gen carry bits (in t9 and t11). */
|
1646 |
|
|
emit_insn (gen_addsi3 (t8, t2, t3));
|
1647 |
|
|
emit_insn (gen_cg_si (t9, t2, t3));
|
1648 |
|
|
emit_insn (gen_cg_si (t11, t8, t4));
|
1649 |
|
|
|
1650 |
|
|
/* Gen high 32 bits in operand[0]. Correct for mpys. */
|
1651 |
|
|
emit_insn (gen_addx_si (t12, t5, t6, t9));
|
1652 |
|
|
emit_insn (gen_addx_si (t14, t12, t7, t11));
|
1653 |
|
|
|
1654 |
|
|
/* mpys treats both operands as signed when we really want it to treat
|
1655 |
|
|
the first operand as signed and the second operand as unsigned.
|
1656 |
|
|
The code below corrects for that difference. */
|
1657 |
|
|
emit_insn (gen_cgt_hi (t15, op1_hi, GEN_INT (-1)));
|
1658 |
|
|
emit_insn (gen_cgt_hi (t16, op2_hi, GEN_INT (-1)));
|
1659 |
|
|
emit_insn (gen_andc_hi (t17, t1_hi, t15));
|
1660 |
|
|
emit_insn (gen_andc_hi (t18, t0_hi, t16));
|
1661 |
|
|
emit_insn (gen_extendhisi2 (t19, t17));
|
1662 |
|
|
emit_insn (gen_extendhisi2 (t20, t18));
|
1663 |
|
|
emit_insn (gen_addsi3 (t21, t19, t20));
|
1664 |
|
|
emit_insn (gen_addsi3 (operands[0], t14, t21));
|
1665 |
|
|
unshare_all_rtl_in_chain (insn);
|
1666 |
|
|
DONE;
|
1667 |
|
|
})
|
1668 |
|
|
|
1669 |
|
|
(define_expand "umulsi3_highpart"
|
1670 |
|
|
[(set (match_operand:SI 0 "register_operand" "")
|
1671 |
|
|
(truncate:SI
|
1672 |
|
|
(ashiftrt:DI
|
1673 |
|
|
(mult:DI (zero_extend:DI (match_operand:SI 1 "register_operand" ""))
|
1674 |
|
|
(zero_extend:DI (match_operand:SI 2 "register_operand" "")))
|
1675 |
|
|
(const_int 32))))]
|
1676 |
|
|
""
|
1677 |
|
|
|
1678 |
|
|
{
|
1679 |
|
|
rtx t0 = gen_reg_rtx (SImode);
|
1680 |
|
|
rtx t1 = gen_reg_rtx (SImode);
|
1681 |
|
|
rtx t2 = gen_reg_rtx (SImode);
|
1682 |
|
|
rtx t3 = gen_reg_rtx (SImode);
|
1683 |
|
|
rtx t4 = gen_reg_rtx (SImode);
|
1684 |
|
|
rtx t5 = gen_reg_rtx (SImode);
|
1685 |
|
|
rtx t6 = gen_reg_rtx (SImode);
|
1686 |
|
|
rtx t7 = gen_reg_rtx (SImode);
|
1687 |
|
|
rtx t8 = gen_reg_rtx (SImode);
|
1688 |
|
|
rtx t9 = gen_reg_rtx (SImode);
|
1689 |
|
|
rtx t10 = gen_reg_rtx (SImode);
|
1690 |
|
|
rtx t12 = gen_reg_rtx (SImode);
|
1691 |
|
|
rtx t13 = gen_reg_rtx (SImode);
|
1692 |
|
|
rtx t14 = gen_reg_rtx (SImode);
|
1693 |
|
|
rtx op1_hi = gen_rtx_SUBREG (HImode, operands[1], 2);
|
1694 |
|
|
rtx op2_hi = gen_rtx_SUBREG (HImode, operands[2], 2);
|
1695 |
|
|
rtx t0_hi = gen_rtx_SUBREG (HImode, t0, 2);
|
1696 |
|
|
|
1697 |
|
|
rtx insn = emit_insn (gen_rotlsi3 (t0, operands[2], GEN_INT (16)));
|
1698 |
|
|
emit_insn (gen_umulhisi3 (t1, op1_hi, op2_hi));
|
1699 |
|
|
emit_insn (gen_umulhisi3 (t2, op1_hi, t0_hi));
|
1700 |
|
|
emit_insn (gen_mpyhhu_si (t3, operands[1], t0));
|
1701 |
|
|
emit_insn (gen_mpyhhu_si (t4, operands[1], operands[2]));
|
1702 |
|
|
emit_insn (gen_ashlsi3 (t5, t2, GEN_INT (16)));
|
1703 |
|
|
emit_insn (gen_ashlsi3 (t6, t3, GEN_INT (16)));
|
1704 |
|
|
emit_insn (gen_lshrsi3 (t7, t2, GEN_INT (16)));
|
1705 |
|
|
emit_insn (gen_lshrsi3 (t8, t3, GEN_INT (16)));
|
1706 |
|
|
|
1707 |
|
|
/* Gen carry bits (in t10 and t12). */
|
1708 |
|
|
emit_insn (gen_addsi3 (t9, t1, t5));
|
1709 |
|
|
emit_insn (gen_cg_si (t10, t1, t5));
|
1710 |
|
|
emit_insn (gen_cg_si (t12, t9, t6));
|
1711 |
|
|
|
1712 |
|
|
/* Gen high 32 bits in operand[0]. */
|
1713 |
|
|
emit_insn (gen_addx_si (t13, t4, t7, t10));
|
1714 |
|
|
emit_insn (gen_addx_si (t14, t13, t8, t12));
|
1715 |
|
|
emit_insn (gen_movsi (operands[0], t14));
|
1716 |
|
|
unshare_all_rtl_in_chain (insn);
|
1717 |
|
|
|
1718 |
|
|
DONE;
|
1719 |
|
|
})
|
1720 |
|
|
|
1721 |
|
|
;; div
|
1722 |
|
|
|
1723 |
|
|
;; Not necessarily the best implementation of divide but faster then
|
1724 |
|
|
;; the default that gcc provides because this is inlined and it uses
|
1725 |
|
|
;; clz.
|
1726 |
|
|
(define_insn "divmodsi4"
|
1727 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=&r")
|
1728 |
|
|
(div:SI (match_operand:SI 1 "spu_reg_operand" "r")
|
1729 |
|
|
(match_operand:SI 2 "spu_reg_operand" "r")))
|
1730 |
|
|
(set (match_operand:SI 3 "spu_reg_operand" "=&r")
|
1731 |
|
|
(mod:SI (match_dup 1)
|
1732 |
|
|
(match_dup 2)))
|
1733 |
|
|
(clobber (match_scratch:SI 4 "=&r"))
|
1734 |
|
|
(clobber (match_scratch:SI 5 "=&r"))
|
1735 |
|
|
(clobber (match_scratch:SI 6 "=&r"))
|
1736 |
|
|
(clobber (match_scratch:SI 7 "=&r"))
|
1737 |
|
|
(clobber (match_scratch:SI 8 "=&r"))
|
1738 |
|
|
(clobber (match_scratch:SI 9 "=&r"))
|
1739 |
|
|
(clobber (match_scratch:SI 10 "=&r"))
|
1740 |
|
|
(clobber (match_scratch:SI 11 "=&r"))
|
1741 |
|
|
(clobber (match_scratch:SI 12 "=&r"))
|
1742 |
|
|
(clobber (reg:SI 130))]
|
1743 |
|
|
""
|
1744 |
|
|
"heqi %2,0\\n\\
|
1745 |
|
|
hbrr 3f,1f\\n\\
|
1746 |
|
|
sfi %8,%1,0\\n\\
|
1747 |
|
|
sfi %9,%2,0\\n\\
|
1748 |
|
|
cgti %10,%1,-1\\n\\
|
1749 |
|
|
cgti %11,%2,-1\\n\\
|
1750 |
|
|
selb %8,%8,%1,%10\\n\\
|
1751 |
|
|
selb %9,%9,%2,%11\\n\\
|
1752 |
|
|
clz %4,%8\\n\\
|
1753 |
|
|
clz %7,%9\\n\\
|
1754 |
|
|
il %5,1\\n\\
|
1755 |
|
|
fsmbi %0,0\\n\\
|
1756 |
|
|
sf %7,%4,%7\\n\\
|
1757 |
|
|
shlqbyi %3,%8,0\\n\\
|
1758 |
|
|
xor %11,%10,%11\\n\\
|
1759 |
|
|
shl %5,%5,%7\\n\\
|
1760 |
|
|
shl %4,%9,%7\\n\\
|
1761 |
|
|
lnop \\n\\
|
1762 |
|
|
1: or %12,%0,%5\\n\\
|
1763 |
|
|
rotqmbii %5,%5,-1\\n\\
|
1764 |
|
|
clgt %6,%4,%3\\n\\
|
1765 |
|
|
lnop \\n\\
|
1766 |
|
|
sf %7,%4,%3\\n\\
|
1767 |
|
|
rotqmbii %4,%4,-1\\n\\
|
1768 |
|
|
selb %0,%12,%0,%6\\n\\
|
1769 |
|
|
lnop \\n\\
|
1770 |
|
|
selb %3,%7,%3,%6\\n\\
|
1771 |
|
|
3: brnz %5,1b\\n\\
|
1772 |
|
|
2: sfi %8,%3,0\\n\\
|
1773 |
|
|
sfi %9,%0,0\\n\\
|
1774 |
|
|
selb %3,%8,%3,%10\\n\\
|
1775 |
|
|
selb %0,%0,%9,%11"
|
1776 |
|
|
[(set_attr "type" "multi0")
|
1777 |
|
|
(set_attr "length" "128")])
|
1778 |
|
|
|
1779 |
|
|
(define_insn "udivmodsi4"
|
1780 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=&r")
|
1781 |
|
|
(udiv:SI (match_operand:SI 1 "spu_reg_operand" "r")
|
1782 |
|
|
(match_operand:SI 2 "spu_reg_operand" "r")))
|
1783 |
|
|
(set (match_operand:SI 3 "spu_reg_operand" "=&r")
|
1784 |
|
|
(umod:SI (match_dup 1)
|
1785 |
|
|
(match_dup 2)))
|
1786 |
|
|
(clobber (match_scratch:SI 4 "=&r"))
|
1787 |
|
|
(clobber (match_scratch:SI 5 "=&r"))
|
1788 |
|
|
(clobber (match_scratch:SI 6 "=&r"))
|
1789 |
|
|
(clobber (match_scratch:SI 7 "=&r"))
|
1790 |
|
|
(clobber (match_scratch:SI 8 "=&r"))
|
1791 |
|
|
(clobber (reg:SI 130))]
|
1792 |
|
|
""
|
1793 |
|
|
"heqi %2,0\\n\\
|
1794 |
|
|
hbrr 3f,1f\\n\\
|
1795 |
|
|
clz %7,%2\\n\\
|
1796 |
|
|
clz %4,%1\\n\\
|
1797 |
|
|
il %5,1\\n\\
|
1798 |
|
|
fsmbi %0,0\\n\\
|
1799 |
|
|
sf %7,%4,%7\\n\\
|
1800 |
|
|
ori %3,%1,0\\n\\
|
1801 |
|
|
shl %5,%5,%7\\n\\
|
1802 |
|
|
shl %4,%2,%7\\n\\
|
1803 |
|
|
1: or %8,%0,%5\\n\\
|
1804 |
|
|
rotqmbii %5,%5,-1\\n\\
|
1805 |
|
|
clgt %6,%4,%3\\n\\
|
1806 |
|
|
lnop \\n\\
|
1807 |
|
|
sf %7,%4,%3\\n\\
|
1808 |
|
|
rotqmbii %4,%4,-1\\n\\
|
1809 |
|
|
selb %0,%8,%0,%6\\n\\
|
1810 |
|
|
lnop \\n\\
|
1811 |
|
|
selb %3,%7,%3,%6\\n\\
|
1812 |
|
|
3: brnz %5,1b\\n\\
|
1813 |
|
|
2:"
|
1814 |
|
|
[(set_attr "type" "multi0")
|
1815 |
|
|
(set_attr "length" "80")])
|
1816 |
|
|
|
1817 |
|
|
(define_expand "div3"
|
1818 |
|
|
[(parallel
|
1819 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "")
|
1820 |
|
|
(div:VSF (match_operand:VSF 1 "spu_reg_operand" "")
|
1821 |
|
|
(match_operand:VSF 2 "spu_reg_operand" "")))
|
1822 |
|
|
(clobber (match_scratch:VSF 3 ""))
|
1823 |
|
|
(clobber (match_scratch:VSF 4 ""))
|
1824 |
|
|
(clobber (match_scratch:VSF 5 ""))])]
|
1825 |
|
|
""
|
1826 |
|
|
"")
|
1827 |
|
|
|
1828 |
|
|
(define_insn_and_split "*div3_fast"
|
1829 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "=r")
|
1830 |
|
|
(div:VSF (match_operand:VSF 1 "spu_reg_operand" "r")
|
1831 |
|
|
(match_operand:VSF 2 "spu_reg_operand" "r")))
|
1832 |
|
|
(clobber (match_scratch:VSF 3 "=&r"))
|
1833 |
|
|
(clobber (match_scratch:VSF 4 "=&r"))
|
1834 |
|
|
(clobber (scratch:VSF))]
|
1835 |
|
|
"flag_unsafe_math_optimizations"
|
1836 |
|
|
"#"
|
1837 |
|
|
"reload_completed"
|
1838 |
|
|
[(set (match_dup:VSF 0)
|
1839 |
|
|
(div:VSF (match_dup:VSF 1)
|
1840 |
|
|
(match_dup:VSF 2)))
|
1841 |
|
|
(clobber (match_dup:VSF 3))
|
1842 |
|
|
(clobber (match_dup:VSF 4))
|
1843 |
|
|
(clobber (scratch:VSF))]
|
1844 |
|
|
{
|
1845 |
|
|
emit_insn (gen_frest_(operands[3], operands[2]));
|
1846 |
|
|
emit_insn (gen_fi_(operands[3], operands[2], operands[3]));
|
1847 |
|
|
emit_insn (gen_mul3(operands[4], operands[1], operands[3]));
|
1848 |
|
|
emit_insn (gen_fnms_(operands[0], operands[4], operands[2], operands[1]));
|
1849 |
|
|
emit_insn (gen_fma_(operands[0], operands[0], operands[3], operands[4]));
|
1850 |
|
|
DONE;
|
1851 |
|
|
})
|
1852 |
|
|
|
1853 |
|
|
(define_insn_and_split "*div3_adjusted"
|
1854 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "=r")
|
1855 |
|
|
(div:VSF (match_operand:VSF 1 "spu_reg_operand" "r")
|
1856 |
|
|
(match_operand:VSF 2 "spu_reg_operand" "r")))
|
1857 |
|
|
(clobber (match_scratch:VSF 3 "=&r"))
|
1858 |
|
|
(clobber (match_scratch:VSF 4 "=&r"))
|
1859 |
|
|
(clobber (match_scratch:VSF 5 "=&r"))]
|
1860 |
|
|
"!flag_unsafe_math_optimizations"
|
1861 |
|
|
"#"
|
1862 |
|
|
"reload_completed"
|
1863 |
|
|
[(set (match_dup:VSF 0)
|
1864 |
|
|
(div:VSF (match_dup:VSF 1)
|
1865 |
|
|
(match_dup:VSF 2)))
|
1866 |
|
|
(clobber (match_dup:VSF 3))
|
1867 |
|
|
(clobber (match_dup:VSF 4))
|
1868 |
|
|
(clobber (match_dup:VSF 5))]
|
1869 |
|
|
{
|
1870 |
|
|
emit_insn (gen_frest_ (operands[3], operands[2]));
|
1871 |
|
|
emit_insn (gen_fi_ (operands[3], operands[2], operands[3]));
|
1872 |
|
|
emit_insn (gen_mul3 (operands[4], operands[1], operands[3]));
|
1873 |
|
|
emit_insn (gen_fnms_ (operands[5], operands[4], operands[2], operands[1]));
|
1874 |
|
|
emit_insn (gen_fma_ (operands[3], operands[5], operands[3], operands[4]));
|
1875 |
|
|
|
1876 |
|
|
/* Due to truncation error, the quotient result may be low by 1 ulp.
|
1877 |
|
|
Conditionally add one if the estimate is too small in magnitude. */
|
1878 |
|
|
|
1879 |
|
|
emit_move_insn (gen_lowpart (mode, operands[4]),
|
1880 |
|
|
spu_const (mode, 0x80000000ULL));
|
1881 |
|
|
emit_move_insn (gen_lowpart (mode, operands[5]),
|
1882 |
|
|
spu_const (mode, 0x3f800000ULL));
|
1883 |
|
|
emit_insn (gen_selb (operands[5], operands[5], operands[1], operands[4]));
|
1884 |
|
|
|
1885 |
|
|
emit_insn (gen_add3 (gen_lowpart (mode, operands[4]),
|
1886 |
|
|
gen_lowpart (mode, operands[3]),
|
1887 |
|
|
spu_const (mode, 1)));
|
1888 |
|
|
emit_insn (gen_fnms_ (operands[0], operands[2], operands[4], operands[1]));
|
1889 |
|
|
emit_insn (gen_mul3 (operands[0], operands[0], operands[5]));
|
1890 |
|
|
emit_insn (gen_cgt_ (gen_lowpart (mode, operands[0]),
|
1891 |
|
|
gen_lowpart (mode, operands[0]),
|
1892 |
|
|
spu_const (mode, -1)));
|
1893 |
|
|
emit_insn (gen_selb (operands[0], operands[3], operands[4], operands[0]));
|
1894 |
|
|
DONE;
|
1895 |
|
|
})
|
1896 |
|
|
|
1897 |
|
|
|
1898 |
|
|
;; sqrt
|
1899 |
|
|
|
1900 |
|
|
(define_insn_and_split "sqrtsf2"
|
1901 |
|
|
[(set (match_operand:SF 0 "spu_reg_operand" "=r")
|
1902 |
|
|
(sqrt:SF (match_operand:SF 1 "spu_reg_operand" "r")))
|
1903 |
|
|
(clobber (match_scratch:SF 2 "=&r"))
|
1904 |
|
|
(clobber (match_scratch:SF 3 "=&r"))
|
1905 |
|
|
(clobber (match_scratch:SF 4 "=&r"))
|
1906 |
|
|
(clobber (match_scratch:SF 5 "=&r"))]
|
1907 |
|
|
""
|
1908 |
|
|
"#"
|
1909 |
|
|
"reload_completed"
|
1910 |
|
|
[(set (match_dup:SF 0)
|
1911 |
|
|
(sqrt:SF (match_dup:SF 1)))
|
1912 |
|
|
(clobber (match_dup:SF 2))
|
1913 |
|
|
(clobber (match_dup:SF 3))
|
1914 |
|
|
(clobber (match_dup:SF 4))
|
1915 |
|
|
(clobber (match_dup:SF 5))]
|
1916 |
|
|
{
|
1917 |
|
|
emit_move_insn (operands[3],spu_float_const(\"0.5\",SFmode));
|
1918 |
|
|
emit_move_insn (operands[4],spu_float_const(\"1.00000011920928955078125\",SFmode));
|
1919 |
|
|
emit_insn (gen_frsqest_sf(operands[2],operands[1]));
|
1920 |
|
|
emit_insn (gen_fi_sf(operands[2],operands[1],operands[2]));
|
1921 |
|
|
emit_insn (gen_mulsf3(operands[5],operands[2],operands[1]));
|
1922 |
|
|
emit_insn (gen_mulsf3(operands[3],operands[5],operands[3]));
|
1923 |
|
|
emit_insn (gen_fnms_sf(operands[4],operands[2],operands[5],operands[4]));
|
1924 |
|
|
emit_insn (gen_fma_sf(operands[0],operands[4],operands[3],operands[5]));
|
1925 |
|
|
DONE;
|
1926 |
|
|
})
|
1927 |
|
|
|
1928 |
|
|
(define_insn "frest_"
|
1929 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "=r")
|
1930 |
|
|
(unspec:VSF [(match_operand:VSF 1 "spu_reg_operand" "r")] UNSPEC_FREST))]
|
1931 |
|
|
""
|
1932 |
|
|
"frest\t%0,%1"
|
1933 |
|
|
[(set_attr "type" "shuf")])
|
1934 |
|
|
|
1935 |
|
|
(define_insn "frsqest_"
|
1936 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "=r")
|
1937 |
|
|
(unspec:VSF [(match_operand:VSF 1 "spu_reg_operand" "r")] UNSPEC_FRSQEST))]
|
1938 |
|
|
""
|
1939 |
|
|
"frsqest\t%0,%1"
|
1940 |
|
|
[(set_attr "type" "shuf")])
|
1941 |
|
|
|
1942 |
|
|
(define_insn "fi_"
|
1943 |
|
|
[(set (match_operand:VSF 0 "spu_reg_operand" "=r")
|
1944 |
|
|
(unspec:VSF [(match_operand:VSF 1 "spu_reg_operand" "r")
|
1945 |
|
|
(match_operand:VSF 2 "spu_reg_operand" "r")] UNSPEC_FI))]
|
1946 |
|
|
""
|
1947 |
|
|
"fi\t%0,%1,%2"
|
1948 |
|
|
[(set_attr "type" "fp7")])
|
1949 |
|
|
|
1950 |
|
|
|
1951 |
|
|
;; and
|
1952 |
|
|
|
1953 |
|
|
(define_insn "and3"
|
1954 |
|
|
[(set (match_operand:MOV 0 "spu_reg_operand" "=r,r")
|
1955 |
|
|
(and:MOV (match_operand:MOV 1 "spu_reg_operand" "r,r")
|
1956 |
|
|
(match_operand:MOV 2 "spu_logical_operand" "r,C")))]
|
1957 |
|
|
""
|
1958 |
|
|
"@
|
1959 |
|
|
and\t%0,%1,%2
|
1960 |
|
|
and%j2i\t%0,%1,%J2")
|
1961 |
|
|
|
1962 |
|
|
(define_insn "anddi3"
|
1963 |
|
|
[(set (match_operand:DI 0 "spu_reg_operand" "=r,r")
|
1964 |
|
|
(and:DI (match_operand:DI 1 "spu_reg_operand" "r,r")
|
1965 |
|
|
(match_operand:DI 2 "spu_logical_operand" "r,c")))]
|
1966 |
|
|
""
|
1967 |
|
|
"@
|
1968 |
|
|
and\t%0,%1,%2
|
1969 |
|
|
and%k2i\t%0,%1,%K2")
|
1970 |
|
|
|
1971 |
|
|
(define_insn "andti3"
|
1972 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r")
|
1973 |
|
|
(and:TI (match_operand:TI 1 "spu_reg_operand" "r,r")
|
1974 |
|
|
(match_operand:TI 2 "spu_logical_operand" "r,Y")))]
|
1975 |
|
|
""
|
1976 |
|
|
"@
|
1977 |
|
|
and\t%0,%1,%2
|
1978 |
|
|
and%m2i\t%0,%1,%L2")
|
1979 |
|
|
|
1980 |
|
|
(define_insn "andc_"
|
1981 |
|
|
[(set (match_operand:ALL 0 "spu_reg_operand" "=r")
|
1982 |
|
|
(and:ALL (not:ALL (match_operand:ALL 2 "spu_reg_operand" "r"))
|
1983 |
|
|
(match_operand:ALL 1 "spu_reg_operand" "r")))]
|
1984 |
|
|
""
|
1985 |
|
|
"andc\t%0,%1,%2")
|
1986 |
|
|
|
1987 |
|
|
(define_insn "nand_"
|
1988 |
|
|
[(set (match_operand:ALL 0 "spu_reg_operand" "=r")
|
1989 |
|
|
(not:ALL (and:ALL (match_operand:ALL 2 "spu_reg_operand" "r")
|
1990 |
|
|
(match_operand:ALL 1 "spu_reg_operand" "r"))))]
|
1991 |
|
|
""
|
1992 |
|
|
"nand\t%0,%1,%2")
|
1993 |
|
|
|
1994 |
|
|
|
1995 |
|
|
;; ior
|
1996 |
|
|
|
1997 |
|
|
(define_insn "ior3"
|
1998 |
|
|
[(set (match_operand:MOV 0 "spu_reg_operand" "=r,r,r")
|
1999 |
|
|
(ior:MOV (match_operand:MOV 1 "spu_reg_operand" "r,r,0")
|
2000 |
|
|
(match_operand:MOV 2 "spu_ior_operand" "r,C,D")))]
|
2001 |
|
|
""
|
2002 |
|
|
"@
|
2003 |
|
|
or\t%0,%1,%2
|
2004 |
|
|
or%j2i\t%0,%1,%J2
|
2005 |
|
|
iohl\t%0,%J2")
|
2006 |
|
|
|
2007 |
|
|
(define_insn "iordi3"
|
2008 |
|
|
[(set (match_operand:DI 0 "spu_reg_operand" "=r,r,r")
|
2009 |
|
|
(ior:DI (match_operand:DI 1 "spu_reg_operand" "r,r,0")
|
2010 |
|
|
(match_operand:DI 2 "spu_ior_operand" "r,c,d")))]
|
2011 |
|
|
""
|
2012 |
|
|
"@
|
2013 |
|
|
or\t%0,%1,%2
|
2014 |
|
|
or%k2i\t%0,%1,%K2
|
2015 |
|
|
iohl\t%0,%K2")
|
2016 |
|
|
|
2017 |
|
|
(define_insn "iorti3"
|
2018 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r,r")
|
2019 |
|
|
(ior:TI (match_operand:TI 1 "spu_reg_operand" "r,r,0")
|
2020 |
|
|
(match_operand:TI 2 "spu_ior_operand" "r,Y,Z")))]
|
2021 |
|
|
""
|
2022 |
|
|
"@
|
2023 |
|
|
or\t%0,%1,%2
|
2024 |
|
|
or%m2i\t%0,%1,%L2
|
2025 |
|
|
iohl\t%0,%L2")
|
2026 |
|
|
|
2027 |
|
|
(define_insn "orc_"
|
2028 |
|
|
[(set (match_operand:ALL 0 "spu_reg_operand" "=r")
|
2029 |
|
|
(ior:ALL (not:ALL (match_operand:ALL 2 "spu_reg_operand" "r"))
|
2030 |
|
|
(match_operand:ALL 1 "spu_reg_operand" "r")))]
|
2031 |
|
|
""
|
2032 |
|
|
"orc\t%0,%1,%2")
|
2033 |
|
|
|
2034 |
|
|
(define_insn "nor_"
|
2035 |
|
|
[(set (match_operand:ALL 0 "spu_reg_operand" "=r")
|
2036 |
|
|
(not:ALL (ior:ALL (match_operand:ALL 1 "spu_reg_operand" "r")
|
2037 |
|
|
(match_operand:ALL 2 "spu_reg_operand" "r"))))]
|
2038 |
|
|
""
|
2039 |
|
|
"nor\t%0,%1,%2")
|
2040 |
|
|
|
2041 |
|
|
;; xor
|
2042 |
|
|
|
2043 |
|
|
(define_insn "xor3"
|
2044 |
|
|
[(set (match_operand:MOV 0 "spu_reg_operand" "=r,r")
|
2045 |
|
|
(xor:MOV (match_operand:MOV 1 "spu_reg_operand" "r,r")
|
2046 |
|
|
(match_operand:MOV 2 "spu_logical_operand" "r,B")))]
|
2047 |
|
|
""
|
2048 |
|
|
"@
|
2049 |
|
|
xor\t%0,%1,%2
|
2050 |
|
|
xor%j2i\t%0,%1,%J2")
|
2051 |
|
|
|
2052 |
|
|
(define_insn "xordi3"
|
2053 |
|
|
[(set (match_operand:DI 0 "spu_reg_operand" "=r,r")
|
2054 |
|
|
(xor:DI (match_operand:DI 1 "spu_reg_operand" "r,r")
|
2055 |
|
|
(match_operand:DI 2 "spu_logical_operand" "r,c")))]
|
2056 |
|
|
""
|
2057 |
|
|
"@
|
2058 |
|
|
xor\t%0,%1,%2
|
2059 |
|
|
xor%k2i\t%0,%1,%K2")
|
2060 |
|
|
|
2061 |
|
|
(define_insn "xorti3"
|
2062 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r")
|
2063 |
|
|
(xor:TI (match_operand:TI 1 "spu_reg_operand" "r,r")
|
2064 |
|
|
(match_operand:TI 2 "spu_logical_operand" "r,Y")))]
|
2065 |
|
|
""
|
2066 |
|
|
"@
|
2067 |
|
|
xor\t%0,%1,%2
|
2068 |
|
|
xor%m2i\t%0,%1,%L2")
|
2069 |
|
|
|
2070 |
|
|
(define_insn "eqv_"
|
2071 |
|
|
[(set (match_operand:ALL 0 "spu_reg_operand" "=r")
|
2072 |
|
|
(not:ALL (xor:ALL (match_operand:ALL 1 "spu_reg_operand" "r")
|
2073 |
|
|
(match_operand:ALL 2 "spu_reg_operand" "r"))))]
|
2074 |
|
|
""
|
2075 |
|
|
"eqv\t%0,%1,%2")
|
2076 |
|
|
|
2077 |
|
|
;; one_cmpl
|
2078 |
|
|
|
2079 |
|
|
(define_insn "one_cmpl2"
|
2080 |
|
|
[(set (match_operand:ALL 0 "spu_reg_operand" "=r")
|
2081 |
|
|
(not:ALL (match_operand:ALL 1 "spu_reg_operand" "r")))]
|
2082 |
|
|
""
|
2083 |
|
|
"nor\t%0,%1,%1")
|
2084 |
|
|
|
2085 |
|
|
|
2086 |
|
|
;; selb
|
2087 |
|
|
|
2088 |
|
|
(define_expand "selb"
|
2089 |
|
|
[(set (match_operand 0 "spu_reg_operand" "")
|
2090 |
|
|
(unspec [(match_operand 1 "spu_reg_operand" "")
|
2091 |
|
|
(match_operand 2 "spu_reg_operand" "")
|
2092 |
|
|
(match_operand 3 "spu_reg_operand" "")] UNSPEC_SELB))]
|
2093 |
|
|
""
|
2094 |
|
|
{
|
2095 |
|
|
rtx s = gen__selb (operands[0], operands[1], operands[2], operands[3]);
|
2096 |
|
|
PUT_MODE (SET_SRC (s), GET_MODE (operands[0]));
|
2097 |
|
|
emit_insn (s);
|
2098 |
|
|
DONE;
|
2099 |
|
|
})
|
2100 |
|
|
|
2101 |
|
|
;; This could be defined as a combination of logical operations, but at
|
2102 |
|
|
;; one time it caused a crash due to recursive expansion of rtl during CSE.
|
2103 |
|
|
(define_insn "_selb"
|
2104 |
|
|
[(set (match_operand 0 "spu_reg_operand" "=r")
|
2105 |
|
|
(unspec [(match_operand 1 "spu_reg_operand" "r")
|
2106 |
|
|
(match_operand 2 "spu_reg_operand" "r")
|
2107 |
|
|
(match_operand 3 "spu_reg_operand" "r")] UNSPEC_SELB))]
|
2108 |
|
|
"GET_MODE(operands[0]) == GET_MODE(operands[1])
|
2109 |
|
|
&& GET_MODE(operands[1]) == GET_MODE(operands[2])"
|
2110 |
|
|
"selb\t%0,%1,%2,%3")
|
2111 |
|
|
|
2112 |
|
|
|
2113 |
|
|
;; Misc. byte/bit operations
|
2114 |
|
|
;; clz/ctz/ffs/popcount/parity
|
2115 |
|
|
;; cntb/sumb
|
2116 |
|
|
|
2117 |
|
|
(define_insn "clz2"
|
2118 |
|
|
[(set (match_operand:VSI 0 "spu_reg_operand" "=r")
|
2119 |
|
|
(clz:VSI (match_operand:VSI 1 "spu_reg_operand" "r")))]
|
2120 |
|
|
""
|
2121 |
|
|
"clz\t%0,%1")
|
2122 |
|
|
|
2123 |
|
|
(define_expand "ctz2"
|
2124 |
|
|
[(set (match_dup 2)
|
2125 |
|
|
(neg:VSI (match_operand:VSI 1 "spu_reg_operand" "")))
|
2126 |
|
|
(set (match_dup 3) (and:VSI (match_dup 1)
|
2127 |
|
|
(match_dup 2)))
|
2128 |
|
|
(set (match_dup 4) (clz:VSI (match_dup 3)))
|
2129 |
|
|
(set (match_operand:VSI 0 "spu_reg_operand" "")
|
2130 |
|
|
(minus:VSI (match_dup 5) (match_dup 4)))]
|
2131 |
|
|
""
|
2132 |
|
|
{
|
2133 |
|
|
operands[2] = gen_reg_rtx (mode);
|
2134 |
|
|
operands[3] = gen_reg_rtx (mode);
|
2135 |
|
|
operands[4] = gen_reg_rtx (mode);
|
2136 |
|
|
operands[5] = spu_const(mode, 31);
|
2137 |
|
|
})
|
2138 |
|
|
|
2139 |
|
|
(define_expand "ffs2"
|
2140 |
|
|
[(set (match_dup 2)
|
2141 |
|
|
(neg:VSI (match_operand:VSI 1 "spu_reg_operand" "")))
|
2142 |
|
|
(set (match_dup 3) (and:VSI (match_dup 1)
|
2143 |
|
|
(match_dup 2)))
|
2144 |
|
|
(set (match_dup 4) (clz:VSI (match_dup 3)))
|
2145 |
|
|
(set (match_operand:VSI 0 "spu_reg_operand" "")
|
2146 |
|
|
(minus:VSI (match_dup 5) (match_dup 4)))]
|
2147 |
|
|
""
|
2148 |
|
|
{
|
2149 |
|
|
operands[2] = gen_reg_rtx (mode);
|
2150 |
|
|
operands[3] = gen_reg_rtx (mode);
|
2151 |
|
|
operands[4] = gen_reg_rtx (mode);
|
2152 |
|
|
operands[5] = spu_const(mode, 32);
|
2153 |
|
|
})
|
2154 |
|
|
|
2155 |
|
|
(define_expand "popcountsi2"
|
2156 |
|
|
[(set (match_dup 2)
|
2157 |
|
|
(unspec:SI [(match_operand:SI 1 "spu_reg_operand" "")]
|
2158 |
|
|
UNSPEC_CNTB))
|
2159 |
|
|
(set (match_dup 3)
|
2160 |
|
|
(unspec:HI [(match_dup 2)] UNSPEC_SUMB))
|
2161 |
|
|
(set (match_operand:SI 0 "spu_reg_operand" "")
|
2162 |
|
|
(sign_extend:SI (match_dup 3)))]
|
2163 |
|
|
""
|
2164 |
|
|
{
|
2165 |
|
|
operands[2] = gen_reg_rtx (SImode);
|
2166 |
|
|
operands[3] = gen_reg_rtx (HImode);
|
2167 |
|
|
})
|
2168 |
|
|
|
2169 |
|
|
(define_expand "paritysi2"
|
2170 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "")
|
2171 |
|
|
(parity:SI (match_operand:SI 1 "spu_reg_operand" "")))]
|
2172 |
|
|
""
|
2173 |
|
|
{
|
2174 |
|
|
operands[2] = gen_reg_rtx (SImode);
|
2175 |
|
|
emit_insn (gen_popcountsi2(operands[2], operands[1]));
|
2176 |
|
|
emit_insn (gen_andsi3(operands[0], operands[2], GEN_INT (1)));
|
2177 |
|
|
DONE;
|
2178 |
|
|
})
|
2179 |
|
|
|
2180 |
|
|
(define_insn "cntb_si"
|
2181 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
2182 |
|
|
(unspec:SI [(match_operand:SI 1 "spu_reg_operand" "r")]
|
2183 |
|
|
UNSPEC_CNTB))]
|
2184 |
|
|
""
|
2185 |
|
|
"cntb\t%0,%1"
|
2186 |
|
|
[(set_attr "type" "fxb")])
|
2187 |
|
|
|
2188 |
|
|
(define_insn "cntb_v16qi"
|
2189 |
|
|
[(set (match_operand:V16QI 0 "spu_reg_operand" "=r")
|
2190 |
|
|
(unspec:V16QI [(match_operand:V16QI 1 "spu_reg_operand" "r")]
|
2191 |
|
|
UNSPEC_CNTB))]
|
2192 |
|
|
""
|
2193 |
|
|
"cntb\t%0,%1"
|
2194 |
|
|
[(set_attr "type" "fxb")])
|
2195 |
|
|
|
2196 |
|
|
(define_insn "sumb_si"
|
2197 |
|
|
[(set (match_operand:HI 0 "spu_reg_operand" "=r")
|
2198 |
|
|
(unspec:HI [(match_operand:SI 1 "spu_reg_operand" "r")] UNSPEC_SUMB))]
|
2199 |
|
|
""
|
2200 |
|
|
"sumb\t%0,%1,%1"
|
2201 |
|
|
[(set_attr "type" "fxb")])
|
2202 |
|
|
|
2203 |
|
|
|
2204 |
|
|
;; ashl, vashl
|
2205 |
|
|
|
2206 |
|
|
(define_insn "ashl3"
|
2207 |
|
|
[(set (match_operand:VHSI 0 "spu_reg_operand" "=r,r")
|
2208 |
|
|
(ashift:VHSI (match_operand:VHSI 1 "spu_reg_operand" "r,r")
|
2209 |
|
|
(match_operand:VHSI 2 "spu_nonmem_operand" "r,W")))]
|
2210 |
|
|
""
|
2211 |
|
|
"@
|
2212 |
|
|
shl\t%0,%1,%2
|
2213 |
|
|
shli\t%0,%1,%2"
|
2214 |
|
|
[(set_attr "type" "fx3")])
|
2215 |
|
|
|
2216 |
|
|
(define_insn_and_split "ashldi3"
|
2217 |
|
|
[(set (match_operand:DI 0 "spu_reg_operand" "=r,r")
|
2218 |
|
|
(ashift:DI (match_operand:DI 1 "spu_reg_operand" "r,r")
|
2219 |
|
|
(match_operand:SI 2 "spu_nonmem_operand" "r,I")))
|
2220 |
|
|
(clobber (match_scratch:SI 3 "=&r,X"))]
|
2221 |
|
|
""
|
2222 |
|
|
"#"
|
2223 |
|
|
"reload_completed"
|
2224 |
|
|
[(set (match_dup:DI 0)
|
2225 |
|
|
(ashift:DI (match_dup:DI 1)
|
2226 |
|
|
(match_dup:SI 2)))]
|
2227 |
|
|
{
|
2228 |
|
|
rtx op0 = gen_rtx_REG (TImode, REGNO (operands[0]));
|
2229 |
|
|
rtx op1 = gen_rtx_REG (TImode, REGNO (operands[1]));
|
2230 |
|
|
rtx op2 = operands[2];
|
2231 |
|
|
rtx op3 = operands[3];
|
2232 |
|
|
|
2233 |
|
|
if (GET_CODE (operands[2]) == REG)
|
2234 |
|
|
{
|
2235 |
|
|
emit_insn (gen_addsi3 (op3, op2, GEN_INT (64)));
|
2236 |
|
|
emit_insn (gen_rotlti3 (op0, op1, GEN_INT (64)));
|
2237 |
|
|
emit_insn (gen_shlqbybi_ti (op0, op0, op3));
|
2238 |
|
|
emit_insn (gen_shlqbi_ti (op0, op0, op3));
|
2239 |
|
|
}
|
2240 |
|
|
else
|
2241 |
|
|
{
|
2242 |
|
|
HOST_WIDE_INT val = INTVAL (operands[2]);
|
2243 |
|
|
emit_insn (gen_rotlti3 (op0, op1, GEN_INT (64)));
|
2244 |
|
|
emit_insn (gen_shlqby_ti (op0, op0, GEN_INT (val / 8 + 8)));
|
2245 |
|
|
if (val % 8)
|
2246 |
|
|
emit_insn (gen_shlqbi_ti (op0, op0, GEN_INT (val % 8)));
|
2247 |
|
|
}
|
2248 |
|
|
DONE;
|
2249 |
|
|
})
|
2250 |
|
|
|
2251 |
|
|
(define_expand "ashlti3"
|
2252 |
|
|
[(parallel [(set (match_operand:TI 0 "spu_reg_operand" "")
|
2253 |
|
|
(ashift:TI (match_operand:TI 1 "spu_reg_operand" "")
|
2254 |
|
|
(match_operand:SI 2 "spu_nonmem_operand" "")))
|
2255 |
|
|
(clobber (match_dup:TI 3))])]
|
2256 |
|
|
""
|
2257 |
|
|
"if (GET_CODE (operands[2]) == CONST_INT)
|
2258 |
|
|
{
|
2259 |
|
|
emit_insn (gen_ashlti3_imm(operands[0], operands[1], operands[2]));
|
2260 |
|
|
DONE;
|
2261 |
|
|
}
|
2262 |
|
|
operands[3] = gen_reg_rtx (TImode);")
|
2263 |
|
|
|
2264 |
|
|
(define_insn_and_split "ashlti3_imm"
|
2265 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r")
|
2266 |
|
|
(ashift:TI (match_operand:TI 1 "spu_reg_operand" "r,r")
|
2267 |
|
|
(match_operand:SI 2 "immediate_operand" "O,P")))]
|
2268 |
|
|
""
|
2269 |
|
|
"@
|
2270 |
|
|
shlqbyi\t%0,%1,%h2
|
2271 |
|
|
shlqbii\t%0,%1,%e2"
|
2272 |
|
|
"!satisfies_constraint_O (operands[2]) && !satisfies_constraint_P (operands[2])"
|
2273 |
|
|
[(set (match_dup:TI 0)
|
2274 |
|
|
(ashift:TI (match_dup:TI 1)
|
2275 |
|
|
(match_dup:SI 3)))
|
2276 |
|
|
(set (match_dup:TI 0)
|
2277 |
|
|
(ashift:TI (match_dup:TI 0)
|
2278 |
|
|
(match_dup:SI 4)))]
|
2279 |
|
|
{
|
2280 |
|
|
HOST_WIDE_INT val = INTVAL(operands[2]);
|
2281 |
|
|
operands[3] = GEN_INT (val&7);
|
2282 |
|
|
operands[4] = GEN_INT (val&-8);
|
2283 |
|
|
}
|
2284 |
|
|
[(set_attr "type" "shuf,shuf")])
|
2285 |
|
|
|
2286 |
|
|
(define_insn_and_split "ashlti3_reg"
|
2287 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r")
|
2288 |
|
|
(ashift:TI (match_operand:TI 1 "spu_reg_operand" "r")
|
2289 |
|
|
(match_operand:SI 2 "spu_reg_operand" "r")))
|
2290 |
|
|
(clobber (match_operand:TI 3 "spu_reg_operand" "=&r"))]
|
2291 |
|
|
""
|
2292 |
|
|
"#"
|
2293 |
|
|
""
|
2294 |
|
|
[(set (match_dup:TI 3)
|
2295 |
|
|
(ashift:TI (match_dup:TI 1)
|
2296 |
|
|
(and:SI (match_dup:SI 2)
|
2297 |
|
|
(const_int 7))))
|
2298 |
|
|
(set (match_dup:TI 0)
|
2299 |
|
|
(ashift:TI (match_dup:TI 3)
|
2300 |
|
|
(and:SI (match_dup:SI 2)
|
2301 |
|
|
(const_int -8))))]
|
2302 |
|
|
"")
|
2303 |
|
|
|
2304 |
|
|
(define_insn "shlqbybi_ti"
|
2305 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r")
|
2306 |
|
|
(ashift:TI (match_operand:TI 1 "spu_reg_operand" "r,r")
|
2307 |
|
|
(and:SI (match_operand:SI 2 "spu_nonmem_operand" "r,I")
|
2308 |
|
|
(const_int -8))))]
|
2309 |
|
|
""
|
2310 |
|
|
"@
|
2311 |
|
|
shlqbybi\t%0,%1,%2
|
2312 |
|
|
shlqbyi\t%0,%1,%h2"
|
2313 |
|
|
[(set_attr "type" "shuf,shuf")])
|
2314 |
|
|
|
2315 |
|
|
(define_insn "shlqbi_ti"
|
2316 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r")
|
2317 |
|
|
(ashift:TI (match_operand:TI 1 "spu_reg_operand" "r,r")
|
2318 |
|
|
(and:SI (match_operand:SI 2 "spu_nonmem_operand" "r,I")
|
2319 |
|
|
(const_int 7))))]
|
2320 |
|
|
""
|
2321 |
|
|
"@
|
2322 |
|
|
shlqbi\t%0,%1,%2
|
2323 |
|
|
shlqbii\t%0,%1,%e2"
|
2324 |
|
|
[(set_attr "type" "shuf,shuf")])
|
2325 |
|
|
|
2326 |
|
|
(define_insn "shlqby_ti"
|
2327 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r")
|
2328 |
|
|
(ashift:TI (match_operand:TI 1 "spu_reg_operand" "r,r")
|
2329 |
|
|
(mult:SI (match_operand:SI 2 "spu_nonmem_operand" "r,I")
|
2330 |
|
|
(const_int 8))))]
|
2331 |
|
|
""
|
2332 |
|
|
"@
|
2333 |
|
|
shlqby\t%0,%1,%2
|
2334 |
|
|
shlqbyi\t%0,%1,%f2"
|
2335 |
|
|
[(set_attr "type" "shuf,shuf")])
|
2336 |
|
|
|
2337 |
|
|
|
2338 |
|
|
;; lshr, vlshr
|
2339 |
|
|
|
2340 |
|
|
(define_insn_and_split "lshr3"
|
2341 |
|
|
[(set (match_operand:VHSI 0 "spu_reg_operand" "=r,r")
|
2342 |
|
|
(lshiftrt:VHSI (match_operand:VHSI 1 "spu_reg_operand" "r,r")
|
2343 |
|
|
(match_operand:VHSI 2 "spu_nonmem_operand" "r,W")))
|
2344 |
|
|
(clobber (match_scratch:VHSI 3 "=&r,X"))]
|
2345 |
|
|
""
|
2346 |
|
|
"@
|
2347 |
|
|
#
|
2348 |
|
|
rotmi\t%0,%1,-%2"
|
2349 |
|
|
"reload_completed && GET_CODE (operands[2]) == REG"
|
2350 |
|
|
[(set (match_dup:VHSI 3)
|
2351 |
|
|
(neg:VHSI (match_dup:VHSI 2)))
|
2352 |
|
|
(set (match_dup:VHSI 0)
|
2353 |
|
|
(lshiftrt:VHSI (match_dup:VHSI 1)
|
2354 |
|
|
(neg:VHSI (match_dup:VHSI 3))))]
|
2355 |
|
|
""
|
2356 |
|
|
[(set_attr "type" "*,fx3")])
|
2357 |
|
|
|
2358 |
|
|
(define_insn "lshr3_imm"
|
2359 |
|
|
[(set (match_operand:VHSI 0 "spu_reg_operand" "=r")
|
2360 |
|
|
(lshiftrt:VHSI (match_operand:VHSI 1 "spu_reg_operand" "r")
|
2361 |
|
|
(match_operand:VHSI 2 "immediate_operand" "W")))]
|
2362 |
|
|
""
|
2363 |
|
|
"rotmi\t%0,%1,-%2"
|
2364 |
|
|
[(set_attr "type" "fx3")])
|
2365 |
|
|
|
2366 |
|
|
(define_insn "rotm_"
|
2367 |
|
|
[(set (match_operand:VHSI 0 "spu_reg_operand" "=r,r")
|
2368 |
|
|
(lshiftrt:VHSI (match_operand:VHSI 1 "spu_reg_operand" "r,r")
|
2369 |
|
|
(neg:VHSI (match_operand:VHSI 2 "spu_nonmem_operand" "r,W"))))]
|
2370 |
|
|
""
|
2371 |
|
|
"@
|
2372 |
|
|
rotm\t%0,%1,%2
|
2373 |
|
|
rotmi\t%0,%1,-%2"
|
2374 |
|
|
[(set_attr "type" "fx3")])
|
2375 |
|
|
|
2376 |
|
|
(define_insn_and_split "lshr3"
|
2377 |
|
|
[(set (match_operand:DTI 0 "spu_reg_operand" "=r,r,r")
|
2378 |
|
|
(lshiftrt:DTI (match_operand:DTI 1 "spu_reg_operand" "r,r,r")
|
2379 |
|
|
(match_operand:SI 2 "spu_nonmem_operand" "r,O,P")))]
|
2380 |
|
|
""
|
2381 |
|
|
"@
|
2382 |
|
|
#
|
2383 |
|
|
rotqmbyi\t%0,%1,-%h2
|
2384 |
|
|
rotqmbii\t%0,%1,-%e2"
|
2385 |
|
|
"REG_P (operands[2]) || (!satisfies_constraint_O (operands[2]) && !satisfies_constraint_P (operands[2]))"
|
2386 |
|
|
[(set (match_dup:DTI 3)
|
2387 |
|
|
(lshiftrt:DTI (match_dup:DTI 1)
|
2388 |
|
|
(match_dup:SI 4)))
|
2389 |
|
|
(set (match_dup:DTI 0)
|
2390 |
|
|
(lshiftrt:DTI (match_dup:DTI 3)
|
2391 |
|
|
(match_dup:SI 5)))]
|
2392 |
|
|
{
|
2393 |
|
|
operands[3] = gen_reg_rtx (mode);
|
2394 |
|
|
if (GET_CODE (operands[2]) == CONST_INT)
|
2395 |
|
|
{
|
2396 |
|
|
HOST_WIDE_INT val = INTVAL(operands[2]);
|
2397 |
|
|
operands[4] = GEN_INT (val & 7);
|
2398 |
|
|
operands[5] = GEN_INT (val & -8);
|
2399 |
|
|
}
|
2400 |
|
|
else
|
2401 |
|
|
{
|
2402 |
|
|
rtx t0 = gen_reg_rtx (SImode);
|
2403 |
|
|
rtx t1 = gen_reg_rtx (SImode);
|
2404 |
|
|
emit_insn (gen_subsi3(t0, GEN_INT(0), operands[2]));
|
2405 |
|
|
emit_insn (gen_subsi3(t1, GEN_INT(7), operands[2]));
|
2406 |
|
|
operands[4] = gen_rtx_AND (SImode, gen_rtx_NEG (SImode, t0), GEN_INT (7));
|
2407 |
|
|
operands[5] = gen_rtx_AND (SImode, gen_rtx_NEG (SImode, gen_rtx_AND (SImode, t1, GEN_INT (-8))), GEN_INT (-8));
|
2408 |
|
|
}
|
2409 |
|
|
}
|
2410 |
|
|
[(set_attr "type" "*,shuf,shuf")])
|
2411 |
|
|
|
2412 |
|
|
(define_expand "shrqbybi_"
|
2413 |
|
|
[(set (match_operand:DTI 0 "spu_reg_operand" "=r,r")
|
2414 |
|
|
(lshiftrt:DTI (match_operand:DTI 1 "spu_reg_operand" "r,r")
|
2415 |
|
|
(and:SI (neg:SI (and:SI (match_operand:SI 2 "spu_nonmem_operand" "r,I")
|
2416 |
|
|
(const_int -8)))
|
2417 |
|
|
(const_int -8))))]
|
2418 |
|
|
""
|
2419 |
|
|
{
|
2420 |
|
|
if (GET_CODE (operands[2]) == CONST_INT)
|
2421 |
|
|
operands[2] = GEN_INT (7 - INTVAL (operands[2]));
|
2422 |
|
|
else
|
2423 |
|
|
{
|
2424 |
|
|
rtx t0 = gen_reg_rtx (SImode);
|
2425 |
|
|
emit_insn (gen_subsi3 (t0, GEN_INT (7), operands[2]));
|
2426 |
|
|
operands[2] = t0;
|
2427 |
|
|
}
|
2428 |
|
|
})
|
2429 |
|
|
|
2430 |
|
|
(define_insn "rotqmbybi_"
|
2431 |
|
|
[(set (match_operand:DTI 0 "spu_reg_operand" "=r,r")
|
2432 |
|
|
(lshiftrt:DTI (match_operand:DTI 1 "spu_reg_operand" "r,r")
|
2433 |
|
|
(and:SI (neg:SI (and:SI (match_operand:SI 2 "spu_nonmem_operand" "r,I")
|
2434 |
|
|
(const_int -8)))
|
2435 |
|
|
(const_int -8))))]
|
2436 |
|
|
""
|
2437 |
|
|
"@
|
2438 |
|
|
rotqmbybi\t%0,%1,%2
|
2439 |
|
|
rotqmbyi\t%0,%1,-%H2"
|
2440 |
|
|
[(set_attr "type" "shuf")])
|
2441 |
|
|
|
2442 |
|
|
(define_insn_and_split "shrqbi_"
|
2443 |
|
|
[(set (match_operand:DTI 0 "spu_reg_operand" "=r,r")
|
2444 |
|
|
(lshiftrt:DTI (match_operand:DTI 1 "spu_reg_operand" "r,r")
|
2445 |
|
|
(and:SI (match_operand:SI 2 "spu_nonmem_operand" "r,I")
|
2446 |
|
|
(const_int 7))))
|
2447 |
|
|
(clobber (match_scratch:SI 3 "=&r,X"))]
|
2448 |
|
|
""
|
2449 |
|
|
"#"
|
2450 |
|
|
"reload_completed"
|
2451 |
|
|
[(set (match_dup:DTI 0)
|
2452 |
|
|
(lshiftrt:DTI (match_dup:DTI 1)
|
2453 |
|
|
(and:SI (neg:SI (match_dup:SI 3)) (const_int 7))))]
|
2454 |
|
|
{
|
2455 |
|
|
if (GET_CODE (operands[2]) == CONST_INT)
|
2456 |
|
|
operands[3] = GEN_INT (-INTVAL (operands[2]));
|
2457 |
|
|
else
|
2458 |
|
|
emit_insn (gen_subsi3 (operands[3], GEN_INT (0), operands[2]));
|
2459 |
|
|
}
|
2460 |
|
|
[(set_attr "type" "shuf")])
|
2461 |
|
|
|
2462 |
|
|
(define_insn "rotqmbi_"
|
2463 |
|
|
[(set (match_operand:DTI 0 "spu_reg_operand" "=r,r")
|
2464 |
|
|
(lshiftrt:DTI (match_operand:DTI 1 "spu_reg_operand" "r,r")
|
2465 |
|
|
(and:SI (neg:SI (match_operand:SI 2 "spu_nonmem_operand" "r,I"))
|
2466 |
|
|
(const_int 7))))]
|
2467 |
|
|
""
|
2468 |
|
|
"@
|
2469 |
|
|
rotqmbi\t%0,%1,%2
|
2470 |
|
|
rotqmbii\t%0,%1,-%E2"
|
2471 |
|
|
[(set_attr "type" "shuf")])
|
2472 |
|
|
|
2473 |
|
|
(define_expand "shrqby_"
|
2474 |
|
|
[(set (match_operand:DTI 0 "spu_reg_operand" "=r,r")
|
2475 |
|
|
(lshiftrt:DTI (match_operand:DTI 1 "spu_reg_operand" "r,r")
|
2476 |
|
|
(mult:SI (neg:SI (match_operand:SI 2 "spu_nonmem_operand" "r,I"))
|
2477 |
|
|
(const_int 8))))]
|
2478 |
|
|
""
|
2479 |
|
|
{
|
2480 |
|
|
if (GET_CODE (operands[2]) == CONST_INT)
|
2481 |
|
|
operands[2] = GEN_INT (-INTVAL (operands[2]));
|
2482 |
|
|
else
|
2483 |
|
|
{
|
2484 |
|
|
rtx t0 = gen_reg_rtx (SImode);
|
2485 |
|
|
emit_insn (gen_subsi3 (t0, GEN_INT (0), operands[2]));
|
2486 |
|
|
operands[2] = t0;
|
2487 |
|
|
}
|
2488 |
|
|
})
|
2489 |
|
|
|
2490 |
|
|
(define_insn "rotqmby_"
|
2491 |
|
|
[(set (match_operand:DTI 0 "spu_reg_operand" "=r,r")
|
2492 |
|
|
(lshiftrt:DTI (match_operand:DTI 1 "spu_reg_operand" "r,r")
|
2493 |
|
|
(mult:SI (neg:SI (match_operand:SI 2 "spu_nonmem_operand" "r,I"))
|
2494 |
|
|
(const_int 8))))]
|
2495 |
|
|
""
|
2496 |
|
|
"@
|
2497 |
|
|
rotqmby\t%0,%1,%2
|
2498 |
|
|
rotqmbyi\t%0,%1,-%F2"
|
2499 |
|
|
[(set_attr "type" "shuf")])
|
2500 |
|
|
|
2501 |
|
|
|
2502 |
|
|
;; ashr, vashr
|
2503 |
|
|
|
2504 |
|
|
(define_insn_and_split "ashr3"
|
2505 |
|
|
[(set (match_operand:VHSI 0 "spu_reg_operand" "=r,r")
|
2506 |
|
|
(ashiftrt:VHSI (match_operand:VHSI 1 "spu_reg_operand" "r,r")
|
2507 |
|
|
(match_operand:VHSI 2 "spu_nonmem_operand" "r,W")))
|
2508 |
|
|
(clobber (match_scratch:VHSI 3 "=&r,X"))]
|
2509 |
|
|
""
|
2510 |
|
|
"@
|
2511 |
|
|
#
|
2512 |
|
|
rotmai\t%0,%1,-%2"
|
2513 |
|
|
"reload_completed && GET_CODE (operands[2]) == REG"
|
2514 |
|
|
[(set (match_dup:VHSI 3)
|
2515 |
|
|
(neg:VHSI (match_dup:VHSI 2)))
|
2516 |
|
|
(set (match_dup:VHSI 0)
|
2517 |
|
|
(ashiftrt:VHSI (match_dup:VHSI 1)
|
2518 |
|
|
(neg:VHSI (match_dup:VHSI 3))))]
|
2519 |
|
|
""
|
2520 |
|
|
[(set_attr "type" "*,fx3")])
|
2521 |
|
|
|
2522 |
|
|
(define_insn "ashr3_imm"
|
2523 |
|
|
[(set (match_operand:VHSI 0 "spu_reg_operand" "=r")
|
2524 |
|
|
(ashiftrt:VHSI (match_operand:VHSI 1 "spu_reg_operand" "r")
|
2525 |
|
|
(match_operand:VHSI 2 "immediate_operand" "W")))]
|
2526 |
|
|
""
|
2527 |
|
|
"rotmai\t%0,%1,-%2"
|
2528 |
|
|
[(set_attr "type" "fx3")])
|
2529 |
|
|
|
2530 |
|
|
|
2531 |
|
|
(define_insn "rotma_"
|
2532 |
|
|
[(set (match_operand:VHSI 0 "spu_reg_operand" "=r,r")
|
2533 |
|
|
(ashiftrt:VHSI (match_operand:VHSI 1 "spu_reg_operand" "r,r")
|
2534 |
|
|
(neg:VHSI (match_operand:VHSI 2 "spu_nonmem_operand" "r,W"))))]
|
2535 |
|
|
""
|
2536 |
|
|
"@
|
2537 |
|
|
rotma\t%0,%1,%2
|
2538 |
|
|
rotmai\t%0,%1,-%2"
|
2539 |
|
|
[(set_attr "type" "fx3")])
|
2540 |
|
|
|
2541 |
|
|
(define_insn_and_split "ashrdi3"
|
2542 |
|
|
[(set (match_operand:DI 0 "spu_reg_operand" "=r,r")
|
2543 |
|
|
(ashiftrt:DI (match_operand:DI 1 "spu_reg_operand" "r,r")
|
2544 |
|
|
(match_operand:SI 2 "spu_nonmem_operand" "r,I")))
|
2545 |
|
|
(clobber (match_scratch:TI 3 "=&r,&r"))
|
2546 |
|
|
(clobber (match_scratch:TI 4 "=&r,&r"))
|
2547 |
|
|
(clobber (match_scratch:SI 5 "=&r,&r"))]
|
2548 |
|
|
""
|
2549 |
|
|
"#"
|
2550 |
|
|
"reload_completed"
|
2551 |
|
|
[(set (match_dup:DI 0)
|
2552 |
|
|
(ashiftrt:DI (match_dup:DI 1)
|
2553 |
|
|
(match_dup:SI 2)))]
|
2554 |
|
|
{
|
2555 |
|
|
rtx op0 = gen_rtx_REG (TImode, REGNO (operands[0]));
|
2556 |
|
|
rtx op0v = gen_rtx_REG (V4SImode, REGNO (op0));
|
2557 |
|
|
rtx op1 = gen_rtx_REG (TImode, REGNO (operands[1]));
|
2558 |
|
|
rtx op1s = gen_rtx_REG (SImode, REGNO (op1));
|
2559 |
|
|
rtx op2 = operands[2];
|
2560 |
|
|
rtx op3 = operands[3];
|
2561 |
|
|
rtx op4 = operands[4];
|
2562 |
|
|
rtx op5 = operands[5];
|
2563 |
|
|
|
2564 |
|
|
if (GET_CODE (op2) == CONST_INT && INTVAL (op2) >= 63)
|
2565 |
|
|
{
|
2566 |
|
|
rtx op0s = gen_rtx_REG (SImode, REGNO (op0));
|
2567 |
|
|
emit_insn (gen_ashrsi3 (op0s, op1s, GEN_INT (32)));
|
2568 |
|
|
emit_insn (gen_spu_fsm (op0v, op0s));
|
2569 |
|
|
}
|
2570 |
|
|
else if (GET_CODE (op2) == CONST_INT && INTVAL (op2) >= 32)
|
2571 |
|
|
{
|
2572 |
|
|
rtx op0d = gen_rtx_REG (V2DImode, REGNO (op0));
|
2573 |
|
|
HOST_WIDE_INT val = INTVAL (op2);
|
2574 |
|
|
emit_insn (gen_lshrti3 (op0, op1, GEN_INT (32)));
|
2575 |
|
|
emit_insn (gen_spu_xswd (op0d, op0v));
|
2576 |
|
|
if (val > 32)
|
2577 |
|
|
emit_insn (gen_vashrv4si3 (op0v, op0v, spu_const (V4SImode, val - 32)));
|
2578 |
|
|
}
|
2579 |
|
|
else
|
2580 |
|
|
{
|
2581 |
|
|
rtx op3v = gen_rtx_REG (V4SImode, REGNO (op3));
|
2582 |
|
|
unsigned char arr[16] = {
|
2583 |
|
|
0xff, 0xff, 0xff, 0xff,
|
2584 |
|
|
0xff, 0xff, 0xff, 0xff,
|
2585 |
|
|
0x00, 0x00, 0x00, 0x00,
|
2586 |
|
|
0x00, 0x00, 0x00, 0x00
|
2587 |
|
|
};
|
2588 |
|
|
|
2589 |
|
|
emit_insn (gen_ashrsi3 (op5, op1s, GEN_INT (31)));
|
2590 |
|
|
emit_move_insn (op4, array_to_constant (TImode, arr));
|
2591 |
|
|
emit_insn (gen_spu_fsm (op3v, op5));
|
2592 |
|
|
|
2593 |
|
|
if (GET_CODE (operands[2]) == REG)
|
2594 |
|
|
{
|
2595 |
|
|
emit_insn (gen_selb (op4, op3, op1, op4));
|
2596 |
|
|
emit_insn (gen_negsi2 (op5, op2));
|
2597 |
|
|
emit_insn (gen_rotqbybi_ti (op0, op4, op5));
|
2598 |
|
|
emit_insn (gen_rotqbi_ti (op0, op0, op5));
|
2599 |
|
|
}
|
2600 |
|
|
else
|
2601 |
|
|
{
|
2602 |
|
|
HOST_WIDE_INT val = -INTVAL (op2);
|
2603 |
|
|
emit_insn (gen_selb (op0, op3, op1, op4));
|
2604 |
|
|
if ((val - 7) / 8)
|
2605 |
|
|
emit_insn (gen_rotqby_ti (op0, op0, GEN_INT ((val - 7) / 8)));
|
2606 |
|
|
if (val % 8)
|
2607 |
|
|
emit_insn (gen_rotqbi_ti (op0, op0, GEN_INT (val % 8)));
|
2608 |
|
|
}
|
2609 |
|
|
}
|
2610 |
|
|
DONE;
|
2611 |
|
|
})
|
2612 |
|
|
|
2613 |
|
|
|
2614 |
|
|
(define_insn_and_split "ashrti3"
|
2615 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r")
|
2616 |
|
|
(ashiftrt:TI (match_operand:TI 1 "spu_reg_operand" "r,r")
|
2617 |
|
|
(match_operand:SI 2 "spu_nonmem_operand" "r,i")))]
|
2618 |
|
|
""
|
2619 |
|
|
"#"
|
2620 |
|
|
""
|
2621 |
|
|
[(set (match_dup:TI 0)
|
2622 |
|
|
(ashiftrt:TI (match_dup:TI 1)
|
2623 |
|
|
(match_dup:SI 2)))]
|
2624 |
|
|
{
|
2625 |
|
|
rtx sign_shift = gen_reg_rtx (SImode);
|
2626 |
|
|
rtx sign_mask = gen_reg_rtx (TImode);
|
2627 |
|
|
rtx sign_mask_v4si = gen_rtx_SUBREG (V4SImode, sign_mask, 0);
|
2628 |
|
|
rtx op1_v4si = spu_gen_subreg (V4SImode, operands[1]);
|
2629 |
|
|
rtx t = gen_reg_rtx (TImode);
|
2630 |
|
|
emit_insn (gen_subsi3 (sign_shift, GEN_INT (128), force_reg (SImode, operands[2])));
|
2631 |
|
|
emit_insn (gen_vashrv4si3 (sign_mask_v4si, op1_v4si, spu_const (V4SImode, 31)));
|
2632 |
|
|
emit_insn (gen_fsm_ti (sign_mask, sign_mask));
|
2633 |
|
|
emit_insn (gen_ashlti3 (sign_mask, sign_mask, sign_shift));
|
2634 |
|
|
emit_insn (gen_lshrti3 (t, operands[1], operands[2]));
|
2635 |
|
|
emit_insn (gen_iorti3 (operands[0], t, sign_mask));
|
2636 |
|
|
DONE;
|
2637 |
|
|
})
|
2638 |
|
|
|
2639 |
|
|
;; fsm is used after rotam to replicate the sign across the whole register.
|
2640 |
|
|
(define_insn "fsm_ti"
|
2641 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r")
|
2642 |
|
|
(unspec:TI [(match_operand:TI 1 "spu_reg_operand" "r")] UNSPEC_FSM))]
|
2643 |
|
|
""
|
2644 |
|
|
"fsm\t%0,%1"
|
2645 |
|
|
[(set_attr "type" "shuf")])
|
2646 |
|
|
|
2647 |
|
|
|
2648 |
|
|
;; vrotl, rotl
|
2649 |
|
|
|
2650 |
|
|
(define_insn "rotl3"
|
2651 |
|
|
[(set (match_operand:VHSI 0 "spu_reg_operand" "=r,r")
|
2652 |
|
|
(rotate:VHSI (match_operand:VHSI 1 "spu_reg_operand" "r,r")
|
2653 |
|
|
(match_operand:VHSI 2 "spu_nonmem_operand" "r,W")))]
|
2654 |
|
|
""
|
2655 |
|
|
"@
|
2656 |
|
|
rot\t%0,%1,%2
|
2657 |
|
|
roti\t%0,%1,%2"
|
2658 |
|
|
[(set_attr "type" "fx3")])
|
2659 |
|
|
|
2660 |
|
|
(define_insn "rotlti3"
|
2661 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=&r,r,r,r")
|
2662 |
|
|
(rotate:TI (match_operand:TI 1 "spu_reg_operand" "r,r,r,r")
|
2663 |
|
|
(match_operand:SI 2 "spu_nonmem_operand" "r,O,P,I")))]
|
2664 |
|
|
""
|
2665 |
|
|
"@
|
2666 |
|
|
rotqbybi\t%0,%1,%2\;rotqbi\t%0,%0,%2
|
2667 |
|
|
rotqbyi\t%0,%1,%h2
|
2668 |
|
|
rotqbii\t%0,%1,%e2
|
2669 |
|
|
rotqbyi\t%0,%1,%h2\;rotqbii\t%0,%0,%e2"
|
2670 |
|
|
[(set_attr "length" "8,4,4,8")
|
2671 |
|
|
(set_attr "type" "multi1,shuf,shuf,multi1")])
|
2672 |
|
|
|
2673 |
|
|
(define_insn "rotqbybi_ti"
|
2674 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r")
|
2675 |
|
|
(rotate:TI (match_operand:TI 1 "spu_reg_operand" "r,r")
|
2676 |
|
|
(and:SI (match_operand:SI 2 "spu_nonmem_operand" "r,I")
|
2677 |
|
|
(const_int -8))))]
|
2678 |
|
|
""
|
2679 |
|
|
"@
|
2680 |
|
|
rotqbybi\t%0,%1,%2
|
2681 |
|
|
rotqbyi\t%0,%1,%h2"
|
2682 |
|
|
[(set_attr "type" "shuf,shuf")])
|
2683 |
|
|
|
2684 |
|
|
(define_insn "rotqby_ti"
|
2685 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r")
|
2686 |
|
|
(rotate:TI (match_operand:TI 1 "spu_reg_operand" "r,r")
|
2687 |
|
|
(mult:SI (match_operand:SI 2 "spu_nonmem_operand" "r,I")
|
2688 |
|
|
(const_int 8))))]
|
2689 |
|
|
""
|
2690 |
|
|
"@
|
2691 |
|
|
rotqby\t%0,%1,%2
|
2692 |
|
|
rotqbyi\t%0,%1,%f2"
|
2693 |
|
|
[(set_attr "type" "shuf,shuf")])
|
2694 |
|
|
|
2695 |
|
|
(define_insn "rotqbi_ti"
|
2696 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r,r")
|
2697 |
|
|
(rotate:TI (match_operand:TI 1 "spu_reg_operand" "r,r")
|
2698 |
|
|
(and:SI (match_operand:SI 2 "spu_nonmem_operand" "r,I")
|
2699 |
|
|
(const_int 7))))]
|
2700 |
|
|
""
|
2701 |
|
|
"@
|
2702 |
|
|
rotqbi\t%0,%1,%2
|
2703 |
|
|
rotqbii\t%0,%1,%e2"
|
2704 |
|
|
[(set_attr "type" "shuf,shuf")])
|
2705 |
|
|
|
2706 |
|
|
|
2707 |
|
|
;; struct extract/insert
|
2708 |
|
|
;; We handle mem's because GCC will generate invalid SUBREG's
|
2709 |
|
|
;; and inefficient code.
|
2710 |
|
|
|
2711 |
|
|
(define_expand "extv"
|
2712 |
|
|
[(set (match_operand:TI 0 "register_operand" "")
|
2713 |
|
|
(sign_extract:TI (match_operand 1 "nonimmediate_operand" "")
|
2714 |
|
|
(match_operand:SI 2 "const_int_operand" "")
|
2715 |
|
|
(match_operand:SI 3 "const_int_operand" "")))]
|
2716 |
|
|
""
|
2717 |
|
|
{
|
2718 |
|
|
spu_expand_extv (operands, 0);
|
2719 |
|
|
DONE;
|
2720 |
|
|
})
|
2721 |
|
|
|
2722 |
|
|
(define_expand "extzv"
|
2723 |
|
|
[(set (match_operand:TI 0 "register_operand" "")
|
2724 |
|
|
(zero_extract:TI (match_operand 1 "nonimmediate_operand" "")
|
2725 |
|
|
(match_operand:SI 2 "const_int_operand" "")
|
2726 |
|
|
(match_operand:SI 3 "const_int_operand" "")))]
|
2727 |
|
|
""
|
2728 |
|
|
{
|
2729 |
|
|
spu_expand_extv (operands, 1);
|
2730 |
|
|
DONE;
|
2731 |
|
|
})
|
2732 |
|
|
|
2733 |
|
|
(define_expand "insv"
|
2734 |
|
|
[(set (zero_extract (match_operand 0 "nonimmediate_operand" "")
|
2735 |
|
|
(match_operand:SI 1 "const_int_operand" "")
|
2736 |
|
|
(match_operand:SI 2 "const_int_operand" ""))
|
2737 |
|
|
(match_operand 3 "nonmemory_operand" ""))]
|
2738 |
|
|
""
|
2739 |
|
|
{ spu_expand_insv(operands); DONE; })
|
2740 |
|
|
|
2741 |
|
|
;; Simplify a number of patterns that get generated by extv, extzv,
|
2742 |
|
|
;; insv, and loads.
|
2743 |
|
|
(define_insn_and_split "trunc_shr_ti"
|
2744 |
|
|
[(set (match_operand:QHSI 0 "spu_reg_operand" "=r")
|
2745 |
|
|
(truncate:QHSI (match_operator:TI 2 "shiftrt_operator" [(match_operand:TI 1 "spu_reg_operand" "0")
|
2746 |
|
|
(const_int 96)])))]
|
2747 |
|
|
""
|
2748 |
|
|
"#"
|
2749 |
|
|
"reload_completed"
|
2750 |
|
|
[(const_int 0)]
|
2751 |
|
|
{
|
2752 |
|
|
spu_split_convert (operands);
|
2753 |
|
|
DONE;
|
2754 |
|
|
}
|
2755 |
|
|
[(set_attr "type" "convert")
|
2756 |
|
|
(set_attr "length" "0")])
|
2757 |
|
|
|
2758 |
|
|
(define_insn_and_split "trunc_shr_tidi"
|
2759 |
|
|
[(set (match_operand:DI 0 "spu_reg_operand" "=r")
|
2760 |
|
|
(truncate:DI (match_operator:TI 2 "shiftrt_operator" [(match_operand:TI 1 "spu_reg_operand" "0")
|
2761 |
|
|
(const_int 64)])))]
|
2762 |
|
|
""
|
2763 |
|
|
"#"
|
2764 |
|
|
"reload_completed"
|
2765 |
|
|
[(const_int 0)]
|
2766 |
|
|
{
|
2767 |
|
|
spu_split_convert (operands);
|
2768 |
|
|
DONE;
|
2769 |
|
|
}
|
2770 |
|
|
[(set_attr "type" "convert")
|
2771 |
|
|
(set_attr "length" "0")])
|
2772 |
|
|
|
2773 |
|
|
(define_insn_and_split "shl_ext_ti"
|
2774 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r")
|
2775 |
|
|
(ashift:TI (match_operator:TI 2 "extend_operator" [(match_operand:QHSI 1 "spu_reg_operand" "0")])
|
2776 |
|
|
(const_int 96)))]
|
2777 |
|
|
""
|
2778 |
|
|
"#"
|
2779 |
|
|
"reload_completed"
|
2780 |
|
|
[(const_int 0)]
|
2781 |
|
|
{
|
2782 |
|
|
spu_split_convert (operands);
|
2783 |
|
|
DONE;
|
2784 |
|
|
}
|
2785 |
|
|
[(set_attr "type" "convert")
|
2786 |
|
|
(set_attr "length" "0")])
|
2787 |
|
|
|
2788 |
|
|
(define_insn_and_split "shl_ext_diti"
|
2789 |
|
|
[(set (match_operand:TI 0 "spu_reg_operand" "=r")
|
2790 |
|
|
(ashift:TI (match_operator:TI 2 "extend_operator" [(match_operand:DI 1 "spu_reg_operand" "0")])
|
2791 |
|
|
(const_int 64)))]
|
2792 |
|
|
""
|
2793 |
|
|
"#"
|
2794 |
|
|
"reload_completed"
|
2795 |
|
|
[(const_int 0)]
|
2796 |
|
|
{
|
2797 |
|
|
spu_split_convert (operands);
|
2798 |
|
|
DONE;
|
2799 |
|
|
}
|
2800 |
|
|
[(set_attr "type" "convert")
|
2801 |
|
|
(set_attr "length" "0")])
|
2802 |
|
|
|
2803 |
|
|
(define_insn "sext_trunc_lshr_tiqisi"
|
2804 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
2805 |
|
|
(sign_extend:SI (truncate:QI (match_operator:TI 2 "shiftrt_operator" [(match_operand:TI 1 "spu_reg_operand" "r")
|
2806 |
|
|
(const_int 120)]))))]
|
2807 |
|
|
""
|
2808 |
|
|
"rotmai\t%0,%1,-24"
|
2809 |
|
|
[(set_attr "type" "fx3")])
|
2810 |
|
|
|
2811 |
|
|
(define_insn "zext_trunc_lshr_tiqisi"
|
2812 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
2813 |
|
|
(zero_extend:SI (truncate:QI (match_operator:TI 2 "shiftrt_operator" [(match_operand:TI 1 "spu_reg_operand" "r")
|
2814 |
|
|
(const_int 120)]))))]
|
2815 |
|
|
""
|
2816 |
|
|
"rotmi\t%0,%1,-24"
|
2817 |
|
|
[(set_attr "type" "fx3")])
|
2818 |
|
|
|
2819 |
|
|
(define_insn "sext_trunc_lshr_tihisi"
|
2820 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
2821 |
|
|
(sign_extend:SI (truncate:HI (match_operator:TI 2 "shiftrt_operator" [(match_operand:TI 1 "spu_reg_operand" "r")
|
2822 |
|
|
(const_int 112)]))))]
|
2823 |
|
|
""
|
2824 |
|
|
"rotmai\t%0,%1,-16"
|
2825 |
|
|
[(set_attr "type" "fx3")])
|
2826 |
|
|
|
2827 |
|
|
(define_insn "zext_trunc_lshr_tihisi"
|
2828 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
2829 |
|
|
(zero_extend:SI (truncate:HI (match_operator:TI 2 "shiftrt_operator" [(match_operand:TI 1 "spu_reg_operand" "r")
|
2830 |
|
|
(const_int 112)]))))]
|
2831 |
|
|
""
|
2832 |
|
|
"rotmi\t%0,%1,-16"
|
2833 |
|
|
[(set_attr "type" "fx3")])
|
2834 |
|
|
|
2835 |
|
|
|
2836 |
|
|
;; String/block move insn.
|
2837 |
|
|
;; Argument 0 is the destination
|
2838 |
|
|
;; Argument 1 is the source
|
2839 |
|
|
;; Argument 2 is the length
|
2840 |
|
|
;; Argument 3 is the alignment
|
2841 |
|
|
|
2842 |
|
|
(define_expand "movstrsi"
|
2843 |
|
|
[(parallel [(set (match_operand:BLK 0 "" "")
|
2844 |
|
|
(match_operand:BLK 1 "" ""))
|
2845 |
|
|
(use (match_operand:SI 2 "" ""))
|
2846 |
|
|
(use (match_operand:SI 3 "" ""))])]
|
2847 |
|
|
""
|
2848 |
|
|
"
|
2849 |
|
|
{
|
2850 |
|
|
if (spu_expand_block_move (operands))
|
2851 |
|
|
DONE;
|
2852 |
|
|
else
|
2853 |
|
|
FAIL;
|
2854 |
|
|
}")
|
2855 |
|
|
|
2856 |
|
|
|
2857 |
|
|
;; jump
|
2858 |
|
|
|
2859 |
|
|
(define_insn "indirect_jump"
|
2860 |
|
|
[(set (pc) (match_operand:SI 0 "spu_reg_operand" "r"))]
|
2861 |
|
|
""
|
2862 |
|
|
"bi\t%0"
|
2863 |
|
|
[(set_attr "type" "br")])
|
2864 |
|
|
|
2865 |
|
|
(define_insn "jump"
|
2866 |
|
|
[(set (pc)
|
2867 |
|
|
(label_ref (match_operand 0 "" "")))]
|
2868 |
|
|
""
|
2869 |
|
|
"br\t%0"
|
2870 |
|
|
[(set_attr "type" "br")])
|
2871 |
|
|
|
2872 |
|
|
|
2873 |
|
|
;; return
|
2874 |
|
|
|
2875 |
|
|
;; This will be used for leaf functions, that don't save any regs and
|
2876 |
|
|
;; don't have locals on stack, maybe... that is for functions that
|
2877 |
|
|
;; don't change $sp and don't need to save $lr.
|
2878 |
|
|
(define_expand "return"
|
2879 |
|
|
[(return)]
|
2880 |
|
|
"direct_return()"
|
2881 |
|
|
"")
|
2882 |
|
|
|
2883 |
|
|
;; used in spu_expand_epilogue to generate return from a function and
|
2884 |
|
|
;; explicitly set use of $lr.
|
2885 |
|
|
|
2886 |
|
|
(define_insn "_return"
|
2887 |
|
|
[(return)]
|
2888 |
|
|
""
|
2889 |
|
|
"bi\t$lr"
|
2890 |
|
|
[(set_attr "type" "br")])
|
2891 |
|
|
|
2892 |
|
|
|
2893 |
|
|
|
2894 |
|
|
;; ceq
|
2895 |
|
|
|
2896 |
|
|
(define_insn "ceq_"
|
2897 |
|
|
[(set (match_operand:VQHSI 0 "spu_reg_operand" "=r,r")
|
2898 |
|
|
(eq:VQHSI (match_operand:VQHSI 1 "spu_reg_operand" "r,r")
|
2899 |
|
|
(match_operand:VQHSI 2 "spu_arith_operand" "r,B")))]
|
2900 |
|
|
""
|
2901 |
|
|
"@
|
2902 |
|
|
ceq\t%0,%1,%2
|
2903 |
|
|
ceqi\t%0,%1,%2")
|
2904 |
|
|
|
2905 |
|
|
(define_insn_and_split "ceq_di"
|
2906 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
2907 |
|
|
(eq:SI (match_operand:DI 1 "spu_reg_operand" "r")
|
2908 |
|
|
(match_operand:DI 2 "spu_reg_operand" "r")))]
|
2909 |
|
|
""
|
2910 |
|
|
"#"
|
2911 |
|
|
"reload_completed"
|
2912 |
|
|
[(set (match_dup:SI 0)
|
2913 |
|
|
(eq:SI (match_dup:DI 1)
|
2914 |
|
|
(match_dup:DI 2)))]
|
2915 |
|
|
{
|
2916 |
|
|
rtx op0 = gen_rtx_REG (V4SImode, REGNO (operands[0]));
|
2917 |
|
|
rtx op1 = gen_rtx_REG (V4SImode, REGNO (operands[1]));
|
2918 |
|
|
rtx op2 = gen_rtx_REG (V4SImode, REGNO (operands[2]));
|
2919 |
|
|
emit_insn (gen_ceq_v4si (op0, op1, op2));
|
2920 |
|
|
emit_insn (gen_spu_gb (op0, op0));
|
2921 |
|
|
emit_insn (gen_cgt_si (operands[0], operands[0], GEN_INT (11)));
|
2922 |
|
|
DONE;
|
2923 |
|
|
})
|
2924 |
|
|
|
2925 |
|
|
|
2926 |
|
|
;; We provide the TI compares for completeness and because some parts of
|
2927 |
|
|
;; gcc/libgcc use them, even though user code might never see it.
|
2928 |
|
|
(define_insn "ceq_ti"
|
2929 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
2930 |
|
|
(eq:SI (match_operand:TI 1 "spu_reg_operand" "r")
|
2931 |
|
|
(match_operand:TI 2 "spu_reg_operand" "r")))]
|
2932 |
|
|
""
|
2933 |
|
|
"ceq\t%0,%1,%2\;gb\t%0,%0\;ceqi\t%0,%0,15"
|
2934 |
|
|
[(set_attr "type" "multi0")
|
2935 |
|
|
(set_attr "length" "12")])
|
2936 |
|
|
|
2937 |
|
|
(define_insn "ceq_"
|
2938 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
2939 |
|
|
(eq: (match_operand:VSF 1 "spu_reg_operand" "r")
|
2940 |
|
|
(match_operand:VSF 2 "spu_reg_operand" "r")))]
|
2941 |
|
|
""
|
2942 |
|
|
"fceq\t%0,%1,%2")
|
2943 |
|
|
|
2944 |
|
|
(define_insn "cmeq_"
|
2945 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
2946 |
|
|
(eq: (abs:VSF (match_operand:VSF 1 "spu_reg_operand" "r"))
|
2947 |
|
|
(abs:VSF (match_operand:VSF 2 "spu_reg_operand" "r"))))]
|
2948 |
|
|
""
|
2949 |
|
|
"fcmeq\t%0,%1,%2")
|
2950 |
|
|
|
2951 |
|
|
;; These implementations will ignore checking of NaN or INF if
|
2952 |
|
|
;; compiled with option -ffinite-math-only.
|
2953 |
|
|
(define_expand "ceq_df"
|
2954 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
2955 |
|
|
(eq:SI (match_operand:DF 1 "spu_reg_operand" "r")
|
2956 |
|
|
(match_operand:DF 2 "const_zero_operand" "i")))]
|
2957 |
|
|
""
|
2958 |
|
|
{
|
2959 |
|
|
if (spu_arch == PROCESSOR_CELL)
|
2960 |
|
|
{
|
2961 |
|
|
rtx ra = gen_reg_rtx (V4SImode);
|
2962 |
|
|
rtx rb = gen_reg_rtx (V4SImode);
|
2963 |
|
|
rtx temp = gen_reg_rtx (TImode);
|
2964 |
|
|
rtx temp_v4si = spu_gen_subreg (V4SImode, temp);
|
2965 |
|
|
rtx temp2 = gen_reg_rtx (V4SImode);
|
2966 |
|
|
rtx biteq = gen_reg_rtx (V4SImode);
|
2967 |
|
|
rtx ahi_inf = gen_reg_rtx (V4SImode);
|
2968 |
|
|
rtx a_nan = gen_reg_rtx (V4SImode);
|
2969 |
|
|
rtx a_abs = gen_reg_rtx (V4SImode);
|
2970 |
|
|
rtx b_abs = gen_reg_rtx (V4SImode);
|
2971 |
|
|
rtx iszero = gen_reg_rtx (V4SImode);
|
2972 |
|
|
rtx sign_mask = gen_reg_rtx (V4SImode);
|
2973 |
|
|
rtx nan_mask = gen_reg_rtx (V4SImode);
|
2974 |
|
|
rtx hihi_promote = gen_reg_rtx (TImode);
|
2975 |
|
|
rtx pat = spu_const_from_ints (V4SImode, 0x7FFFFFFF, 0xFFFFFFFF,
|
2976 |
|
|
0x7FFFFFFF, 0xFFFFFFFF);
|
2977 |
|
|
|
2978 |
|
|
emit_move_insn (sign_mask, pat);
|
2979 |
|
|
pat = spu_const_from_ints (V4SImode, 0x7FF00000, 0x0,
|
2980 |
|
|
0x7FF00000, 0x0);
|
2981 |
|
|
emit_move_insn (nan_mask, pat);
|
2982 |
|
|
pat = spu_const_from_ints (TImode, 0x00010203, 0x10111213,
|
2983 |
|
|
0x08090A0B, 0x18191A1B);
|
2984 |
|
|
emit_move_insn (hihi_promote, pat);
|
2985 |
|
|
|
2986 |
|
|
emit_insn (gen_spu_convert (ra, operands[1]));
|
2987 |
|
|
emit_insn (gen_spu_convert (rb, operands[2]));
|
2988 |
|
|
emit_insn (gen_ceq_v4si (biteq, ra, rb));
|
2989 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, biteq),
|
2990 |
|
|
GEN_INT (4 * 8)));
|
2991 |
|
|
emit_insn (gen_andv4si3 (biteq, biteq, temp_v4si));
|
2992 |
|
|
|
2993 |
|
|
emit_insn (gen_andv4si3 (a_abs, ra, sign_mask));
|
2994 |
|
|
emit_insn (gen_andv4si3 (b_abs, rb, sign_mask));
|
2995 |
|
|
if (!flag_finite_math_only)
|
2996 |
|
|
{
|
2997 |
|
|
emit_insn (gen_clgt_v4si (a_nan, a_abs, nan_mask));
|
2998 |
|
|
emit_insn (gen_ceq_v4si (ahi_inf, a_abs, nan_mask));
|
2999 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, a_nan),
|
3000 |
|
|
GEN_INT (4 * 8)));
|
3001 |
|
|
emit_insn (gen_andv4si3 (temp2, temp_v4si, ahi_inf));
|
3002 |
|
|
emit_insn (gen_iorv4si3 (a_nan, a_nan, temp2));
|
3003 |
|
|
}
|
3004 |
|
|
emit_insn (gen_iorv4si3 (temp2, a_abs, b_abs));
|
3005 |
|
|
emit_insn (gen_ceq_v4si (iszero, temp2, CONST0_RTX (V4SImode)));
|
3006 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, iszero),
|
3007 |
|
|
GEN_INT (4 * 8)));
|
3008 |
|
|
emit_insn (gen_andv4si3 (iszero, iszero, temp_v4si));
|
3009 |
|
|
emit_insn (gen_iorv4si3 (temp2, biteq, iszero));
|
3010 |
|
|
if (!flag_finite_math_only)
|
3011 |
|
|
{
|
3012 |
|
|
emit_insn (gen_andc_v4si (temp2, temp2, a_nan));
|
3013 |
|
|
}
|
3014 |
|
|
emit_insn (gen_shufb (operands[0], temp2, temp2, hihi_promote));
|
3015 |
|
|
DONE;
|
3016 |
|
|
}
|
3017 |
|
|
})
|
3018 |
|
|
|
3019 |
|
|
(define_insn "ceq__celledp"
|
3020 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
3021 |
|
|
(eq: (match_operand:VDF 1 "spu_reg_operand" "r")
|
3022 |
|
|
(match_operand:VDF 2 "spu_reg_operand" "r")))]
|
3023 |
|
|
"spu_arch == PROCESSOR_CELLEDP"
|
3024 |
|
|
"dfceq\t%0,%1,%2"
|
3025 |
|
|
[(set_attr "type" "fpd")])
|
3026 |
|
|
|
3027 |
|
|
(define_insn "cmeq__celledp"
|
3028 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
3029 |
|
|
(eq: (abs:VDF (match_operand:VDF 1 "spu_reg_operand" "r"))
|
3030 |
|
|
(abs:VDF (match_operand:VDF 2 "spu_reg_operand" "r"))))]
|
3031 |
|
|
"spu_arch == PROCESSOR_CELLEDP"
|
3032 |
|
|
"dfcmeq\t%0,%1,%2"
|
3033 |
|
|
[(set_attr "type" "fpd")])
|
3034 |
|
|
|
3035 |
|
|
(define_expand "ceq_v2df"
|
3036 |
|
|
[(set (match_operand:V2DI 0 "spu_reg_operand" "=r")
|
3037 |
|
|
(eq:V2DI (match_operand:V2DF 1 "spu_reg_operand" "r")
|
3038 |
|
|
(match_operand:V2DF 2 "spu_reg_operand" "r")))]
|
3039 |
|
|
""
|
3040 |
|
|
{
|
3041 |
|
|
if (spu_arch == PROCESSOR_CELL)
|
3042 |
|
|
{
|
3043 |
|
|
rtx ra = spu_gen_subreg (V4SImode, operands[1]);
|
3044 |
|
|
rtx rb = spu_gen_subreg (V4SImode, operands[2]);
|
3045 |
|
|
rtx temp = gen_reg_rtx (TImode);
|
3046 |
|
|
rtx temp_v4si = spu_gen_subreg (V4SImode, temp);
|
3047 |
|
|
rtx temp2 = gen_reg_rtx (V4SImode);
|
3048 |
|
|
rtx biteq = gen_reg_rtx (V4SImode);
|
3049 |
|
|
rtx ahi_inf = gen_reg_rtx (V4SImode);
|
3050 |
|
|
rtx a_nan = gen_reg_rtx (V4SImode);
|
3051 |
|
|
rtx a_abs = gen_reg_rtx (V4SImode);
|
3052 |
|
|
rtx b_abs = gen_reg_rtx (V4SImode);
|
3053 |
|
|
rtx iszero = gen_reg_rtx (V4SImode);
|
3054 |
|
|
rtx pat = spu_const_from_ints (V4SImode, 0x7FFFFFFF, 0xFFFFFFFF,
|
3055 |
|
|
0x7FFFFFFF, 0xFFFFFFFF);
|
3056 |
|
|
rtx sign_mask = gen_reg_rtx (V4SImode);
|
3057 |
|
|
rtx nan_mask = gen_reg_rtx (V4SImode);
|
3058 |
|
|
rtx hihi_promote = gen_reg_rtx (TImode);
|
3059 |
|
|
|
3060 |
|
|
emit_move_insn (sign_mask, pat);
|
3061 |
|
|
pat = spu_const_from_ints (V4SImode, 0x7FF00000, 0x0,
|
3062 |
|
|
0x7FF00000, 0x0);
|
3063 |
|
|
emit_move_insn (nan_mask, pat);
|
3064 |
|
|
pat = spu_const_from_ints (TImode, 0x00010203, 0x10111213,
|
3065 |
|
|
0x08090A0B, 0x18191A1B);
|
3066 |
|
|
emit_move_insn (hihi_promote, pat);
|
3067 |
|
|
|
3068 |
|
|
emit_insn (gen_ceq_v4si (biteq, ra, rb));
|
3069 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, biteq),
|
3070 |
|
|
GEN_INT (4 * 8)));
|
3071 |
|
|
emit_insn (gen_andv4si3 (biteq, biteq, temp_v4si));
|
3072 |
|
|
emit_insn (gen_andv4si3 (a_abs, ra, sign_mask));
|
3073 |
|
|
emit_insn (gen_andv4si3 (b_abs, rb, sign_mask));
|
3074 |
|
|
emit_insn (gen_clgt_v4si (a_nan, a_abs, nan_mask));
|
3075 |
|
|
emit_insn (gen_ceq_v4si (ahi_inf, a_abs, nan_mask));
|
3076 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, a_nan),
|
3077 |
|
|
GEN_INT (4 * 8)));
|
3078 |
|
|
emit_insn (gen_andv4si3 (temp2, temp_v4si, ahi_inf));
|
3079 |
|
|
emit_insn (gen_iorv4si3 (a_nan, a_nan, temp2));
|
3080 |
|
|
emit_insn (gen_iorv4si3 (temp2, a_abs, b_abs));
|
3081 |
|
|
emit_insn (gen_ceq_v4si (iszero, temp2, CONST0_RTX (V4SImode)));
|
3082 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, iszero),
|
3083 |
|
|
GEN_INT (4 * 8)));
|
3084 |
|
|
emit_insn (gen_andv4si3 (iszero, iszero, temp_v4si));
|
3085 |
|
|
emit_insn (gen_iorv4si3 (temp2, biteq, iszero));
|
3086 |
|
|
emit_insn (gen_andc_v4si (temp2, temp2, a_nan));
|
3087 |
|
|
emit_insn (gen_shufb (operands[0], temp2, temp2, hihi_promote));
|
3088 |
|
|
DONE;
|
3089 |
|
|
}
|
3090 |
|
|
})
|
3091 |
|
|
|
3092 |
|
|
(define_expand "cmeq_v2df"
|
3093 |
|
|
[(set (match_operand:V2DI 0 "spu_reg_operand" "=r")
|
3094 |
|
|
(eq:V2DI (abs:V2DF (match_operand:V2DF 1 "spu_reg_operand" "r"))
|
3095 |
|
|
(abs:V2DF (match_operand:V2DF 2 "spu_reg_operand" "r"))))]
|
3096 |
|
|
""
|
3097 |
|
|
{
|
3098 |
|
|
if (spu_arch == PROCESSOR_CELL)
|
3099 |
|
|
{
|
3100 |
|
|
rtx ra = spu_gen_subreg (V4SImode, operands[1]);
|
3101 |
|
|
rtx rb = spu_gen_subreg (V4SImode, operands[2]);
|
3102 |
|
|
rtx temp = gen_reg_rtx (TImode);
|
3103 |
|
|
rtx temp_v4si = spu_gen_subreg (V4SImode, temp);
|
3104 |
|
|
rtx temp2 = gen_reg_rtx (V4SImode);
|
3105 |
|
|
rtx biteq = gen_reg_rtx (V4SImode);
|
3106 |
|
|
rtx ahi_inf = gen_reg_rtx (V4SImode);
|
3107 |
|
|
rtx a_nan = gen_reg_rtx (V4SImode);
|
3108 |
|
|
rtx a_abs = gen_reg_rtx (V4SImode);
|
3109 |
|
|
rtx b_abs = gen_reg_rtx (V4SImode);
|
3110 |
|
|
|
3111 |
|
|
rtx pat = spu_const_from_ints (V4SImode, 0x7FFFFFFF, 0xFFFFFFFF,
|
3112 |
|
|
0x7FFFFFFF, 0xFFFFFFFF);
|
3113 |
|
|
rtx sign_mask = gen_reg_rtx (V4SImode);
|
3114 |
|
|
rtx nan_mask = gen_reg_rtx (V4SImode);
|
3115 |
|
|
rtx hihi_promote = gen_reg_rtx (TImode);
|
3116 |
|
|
|
3117 |
|
|
emit_move_insn (sign_mask, pat);
|
3118 |
|
|
|
3119 |
|
|
pat = spu_const_from_ints (V4SImode, 0x7FF00000, 0x0,
|
3120 |
|
|
0x7FF00000, 0x0);
|
3121 |
|
|
emit_move_insn (nan_mask, pat);
|
3122 |
|
|
pat = spu_const_from_ints (TImode, 0x00010203, 0x10111213,
|
3123 |
|
|
0x08090A0B, 0x18191A1B);
|
3124 |
|
|
emit_move_insn (hihi_promote, pat);
|
3125 |
|
|
|
3126 |
|
|
emit_insn (gen_andv4si3 (a_abs, ra, sign_mask));
|
3127 |
|
|
emit_insn (gen_andv4si3 (b_abs, rb, sign_mask));
|
3128 |
|
|
emit_insn (gen_ceq_v4si (biteq, a_abs, b_abs));
|
3129 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, biteq),
|
3130 |
|
|
GEN_INT (4 * 8)));
|
3131 |
|
|
emit_insn (gen_andv4si3 (biteq, biteq, temp_v4si));
|
3132 |
|
|
emit_insn (gen_clgt_v4si (a_nan, a_abs, nan_mask));
|
3133 |
|
|
emit_insn (gen_ceq_v4si (ahi_inf, a_abs, nan_mask));
|
3134 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, a_nan),
|
3135 |
|
|
GEN_INT (4 * 8)));
|
3136 |
|
|
emit_insn (gen_andv4si3 (temp2, temp_v4si, ahi_inf));
|
3137 |
|
|
emit_insn (gen_iorv4si3 (a_nan, a_nan, temp2));
|
3138 |
|
|
emit_insn (gen_andc_v4si (temp2, biteq, a_nan));
|
3139 |
|
|
emit_insn (gen_shufb (operands[0], temp2, temp2, hihi_promote));
|
3140 |
|
|
DONE;
|
3141 |
|
|
}
|
3142 |
|
|
})
|
3143 |
|
|
|
3144 |
|
|
|
3145 |
|
|
;; cgt
|
3146 |
|
|
|
3147 |
|
|
(define_insn "cgt_"
|
3148 |
|
|
[(set (match_operand:VQHSI 0 "spu_reg_operand" "=r,r")
|
3149 |
|
|
(gt:VQHSI (match_operand:VQHSI 1 "spu_reg_operand" "r,r")
|
3150 |
|
|
(match_operand:VQHSI 2 "spu_arith_operand" "r,B")))]
|
3151 |
|
|
""
|
3152 |
|
|
"@
|
3153 |
|
|
cgt\t%0,%1,%2
|
3154 |
|
|
cgti\t%0,%1,%2")
|
3155 |
|
|
|
3156 |
|
|
(define_insn "cgt_di_m1"
|
3157 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
3158 |
|
|
(gt:SI (match_operand:DI 1 "spu_reg_operand" "r")
|
3159 |
|
|
(const_int -1)))]
|
3160 |
|
|
""
|
3161 |
|
|
"cgti\t%0,%1,-1")
|
3162 |
|
|
|
3163 |
|
|
(define_insn_and_split "cgt_di"
|
3164 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
3165 |
|
|
(gt:SI (match_operand:DI 1 "spu_reg_operand" "r")
|
3166 |
|
|
(match_operand:DI 2 "spu_reg_operand" "r")))
|
3167 |
|
|
(clobber (match_scratch:V4SI 3 "=&r"))
|
3168 |
|
|
(clobber (match_scratch:V4SI 4 "=&r"))
|
3169 |
|
|
(clobber (match_scratch:V4SI 5 "=&r"))]
|
3170 |
|
|
""
|
3171 |
|
|
"#"
|
3172 |
|
|
"reload_completed"
|
3173 |
|
|
[(set (match_dup:SI 0)
|
3174 |
|
|
(gt:SI (match_dup:DI 1)
|
3175 |
|
|
(match_dup:DI 2)))]
|
3176 |
|
|
{
|
3177 |
|
|
rtx op0 = gen_rtx_REG (V4SImode, REGNO (operands[0]));
|
3178 |
|
|
rtx op1 = gen_rtx_REG (V4SImode, REGNO (operands[1]));
|
3179 |
|
|
rtx op2 = gen_rtx_REG (V4SImode, REGNO (operands[2]));
|
3180 |
|
|
rtx op3 = operands[3];
|
3181 |
|
|
rtx op4 = operands[4];
|
3182 |
|
|
rtx op5 = operands[5];
|
3183 |
|
|
rtx op3d = gen_rtx_REG (V2DImode, REGNO (operands[3]));
|
3184 |
|
|
emit_insn (gen_clgt_v4si (op3, op1, op2));
|
3185 |
|
|
emit_insn (gen_ceq_v4si (op4, op1, op2));
|
3186 |
|
|
emit_insn (gen_cgt_v4si (op5, op1, op2));
|
3187 |
|
|
emit_insn (gen_spu_xswd (op3d, op3));
|
3188 |
|
|
emit_insn (gen_selb (op0, op5, op3, op4));
|
3189 |
|
|
DONE;
|
3190 |
|
|
})
|
3191 |
|
|
|
3192 |
|
|
(define_insn "cgt_ti"
|
3193 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
3194 |
|
|
(gt:SI (match_operand:TI 1 "spu_reg_operand" "r")
|
3195 |
|
|
(match_operand:TI 2 "spu_reg_operand" "r")))
|
3196 |
|
|
(clobber (match_scratch:V4SI 3 "=&r"))
|
3197 |
|
|
(clobber (match_scratch:V4SI 4 "=&r"))
|
3198 |
|
|
(clobber (match_scratch:V4SI 5 "=&r"))]
|
3199 |
|
|
""
|
3200 |
|
|
"clgt\t%4,%1,%2\;\
|
3201 |
|
|
ceq\t%3,%1,%2\;\
|
3202 |
|
|
cgt\t%5,%1,%2\;\
|
3203 |
|
|
shlqbyi\t%0,%4,4\;\
|
3204 |
|
|
selb\t%0,%4,%0,%3\;\
|
3205 |
|
|
shlqbyi\t%0,%0,4\;\
|
3206 |
|
|
selb\t%0,%4,%0,%3\;\
|
3207 |
|
|
shlqbyi\t%0,%0,4\;\
|
3208 |
|
|
selb\t%0,%5,%0,%3"
|
3209 |
|
|
[(set_attr "type" "multi0")
|
3210 |
|
|
(set_attr "length" "36")])
|
3211 |
|
|
|
3212 |
|
|
(define_insn "cgt_"
|
3213 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
3214 |
|
|
(gt: (match_operand:VSF 1 "spu_reg_operand" "r")
|
3215 |
|
|
(match_operand:VSF 2 "spu_reg_operand" "r")))]
|
3216 |
|
|
""
|
3217 |
|
|
"fcgt\t%0,%1,%2")
|
3218 |
|
|
|
3219 |
|
|
(define_insn "cmgt_"
|
3220 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
3221 |
|
|
(gt: (abs:VSF (match_operand:VSF 1 "spu_reg_operand" "r"))
|
3222 |
|
|
(abs:VSF (match_operand:VSF 2 "spu_reg_operand" "r"))))]
|
3223 |
|
|
""
|
3224 |
|
|
"fcmgt\t%0,%1,%2")
|
3225 |
|
|
|
3226 |
|
|
(define_expand "cgt_df"
|
3227 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
3228 |
|
|
(gt:SI (match_operand:DF 1 "spu_reg_operand" "r")
|
3229 |
|
|
(match_operand:DF 2 "const_zero_operand" "i")))]
|
3230 |
|
|
""
|
3231 |
|
|
{
|
3232 |
|
|
if (spu_arch == PROCESSOR_CELL)
|
3233 |
|
|
{
|
3234 |
|
|
rtx ra = gen_reg_rtx (V4SImode);
|
3235 |
|
|
rtx rb = gen_reg_rtx (V4SImode);
|
3236 |
|
|
rtx zero = gen_reg_rtx (V4SImode);
|
3237 |
|
|
rtx temp = gen_reg_rtx (TImode);
|
3238 |
|
|
rtx temp_v4si = spu_gen_subreg (V4SImode, temp);
|
3239 |
|
|
rtx temp2 = gen_reg_rtx (V4SImode);
|
3240 |
|
|
rtx hi_inf = gen_reg_rtx (V4SImode);
|
3241 |
|
|
rtx a_nan = gen_reg_rtx (V4SImode);
|
3242 |
|
|
rtx b_nan = gen_reg_rtx (V4SImode);
|
3243 |
|
|
rtx a_abs = gen_reg_rtx (V4SImode);
|
3244 |
|
|
rtx b_abs = gen_reg_rtx (V4SImode);
|
3245 |
|
|
rtx asel = gen_reg_rtx (V4SImode);
|
3246 |
|
|
rtx bsel = gen_reg_rtx (V4SImode);
|
3247 |
|
|
rtx abor = gen_reg_rtx (V4SImode);
|
3248 |
|
|
rtx bbor = gen_reg_rtx (V4SImode);
|
3249 |
|
|
rtx gt_hi = gen_reg_rtx (V4SImode);
|
3250 |
|
|
rtx gt_lo = gen_reg_rtx (V4SImode);
|
3251 |
|
|
rtx sign_mask = gen_reg_rtx (V4SImode);
|
3252 |
|
|
rtx nan_mask = gen_reg_rtx (V4SImode);
|
3253 |
|
|
rtx hi_promote = gen_reg_rtx (TImode);
|
3254 |
|
|
rtx borrow_shuffle = gen_reg_rtx (TImode);
|
3255 |
|
|
|
3256 |
|
|
rtx pat = spu_const_from_ints (V4SImode, 0x7FFFFFFF, 0xFFFFFFFF,
|
3257 |
|
|
0x7FFFFFFF, 0xFFFFFFFF);
|
3258 |
|
|
emit_move_insn (sign_mask, pat);
|
3259 |
|
|
pat = spu_const_from_ints (V4SImode, 0x7FF00000, 0x0,
|
3260 |
|
|
0x7FF00000, 0x0);
|
3261 |
|
|
emit_move_insn (nan_mask, pat);
|
3262 |
|
|
pat = spu_const_from_ints (TImode, 0x00010203, 0x00010203,
|
3263 |
|
|
0x08090A0B, 0x08090A0B);
|
3264 |
|
|
emit_move_insn (hi_promote, pat);
|
3265 |
|
|
pat = spu_const_from_ints (TImode, 0x04050607, 0xC0C0C0C0,
|
3266 |
|
|
0x0C0D0E0F, 0xC0C0C0C0);
|
3267 |
|
|
emit_move_insn (borrow_shuffle, pat);
|
3268 |
|
|
|
3269 |
|
|
emit_insn (gen_spu_convert (ra, operands[1]));
|
3270 |
|
|
emit_insn (gen_spu_convert (rb, operands[2]));
|
3271 |
|
|
emit_insn (gen_andv4si3 (a_abs, ra, sign_mask));
|
3272 |
|
|
emit_insn (gen_andv4si3 (b_abs, rb, sign_mask));
|
3273 |
|
|
|
3274 |
|
|
if (!flag_finite_math_only)
|
3275 |
|
|
{
|
3276 |
|
|
/* check if ra is NaN */
|
3277 |
|
|
emit_insn (gen_ceq_v4si (hi_inf, a_abs, nan_mask));
|
3278 |
|
|
emit_insn (gen_clgt_v4si (a_nan, a_abs, nan_mask));
|
3279 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, a_nan),
|
3280 |
|
|
GEN_INT (4 * 8)));
|
3281 |
|
|
emit_insn (gen_andv4si3 (temp2, temp_v4si, hi_inf));
|
3282 |
|
|
emit_insn (gen_iorv4si3 (a_nan, a_nan, temp2));
|
3283 |
|
|
emit_insn (gen_shufb (a_nan, a_nan, a_nan, hi_promote));
|
3284 |
|
|
|
3285 |
|
|
/* check if rb is NaN */
|
3286 |
|
|
emit_insn (gen_ceq_v4si (hi_inf, b_abs, nan_mask));
|
3287 |
|
|
emit_insn (gen_clgt_v4si (b_nan, b_abs, nan_mask));
|
3288 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, b_nan),
|
3289 |
|
|
GEN_INT (4 * 8)));
|
3290 |
|
|
emit_insn (gen_andv4si3 (temp2, temp_v4si, hi_inf));
|
3291 |
|
|
emit_insn (gen_iorv4si3 (b_nan, b_nan, temp2));
|
3292 |
|
|
emit_insn (gen_shufb (b_nan, b_nan, b_nan, hi_promote));
|
3293 |
|
|
|
3294 |
|
|
/* check if ra or rb is NaN */
|
3295 |
|
|
emit_insn (gen_iorv4si3 (a_nan, a_nan, b_nan));
|
3296 |
|
|
}
|
3297 |
|
|
emit_move_insn (zero, CONST0_RTX (V4SImode));
|
3298 |
|
|
emit_insn (gen_vashrv4si3 (asel, ra, spu_const (V4SImode, 31)));
|
3299 |
|
|
emit_insn (gen_shufb (asel, asel, asel, hi_promote));
|
3300 |
|
|
emit_insn (gen_bg_v4si (abor, zero, a_abs));
|
3301 |
|
|
emit_insn (gen_shufb (abor, abor, abor, borrow_shuffle));
|
3302 |
|
|
emit_insn (gen_sfx_v4si (abor, zero, a_abs, abor));
|
3303 |
|
|
emit_insn (gen_selb (abor, a_abs, abor, asel));
|
3304 |
|
|
|
3305 |
|
|
emit_insn (gen_vashrv4si3 (bsel, rb, spu_const (V4SImode, 31)));
|
3306 |
|
|
emit_insn (gen_shufb (bsel, bsel, bsel, hi_promote));
|
3307 |
|
|
emit_insn (gen_bg_v4si (bbor, zero, b_abs));
|
3308 |
|
|
emit_insn (gen_shufb (bbor, bbor, bbor, borrow_shuffle));
|
3309 |
|
|
emit_insn (gen_sfx_v4si (bbor, zero, b_abs, bbor));
|
3310 |
|
|
emit_insn (gen_selb (bbor, b_abs, bbor, bsel));
|
3311 |
|
|
|
3312 |
|
|
emit_insn (gen_cgt_v4si (gt_hi, abor, bbor));
|
3313 |
|
|
emit_insn (gen_clgt_v4si (gt_lo, abor, bbor));
|
3314 |
|
|
emit_insn (gen_ceq_v4si (temp2, abor, bbor));
|
3315 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, gt_lo),
|
3316 |
|
|
GEN_INT (4 * 8)));
|
3317 |
|
|
emit_insn (gen_andv4si3 (temp2, temp2, temp_v4si));
|
3318 |
|
|
emit_insn (gen_iorv4si3 (temp2, gt_hi, temp2));
|
3319 |
|
|
emit_insn (gen_shufb (temp2, temp2, temp2, hi_promote));
|
3320 |
|
|
if (!flag_finite_math_only)
|
3321 |
|
|
{
|
3322 |
|
|
/* correct for NaNs */
|
3323 |
|
|
emit_insn (gen_andc_v4si (temp2, temp2, a_nan));
|
3324 |
|
|
}
|
3325 |
|
|
emit_insn (gen_spu_convert (operands[0], temp2));
|
3326 |
|
|
DONE;
|
3327 |
|
|
}
|
3328 |
|
|
})
|
3329 |
|
|
|
3330 |
|
|
(define_insn "cgt__celledp"
|
3331 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
3332 |
|
|
(gt: (match_operand:VDF 1 "spu_reg_operand" "r")
|
3333 |
|
|
(match_operand:VDF 2 "spu_reg_operand" "r")))]
|
3334 |
|
|
"spu_arch == PROCESSOR_CELLEDP"
|
3335 |
|
|
"dfcgt\t%0,%1,%2"
|
3336 |
|
|
[(set_attr "type" "fpd")])
|
3337 |
|
|
|
3338 |
|
|
(define_insn "cmgt__celledp"
|
3339 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
3340 |
|
|
(gt: (abs:VDF (match_operand:VDF 1 "spu_reg_operand" "r"))
|
3341 |
|
|
(abs:VDF (match_operand:VDF 2 "spu_reg_operand" "r"))))]
|
3342 |
|
|
"spu_arch == PROCESSOR_CELLEDP"
|
3343 |
|
|
"dfcmgt\t%0,%1,%2"
|
3344 |
|
|
[(set_attr "type" "fpd")])
|
3345 |
|
|
|
3346 |
|
|
(define_expand "cgt_v2df"
|
3347 |
|
|
[(set (match_operand:V2DI 0 "spu_reg_operand" "=r")
|
3348 |
|
|
(gt:V2DI (match_operand:V2DF 1 "spu_reg_operand" "r")
|
3349 |
|
|
(match_operand:V2DF 2 "spu_reg_operand" "r")))]
|
3350 |
|
|
""
|
3351 |
|
|
{
|
3352 |
|
|
if (spu_arch == PROCESSOR_CELL)
|
3353 |
|
|
{
|
3354 |
|
|
rtx ra = spu_gen_subreg (V4SImode, operands[1]);
|
3355 |
|
|
rtx rb = spu_gen_subreg (V4SImode, operands[2]);
|
3356 |
|
|
rtx zero = gen_reg_rtx (V4SImode);
|
3357 |
|
|
rtx temp = gen_reg_rtx (TImode);
|
3358 |
|
|
rtx temp_v4si = spu_gen_subreg (V4SImode, temp);
|
3359 |
|
|
rtx temp2 = gen_reg_rtx (V4SImode);
|
3360 |
|
|
rtx hi_inf = gen_reg_rtx (V4SImode);
|
3361 |
|
|
rtx a_nan = gen_reg_rtx (V4SImode);
|
3362 |
|
|
rtx b_nan = gen_reg_rtx (V4SImode);
|
3363 |
|
|
rtx a_abs = gen_reg_rtx (V4SImode);
|
3364 |
|
|
rtx b_abs = gen_reg_rtx (V4SImode);
|
3365 |
|
|
rtx asel = gen_reg_rtx (V4SImode);
|
3366 |
|
|
rtx bsel = gen_reg_rtx (V4SImode);
|
3367 |
|
|
rtx abor = gen_reg_rtx (V4SImode);
|
3368 |
|
|
rtx bbor = gen_reg_rtx (V4SImode);
|
3369 |
|
|
rtx gt_hi = gen_reg_rtx (V4SImode);
|
3370 |
|
|
rtx gt_lo = gen_reg_rtx (V4SImode);
|
3371 |
|
|
rtx sign_mask = gen_reg_rtx (V4SImode);
|
3372 |
|
|
rtx nan_mask = gen_reg_rtx (V4SImode);
|
3373 |
|
|
rtx hi_promote = gen_reg_rtx (TImode);
|
3374 |
|
|
rtx borrow_shuffle = gen_reg_rtx (TImode);
|
3375 |
|
|
rtx pat = spu_const_from_ints (V4SImode, 0x7FFFFFFF, 0xFFFFFFFF,
|
3376 |
|
|
0x7FFFFFFF, 0xFFFFFFFF);
|
3377 |
|
|
emit_move_insn (sign_mask, pat);
|
3378 |
|
|
pat = spu_const_from_ints (V4SImode, 0x7FF00000, 0x0,
|
3379 |
|
|
0x7FF00000, 0x0);
|
3380 |
|
|
emit_move_insn (nan_mask, pat);
|
3381 |
|
|
pat = spu_const_from_ints (TImode, 0x00010203, 0x00010203,
|
3382 |
|
|
0x08090A0B, 0x08090A0B);
|
3383 |
|
|
emit_move_insn (hi_promote, pat);
|
3384 |
|
|
pat = spu_const_from_ints (TImode, 0x04050607, 0xC0C0C0C0,
|
3385 |
|
|
0x0C0D0E0F, 0xC0C0C0C0);
|
3386 |
|
|
emit_move_insn (borrow_shuffle, pat);
|
3387 |
|
|
|
3388 |
|
|
emit_insn (gen_andv4si3 (a_abs, ra, sign_mask));
|
3389 |
|
|
emit_insn (gen_ceq_v4si (hi_inf, a_abs, nan_mask));
|
3390 |
|
|
emit_insn (gen_clgt_v4si (a_nan, a_abs, nan_mask));
|
3391 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, a_nan),
|
3392 |
|
|
GEN_INT (4 * 8)));
|
3393 |
|
|
emit_insn (gen_andv4si3 (temp2, temp_v4si, hi_inf));
|
3394 |
|
|
emit_insn (gen_iorv4si3 (a_nan, a_nan, temp2));
|
3395 |
|
|
emit_insn (gen_shufb (a_nan, a_nan, a_nan, hi_promote));
|
3396 |
|
|
emit_insn (gen_andv4si3 (b_abs, rb, sign_mask));
|
3397 |
|
|
emit_insn (gen_ceq_v4si (hi_inf, b_abs, nan_mask));
|
3398 |
|
|
emit_insn (gen_clgt_v4si (b_nan, b_abs, nan_mask));
|
3399 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, b_nan),
|
3400 |
|
|
GEN_INT (4 * 8)));
|
3401 |
|
|
emit_insn (gen_andv4si3 (temp2, temp_v4si, hi_inf));
|
3402 |
|
|
emit_insn (gen_iorv4si3 (b_nan, b_nan, temp2));
|
3403 |
|
|
emit_insn (gen_shufb (b_nan, b_nan, b_nan, hi_promote));
|
3404 |
|
|
emit_insn (gen_iorv4si3 (a_nan, a_nan, b_nan));
|
3405 |
|
|
emit_move_insn (zero, CONST0_RTX (V4SImode));
|
3406 |
|
|
emit_insn (gen_vashrv4si3 (asel, ra, spu_const (V4SImode, 31)));
|
3407 |
|
|
emit_insn (gen_shufb (asel, asel, asel, hi_promote));
|
3408 |
|
|
emit_insn (gen_bg_v4si (abor, zero, a_abs));
|
3409 |
|
|
emit_insn (gen_shufb (abor, abor, abor, borrow_shuffle));
|
3410 |
|
|
emit_insn (gen_sfx_v4si (abor, zero, a_abs, abor));
|
3411 |
|
|
emit_insn (gen_selb (abor, a_abs, abor, asel));
|
3412 |
|
|
emit_insn (gen_vashrv4si3 (bsel, rb, spu_const (V4SImode, 31)));
|
3413 |
|
|
emit_insn (gen_shufb (bsel, bsel, bsel, hi_promote));
|
3414 |
|
|
emit_insn (gen_bg_v4si (bbor, zero, b_abs));
|
3415 |
|
|
emit_insn (gen_shufb (bbor, bbor, bbor, borrow_shuffle));
|
3416 |
|
|
emit_insn (gen_sfx_v4si (bbor, zero, b_abs, bbor));
|
3417 |
|
|
emit_insn (gen_selb (bbor, b_abs, bbor, bsel));
|
3418 |
|
|
emit_insn (gen_cgt_v4si (gt_hi, abor, bbor));
|
3419 |
|
|
emit_insn (gen_clgt_v4si (gt_lo, abor, bbor));
|
3420 |
|
|
emit_insn (gen_ceq_v4si (temp2, abor, bbor));
|
3421 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, gt_lo),
|
3422 |
|
|
GEN_INT (4 * 8)));
|
3423 |
|
|
emit_insn (gen_andv4si3 (temp2, temp2, temp_v4si));
|
3424 |
|
|
emit_insn (gen_iorv4si3 (temp2, gt_hi, temp2));
|
3425 |
|
|
|
3426 |
|
|
emit_insn (gen_shufb (temp2, temp2, temp2, hi_promote));
|
3427 |
|
|
emit_insn (gen_andc_v4si (temp2, temp2, a_nan));
|
3428 |
|
|
emit_move_insn (operands[0], spu_gen_subreg (V2DImode, temp2));
|
3429 |
|
|
DONE;
|
3430 |
|
|
}
|
3431 |
|
|
})
|
3432 |
|
|
|
3433 |
|
|
(define_expand "cmgt_v2df"
|
3434 |
|
|
[(set (match_operand:V2DI 0 "spu_reg_operand" "=r")
|
3435 |
|
|
(gt:V2DI (abs:V2DF (match_operand:V2DF 1 "spu_reg_operand" "r"))
|
3436 |
|
|
(abs:V2DF (match_operand:V2DF 2 "spu_reg_operand" "r"))))]
|
3437 |
|
|
""
|
3438 |
|
|
{
|
3439 |
|
|
if (spu_arch == PROCESSOR_CELL)
|
3440 |
|
|
{
|
3441 |
|
|
rtx ra = spu_gen_subreg (V4SImode, operands[1]);
|
3442 |
|
|
rtx rb = spu_gen_subreg (V4SImode, operands[2]);
|
3443 |
|
|
rtx temp = gen_reg_rtx (TImode);
|
3444 |
|
|
rtx temp_v4si = spu_gen_subreg (V4SImode, temp);
|
3445 |
|
|
rtx temp2 = gen_reg_rtx (V4SImode);
|
3446 |
|
|
rtx hi_inf = gen_reg_rtx (V4SImode);
|
3447 |
|
|
rtx a_nan = gen_reg_rtx (V4SImode);
|
3448 |
|
|
rtx b_nan = gen_reg_rtx (V4SImode);
|
3449 |
|
|
rtx a_abs = gen_reg_rtx (V4SImode);
|
3450 |
|
|
rtx b_abs = gen_reg_rtx (V4SImode);
|
3451 |
|
|
rtx gt_hi = gen_reg_rtx (V4SImode);
|
3452 |
|
|
rtx gt_lo = gen_reg_rtx (V4SImode);
|
3453 |
|
|
rtx sign_mask = gen_reg_rtx (V4SImode);
|
3454 |
|
|
rtx nan_mask = gen_reg_rtx (V4SImode);
|
3455 |
|
|
rtx hi_promote = gen_reg_rtx (TImode);
|
3456 |
|
|
rtx pat = spu_const_from_ints (V4SImode, 0x7FFFFFFF, 0xFFFFFFFF,
|
3457 |
|
|
0x7FFFFFFF, 0xFFFFFFFF);
|
3458 |
|
|
emit_move_insn (sign_mask, pat);
|
3459 |
|
|
pat = spu_const_from_ints (V4SImode, 0x7FF00000, 0x0,
|
3460 |
|
|
0x7FF00000, 0x0);
|
3461 |
|
|
emit_move_insn (nan_mask, pat);
|
3462 |
|
|
pat = spu_const_from_ints (TImode, 0x00010203, 0x00010203,
|
3463 |
|
|
0x08090A0B, 0x08090A0B);
|
3464 |
|
|
emit_move_insn (hi_promote, pat);
|
3465 |
|
|
|
3466 |
|
|
emit_insn (gen_andv4si3 (a_abs, ra, sign_mask));
|
3467 |
|
|
emit_insn (gen_ceq_v4si (hi_inf, a_abs, nan_mask));
|
3468 |
|
|
emit_insn (gen_clgt_v4si (a_nan, a_abs, nan_mask));
|
3469 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, a_nan),
|
3470 |
|
|
GEN_INT (4 * 8)));
|
3471 |
|
|
emit_insn (gen_andv4si3 (temp2, temp_v4si, hi_inf));
|
3472 |
|
|
emit_insn (gen_iorv4si3 (a_nan, a_nan, temp2));
|
3473 |
|
|
emit_insn (gen_shufb (a_nan, a_nan, a_nan, hi_promote));
|
3474 |
|
|
emit_insn (gen_andv4si3 (b_abs, rb, sign_mask));
|
3475 |
|
|
emit_insn (gen_ceq_v4si (hi_inf, b_abs, nan_mask));
|
3476 |
|
|
emit_insn (gen_clgt_v4si (b_nan, b_abs, nan_mask));
|
3477 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, b_nan),
|
3478 |
|
|
GEN_INT (4 * 8)));
|
3479 |
|
|
emit_insn (gen_andv4si3 (temp2, temp_v4si, hi_inf));
|
3480 |
|
|
emit_insn (gen_iorv4si3 (b_nan, b_nan, temp2));
|
3481 |
|
|
emit_insn (gen_shufb (b_nan, b_nan, b_nan, hi_promote));
|
3482 |
|
|
emit_insn (gen_iorv4si3 (a_nan, a_nan, b_nan));
|
3483 |
|
|
|
3484 |
|
|
emit_insn (gen_clgt_v4si (gt_hi, a_abs, b_abs));
|
3485 |
|
|
emit_insn (gen_clgt_v4si (gt_lo, a_abs, b_abs));
|
3486 |
|
|
emit_insn (gen_ceq_v4si (temp2, a_abs, b_abs));
|
3487 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, gt_lo),
|
3488 |
|
|
GEN_INT (4 * 8)));
|
3489 |
|
|
emit_insn (gen_andv4si3 (temp2, temp2, temp_v4si));
|
3490 |
|
|
emit_insn (gen_iorv4si3 (temp2, gt_hi, temp2));
|
3491 |
|
|
emit_insn (gen_shufb (temp2, temp2, temp2, hi_promote));
|
3492 |
|
|
emit_insn (gen_andc_v4si (temp2, temp2, a_nan));
|
3493 |
|
|
emit_move_insn (operands[0], spu_gen_subreg (V2DImode, temp2));
|
3494 |
|
|
DONE;
|
3495 |
|
|
}
|
3496 |
|
|
})
|
3497 |
|
|
|
3498 |
|
|
|
3499 |
|
|
;; clgt
|
3500 |
|
|
|
3501 |
|
|
(define_insn "clgt_"
|
3502 |
|
|
[(set (match_operand:VQHSI 0 "spu_reg_operand" "=r,r")
|
3503 |
|
|
(gtu:VQHSI (match_operand:VQHSI 1 "spu_reg_operand" "r,r")
|
3504 |
|
|
(match_operand:VQHSI 2 "spu_arith_operand" "r,B")))]
|
3505 |
|
|
""
|
3506 |
|
|
"@
|
3507 |
|
|
clgt\t%0,%1,%2
|
3508 |
|
|
clgti\t%0,%1,%2")
|
3509 |
|
|
|
3510 |
|
|
(define_insn_and_split "clgt_di"
|
3511 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
3512 |
|
|
(gtu:SI (match_operand:DI 1 "spu_reg_operand" "r")
|
3513 |
|
|
(match_operand:DI 2 "spu_reg_operand" "r")))
|
3514 |
|
|
(clobber (match_scratch:V4SI 3 "=&r"))
|
3515 |
|
|
(clobber (match_scratch:V4SI 4 "=&r"))
|
3516 |
|
|
(clobber (match_scratch:V4SI 5 "=&r"))]
|
3517 |
|
|
""
|
3518 |
|
|
"#"
|
3519 |
|
|
"reload_completed"
|
3520 |
|
|
[(set (match_dup:SI 0)
|
3521 |
|
|
(gtu:SI (match_dup:DI 1)
|
3522 |
|
|
(match_dup:DI 2)))]
|
3523 |
|
|
{
|
3524 |
|
|
rtx op0 = gen_rtx_REG (V4SImode, REGNO (operands[0]));
|
3525 |
|
|
rtx op1 = gen_rtx_REG (V4SImode, REGNO (operands[1]));
|
3526 |
|
|
rtx op2 = gen_rtx_REG (V4SImode, REGNO (operands[2]));
|
3527 |
|
|
rtx op3 = operands[3];
|
3528 |
|
|
rtx op4 = operands[4];
|
3529 |
|
|
rtx op5 = operands[5];
|
3530 |
|
|
rtx op5d = gen_rtx_REG (V2DImode, REGNO (operands[5]));
|
3531 |
|
|
emit_insn (gen_clgt_v4si (op3, op1, op2));
|
3532 |
|
|
emit_insn (gen_ceq_v4si (op4, op1, op2));
|
3533 |
|
|
emit_insn (gen_spu_xswd (op5d, op3));
|
3534 |
|
|
emit_insn (gen_selb (op0, op3, op5, op4));
|
3535 |
|
|
DONE;
|
3536 |
|
|
})
|
3537 |
|
|
|
3538 |
|
|
(define_insn "clgt_ti"
|
3539 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
3540 |
|
|
(gtu:SI (match_operand:TI 1 "spu_reg_operand" "r")
|
3541 |
|
|
(match_operand:TI 2 "spu_reg_operand" "r")))
|
3542 |
|
|
(clobber (match_scratch:V4SI 3 "=&r"))
|
3543 |
|
|
(clobber (match_scratch:V4SI 4 "=&r"))]
|
3544 |
|
|
""
|
3545 |
|
|
"ceq\t%3,%1,%2\;\
|
3546 |
|
|
clgt\t%4,%1,%2\;\
|
3547 |
|
|
shlqbyi\t%0,%4,4\;\
|
3548 |
|
|
selb\t%0,%4,%0,%3\;\
|
3549 |
|
|
shlqbyi\t%0,%0,4\;\
|
3550 |
|
|
selb\t%0,%4,%0,%3\;\
|
3551 |
|
|
shlqbyi\t%0,%0,4\;\
|
3552 |
|
|
selb\t%0,%4,%0,%3"
|
3553 |
|
|
[(set_attr "type" "multi0")
|
3554 |
|
|
(set_attr "length" "32")])
|
3555 |
|
|
|
3556 |
|
|
|
3557 |
|
|
;; dftsv
|
3558 |
|
|
(define_insn "dftsv_celledp"
|
3559 |
|
|
[(set (match_operand:V2DI 0 "spu_reg_operand" "=r")
|
3560 |
|
|
(unspec:V2DI [(match_operand:V2DF 1 "spu_reg_operand" "r")
|
3561 |
|
|
(match_operand:SI 2 "const_int_operand" "i")]
|
3562 |
|
|
UNSPEC_DFTSV))]
|
3563 |
|
|
"spu_arch == PROCESSOR_CELLEDP"
|
3564 |
|
|
"dftsv\t%0,%1,%2"
|
3565 |
|
|
[(set_attr "type" "fpd")])
|
3566 |
|
|
|
3567 |
|
|
(define_expand "dftsv"
|
3568 |
|
|
[(set (match_operand:V2DI 0 "spu_reg_operand" "=r")
|
3569 |
|
|
(unspec:V2DI [(match_operand:V2DF 1 "spu_reg_operand" "r")
|
3570 |
|
|
(match_operand:SI 2 "const_int_operand" "i")]
|
3571 |
|
|
UNSPEC_DFTSV))]
|
3572 |
|
|
""
|
3573 |
|
|
{
|
3574 |
|
|
if (spu_arch == PROCESSOR_CELL)
|
3575 |
|
|
{
|
3576 |
|
|
rtx result = gen_reg_rtx (V4SImode);
|
3577 |
|
|
emit_move_insn (result, CONST0_RTX (V4SImode));
|
3578 |
|
|
|
3579 |
|
|
if (INTVAL (operands[2]))
|
3580 |
|
|
{
|
3581 |
|
|
rtx ra = spu_gen_subreg (V4SImode, operands[1]);
|
3582 |
|
|
rtx abs = gen_reg_rtx (V4SImode);
|
3583 |
|
|
rtx sign = gen_reg_rtx (V4SImode);
|
3584 |
|
|
rtx temp = gen_reg_rtx (TImode);
|
3585 |
|
|
rtx temp_v4si = spu_gen_subreg (V4SImode, temp);
|
3586 |
|
|
rtx temp2 = gen_reg_rtx (V4SImode);
|
3587 |
|
|
rtx pat = spu_const_from_ints (V4SImode, 0x7FFFFFFF, 0xFFFFFFFF,
|
3588 |
|
|
0x7FFFFFFF, 0xFFFFFFFF);
|
3589 |
|
|
rtx sign_mask = gen_reg_rtx (V4SImode);
|
3590 |
|
|
rtx hi_promote = gen_reg_rtx (TImode);
|
3591 |
|
|
emit_move_insn (sign_mask, pat);
|
3592 |
|
|
pat = spu_const_from_ints (TImode, 0x00010203, 0x00010203,
|
3593 |
|
|
0x08090A0B, 0x08090A0B);
|
3594 |
|
|
emit_move_insn (hi_promote, pat);
|
3595 |
|
|
|
3596 |
|
|
emit_insn (gen_vashrv4si3 (sign, ra, spu_const (V4SImode, 31)));
|
3597 |
|
|
emit_insn (gen_shufb (sign, sign, sign, hi_promote));
|
3598 |
|
|
emit_insn (gen_andv4si3 (abs, ra, sign_mask));
|
3599 |
|
|
|
3600 |
|
|
/* NaN or +inf or -inf */
|
3601 |
|
|
if (INTVAL (operands[2]) & 0x70)
|
3602 |
|
|
{
|
3603 |
|
|
rtx nan_mask = gen_reg_rtx (V4SImode);
|
3604 |
|
|
rtx isinf = gen_reg_rtx (V4SImode);
|
3605 |
|
|
pat = spu_const_from_ints (V4SImode, 0x7FF00000, 0x0,
|
3606 |
|
|
0x7FF00000, 0x0);
|
3607 |
|
|
emit_move_insn (nan_mask, pat);
|
3608 |
|
|
emit_insn (gen_ceq_v4si (isinf, abs, nan_mask));
|
3609 |
|
|
|
3610 |
|
|
/* NaN */
|
3611 |
|
|
if (INTVAL (operands[2]) & 0x40)
|
3612 |
|
|
{
|
3613 |
|
|
rtx isnan = gen_reg_rtx (V4SImode);
|
3614 |
|
|
emit_insn (gen_clgt_v4si (isnan, abs, nan_mask));
|
3615 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, isnan),
|
3616 |
|
|
GEN_INT (4 * 8)));
|
3617 |
|
|
emit_insn (gen_andv4si3 (temp2, temp_v4si, isinf));
|
3618 |
|
|
emit_insn (gen_iorv4si3 (isnan, isnan, temp2));
|
3619 |
|
|
emit_insn (gen_shufb (isnan, isnan, isnan, hi_promote));
|
3620 |
|
|
emit_insn (gen_iorv4si3 (result, result, isnan));
|
3621 |
|
|
}
|
3622 |
|
|
/* +inf or -inf */
|
3623 |
|
|
if (INTVAL (operands[2]) & 0x30)
|
3624 |
|
|
{
|
3625 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, isinf),
|
3626 |
|
|
GEN_INT (4 * 8)));
|
3627 |
|
|
emit_insn (gen_andv4si3 (isinf, isinf, temp_v4si));
|
3628 |
|
|
emit_insn (gen_shufb (isinf, isinf, isinf, hi_promote));
|
3629 |
|
|
|
3630 |
|
|
/* +inf */
|
3631 |
|
|
if (INTVAL (operands[2]) & 0x20)
|
3632 |
|
|
{
|
3633 |
|
|
emit_insn (gen_andc_v4si (temp2, isinf, sign));
|
3634 |
|
|
emit_insn (gen_iorv4si3 (result, result, temp2));
|
3635 |
|
|
}
|
3636 |
|
|
/* -inf */
|
3637 |
|
|
if (INTVAL (operands[2]) & 0x10)
|
3638 |
|
|
{
|
3639 |
|
|
emit_insn (gen_andv4si3 (temp2, isinf, sign));
|
3640 |
|
|
emit_insn (gen_iorv4si3 (result, result, temp2));
|
3641 |
|
|
}
|
3642 |
|
|
}
|
3643 |
|
|
}
|
3644 |
|
|
|
3645 |
|
|
/* 0 or denorm */
|
3646 |
|
|
if (INTVAL (operands[2]) & 0xF)
|
3647 |
|
|
{
|
3648 |
|
|
rtx iszero = gen_reg_rtx (V4SImode);
|
3649 |
|
|
emit_insn (gen_ceq_v4si (iszero, abs, CONST0_RTX (V4SImode)));
|
3650 |
|
|
emit_insn (gen_rotlti3 (temp, spu_gen_subreg (TImode, iszero),
|
3651 |
|
|
GEN_INT (4 * 8)));
|
3652 |
|
|
emit_insn (gen_andv4si3 (iszero, iszero, temp_v4si));
|
3653 |
|
|
|
3654 |
|
|
/* denorm */
|
3655 |
|
|
if (INTVAL (operands[2]) & 0x3)
|
3656 |
|
|
{
|
3657 |
|
|
rtx isdenorm = gen_reg_rtx (V4SImode);
|
3658 |
|
|
rtx denorm_mask = gen_reg_rtx (V4SImode);
|
3659 |
|
|
emit_move_insn (denorm_mask, spu_const (V4SImode, 0xFFFFF));
|
3660 |
|
|
emit_insn (gen_clgt_v4si (isdenorm, abs, denorm_mask));
|
3661 |
|
|
emit_insn (gen_nor_v4si (isdenorm, isdenorm, iszero));
|
3662 |
|
|
emit_insn (gen_shufb (isdenorm, isdenorm,
|
3663 |
|
|
isdenorm, hi_promote));
|
3664 |
|
|
/* +denorm */
|
3665 |
|
|
if (INTVAL (operands[2]) & 0x2)
|
3666 |
|
|
{
|
3667 |
|
|
emit_insn (gen_andc_v4si (temp2, isdenorm, sign));
|
3668 |
|
|
emit_insn (gen_iorv4si3 (result, result, temp2));
|
3669 |
|
|
}
|
3670 |
|
|
/* -denorm */
|
3671 |
|
|
if (INTVAL (operands[2]) & 0x1)
|
3672 |
|
|
{
|
3673 |
|
|
emit_insn (gen_andv4si3 (temp2, isdenorm, sign));
|
3674 |
|
|
emit_insn (gen_iorv4si3 (result, result, temp2));
|
3675 |
|
|
}
|
3676 |
|
|
}
|
3677 |
|
|
|
3678 |
|
|
/* 0 */
|
3679 |
|
|
if (INTVAL (operands[2]) & 0xC)
|
3680 |
|
|
{
|
3681 |
|
|
emit_insn (gen_shufb (iszero, iszero, iszero, hi_promote));
|
3682 |
|
|
/* +0 */
|
3683 |
|
|
if (INTVAL (operands[2]) & 0x8)
|
3684 |
|
|
{
|
3685 |
|
|
emit_insn (gen_andc_v4si (temp2, iszero, sign));
|
3686 |
|
|
emit_insn (gen_iorv4si3 (result, result, temp2));
|
3687 |
|
|
}
|
3688 |
|
|
/* -0 */
|
3689 |
|
|
if (INTVAL (operands[2]) & 0x4)
|
3690 |
|
|
{
|
3691 |
|
|
emit_insn (gen_andv4si3 (temp2, iszero, sign));
|
3692 |
|
|
emit_insn (gen_iorv4si3 (result, result, temp2));
|
3693 |
|
|
}
|
3694 |
|
|
}
|
3695 |
|
|
}
|
3696 |
|
|
}
|
3697 |
|
|
emit_move_insn (operands[0], spu_gen_subreg (V2DImode, result));
|
3698 |
|
|
DONE;
|
3699 |
|
|
}
|
3700 |
|
|
})
|
3701 |
|
|
|
3702 |
|
|
|
3703 |
|
|
;; branches
|
3704 |
|
|
|
3705 |
|
|
(define_insn ""
|
3706 |
|
|
[(set (pc)
|
3707 |
|
|
(if_then_else (match_operator 1 "branch_comparison_operator"
|
3708 |
|
|
[(match_operand 2
|
3709 |
|
|
"spu_reg_operand" "r")
|
3710 |
|
|
(const_int 0)])
|
3711 |
|
|
(label_ref (match_operand 0 "" ""))
|
3712 |
|
|
(pc)))]
|
3713 |
|
|
""
|
3714 |
|
|
"br%b2%b1z\t%2,%0"
|
3715 |
|
|
[(set_attr "type" "br")])
|
3716 |
|
|
|
3717 |
|
|
(define_insn ""
|
3718 |
|
|
[(set (pc)
|
3719 |
|
|
(if_then_else (match_operator 0 "branch_comparison_operator"
|
3720 |
|
|
[(match_operand 1
|
3721 |
|
|
"spu_reg_operand" "r")
|
3722 |
|
|
(const_int 0)])
|
3723 |
|
|
(return)
|
3724 |
|
|
(pc)))]
|
3725 |
|
|
"direct_return ()"
|
3726 |
|
|
"bi%b1%b0z\t%1,$lr"
|
3727 |
|
|
[(set_attr "type" "br")])
|
3728 |
|
|
|
3729 |
|
|
(define_insn ""
|
3730 |
|
|
[(set (pc)
|
3731 |
|
|
(if_then_else (match_operator 1 "branch_comparison_operator"
|
3732 |
|
|
[(match_operand 2
|
3733 |
|
|
"spu_reg_operand" "r")
|
3734 |
|
|
(const_int 0)])
|
3735 |
|
|
(pc)
|
3736 |
|
|
(label_ref (match_operand 0 "" ""))))]
|
3737 |
|
|
""
|
3738 |
|
|
"br%b2%b1z\t%2,%0"
|
3739 |
|
|
[(set_attr "type" "br")])
|
3740 |
|
|
|
3741 |
|
|
(define_insn ""
|
3742 |
|
|
[(set (pc)
|
3743 |
|
|
(if_then_else (match_operator 0 "branch_comparison_operator"
|
3744 |
|
|
[(match_operand 1
|
3745 |
|
|
"spu_reg_operand" "r")
|
3746 |
|
|
(const_int 0)])
|
3747 |
|
|
(pc)
|
3748 |
|
|
(return)))]
|
3749 |
|
|
"direct_return ()"
|
3750 |
|
|
"bi%b1%b0z\t%1,$lr"
|
3751 |
|
|
[(set_attr "type" "br")])
|
3752 |
|
|
|
3753 |
|
|
|
3754 |
|
|
;; vector conditional compare patterns
|
3755 |
|
|
(define_expand "vcond"
|
3756 |
|
|
[(set (match_operand:VCMP 0 "spu_reg_operand" "=r")
|
3757 |
|
|
(if_then_else:VCMP
|
3758 |
|
|
(match_operator 3 "comparison_operator"
|
3759 |
|
|
[(match_operand:VCMP 4 "spu_reg_operand" "r")
|
3760 |
|
|
(match_operand:VCMP 5 "spu_reg_operand" "r")])
|
3761 |
|
|
(match_operand:VCMP 1 "spu_reg_operand" "r")
|
3762 |
|
|
(match_operand:VCMP 2 "spu_reg_operand" "r")))]
|
3763 |
|
|
""
|
3764 |
|
|
{
|
3765 |
|
|
if (spu_emit_vector_cond_expr (operands[0], operands[1], operands[2],
|
3766 |
|
|
operands[3], operands[4], operands[5]))
|
3767 |
|
|
DONE;
|
3768 |
|
|
else
|
3769 |
|
|
FAIL;
|
3770 |
|
|
})
|
3771 |
|
|
|
3772 |
|
|
(define_expand "vcondu"
|
3773 |
|
|
[(set (match_operand:VCMPU 0 "spu_reg_operand" "=r")
|
3774 |
|
|
(if_then_else:VCMPU
|
3775 |
|
|
(match_operator 3 "comparison_operator"
|
3776 |
|
|
[(match_operand:VCMPU 4 "spu_reg_operand" "r")
|
3777 |
|
|
(match_operand:VCMPU 5 "spu_reg_operand" "r")])
|
3778 |
|
|
(match_operand:VCMPU 1 "spu_reg_operand" "r")
|
3779 |
|
|
(match_operand:VCMPU 2 "spu_reg_operand" "r")))]
|
3780 |
|
|
""
|
3781 |
|
|
{
|
3782 |
|
|
if (spu_emit_vector_cond_expr (operands[0], operands[1], operands[2],
|
3783 |
|
|
operands[3], operands[4], operands[5]))
|
3784 |
|
|
DONE;
|
3785 |
|
|
else
|
3786 |
|
|
FAIL;
|
3787 |
|
|
})
|
3788 |
|
|
|
3789 |
|
|
|
3790 |
|
|
;; branch on condition
|
3791 |
|
|
|
3792 |
|
|
(define_expand "cbranch4"
|
3793 |
|
|
[(use (match_operator 0 "ordered_comparison_operator"
|
3794 |
|
|
[(match_operand:VQHSI 1 "spu_reg_operand" "")
|
3795 |
|
|
(match_operand:VQHSI 2 "spu_nonmem_operand" "")]))
|
3796 |
|
|
(use (match_operand 3 ""))]
|
3797 |
|
|
""
|
3798 |
|
|
{ spu_emit_branch_or_set (0, operands[0], operands); DONE; })
|
3799 |
|
|
|
3800 |
|
|
(define_expand "cbranch4"
|
3801 |
|
|
[(use (match_operator 0 "ordered_comparison_operator"
|
3802 |
|
|
[(match_operand:DTI 1 "spu_reg_operand" "")
|
3803 |
|
|
(match_operand:DTI 2 "spu_reg_operand" "")]))
|
3804 |
|
|
(use (match_operand 3 ""))]
|
3805 |
|
|
""
|
3806 |
|
|
{ spu_emit_branch_or_set (0, operands[0], operands); DONE; })
|
3807 |
|
|
|
3808 |
|
|
(define_expand "cbranch4"
|
3809 |
|
|
[(use (match_operator 0 "ordered_comparison_operator"
|
3810 |
|
|
[(match_operand:VSF 1 "spu_reg_operand" "")
|
3811 |
|
|
(match_operand:VSF 2 "spu_reg_operand" "")]))
|
3812 |
|
|
(use (match_operand 3 ""))]
|
3813 |
|
|
""
|
3814 |
|
|
{ spu_emit_branch_or_set (0, operands[0], operands); DONE; })
|
3815 |
|
|
|
3816 |
|
|
(define_expand "cbranchdf4"
|
3817 |
|
|
[(use (match_operator 0 "ordered_comparison_operator"
|
3818 |
|
|
[(match_operand:DF 1 "spu_reg_operand" "")
|
3819 |
|
|
(match_operand:DF 2 "spu_reg_operand" "")]))
|
3820 |
|
|
(use (match_operand 3 ""))]
|
3821 |
|
|
""
|
3822 |
|
|
{ spu_emit_branch_or_set (0, operands[0], operands); DONE; })
|
3823 |
|
|
|
3824 |
|
|
|
3825 |
|
|
;; set on condition
|
3826 |
|
|
|
3827 |
|
|
(define_expand "cstore4"
|
3828 |
|
|
[(use (match_operator 1 "ordered_comparison_operator"
|
3829 |
|
|
[(match_operand:VQHSI 2 "spu_reg_operand" "")
|
3830 |
|
|
(match_operand:VQHSI 3 "spu_nonmem_operand" "")]))
|
3831 |
|
|
(clobber (match_operand:SI 0 "spu_reg_operand"))]
|
3832 |
|
|
""
|
3833 |
|
|
{ spu_emit_branch_or_set (1, operands[1], operands); DONE; })
|
3834 |
|
|
|
3835 |
|
|
(define_expand "cstore4"
|
3836 |
|
|
[(use (match_operator 1 "ordered_comparison_operator"
|
3837 |
|
|
[(match_operand:DTI 2 "spu_reg_operand" "")
|
3838 |
|
|
(match_operand:DTI 3 "spu_reg_operand" "")]))
|
3839 |
|
|
(clobber (match_operand:SI 0 "spu_reg_operand"))]
|
3840 |
|
|
""
|
3841 |
|
|
{ spu_emit_branch_or_set (1, operands[1], operands); DONE; })
|
3842 |
|
|
|
3843 |
|
|
(define_expand "cstore4"
|
3844 |
|
|
[(use (match_operator 1 "ordered_comparison_operator"
|
3845 |
|
|
[(match_operand:VSF 2 "spu_reg_operand" "")
|
3846 |
|
|
(match_operand:VSF 3 "spu_reg_operand" "")]))
|
3847 |
|
|
(clobber (match_operand:SI 0 "spu_reg_operand"))]
|
3848 |
|
|
""
|
3849 |
|
|
{ spu_emit_branch_or_set (1, operands[1], operands); DONE; })
|
3850 |
|
|
|
3851 |
|
|
(define_expand "cstoredf4"
|
3852 |
|
|
[(use (match_operator 1 "ordered_comparison_operator"
|
3853 |
|
|
[(match_operand:DF 2 "spu_reg_operand" "")
|
3854 |
|
|
(match_operand:DF 3 "spu_reg_operand" "")]))
|
3855 |
|
|
(clobber (match_operand:SI 0 "spu_reg_operand"))]
|
3856 |
|
|
""
|
3857 |
|
|
{ spu_emit_branch_or_set (1, operands[1], operands); DONE; })
|
3858 |
|
|
|
3859 |
|
|
|
3860 |
|
|
;; conditional move
|
3861 |
|
|
|
3862 |
|
|
;; Define this first one so HAVE_conditional_move is defined.
|
3863 |
|
|
(define_insn "movcc_dummy"
|
3864 |
|
|
[(set (match_operand 0 "" "")
|
3865 |
|
|
(if_then_else (match_operand 1 "" "")
|
3866 |
|
|
(match_operand 2 "" "")
|
3867 |
|
|
(match_operand 3 "" "")))]
|
3868 |
|
|
"!operands[0]"
|
3869 |
|
|
"")
|
3870 |
|
|
|
3871 |
|
|
(define_expand "movcc"
|
3872 |
|
|
[(set (match_operand:ALL 0 "spu_reg_operand" "")
|
3873 |
|
|
(if_then_else:ALL (match_operand 1 "ordered_comparison_operator" "")
|
3874 |
|
|
(match_operand:ALL 2 "spu_reg_operand" "")
|
3875 |
|
|
(match_operand:ALL 3 "spu_reg_operand" "")))]
|
3876 |
|
|
""
|
3877 |
|
|
{
|
3878 |
|
|
spu_emit_branch_or_set(2, operands[1], operands);
|
3879 |
|
|
DONE;
|
3880 |
|
|
})
|
3881 |
|
|
|
3882 |
|
|
;; This pattern is used when the result of a compare is not large
|
3883 |
|
|
;; enough to use in a selb when expanding conditional moves.
|
3884 |
|
|
(define_expand "extend_compare"
|
3885 |
|
|
[(set (match_operand 0 "spu_reg_operand" "=r")
|
3886 |
|
|
(unspec [(match_operand 1 "spu_reg_operand" "r")] UNSPEC_EXTEND_CMP))]
|
3887 |
|
|
""
|
3888 |
|
|
{
|
3889 |
|
|
emit_insn (gen_rtx_SET (VOIDmode, operands[0],
|
3890 |
|
|
gen_rtx_UNSPEC (GET_MODE (operands[0]),
|
3891 |
|
|
gen_rtvec (1, operands[1]),
|
3892 |
|
|
UNSPEC_EXTEND_CMP)));
|
3893 |
|
|
DONE;
|
3894 |
|
|
})
|
3895 |
|
|
|
3896 |
|
|
(define_insn "extend_compare"
|
3897 |
|
|
[(set (match_operand:ALL 0 "spu_reg_operand" "=r")
|
3898 |
|
|
(unspec:ALL [(match_operand 1 "spu_reg_operand" "r")] UNSPEC_EXTEND_CMP))]
|
3899 |
|
|
"operands"
|
3900 |
|
|
"fsm\t%0,%1"
|
3901 |
|
|
[(set_attr "type" "shuf")])
|
3902 |
|
|
|
3903 |
|
|
|
3904 |
|
|
;; case
|
3905 |
|
|
|
3906 |
|
|
;; operand 0 is index
|
3907 |
|
|
;; operand 1 is the minimum bound
|
3908 |
|
|
;; operand 2 is the maximum bound - minimum bound + 1
|
3909 |
|
|
;; operand 3 is CODE_LABEL for the table;
|
3910 |
|
|
;; operand 4 is the CODE_LABEL to go to if index out of range.
|
3911 |
|
|
(define_expand "casesi"
|
3912 |
|
|
[(match_operand:SI 0 "spu_reg_operand" "")
|
3913 |
|
|
(match_operand:SI 1 "immediate_operand" "")
|
3914 |
|
|
(match_operand:SI 2 "immediate_operand" "")
|
3915 |
|
|
(match_operand 3 "" "")
|
3916 |
|
|
(match_operand 4 "" "")]
|
3917 |
|
|
""
|
3918 |
|
|
{
|
3919 |
|
|
rtx table = gen_reg_rtx (SImode);
|
3920 |
|
|
rtx index = gen_reg_rtx (SImode);
|
3921 |
|
|
rtx sindex = gen_reg_rtx (SImode);
|
3922 |
|
|
rtx addr = gen_reg_rtx (Pmode);
|
3923 |
|
|
|
3924 |
|
|
emit_move_insn (table, gen_rtx_LABEL_REF (SImode, operands[3]));
|
3925 |
|
|
|
3926 |
|
|
emit_insn (gen_subsi3(index, operands[0], force_reg(SImode, operands[1])));
|
3927 |
|
|
emit_insn (gen_ashlsi3(sindex, index, GEN_INT (2)));
|
3928 |
|
|
emit_move_insn (addr, gen_rtx_MEM (SImode,
|
3929 |
|
|
gen_rtx_PLUS (SImode, table, sindex)));
|
3930 |
|
|
if (flag_pic)
|
3931 |
|
|
emit_insn (gen_addsi3 (addr, addr, table));
|
3932 |
|
|
|
3933 |
|
|
emit_cmp_and_jump_insns (index, operands[2], GTU, NULL_RTX, SImode, 1, operands[4]);
|
3934 |
|
|
emit_jump_insn (gen_tablejump (addr, operands[3]));
|
3935 |
|
|
DONE;
|
3936 |
|
|
})
|
3937 |
|
|
|
3938 |
|
|
(define_insn "tablejump"
|
3939 |
|
|
[(set (pc) (match_operand:SI 0 "spu_reg_operand" "r"))
|
3940 |
|
|
(use (label_ref (match_operand 1 "" "")))]
|
3941 |
|
|
""
|
3942 |
|
|
"bi\t%0"
|
3943 |
|
|
[(set_attr "type" "br")])
|
3944 |
|
|
|
3945 |
|
|
|
3946 |
|
|
;; call
|
3947 |
|
|
|
3948 |
|
|
;; Note that operand 1 is total size of args, in bytes,
|
3949 |
|
|
;; and what the call insn wants is the number of words.
|
3950 |
|
|
(define_expand "sibcall"
|
3951 |
|
|
[(parallel
|
3952 |
|
|
[(call (match_operand:QI 0 "call_operand" "")
|
3953 |
|
|
(match_operand:QI 1 "" ""))
|
3954 |
|
|
(use (reg:SI 0))])]
|
3955 |
|
|
""
|
3956 |
|
|
{
|
3957 |
|
|
if (! call_operand (operands[0], QImode))
|
3958 |
|
|
XEXP (operands[0], 0) = copy_to_mode_reg (Pmode, XEXP (operands[0], 0));
|
3959 |
|
|
})
|
3960 |
|
|
|
3961 |
|
|
(define_insn "_sibcall"
|
3962 |
|
|
[(parallel
|
3963 |
|
|
[(call (match_operand:QI 0 "call_operand" "R,S")
|
3964 |
|
|
(match_operand:QI 1 "" "i,i"))
|
3965 |
|
|
(use (reg:SI 0))])]
|
3966 |
|
|
"SIBLING_CALL_P(insn)"
|
3967 |
|
|
"@
|
3968 |
|
|
bi\t%i0
|
3969 |
|
|
br\t%0"
|
3970 |
|
|
[(set_attr "type" "br,br")])
|
3971 |
|
|
|
3972 |
|
|
(define_expand "sibcall_value"
|
3973 |
|
|
[(parallel
|
3974 |
|
|
[(set (match_operand 0 "" "")
|
3975 |
|
|
(call (match_operand:QI 1 "call_operand" "")
|
3976 |
|
|
(match_operand:QI 2 "" "")))
|
3977 |
|
|
(use (reg:SI 0))])]
|
3978 |
|
|
""
|
3979 |
|
|
{
|
3980 |
|
|
if (! call_operand (operands[1], QImode))
|
3981 |
|
|
XEXP (operands[1], 0) = copy_to_mode_reg (Pmode, XEXP (operands[1], 0));
|
3982 |
|
|
})
|
3983 |
|
|
|
3984 |
|
|
(define_insn "_sibcall_value"
|
3985 |
|
|
[(parallel
|
3986 |
|
|
[(set (match_operand 0 "" "")
|
3987 |
|
|
(call (match_operand:QI 1 "call_operand" "R,S")
|
3988 |
|
|
(match_operand:QI 2 "" "i,i")))
|
3989 |
|
|
(use (reg:SI 0))])]
|
3990 |
|
|
"SIBLING_CALL_P(insn)"
|
3991 |
|
|
"@
|
3992 |
|
|
bi\t%i1
|
3993 |
|
|
br\t%1"
|
3994 |
|
|
[(set_attr "type" "br,br")])
|
3995 |
|
|
|
3996 |
|
|
;; Note that operand 1 is total size of args, in bytes,
|
3997 |
|
|
;; and what the call insn wants is the number of words.
|
3998 |
|
|
(define_expand "call"
|
3999 |
|
|
[(parallel
|
4000 |
|
|
[(call (match_operand:QI 0 "call_operand" "")
|
4001 |
|
|
(match_operand:QI 1 "" ""))
|
4002 |
|
|
(clobber (reg:SI 0))
|
4003 |
|
|
(clobber (reg:SI 130))])]
|
4004 |
|
|
""
|
4005 |
|
|
{
|
4006 |
|
|
if (! call_operand (operands[0], QImode))
|
4007 |
|
|
XEXP (operands[0], 0) = copy_to_mode_reg (Pmode, XEXP (operands[0], 0));
|
4008 |
|
|
})
|
4009 |
|
|
|
4010 |
|
|
(define_insn "_call"
|
4011 |
|
|
[(parallel
|
4012 |
|
|
[(call (match_operand:QI 0 "call_operand" "R,S,T")
|
4013 |
|
|
(match_operand:QI 1 "" "i,i,i"))
|
4014 |
|
|
(clobber (reg:SI 0))
|
4015 |
|
|
(clobber (reg:SI 130))])]
|
4016 |
|
|
""
|
4017 |
|
|
"@
|
4018 |
|
|
bisl\t$lr,%i0
|
4019 |
|
|
brsl\t$lr,%0
|
4020 |
|
|
brasl\t$lr,%0"
|
4021 |
|
|
[(set_attr "type" "br")])
|
4022 |
|
|
|
4023 |
|
|
(define_expand "call_value"
|
4024 |
|
|
[(parallel
|
4025 |
|
|
[(set (match_operand 0 "" "")
|
4026 |
|
|
(call (match_operand:QI 1 "call_operand" "")
|
4027 |
|
|
(match_operand:QI 2 "" "")))
|
4028 |
|
|
(clobber (reg:SI 0))
|
4029 |
|
|
(clobber (reg:SI 130))])]
|
4030 |
|
|
""
|
4031 |
|
|
{
|
4032 |
|
|
if (! call_operand (operands[1], QImode))
|
4033 |
|
|
XEXP (operands[1], 0) = copy_to_mode_reg (Pmode, XEXP (operands[1], 0));
|
4034 |
|
|
})
|
4035 |
|
|
|
4036 |
|
|
(define_insn "_call_value"
|
4037 |
|
|
[(parallel
|
4038 |
|
|
[(set (match_operand 0 "" "")
|
4039 |
|
|
(call (match_operand:QI 1 "call_operand" "R,S,T")
|
4040 |
|
|
(match_operand:QI 2 "" "i,i,i")))
|
4041 |
|
|
(clobber (reg:SI 0))
|
4042 |
|
|
(clobber (reg:SI 130))])]
|
4043 |
|
|
""
|
4044 |
|
|
"@
|
4045 |
|
|
bisl\t$lr,%i1
|
4046 |
|
|
brsl\t$lr,%1
|
4047 |
|
|
brasl\t$lr,%1"
|
4048 |
|
|
[(set_attr "type" "br")])
|
4049 |
|
|
|
4050 |
|
|
(define_expand "untyped_call"
|
4051 |
|
|
[(parallel [(call (match_operand 0 "" "")
|
4052 |
|
|
(const_int 0))
|
4053 |
|
|
(match_operand 1 "" "")
|
4054 |
|
|
(match_operand 2 "" "")])]
|
4055 |
|
|
""
|
4056 |
|
|
{
|
4057 |
|
|
int i;
|
4058 |
|
|
rtx reg = gen_rtx_REG (TImode, 3);
|
4059 |
|
|
|
4060 |
|
|
/* We need to use call_value so the return value registers don't get
|
4061 |
|
|
* clobbered. */
|
4062 |
|
|
emit_call_insn (gen_call_value (reg, operands[0], const0_rtx));
|
4063 |
|
|
|
4064 |
|
|
for (i = 0; i < XVECLEN (operands[2], 0); i++)
|
4065 |
|
|
{
|
4066 |
|
|
rtx set = XVECEXP (operands[2], 0, i);
|
4067 |
|
|
emit_move_insn (SET_DEST (set), SET_SRC (set));
|
4068 |
|
|
}
|
4069 |
|
|
|
4070 |
|
|
/* The optimizer does not know that the call sets the function value
|
4071 |
|
|
registers we stored in the result block. We avoid problems by
|
4072 |
|
|
claiming that all hard registers are used and clobbered at this
|
4073 |
|
|
point. */
|
4074 |
|
|
emit_insn (gen_blockage ());
|
4075 |
|
|
|
4076 |
|
|
DONE;
|
4077 |
|
|
})
|
4078 |
|
|
|
4079 |
|
|
|
4080 |
|
|
;; Patterns used for splitting and combining.
|
4081 |
|
|
|
4082 |
|
|
|
4083 |
|
|
;; Function prologue and epilogue.
|
4084 |
|
|
|
4085 |
|
|
(define_expand "prologue"
|
4086 |
|
|
[(const_int 1)]
|
4087 |
|
|
""
|
4088 |
|
|
{ spu_expand_prologue (); DONE; })
|
4089 |
|
|
|
4090 |
|
|
;; "blockage" is only emited in epilogue. This is what it took to
|
4091 |
|
|
;; make "basic block reordering" work with the insns sequence
|
4092 |
|
|
;; generated by the spu_expand_epilogue (taken from mips.md)
|
4093 |
|
|
|
4094 |
|
|
(define_insn "blockage"
|
4095 |
|
|
[(unspec_volatile [(const_int 0)] UNSPEC_BLOCKAGE)]
|
4096 |
|
|
""
|
4097 |
|
|
""
|
4098 |
|
|
[(set_attr "type" "convert")
|
4099 |
|
|
(set_attr "length" "0")])
|
4100 |
|
|
|
4101 |
|
|
(define_expand "epilogue"
|
4102 |
|
|
[(const_int 2)]
|
4103 |
|
|
""
|
4104 |
|
|
{ spu_expand_epilogue (false); DONE; })
|
4105 |
|
|
|
4106 |
|
|
(define_expand "sibcall_epilogue"
|
4107 |
|
|
[(const_int 2)]
|
4108 |
|
|
""
|
4109 |
|
|
{ spu_expand_epilogue (true); DONE; })
|
4110 |
|
|
|
4111 |
|
|
|
4112 |
|
|
;; stack manipulations
|
4113 |
|
|
|
4114 |
|
|
;; An insn to allocate new stack space for dynamic use (e.g., alloca).
|
4115 |
|
|
;; We move the back-chain and decrement the stack pointer.
|
4116 |
|
|
(define_expand "allocate_stack"
|
4117 |
|
|
[(set (match_operand 0 "spu_reg_operand" "")
|
4118 |
|
|
(minus (reg 1) (match_operand 1 "spu_nonmem_operand" "")))
|
4119 |
|
|
(set (reg 1)
|
4120 |
|
|
(minus (reg 1) (match_dup 1)))]
|
4121 |
|
|
""
|
4122 |
|
|
"spu_allocate_stack (operands[0], operands[1]); DONE;")
|
4123 |
|
|
|
4124 |
|
|
;; These patterns say how to save and restore the stack pointer. We need not
|
4125 |
|
|
;; save the stack pointer at function level since we are careful to preserve
|
4126 |
|
|
;; the backchain.
|
4127 |
|
|
;;
|
4128 |
|
|
|
4129 |
|
|
;; At block level the stack pointer is saved and restored, so that the
|
4130 |
|
|
;; stack space allocated within a block is deallocated when leaving
|
4131 |
|
|
;; block scope. By default, according to the SPU ABI, the stack
|
4132 |
|
|
;; pointer and available stack size are saved in a register. Upon
|
4133 |
|
|
;; restoration, the stack pointer is simply copied back, and the
|
4134 |
|
|
;; current available stack size is calculated against the restored
|
4135 |
|
|
;; stack pointer.
|
4136 |
|
|
;;
|
4137 |
|
|
;; For nonlocal gotos, we must save the stack pointer and its
|
4138 |
|
|
;; backchain and restore both. Note that in the nonlocal case, the
|
4139 |
|
|
;; save area is a memory location.
|
4140 |
|
|
|
4141 |
|
|
(define_expand "save_stack_function"
|
4142 |
|
|
[(match_operand 0 "general_operand" "")
|
4143 |
|
|
(match_operand 1 "general_operand" "")]
|
4144 |
|
|
""
|
4145 |
|
|
"DONE;")
|
4146 |
|
|
|
4147 |
|
|
(define_expand "restore_stack_function"
|
4148 |
|
|
[(match_operand 0 "general_operand" "")
|
4149 |
|
|
(match_operand 1 "general_operand" "")]
|
4150 |
|
|
""
|
4151 |
|
|
"DONE;")
|
4152 |
|
|
|
4153 |
|
|
(define_expand "restore_stack_block"
|
4154 |
|
|
[(match_operand 0 "spu_reg_operand" "")
|
4155 |
|
|
(match_operand 1 "memory_operand" "")]
|
4156 |
|
|
""
|
4157 |
|
|
"
|
4158 |
|
|
{
|
4159 |
|
|
spu_restore_stack_block (operands[0], operands[1]);
|
4160 |
|
|
DONE;
|
4161 |
|
|
}")
|
4162 |
|
|
|
4163 |
|
|
(define_expand "save_stack_nonlocal"
|
4164 |
|
|
[(match_operand 0 "memory_operand" "")
|
4165 |
|
|
(match_operand 1 "spu_reg_operand" "")]
|
4166 |
|
|
""
|
4167 |
|
|
"
|
4168 |
|
|
{
|
4169 |
|
|
rtx temp = gen_reg_rtx (Pmode);
|
4170 |
|
|
|
4171 |
|
|
/* Copy the backchain to the first word, sp to the second. We need to
|
4172 |
|
|
save the back chain because __builtin_apply appears to clobber it. */
|
4173 |
|
|
emit_move_insn (temp, gen_rtx_MEM (Pmode, operands[1]));
|
4174 |
|
|
emit_move_insn (adjust_address_nv (operands[0], SImode, 0), temp);
|
4175 |
|
|
emit_move_insn (adjust_address_nv (operands[0], SImode, 4), operands[1]);
|
4176 |
|
|
DONE;
|
4177 |
|
|
}")
|
4178 |
|
|
|
4179 |
|
|
(define_expand "restore_stack_nonlocal"
|
4180 |
|
|
[(match_operand 0 "spu_reg_operand" "")
|
4181 |
|
|
(match_operand 1 "memory_operand" "")]
|
4182 |
|
|
""
|
4183 |
|
|
"
|
4184 |
|
|
{
|
4185 |
|
|
spu_restore_stack_nonlocal(operands[0], operands[1]);
|
4186 |
|
|
DONE;
|
4187 |
|
|
}")
|
4188 |
|
|
|
4189 |
|
|
|
4190 |
|
|
;; vector patterns
|
4191 |
|
|
|
4192 |
|
|
;; Vector initialization
|
4193 |
|
|
(define_expand "vec_init"
|
4194 |
|
|
[(match_operand:V 0 "register_operand" "")
|
4195 |
|
|
(match_operand 1 "" "")]
|
4196 |
|
|
""
|
4197 |
|
|
{
|
4198 |
|
|
spu_expand_vector_init (operands[0], operands[1]);
|
4199 |
|
|
DONE;
|
4200 |
|
|
})
|
4201 |
|
|
|
4202 |
|
|
(define_expand "vec_set"
|
4203 |
|
|
[(use (match_operand:SI 2 "spu_nonmem_operand" ""))
|
4204 |
|
|
(set (match_dup:TI 3)
|
4205 |
|
|
(unspec:TI [(match_dup:SI 4)
|
4206 |
|
|
(match_dup:SI 5)
|
4207 |
|
|
(match_dup:SI 6)] UNSPEC_CPAT))
|
4208 |
|
|
(set (match_operand:V 0 "spu_reg_operand" "")
|
4209 |
|
|
(unspec:V [(match_operand: 1 "spu_reg_operand" "")
|
4210 |
|
|
(match_dup:V 0)
|
4211 |
|
|
(match_dup:TI 3)] UNSPEC_SHUFB))]
|
4212 |
|
|
""
|
4213 |
|
|
{
|
4214 |
|
|
HOST_WIDE_INT size = GET_MODE_SIZE (mode);
|
4215 |
|
|
rtx offset = GEN_INT (INTVAL (operands[2]) * size);
|
4216 |
|
|
operands[3] = gen_reg_rtx (TImode);
|
4217 |
|
|
operands[4] = stack_pointer_rtx;
|
4218 |
|
|
operands[5] = offset;
|
4219 |
|
|
operands[6] = GEN_INT (size);
|
4220 |
|
|
})
|
4221 |
|
|
|
4222 |
|
|
(define_expand "vec_extract"
|
4223 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
4224 |
|
|
(vec_select: (match_operand:V 1 "spu_reg_operand" "r")
|
4225 |
|
|
(parallel [(match_operand 2 "const_int_operand" "i")])))]
|
4226 |
|
|
""
|
4227 |
|
|
{
|
4228 |
|
|
if ((INTVAL (operands[2]) * + ) % 16 == 0)
|
4229 |
|
|
{
|
4230 |
|
|
emit_insn (gen_spu_convert (operands[0], operands[1]));
|
4231 |
|
|
DONE;
|
4232 |
|
|
}
|
4233 |
|
|
})
|
4234 |
|
|
|
4235 |
|
|
(define_insn "_vec_extract"
|
4236 |
|
|
[(set (match_operand: 0 "spu_reg_operand" "=r")
|
4237 |
|
|
(vec_select: (match_operand:V 1 "spu_reg_operand" "r")
|
4238 |
|
|
(parallel [(match_operand 2 "const_int_operand" "i")])))]
|
4239 |
|
|
""
|
4240 |
|
|
"rotqbyi\t%0,%1,(%2*+)%%16"
|
4241 |
|
|
[(set_attr "type" "shuf")])
|
4242 |
|
|
|
4243 |
|
|
(define_insn "_vec_extractv8hi_ze"
|
4244 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=r")
|
4245 |
|
|
(zero_extend:SI (vec_select:HI (match_operand:V8HI 1 "spu_reg_operand" "r")
|
4246 |
|
|
(parallel [(const_int 0)]))))]
|
4247 |
|
|
""
|
4248 |
|
|
"rotqmbyi\t%0,%1,-2"
|
4249 |
|
|
[(set_attr "type" "shuf")])
|
4250 |
|
|
|
4251 |
|
|
|
4252 |
|
|
;; misc
|
4253 |
|
|
|
4254 |
|
|
(define_expand "shufb"
|
4255 |
|
|
[(set (match_operand 0 "spu_reg_operand" "")
|
4256 |
|
|
(unspec [(match_operand 1 "spu_reg_operand" "")
|
4257 |
|
|
(match_operand 2 "spu_reg_operand" "")
|
4258 |
|
|
(match_operand:TI 3 "spu_reg_operand" "")] UNSPEC_SHUFB))]
|
4259 |
|
|
""
|
4260 |
|
|
{
|
4261 |
|
|
rtx s = gen__shufb (operands[0], operands[1], operands[2], operands[3]);
|
4262 |
|
|
PUT_MODE (SET_SRC (s), GET_MODE (operands[0]));
|
4263 |
|
|
emit_insn (s);
|
4264 |
|
|
DONE;
|
4265 |
|
|
})
|
4266 |
|
|
|
4267 |
|
|
(define_insn "_shufb"
|
4268 |
|
|
[(set (match_operand 0 "spu_reg_operand" "=r")
|
4269 |
|
|
(unspec [(match_operand 1 "spu_reg_operand" "r")
|
4270 |
|
|
(match_operand 2 "spu_reg_operand" "r")
|
4271 |
|
|
(match_operand:TI 3 "spu_reg_operand" "r")] UNSPEC_SHUFB))]
|
4272 |
|
|
"operands"
|
4273 |
|
|
"shufb\t%0,%1,%2,%3"
|
4274 |
|
|
[(set_attr "type" "shuf")])
|
4275 |
|
|
|
4276 |
|
|
(define_insn "nop"
|
4277 |
|
|
[(unspec_volatile [(const_int 0)] UNSPEC_NOP)]
|
4278 |
|
|
""
|
4279 |
|
|
"nop"
|
4280 |
|
|
[(set_attr "type" "nop")])
|
4281 |
|
|
|
4282 |
|
|
(define_insn "nopn"
|
4283 |
|
|
[(unspec_volatile [(match_operand:SI 0 "immediate_operand" "K")] UNSPEC_NOP)]
|
4284 |
|
|
""
|
4285 |
|
|
"nop\t%0"
|
4286 |
|
|
[(set_attr "type" "nop")])
|
4287 |
|
|
|
4288 |
|
|
(define_insn "lnop"
|
4289 |
|
|
[(unspec_volatile [(const_int 0)] UNSPEC_LNOP)]
|
4290 |
|
|
""
|
4291 |
|
|
"lnop"
|
4292 |
|
|
[(set_attr "type" "lnop")])
|
4293 |
|
|
|
4294 |
|
|
;; The operand is so we know why we generated this hbrp.
|
4295 |
|
|
;; We clobber mem to make sure it isn't moved over any
|
4296 |
|
|
;; loads, stores or calls while scheduling.
|
4297 |
|
|
(define_insn "iprefetch"
|
4298 |
|
|
[(unspec [(match_operand:SI 0 "const_int_operand" "n")] UNSPEC_IPREFETCH)
|
4299 |
|
|
(clobber (mem:BLK (scratch)))]
|
4300 |
|
|
""
|
4301 |
|
|
"hbrp\t# %0"
|
4302 |
|
|
[(set_attr "type" "iprefetch")])
|
4303 |
|
|
|
4304 |
|
|
;; A non-volatile version so it gets scheduled
|
4305 |
|
|
(define_insn "nopn_nv"
|
4306 |
|
|
[(unspec [(match_operand:SI 0 "register_operand" "r")] UNSPEC_NOP)]
|
4307 |
|
|
""
|
4308 |
|
|
"nop\t%0"
|
4309 |
|
|
[(set_attr "type" "nop")])
|
4310 |
|
|
|
4311 |
|
|
(define_insn "hbr"
|
4312 |
|
|
[(set (reg:SI 130)
|
4313 |
|
|
(unspec:SI [(match_operand:SI 0 "immediate_operand" "i,i,i")
|
4314 |
|
|
(match_operand:SI 1 "nonmemory_operand" "r,s,i")] UNSPEC_HBR))
|
4315 |
|
|
(unspec [(const_int 0)] UNSPEC_HBR)]
|
4316 |
|
|
""
|
4317 |
|
|
"@
|
4318 |
|
|
hbr\t%0,%1
|
4319 |
|
|
hbrr\t%0,%1
|
4320 |
|
|
hbra\t%0,%1"
|
4321 |
|
|
[(set_attr "type" "hbr")])
|
4322 |
|
|
|
4323 |
|
|
(define_insn "sync"
|
4324 |
|
|
[(unspec_volatile [(const_int 0)] UNSPEC_SYNC)
|
4325 |
|
|
(clobber (mem:BLK (scratch)))]
|
4326 |
|
|
""
|
4327 |
|
|
"sync"
|
4328 |
|
|
[(set_attr "type" "br")])
|
4329 |
|
|
|
4330 |
|
|
(define_insn "syncc"
|
4331 |
|
|
[(unspec_volatile [(const_int 1)] UNSPEC_SYNC)
|
4332 |
|
|
(clobber (mem:BLK (scratch)))]
|
4333 |
|
|
""
|
4334 |
|
|
"syncc"
|
4335 |
|
|
[(set_attr "type" "br")])
|
4336 |
|
|
|
4337 |
|
|
(define_insn "dsync"
|
4338 |
|
|
[(unspec_volatile [(const_int 2)] UNSPEC_SYNC)
|
4339 |
|
|
(clobber (mem:BLK (scratch)))]
|
4340 |
|
|
""
|
4341 |
|
|
"dsync"
|
4342 |
|
|
[(set_attr "type" "br")])
|
4343 |
|
|
|
4344 |
|
|
|
4345 |
|
|
|
4346 |
|
|
;; Define the subtract-one-and-jump insns so loop.c
|
4347 |
|
|
;; knows what to generate.
|
4348 |
|
|
(define_expand "doloop_end"
|
4349 |
|
|
[(use (match_operand 0 "" "")) ; loop pseudo
|
4350 |
|
|
(use (match_operand 1 "" "")) ; iterations; zero if unknown
|
4351 |
|
|
(use (match_operand 2 "" "")) ; max iterations
|
4352 |
|
|
(use (match_operand 3 "" "")) ; loop level
|
4353 |
|
|
(use (match_operand 4 "" ""))] ; label
|
4354 |
|
|
""
|
4355 |
|
|
"
|
4356 |
|
|
{
|
4357 |
|
|
/* Currently SMS relies on the do-loop pattern to recognize loops
|
4358 |
|
|
where (1) the control part comprises of all insns defining and/or
|
4359 |
|
|
using a certain 'count' register and (2) the loop count can be
|
4360 |
|
|
adjusted by modifying this register prior to the loop.
|
4361 |
|
|
. ??? The possible introduction of a new block to initialize the
|
4362 |
|
|
new IV can potentially effects branch optimizations. */
|
4363 |
|
|
if (optimize > 0 && flag_modulo_sched)
|
4364 |
|
|
{
|
4365 |
|
|
rtx s0;
|
4366 |
|
|
rtx bcomp;
|
4367 |
|
|
rtx loc_ref;
|
4368 |
|
|
|
4369 |
|
|
/* Only use this on innermost loops. */
|
4370 |
|
|
if (INTVAL (operands[3]) > 1)
|
4371 |
|
|
FAIL;
|
4372 |
|
|
if (GET_MODE (operands[0]) != SImode)
|
4373 |
|
|
FAIL;
|
4374 |
|
|
|
4375 |
|
|
s0 = operands [0];
|
4376 |
|
|
emit_move_insn (s0, gen_rtx_PLUS (SImode, s0, GEN_INT (-1)));
|
4377 |
|
|
bcomp = gen_rtx_NE(SImode, s0, const0_rtx);
|
4378 |
|
|
loc_ref = gen_rtx_LABEL_REF (VOIDmode, operands [4]);
|
4379 |
|
|
emit_jump_insn (gen_rtx_SET (VOIDmode, pc_rtx,
|
4380 |
|
|
gen_rtx_IF_THEN_ELSE (VOIDmode, bcomp,
|
4381 |
|
|
loc_ref, pc_rtx)));
|
4382 |
|
|
|
4383 |
|
|
DONE;
|
4384 |
|
|
}else
|
4385 |
|
|
FAIL;
|
4386 |
|
|
}")
|
4387 |
|
|
|
4388 |
|
|
;; convert between any two modes, avoiding any GCC assumptions
|
4389 |
|
|
(define_expand "spu_convert"
|
4390 |
|
|
[(set (match_operand 0 "spu_reg_operand" "")
|
4391 |
|
|
(unspec [(match_operand 1 "spu_reg_operand" "")] UNSPEC_CONVERT))]
|
4392 |
|
|
""
|
4393 |
|
|
{
|
4394 |
|
|
rtx c = gen__spu_convert (operands[0], operands[1]);
|
4395 |
|
|
PUT_MODE (SET_SRC (c), GET_MODE (operands[0]));
|
4396 |
|
|
emit_insn (c);
|
4397 |
|
|
DONE;
|
4398 |
|
|
})
|
4399 |
|
|
|
4400 |
|
|
(define_insn_and_split "_spu_convert"
|
4401 |
|
|
[(set (match_operand 0 "spu_reg_operand" "=r")
|
4402 |
|
|
(unspec [(match_operand 1 "spu_reg_operand" "0")] UNSPEC_CONVERT))]
|
4403 |
|
|
""
|
4404 |
|
|
"#"
|
4405 |
|
|
"reload_completed"
|
4406 |
|
|
[(const_int 0)]
|
4407 |
|
|
{
|
4408 |
|
|
spu_split_convert (operands);
|
4409 |
|
|
DONE;
|
4410 |
|
|
}
|
4411 |
|
|
[(set_attr "type" "convert")
|
4412 |
|
|
(set_attr "length" "0")])
|
4413 |
|
|
|
4414 |
|
|
|
4415 |
|
|
;;
|
4416 |
|
|
(include "spu-builtins.md")
|
4417 |
|
|
|
4418 |
|
|
|
4419 |
|
|
(define_expand "smaxv4sf3"
|
4420 |
|
|
[(set (match_operand:V4SF 0 "register_operand" "=r")
|
4421 |
|
|
(smax:V4SF (match_operand:V4SF 1 "register_operand" "r")
|
4422 |
|
|
(match_operand:V4SF 2 "register_operand" "r")))]
|
4423 |
|
|
""
|
4424 |
|
|
"
|
4425 |
|
|
{
|
4426 |
|
|
rtx mask = gen_reg_rtx (V4SImode);
|
4427 |
|
|
|
4428 |
|
|
emit_insn (gen_cgt_v4sf (mask, operands[1], operands[2]));
|
4429 |
|
|
emit_insn (gen_selb (operands[0], operands[2], operands[1], mask));
|
4430 |
|
|
DONE;
|
4431 |
|
|
}")
|
4432 |
|
|
|
4433 |
|
|
(define_expand "sminv4sf3"
|
4434 |
|
|
[(set (match_operand:V4SF 0 "register_operand" "=r")
|
4435 |
|
|
(smin:V4SF (match_operand:V4SF 1 "register_operand" "r")
|
4436 |
|
|
(match_operand:V4SF 2 "register_operand" "r")))]
|
4437 |
|
|
""
|
4438 |
|
|
"
|
4439 |
|
|
{
|
4440 |
|
|
rtx mask = gen_reg_rtx (V4SImode);
|
4441 |
|
|
|
4442 |
|
|
emit_insn (gen_cgt_v4sf (mask, operands[1], operands[2]));
|
4443 |
|
|
emit_insn (gen_selb (operands[0], operands[1], operands[2], mask));
|
4444 |
|
|
DONE;
|
4445 |
|
|
}")
|
4446 |
|
|
|
4447 |
|
|
(define_expand "smaxv2df3"
|
4448 |
|
|
[(set (match_operand:V2DF 0 "register_operand" "=r")
|
4449 |
|
|
(smax:V2DF (match_operand:V2DF 1 "register_operand" "r")
|
4450 |
|
|
(match_operand:V2DF 2 "register_operand" "r")))]
|
4451 |
|
|
""
|
4452 |
|
|
"
|
4453 |
|
|
{
|
4454 |
|
|
rtx mask = gen_reg_rtx (V2DImode);
|
4455 |
|
|
emit_insn (gen_cgt_v2df (mask, operands[1], operands[2]));
|
4456 |
|
|
emit_insn (gen_selb (operands[0], operands[2], operands[1],
|
4457 |
|
|
spu_gen_subreg (V4SImode, mask)));
|
4458 |
|
|
DONE;
|
4459 |
|
|
}")
|
4460 |
|
|
|
4461 |
|
|
(define_expand "sminv2df3"
|
4462 |
|
|
[(set (match_operand:V2DF 0 "register_operand" "=r")
|
4463 |
|
|
(smin:V2DF (match_operand:V2DF 1 "register_operand" "r")
|
4464 |
|
|
(match_operand:V2DF 2 "register_operand" "r")))]
|
4465 |
|
|
""
|
4466 |
|
|
"
|
4467 |
|
|
{
|
4468 |
|
|
rtx mask = gen_reg_rtx (V2DImode);
|
4469 |
|
|
emit_insn (gen_cgt_v2df (mask, operands[1], operands[2]));
|
4470 |
|
|
emit_insn (gen_selb (operands[0], operands[1], operands[2],
|
4471 |
|
|
spu_gen_subreg (V4SImode, mask)));
|
4472 |
|
|
DONE;
|
4473 |
|
|
}")
|
4474 |
|
|
|
4475 |
|
|
(define_expand "vec_widen_umult_hi_v8hi"
|
4476 |
|
|
[(set (match_operand:V4SI 0 "register_operand" "=r")
|
4477 |
|
|
(mult:V4SI
|
4478 |
|
|
(zero_extend:V4SI
|
4479 |
|
|
(vec_select:V4HI
|
4480 |
|
|
(match_operand:V8HI 1 "register_operand" "r")
|
4481 |
|
|
(parallel [(const_int 0)(const_int 1)(const_int 2)(const_int 3)])))
|
4482 |
|
|
(zero_extend:V4SI
|
4483 |
|
|
(vec_select:V4HI
|
4484 |
|
|
(match_operand:V8HI 2 "register_operand" "r")
|
4485 |
|
|
(parallel [(const_int 0)(const_int 1)(const_int 2)(const_int 3)])))))]
|
4486 |
|
|
""
|
4487 |
|
|
"
|
4488 |
|
|
{
|
4489 |
|
|
rtx ve = gen_reg_rtx (V4SImode);
|
4490 |
|
|
rtx vo = gen_reg_rtx (V4SImode);
|
4491 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4492 |
|
|
unsigned char arr[16] = {
|
4493 |
|
|
0x00, 0x01, 0x02, 0x03, 0x10, 0x11, 0x12, 0x13,
|
4494 |
|
|
0x04, 0x05, 0x06, 0x07, 0x14, 0x15, 0x16, 0x17};
|
4495 |
|
|
|
4496 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4497 |
|
|
emit_insn (gen_spu_mpyhhu (ve, operands[1], operands[2]));
|
4498 |
|
|
emit_insn (gen_spu_mpyu (vo, operands[1], operands[2]));
|
4499 |
|
|
emit_insn (gen_shufb (operands[0], ve, vo, mask));
|
4500 |
|
|
DONE;
|
4501 |
|
|
}")
|
4502 |
|
|
|
4503 |
|
|
(define_expand "vec_widen_umult_lo_v8hi"
|
4504 |
|
|
[(set (match_operand:V4SI 0 "register_operand" "=r")
|
4505 |
|
|
(mult:V4SI
|
4506 |
|
|
(zero_extend:V4SI
|
4507 |
|
|
(vec_select:V4HI
|
4508 |
|
|
(match_operand:V8HI 1 "register_operand" "r")
|
4509 |
|
|
(parallel [(const_int 4)(const_int 5)(const_int 6)(const_int 7)])))
|
4510 |
|
|
(zero_extend:V4SI
|
4511 |
|
|
(vec_select:V4HI
|
4512 |
|
|
(match_operand:V8HI 2 "register_operand" "r")
|
4513 |
|
|
(parallel [(const_int 4)(const_int 5)(const_int 6)(const_int 7)])))))]
|
4514 |
|
|
""
|
4515 |
|
|
"
|
4516 |
|
|
{
|
4517 |
|
|
rtx ve = gen_reg_rtx (V4SImode);
|
4518 |
|
|
rtx vo = gen_reg_rtx (V4SImode);
|
4519 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4520 |
|
|
unsigned char arr[16] = {
|
4521 |
|
|
0x08, 0x09, 0x0A, 0x0B, 0x18, 0x19, 0x1A, 0x1B,
|
4522 |
|
|
0x0C, 0x0D, 0x0E, 0x0F, 0x1C, 0x1D, 0x1E, 0x1F};
|
4523 |
|
|
|
4524 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4525 |
|
|
emit_insn (gen_spu_mpyhhu (ve, operands[1], operands[2]));
|
4526 |
|
|
emit_insn (gen_spu_mpyu (vo, operands[1], operands[2]));
|
4527 |
|
|
emit_insn (gen_shufb (operands[0], ve, vo, mask));
|
4528 |
|
|
DONE;
|
4529 |
|
|
}")
|
4530 |
|
|
|
4531 |
|
|
(define_expand "vec_widen_smult_hi_v8hi"
|
4532 |
|
|
[(set (match_operand:V4SI 0 "register_operand" "=r")
|
4533 |
|
|
(mult:V4SI
|
4534 |
|
|
(sign_extend:V4SI
|
4535 |
|
|
(vec_select:V4HI
|
4536 |
|
|
(match_operand:V8HI 1 "register_operand" "r")
|
4537 |
|
|
(parallel [(const_int 0)(const_int 1)(const_int 2)(const_int 3)])))
|
4538 |
|
|
(sign_extend:V4SI
|
4539 |
|
|
(vec_select:V4HI
|
4540 |
|
|
(match_operand:V8HI 2 "register_operand" "r")
|
4541 |
|
|
(parallel [(const_int 0)(const_int 1)(const_int 2)(const_int 3)])))))]
|
4542 |
|
|
""
|
4543 |
|
|
"
|
4544 |
|
|
{
|
4545 |
|
|
rtx ve = gen_reg_rtx (V4SImode);
|
4546 |
|
|
rtx vo = gen_reg_rtx (V4SImode);
|
4547 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4548 |
|
|
unsigned char arr[16] = {
|
4549 |
|
|
0x00, 0x01, 0x02, 0x03, 0x10, 0x11, 0x12, 0x13,
|
4550 |
|
|
0x04, 0x05, 0x06, 0x07, 0x14, 0x15, 0x16, 0x17};
|
4551 |
|
|
|
4552 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4553 |
|
|
emit_insn (gen_spu_mpyhh (ve, operands[1], operands[2]));
|
4554 |
|
|
emit_insn (gen_spu_mpy (vo, operands[1], operands[2]));
|
4555 |
|
|
emit_insn (gen_shufb (operands[0], ve, vo, mask));
|
4556 |
|
|
DONE;
|
4557 |
|
|
}")
|
4558 |
|
|
|
4559 |
|
|
(define_expand "vec_widen_smult_lo_v8hi"
|
4560 |
|
|
[(set (match_operand:V4SI 0 "register_operand" "=r")
|
4561 |
|
|
(mult:V4SI
|
4562 |
|
|
(sign_extend:V4SI
|
4563 |
|
|
(vec_select:V4HI
|
4564 |
|
|
(match_operand:V8HI 1 "register_operand" "r")
|
4565 |
|
|
(parallel [(const_int 4)(const_int 5)(const_int 6)(const_int 7)])))
|
4566 |
|
|
(sign_extend:V4SI
|
4567 |
|
|
(vec_select:V4HI
|
4568 |
|
|
(match_operand:V8HI 2 "register_operand" "r")
|
4569 |
|
|
(parallel [(const_int 4)(const_int 5)(const_int 6)(const_int 7)])))))]
|
4570 |
|
|
""
|
4571 |
|
|
"
|
4572 |
|
|
{
|
4573 |
|
|
rtx ve = gen_reg_rtx (V4SImode);
|
4574 |
|
|
rtx vo = gen_reg_rtx (V4SImode);
|
4575 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4576 |
|
|
unsigned char arr[16] = {
|
4577 |
|
|
0x08, 0x09, 0x0A, 0x0B, 0x18, 0x19, 0x1A, 0x1B,
|
4578 |
|
|
0x0C, 0x0D, 0x0E, 0x0F, 0x1C, 0x1D, 0x1E, 0x1F};
|
4579 |
|
|
|
4580 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4581 |
|
|
emit_insn (gen_spu_mpyhh (ve, operands[1], operands[2]));
|
4582 |
|
|
emit_insn (gen_spu_mpy (vo, operands[1], operands[2]));
|
4583 |
|
|
emit_insn (gen_shufb (operands[0], ve, vo, mask));
|
4584 |
|
|
DONE;
|
4585 |
|
|
}")
|
4586 |
|
|
|
4587 |
|
|
(define_expand "vec_realign_load_"
|
4588 |
|
|
[(set (match_operand:ALL 0 "register_operand" "=r")
|
4589 |
|
|
(unspec:ALL [(match_operand:ALL 1 "register_operand" "r")
|
4590 |
|
|
(match_operand:ALL 2 "register_operand" "r")
|
4591 |
|
|
(match_operand:TI 3 "register_operand" "r")] UNSPEC_SPU_REALIGN_LOAD))]
|
4592 |
|
|
""
|
4593 |
|
|
"
|
4594 |
|
|
{
|
4595 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], operands[3]));
|
4596 |
|
|
DONE;
|
4597 |
|
|
}")
|
4598 |
|
|
|
4599 |
|
|
(define_expand "spu_lvsr"
|
4600 |
|
|
[(set (match_operand:V16QI 0 "register_operand" "")
|
4601 |
|
|
(unspec:V16QI [(match_operand 1 "memory_operand" "")] UNSPEC_SPU_MASK_FOR_LOAD))]
|
4602 |
|
|
""
|
4603 |
|
|
"
|
4604 |
|
|
{
|
4605 |
|
|
rtx addr;
|
4606 |
|
|
rtx offset = gen_reg_rtx (V8HImode);
|
4607 |
|
|
rtx addr_bits = gen_reg_rtx (SImode);
|
4608 |
|
|
rtx addr_bits_vec = gen_reg_rtx (V8HImode);
|
4609 |
|
|
rtx splatqi = gen_reg_rtx (TImode);
|
4610 |
|
|
rtx result = gen_reg_rtx (V8HImode);
|
4611 |
|
|
unsigned char arr[16] = {
|
4612 |
|
|
0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
|
4613 |
|
|
0x18, 0x19, 0x1A, 0x1B, 0x1C, 0x1D, 0x1E, 0x1F};
|
4614 |
|
|
unsigned char arr2[16] = {
|
4615 |
|
|
0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03,
|
4616 |
|
|
0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03};
|
4617 |
|
|
|
4618 |
|
|
emit_move_insn (offset, array_to_constant (V8HImode, arr));
|
4619 |
|
|
emit_move_insn (splatqi, array_to_constant (TImode, arr2));
|
4620 |
|
|
|
4621 |
|
|
gcc_assert (GET_CODE (operands[1]) == MEM);
|
4622 |
|
|
addr = force_reg (Pmode, XEXP (operands[1], 0));
|
4623 |
|
|
emit_insn (gen_andsi3 (addr_bits, addr, GEN_INT (0xF)));
|
4624 |
|
|
emit_insn (gen_shufb (addr_bits_vec, addr_bits, addr_bits, splatqi));
|
4625 |
|
|
|
4626 |
|
|
/* offset - (addr & 0xF)
|
4627 |
|
|
It is safe to use a single sfh, because each byte of offset is > 15 and
|
4628 |
|
|
each byte of addr is <= 15. */
|
4629 |
|
|
emit_insn (gen_subv8hi3 (result, offset, addr_bits_vec));
|
4630 |
|
|
|
4631 |
|
|
result = simplify_gen_subreg (V16QImode, result, V8HImode, 0);
|
4632 |
|
|
emit_move_insn (operands[0], result);
|
4633 |
|
|
|
4634 |
|
|
DONE;
|
4635 |
|
|
}")
|
4636 |
|
|
|
4637 |
|
|
(define_expand "vec_unpacku_hi_v8hi"
|
4638 |
|
|
[(set (match_operand:V4SI 0 "spu_reg_operand" "=r")
|
4639 |
|
|
(zero_extend:V4SI
|
4640 |
|
|
(vec_select:V4HI
|
4641 |
|
|
(match_operand:V8HI 1 "spu_reg_operand" "r")
|
4642 |
|
|
(parallel [(const_int 0)(const_int 1)(const_int 2)(const_int 3)]))))]
|
4643 |
|
|
""
|
4644 |
|
|
{
|
4645 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4646 |
|
|
unsigned char arr[16] = {
|
4647 |
|
|
0x80, 0x80, 0x00, 0x01, 0x80, 0x80, 0x02, 0x03,
|
4648 |
|
|
0x80, 0x80, 0x04, 0x05, 0x80, 0x80, 0x06, 0x07};
|
4649 |
|
|
|
4650 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4651 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[1], mask));
|
4652 |
|
|
|
4653 |
|
|
DONE;
|
4654 |
|
|
})
|
4655 |
|
|
|
4656 |
|
|
(define_expand "vec_unpacku_lo_v8hi"
|
4657 |
|
|
[(set (match_operand:V4SI 0 "spu_reg_operand" "=r")
|
4658 |
|
|
(zero_extend:V4SI
|
4659 |
|
|
(vec_select:V4HI
|
4660 |
|
|
(match_operand:V8HI 1 "spu_reg_operand" "r")
|
4661 |
|
|
(parallel [(const_int 4)(const_int 5)(const_int 6)(const_int 7)]))))]
|
4662 |
|
|
""
|
4663 |
|
|
{
|
4664 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4665 |
|
|
unsigned char arr[16] = {
|
4666 |
|
|
0x80, 0x80, 0x08, 0x09, 0x80, 0x80, 0x0A, 0x0B,
|
4667 |
|
|
0x80, 0x80, 0x0C, 0x0D, 0x80, 0x80, 0x0E, 0x0F};
|
4668 |
|
|
|
4669 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4670 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[1], mask));
|
4671 |
|
|
|
4672 |
|
|
DONE;
|
4673 |
|
|
})
|
4674 |
|
|
|
4675 |
|
|
(define_expand "vec_unpacks_hi_v8hi"
|
4676 |
|
|
[(set (match_operand:V4SI 0 "spu_reg_operand" "=r")
|
4677 |
|
|
(sign_extend:V4SI
|
4678 |
|
|
(vec_select:V4HI
|
4679 |
|
|
(match_operand:V8HI 1 "spu_reg_operand" "r")
|
4680 |
|
|
(parallel [(const_int 0)(const_int 1)(const_int 2)(const_int 3)]))))]
|
4681 |
|
|
""
|
4682 |
|
|
{
|
4683 |
|
|
rtx tmp1 = gen_reg_rtx (V8HImode);
|
4684 |
|
|
rtx tmp2 = gen_reg_rtx (V4SImode);
|
4685 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4686 |
|
|
unsigned char arr[16] = {
|
4687 |
|
|
0x80, 0x80, 0x00, 0x01, 0x80, 0x80, 0x02, 0x03,
|
4688 |
|
|
0x80, 0x80, 0x04, 0x05, 0x80, 0x80, 0x06, 0x07};
|
4689 |
|
|
|
4690 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4691 |
|
|
emit_insn (gen_shufb (tmp1, operands[1], operands[1], mask));
|
4692 |
|
|
emit_insn (gen_spu_xshw (tmp2, tmp1));
|
4693 |
|
|
emit_move_insn (operands[0], tmp2);
|
4694 |
|
|
|
4695 |
|
|
DONE;
|
4696 |
|
|
})
|
4697 |
|
|
|
4698 |
|
|
(define_expand "vec_unpacks_lo_v8hi"
|
4699 |
|
|
[(set (match_operand:V4SI 0 "spu_reg_operand" "=r")
|
4700 |
|
|
(sign_extend:V4SI
|
4701 |
|
|
(vec_select:V4HI
|
4702 |
|
|
(match_operand:V8HI 1 "spu_reg_operand" "r")
|
4703 |
|
|
(parallel [(const_int 4)(const_int 5)(const_int 6)(const_int 7)]))))]
|
4704 |
|
|
""
|
4705 |
|
|
{
|
4706 |
|
|
rtx tmp1 = gen_reg_rtx (V8HImode);
|
4707 |
|
|
rtx tmp2 = gen_reg_rtx (V4SImode);
|
4708 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4709 |
|
|
unsigned char arr[16] = {
|
4710 |
|
|
0x80, 0x80, 0x08, 0x09, 0x80, 0x80, 0x0A, 0x0B,
|
4711 |
|
|
0x80, 0x80, 0x0C, 0x0D, 0x80, 0x80, 0x0E, 0x0F};
|
4712 |
|
|
|
4713 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4714 |
|
|
emit_insn (gen_shufb (tmp1, operands[1], operands[1], mask));
|
4715 |
|
|
emit_insn (gen_spu_xshw (tmp2, tmp1));
|
4716 |
|
|
emit_move_insn (operands[0], tmp2);
|
4717 |
|
|
|
4718 |
|
|
DONE;
|
4719 |
|
|
})
|
4720 |
|
|
|
4721 |
|
|
(define_expand "vec_unpacku_hi_v16qi"
|
4722 |
|
|
[(set (match_operand:V8HI 0 "spu_reg_operand" "=r")
|
4723 |
|
|
(zero_extend:V8HI
|
4724 |
|
|
(vec_select:V8QI
|
4725 |
|
|
(match_operand:V16QI 1 "spu_reg_operand" "r")
|
4726 |
|
|
(parallel [(const_int 0)(const_int 1)(const_int 2)(const_int 3)
|
4727 |
|
|
(const_int 4)(const_int 5)(const_int 6)(const_int 7)]))))]
|
4728 |
|
|
""
|
4729 |
|
|
{
|
4730 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4731 |
|
|
unsigned char arr[16] = {
|
4732 |
|
|
0x80, 0x00, 0x80, 0x01, 0x80, 0x02, 0x80, 0x03,
|
4733 |
|
|
0x80, 0x04, 0x80, 0x05, 0x80, 0x06, 0x80, 0x07};
|
4734 |
|
|
|
4735 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4736 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[1], mask));
|
4737 |
|
|
|
4738 |
|
|
DONE;
|
4739 |
|
|
})
|
4740 |
|
|
|
4741 |
|
|
(define_expand "vec_unpacku_lo_v16qi"
|
4742 |
|
|
[(set (match_operand:V8HI 0 "spu_reg_operand" "=r")
|
4743 |
|
|
(zero_extend:V8HI
|
4744 |
|
|
(vec_select:V8QI
|
4745 |
|
|
(match_operand:V16QI 1 "spu_reg_operand" "r")
|
4746 |
|
|
(parallel [(const_int 8)(const_int 9)(const_int 10)(const_int 11)
|
4747 |
|
|
(const_int 12)(const_int 13)(const_int 14)(const_int 15)]))))]
|
4748 |
|
|
""
|
4749 |
|
|
{
|
4750 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4751 |
|
|
unsigned char arr[16] = {
|
4752 |
|
|
0x80, 0x08, 0x80, 0x09, 0x80, 0x0A, 0x80, 0x0B,
|
4753 |
|
|
0x80, 0x0C, 0x80, 0x0D, 0x80, 0x0E, 0x80, 0x0F};
|
4754 |
|
|
|
4755 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4756 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[1], mask));
|
4757 |
|
|
|
4758 |
|
|
DONE;
|
4759 |
|
|
})
|
4760 |
|
|
|
4761 |
|
|
(define_expand "vec_unpacks_hi_v16qi"
|
4762 |
|
|
[(set (match_operand:V8HI 0 "spu_reg_operand" "=r")
|
4763 |
|
|
(sign_extend:V8HI
|
4764 |
|
|
(vec_select:V8QI
|
4765 |
|
|
(match_operand:V16QI 1 "spu_reg_operand" "r")
|
4766 |
|
|
(parallel [(const_int 0)(const_int 1)(const_int 2)(const_int 3)
|
4767 |
|
|
(const_int 4)(const_int 5)(const_int 6)(const_int 7)]))))]
|
4768 |
|
|
""
|
4769 |
|
|
{
|
4770 |
|
|
rtx tmp1 = gen_reg_rtx (V16QImode);
|
4771 |
|
|
rtx tmp2 = gen_reg_rtx (V8HImode);
|
4772 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4773 |
|
|
unsigned char arr[16] = {
|
4774 |
|
|
0x80, 0x00, 0x80, 0x01, 0x80, 0x02, 0x80, 0x03,
|
4775 |
|
|
0x80, 0x04, 0x80, 0x05, 0x80, 0x06, 0x80, 0x07};
|
4776 |
|
|
|
4777 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4778 |
|
|
emit_insn (gen_shufb (tmp1, operands[1], operands[1], mask));
|
4779 |
|
|
emit_insn (gen_spu_xsbh (tmp2, tmp1));
|
4780 |
|
|
emit_move_insn (operands[0], tmp2);
|
4781 |
|
|
|
4782 |
|
|
DONE;
|
4783 |
|
|
})
|
4784 |
|
|
|
4785 |
|
|
(define_expand "vec_unpacks_lo_v16qi"
|
4786 |
|
|
[(set (match_operand:V8HI 0 "spu_reg_operand" "=r")
|
4787 |
|
|
(sign_extend:V8HI
|
4788 |
|
|
(vec_select:V8QI
|
4789 |
|
|
(match_operand:V16QI 1 "spu_reg_operand" "r")
|
4790 |
|
|
(parallel [(const_int 8)(const_int 9)(const_int 10)(const_int 11)
|
4791 |
|
|
(const_int 12)(const_int 13)(const_int 14)(const_int 15)]))))]
|
4792 |
|
|
""
|
4793 |
|
|
{
|
4794 |
|
|
rtx tmp1 = gen_reg_rtx (V16QImode);
|
4795 |
|
|
rtx tmp2 = gen_reg_rtx (V8HImode);
|
4796 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4797 |
|
|
unsigned char arr[16] = {
|
4798 |
|
|
0x80, 0x08, 0x80, 0x09, 0x80, 0x0A, 0x80, 0x0B,
|
4799 |
|
|
0x80, 0x0C, 0x80, 0x0D, 0x80, 0x0E, 0x80, 0x0F};
|
4800 |
|
|
|
4801 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4802 |
|
|
emit_insn (gen_shufb (tmp1, operands[1], operands[1], mask));
|
4803 |
|
|
emit_insn (gen_spu_xsbh (tmp2, tmp1));
|
4804 |
|
|
emit_move_insn (operands[0], tmp2);
|
4805 |
|
|
|
4806 |
|
|
DONE;
|
4807 |
|
|
})
|
4808 |
|
|
|
4809 |
|
|
|
4810 |
|
|
(define_expand "vec_extract_evenv4si"
|
4811 |
|
|
[(set (match_operand:V4SI 0 "spu_reg_operand" "=r")
|
4812 |
|
|
(vec_concat:V4SI
|
4813 |
|
|
(vec_select:V2SI
|
4814 |
|
|
(match_operand:V4SI 1 "spu_reg_operand" "r")
|
4815 |
|
|
(parallel [(const_int 0)(const_int 2)]))
|
4816 |
|
|
(vec_select:V2SI
|
4817 |
|
|
(match_operand:V4SI 2 "spu_reg_operand" "r")
|
4818 |
|
|
(parallel [(const_int 0)(const_int 2)]))))]
|
4819 |
|
|
|
4820 |
|
|
""
|
4821 |
|
|
"
|
4822 |
|
|
{
|
4823 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4824 |
|
|
unsigned char arr[16] = {
|
4825 |
|
|
0x00, 0x01, 0x02, 0x03,
|
4826 |
|
|
0x08, 0x09, 0x0A, 0x0B,
|
4827 |
|
|
0x10, 0x11, 0x12, 0x13,
|
4828 |
|
|
0x18, 0x19, 0x1A, 0x1B};
|
4829 |
|
|
|
4830 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4831 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
4832 |
|
|
DONE;
|
4833 |
|
|
}")
|
4834 |
|
|
|
4835 |
|
|
|
4836 |
|
|
(define_expand "vec_extract_evenv4sf"
|
4837 |
|
|
[(set (match_operand:V4SF 0 "spu_reg_operand" "=r")
|
4838 |
|
|
(vec_concat:V4SF
|
4839 |
|
|
(vec_select:V2SF
|
4840 |
|
|
(match_operand:V4SF 1 "spu_reg_operand" "r")
|
4841 |
|
|
(parallel [(const_int 0)(const_int 2)]))
|
4842 |
|
|
(vec_select:V2SF
|
4843 |
|
|
(match_operand:V4SF 2 "spu_reg_operand" "r")
|
4844 |
|
|
(parallel [(const_int 0)(const_int 2)]))))]
|
4845 |
|
|
|
4846 |
|
|
""
|
4847 |
|
|
"
|
4848 |
|
|
{
|
4849 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4850 |
|
|
unsigned char arr[16] = {
|
4851 |
|
|
0x00, 0x01, 0x02, 0x03,
|
4852 |
|
|
0x08, 0x09, 0x0A, 0x0B,
|
4853 |
|
|
0x10, 0x11, 0x12, 0x13,
|
4854 |
|
|
0x18, 0x19, 0x1A, 0x1B};
|
4855 |
|
|
|
4856 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4857 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
4858 |
|
|
DONE;
|
4859 |
|
|
}")
|
4860 |
|
|
|
4861 |
|
|
(define_expand "vec_extract_evenv8hi"
|
4862 |
|
|
[(set (match_operand:V8HI 0 "spu_reg_operand" "=r")
|
4863 |
|
|
(vec_concat:V8HI
|
4864 |
|
|
(vec_select:V4HI
|
4865 |
|
|
(match_operand:V8HI 1 "spu_reg_operand" "r")
|
4866 |
|
|
(parallel [(const_int 0)(const_int 2)(const_int 4)(const_int 6)]))
|
4867 |
|
|
(vec_select:V4HI
|
4868 |
|
|
(match_operand:V8HI 2 "spu_reg_operand" "r")
|
4869 |
|
|
(parallel [(const_int 0)(const_int 2)(const_int 4)(const_int 6)]))))]
|
4870 |
|
|
|
4871 |
|
|
""
|
4872 |
|
|
"
|
4873 |
|
|
{
|
4874 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4875 |
|
|
unsigned char arr[16] = {
|
4876 |
|
|
0x00, 0x01, 0x04, 0x05,
|
4877 |
|
|
0x08, 0x09, 0x0C, 0x0D,
|
4878 |
|
|
0x10, 0x11, 0x14, 0x15,
|
4879 |
|
|
0x18, 0x19, 0x1C, 0x1D};
|
4880 |
|
|
|
4881 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4882 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
4883 |
|
|
DONE;
|
4884 |
|
|
}")
|
4885 |
|
|
|
4886 |
|
|
(define_expand "vec_extract_evenv16qi"
|
4887 |
|
|
[(set (match_operand:V16QI 0 "spu_reg_operand" "=r")
|
4888 |
|
|
(vec_concat:V16QI
|
4889 |
|
|
(vec_select:V8QI
|
4890 |
|
|
(match_operand:V16QI 1 "spu_reg_operand" "r")
|
4891 |
|
|
(parallel [(const_int 0)(const_int 2)(const_int 4)(const_int 6)
|
4892 |
|
|
(const_int 8)(const_int 10)(const_int 12)(const_int 14)]))
|
4893 |
|
|
(vec_select:V8QI
|
4894 |
|
|
(match_operand:V16QI 2 "spu_reg_operand" "r")
|
4895 |
|
|
(parallel [(const_int 0)(const_int 2)(const_int 4)(const_int 6)
|
4896 |
|
|
(const_int 8)(const_int 10)(const_int 12)(const_int 14)]))))]
|
4897 |
|
|
|
4898 |
|
|
""
|
4899 |
|
|
"
|
4900 |
|
|
{
|
4901 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4902 |
|
|
unsigned char arr[16] = {
|
4903 |
|
|
0x00, 0x02, 0x04, 0x06,
|
4904 |
|
|
0x08, 0x0A, 0x0C, 0x0E,
|
4905 |
|
|
0x10, 0x12, 0x14, 0x16,
|
4906 |
|
|
0x18, 0x1A, 0x1C, 0x1E};
|
4907 |
|
|
|
4908 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4909 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
4910 |
|
|
DONE;
|
4911 |
|
|
}")
|
4912 |
|
|
|
4913 |
|
|
(define_expand "vec_extract_oddv4si"
|
4914 |
|
|
[(set (match_operand:V4SI 0 "spu_reg_operand" "=r")
|
4915 |
|
|
(vec_concat:V4SI
|
4916 |
|
|
(vec_select:V2SI
|
4917 |
|
|
(match_operand:V4SI 1 "spu_reg_operand" "r")
|
4918 |
|
|
(parallel [(const_int 1)(const_int 3)]))
|
4919 |
|
|
(vec_select:V2SI
|
4920 |
|
|
(match_operand:V4SI 2 "spu_reg_operand" "r")
|
4921 |
|
|
(parallel [(const_int 1)(const_int 3)]))))]
|
4922 |
|
|
|
4923 |
|
|
""
|
4924 |
|
|
"
|
4925 |
|
|
{
|
4926 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4927 |
|
|
unsigned char arr[16] = {
|
4928 |
|
|
0x04, 0x05, 0x06, 0x07,
|
4929 |
|
|
0x0C, 0x0D, 0x0E, 0x0F,
|
4930 |
|
|
0x14, 0x15, 0x16, 0x17,
|
4931 |
|
|
0x1C, 0x1D, 0x1E, 0x1F};
|
4932 |
|
|
|
4933 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4934 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
4935 |
|
|
DONE;
|
4936 |
|
|
}")
|
4937 |
|
|
|
4938 |
|
|
(define_expand "vec_extract_oddv4sf"
|
4939 |
|
|
[(set (match_operand:V4SF 0 "spu_reg_operand" "=r")
|
4940 |
|
|
(vec_concat:V4SF
|
4941 |
|
|
(vec_select:V2SF
|
4942 |
|
|
(match_operand:V4SF 1 "spu_reg_operand" "r")
|
4943 |
|
|
(parallel [(const_int 1)(const_int 3)]))
|
4944 |
|
|
(vec_select:V2SF
|
4945 |
|
|
(match_operand:V4SF 2 "spu_reg_operand" "r")
|
4946 |
|
|
(parallel [(const_int 1)(const_int 3)]))))]
|
4947 |
|
|
|
4948 |
|
|
""
|
4949 |
|
|
"
|
4950 |
|
|
{
|
4951 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4952 |
|
|
unsigned char arr[16] = {
|
4953 |
|
|
0x04, 0x05, 0x06, 0x07,
|
4954 |
|
|
0x0C, 0x0D, 0x0E, 0x0F,
|
4955 |
|
|
0x14, 0x15, 0x16, 0x17,
|
4956 |
|
|
0x1C, 0x1D, 0x1E, 0x1F};
|
4957 |
|
|
|
4958 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4959 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
4960 |
|
|
DONE;
|
4961 |
|
|
}")
|
4962 |
|
|
|
4963 |
|
|
(define_expand "vec_extract_oddv8hi"
|
4964 |
|
|
[(set (match_operand:V8HI 0 "spu_reg_operand" "=r")
|
4965 |
|
|
(vec_concat:V8HI
|
4966 |
|
|
(vec_select:V4HI
|
4967 |
|
|
(match_operand:V8HI 1 "spu_reg_operand" "r")
|
4968 |
|
|
(parallel [(const_int 1)(const_int 3)(const_int 5)(const_int 7)]))
|
4969 |
|
|
(vec_select:V4HI
|
4970 |
|
|
(match_operand:V8HI 2 "spu_reg_operand" "r")
|
4971 |
|
|
(parallel [(const_int 1)(const_int 3)(const_int 5)(const_int 7)]))))]
|
4972 |
|
|
|
4973 |
|
|
""
|
4974 |
|
|
"
|
4975 |
|
|
{
|
4976 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
4977 |
|
|
unsigned char arr[16] = {
|
4978 |
|
|
0x02, 0x03, 0x06, 0x07,
|
4979 |
|
|
0x0A, 0x0B, 0x0E, 0x0F,
|
4980 |
|
|
0x12, 0x13, 0x16, 0x17,
|
4981 |
|
|
0x1A, 0x1B, 0x1E, 0x1F};
|
4982 |
|
|
|
4983 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
4984 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
4985 |
|
|
DONE;
|
4986 |
|
|
}")
|
4987 |
|
|
|
4988 |
|
|
(define_expand "vec_extract_oddv16qi"
|
4989 |
|
|
[(set (match_operand:V16QI 0 "spu_reg_operand" "=r")
|
4990 |
|
|
(vec_concat:V16QI
|
4991 |
|
|
(vec_select:V8QI
|
4992 |
|
|
(match_operand:V16QI 1 "spu_reg_operand" "r")
|
4993 |
|
|
(parallel [(const_int 1)(const_int 3)(const_int 5)(const_int 7)
|
4994 |
|
|
(const_int 9)(const_int 11)(const_int 13)(const_int 15)]))
|
4995 |
|
|
(vec_select:V8QI
|
4996 |
|
|
(match_operand:V16QI 2 "spu_reg_operand" "r")
|
4997 |
|
|
(parallel [(const_int 1)(const_int 3)(const_int 5)(const_int 7)
|
4998 |
|
|
(const_int 9)(const_int 11)(const_int 13)(const_int 15)]))))]
|
4999 |
|
|
|
5000 |
|
|
""
|
5001 |
|
|
"
|
5002 |
|
|
{
|
5003 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
5004 |
|
|
unsigned char arr[16] = {
|
5005 |
|
|
0x01, 0x03, 0x05, 0x07,
|
5006 |
|
|
0x09, 0x0B, 0x0D, 0x0F,
|
5007 |
|
|
0x11, 0x13, 0x15, 0x17,
|
5008 |
|
|
0x19, 0x1B, 0x1D, 0x1F};
|
5009 |
|
|
|
5010 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
5011 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
5012 |
|
|
DONE;
|
5013 |
|
|
}")
|
5014 |
|
|
|
5015 |
|
|
(define_expand "vec_interleave_highv4sf"
|
5016 |
|
|
[(set (match_operand:V4SF 0 "spu_reg_operand" "=r")
|
5017 |
|
|
(vec_select:V4SF
|
5018 |
|
|
(vec_concat:V4SF
|
5019 |
|
|
(vec_select:V2SF
|
5020 |
|
|
(match_operand:V4SF 1 "spu_reg_operand" "r")
|
5021 |
|
|
(parallel [(const_int 0)(const_int 1)]))
|
5022 |
|
|
(vec_select:V2SF
|
5023 |
|
|
(match_operand:V4SF 2 "spu_reg_operand" "r")
|
5024 |
|
|
(parallel [(const_int 0)(const_int 1)])))
|
5025 |
|
|
(parallel [(const_int 0)(const_int 2)(const_int 1)(const_int 3)])))]
|
5026 |
|
|
|
5027 |
|
|
""
|
5028 |
|
|
"
|
5029 |
|
|
{
|
5030 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
5031 |
|
|
unsigned char arr[16] = {
|
5032 |
|
|
0x00, 0x01, 0x02, 0x03,
|
5033 |
|
|
0x10, 0x11, 0x12, 0x13,
|
5034 |
|
|
0x04, 0x05, 0x06, 0x07,
|
5035 |
|
|
0x14, 0x15, 0x16, 0x17};
|
5036 |
|
|
|
5037 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
5038 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
5039 |
|
|
DONE;
|
5040 |
|
|
}")
|
5041 |
|
|
|
5042 |
|
|
(define_expand "vec_interleave_lowv4sf"
|
5043 |
|
|
[(set (match_operand:V4SF 0 "spu_reg_operand" "=r")
|
5044 |
|
|
(vec_select:V4SF
|
5045 |
|
|
(vec_concat:V4SF
|
5046 |
|
|
(vec_select:V2SF
|
5047 |
|
|
(match_operand:V4SF 1 "spu_reg_operand" "r")
|
5048 |
|
|
(parallel [(const_int 2)(const_int 3)]))
|
5049 |
|
|
(vec_select:V2SF
|
5050 |
|
|
(match_operand:V4SF 2 "spu_reg_operand" "r")
|
5051 |
|
|
(parallel [(const_int 2)(const_int 3)])))
|
5052 |
|
|
(parallel [(const_int 0)(const_int 2)(const_int 1)(const_int 3)])))]
|
5053 |
|
|
|
5054 |
|
|
""
|
5055 |
|
|
"
|
5056 |
|
|
{
|
5057 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
5058 |
|
|
unsigned char arr[16] = {
|
5059 |
|
|
0x08, 0x09, 0x0A, 0x0B,
|
5060 |
|
|
0x18, 0x19, 0x1A, 0x1B,
|
5061 |
|
|
0x0C, 0x0D, 0x0E, 0x0F,
|
5062 |
|
|
0x1C, 0x1D, 0x1E, 0x1F};
|
5063 |
|
|
|
5064 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
5065 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
5066 |
|
|
DONE;
|
5067 |
|
|
}")
|
5068 |
|
|
|
5069 |
|
|
(define_expand "vec_interleave_highv4si"
|
5070 |
|
|
[(set (match_operand:V4SI 0 "spu_reg_operand" "=r")
|
5071 |
|
|
(vec_select:V4SI
|
5072 |
|
|
(vec_concat:V4SI
|
5073 |
|
|
(vec_select:V2SI
|
5074 |
|
|
(match_operand:V4SI 1 "spu_reg_operand" "r")
|
5075 |
|
|
(parallel [(const_int 0)(const_int 1)]))
|
5076 |
|
|
(vec_select:V2SI
|
5077 |
|
|
(match_operand:V4SI 2 "spu_reg_operand" "r")
|
5078 |
|
|
(parallel [(const_int 0)(const_int 1)])))
|
5079 |
|
|
(parallel [(const_int 0)(const_int 2)(const_int 1)(const_int 3)])))]
|
5080 |
|
|
|
5081 |
|
|
""
|
5082 |
|
|
"
|
5083 |
|
|
{
|
5084 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
5085 |
|
|
unsigned char arr[16] = {
|
5086 |
|
|
0x00, 0x01, 0x02, 0x03,
|
5087 |
|
|
0x10, 0x11, 0x12, 0x13,
|
5088 |
|
|
0x04, 0x05, 0x06, 0x07,
|
5089 |
|
|
0x14, 0x15, 0x16, 0x17};
|
5090 |
|
|
|
5091 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
5092 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
5093 |
|
|
DONE;
|
5094 |
|
|
}")
|
5095 |
|
|
|
5096 |
|
|
(define_expand "vec_interleave_lowv4si"
|
5097 |
|
|
[(set (match_operand:V4SI 0 "spu_reg_operand" "=r")
|
5098 |
|
|
(vec_select:V4SI
|
5099 |
|
|
(vec_concat:V4SI
|
5100 |
|
|
(vec_select:V2SI
|
5101 |
|
|
(match_operand:V4SI 1 "spu_reg_operand" "r")
|
5102 |
|
|
(parallel [(const_int 2)(const_int 3)]))
|
5103 |
|
|
(vec_select:V2SI
|
5104 |
|
|
(match_operand:V4SI 2 "spu_reg_operand" "r")
|
5105 |
|
|
(parallel [(const_int 2)(const_int 3)])))
|
5106 |
|
|
(parallel [(const_int 0)(const_int 2)(const_int 1)(const_int 3)])))]
|
5107 |
|
|
|
5108 |
|
|
""
|
5109 |
|
|
"
|
5110 |
|
|
{
|
5111 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
5112 |
|
|
unsigned char arr[16] = {
|
5113 |
|
|
0x08, 0x09, 0x0A, 0x0B,
|
5114 |
|
|
0x18, 0x19, 0x1A, 0x1B,
|
5115 |
|
|
0x0C, 0x0D, 0x0E, 0x0F,
|
5116 |
|
|
0x1C, 0x1D, 0x1E, 0x1F};
|
5117 |
|
|
|
5118 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
5119 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
5120 |
|
|
DONE;
|
5121 |
|
|
}")
|
5122 |
|
|
|
5123 |
|
|
(define_expand "vec_interleave_highv8hi"
|
5124 |
|
|
[(set (match_operand:V8HI 0 "spu_reg_operand" "=r")
|
5125 |
|
|
(vec_select:V8HI
|
5126 |
|
|
(vec_concat:V8HI
|
5127 |
|
|
(vec_select:V4HI
|
5128 |
|
|
(match_operand:V8HI 1 "spu_reg_operand" "r")
|
5129 |
|
|
(parallel [(const_int 0)(const_int 1)(const_int 2)(const_int 3)]))
|
5130 |
|
|
(vec_select:V4HI
|
5131 |
|
|
(match_operand:V8HI 2 "spu_reg_operand" "r")
|
5132 |
|
|
(parallel [(const_int 0)(const_int 1)(const_int 2)(const_int 3)])))
|
5133 |
|
|
(parallel [(const_int 0)(const_int 4)(const_int 1)(const_int 5)
|
5134 |
|
|
(const_int 2)(const_int 6)(const_int 3)(const_int 7)])))]
|
5135 |
|
|
|
5136 |
|
|
""
|
5137 |
|
|
"
|
5138 |
|
|
{
|
5139 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
5140 |
|
|
unsigned char arr[16] = {
|
5141 |
|
|
0x00, 0x01, 0x10, 0x11,
|
5142 |
|
|
0x02, 0x03, 0x12, 0x13,
|
5143 |
|
|
0x04, 0x05, 0x14, 0x15,
|
5144 |
|
|
0x06, 0x07, 0x16, 0x17};
|
5145 |
|
|
|
5146 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
5147 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
5148 |
|
|
DONE;
|
5149 |
|
|
}")
|
5150 |
|
|
|
5151 |
|
|
(define_expand "vec_interleave_lowv8hi"
|
5152 |
|
|
[(set (match_operand:V8HI 0 "spu_reg_operand" "=r")
|
5153 |
|
|
(vec_select:V8HI
|
5154 |
|
|
(vec_concat:V8HI
|
5155 |
|
|
(vec_select:V4HI
|
5156 |
|
|
(match_operand:V8HI 1 "spu_reg_operand" "r")
|
5157 |
|
|
(parallel [(const_int 4)(const_int 5)(const_int 6)(const_int 7)]))
|
5158 |
|
|
(vec_select:V4HI
|
5159 |
|
|
(match_operand:V8HI 2 "spu_reg_operand" "r")
|
5160 |
|
|
(parallel [(const_int 4)(const_int 5)(const_int 6)(const_int 7)])))
|
5161 |
|
|
(parallel [(const_int 0)(const_int 4)(const_int 1)(const_int 5)
|
5162 |
|
|
(const_int 2)(const_int 6)(const_int 3)(const_int 7)])))]
|
5163 |
|
|
|
5164 |
|
|
""
|
5165 |
|
|
"
|
5166 |
|
|
{
|
5167 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
5168 |
|
|
unsigned char arr[16] = {
|
5169 |
|
|
0x08, 0x09, 0x18, 0x19,
|
5170 |
|
|
0x0A, 0x0B, 0x1A, 0x1B,
|
5171 |
|
|
0x0C, 0x0D, 0x1C, 0x1D,
|
5172 |
|
|
0x0E, 0x0F, 0x1E, 0x1F};
|
5173 |
|
|
|
5174 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
5175 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
5176 |
|
|
DONE;
|
5177 |
|
|
}")
|
5178 |
|
|
|
5179 |
|
|
(define_expand "vec_interleave_highv16qi"
|
5180 |
|
|
[(set (match_operand:V16QI 0 "spu_reg_operand" "=r")
|
5181 |
|
|
(vec_select:V16QI
|
5182 |
|
|
(vec_concat:V16QI
|
5183 |
|
|
(vec_select:V8QI
|
5184 |
|
|
(match_operand:V16QI 1 "spu_reg_operand" "r")
|
5185 |
|
|
(parallel [(const_int 0)(const_int 1)(const_int 2)(const_int 3)
|
5186 |
|
|
(const_int 4)(const_int 5)(const_int 6)(const_int 7)]))
|
5187 |
|
|
(vec_select:V8QI
|
5188 |
|
|
(match_operand:V16QI 2 "spu_reg_operand" "r")
|
5189 |
|
|
(parallel [(const_int 0)(const_int 1)(const_int 2)(const_int 3)
|
5190 |
|
|
(const_int 4)(const_int 5)(const_int 6)(const_int 7)])))
|
5191 |
|
|
(parallel [(const_int 0)(const_int 8)(const_int 1)(const_int 9)
|
5192 |
|
|
(const_int 2)(const_int 10)(const_int 3)(const_int 11)
|
5193 |
|
|
(const_int 4)(const_int 12)(const_int 5)(const_int 13)
|
5194 |
|
|
(const_int 6)(const_int 14)(const_int 7)(const_int 15)])))]
|
5195 |
|
|
|
5196 |
|
|
""
|
5197 |
|
|
"
|
5198 |
|
|
{
|
5199 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
5200 |
|
|
unsigned char arr[16] = {
|
5201 |
|
|
0x00, 0x10, 0x01, 0x11,
|
5202 |
|
|
0x02, 0x12, 0x03, 0x13,
|
5203 |
|
|
0x04, 0x14, 0x05, 0x15,
|
5204 |
|
|
0x06, 0x16, 0x07, 0x17};
|
5205 |
|
|
|
5206 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
5207 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
5208 |
|
|
DONE;
|
5209 |
|
|
}")
|
5210 |
|
|
|
5211 |
|
|
(define_expand "vec_interleave_lowv16qi"
|
5212 |
|
|
[(set (match_operand:V16QI 0 "spu_reg_operand" "=r")
|
5213 |
|
|
(vec_select:V16QI
|
5214 |
|
|
(vec_concat:V16QI
|
5215 |
|
|
(vec_select:V8QI
|
5216 |
|
|
(match_operand:V16QI 1 "spu_reg_operand" "r")
|
5217 |
|
|
(parallel [(const_int 8)(const_int 9)(const_int 10)(const_int 11)
|
5218 |
|
|
(const_int 12)(const_int 13)(const_int 14)(const_int 15)]))
|
5219 |
|
|
(vec_select:V8QI
|
5220 |
|
|
(match_operand:V16QI 2 "spu_reg_operand" "r")
|
5221 |
|
|
(parallel [(const_int 8)(const_int 9)(const_int 10)(const_int 11)
|
5222 |
|
|
(const_int 12)(const_int 13)(const_int 14)(const_int 15)])))
|
5223 |
|
|
(parallel [(const_int 0)(const_int 8)(const_int 1)(const_int 9)
|
5224 |
|
|
(const_int 2)(const_int 10)(const_int 3)(const_int 11)
|
5225 |
|
|
(const_int 4)(const_int 12)(const_int 5)(const_int 13)
|
5226 |
|
|
(const_int 6)(const_int 14)(const_int 7)(const_int 15)])))]
|
5227 |
|
|
|
5228 |
|
|
""
|
5229 |
|
|
"
|
5230 |
|
|
{
|
5231 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
5232 |
|
|
unsigned char arr[16] = {
|
5233 |
|
|
0x08, 0x18, 0x09, 0x19,
|
5234 |
|
|
0x0A, 0x1A, 0x0B, 0x1B,
|
5235 |
|
|
0x0C, 0x1C, 0x0D, 0x1D,
|
5236 |
|
|
0x0E, 0x1E, 0x0F, 0x1F};
|
5237 |
|
|
|
5238 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
5239 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
5240 |
|
|
DONE;
|
5241 |
|
|
}")
|
5242 |
|
|
|
5243 |
|
|
(define_expand "vec_pack_trunc_v8hi"
|
5244 |
|
|
[(set (match_operand:V16QI 0 "spu_reg_operand" "=r")
|
5245 |
|
|
(vec_concat:V16QI
|
5246 |
|
|
(truncate:V8QI (match_operand:V8HI 1 "spu_reg_operand" "r"))
|
5247 |
|
|
(truncate:V8QI (match_operand:V8HI 2 "spu_reg_operand" "r"))))]
|
5248 |
|
|
""
|
5249 |
|
|
"
|
5250 |
|
|
{
|
5251 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
5252 |
|
|
unsigned char arr[16] = {
|
5253 |
|
|
0x01, 0x03, 0x05, 0x07, 0x09, 0x0B, 0x0D, 0x0F,
|
5254 |
|
|
0x11, 0x13, 0x15, 0x17, 0x19, 0x1B, 0x1D, 0x1F};
|
5255 |
|
|
|
5256 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
5257 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
5258 |
|
|
|
5259 |
|
|
DONE;
|
5260 |
|
|
}")
|
5261 |
|
|
|
5262 |
|
|
(define_expand "vec_pack_trunc_v4si"
|
5263 |
|
|
[(set (match_operand:V8HI 0 "spu_reg_operand" "=r")
|
5264 |
|
|
(vec_concat:V8HI
|
5265 |
|
|
(truncate:V4HI (match_operand:V4SI 1 "spu_reg_operand" "r"))
|
5266 |
|
|
(truncate:V4HI (match_operand:V4SI 2 "spu_reg_operand" "r"))))]
|
5267 |
|
|
""
|
5268 |
|
|
"
|
5269 |
|
|
{
|
5270 |
|
|
rtx mask = gen_reg_rtx (TImode);
|
5271 |
|
|
unsigned char arr[16] = {
|
5272 |
|
|
0x02, 0x03, 0x06, 0x07, 0x0A, 0x0B, 0x0E, 0x0F,
|
5273 |
|
|
0x12, 0x13, 0x16, 0x17, 0x1A, 0x1B, 0x1E, 0x1F};
|
5274 |
|
|
|
5275 |
|
|
emit_move_insn (mask, array_to_constant (TImode, arr));
|
5276 |
|
|
emit_insn (gen_shufb (operands[0], operands[1], operands[2], mask));
|
5277 |
|
|
|
5278 |
|
|
DONE;
|
5279 |
|
|
}")
|
5280 |
|
|
|
5281 |
|
|
(define_insn "stack_protect_set"
|
5282 |
|
|
[(set (match_operand:SI 0 "memory_operand" "=m")
|
5283 |
|
|
(unspec:SI [(match_operand:SI 1 "memory_operand" "m")] UNSPEC_SP_SET))
|
5284 |
|
|
(set (match_scratch:SI 2 "=&r") (const_int 0))]
|
5285 |
|
|
""
|
5286 |
|
|
"lq%p1\t%2,%1\;stq%p0\t%2,%0\;xor\t%2,%2,%2"
|
5287 |
|
|
[(set_attr "length" "12")
|
5288 |
|
|
(set_attr "type" "multi1")]
|
5289 |
|
|
)
|
5290 |
|
|
|
5291 |
|
|
(define_expand "stack_protect_test"
|
5292 |
|
|
[(match_operand 0 "memory_operand" "")
|
5293 |
|
|
(match_operand 1 "memory_operand" "")
|
5294 |
|
|
(match_operand 2 "" "")]
|
5295 |
|
|
""
|
5296 |
|
|
{
|
5297 |
|
|
rtx compare_result;
|
5298 |
|
|
rtx bcomp, loc_ref;
|
5299 |
|
|
|
5300 |
|
|
compare_result = gen_reg_rtx (SImode);
|
5301 |
|
|
|
5302 |
|
|
emit_insn (gen_stack_protect_test_si (compare_result,
|
5303 |
|
|
operands[0],
|
5304 |
|
|
operands[1]));
|
5305 |
|
|
|
5306 |
|
|
bcomp = gen_rtx_NE (SImode, compare_result, const0_rtx);
|
5307 |
|
|
|
5308 |
|
|
loc_ref = gen_rtx_LABEL_REF (VOIDmode, operands[2]);
|
5309 |
|
|
|
5310 |
|
|
emit_jump_insn (gen_rtx_SET (VOIDmode, pc_rtx,
|
5311 |
|
|
gen_rtx_IF_THEN_ELSE (VOIDmode, bcomp,
|
5312 |
|
|
loc_ref, pc_rtx)));
|
5313 |
|
|
|
5314 |
|
|
DONE;
|
5315 |
|
|
})
|
5316 |
|
|
|
5317 |
|
|
(define_insn "stack_protect_test_si"
|
5318 |
|
|
[(set (match_operand:SI 0 "spu_reg_operand" "=&r")
|
5319 |
|
|
(unspec:SI [(match_operand:SI 1 "memory_operand" "m")
|
5320 |
|
|
(match_operand:SI 2 "memory_operand" "m")]
|
5321 |
|
|
UNSPEC_SP_TEST))
|
5322 |
|
|
(set (match_scratch:SI 3 "=&r") (const_int 0))]
|
5323 |
|
|
""
|
5324 |
|
|
"lq%p1\t%0,%1\;lq%p2\t%3,%2\;ceq\t%0,%0,%3\;xor\t%3,%3,%3"
|
5325 |
|
|
[(set_attr "length" "16")
|
5326 |
|
|
(set_attr "type" "multi1")]
|
5327 |
|
|
)
|
5328 |
|
|
|