1 ;; Expander definitions for vector support between altivec & vsx. No
2 ;; instructions are in this file, this file provides the generic vector
3 ;; expander, and the actual vector instructions will be in altivec.md and
6 ;; Copyright (C) 2009, 2010, 2011
7 ;; Free Software Foundation, Inc.
8 ;; Contributed by Michael Meissner <meissner@linux.vnet.ibm.com>
10 ;; This file is part of GCC.
12 ;; GCC is free software; you can redistribute it and/or modify it
13 ;; under the terms of the GNU General Public License as published
14 ;; by the Free Software Foundation; either version 3, or (at your
15 ;; option) any later version.
17 ;; GCC is distributed in the hope that it will be useful, but WITHOUT
18 ;; ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
19 ;; or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
20 ;; License for more details.
22 ;; You should have received a copy of the GNU General Public License
23 ;; along with GCC; see the file COPYING3. If not see
24 ;; <http://www.gnu.org/licenses/>.
28 (define_mode_iterator VEC_I [V16QI V8HI V4SI])
31 (define_mode_iterator VEC_F [V4SF V2DF])
33 ;; Vector arithmetic modes
34 (define_mode_iterator VEC_A [V16QI V8HI V4SI V4SF V2DF])
36 ;; Vector modes that need alginment via permutes
37 (define_mode_iterator VEC_K [V16QI V8HI V4SI V4SF])
39 ;; Vector logical modes
40 (define_mode_iterator VEC_L [V16QI V8HI V4SI V2DI V4SF V2DF TI])
42 ;; Vector modes for moves. Don't do TImode here.
43 (define_mode_iterator VEC_M [V16QI V8HI V4SI V2DI V4SF V2DF])
45 ;; Vector modes for types that don't need a realignment under VSX
46 (define_mode_iterator VEC_N [V4SI V4SF V2DI V2DF])
48 ;; Vector comparison modes
49 (define_mode_iterator VEC_C [V16QI V8HI V4SI V4SF V2DF])
51 ;; Vector init/extract modes
52 (define_mode_iterator VEC_E [V16QI V8HI V4SI V2DI V4SF V2DF])
54 ;; Vector modes for 64-bit base types
55 (define_mode_iterator VEC_64 [V2DI V2DF])
57 ;; Vector reload iterator
58 (define_mode_iterator VEC_R [V16QI V8HI V4SI V2DI V4SF V2DF DF TI])
60 ;; Base type from vector mode
61 (define_mode_attr VEC_base [(V16QI "QI")
69 ;; Same size integer type for floating point data
70 (define_mode_attr VEC_int [(V4SF "v4si")
73 (define_mode_attr VEC_INT [(V4SF "V4SI")
76 ;; constants for unspec
77 (define_c_enum "unspec" [UNSPEC_PREDICATE
80 ;; Vector reduction code iterators
81 (define_code_iterator VEC_reduc [plus smin smax])
83 (define_code_attr VEC_reduc_name [(plus "splus")
87 (define_code_attr VEC_reduc_rtx [(plus "add")
92 ;; Vector move instructions.
93 (define_expand "mov<mode>"
94 [(set (match_operand:VEC_M 0 "nonimmediate_operand" "")
95 (match_operand:VEC_M 1 "any_operand" ""))]
96 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
98 if (can_create_pseudo_p ())
100 if (CONSTANT_P (operands[1])
101 && !easy_vector_constant (operands[1], <MODE>mode))
102 operands[1] = force_const_mem (<MODE>mode, operands[1]);
104 else if (!vlogical_operand (operands[0], <MODE>mode)
105 && !vlogical_operand (operands[1], <MODE>mode))
106 operands[1] = force_reg (<MODE>mode, operands[1]);
110 ;; Generic vector floating point load/store instructions. These will match
111 ;; insns defined in vsx.md or altivec.md depending on the switches.
112 (define_expand "vector_load_<mode>"
113 [(set (match_operand:VEC_M 0 "vfloat_operand" "")
114 (match_operand:VEC_M 1 "memory_operand" ""))]
115 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
118 (define_expand "vector_store_<mode>"
119 [(set (match_operand:VEC_M 0 "memory_operand" "")
120 (match_operand:VEC_M 1 "vfloat_operand" ""))]
121 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
124 ;; Splits if a GPR register was chosen for the move
126 [(set (match_operand:VEC_L 0 "nonimmediate_operand" "")
127 (match_operand:VEC_L 1 "input_operand" ""))]
128 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)
130 && gpr_or_gpr_p (operands[0], operands[1])"
133 rs6000_split_multireg_move (operands[0], operands[1]);
137 ;; Vector floating point load/store instructions that uses the Altivec
138 ;; instructions even if we are compiling for VSX, since the Altivec
139 ;; instructions silently ignore the bottom 3 bits of the address, and VSX does
141 (define_expand "vector_altivec_load_<mode>"
142 [(set (match_operand:VEC_M 0 "vfloat_operand" "")
143 (match_operand:VEC_M 1 "memory_operand" ""))]
144 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
147 gcc_assert (VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode));
149 if (VECTOR_MEM_VSX_P (<MODE>mode))
151 operands[1] = rs6000_address_for_altivec (operands[1]);
152 emit_insn (gen_altivec_lvx_<mode> (operands[0], operands[1]));
157 (define_expand "vector_altivec_store_<mode>"
158 [(set (match_operand:VEC_M 0 "memory_operand" "")
159 (match_operand:VEC_M 1 "vfloat_operand" ""))]
160 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
163 gcc_assert (VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode));
165 if (VECTOR_MEM_VSX_P (<MODE>mode))
167 operands[0] = rs6000_address_for_altivec (operands[0]);
168 emit_insn (gen_altivec_stvx_<mode> (operands[0], operands[1]));
175 ;; Reload patterns for vector operations. We may need an addtional base
176 ;; register to convert the reg+offset addressing to reg+reg for vector
177 ;; registers and reg+reg or (reg+reg)&(-16) addressing to just an index
178 ;; register for gpr registers.
179 (define_expand "reload_<VEC_R:mode>_<P:mptrsize>_store"
180 [(parallel [(match_operand:VEC_R 0 "memory_operand" "m")
181 (match_operand:VEC_R 1 "gpc_reg_operand" "r")
182 (match_operand:P 2 "register_operand" "=&b")])]
185 rs6000_secondary_reload_inner (operands[1], operands[0], operands[2], true);
189 (define_expand "reload_<VEC_R:mode>_<P:mptrsize>_load"
190 [(parallel [(match_operand:VEC_R 0 "gpc_reg_operand" "=&r")
191 (match_operand:VEC_R 1 "memory_operand" "m")
192 (match_operand:P 2 "register_operand" "=&b")])]
195 rs6000_secondary_reload_inner (operands[0], operands[1], operands[2], false);
199 ;; Reload sometimes tries to move the address to a GPR, and can generate
200 ;; invalid RTL for addresses involving AND -16. Allow addresses involving
201 ;; reg+reg, reg+small constant, or just reg, all wrapped in an AND -16.
203 (define_insn_and_split "*vec_reload_and_plus_<mptrsize>"
204 [(set (match_operand:P 0 "gpc_reg_operand" "=b")
205 (and:P (plus:P (match_operand:P 1 "gpc_reg_operand" "r")
206 (match_operand:P 2 "reg_or_cint_operand" "rI"))
208 "(TARGET_ALTIVEC || TARGET_VSX) && (reload_in_progress || reload_completed)"
210 "&& reload_completed"
212 (plus:P (match_dup 1)
214 (parallel [(set (match_dup 0)
217 (clobber:CC (scratch:CC))])])
219 ;; The normal ANDSI3/ANDDI3 won't match if reload decides to move an AND -16
220 ;; address to a register because there is no clobber of a (scratch), so we add
222 (define_insn_and_split "*vec_reload_and_reg_<mptrsize>"
223 [(set (match_operand:P 0 "gpc_reg_operand" "=b")
224 (and:P (match_operand:P 1 "gpc_reg_operand" "r")
226 "(TARGET_ALTIVEC || TARGET_VSX) && (reload_in_progress || reload_completed)"
228 "&& reload_completed"
229 [(parallel [(set (match_dup 0)
232 (clobber:CC (scratch:CC))])])
234 ;; Generic floating point vector arithmetic support
235 (define_expand "add<mode>3"
236 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
237 (plus:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")
238 (match_operand:VEC_F 2 "vfloat_operand" "")))]
239 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
242 (define_expand "sub<mode>3"
243 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
244 (minus:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")
245 (match_operand:VEC_F 2 "vfloat_operand" "")))]
246 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
249 (define_expand "mul<mode>3"
250 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
251 (mult:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")
252 (match_operand:VEC_F 2 "vfloat_operand" "")))]
253 "VECTOR_UNIT_VSX_P (<MODE>mode) || VECTOR_UNIT_ALTIVEC_P (<MODE>mode)"
255 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
257 emit_insn (gen_altivec_mulv4sf3 (operands[0], operands[1], operands[2]));
262 (define_expand "div<mode>3"
263 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
264 (div:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")
265 (match_operand:VEC_F 2 "vfloat_operand" "")))]
266 "VECTOR_UNIT_VSX_P (<MODE>mode)"
269 (define_expand "neg<mode>2"
270 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
271 (neg:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")))]
272 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
275 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
277 emit_insn (gen_altivec_negv4sf2 (operands[0], operands[1]));
282 (define_expand "abs<mode>2"
283 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
284 (abs:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")))]
285 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
288 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
290 emit_insn (gen_altivec_absv4sf2 (operands[0], operands[1]));
295 (define_expand "smin<mode>3"
296 [(set (match_operand:VEC_F 0 "register_operand" "")
297 (smin:VEC_F (match_operand:VEC_F 1 "register_operand" "")
298 (match_operand:VEC_F 2 "register_operand" "")))]
299 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
302 (define_expand "smax<mode>3"
303 [(set (match_operand:VEC_F 0 "register_operand" "")
304 (smax:VEC_F (match_operand:VEC_F 1 "register_operand" "")
305 (match_operand:VEC_F 2 "register_operand" "")))]
306 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
310 (define_expand "sqrt<mode>2"
311 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
312 (sqrt:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")))]
313 "VECTOR_UNIT_VSX_P (<MODE>mode)"
316 (define_expand "rsqrte<mode>2"
317 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
318 (unspec:VEC_F [(match_operand:VEC_F 1 "vfloat_operand" "")]
320 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
323 (define_expand "re<mode>2"
324 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
325 (unspec:VEC_F [(match_operand:VEC_F 1 "vfloat_operand" "f")]
327 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
330 (define_expand "ftrunc<mode>2"
331 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
332 (fix:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")))]
333 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
336 (define_expand "vector_ceil<mode>2"
337 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
338 (unspec:VEC_F [(match_operand:VEC_F 1 "vfloat_operand" "")]
340 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
343 (define_expand "vector_floor<mode>2"
344 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
345 (unspec:VEC_F [(match_operand:VEC_F 1 "vfloat_operand" "")]
347 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
350 (define_expand "vector_btrunc<mode>2"
351 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
352 (fix:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")))]
353 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
356 (define_expand "vector_copysign<mode>3"
357 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
358 (unspec:VEC_F [(match_operand:VEC_F 1 "vfloat_operand" "")
359 (match_operand:VEC_F 2 "vfloat_operand" "")] UNSPEC_COPYSIGN))]
360 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
363 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
365 emit_insn (gen_altivec_copysign_v4sf3 (operands[0], operands[1],
372 ;; Vector comparisons
373 (define_expand "vcond<mode><mode>"
374 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
376 (match_operator 3 "comparison_operator"
377 [(match_operand:VEC_F 4 "vfloat_operand" "")
378 (match_operand:VEC_F 5 "vfloat_operand" "")])
379 (match_operand:VEC_F 1 "vfloat_operand" "")
380 (match_operand:VEC_F 2 "vfloat_operand" "")))]
381 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
384 if (rs6000_emit_vector_cond_expr (operands[0], operands[1], operands[2],
385 operands[3], operands[4], operands[5]))
391 (define_expand "vcond<mode><mode>"
392 [(set (match_operand:VEC_I 0 "vint_operand" "")
394 (match_operator 3 "comparison_operator"
395 [(match_operand:VEC_I 4 "vint_operand" "")
396 (match_operand:VEC_I 5 "vint_operand" "")])
397 (match_operand:VEC_I 1 "vint_operand" "")
398 (match_operand:VEC_I 2 "vint_operand" "")))]
399 "VECTOR_UNIT_ALTIVEC_P (<MODE>mode)"
402 if (rs6000_emit_vector_cond_expr (operands[0], operands[1], operands[2],
403 operands[3], operands[4], operands[5]))
409 (define_expand "vcondv4sfv4si"
410 [(set (match_operand:V4SF 0 "vfloat_operand" "")
412 (match_operator 3 "comparison_operator"
413 [(match_operand:V4SI 4 "vint_operand" "")
414 (match_operand:V4SI 5 "vint_operand" "")])
415 (match_operand:V4SF 1 "vfloat_operand" "")
416 (match_operand:V4SF 2 "vfloat_operand" "")))]
417 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SFmode)
418 && VECTOR_UNIT_ALTIVEC_P (V4SImode)"
421 if (rs6000_emit_vector_cond_expr (operands[0], operands[1], operands[2],
422 operands[3], operands[4], operands[5]))
428 (define_expand "vcondv4siv4sf"
429 [(set (match_operand:V4SI 0 "vint_operand" "")
431 (match_operator 3 "comparison_operator"
432 [(match_operand:V4SF 4 "vfloat_operand" "")
433 (match_operand:V4SF 5 "vfloat_operand" "")])
434 (match_operand:V4SI 1 "vint_operand" "")
435 (match_operand:V4SI 2 "vint_operand" "")))]
436 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SFmode)
437 && VECTOR_UNIT_ALTIVEC_P (V4SImode)"
440 if (rs6000_emit_vector_cond_expr (operands[0], operands[1], operands[2],
441 operands[3], operands[4], operands[5]))
447 (define_expand "vcondu<mode><mode>"
448 [(set (match_operand:VEC_I 0 "vint_operand" "")
450 (match_operator 3 "comparison_operator"
451 [(match_operand:VEC_I 4 "vint_operand" "")
452 (match_operand:VEC_I 5 "vint_operand" "")])
453 (match_operand:VEC_I 1 "vint_operand" "")
454 (match_operand:VEC_I 2 "vint_operand" "")))]
455 "VECTOR_UNIT_ALTIVEC_P (<MODE>mode)"
458 if (rs6000_emit_vector_cond_expr (operands[0], operands[1], operands[2],
459 operands[3], operands[4], operands[5]))
465 (define_expand "vconduv4sfv4si"
466 [(set (match_operand:V4SF 0 "vfloat_operand" "")
468 (match_operator 3 "comparison_operator"
469 [(match_operand:V4SI 4 "vint_operand" "")
470 (match_operand:V4SI 5 "vint_operand" "")])
471 (match_operand:V4SF 1 "vfloat_operand" "")
472 (match_operand:V4SF 2 "vfloat_operand" "")))]
473 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SFmode)
474 && VECTOR_UNIT_ALTIVEC_P (V4SImode)"
477 if (rs6000_emit_vector_cond_expr (operands[0], operands[1], operands[2],
478 operands[3], operands[4], operands[5]))
484 (define_expand "vector_eq<mode>"
485 [(set (match_operand:VEC_C 0 "vlogical_operand" "")
486 (eq:VEC_C (match_operand:VEC_C 1 "vlogical_operand" "")
487 (match_operand:VEC_C 2 "vlogical_operand" "")))]
488 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
491 (define_expand "vector_gt<mode>"
492 [(set (match_operand:VEC_C 0 "vlogical_operand" "")
493 (gt:VEC_C (match_operand:VEC_C 1 "vlogical_operand" "")
494 (match_operand:VEC_C 2 "vlogical_operand" "")))]
495 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
498 (define_expand "vector_ge<mode>"
499 [(set (match_operand:VEC_C 0 "vlogical_operand" "")
500 (ge:VEC_C (match_operand:VEC_C 1 "vlogical_operand" "")
501 (match_operand:VEC_C 2 "vlogical_operand" "")))]
502 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
505 (define_expand "vector_gtu<mode>"
506 [(set (match_operand:VEC_I 0 "vint_operand" "")
507 (gtu:VEC_I (match_operand:VEC_I 1 "vint_operand" "")
508 (match_operand:VEC_I 2 "vint_operand" "")))]
509 "VECTOR_UNIT_ALTIVEC_P (<MODE>mode)"
512 (define_expand "vector_geu<mode>"
513 [(set (match_operand:VEC_I 0 "vint_operand" "")
514 (geu:VEC_I (match_operand:VEC_I 1 "vint_operand" "")
515 (match_operand:VEC_I 2 "vint_operand" "")))]
516 "VECTOR_UNIT_ALTIVEC_P (<MODE>mode)"
519 ;; Note the arguments for __builtin_altivec_vsel are op2, op1, mask
520 ;; which is in the reverse order that we want
521 (define_expand "vector_select_<mode>"
522 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
524 (ne:CC (match_operand:VEC_L 3 "vlogical_operand" "")
526 (match_operand:VEC_L 2 "vlogical_operand" "")
527 (match_operand:VEC_L 1 "vlogical_operand" "")))]
528 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
529 "operands[4] = CONST0_RTX (<MODE>mode);")
531 (define_expand "vector_select_<mode>_uns"
532 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
534 (ne:CCUNS (match_operand:VEC_L 3 "vlogical_operand" "")
536 (match_operand:VEC_L 2 "vlogical_operand" "")
537 (match_operand:VEC_L 1 "vlogical_operand" "")))]
538 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
539 "operands[4] = CONST0_RTX (<MODE>mode);")
541 ;; Expansions that compare vectors producing a vector result and a predicate,
542 ;; setting CR6 to indicate a combined status
543 (define_expand "vector_eq_<mode>_p"
546 (unspec:CC [(eq:CC (match_operand:VEC_A 1 "vlogical_operand" "")
547 (match_operand:VEC_A 2 "vlogical_operand" ""))]
549 (set (match_operand:VEC_A 0 "vlogical_operand" "")
550 (eq:VEC_A (match_dup 1)
552 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
555 (define_expand "vector_gt_<mode>_p"
558 (unspec:CC [(gt:CC (match_operand:VEC_A 1 "vlogical_operand" "")
559 (match_operand:VEC_A 2 "vlogical_operand" ""))]
561 (set (match_operand:VEC_A 0 "vlogical_operand" "")
562 (gt:VEC_A (match_dup 1)
564 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
567 (define_expand "vector_ge_<mode>_p"
570 (unspec:CC [(ge:CC (match_operand:VEC_F 1 "vfloat_operand" "")
571 (match_operand:VEC_F 2 "vfloat_operand" ""))]
573 (set (match_operand:VEC_F 0 "vfloat_operand" "")
574 (ge:VEC_F (match_dup 1)
576 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
579 (define_expand "vector_gtu_<mode>_p"
582 (unspec:CC [(gtu:CC (match_operand:VEC_I 1 "vint_operand" "")
583 (match_operand:VEC_I 2 "vint_operand" ""))]
585 (set (match_operand:VEC_I 0 "vlogical_operand" "")
586 (gtu:VEC_I (match_dup 1)
588 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
591 ;; AltiVec/VSX predicates.
593 (define_expand "cr6_test_for_zero"
594 [(set (match_operand:SI 0 "register_operand" "=r")
597 "TARGET_ALTIVEC || TARGET_VSX"
600 (define_expand "cr6_test_for_zero_reverse"
601 [(set (match_operand:SI 0 "register_operand" "=r")
604 (set (match_dup 0) (minus:SI (const_int 1) (match_dup 0)))]
605 "TARGET_ALTIVEC || TARGET_VSX"
608 (define_expand "cr6_test_for_lt"
609 [(set (match_operand:SI 0 "register_operand" "=r")
612 "TARGET_ALTIVEC || TARGET_VSX"
615 (define_expand "cr6_test_for_lt_reverse"
616 [(set (match_operand:SI 0 "register_operand" "=r")
619 (set (match_dup 0) (minus:SI (const_int 1) (match_dup 0)))]
620 "TARGET_ALTIVEC || TARGET_VSX"
624 ;; Vector logical instructions
625 (define_expand "xor<mode>3"
626 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
627 (xor:VEC_L (match_operand:VEC_L 1 "vlogical_operand" "")
628 (match_operand:VEC_L 2 "vlogical_operand" "")))]
629 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
632 (define_expand "ior<mode>3"
633 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
634 (ior:VEC_L (match_operand:VEC_L 1 "vlogical_operand" "")
635 (match_operand:VEC_L 2 "vlogical_operand" "")))]
636 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
639 (define_expand "and<mode>3"
640 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
641 (and:VEC_L (match_operand:VEC_L 1 "vlogical_operand" "")
642 (match_operand:VEC_L 2 "vlogical_operand" "")))]
643 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
646 (define_expand "one_cmpl<mode>2"
647 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
648 (not:VEC_L (match_operand:VEC_L 1 "vlogical_operand" "")))]
649 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
652 (define_expand "nor<mode>3"
653 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
654 (not:VEC_L (ior:VEC_L (match_operand:VEC_L 1 "vlogical_operand" "")
655 (match_operand:VEC_L 2 "vlogical_operand" ""))))]
656 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
659 (define_expand "andc<mode>3"
660 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
661 (and:VEC_L (not:VEC_L (match_operand:VEC_L 2 "vlogical_operand" ""))
662 (match_operand:VEC_L 1 "vlogical_operand" "")))]
663 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
666 ;; Same size conversions
667 (define_expand "float<VEC_int><mode>2"
668 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
669 (float:VEC_F (match_operand:<VEC_INT> 1 "vint_operand" "")))]
670 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
673 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
675 emit_insn (gen_altivec_vcfsx (operands[0], operands[1], const0_rtx));
680 (define_expand "floatuns<VEC_int><mode>2"
681 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
682 (unsigned_float:VEC_F (match_operand:<VEC_INT> 1 "vint_operand" "")))]
683 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
686 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
688 emit_insn (gen_altivec_vcfux (operands[0], operands[1], const0_rtx));
693 (define_expand "fix_trunc<mode><VEC_int>2"
694 [(set (match_operand:<VEC_INT> 0 "vint_operand" "")
695 (fix:<VEC_INT> (match_operand:VEC_F 1 "vfloat_operand" "")))]
696 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
699 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
701 emit_insn (gen_altivec_vctsxs (operands[0], operands[1], const0_rtx));
706 (define_expand "fixuns_trunc<mode><VEC_int>2"
707 [(set (match_operand:<VEC_INT> 0 "vint_operand" "")
708 (unsigned_fix:<VEC_INT> (match_operand:VEC_F 1 "vfloat_operand" "")))]
709 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
712 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
714 emit_insn (gen_altivec_vctuxs (operands[0], operands[1], const0_rtx));
720 ;; Vector initialization, set, extract
721 (define_expand "vec_init<mode>"
722 [(match_operand:VEC_E 0 "vlogical_operand" "")
723 (match_operand:VEC_E 1 "" "")]
724 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
726 rs6000_expand_vector_init (operands[0], operands[1]);
730 (define_expand "vec_set<mode>"
731 [(match_operand:VEC_E 0 "vlogical_operand" "")
732 (match_operand:<VEC_base> 1 "register_operand" "")
733 (match_operand 2 "const_int_operand" "")]
734 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
736 rs6000_expand_vector_set (operands[0], operands[1], INTVAL (operands[2]));
740 (define_expand "vec_extract<mode>"
741 [(match_operand:<VEC_base> 0 "register_operand" "")
742 (match_operand:VEC_E 1 "vlogical_operand" "")
743 (match_operand 2 "const_int_operand" "")]
744 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
746 rs6000_expand_vector_extract (operands[0], operands[1],
747 INTVAL (operands[2]));
751 ;; Interleave patterns
752 (define_expand "vec_interleave_highv4sf"
753 [(set (match_operand:V4SF 0 "vfloat_operand" "")
755 (vec_select:V4SF (match_operand:V4SF 1 "vfloat_operand" "")
756 (parallel [(const_int 0)
760 (vec_select:V4SF (match_operand:V4SF 2 "vfloat_operand" "")
761 (parallel [(const_int 2)
766 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SFmode)"
769 (define_expand "vec_interleave_lowv4sf"
770 [(set (match_operand:V4SF 0 "vfloat_operand" "")
772 (vec_select:V4SF (match_operand:V4SF 1 "vfloat_operand" "")
773 (parallel [(const_int 2)
777 (vec_select:V4SF (match_operand:V4SF 2 "vfloat_operand" "")
778 (parallel [(const_int 0)
783 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SFmode)"
786 (define_expand "vec_interleave_high<mode>"
787 [(set (match_operand:VEC_64 0 "vfloat_operand" "")
789 (vec_select:<VEC_base> (match_operand:VEC_64 1 "vfloat_operand" "")
790 (parallel [(const_int 0)]))
791 (vec_select:<VEC_base> (match_operand:VEC_64 2 "vfloat_operand" "")
792 (parallel [(const_int 0)]))))]
793 "VECTOR_UNIT_VSX_P (<MODE>mode)"
796 (define_expand "vec_interleave_low<mode>"
797 [(set (match_operand:VEC_64 0 "vfloat_operand" "")
799 (vec_select:<VEC_base> (match_operand:VEC_64 1 "vfloat_operand" "")
800 (parallel [(const_int 1)]))
801 (vec_select:<VEC_base> (match_operand:VEC_64 2 "vfloat_operand" "")
802 (parallel [(const_int 1)]))))]
803 "VECTOR_UNIT_VSX_P (<MODE>mode)"
807 ;; Convert double word types to single word types
808 (define_expand "vec_pack_trunc_v2df"
809 [(match_operand:V4SF 0 "vfloat_operand" "")
810 (match_operand:V2DF 1 "vfloat_operand" "")
811 (match_operand:V2DF 2 "vfloat_operand" "")]
812 "VECTOR_UNIT_VSX_P (V2DFmode) && TARGET_ALTIVEC"
814 rtx r1 = gen_reg_rtx (V4SFmode);
815 rtx r2 = gen_reg_rtx (V4SFmode);
817 emit_insn (gen_vsx_xvcvdpsp (r1, operands[1]));
818 emit_insn (gen_vsx_xvcvdpsp (r2, operands[2]));
819 emit_insn (gen_vec_extract_evenv4sf (operands[0], r1, r2));
823 (define_expand "vec_pack_sfix_trunc_v2df"
824 [(match_operand:V4SI 0 "vint_operand" "")
825 (match_operand:V2DF 1 "vfloat_operand" "")
826 (match_operand:V2DF 2 "vfloat_operand" "")]
827 "VECTOR_UNIT_VSX_P (V2DFmode) && TARGET_ALTIVEC"
829 rtx r1 = gen_reg_rtx (V4SImode);
830 rtx r2 = gen_reg_rtx (V4SImode);
832 emit_insn (gen_vsx_xvcvdpsxws (r1, operands[1]));
833 emit_insn (gen_vsx_xvcvdpsxws (r2, operands[2]));
834 emit_insn (gen_vec_extract_evenv4si (operands[0], r1, r2));
838 (define_expand "vec_pack_ufix_trunc_v2df"
839 [(match_operand:V4SI 0 "vint_operand" "")
840 (match_operand:V2DF 1 "vfloat_operand" "")
841 (match_operand:V2DF 2 "vfloat_operand" "")]
842 "VECTOR_UNIT_VSX_P (V2DFmode) && TARGET_ALTIVEC"
844 rtx r1 = gen_reg_rtx (V4SImode);
845 rtx r2 = gen_reg_rtx (V4SImode);
847 emit_insn (gen_vsx_xvcvdpuxws (r1, operands[1]));
848 emit_insn (gen_vsx_xvcvdpuxws (r2, operands[2]));
849 emit_insn (gen_vec_extract_evenv4si (operands[0], r1, r2));
853 ;; Convert single word types to double word
854 (define_expand "vec_unpacks_hi_v4sf"
855 [(match_operand:V2DF 0 "vfloat_operand" "")
856 (match_operand:V4SF 1 "vfloat_operand" "")]
857 "VECTOR_UNIT_VSX_P (V2DFmode) && VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SFmode)"
859 rtx reg = gen_reg_rtx (V4SFmode);
861 emit_insn (gen_vec_interleave_highv4sf (reg, operands[1], operands[1]));
862 emit_insn (gen_vsx_xvcvspdp (operands[0], reg));
866 (define_expand "vec_unpacks_lo_v4sf"
867 [(match_operand:V2DF 0 "vfloat_operand" "")
868 (match_operand:V4SF 1 "vfloat_operand" "")]
869 "VECTOR_UNIT_VSX_P (V2DFmode) && VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SFmode)"
871 rtx reg = gen_reg_rtx (V4SFmode);
873 emit_insn (gen_vec_interleave_lowv4sf (reg, operands[1], operands[1]));
874 emit_insn (gen_vsx_xvcvspdp (operands[0], reg));
878 (define_expand "vec_unpacks_float_hi_v4si"
879 [(match_operand:V2DF 0 "vfloat_operand" "")
880 (match_operand:V4SI 1 "vint_operand" "")]
881 "VECTOR_UNIT_VSX_P (V2DFmode) && VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SImode)"
883 rtx reg = gen_reg_rtx (V4SImode);
885 emit_insn (gen_vec_interleave_highv4si (reg, operands[1], operands[1]));
886 emit_insn (gen_vsx_xvcvsxwdp (operands[0], reg));
890 (define_expand "vec_unpacks_float_lo_v4si"
891 [(match_operand:V2DF 0 "vfloat_operand" "")
892 (match_operand:V4SI 1 "vint_operand" "")]
893 "VECTOR_UNIT_VSX_P (V2DFmode) && VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SImode)"
895 rtx reg = gen_reg_rtx (V4SImode);
897 emit_insn (gen_vec_interleave_lowv4si (reg, operands[1], operands[1]));
898 emit_insn (gen_vsx_xvcvsxwdp (operands[0], reg));
902 (define_expand "vec_unpacku_float_hi_v4si"
903 [(match_operand:V2DF 0 "vfloat_operand" "")
904 (match_operand:V4SI 1 "vint_operand" "")]
905 "VECTOR_UNIT_VSX_P (V2DFmode) && VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SImode)"
907 rtx reg = gen_reg_rtx (V4SImode);
909 emit_insn (gen_vec_interleave_highv4si (reg, operands[1], operands[1]));
910 emit_insn (gen_vsx_xvcvuxwdp (operands[0], reg));
914 (define_expand "vec_unpacku_float_lo_v4si"
915 [(match_operand:V2DF 0 "vfloat_operand" "")
916 (match_operand:V4SI 1 "vint_operand" "")]
917 "VECTOR_UNIT_VSX_P (V2DFmode) && VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SImode)"
919 rtx reg = gen_reg_rtx (V4SImode);
921 emit_insn (gen_vec_interleave_lowv4si (reg, operands[1], operands[1]));
922 emit_insn (gen_vsx_xvcvuxwdp (operands[0], reg));
927 ;; Align vector loads with a permute.
928 (define_expand "vec_realign_load_<mode>"
929 [(match_operand:VEC_K 0 "vlogical_operand" "")
930 (match_operand:VEC_K 1 "vlogical_operand" "")
931 (match_operand:VEC_K 2 "vlogical_operand" "")
932 (match_operand:V16QI 3 "vlogical_operand" "")]
933 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
935 emit_insn (gen_altivec_vperm_<mode> (operands[0], operands[1], operands[2],
940 ;; Under VSX, vectors of 4/8 byte alignments do not need to be aligned
941 ;; since the load already handles it.
942 (define_expand "movmisalign<mode>"
943 [(set (match_operand:VEC_N 0 "nonimmediate_operand" "")
944 (match_operand:VEC_N 1 "any_operand" ""))]
945 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_ALLOW_MOVMISALIGN"
949 ;; Vector shift left in bits. Currently supported ony for shift
950 ;; amounts that can be expressed as byte shifts (divisible by 8).
951 ;; General shift amounts can be supported using vslo + vsl. We're
952 ;; not expecting to see these yet (the vectorizer currently
953 ;; generates only shifts divisible by byte_size).
954 (define_expand "vec_shl_<mode>"
955 [(match_operand:VEC_L 0 "vlogical_operand" "")
956 (match_operand:VEC_L 1 "vlogical_operand" "")
957 (match_operand:QI 2 "reg_or_short_operand" "")]
961 rtx bitshift = operands[2];
964 HOST_WIDE_INT bitshift_val;
965 HOST_WIDE_INT byteshift_val;
967 if (! CONSTANT_P (bitshift))
969 bitshift_val = INTVAL (bitshift);
970 if (bitshift_val & 0x7)
972 byteshift_val = bitshift_val >> 3;
973 if (TARGET_VSX && (byteshift_val & 0x3) == 0)
975 shift = gen_rtx_CONST_INT (QImode, byteshift_val >> 2);
976 insn = gen_vsx_xxsldwi_<mode> (operands[0], operands[1], operands[1],
981 shift = gen_rtx_CONST_INT (QImode, byteshift_val);
982 insn = gen_altivec_vsldoi_<mode> (operands[0], operands[1], operands[1],
990 ;; Vector shift right in bits. Currently supported ony for shift
991 ;; amounts that can be expressed as byte shifts (divisible by 8).
992 ;; General shift amounts can be supported using vsro + vsr. We're
993 ;; not expecting to see these yet (the vectorizer currently
994 ;; generates only shifts divisible by byte_size).
995 (define_expand "vec_shr_<mode>"
996 [(match_operand:VEC_L 0 "vlogical_operand" "")
997 (match_operand:VEC_L 1 "vlogical_operand" "")
998 (match_operand:QI 2 "reg_or_short_operand" "")]
1002 rtx bitshift = operands[2];
1005 HOST_WIDE_INT bitshift_val;
1006 HOST_WIDE_INT byteshift_val;
1008 if (! CONSTANT_P (bitshift))
1010 bitshift_val = INTVAL (bitshift);
1011 if (bitshift_val & 0x7)
1013 byteshift_val = 16 - (bitshift_val >> 3);
1014 if (TARGET_VSX && (byteshift_val & 0x3) == 0)
1016 shift = gen_rtx_CONST_INT (QImode, byteshift_val >> 2);
1017 insn = gen_vsx_xxsldwi_<mode> (operands[0], operands[1], operands[1],
1022 shift = gen_rtx_CONST_INT (QImode, byteshift_val);
1023 insn = gen_altivec_vsldoi_<mode> (operands[0], operands[1], operands[1],
1031 ;; Expanders for rotate each element in a vector
1032 (define_expand "vrotl<mode>3"
1033 [(set (match_operand:VEC_I 0 "vint_operand" "")
1034 (rotate:VEC_I (match_operand:VEC_I 1 "vint_operand" "")
1035 (match_operand:VEC_I 2 "vint_operand" "")))]
1039 ;; Expanders for arithmetic shift left on each vector element
1040 (define_expand "vashl<mode>3"
1041 [(set (match_operand:VEC_I 0 "vint_operand" "")
1042 (ashift:VEC_I (match_operand:VEC_I 1 "vint_operand" "")
1043 (match_operand:VEC_I 2 "vint_operand" "")))]
1047 ;; Expanders for logical shift right on each vector element
1048 (define_expand "vlshr<mode>3"
1049 [(set (match_operand:VEC_I 0 "vint_operand" "")
1050 (lshiftrt:VEC_I (match_operand:VEC_I 1 "vint_operand" "")
1051 (match_operand:VEC_I 2 "vint_operand" "")))]
1055 ;; Expanders for arithmetic shift right on each vector element
1056 (define_expand "vashr<mode>3"
1057 [(set (match_operand:VEC_I 0 "vint_operand" "")
1058 (ashiftrt:VEC_I (match_operand:VEC_I 1 "vint_operand" "")
1059 (match_operand:VEC_I 2 "vint_operand" "")))]
1063 ;; Vector reduction expanders for VSX
1065 (define_expand "reduc_<VEC_reduc_name>_v2df"
1066 [(parallel [(set (match_operand:V2DF 0 "vfloat_operand" "")
1070 (match_operand:V2DF 1 "vfloat_operand" "")
1071 (parallel [(const_int 1)]))
1074 (parallel [(const_int 0)])))
1076 (clobber (match_scratch:V2DF 2 ""))])]
1077 "VECTOR_UNIT_VSX_P (V2DFmode)"
1080 ; The (VEC_reduc:V4SF
1082 ; (unspec:V4SF [(const_int 0)] UNSPEC_REDUC))
1084 ; is to allow us to use a code iterator, but not completely list all of the
1085 ; vector rotates, etc. to prevent canonicalization
1087 (define_expand "reduc_<VEC_reduc_name>_v4sf"
1088 [(parallel [(set (match_operand:V4SF 0 "vfloat_operand" "")
1090 (unspec:V4SF [(const_int 0)] UNSPEC_REDUC)
1091 (match_operand:V4SF 1 "vfloat_operand" "")))
1092 (clobber (match_scratch:V4SF 2 ""))
1093 (clobber (match_scratch:V4SF 3 ""))])]
1094 "VECTOR_UNIT_VSX_P (V4SFmode)"
1098 ;;; Expanders for vector insn patterns shared between the SPE and TARGET_PAIRED systems.
1100 (define_expand "absv2sf2"
1101 [(set (match_operand:V2SF 0 "gpc_reg_operand" "")
1102 (abs:V2SF (match_operand:V2SF 1 "gpc_reg_operand" "")))]
1103 "TARGET_PAIRED_FLOAT || TARGET_SPE"
1106 (define_expand "negv2sf2"
1107 [(set (match_operand:V2SF 0 "gpc_reg_operand" "")
1108 (neg:V2SF (match_operand:V2SF 1 "gpc_reg_operand" "")))]
1109 "TARGET_PAIRED_FLOAT || TARGET_SPE"
1112 (define_expand "addv2sf3"
1113 [(set (match_operand:V2SF 0 "gpc_reg_operand" "")
1114 (plus:V2SF (match_operand:V2SF 1 "gpc_reg_operand" "")
1115 (match_operand:V2SF 2 "gpc_reg_operand" "")))]
1116 "TARGET_PAIRED_FLOAT || TARGET_SPE"
1121 /* We need to make a note that we clobber SPEFSCR. */
1122 rtx par = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (2));
1124 XVECEXP (par, 0, 0) = gen_rtx_SET (VOIDmode, operands[0],
1125 gen_rtx_PLUS (V2SFmode, operands[1], operands[2]));
1126 XVECEXP (par, 0, 1) = gen_rtx_CLOBBER (VOIDmode, gen_rtx_REG (SImode, SPEFSCR_REGNO));
1132 (define_expand "subv2sf3"
1133 [(set (match_operand:V2SF 0 "gpc_reg_operand" "")
1134 (minus:V2SF (match_operand:V2SF 1 "gpc_reg_operand" "")
1135 (match_operand:V2SF 2 "gpc_reg_operand" "")))]
1136 "TARGET_PAIRED_FLOAT || TARGET_SPE"
1141 /* We need to make a note that we clobber SPEFSCR. */
1142 rtx par = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (2));
1144 XVECEXP (par, 0, 0) = gen_rtx_SET (VOIDmode, operands[0],
1145 gen_rtx_MINUS (V2SFmode, operands[1], operands[2]));
1146 XVECEXP (par, 0, 1) = gen_rtx_CLOBBER (VOIDmode, gen_rtx_REG (SImode, SPEFSCR_REGNO));
1152 (define_expand "mulv2sf3"
1153 [(set (match_operand:V2SF 0 "gpc_reg_operand" "")
1154 (mult:V2SF (match_operand:V2SF 1 "gpc_reg_operand" "")
1155 (match_operand:V2SF 2 "gpc_reg_operand" "")))]
1156 "TARGET_PAIRED_FLOAT || TARGET_SPE"
1161 /* We need to make a note that we clobber SPEFSCR. */
1162 rtx par = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (2));
1164 XVECEXP (par, 0, 0) = gen_rtx_SET (VOIDmode, operands[0],
1165 gen_rtx_MULT (V2SFmode, operands[1], operands[2]));
1166 XVECEXP (par, 0, 1) = gen_rtx_CLOBBER (VOIDmode, gen_rtx_REG (SImode, SPEFSCR_REGNO));
1172 (define_expand "divv2sf3"
1173 [(set (match_operand:V2SF 0 "gpc_reg_operand" "")
1174 (div:V2SF (match_operand:V2SF 1 "gpc_reg_operand" "")
1175 (match_operand:V2SF 2 "gpc_reg_operand" "")))]
1176 "TARGET_PAIRED_FLOAT || TARGET_SPE"
1181 /* We need to make a note that we clobber SPEFSCR. */
1182 rtx par = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (2));
1184 XVECEXP (par, 0, 0) = gen_rtx_SET (VOIDmode, operands[0],
1185 gen_rtx_DIV (V2SFmode, operands[1], operands[2]));
1186 XVECEXP (par, 0, 1) = gen_rtx_CLOBBER (VOIDmode, gen_rtx_REG (SImode, SPEFSCR_REGNO));