1 ;; Expander definitions for vector support between altivec & vsx. No
2 ;; instructions are in this file, this file provides the generic vector
3 ;; expander, and the actual vector instructions will be in altivec.md and
6 ;; Copyright (C) 2009, 2010, 2011
7 ;; Free Software Foundation, Inc.
8 ;; Contributed by Michael Meissner <meissner@linux.vnet.ibm.com>
10 ;; This file is part of GCC.
12 ;; GCC is free software; you can redistribute it and/or modify it
13 ;; under the terms of the GNU General Public License as published
14 ;; by the Free Software Foundation; either version 3, or (at your
15 ;; option) any later version.
17 ;; GCC is distributed in the hope that it will be useful, but WITHOUT
18 ;; ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
19 ;; or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
20 ;; License for more details.
22 ;; You should have received a copy of the GNU General Public License
23 ;; along with GCC; see the file COPYING3. If not see
24 ;; <http://www.gnu.org/licenses/>.
28 (define_mode_iterator VEC_I [V16QI V8HI V4SI])
31 (define_mode_iterator VEC_F [V4SF V2DF])
33 ;; Vector arithmetic modes
34 (define_mode_iterator VEC_A [V16QI V8HI V4SI V4SF V2DF])
36 ;; Vector modes that need alginment via permutes
37 (define_mode_iterator VEC_K [V16QI V8HI V4SI V4SF])
39 ;; Vector logical modes
40 (define_mode_iterator VEC_L [V16QI V8HI V4SI V2DI V4SF V2DF TI])
42 ;; Vector modes for moves. Don't do TImode here.
43 (define_mode_iterator VEC_M [V16QI V8HI V4SI V2DI V4SF V2DF])
45 ;; Vector modes for types that don't need a realignment under VSX
46 (define_mode_iterator VEC_N [V4SI V4SF V2DI V2DF])
48 ;; Vector comparison modes
49 (define_mode_iterator VEC_C [V16QI V8HI V4SI V4SF V2DF])
51 ;; Vector init/extract modes
52 (define_mode_iterator VEC_E [V16QI V8HI V4SI V2DI V4SF V2DF])
54 ;; Vector modes for 64-bit base types
55 (define_mode_iterator VEC_64 [V2DI V2DF])
57 ;; Vector reload iterator
58 (define_mode_iterator VEC_R [V16QI V8HI V4SI V2DI V4SF V2DF DF TI])
60 ;; Base type from vector mode
61 (define_mode_attr VEC_base [(V16QI "QI")
69 ;; Same size integer type for floating point data
70 (define_mode_attr VEC_int [(V4SF "v4si")
73 (define_mode_attr VEC_INT [(V4SF "V4SI")
76 ;; constants for unspec
77 (define_c_enum "unspec" [UNSPEC_PREDICATE
80 ;; Vector reduction code iterators
81 (define_code_iterator VEC_reduc [plus smin smax])
83 (define_code_attr VEC_reduc_name [(plus "splus")
87 (define_code_attr VEC_reduc_rtx [(plus "add")
92 ;; Vector move instructions.
93 (define_expand "mov<mode>"
94 [(set (match_operand:VEC_M 0 "nonimmediate_operand" "")
95 (match_operand:VEC_M 1 "any_operand" ""))]
96 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
98 if (can_create_pseudo_p ())
100 if (CONSTANT_P (operands[1])
101 && !easy_vector_constant (operands[1], <MODE>mode))
102 operands[1] = force_const_mem (<MODE>mode, operands[1]);
104 else if (!vlogical_operand (operands[0], <MODE>mode)
105 && !vlogical_operand (operands[1], <MODE>mode))
106 operands[1] = force_reg (<MODE>mode, operands[1]);
110 ;; Generic vector floating point load/store instructions. These will match
111 ;; insns defined in vsx.md or altivec.md depending on the switches.
112 (define_expand "vector_load_<mode>"
113 [(set (match_operand:VEC_M 0 "vfloat_operand" "")
114 (match_operand:VEC_M 1 "memory_operand" ""))]
115 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
118 (define_expand "vector_store_<mode>"
119 [(set (match_operand:VEC_M 0 "memory_operand" "")
120 (match_operand:VEC_M 1 "vfloat_operand" ""))]
121 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
124 ;; Splits if a GPR register was chosen for the move
126 [(set (match_operand:VEC_L 0 "nonimmediate_operand" "")
127 (match_operand:VEC_L 1 "input_operand" ""))]
128 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)
130 && gpr_or_gpr_p (operands[0], operands[1])"
133 rs6000_split_multireg_move (operands[0], operands[1]);
137 ;; Vector floating point load/store instructions that uses the Altivec
138 ;; instructions even if we are compiling for VSX, since the Altivec
139 ;; instructions silently ignore the bottom 3 bits of the address, and VSX does
141 (define_expand "vector_altivec_load_<mode>"
142 [(set (match_operand:VEC_M 0 "vfloat_operand" "")
143 (match_operand:VEC_M 1 "memory_operand" ""))]
144 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
147 gcc_assert (VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode));
149 if (VECTOR_MEM_VSX_P (<MODE>mode))
151 operands[1] = rs6000_address_for_altivec (operands[1]);
152 emit_insn (gen_altivec_lvx_<mode> (operands[0], operands[1]));
157 (define_expand "vector_altivec_store_<mode>"
158 [(set (match_operand:VEC_M 0 "memory_operand" "")
159 (match_operand:VEC_M 1 "vfloat_operand" ""))]
160 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
163 gcc_assert (VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode));
165 if (VECTOR_MEM_VSX_P (<MODE>mode))
167 operands[0] = rs6000_address_for_altivec (operands[0]);
168 emit_insn (gen_altivec_stvx_<mode> (operands[0], operands[1]));
175 ;; Reload patterns for vector operations. We may need an addtional base
176 ;; register to convert the reg+offset addressing to reg+reg for vector
177 ;; registers and reg+reg or (reg+reg)&(-16) addressing to just an index
178 ;; register for gpr registers.
179 (define_expand "reload_<VEC_R:mode>_<P:mptrsize>_store"
180 [(parallel [(match_operand:VEC_R 0 "memory_operand" "m")
181 (match_operand:VEC_R 1 "gpc_reg_operand" "r")
182 (match_operand:P 2 "register_operand" "=&b")])]
185 rs6000_secondary_reload_inner (operands[1], operands[0], operands[2], true);
189 (define_expand "reload_<VEC_R:mode>_<P:mptrsize>_load"
190 [(parallel [(match_operand:VEC_R 0 "gpc_reg_operand" "=&r")
191 (match_operand:VEC_R 1 "memory_operand" "m")
192 (match_operand:P 2 "register_operand" "=&b")])]
195 rs6000_secondary_reload_inner (operands[0], operands[1], operands[2], false);
199 ;; Reload sometimes tries to move the address to a GPR, and can generate
200 ;; invalid RTL for addresses involving AND -16. Allow addresses involving
201 ;; reg+reg, reg+small constant, or just reg, all wrapped in an AND -16.
203 (define_insn_and_split "*vec_reload_and_plus_<mptrsize>"
204 [(set (match_operand:P 0 "gpc_reg_operand" "=b")
205 (and:P (plus:P (match_operand:P 1 "gpc_reg_operand" "r")
206 (match_operand:P 2 "reg_or_cint_operand" "rI"))
208 "(TARGET_ALTIVEC || TARGET_VSX) && (reload_in_progress || reload_completed)"
210 "&& reload_completed"
212 (plus:P (match_dup 1)
214 (parallel [(set (match_dup 0)
217 (clobber:CC (scratch:CC))])])
219 ;; The normal ANDSI3/ANDDI3 won't match if reload decides to move an AND -16
220 ;; address to a register because there is no clobber of a (scratch), so we add
222 (define_insn_and_split "*vec_reload_and_reg_<mptrsize>"
223 [(set (match_operand:P 0 "gpc_reg_operand" "=b")
224 (and:P (match_operand:P 1 "gpc_reg_operand" "r")
226 "(TARGET_ALTIVEC || TARGET_VSX) && (reload_in_progress || reload_completed)"
228 "&& reload_completed"
229 [(parallel [(set (match_dup 0)
232 (clobber:CC (scratch:CC))])])
234 ;; Generic floating point vector arithmetic support
235 (define_expand "add<mode>3"
236 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
237 (plus:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")
238 (match_operand:VEC_F 2 "vfloat_operand" "")))]
239 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
242 (define_expand "sub<mode>3"
243 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
244 (minus:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")
245 (match_operand:VEC_F 2 "vfloat_operand" "")))]
246 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
249 (define_expand "mul<mode>3"
250 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
251 (mult:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")
252 (match_operand:VEC_F 2 "vfloat_operand" "")))]
253 "VECTOR_UNIT_VSX_P (<MODE>mode) || VECTOR_UNIT_ALTIVEC_P (<MODE>mode)"
255 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
257 emit_insn (gen_altivec_mulv4sf3 (operands[0], operands[1], operands[2]));
262 (define_expand "div<mode>3"
263 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
264 (div:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")
265 (match_operand:VEC_F 2 "vfloat_operand" "")))]
266 "VECTOR_UNIT_VSX_P (<MODE>mode)"
269 (define_expand "neg<mode>2"
270 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
271 (neg:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")))]
272 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
275 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
277 emit_insn (gen_altivec_negv4sf2 (operands[0], operands[1]));
282 (define_expand "abs<mode>2"
283 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
284 (abs:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")))]
285 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
288 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
290 emit_insn (gen_altivec_absv4sf2 (operands[0], operands[1]));
295 (define_expand "smin<mode>3"
296 [(set (match_operand:VEC_F 0 "register_operand" "")
297 (smin:VEC_F (match_operand:VEC_F 1 "register_operand" "")
298 (match_operand:VEC_F 2 "register_operand" "")))]
299 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
302 (define_expand "smax<mode>3"
303 [(set (match_operand:VEC_F 0 "register_operand" "")
304 (smax:VEC_F (match_operand:VEC_F 1 "register_operand" "")
305 (match_operand:VEC_F 2 "register_operand" "")))]
306 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
310 (define_expand "sqrt<mode>2"
311 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
312 (sqrt:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")))]
313 "VECTOR_UNIT_VSX_P (<MODE>mode)"
316 (define_expand "rsqrte<mode>2"
317 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
318 (unspec:VEC_F [(match_operand:VEC_F 1 "vfloat_operand" "")]
320 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
323 (define_expand "re<mode>2"
324 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
325 (unspec:VEC_F [(match_operand:VEC_F 1 "vfloat_operand" "f")]
327 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
330 (define_expand "ftrunc<mode>2"
331 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
332 (fix:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")))]
333 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
336 (define_expand "vector_ceil<mode>2"
337 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
338 (unspec:VEC_F [(match_operand:VEC_F 1 "vfloat_operand" "")]
340 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
343 (define_expand "vector_floor<mode>2"
344 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
345 (unspec:VEC_F [(match_operand:VEC_F 1 "vfloat_operand" "")]
347 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
350 (define_expand "vector_btrunc<mode>2"
351 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
352 (fix:VEC_F (match_operand:VEC_F 1 "vfloat_operand" "")))]
353 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
356 (define_expand "vector_copysign<mode>3"
357 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
358 (unspec:VEC_F [(match_operand:VEC_F 1 "vfloat_operand" "")
359 (match_operand:VEC_F 2 "vfloat_operand" "")] UNSPEC_COPYSIGN))]
360 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
363 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
365 emit_insn (gen_altivec_copysign_v4sf3 (operands[0], operands[1],
372 ;; Vector comparisons
373 (define_expand "vcond<mode><mode>"
374 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
376 (match_operator 3 "comparison_operator"
377 [(match_operand:VEC_F 4 "vfloat_operand" "")
378 (match_operand:VEC_F 5 "vfloat_operand" "")])
379 (match_operand:VEC_F 1 "vfloat_operand" "")
380 (match_operand:VEC_F 2 "vfloat_operand" "")))]
381 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
384 if (rs6000_emit_vector_cond_expr (operands[0], operands[1], operands[2],
385 operands[3], operands[4], operands[5]))
391 (define_expand "vcond<mode><mode>"
392 [(set (match_operand:VEC_I 0 "vint_operand" "")
394 (match_operator 3 "comparison_operator"
395 [(match_operand:VEC_I 4 "vint_operand" "")
396 (match_operand:VEC_I 5 "vint_operand" "")])
397 (match_operand:VEC_I 1 "vint_operand" "")
398 (match_operand:VEC_I 2 "vint_operand" "")))]
399 "VECTOR_UNIT_ALTIVEC_P (<MODE>mode)"
402 if (rs6000_emit_vector_cond_expr (operands[0], operands[1], operands[2],
403 operands[3], operands[4], operands[5]))
409 (define_expand "vcondu<mode><mode>"
410 [(set (match_operand:VEC_I 0 "vint_operand" "")
412 (match_operator 3 "comparison_operator"
413 [(match_operand:VEC_I 4 "vint_operand" "")
414 (match_operand:VEC_I 5 "vint_operand" "")])
415 (match_operand:VEC_I 1 "vint_operand" "")
416 (match_operand:VEC_I 2 "vint_operand" "")))]
417 "VECTOR_UNIT_ALTIVEC_P (<MODE>mode)"
420 if (rs6000_emit_vector_cond_expr (operands[0], operands[1], operands[2],
421 operands[3], operands[4], operands[5]))
427 (define_expand "vector_eq<mode>"
428 [(set (match_operand:VEC_C 0 "vlogical_operand" "")
429 (eq:VEC_C (match_operand:VEC_C 1 "vlogical_operand" "")
430 (match_operand:VEC_C 2 "vlogical_operand" "")))]
431 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
434 (define_expand "vector_gt<mode>"
435 [(set (match_operand:VEC_C 0 "vlogical_operand" "")
436 (gt:VEC_C (match_operand:VEC_C 1 "vlogical_operand" "")
437 (match_operand:VEC_C 2 "vlogical_operand" "")))]
438 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
441 (define_expand "vector_ge<mode>"
442 [(set (match_operand:VEC_C 0 "vlogical_operand" "")
443 (ge:VEC_C (match_operand:VEC_C 1 "vlogical_operand" "")
444 (match_operand:VEC_C 2 "vlogical_operand" "")))]
445 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
448 (define_expand "vector_gtu<mode>"
449 [(set (match_operand:VEC_I 0 "vint_operand" "")
450 (gtu:VEC_I (match_operand:VEC_I 1 "vint_operand" "")
451 (match_operand:VEC_I 2 "vint_operand" "")))]
452 "VECTOR_UNIT_ALTIVEC_P (<MODE>mode)"
455 (define_expand "vector_geu<mode>"
456 [(set (match_operand:VEC_I 0 "vint_operand" "")
457 (geu:VEC_I (match_operand:VEC_I 1 "vint_operand" "")
458 (match_operand:VEC_I 2 "vint_operand" "")))]
459 "VECTOR_UNIT_ALTIVEC_P (<MODE>mode)"
462 ;; Note the arguments for __builtin_altivec_vsel are op2, op1, mask
463 ;; which is in the reverse order that we want
464 (define_expand "vector_select_<mode>"
465 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
467 (ne:CC (match_operand:VEC_L 3 "vlogical_operand" "")
469 (match_operand:VEC_L 2 "vlogical_operand" "")
470 (match_operand:VEC_L 1 "vlogical_operand" "")))]
471 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
472 "operands[4] = CONST0_RTX (<MODE>mode);")
474 (define_expand "vector_select_<mode>_uns"
475 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
477 (ne:CCUNS (match_operand:VEC_L 3 "vlogical_operand" "")
479 (match_operand:VEC_L 2 "vlogical_operand" "")
480 (match_operand:VEC_L 1 "vlogical_operand" "")))]
481 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
482 "operands[4] = CONST0_RTX (<MODE>mode);")
484 ;; Expansions that compare vectors producing a vector result and a predicate,
485 ;; setting CR6 to indicate a combined status
486 (define_expand "vector_eq_<mode>_p"
489 (unspec:CC [(eq:CC (match_operand:VEC_A 1 "vlogical_operand" "")
490 (match_operand:VEC_A 2 "vlogical_operand" ""))]
492 (set (match_operand:VEC_A 0 "vlogical_operand" "")
493 (eq:VEC_A (match_dup 1)
495 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
498 (define_expand "vector_gt_<mode>_p"
501 (unspec:CC [(gt:CC (match_operand:VEC_A 1 "vlogical_operand" "")
502 (match_operand:VEC_A 2 "vlogical_operand" ""))]
504 (set (match_operand:VEC_A 0 "vlogical_operand" "")
505 (gt:VEC_A (match_dup 1)
507 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
510 (define_expand "vector_ge_<mode>_p"
513 (unspec:CC [(ge:CC (match_operand:VEC_F 1 "vfloat_operand" "")
514 (match_operand:VEC_F 2 "vfloat_operand" ""))]
516 (set (match_operand:VEC_F 0 "vfloat_operand" "")
517 (ge:VEC_F (match_dup 1)
519 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
522 (define_expand "vector_gtu_<mode>_p"
525 (unspec:CC [(gtu:CC (match_operand:VEC_I 1 "vint_operand" "")
526 (match_operand:VEC_I 2 "vint_operand" ""))]
528 (set (match_operand:VEC_I 0 "vlogical_operand" "")
529 (gtu:VEC_I (match_dup 1)
531 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
534 ;; AltiVec/VSX predicates.
536 (define_expand "cr6_test_for_zero"
537 [(set (match_operand:SI 0 "register_operand" "=r")
540 "TARGET_ALTIVEC || TARGET_VSX"
543 (define_expand "cr6_test_for_zero_reverse"
544 [(set (match_operand:SI 0 "register_operand" "=r")
547 (set (match_dup 0) (minus:SI (const_int 1) (match_dup 0)))]
548 "TARGET_ALTIVEC || TARGET_VSX"
551 (define_expand "cr6_test_for_lt"
552 [(set (match_operand:SI 0 "register_operand" "=r")
555 "TARGET_ALTIVEC || TARGET_VSX"
558 (define_expand "cr6_test_for_lt_reverse"
559 [(set (match_operand:SI 0 "register_operand" "=r")
562 (set (match_dup 0) (minus:SI (const_int 1) (match_dup 0)))]
563 "TARGET_ALTIVEC || TARGET_VSX"
567 ;; Vector logical instructions
568 (define_expand "xor<mode>3"
569 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
570 (xor:VEC_L (match_operand:VEC_L 1 "vlogical_operand" "")
571 (match_operand:VEC_L 2 "vlogical_operand" "")))]
572 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
575 (define_expand "ior<mode>3"
576 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
577 (ior:VEC_L (match_operand:VEC_L 1 "vlogical_operand" "")
578 (match_operand:VEC_L 2 "vlogical_operand" "")))]
579 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
582 (define_expand "and<mode>3"
583 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
584 (and:VEC_L (match_operand:VEC_L 1 "vlogical_operand" "")
585 (match_operand:VEC_L 2 "vlogical_operand" "")))]
586 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
589 (define_expand "one_cmpl<mode>2"
590 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
591 (not:VEC_L (match_operand:VEC_L 1 "vlogical_operand" "")))]
592 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
595 (define_expand "nor<mode>3"
596 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
597 (not:VEC_L (ior:VEC_L (match_operand:VEC_L 1 "vlogical_operand" "")
598 (match_operand:VEC_L 2 "vlogical_operand" ""))))]
599 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
602 (define_expand "andc<mode>3"
603 [(set (match_operand:VEC_L 0 "vlogical_operand" "")
604 (and:VEC_L (not:VEC_L (match_operand:VEC_L 2 "vlogical_operand" ""))
605 (match_operand:VEC_L 1 "vlogical_operand" "")))]
606 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
609 ;; Same size conversions
610 (define_expand "float<VEC_int><mode>2"
611 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
612 (float:VEC_F (match_operand:<VEC_INT> 1 "vint_operand" "")))]
613 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
616 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
618 emit_insn (gen_altivec_vcfsx (operands[0], operands[1], const0_rtx));
623 (define_expand "unsigned_float<VEC_int><mode>2"
624 [(set (match_operand:VEC_F 0 "vfloat_operand" "")
625 (unsigned_float:VEC_F (match_operand:<VEC_INT> 1 "vint_operand" "")))]
626 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
629 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
631 emit_insn (gen_altivec_vcfux (operands[0], operands[1], const0_rtx));
636 (define_expand "fix_trunc<mode><VEC_int>2"
637 [(set (match_operand:<VEC_INT> 0 "vint_operand" "")
638 (fix:<VEC_INT> (match_operand:VEC_F 1 "vfloat_operand" "")))]
639 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
642 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
644 emit_insn (gen_altivec_vctsxs (operands[0], operands[1], const0_rtx));
649 (define_expand "fixuns_trunc<mode><VEC_int>2"
650 [(set (match_operand:<VEC_INT> 0 "vint_operand" "")
651 (unsigned_fix:<VEC_INT> (match_operand:VEC_F 1 "vfloat_operand" "")))]
652 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (<MODE>mode)"
655 if (<MODE>mode == V4SFmode && VECTOR_UNIT_ALTIVEC_P (<MODE>mode))
657 emit_insn (gen_altivec_vctuxs (operands[0], operands[1], const0_rtx));
663 ;; Vector initialization, set, extract
664 (define_expand "vec_init<mode>"
665 [(match_operand:VEC_E 0 "vlogical_operand" "")
666 (match_operand:VEC_E 1 "" "")]
667 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
669 rs6000_expand_vector_init (operands[0], operands[1]);
673 (define_expand "vec_set<mode>"
674 [(match_operand:VEC_E 0 "vlogical_operand" "")
675 (match_operand:<VEC_base> 1 "register_operand" "")
676 (match_operand 2 "const_int_operand" "")]
677 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
679 rs6000_expand_vector_set (operands[0], operands[1], INTVAL (operands[2]));
683 (define_expand "vec_extract<mode>"
684 [(match_operand:<VEC_base> 0 "register_operand" "")
685 (match_operand:VEC_E 1 "vlogical_operand" "")
686 (match_operand 2 "const_int_operand" "")]
687 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
689 rs6000_expand_vector_extract (operands[0], operands[1],
690 INTVAL (operands[2]));
694 ;; Interleave patterns
695 (define_expand "vec_interleave_highv4sf"
696 [(set (match_operand:V4SF 0 "vfloat_operand" "")
698 (vec_select:V4SF (match_operand:V4SF 1 "vfloat_operand" "")
699 (parallel [(const_int 0)
703 (vec_select:V4SF (match_operand:V4SF 2 "vfloat_operand" "")
704 (parallel [(const_int 2)
709 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SFmode)"
712 (define_expand "vec_interleave_lowv4sf"
713 [(set (match_operand:V4SF 0 "vfloat_operand" "")
715 (vec_select:V4SF (match_operand:V4SF 1 "vfloat_operand" "")
716 (parallel [(const_int 2)
720 (vec_select:V4SF (match_operand:V4SF 2 "vfloat_operand" "")
721 (parallel [(const_int 0)
726 "VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SFmode)"
729 (define_expand "vec_interleave_high<mode>"
730 [(set (match_operand:VEC_64 0 "vfloat_operand" "")
732 (vec_select:<VEC_base> (match_operand:VEC_64 1 "vfloat_operand" "")
733 (parallel [(const_int 0)]))
734 (vec_select:<VEC_base> (match_operand:VEC_64 2 "vfloat_operand" "")
735 (parallel [(const_int 0)]))))]
736 "VECTOR_UNIT_VSX_P (<MODE>mode)"
739 (define_expand "vec_interleave_low<mode>"
740 [(set (match_operand:VEC_64 0 "vfloat_operand" "")
742 (vec_select:<VEC_base> (match_operand:VEC_64 1 "vfloat_operand" "")
743 (parallel [(const_int 1)]))
744 (vec_select:<VEC_base> (match_operand:VEC_64 2 "vfloat_operand" "")
745 (parallel [(const_int 1)]))))]
746 "VECTOR_UNIT_VSX_P (<MODE>mode)"
750 ;; Convert double word types to single word types
751 (define_expand "vec_pack_trunc_v2df"
752 [(match_operand:V4SF 0 "vfloat_operand" "")
753 (match_operand:V2DF 1 "vfloat_operand" "")
754 (match_operand:V2DF 2 "vfloat_operand" "")]
755 "VECTOR_UNIT_VSX_P (V2DFmode) && TARGET_ALTIVEC"
757 rtx r1 = gen_reg_rtx (V4SFmode);
758 rtx r2 = gen_reg_rtx (V4SFmode);
760 emit_insn (gen_vsx_xvcvdpsp (r1, operands[1]));
761 emit_insn (gen_vsx_xvcvdpsp (r2, operands[2]));
762 emit_insn (gen_vec_extract_evenv4sf (operands[0], r1, r2));
766 (define_expand "vec_pack_sfix_trunc_v2df"
767 [(match_operand:V4SI 0 "vint_operand" "")
768 (match_operand:V2DF 1 "vfloat_operand" "")
769 (match_operand:V2DF 2 "vfloat_operand" "")]
770 "VECTOR_UNIT_VSX_P (V2DFmode) && TARGET_ALTIVEC"
772 rtx r1 = gen_reg_rtx (V4SImode);
773 rtx r2 = gen_reg_rtx (V4SImode);
775 emit_insn (gen_vsx_xvcvdpsxws (r1, operands[1]));
776 emit_insn (gen_vsx_xvcvdpsxws (r2, operands[2]));
777 emit_insn (gen_vec_extract_evenv4si (operands[0], r1, r2));
781 (define_expand "vec_pack_ufix_trunc_v2df"
782 [(match_operand:V4SI 0 "vint_operand" "")
783 (match_operand:V2DF 1 "vfloat_operand" "")
784 (match_operand:V2DF 2 "vfloat_operand" "")]
785 "VECTOR_UNIT_VSX_P (V2DFmode) && TARGET_ALTIVEC"
787 rtx r1 = gen_reg_rtx (V4SImode);
788 rtx r2 = gen_reg_rtx (V4SImode);
790 emit_insn (gen_vsx_xvcvdpuxws (r1, operands[1]));
791 emit_insn (gen_vsx_xvcvdpuxws (r2, operands[2]));
792 emit_insn (gen_vec_extract_evenv4si (operands[0], r1, r2));
796 ;; Convert single word types to double word
797 (define_expand "vec_unpacks_hi_v4sf"
798 [(match_operand:V2DF 0 "vfloat_operand" "")
799 (match_operand:V4SF 1 "vfloat_operand" "")]
800 "VECTOR_UNIT_VSX_P (V2DFmode) && VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SFmode)"
802 rtx reg = gen_reg_rtx (V4SFmode);
804 emit_insn (gen_vec_interleave_highv4sf (reg, operands[1], operands[1]));
805 emit_insn (gen_vsx_xvcvspdp (operands[0], reg));
809 (define_expand "vec_unpacks_lo_v4sf"
810 [(match_operand:V2DF 0 "vfloat_operand" "")
811 (match_operand:V4SF 1 "vfloat_operand" "")]
812 "VECTOR_UNIT_VSX_P (V2DFmode) && VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SFmode)"
814 rtx reg = gen_reg_rtx (V4SFmode);
816 emit_insn (gen_vec_interleave_lowv4sf (reg, operands[1], operands[1]));
817 emit_insn (gen_vsx_xvcvspdp (operands[0], reg));
821 (define_expand "vec_unpacks_float_hi_v4si"
822 [(match_operand:V2DF 0 "vfloat_operand" "")
823 (match_operand:V4SI 1 "vint_operand" "")]
824 "VECTOR_UNIT_VSX_P (V2DFmode) && VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SImode)"
826 rtx reg = gen_reg_rtx (V4SImode);
828 emit_insn (gen_vec_interleave_highv4si (reg, operands[1], operands[1]));
829 emit_insn (gen_vsx_xvcvsxwdp (operands[0], reg));
833 (define_expand "vec_unpacks_float_lo_v4si"
834 [(match_operand:V2DF 0 "vfloat_operand" "")
835 (match_operand:V4SI 1 "vint_operand" "")]
836 "VECTOR_UNIT_VSX_P (V2DFmode) && VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SImode)"
838 rtx reg = gen_reg_rtx (V4SImode);
840 emit_insn (gen_vec_interleave_lowv4si (reg, operands[1], operands[1]));
841 emit_insn (gen_vsx_xvcvsxwdp (operands[0], reg));
845 (define_expand "vec_unpacku_float_hi_v4si"
846 [(match_operand:V2DF 0 "vfloat_operand" "")
847 (match_operand:V4SI 1 "vint_operand" "")]
848 "VECTOR_UNIT_VSX_P (V2DFmode) && VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SImode)"
850 rtx reg = gen_reg_rtx (V4SImode);
852 emit_insn (gen_vec_interleave_highv4si (reg, operands[1], operands[1]));
853 emit_insn (gen_vsx_xvcvuxwdp (operands[0], reg));
857 (define_expand "vec_unpacku_float_lo_v4si"
858 [(match_operand:V2DF 0 "vfloat_operand" "")
859 (match_operand:V4SI 1 "vint_operand" "")]
860 "VECTOR_UNIT_VSX_P (V2DFmode) && VECTOR_UNIT_ALTIVEC_OR_VSX_P (V4SImode)"
862 rtx reg = gen_reg_rtx (V4SImode);
864 emit_insn (gen_vec_interleave_lowv4si (reg, operands[1], operands[1]));
865 emit_insn (gen_vsx_xvcvuxwdp (operands[0], reg));
870 ;; Align vector loads with a permute.
871 (define_expand "vec_realign_load_<mode>"
872 [(match_operand:VEC_K 0 "vlogical_operand" "")
873 (match_operand:VEC_K 1 "vlogical_operand" "")
874 (match_operand:VEC_K 2 "vlogical_operand" "")
875 (match_operand:V16QI 3 "vlogical_operand" "")]
876 "VECTOR_MEM_ALTIVEC_OR_VSX_P (<MODE>mode)"
878 emit_insn (gen_altivec_vperm_<mode> (operands[0], operands[1], operands[2],
883 ;; Under VSX, vectors of 4/8 byte alignments do not need to be aligned
884 ;; since the load already handles it.
885 (define_expand "movmisalign<mode>"
886 [(set (match_operand:VEC_N 0 "nonimmediate_operand" "")
887 (match_operand:VEC_N 1 "any_operand" ""))]
888 "VECTOR_MEM_VSX_P (<MODE>mode) && TARGET_ALLOW_MOVMISALIGN"
892 ;; Vector shift left in bits. Currently supported ony for shift
893 ;; amounts that can be expressed as byte shifts (divisible by 8).
894 ;; General shift amounts can be supported using vslo + vsl. We're
895 ;; not expecting to see these yet (the vectorizer currently
896 ;; generates only shifts divisible by byte_size).
897 (define_expand "vec_shl_<mode>"
898 [(match_operand:VEC_L 0 "vlogical_operand" "")
899 (match_operand:VEC_L 1 "vlogical_operand" "")
900 (match_operand:QI 2 "reg_or_short_operand" "")]
904 rtx bitshift = operands[2];
907 HOST_WIDE_INT bitshift_val;
908 HOST_WIDE_INT byteshift_val;
910 if (! CONSTANT_P (bitshift))
912 bitshift_val = INTVAL (bitshift);
913 if (bitshift_val & 0x7)
915 byteshift_val = bitshift_val >> 3;
916 if (TARGET_VSX && (byteshift_val & 0x3) == 0)
918 shift = gen_rtx_CONST_INT (QImode, byteshift_val >> 2);
919 insn = gen_vsx_xxsldwi_<mode> (operands[0], operands[1], operands[1],
924 shift = gen_rtx_CONST_INT (QImode, byteshift_val);
925 insn = gen_altivec_vsldoi_<mode> (operands[0], operands[1], operands[1],
933 ;; Vector shift right in bits. Currently supported ony for shift
934 ;; amounts that can be expressed as byte shifts (divisible by 8).
935 ;; General shift amounts can be supported using vsro + vsr. We're
936 ;; not expecting to see these yet (the vectorizer currently
937 ;; generates only shifts divisible by byte_size).
938 (define_expand "vec_shr_<mode>"
939 [(match_operand:VEC_L 0 "vlogical_operand" "")
940 (match_operand:VEC_L 1 "vlogical_operand" "")
941 (match_operand:QI 2 "reg_or_short_operand" "")]
945 rtx bitshift = operands[2];
948 HOST_WIDE_INT bitshift_val;
949 HOST_WIDE_INT byteshift_val;
951 if (! CONSTANT_P (bitshift))
953 bitshift_val = INTVAL (bitshift);
954 if (bitshift_val & 0x7)
956 byteshift_val = 16 - (bitshift_val >> 3);
957 if (TARGET_VSX && (byteshift_val & 0x3) == 0)
959 shift = gen_rtx_CONST_INT (QImode, byteshift_val >> 2);
960 insn = gen_vsx_xxsldwi_<mode> (operands[0], operands[1], operands[1],
965 shift = gen_rtx_CONST_INT (QImode, byteshift_val);
966 insn = gen_altivec_vsldoi_<mode> (operands[0], operands[1], operands[1],
974 ;; Expanders for rotate each element in a vector
975 (define_expand "vrotl<mode>3"
976 [(set (match_operand:VEC_I 0 "vint_operand" "")
977 (rotate:VEC_I (match_operand:VEC_I 1 "vint_operand" "")
978 (match_operand:VEC_I 2 "vint_operand" "")))]
982 ;; Expanders for arithmetic shift left on each vector element
983 (define_expand "vashl<mode>3"
984 [(set (match_operand:VEC_I 0 "vint_operand" "")
985 (ashift:VEC_I (match_operand:VEC_I 1 "vint_operand" "")
986 (match_operand:VEC_I 2 "vint_operand" "")))]
990 ;; Expanders for logical shift right on each vector element
991 (define_expand "vlshr<mode>3"
992 [(set (match_operand:VEC_I 0 "vint_operand" "")
993 (lshiftrt:VEC_I (match_operand:VEC_I 1 "vint_operand" "")
994 (match_operand:VEC_I 2 "vint_operand" "")))]
998 ;; Expanders for arithmetic shift right on each vector element
999 (define_expand "vashr<mode>3"
1000 [(set (match_operand:VEC_I 0 "vint_operand" "")
1001 (ashiftrt:VEC_I (match_operand:VEC_I 1 "vint_operand" "")
1002 (match_operand:VEC_I 2 "vint_operand" "")))]
1006 ;; Vector reduction expanders for VSX
1008 (define_expand "reduc_<VEC_reduc_name>_v2df"
1009 [(parallel [(set (match_operand:V2DF 0 "vfloat_operand" "")
1013 (match_operand:V2DF 1 "vfloat_operand" "")
1014 (parallel [(const_int 1)]))
1017 (parallel [(const_int 0)])))
1019 (clobber (match_scratch:V2DF 2 ""))])]
1020 "VECTOR_UNIT_VSX_P (V2DFmode)"
1023 ; The (VEC_reduc:V4SF
1025 ; (unspec:V4SF [(const_int 0)] UNSPEC_REDUC))
1027 ; is to allow us to use a code iterator, but not completely list all of the
1028 ; vector rotates, etc. to prevent canonicalization
1030 (define_expand "reduc_<VEC_reduc_name>_v4sf"
1031 [(parallel [(set (match_operand:V4SF 0 "vfloat_operand" "")
1033 (unspec:V4SF [(const_int 0)] UNSPEC_REDUC)
1034 (match_operand:V4SF 1 "vfloat_operand" "")))
1035 (clobber (match_scratch:V4SF 2 ""))
1036 (clobber (match_scratch:V4SF 3 ""))])]
1037 "VECTOR_UNIT_VSX_P (V4SFmode)"
1041 ;;; Expanders for vector insn patterns shared between the SPE and TARGET_PAIRED systems.
1043 (define_expand "absv2sf2"
1044 [(set (match_operand:V2SF 0 "gpc_reg_operand" "")
1045 (abs:V2SF (match_operand:V2SF 1 "gpc_reg_operand" "")))]
1046 "TARGET_PAIRED_FLOAT || TARGET_SPE"
1049 (define_expand "negv2sf2"
1050 [(set (match_operand:V2SF 0 "gpc_reg_operand" "")
1051 (neg:V2SF (match_operand:V2SF 1 "gpc_reg_operand" "")))]
1052 "TARGET_PAIRED_FLOAT || TARGET_SPE"
1055 (define_expand "addv2sf3"
1056 [(set (match_operand:V2SF 0 "gpc_reg_operand" "")
1057 (plus:V2SF (match_operand:V2SF 1 "gpc_reg_operand" "")
1058 (match_operand:V2SF 2 "gpc_reg_operand" "")))]
1059 "TARGET_PAIRED_FLOAT || TARGET_SPE"
1064 /* We need to make a note that we clobber SPEFSCR. */
1065 rtx par = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (2));
1067 XVECEXP (par, 0, 0) = gen_rtx_SET (VOIDmode, operands[0],
1068 gen_rtx_PLUS (V2SFmode, operands[1], operands[2]));
1069 XVECEXP (par, 0, 1) = gen_rtx_CLOBBER (VOIDmode, gen_rtx_REG (SImode, SPEFSCR_REGNO));
1075 (define_expand "subv2sf3"
1076 [(set (match_operand:V2SF 0 "gpc_reg_operand" "")
1077 (minus:V2SF (match_operand:V2SF 1 "gpc_reg_operand" "")
1078 (match_operand:V2SF 2 "gpc_reg_operand" "")))]
1079 "TARGET_PAIRED_FLOAT || TARGET_SPE"
1084 /* We need to make a note that we clobber SPEFSCR. */
1085 rtx par = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (2));
1087 XVECEXP (par, 0, 0) = gen_rtx_SET (VOIDmode, operands[0],
1088 gen_rtx_MINUS (V2SFmode, operands[1], operands[2]));
1089 XVECEXP (par, 0, 1) = gen_rtx_CLOBBER (VOIDmode, gen_rtx_REG (SImode, SPEFSCR_REGNO));
1095 (define_expand "mulv2sf3"
1096 [(set (match_operand:V2SF 0 "gpc_reg_operand" "")
1097 (mult:V2SF (match_operand:V2SF 1 "gpc_reg_operand" "")
1098 (match_operand:V2SF 2 "gpc_reg_operand" "")))]
1099 "TARGET_PAIRED_FLOAT || TARGET_SPE"
1104 /* We need to make a note that we clobber SPEFSCR. */
1105 rtx par = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (2));
1107 XVECEXP (par, 0, 0) = gen_rtx_SET (VOIDmode, operands[0],
1108 gen_rtx_MULT (V2SFmode, operands[1], operands[2]));
1109 XVECEXP (par, 0, 1) = gen_rtx_CLOBBER (VOIDmode, gen_rtx_REG (SImode, SPEFSCR_REGNO));
1115 (define_expand "divv2sf3"
1116 [(set (match_operand:V2SF 0 "gpc_reg_operand" "")
1117 (div:V2SF (match_operand:V2SF 1 "gpc_reg_operand" "")
1118 (match_operand:V2SF 2 "gpc_reg_operand" "")))]
1119 "TARGET_PAIRED_FLOAT || TARGET_SPE"
1124 /* We need to make a note that we clobber SPEFSCR. */
1125 rtx par = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (2));
1127 XVECEXP (par, 0, 0) = gen_rtx_SET (VOIDmode, operands[0],
1128 gen_rtx_DIV (V2SFmode, operands[1], operands[2]));
1129 XVECEXP (par, 0, 1) = gen_rtx_CLOBBER (VOIDmode, gen_rtx_REG (SImode, SPEFSCR_REGNO));