Hi,
On 09 May 18:45, Jakub Jelinek wrote:
> Hi!
> 
> vinsertps is already in AVX512F, so we can use use v constraints
> freely.
> 
> Bootstrapped/regtested on x86_64-linux and i686-linux, ok for trunk?
OK.

--
Thanks, K
> 
> 2016-05-09  Jakub Jelinek  <ja...@redhat.com>
> 
>       * config/i386/sse.md (*vec_setv4sf_sse4_1, sse4_1_insertps): Use v
>       constraint instead of x in avx alternatives.  Use maybe_evex instead
>       of vex prefix.
> 
>       * gcc.target/i386/avx512vl-vinsertps-1.c: New test.
> 
> --- gcc/config/i386/sse.md.jj 2016-05-09 12:34:58.839865460 +0200
> +++ gcc/config/i386/sse.md    2016-05-09 13:15:55.400130875 +0200
> @@ -6657,11 +6657,11 @@ (define_insn "vec_set<mode>_0"
>  
>  ;; A subset is vec_setv4sf.
>  (define_insn "*vec_setv4sf_sse4_1"
> -  [(set (match_operand:V4SF 0 "register_operand" "=Yr,*x,x")
> +  [(set (match_operand:V4SF 0 "register_operand" "=Yr,*x,v")
>       (vec_merge:V4SF
>         (vec_duplicate:V4SF
> -         (match_operand:SF 2 "nonimmediate_operand" "Yrm,*xm,xm"))
> -       (match_operand:V4SF 1 "register_operand" "0,0,x")
> +         (match_operand:SF 2 "nonimmediate_operand" "Yrm,*xm,vm"))
> +       (match_operand:V4SF 1 "register_operand" "0,0,v")
>         (match_operand:SI 3 "const_int_operand")))]
>    "TARGET_SSE4_1
>     && ((unsigned) exact_log2 (INTVAL (operands[3]))
> @@ -6684,13 +6684,13 @@ (define_insn "*vec_setv4sf_sse4_1"
>     (set_attr "prefix_data16" "1,1,*")
>     (set_attr "prefix_extra" "1")
>     (set_attr "length_immediate" "1")
> -   (set_attr "prefix" "orig,orig,vex")
> +   (set_attr "prefix" "orig,orig,maybe_evex")
>     (set_attr "mode" "V4SF")])
>  
>  (define_insn "sse4_1_insertps"
> -  [(set (match_operand:V4SF 0 "register_operand" "=Yr,*x,x")
> -     (unspec:V4SF [(match_operand:V4SF 2 "nonimmediate_operand" "Yrm,*xm,xm")
> -                   (match_operand:V4SF 1 "register_operand" "0,0,x")
> +  [(set (match_operand:V4SF 0 "register_operand" "=Yr,*x,v")
> +     (unspec:V4SF [(match_operand:V4SF 2 "nonimmediate_operand" "Yrm,*xm,vm")
> +                   (match_operand:V4SF 1 "register_operand" "0,0,v")
>                     (match_operand:SI 3 "const_0_to_255_operand" "n,n,n")]
>                    UNSPEC_INSERTPS))]
>    "TARGET_SSE4_1"
> @@ -6718,7 +6718,7 @@ (define_insn "sse4_1_insertps"
>     (set_attr "prefix_data16" "1,1,*")
>     (set_attr "prefix_extra" "1")
>     (set_attr "length_immediate" "1")
> -   (set_attr "prefix" "orig,orig,vex")
> +   (set_attr "prefix" "orig,orig,maybe_evex")
>     (set_attr "mode" "V4SF")])
>  
>  (define_split
> --- gcc/testsuite/gcc.target/i386/avx512vl-vinsertps-1.c.jj   2016-05-09 
> 13:10:08.277794535 +0200
> +++ gcc/testsuite/gcc.target/i386/avx512vl-vinsertps-1.c      2016-05-09 
> 13:13:51.788792211 +0200
> @@ -0,0 +1,39 @@
> +/* { dg-do compile { target { ! ia32 } } } */
> +/* { dg-options "-O2 -mavx512vl" } */
> +
> +#include <x86intrin.h>
> +
> +__m128
> +f1 (__m128 a, __m128 b)
> +{
> +  register __m128 c __asm ("xmm16") = a;
> +  asm volatile ("" : "+v" (c));
> +  c = _mm_insert_ps (c, b, 1);
> +  asm volatile ("" : "+v" (c));
> +  return c;
> +}
> +
> +/* { dg-final { scan-assembler "vinsertps\[^\n\r\]*xmm16" } } */
> +
> +__v4sf
> +f2 (__v4sf a, float b)
> +{
> +  register __v4sf c __asm ("xmm17") = a;
> +  asm volatile ("" : "+v" (c));
> +  c[1] = b;
> +  asm volatile ("" : "+v" (c));
> +  return c;
> +}
> +
> +/* { dg-final { scan-assembler "vinsertps\[^\n\r\]*xmm17" } } */
> +
> +__v4sf
> +f3 (__v4sf a, float b)
> +{
> +  register float c __asm ("xmm18") = b;
> +  asm volatile ("" : "+v" (c));
> +  a[1] = c;
> +  return a;
> +}
> +
> +/* { dg-final { scan-assembler "vinsertps\[^\n\r\]*xmm18" } } */
> 
>       Jakub

Reply via email to