aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorAlexander Ivchenko <alexander.ivchenko@intel.com>2014-09-10 06:54:51 +0000
committerKirill Yukhin <kyukhin@gcc.gnu.org>2014-09-10 06:54:51 +0000
commitb9826286455578db4b0a3b8eb511484407745797 (patch)
treec6822eb55a88f7ff01f0ac0ae4ea5da23707a6a2
parentb040ded3c6aacdac0218328a9e7245ea1352e3ec (diff)
downloadgcc-b9826286455578db4b0a3b8eb511484407745797.zip
gcc-b9826286455578db4b0a3b8eb511484407745797.tar.gz
gcc-b9826286455578db4b0a3b8eb511484407745797.tar.bz2
AVX-512. Add reduce, range, fpclass insn patterns.
gcc/ * config/i386/i386.c (ix86_expand_args_builtin): Handle avx512dq_rangepv8df_mask_round, avx512dq_rangepv16sf_mask_round, avx512dq_rangepv4df_mask, avx512dq_rangepv8sf_mask, avx512dq_rangepv2df_mask, avx512dq_rangepv4sf_mask. * config/i386/sse.md (define_c_enum "unspec"): Add UNSPEC_REDUCE, UNSPEC_FPCLASS, UNSPEC_RANGE. (define_insn "<mask_codefor>reducep<mode><mask_name>"): New. (define_insn "reduces<mode>"): Ditto. (define_insn "avx512dq_rangep<mode><mask_name><round_saeonly_name>"): Ditto. (define_insn "avx512dq_ranges<mode><round_saeonly_name>"): Ditto. (define_insn "avx512dq_fpclass<mode><mask_scalar_merge_name>"): Ditto. (define_insn "avx512dq_vmfpclass<mode>"): Ditto.. Co-Authored-By: Andrey Turetskiy <andrey.turetskiy@intel.com> Co-Authored-By: Anna Tikhonova <anna.tikhonova@intel.com> Co-Authored-By: Ilya Tocar <ilya.tocar@intel.com> Co-Authored-By: Ilya Verbin <ilya.verbin@intel.com> Co-Authored-By: Kirill Yukhin <kirill.yukhin@intel.com> Co-Authored-By: Maxim Kuznetsov <maxim.kuznetsov@intel.com> Co-Authored-By: Michael Zolotukhin <michael.v.zolotukhin@intel.com> From-SVN: r215107
-rw-r--r--gcc/ChangeLog25
-rw-r--r--gcc/config/i386/i386.c6
-rw-r--r--gcc/config/i386/sse.md90
3 files changed, 121 insertions, 0 deletions
diff --git a/gcc/ChangeLog b/gcc/ChangeLog
index 5145aca..7668aab 100644
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -8,6 +8,31 @@
Michael Zolotukhin <michael.v.zolotukhin@intel.com>
* config/i386/i386.c
+ (ix86_expand_args_builtin): Handle avx512dq_rangepv8df_mask_round,
+ avx512dq_rangepv16sf_mask_round, avx512dq_rangepv4df_mask,
+ avx512dq_rangepv8sf_mask, avx512dq_rangepv2df_mask,
+ avx512dq_rangepv4sf_mask.
+ * config/i386/sse.md
+ (define_c_enum "unspec"): Add UNSPEC_REDUCE, UNSPEC_FPCLASS,
+ UNSPEC_RANGE.
+ (define_insn "<mask_codefor>reducep<mode><mask_name>"): New.
+ (define_insn "reduces<mode>"): Ditto.
+ (define_insn "avx512dq_rangep<mode><mask_name><round_saeonly_name>"):
+ Ditto.
+ (define_insn "avx512dq_ranges<mode><round_saeonly_name>"): Ditto.
+ (define_insn "avx512dq_fpclass<mode><mask_scalar_merge_name>"): Ditto.
+ (define_insn "avx512dq_vmfpclass<mode>"): Ditto..
+
+2014-09-10 Alexander Ivchenko <alexander.ivchenko@intel.com>
+ Maxim Kuznetsov <maxim.kuznetsov@intel.com>
+ Anna Tikhonova <anna.tikhonova@intel.com>
+ Ilya Tocar <ilya.tocar@intel.com>
+ Andrey Turetskiy <andrey.turetskiy@intel.com>
+ Ilya Verbin <ilya.verbin@intel.com>
+ Kirill Yukhin <kirill.yukhin@intel.com>
+ Michael Zolotukhin <michael.v.zolotukhin@intel.com>
+
+ * config/i386/i386.c
(avx512f_vgetmantv2df_round): Rename from "avx512f_getmantv2df_round".
(avx512f_vgetmantv4sf_round): Rename from "avx512f_vgetmantv4sf_round".
(ix86_expand_args_builtin): Handle avx512vl_getmantv8sf_mask,
diff --git a/gcc/config/i386/i386.c b/gcc/config/i386/i386.c
index 8449089..8f45e52 100644
--- a/gcc/config/i386/i386.c
+++ b/gcc/config/i386/i386.c
@@ -34090,6 +34090,12 @@ ix86_expand_args_builtin (const struct builtin_description *d,
case CODE_FOR_avx512vl_getmantv4df_mask:
case CODE_FOR_avx512vl_getmantv4sf_mask:
case CODE_FOR_avx512vl_getmantv2df_mask:
+ case CODE_FOR_avx512dq_rangepv8df_mask_round:
+ case CODE_FOR_avx512dq_rangepv16sf_mask_round:
+ case CODE_FOR_avx512dq_rangepv4df_mask:
+ case CODE_FOR_avx512dq_rangepv8sf_mask:
+ case CODE_FOR_avx512dq_rangepv2df_mask:
+ case CODE_FOR_avx512dq_rangepv4sf_mask:
error ("the last argument must be a 4-bit immediate");
return const0_rtx;
diff --git a/gcc/config/i386/sse.md b/gcc/config/i386/sse.md
index 1706e4c..78276b7 100644
--- a/gcc/config/i386/sse.md
+++ b/gcc/config/i386/sse.md
@@ -128,6 +128,11 @@
UNSPEC_SHA256MSG1
UNSPEC_SHA256MSG2
UNSPEC_SHA256RNDS2
+
+ ;; For AVX512DQ support
+ UNSPEC_REDUCE
+ UNSPEC_FPCLASS
+ UNSPEC_RANGE
])
(define_c_enum "unspecv" [
@@ -2330,6 +2335,34 @@
DONE;
})
+(define_insn "<mask_codefor>reducep<mode><mask_name>"
+ [(set (match_operand:VF_AVX512VL 0 "register_operand" "=v")
+ (unspec:VF_AVX512VL
+ [(match_operand:VF_AVX512VL 1 "nonimmediate_operand" "vm")
+ (match_operand:SI 2 "const_0_to_255_operand")]
+ UNSPEC_REDUCE))]
+ "TARGET_AVX512DQ"
+ "vreduce<ssemodesuffix>\t{%2, %1, %0<mask_operand3>|%0<mask_operand3>, %1, %2}"
+ [(set_attr "type" "sse")
+ (set_attr "prefix" "evex")
+ (set_attr "mode" "<MODE>")])
+
+(define_insn "reduces<mode>"
+ [(set (match_operand:VF_128 0 "register_operand" "=v")
+ (vec_merge:VF_128
+ (unspec:VF_128
+ [(match_operand:VF_128 1 "register_operand" "v")
+ (match_operand:VF_128 2 "nonimmediate_operand" "vm")
+ (match_operand:SI 3 "const_0_to_255_operand")]
+ UNSPEC_REDUCE)
+ (match_dup 1)
+ (const_int 1)))]
+ "TARGET_AVX512DQ"
+ "vreduce<ssescalarmodesuffix>\t{%3, %2, %1, %0|%0, %1, %2, %3}"
+ [(set_attr "type" "sse")
+ (set_attr "prefix" "evex")
+ (set_attr "mode" "<MODE>")])
+
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
;;
;; Parallel floating point comparisons
@@ -16754,6 +16787,63 @@
(set_attr "memory" "none,load")
(set_attr "mode" "<sseinsnmode>")])
+(define_insn "avx512dq_rangep<mode><mask_name><round_saeonly_name>"
+ [(set (match_operand:VF_AVX512VL 0 "register_operand" "=v")
+ (unspec:VF_AVX512VL
+ [(match_operand:VF_AVX512VL 1 "register_operand" "v")
+ (match_operand:VF_AVX512VL 2 "<round_saeonly_nimm_predicate>" "<round_saeonly_constraint>")
+ (match_operand:SI 3 "const_0_to_15_operand")]
+ UNSPEC_RANGE))]
+ "TARGET_AVX512DQ && <round_saeonly_mode512bit_condition>"
+ "vrange<ssemodesuffix>\t{<round_saeonly_mask_op4>%3, %2, %1, %0<mask_operand4>|%0<mask_operand4>, %1, %2, %3<round_saeonly_mask_op4>}"
+ [(set_attr "type" "sse")
+ (set_attr "prefix" "evex")
+ (set_attr "mode" "<MODE>")])
+
+(define_insn "avx512dq_ranges<mode><round_saeonly_name>"
+ [(set (match_operand:VF_128 0 "register_operand" "=v")
+ (vec_merge:VF_128
+ (unspec:VF_128
+ [(match_operand:VF_128 1 "register_operand" "v")
+ (match_operand:VF_128 2 "<round_saeonly_nimm_predicate>" "<round_saeonly_constraint>")
+ (match_operand:SI 3 "const_0_to_15_operand")]
+ UNSPEC_RANGE)
+ (match_dup 1)
+ (const_int 1)))]
+ "TARGET_AVX512DQ"
+ "vrange<ssescalarmodesuffix>\t{<round_saeonly_op4>%3, %2, %1, %0|%0, %1, %2, %3<round_saeonly_op4>}"
+ [(set_attr "type" "sse")
+ (set_attr "prefix" "evex")
+ (set_attr "mode" "<MODE>")])
+
+(define_insn "avx512dq_fpclass<mode><mask_scalar_merge_name>"
+ [(set (match_operand:<avx512fmaskmode> 0 "register_operand" "=Yk")
+ (unspec:<avx512fmaskmode>
+ [(match_operand:VF_AVX512VL 1 "register_operand" "v")
+ (match_operand:QI 2 "const_0_to_255_operand" "n")]
+ UNSPEC_FPCLASS))]
+ "TARGET_AVX512DQ"
+ "vfpclass<ssemodesuffix>\t{%2, %1, %0<mask_scalar_merge_operand3>|%0<mask_scalar_merge_operand3>, %1, %2}";
+ [(set_attr "type" "sse")
+ (set_attr "length_immediate" "1")
+ (set_attr "prefix" "evex")
+ (set_attr "mode" "<MODE>")])
+
+(define_insn "avx512dq_vmfpclass<mode>"
+ [(set (match_operand:<avx512fmaskmode> 0 "register_operand" "=Yk")
+ (and:<avx512fmaskmode>
+ (unspec:<avx512fmaskmode>
+ [(match_operand:VF_128 1 "register_operand" "v")
+ (match_operand:QI 2 "const_0_to_255_operand" "n")]
+ UNSPEC_FPCLASS)
+ (const_int 1)))]
+ "TARGET_AVX512DQ"
+ "vfpclass<ssescalarmodesuffix>\t{%2, %1, %0|%0, %1, %2}";
+ [(set_attr "type" "sse")
+ (set_attr "length_immediate" "1")
+ (set_attr "prefix" "evex")
+ (set_attr "mode" "<MODE>")])
+
(define_insn "<avx512>_getmant<mode><mask_name><round_saeonly_name>"
[(set (match_operand:VF_AVX512VL 0 "register_operand" "=v")
(unspec:VF_AVX512VL