================
@@ -0,0 +1,28 @@
+// REQUIRES: aarch64-registered-target || arm-registered-target
+
+// RUN: %clang_cc1 -triple arm64-none-linux-gnu
-target-feature +neon -target-feature +bf16 -disable-O0-optnone
-flax-vector-conversions=none -emit-llvm -o - %s | opt -S
-passes=mem2reg,sroa | FileCheck %s --check-prefixes=ALL,LLVM
+// RUN: %if cir-enabled %{%clang_cc1 -triple arm64-none-linux-gnu
-target-feature +neon -target-feature +bf16 -disable-O0-optnone
-flax-vector-conversions=none -fclangir -emit-llvm -o - %s | opt -S
-passes=mem2reg,sroa | FileCheck %s --check-prefixes=ALL,LLVM %}
+// RUN: %if cir-enabled %{%clang_cc1 -triple arm64-none-linux-gnu
-target-feature +neon -target-feature +bf16 -disable-O0-optnone
-flax-vector-conversions=none -fclangir -emit-cir -o - %s |
FileCheck %s --check-prefixes=ALL,CIR %}
+
+#include <arm_neon.h>
+
+//===------------------------------------------------------===//
+// BF16 get/set lane
+//===------------------------------------------------------===//
+// TODO: Add the remaining intrinsics from this group.
+
+// ALL-LABEL: @test_vduph_lane_bf16(
+bfloat16_t test_vduph_lane_bf16(bfloat16x4_t v) {
+ // CIR: cir.vec.extract %{{.*}}[%{{.*}} : !s32i] : !cir.vector<4 x !cir.bf16>
+ // LLVM: [[VGET_LANE:%.*]] = extractelement <4 x bfloat> %{{.*}}, i{{32|64}}
1
+ // LLVM: ret bfloat [[VGET_LANE]]
+ return vduph_lane_bf16(v, 1);
+}
+
+// ALL-LABEL: @test_vduph_laneq_bf16(
+bfloat16_t test_vduph_laneq_bf16(bfloat16x8_t v) {
+ // CIR: cir.vec.extract %{{.*}}[%{{.*}} : !s32i] : !cir.vector<8 x !cir.bf16>
+ // LLVM: [[VGETQ_LANE:%.*]] = extractelement <8 x bfloat> %{{.*}},
i{{32|64}} 7
----------------
banach-space wrote:
```suggestion
// LLVM: [[VGETQ_LANE:%.*]] = extractelement <8 x bfloat> %{{.*}}, i32 7
```
https://github.com/llvm/llvm-project/pull/185852
_______________________________________________
cfe-commits mailing list
[email protected]
https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits