https://github.com/Lane0218 created https://github.com/llvm/llvm-project/pull/173822
This PR adds missing ClangIR (CIR) test coverage for the 128/256-bit x86
rotate-right builtins that lower to prord/prorq.
Background
- CIR support for x86 rotate builtins was implemented in
271e99daf0ff860d0ab50c688ba5e0480de78847 ("[CIR] Support x86 builtin rotate
(#169566)").
- Existing CIR tests cover the 512-bit forms
(_mm512_ror_epi32/_mm512_ror_epi64) in
clang/test/CIR/CodeGenBuiltins/X86/avx512f-builtins.c, but there was no
equivalent coverage for the 128/256-bit AVX512VL forms.
What this adds
- Extends clang/test/CIR/CodeGenBuiltins/X86/avx512vl-builtins.c with unmasked
rotate-right tests:
- _mm_ror_epi32 -> llvm.fshr.v4i32
- _mm256_ror_epi32 -> llvm.fshr.v8i32
- _mm_ror_epi64 -> llvm.fshr.v2i64
- _mm256_ror_epi64 -> llvm.fshr.v4i64
- Each test checks:
- CIR emission uses the "fshr" intrinsic with the expected vector shapes.
- CIR->LLVM lowering and OGCG (the original, non-CIR codegen) both produce
the expected @llvm.fshr.* call.
- The first two operands to @llvm.fshr.* are bound to a FileCheck variable
and verified to be the same value, to avoid false positives (see the sketch
after this list).
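Why the same-operand check matters: a rotate is a funnel shift whose two data
operands coincide, i.e. ror(x, n) == fshr(x, x, n). A minimal C sketch of what
@llvm.fshr.* computes in the rotate case (the ror32 helper below is
illustrative only, not part of the patch):

```c
#include <stdint.h>

// Rotate-right as a same-operand funnel shift: llvm.fshr.i32(x, x, n)
// shifts the 64-bit concatenation x:x right by n (mod 32) and keeps the
// low 32 bits, which is exactly a 32-bit rotate-right.
static uint32_t ror32(uint32_t x, uint32_t n) {
  n &= 31;                                   // fshr masks the shift amount
  return (x >> n) | (x << ((32 - n) & 31));  // "& 31" avoids UB when n == 0
}
```

If FileCheck were allowed to match two different SSA values in those operand
positions, the test could pass on a lowering that is not actually a rotate;
binding %[[CASTED_VAR]]/%[[V]] once and reusing it rules that out.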
Testing
- build-cir/bin/llvm-lit -sv clang/test/CIR/CodeGenBuiltins/X86/avx512vl-builtins.c
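For context, CIR codegen tests of this kind check three outputs: the emitted
CIR, the LLVM IR lowered from that CIR, and the LLVM IR from the original
(non-CIR) codegen as a reference. A sketch of the usual RUN-line shape for
such a file; the exact triple and feature flags used by avx512vl-builtins.c
may differ:

```c
// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -target-feature +avx512vl \
// RUN:   -fclangir -emit-cir -o %t.cir %s
// RUN: FileCheck --check-prefix=CIR --input-file=%t.cir %s
// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -target-feature +avx512vl \
// RUN:   -fclangir -emit-llvm -o %t-cir.ll %s
// RUN: FileCheck --check-prefix=LLVM --input-file=%t-cir.ll %s
// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -target-feature +avx512vl \
// RUN:   -emit-llvm -o %t.ll %s
// RUN: FileCheck --check-prefix=OGCG --input-file=%t.ll %s
```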
Refs
- Tracking issue: llvm/llvm-project#167765
From 9446a60deb36e0bcc56ac7344dfa324abf64039a Mon Sep 17 00:00:00 2001
From: Lane0218 <[email protected]>
Date: Mon, 29 Dec 2025 13:20:00 +0800
Subject: [PATCH] [CIR] Add AVX512VL rotate builtin tests
---
.../CodeGenBuiltins/X86/avx512vl-builtins.c | 62 +++++++++++++++++++
1 file changed, 62 insertions(+)
diff --git a/clang/test/CIR/CodeGenBuiltins/X86/avx512vl-builtins.c b/clang/test/CIR/CodeGenBuiltins/X86/avx512vl-builtins.c
index 4ca07e2f099f1..4a1fad1336e90 100644
--- a/clang/test/CIR/CodeGenBuiltins/X86/avx512vl-builtins.c
+++ b/clang/test/CIR/CodeGenBuiltins/X86/avx512vl-builtins.c
@@ -199,6 +199,68 @@ __m256i test_mm256_mask_i32gather_epi32(__m256i __v1_old, __mmask8 __mask, __m25
   return _mm256_mmask_i32gather_epi32(__v1_old, __mask, __index, __addr, 2);
 }
+__m128i test_mm_ror_epi32(__m128i __A) {
+  // CIR-LABEL: test_mm_ror_epi32
+  // CIR: cir.cast integral %{{.*}} : !s32i -> !u32i
+  // CIR: cir.vec.splat %{{.*}} : !u32i, !cir.vector<4 x !u32i>
+  // CIR: cir.call_llvm_intrinsic "fshr" %{{.*}}: (!cir.vector<4 x !s32i>, !cir.vector<4 x !s32i>, !cir.vector<4 x !u32i>) -> !cir.vector<4 x !s32i>
+
+  // LLVM-LABEL: @test_mm_ror_epi32
+  // LLVM: %[[CASTED_VAR:.*]] = bitcast <2 x i64> %{{.*}} to <4 x i32>
+  // LLVM: call <4 x i32> @llvm.fshr.v4i32(<4 x i32> %[[CASTED_VAR]], <4 x i32> %[[CASTED_VAR]], <4 x i32> splat (i32 5))
+
+  // OGCG-LABEL: @test_mm_ror_epi32
+  // OGCG: %[[CASTED_VAR:.*]] = bitcast <2 x i64> %{{.*}} to <4 x i32>
+  // OGCG: call <4 x i32> @llvm.fshr.v4i32(<4 x i32> %[[CASTED_VAR]], <4 x i32> %[[CASTED_VAR]], <4 x i32> splat (i32 5))
+  return _mm_ror_epi32(__A, 5);
+}
+
+__m256i test_mm256_ror_epi32(__m256i __A) {
+  // CIR-LABEL: test_mm256_ror_epi32
+  // CIR: cir.cast integral %{{.*}} : !s32i -> !u32i
+  // CIR: cir.vec.splat %{{.*}} : !u32i, !cir.vector<8 x !u32i>
+  // CIR: cir.call_llvm_intrinsic "fshr" %{{.*}}: (!cir.vector<8 x !s32i>, !cir.vector<8 x !s32i>, !cir.vector<8 x !u32i>) -> !cir.vector<8 x !s32i>
+
+  // LLVM-LABEL: @test_mm256_ror_epi32
+  // LLVM: %[[CASTED_VAR:.*]] = bitcast <4 x i64> %{{.*}} to <8 x i32>
+  // LLVM: call <8 x i32> @llvm.fshr.v8i32(<8 x i32> %[[CASTED_VAR]], <8 x i32> %[[CASTED_VAR]], <8 x i32> splat (i32 5))
+
+  // OGCG-LABEL: @test_mm256_ror_epi32
+  // OGCG: %[[CASTED_VAR:.*]] = bitcast <4 x i64> %{{.*}} to <8 x i32>
+  // OGCG: call <8 x i32> @llvm.fshr.v8i32(<8 x i32> %[[CASTED_VAR]], <8 x i32> %[[CASTED_VAR]], <8 x i32> splat (i32 5))
+  return _mm256_ror_epi32(__A, 5);
+}
+
+__m128i test_mm_ror_epi64(__m128i __A) {
+  // CIR-LABEL: test_mm_ror_epi64
+  // CIR: cir.cast integral %{{.*}} : !s32i -> !u32i
+  // CIR: cir.cast integral %{{.*}} : !u32i -> !u64i
+  // CIR: cir.vec.splat %{{.*}} : !u64i, !cir.vector<2 x !u64i>
+  // CIR: cir.call_llvm_intrinsic "fshr" %{{.*}}: (!cir.vector<2 x !s64i>, !cir.vector<2 x !s64i>, !cir.vector<2 x !u64i>) -> !cir.vector<2 x !s64i>
+
+  // LLVM-LABEL: @test_mm_ror_epi64
+  // LLVM: call <2 x i64> @llvm.fshr.v2i64(<2 x i64> %[[V:.*]], <2 x i64> %[[V]], <2 x i64> splat (i64 5))
+
+  // OGCG-LABEL: @test_mm_ror_epi64
+  // OGCG: call <2 x i64> @llvm.fshr.v2i64(<2 x i64> %[[V:.*]], <2 x i64> %[[V]], <2 x i64> splat (i64 5))
+  return _mm_ror_epi64(__A, 5);
+}
+
+__m256i test_mm256_ror_epi64(__m256i __A) {
+  // CIR-LABEL: test_mm256_ror_epi64
+  // CIR: cir.cast integral %{{.*}} : !s32i -> !u32i
+  // CIR: cir.cast integral %{{.*}} : !u32i -> !u64i
+  // CIR: cir.vec.splat %{{.*}} : !u64i, !cir.vector<4 x !u64i>
+  // CIR: cir.call_llvm_intrinsic "fshr" %{{.*}}: (!cir.vector<4 x !s64i>, !cir.vector<4 x !s64i>, !cir.vector<4 x !u64i>) -> !cir.vector<4 x !s64i>
+
+  // LLVM-LABEL: @test_mm256_ror_epi64
+  // LLVM: call <4 x i64> @llvm.fshr.v4i64(<4 x i64> %[[V:.*]], <4 x i64> %[[V]], <4 x i64> splat (i64 5))
+
+  // OGCG-LABEL: @test_mm256_ror_epi64
+  // OGCG: call <4 x i64> @llvm.fshr.v4i64(<4 x i64> %[[V:.*]], <4 x i64> %[[V]], <4 x i64> splat (i64 5))
+  return _mm256_ror_epi64(__A, 5);
+}
+
 __m256 test_mm256_insertf32x4(__m256 __A, __m128 __B) {
   // CIR-LABEL: test_mm256_insertf32x4
   // CIR: %{{.*}} = cir.vec.shuffle(%{{.*}}, %{{.*}} : !cir.vector<8 x !cir.float>) [#cir.int<0> : !s32i, #cir.int<1> : !s32i, #cir.int<2> : !s32i, #cir.int<3> : !s32i, #cir.int<8> : !s32i, #cir.int<9> : !s32i, #cir.int<10> : !s32i, #cir.int<11> : !s32i] : !cir.vector<8 x !cir.float>
_______________________________________________
cfe-commits mailing list
[email protected]
https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits