forked from llvm/llvm-project
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[HLSL] Implement HLSL Aggregate splatting (llvm#118992)
Implement HLSL Aggregate Splat casting, which handles splatting for arrays and structs, and for vectors when splatting from a vec1. Closes llvm#100609 and closes llvm#100619. Depends on llvm#118842.
- Loading branch information
Showing
18 changed files
with
305 additions
and
4 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
87 changes: 87 additions & 0 deletions
87
clang/test/CodeGenHLSL/BasicFeatures/AggregateSplatCast.hlsl
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,87 @@ | ||
// RUN: %clang_cc1 -finclude-default-header -triple dxil-pc-shadermodel6.3-library -x hlsl -emit-llvm -disable-llvm-passes -o - %s | FileCheck %s | ||
|
||
// array splat | ||
// CHECK-LABEL: define void {{.*}}call4 | ||
// CHECK: [[B:%.*]] = alloca [2 x i32], align 4 | ||
// CHECK-NEXT: call void @llvm.memcpy.p0.p0.i32(ptr align 4 [[B]], ptr align 4 {{.*}}, i32 8, i1 false) | ||
// CHECK-NEXT: [[G1:%.*]] = getelementptr inbounds [2 x i32], ptr [[B]], i32 0, i32 0 | ||
// CHECK-NEXT: [[G2:%.*]] = getelementptr inbounds [2 x i32], ptr [[B]], i32 0, i32 1 | ||
// CHECK-NEXT: store i32 3, ptr [[G1]], align 4 | ||
// CHECK-NEXT: store i32 3, ptr [[G2]], align 4 | ||
// call4: overwrite a two-element int array with the scalar literal 3 splatted through a cast. | ||
export void call4() { | ||
// Initial contents {1,2} differ from the splat value 3. | ||
int B[2] = {1,2}; | ||
// Scalar-to-array cast; the FileCheck expectations above require a store of 3 into element 0 and element 1. | ||
B = (int[2])3; | ||
} | ||
|
||
// splat from vector of length 1 | ||
// CHECK-LABEL: define void {{.*}}call8 | ||
// CHECK: [[A:%.*]] = alloca <1 x i32>, align 4 | ||
// CHECK-NEXT: [[B:%.*]] = alloca [2 x i32], align 4 | ||
// CHECK-NEXT: store <1 x i32> splat (i32 1), ptr [[A]], align 4 | ||
// CHECK-NEXT: call void @llvm.memcpy.p0.p0.i32(ptr align 4 [[B]], ptr align 4 {{.*}}, i32 8, i1 false) | ||
// CHECK-NEXT: [[L:%.*]] = load <1 x i32>, ptr [[A]], align 4 | ||
// CHECK-NEXT: [[VL:%.*]] = extractelement <1 x i32> [[L]], i32 0 | ||
// CHECK-NEXT: [[G1:%.*]] = getelementptr inbounds [2 x i32], ptr [[B]], i32 0, i32 0 | ||
// CHECK-NEXT: [[G2:%.*]] = getelementptr inbounds [2 x i32], ptr [[B]], i32 0, i32 1 | ||
// CHECK-NEXT: store i32 [[VL]], ptr [[G1]], align 4 | ||
// CHECK-NEXT: store i32 [[VL]], ptr [[G2]], align 4 | ||
// call8: overwrite a two-element int array by splatting the single element of an int1 vector. | ||
export void call8() { | ||
// One-element vector used as the splat source. | ||
int1 A = {1}; | ||
int B[2] = {1,2}; | ||
// Vector-of-1 to array cast; the FileCheck expectations above require one extractelement whose result is stored to both elements. | ||
B = (int[2])A; | ||
} | ||
|
||
// vector splat from vector of length 1 | ||
// CHECK-LABEL: define void {{.*}}call1 | ||
// CHECK: [[B:%.*]] = alloca <1 x float>, align 4 | ||
// CHECK-NEXT: [[A:%.*]] = alloca <4 x i32>, align 16 | ||
// CHECK-NEXT: store <1 x float> splat (float 1.000000e+00), ptr [[B]], align 4 | ||
// CHECK-NEXT: [[L:%.*]] = load <1 x float>, ptr [[B]], align 4 | ||
// CHECK-NEXT: [[VL:%.*]] = extractelement <1 x float> [[L]], i32 0 | ||
// CHECK-NEXT: [[C:%.*]] = fptosi float [[VL]] to i32 | ||
// CHECK-NEXT: [[SI:%.*]] = insertelement <4 x i32> poison, i32 [[C]], i64 0 | ||
// CHECK-NEXT: [[S:%.*]] = shufflevector <4 x i32> [[SI]], <4 x i32> poison, <4 x i32> zeroinitializer | ||
// CHECK-NEXT: store <4 x i32> [[S]], ptr [[A]], align 16 | ||
// call1: initialize an int4 from a float1, so the splat also converts the element type. | ||
export void call1() { | ||
float1 B = {1.0}; | ||
// The FileCheck expectations above require extractelement, then fptosi, then an insertelement/shufflevector splat into <4 x i32>. | ||
int4 A = (int4)B; | ||
} | ||
|
||
// Aggregate used as the destination type of the struct splat tests below. | ||
// Its two fields have different types, so those tests expect the int source to be converted (sitofp) before the store into Y. | ||
struct S { | ||
int X; | ||
float Y; | ||
}; | ||
|
||
// struct splats | ||
// CHECK-LABEL: define void {{.*}}call3 | ||
// CHECK: [[A:%.*]] = alloca <1 x i32>, align 4 | ||
// CHECK: [[s:%.*]] = alloca %struct.S, align 4 | ||
// CHECK-NEXT: store <1 x i32> splat (i32 1), ptr [[A]], align 4 | ||
// CHECK-NEXT: [[L:%.*]] = load <1 x i32>, ptr [[A]], align 4 | ||
// CHECK-NEXT: [[VL:%.*]] = extractelement <1 x i32> [[L]], i32 0 | ||
// CHECK-NEXT: [[G1:%.*]] = getelementptr inbounds %struct.S, ptr [[s]], i32 0, i32 0 | ||
// CHECK-NEXT: [[G2:%.*]] = getelementptr inbounds %struct.S, ptr [[s]], i32 0, i32 1 | ||
// CHECK-NEXT: store i32 [[VL]], ptr [[G1]], align 4 | ||
// CHECK-NEXT: [[C:%.*]] = sitofp i32 [[VL]] to float | ||
// CHECK-NEXT: store float [[C]], ptr [[G2]], align 4 | ||
// call3: initialize struct S by splatting the single element of an int1 vector. | ||
// NOTE(review): this body is identical to call5 below, so both tests exercise the vector-of-length-1 source. | ||
// Presumably one of them was meant to splat from a plain scalar -- confirm intent before changing. | ||
export void call3() { | ||
int1 A = {1}; | ||
// Vector-of-1 to struct cast; the FileCheck expectations above require the extracted i32 stored to X and its sitofp result stored to Y. | ||
S s = (S)A; | ||
} | ||
|
||
// struct splat from vector of length 1 | ||
// CHECK-LABEL: define void {{.*}}call5 | ||
// CHECK: [[A:%.*]] = alloca <1 x i32>, align 4 | ||
// CHECK-NEXT: [[s:%.*]] = alloca %struct.S, align 4 | ||
// CHECK-NEXT: store <1 x i32> splat (i32 1), ptr [[A]], align 4 | ||
// CHECK-NEXT: [[L:%.*]] = load <1 x i32>, ptr [[A]], align 4 | ||
// CHECK-NEXT: [[VL:%.*]] = extractelement <1 x i32> [[L]], i32 0 | ||
// CHECK-NEXT: [[G1:%.*]] = getelementptr inbounds %struct.S, ptr [[s]], i32 0, i32 0 | ||
// CHECK-NEXT: [[G2:%.*]] = getelementptr inbounds %struct.S, ptr [[s]], i32 0, i32 1 | ||
// CHECK-NEXT: store i32 [[VL]], ptr [[G1]], align 4 | ||
// CHECK-NEXT: [[C:%.*]] = sitofp i32 [[VL]] to float | ||
// CHECK-NEXT: store float [[C]], ptr [[G2]], align 4 | ||
// call5: initialize struct S by splatting the single element of an int1 vector. | ||
export void call5() { | ||
int1 A = {1}; | ||
// Vector-of-1 to struct cast; the FileCheck expectations above require the extracted i32 stored to X and its sitofp result stored to Y. | ||
S s = (S)A; | ||
} |
Oops, something went wrong.