Skip to content

Commit

Permalink
Added cl_khr_fp16 extension support for test_op_vector_insert from sp…
Browse files Browse the repository at this point in the history
…irv_new (#1766)

* Added cl_khr_fp16 extension support for test_op_vector_insert from spirv_new, work in progress.

* Added cl_khr_fp16 extension support for test_op_vector_insert from spirv_new (issue #142)
  • Loading branch information
shajder authored Jul 11, 2023
1 parent 9e8430a commit 1e2d352
Show file tree
Hide file tree
Showing 4 changed files with 125 additions and 19 deletions.
43 changes: 43 additions & 0 deletions test_conformance/spirv_new/spirv_asm/vector_half8_insert.spvasm32
Original file line number Diff line number Diff line change
@@ -0,0 +1,43 @@
; SPIR-V
; Version: 1.0
; Generator: Khronos SPIR-V Tools Assembler; 0
; Bound: 23
; Schema: 0
OpCapability Addresses
OpCapability Linkage
OpCapability Kernel
OpCapability Vector16
OpCapability Float16
OpMemoryModel Physical32 OpenCL
OpEntryPoint Kernel %1 "vector_half8_insert" %gl_GlobalInvocationID
OpName %in "in"
OpDecorate %gl_GlobalInvocationID BuiltIn GlobalInvocationId
OpDecorate %gl_GlobalInvocationID Constant
OpDecorate %in FuncParamAttr NoCapture
OpDecorate %4 FuncParamAttr NoCapture
OpDecorate %gl_GlobalInvocationID LinkageAttributes "__spirv_GlobalInvocationId" Import
%uint = OpTypeInt 32 0
%v3uint = OpTypeVector %uint 3
%_ptr_Input_v3uint = OpTypePointer Input %v3uint
%void = OpTypeVoid
%half = OpTypeFloat 16
%v8half = OpTypeVector %half 8
%_ptr_CrossWorkgroup_half = OpTypePointer CrossWorkgroup %half
%_ptr_CrossWorkgroup_v8half = OpTypePointer CrossWorkgroup %v8half
%13 = OpTypeFunction %void %_ptr_CrossWorkgroup_half %_ptr_CrossWorkgroup_v8half %uint
%gl_GlobalInvocationID = OpVariable %_ptr_Input_v3uint Input
%1 = OpFunction %void None %13
%in = OpFunctionParameter %_ptr_CrossWorkgroup_half
%4 = OpFunctionParameter %_ptr_CrossWorkgroup_v8half
%14 = OpFunctionParameter %uint
%15 = OpLabel
%16 = OpLoad %v3uint %gl_GlobalInvocationID Aligned 0
%17 = OpCompositeExtract %uint %16 0
%18 = OpInBoundsPtrAccessChain %_ptr_CrossWorkgroup_half %in %17
%19 = OpLoad %half %18
%20 = OpInBoundsPtrAccessChain %_ptr_CrossWorkgroup_v8half %4 %17
%21 = OpLoad %v8half %20
%22 = OpVectorInsertDynamic %v8half %21 %19 %14
OpStore %20 %22
OpReturn
OpFunctionEnd
48 changes: 48 additions & 0 deletions test_conformance/spirv_new/spirv_asm/vector_half8_insert.spvasm64
Original file line number Diff line number Diff line change
@@ -0,0 +1,48 @@
; SPIR-V
; Version: 1.0
; Generator: Khronos SPIR-V Tools Assembler; 0
; Bound: 27
; Schema: 0
OpCapability Addresses
OpCapability Linkage
OpCapability Kernel
OpCapability Int64
OpCapability Vector16
OpCapability Float16
OpMemoryModel Physical64 OpenCL
OpEntryPoint Kernel %1 "vector_half8_insert" %gl_GlobalInvocationID
OpName %in "in"
OpDecorate %gl_GlobalInvocationID BuiltIn GlobalInvocationId
OpDecorate %gl_GlobalInvocationID Constant
OpDecorate %in FuncParamAttr NoCapture
OpDecorate %4 FuncParamAttr NoCapture
OpDecorate %gl_GlobalInvocationID LinkageAttributes "__spirv_GlobalInvocationId" Import
%ulong = OpTypeInt 64 0
%v3ulong = OpTypeVector %ulong 3
%_ptr_Input_v3ulong = OpTypePointer Input %v3ulong
%ulong_32 = OpConstant %ulong 32
%uint = OpTypeInt 32 0
%void = OpTypeVoid
%half = OpTypeFloat 16
%v8half = OpTypeVector %half 8
%_ptr_CrossWorkgroup_half = OpTypePointer CrossWorkgroup %half
%_ptr_CrossWorkgroup_v8half = OpTypePointer CrossWorkgroup %v8half
%15 = OpTypeFunction %void %_ptr_CrossWorkgroup_half %_ptr_CrossWorkgroup_v8half %uint
%gl_GlobalInvocationID = OpVariable %_ptr_Input_v3ulong Input
%1 = OpFunction %void None %15
%in = OpFunctionParameter %_ptr_CrossWorkgroup_half
%4 = OpFunctionParameter %_ptr_CrossWorkgroup_v8half
%16 = OpFunctionParameter %uint
%17 = OpLabel
%18 = OpLoad %v3ulong %gl_GlobalInvocationID Aligned 0
%19 = OpCompositeExtract %ulong %18 0
%20 = OpShiftLeftLogical %ulong %19 %ulong_32
%21 = OpShiftRightArithmetic %ulong %20 %ulong_32
%22 = OpInBoundsPtrAccessChain %_ptr_CrossWorkgroup_half %in %21
%23 = OpLoad %half %22
%24 = OpInBoundsPtrAccessChain %_ptr_CrossWorkgroup_v8half %4 %21
%25 = OpLoad %v8half %24
%26 = OpVectorInsertDynamic %v8half %25 %23 %16
OpStore %24 %26
OpReturn
OpFunctionEnd
52 changes: 33 additions & 19 deletions test_conformance/spirv_new/test_op_vector_insert.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,17 @@ int test_insert(cl_device_id deviceID, cl_context context,
return 0;
}
}

if (std::string(name).find("half") != std::string::npos)
{
if (!is_extension_available(deviceID, "cl_khr_fp16"))
{
log_info(
"Extension cl_khr_fp16 not supported; skipping half tests.\n");
return 0;
}
}

cl_int err = CL_SUCCESS;
clProgramWrapper prog;
err = get_program_with_il(prog, deviceID, context, name);
Expand Down Expand Up @@ -94,27 +105,30 @@ int test_insert(cl_device_id deviceID, cl_context context,
return 0;
}

#define TEST_VECTOR_INSERT(TYPE, N) \
TEST_SPIRV_FUNC(op_vector_##TYPE##N##_insert) \
{ \
typedef cl_##TYPE##N Tv; \
typedef cl_##TYPE Ts; \
const int num = 1 << 20; \
std::vector<Ts> in(num); \
const char *name = "vector_" #TYPE #N "_insert"; \
\
RandomSeed seed(gRandomSeed); \
\
for (int i = 0; i < num; i++) { \
in[i] = genrand<Ts>(seed); \
} \
\
return test_insert<Ts, Tv>(deviceID, \
context, queue, \
name, \
in, N); \
#define TEST_VECTOR_INSERT(TYPE, N) \
TEST_SPIRV_FUNC(op_vector_##TYPE##N##_insert) \
{ \
if (sizeof(cl_##TYPE) == 2) \
{ \
PASSIVE_REQUIRE_FP16_SUPPORT(deviceID); \
} \
typedef cl_##TYPE##N Tv; \
typedef cl_##TYPE Ts; \
const int num = 1 << 20; \
std::vector<Ts> in(num); \
const char *name = "vector_" #TYPE #N "_insert"; \
\
RandomSeed seed(gRandomSeed); \
\
for (int i = 0; i < num; i++) \
{ \
in[i] = genrand<Ts>(seed); \
} \
\
return test_insert<Ts, Tv>(deviceID, context, queue, name, in, N); \
}

TEST_VECTOR_INSERT(half, 8)
TEST_VECTOR_INSERT(int, 4)
TEST_VECTOR_INSERT(float, 4)
TEST_VECTOR_INSERT(long, 2)
Expand Down
1 change: 1 addition & 0 deletions test_conformance/spirv_new/types.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -113,6 +113,7 @@ GENRAND_REAL_FUNC(cl_double, 2)
GENRAND_REAL_FUNC(cl_double, 4)
GENRAND_REAL_FUNC(cl_half, 2)
GENRAND_REAL_FUNC(cl_half, 4)
GENRAND_REAL_FUNC(cl_half, 8)

template<> inline cl_half genrandReal<cl_half>(RandomSeed &seed)
{
Expand Down

0 comments on commit 1e2d352

Please sign in to comment.