blob: d128e6b67581c481e37ae87ea96de7f0855c431b [file]
; RUN: clspv-opt %s -o %t -ReplaceOpenCLBuiltin
; RUN: FileCheck %s < %t
target datalayout = "e-p:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024"
target triple = "spir-unknown-unknown"
; CHECK-NOT: call spir_func
define void @foo(<4 x float> addrspace(1)* %a, <4 x float> addrspace(1)* %b, i32 %n) {
entry:
%cast = bitcast <4 x float> addrspace(1)* %b to <2 x i32> addrspace(1)*
; CHECK: [[gep:%[a-zA-Z0-9_.]+]] = getelementptr <2 x i32>, <2 x i32> addrspace(1)* %cast, i32 %n
; CHECK: [[ld:%[a-zA-Z0-9_.]+]] = load <2 x i32>, <2 x i32> addrspace(1)* [[gep]]
; CHECK: [[ex0:%[a-zA-Z0-9_.]+]] = extractelement <2 x i32> [[ld]], i32 0
; CHECK: [[ex1:%[a-zA-Z0-9_.]+]] = extractelement <2 x i32> [[ld]], i32 1
; CHECK: [[unpack0:%[a-zA-Z0-9_.]+]] = call <2 x float> @_Z18spirv.unpack.v2f16(i32 [[ex0]])
; CHECK: [[unpack1:%[a-zA-Z0-9_.]+]] = call <2 x float> @_Z18spirv.unpack.v2f16(i32 [[ex1]])
; CHECK: shufflevector <2 x float> [[unpack0]], <2 x float> [[unpack1]], <4 x i32> <i32 0, i32 1, i32 2, i32 3>
%call1 = call spir_func <4 x float> @_Z20__clspv_vloada_half4jPU3AS1KDv2_j(i32 %n, <2 x i32> addrspace(1)* %cast)
; CHECK: [[gep:%[a-zA-Z0-9_.]+]] = getelementptr <2 x i32>, <2 x i32> addrspace(1)* %cast, i32 0
; CHECK: [[ld:%[a-zA-Z0-9_.]+]] = load <2 x i32>, <2 x i32> addrspace(1)* [[gep]]
; CHECK: [[ex0:%[a-zA-Z0-9_.]+]] = extractelement <2 x i32> [[ld]], i32 0
; CHECK: [[ex1:%[a-zA-Z0-9_.]+]] = extractelement <2 x i32> [[ld]], i32 1
; CHECK: [[unpack0:%[a-zA-Z0-9_.]+]] = call <2 x float> @_Z18spirv.unpack.v2f16(i32 [[ex0]])
; CHECK: [[unpack1:%[a-zA-Z0-9_.]+]] = call <2 x float> @_Z18spirv.unpack.v2f16(i32 [[ex1]])
; CHECK: shufflevector <2 x float> [[unpack0]], <2 x float> [[unpack1]], <4 x i32> <i32 0, i32 1, i32 2, i32 3>
%call2 = call spir_func <4 x float> @_Z20__clspv_vloada_half4jPU3AS1KDv2_j(i32 0, <2 x i32> addrspace(1)* %cast)
ret void
}
declare spir_func <4 x float> @_Z20__clspv_vloada_half4jPU3AS1KDv2_j(i32, <2 x i32> addrspace(1)*)