Alexander Timofeev | 982aee6 | 2017-07-04 17:32:00 +0000 | [diff] [blame] | 1 | ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=FUNC %s |
| 2 | ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=tonga -mattr=-flat-for-global -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=FUNC %s |
| 3 | ; RUN: llc -amdgpu-scalarize-global-loads=false -march=r600 -mcpu=cypress -verify-machineinstrs < %s | FileCheck -check-prefix=EG -check-prefix=FUNC %s |
Matt Arsenault | b0df925 | 2014-07-10 03:22:20 +0000 | [diff] [blame] | 4 | |
; Declaration of the intrinsic exercised by this test: it takes a float and
; returns an i16 (per its name, the fp16 conversion of the f32 argument).
Tim Northover | fd7e424 | 2014-07-17 10:51:23 +0000 | [diff] [blame] | 5 | declare i16 @llvm.convert.to.fp16.f32(float) nounwind readnone |
Matt Arsenault | b0df925 | 2014-07-10 03:22:20 +0000 | [diff] [blame] | 6 | |
Jan Vesely | 0d6cb1c | 2017-01-11 00:12:39 +0000 | [diff] [blame] | 7 | ; FUNC-LABEL: {{^}}test_convert_fp32_to_fp16: |
| 8 | ; GCN: buffer_load_dword [[VAL:v[0-9]+]] |
| 9 | ; GCN: v_cvt_f16_f32_e32 [[RESULT:v[0-9]+]], [[VAL]] |
| 10 | ; GCN: buffer_store_short [[RESULT]] |
| 11 | |
| 12 | ; EG: MEM_RAT MSKOR |
| 13 | ; EG: VTX_READ_32 |
| 14 | ; EG: FLT32_TO_FLT16 |
; Kernel under test: loads one float from %in, converts it with
; @llvm.convert.to.fp16.f32, and stores the resulting i16 to %out.
; Both pointers are in addrspace(1) and marked noalias.
; The check lines above expect a dword load, a v_cvt_f16_f32 conversion and a
; short store on the amdgcn runs, and VTX_READ_32 / FLT32_TO_FLT16 / MEM_RAT
; MSKOR on the r600 run.
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 15 | define amdgpu_kernel void @test_convert_fp32_to_fp16(i16 addrspace(1)* noalias %out, float addrspace(1)* noalias %in) nounwind { |
; 32-bit source value, read with 4-byte alignment.
David Blaikie | a79ac14 | 2015-02-27 21:17:42 +0000 | [diff] [blame] | 16 | %val = load float, float addrspace(1)* %in, align 4 |
; The conversion yields an i16, not a half-typed value.
Tim Northover | fd7e424 | 2014-07-17 10:51:23 +0000 | [diff] [blame] | 17 | %cvt = call i16 @llvm.convert.to.fp16.f32(float %val) nounwind readnone |
; 16-bit result, written with 2-byte alignment.
Matt Arsenault | b0df925 | 2014-07-10 03:22:20 +0000 | [diff] [blame] | 18 | store i16 %cvt, i16 addrspace(1)* %out, align 2 |
| 19 | ret void |
| 20 | } |