blob: e640a7cd69f6d953a62430a0bed9cb4bfd68f2f3 [file] [log] [blame]
Tom Stellard50122a52014-04-07 19:45:41 +00001; RUN: llc < %s -march=r600 -mcpu=redwood | FileCheck %s --check-prefix=EG --check-prefix=FUNC
2; RUN: llc < %s -march=r600 -mcpu=cayman | FileCheck %s --check-prefix=EG --check-prefix=FUNC
Tom Stellard49f8bfd2015-01-06 18:00:21 +00003; RUN: llc < %s -march=amdgcn -mcpu=SI -verify-machineinstrs | FileCheck %s --check-prefix=SI --check-prefix=FUNC
Marek Olsak75170772015-01-27 17:27:15 +00004; RUN: llc < %s -march=amdgcn -mcpu=tonga -verify-machineinstrs | FileCheck %s --check-prefix=SI --check-prefix=FUNC
Tom Stellard41fc7852013-07-23 01:48:42 +00005
Tom Stellard79243d92014-10-01 17:15:17 +00006; FUNC-LABEL: {{^}}u32_mul24:
Tom Stellard50122a52014-04-07 19:45:41 +00007; EG: MUL_UINT24 {{[* ]*}}T{{[0-9]\.[XYZW]}}, KC0[2].Z, KC0[2].W
Tom Stellard326d6ec2014-11-05 14:50:53 +00008; SI: v_mul_u32_u24
Tom Stellard41fc7852013-07-23 01:48:42 +00009
10define void @u32_mul24(i32 addrspace(1)* %out, i32 %a, i32 %b) {
11entry:
12 %0 = shl i32 %a, 8
13 %a_24 = lshr i32 %0, 8
14 %1 = shl i32 %b, 8
15 %b_24 = lshr i32 %1, 8
16 %2 = mul i32 %a_24, %b_24
17 store i32 %2, i32 addrspace(1)* %out
18 ret void
19}
20
Tom Stellard79243d92014-10-01 17:15:17 +000021; FUNC-LABEL: {{^}}i16_mul24:
Tom Stellard50122a52014-04-07 19:45:41 +000022; EG: MUL_UINT24 {{[* ]*}}T{{[0-9]}}.[[MUL_CHAN:[XYZW]]]
Tom Stellard41fc7852013-07-23 01:48:42 +000023; The result must be sign-extended
Tom Stellard50122a52014-04-07 19:45:41 +000024; EG: BFE_INT {{[* ]*}}T{{[0-9]}}.{{[XYZW]}}, PV.[[MUL_CHAN]], 0.0, literal.x
25; EG: 16
Tom Stellard326d6ec2014-11-05 14:50:53 +000026; SI: v_mul_u32_u24_e{{(32|64)}} [[MUL:v[0-9]]], {{[sv][0-9], [sv][0-9]}}
27; SI: v_bfe_i32 v{{[0-9]}}, [[MUL]], 0, 16
Tom Stellard41fc7852013-07-23 01:48:42 +000028define void @i16_mul24(i32 addrspace(1)* %out, i16 %a, i16 %b) {
29entry:
30 %0 = mul i16 %a, %b
31 %1 = sext i16 %0 to i32
32 store i32 %1, i32 addrspace(1)* %out
33 ret void
34}
35
Tom Stellard79243d92014-10-01 17:15:17 +000036; FUNC-LABEL: {{^}}i8_mul24:
Tom Stellard50122a52014-04-07 19:45:41 +000037; EG: MUL_UINT24 {{[* ]*}}T{{[0-9]}}.[[MUL_CHAN:[XYZW]]]
Tom Stellard41fc7852013-07-23 01:48:42 +000038; The result must be sign-extended
Tom Stellard50122a52014-04-07 19:45:41 +000039; EG: BFE_INT {{[* ]*}}T{{[0-9]}}.{{[XYZW]}}, PV.[[MUL_CHAN]], 0.0, literal.x
Tom Stellard326d6ec2014-11-05 14:50:53 +000040; SI: v_mul_u32_u24_e{{(32|64)}} [[MUL:v[0-9]]], {{[sv][0-9], [sv][0-9]}}
41; SI: v_bfe_i32 v{{[0-9]}}, [[MUL]], 0, 8
Tom Stellard41fc7852013-07-23 01:48:42 +000042
43define void @i8_mul24(i32 addrspace(1)* %out, i8 %a, i8 %b) {
44entry:
45 %0 = mul i8 %a, %b
46 %1 = sext i8 %0 to i32
47 store i32 %1, i32 addrspace(1)* %out
48 ret void
49}
Tom Stellarda1a5d9a2014-04-11 16:12:01 +000050
51; Multiply with 24-bit inputs and 64-bit output
Tom Stellard79243d92014-10-01 17:15:17 +000052; FUNC_LABEL: {{^}}mul24_i64:
Tom Stellarda1a5d9a2014-04-11 16:12:01 +000053; EG; MUL_UINT24
54; EG: MULHI
Tom Stellard326d6ec2014-11-05 14:50:53 +000055; SI: v_mul_u32_u24
Tom Stellarda1a5d9a2014-04-11 16:12:01 +000056; FIXME: SI support 24-bit mulhi
Tom Stellard326d6ec2014-11-05 14:50:53 +000057; SI: v_mul_hi_u32
Tom Stellarda1a5d9a2014-04-11 16:12:01 +000058define void @mul24_i64(i64 addrspace(1)* %out, i64 %a, i64 %b) {
59entry:
60 %0 = shl i64 %a, 40
61 %a_24 = lshr i64 %0, 40
62 %1 = shl i64 %b, 40
63 %b_24 = lshr i64 %1, 40
64 %2 = mul i64 %a_24, %b_24
65 store i64 %2, i64 addrspace(1)* %out
66 ret void
67}