blob: 8a0e71d739bee424c2c34b07ee345570b017c732 [file] [log] [blame]
Tom Stellard50122a52014-04-07 19:45:41 +00001; RUN: llc < %s -march=r600 -mcpu=redwood | FileCheck %s --check-prefix=EG --check-prefix=FUNC
2; RUN: llc < %s -march=r600 -mcpu=cayman | FileCheck %s --check-prefix=EG --check-prefix=FUNC
Tom Stellard49f8bfd2015-01-06 18:00:21 +00003; RUN: llc < %s -march=amdgcn -mcpu=SI -verify-machineinstrs | FileCheck %s --check-prefix=SI --check-prefix=FUNC
Marek Olsak75170772015-01-27 17:27:15 +00004; RUN: llc < %s -march=amdgcn -mcpu=tonga -verify-machineinstrs | FileCheck %s --check-prefix=SI --check-prefix=FUNC
Tom Stellard41fc7852013-07-23 01:48:42 +00005
Tom Stellard79243d92014-10-01 17:15:17 +00006; FUNC-LABEL: {{^}}u32_mul24:
Tom Stellard50122a52014-04-07 19:45:41 +00007; EG: MUL_UINT24 {{[* ]*}}T{{[0-9]\.[XYZW]}}, KC0[2].Z, KC0[2].W
Tom Stellard326d6ec2014-11-05 14:50:53 +00008; SI: v_mul_u32_u24
Tom Stellard41fc7852013-07-23 01:48:42 +00009
10define void @u32_mul24(i32 addrspace(1)* %out, i32 %a, i32 %b) {
11entry:
12 %0 = shl i32 %a, 8
13 %a_24 = lshr i32 %0, 8
14 %1 = shl i32 %b, 8
15 %b_24 = lshr i32 %1, 8
16 %2 = mul i32 %a_24, %b_24
17 store i32 %2, i32 addrspace(1)* %out
18 ret void
19}
20
Tom Stellard79243d92014-10-01 17:15:17 +000021; FUNC-LABEL: {{^}}i16_mul24:
Tom Stellard50122a52014-04-07 19:45:41 +000022; EG: MUL_UINT24 {{[* ]*}}T{{[0-9]}}.[[MUL_CHAN:[XYZW]]]
Tom Stellard41fc7852013-07-23 01:48:42 +000023; The result must be sign-extended
Tom Stellard50122a52014-04-07 19:45:41 +000024; EG: BFE_INT {{[* ]*}}T{{[0-9]}}.{{[XYZW]}}, PV.[[MUL_CHAN]], 0.0, literal.x
25; EG: 16
Tom Stellard326d6ec2014-11-05 14:50:53 +000026; SI: v_mul_u32_u24_e{{(32|64)}} [[MUL:v[0-9]]], {{[sv][0-9], [sv][0-9]}}
27; SI: v_bfe_i32 v{{[0-9]}}, [[MUL]], 0, 16
Tom Stellard41fc7852013-07-23 01:48:42 +000028define void @i16_mul24(i32 addrspace(1)* %out, i16 %a, i16 %b) {
29entry:
30 %0 = mul i16 %a, %b
31 %1 = sext i16 %0 to i32
32 store i32 %1, i32 addrspace(1)* %out
33 ret void
34}
35
Tom Stellard79243d92014-10-01 17:15:17 +000036; FUNC-LABEL: {{^}}i8_mul24:
Tom Stellard50122a52014-04-07 19:45:41 +000037; EG: MUL_UINT24 {{[* ]*}}T{{[0-9]}}.[[MUL_CHAN:[XYZW]]]
Tom Stellard41fc7852013-07-23 01:48:42 +000038; The result must be sign-extended
Tom Stellard50122a52014-04-07 19:45:41 +000039; EG: BFE_INT {{[* ]*}}T{{[0-9]}}.{{[XYZW]}}, PV.[[MUL_CHAN]], 0.0, literal.x
Tom Stellard326d6ec2014-11-05 14:50:53 +000040; SI: v_mul_u32_u24_e{{(32|64)}} [[MUL:v[0-9]]], {{[sv][0-9], [sv][0-9]}}
41; SI: v_bfe_i32 v{{[0-9]}}, [[MUL]], 0, 8
Tom Stellard41fc7852013-07-23 01:48:42 +000042
43define void @i8_mul24(i32 addrspace(1)* %out, i8 %a, i8 %b) {
44entry:
45 %0 = mul i8 %a, %b
46 %1 = sext i8 %0 to i32
47 store i32 %1, i32 addrspace(1)* %out
48 ret void
49}
Tom Stellarda1a5d9a2014-04-11 16:12:01 +000050
51; Multiply with 24-bit inputs and 64-bit output
Tom Stellard79243d92014-10-01 17:15:17 +000052; FUNC_LABEL: {{^}}mul24_i64:
Tom Stellarda1a5d9a2014-04-11 16:12:01 +000053; EG; MUL_UINT24
54; EG: MULHI
Tom Stellarda1a5d9a2014-04-11 16:12:01 +000055; FIXME: SI support 24-bit mulhi
Matt Arsenault24692112015-07-14 18:20:33 +000056
57; SI-DAG: v_mul_u32_u24
58; SI-DAG: v_mul_hi_u32
59; SI: s_endpgm
60define void @mul24_i64(i64 addrspace(1)* %out, i64 %a, i64 %b, i64 %c) {
Tom Stellarda1a5d9a2014-04-11 16:12:01 +000061entry:
Matt Arsenault24692112015-07-14 18:20:33 +000062 %tmp0 = shl i64 %a, 40
63 %a_24 = lshr i64 %tmp0, 40
64 %tmp1 = shl i64 %b, 40
65 %b_24 = lshr i64 %tmp1, 40
66 %tmp2 = mul i64 %a_24, %b_24
67 store i64 %tmp2, i64 addrspace(1)* %out
Tom Stellarda1a5d9a2014-04-11 16:12:01 +000068 ret void
69}