| Matt Arsenault | c5559bb | 2013-11-15 04:42:23 +0000 | [diff] [blame] | 1 | ; RUN: llc -march=r600 -mcpu=cypress < %s | FileCheck -check-prefix=EG %s | 
|  | 2 |  | 
|  | 3 | ; | 
|  | 4 | ; kernel void combine_vloads(global char8* src, global char8* result) { | 
|  | 5 | ;   for (int i = 0; i < 1024; ++i) | 
|  | 6 | ;     result[i] = src[0] + src[1] + src[2] + src[3]; | 
|  | 7 | ; } | 
|  | 8 | ; | 
|  | 9 |  | 
|  | 10 |  | 
|  | 11 | ; The 32-byte vector load should be selected as two 128-bit loads instead of many 8-bit loads | 
| Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 12 | ; EG-LABEL: {{^}}combine_vloads: | 
| Matt Arsenault | c5559bb | 2013-11-15 04:42:23 +0000 | [diff] [blame] | 13 | ; EG: VTX_READ_128 | 
|  | 14 | ; EG: VTX_READ_128 | 
; combine_vloads: IR form of the kernel quoted in the comment at the top of
; this test. The loop counts %i.01 from 0 up to (but not including) 1024.
; Each iteration performs one 32-byte load from %src (typed as <8 x i32>),
; slices the loaded value into four <8 x i8> pieces, adds the pieces
; together, and stores the 8-byte sum to element %i.01 of %result.
; The load address is %src itself and does not depend on %i.01.
|  | 15 | define void @combine_vloads(<8 x i8> addrspace(1)* nocapture %src, <8 x i8> addrspace(1)* nocapture %result) nounwind { | 
|  | 16 | entry: | 
|  | 17 | br label %for.body | 
|  | 18 |  | 
|  | 19 | for.exit:                                         ; preds = %for.body | 
|  | 20 | ret void | 
|  | 21 |  | 
|  | 22 | for.body:                                         ; preds = %for.body, %entry | 
|  | 23 | %i.01 = phi i32 [ 0, %entry ], [ %tmp19, %for.body ] | 
; Reinterpret %src so that four consecutive <8 x i8> elements (32 bytes) are
; read with a single <8 x i32> load, then view the result as <32 x i8>.
|  | 24 | %arrayidx_v4 = bitcast <8 x i8> addrspace(1)* %src to <32 x i8> addrspace(1)* | 
|  | 25 | %0 = bitcast <32 x i8> addrspace(1)* %arrayidx_v4 to <8 x i32> addrspace(1)* | 
| David Blaikie | a79ac14 | 2015-02-27 21:17:42 +0000 | [diff] [blame] | 26 | %vecload2 = load <8 x i32>, <8 x i32> addrspace(1)* %0, align 32 | 
| Matt Arsenault | c5559bb | 2013-11-15 04:42:23 +0000 | [diff] [blame] | 27 | %1 = bitcast <8 x i32> %vecload2 to <32 x i8> | 
; Extract bytes 0-7, 8-15, 16-23 and 24-31 of the loaded value as separate
; <8 x i8> vectors and accumulate them with element-wise adds.
|  | 28 | %tmp5 = shufflevector <32 x i8> %1, <32 x i8> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7> | 
|  | 29 | %tmp8 = shufflevector <32 x i8> %1, <32 x i8> undef, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15> | 
|  | 30 | %tmp9 = add nsw <8 x i8> %tmp5, %tmp8 | 
|  | 31 | %tmp12 = shufflevector <32 x i8> %1, <32 x i8> undef, <8 x i32> <i32 16, i32 17, i32 18, i32 19, i32 20, i32 21, i32 22, i32 23> | 
|  | 32 | %tmp13 = add nsw <8 x i8> %tmp9, %tmp12 | 
|  | 33 | %tmp16 = shufflevector <32 x i8> %1, <32 x i8> undef, <8 x i32> <i32 24, i32 25, i32 26, i32 27, i32 28, i32 29, i32 30, i32 31> | 
|  | 34 | %tmp17 = add nsw <8 x i8> %tmp13, %tmp16 | 
; Store the <8 x i8> sum to element %i.01 of %result, written through a
; <2 x i32> pointer with 8-byte alignment.
| David Blaikie | 79e6c74 | 2015-02-27 19:29:02 +0000 | [diff] [blame] | 35 | %scevgep = getelementptr <8 x i8>, <8 x i8> addrspace(1)* %result, i32 %i.01 | 
| Matt Arsenault | c5559bb | 2013-11-15 04:42:23 +0000 | [diff] [blame] | 36 | %2 = bitcast <8 x i8> %tmp17 to <2 x i32> | 
|  | 37 | %3 = bitcast <8 x i8> addrspace(1)* %scevgep to <2 x i32> addrspace(1)* | 
|  | 38 | store <2 x i32> %2, <2 x i32> addrspace(1)* %3, align 8 | 
; Advance the induction variable and leave the loop once it reaches 1024.
|  | 39 | %tmp19 = add nsw i32 %i.01, 1 | 
|  | 40 | %exitcond = icmp eq i32 %tmp19, 1024 | 
|  | 41 | br i1 %exitcond, label %for.exit, label %for.body | 
|  | 42 | } |