blob: 6e5efd85a347b78b194027bfdfe0e4952288b0f8 [file] [log] [blame]
Amara Emerson33089092013-09-19 11:59:01 +00001; RUN: llc < %s -mtriple=armv8 -mattr=+crypto | FileCheck %s
2
3define arm_aapcs_vfpcc <16 x i8> @test_aesde(<16 x i8>* %a, <16 x i8> *%b) {
David Blaikiea79ac142015-02-27 21:17:42 +00004 %tmp = load <16 x i8>, <16 x i8>* %a
5 %tmp2 = load <16 x i8>, <16 x i8>* %b
Tim Northover24979d82014-02-03 17:27:49 +00006 %tmp3 = call <16 x i8> @llvm.arm.neon.aesd(<16 x i8> %tmp, <16 x i8> %tmp2)
Amara Emerson33089092013-09-19 11:59:01 +00007 ; CHECK: aesd.8 q{{[0-9]+}}, q{{[0-9]+}}
Tim Northover24979d82014-02-03 17:27:49 +00008 %tmp4 = call <16 x i8> @llvm.arm.neon.aese(<16 x i8> %tmp3, <16 x i8> %tmp2)
Amara Emerson33089092013-09-19 11:59:01 +00009 ; CHECK: aese.8 q{{[0-9]+}}, q{{[0-9]+}}
Tim Northover24979d82014-02-03 17:27:49 +000010 %tmp5 = call <16 x i8> @llvm.arm.neon.aesimc(<16 x i8> %tmp4)
Amara Emerson33089092013-09-19 11:59:01 +000011 ; CHECK: aesimc.8 q{{[0-9]+}}, q{{[0-9]+}}
Tim Northover24979d82014-02-03 17:27:49 +000012 %tmp6 = call <16 x i8> @llvm.arm.neon.aesmc(<16 x i8> %tmp5)
Amara Emerson33089092013-09-19 11:59:01 +000013 ; CHECK: aesmc.8 q{{[0-9]+}}, q{{[0-9]+}}
14 ret <16 x i8> %tmp6
15}
16
17define arm_aapcs_vfpcc <4 x i32> @test_sha(<4 x i32> *%a, <4 x i32> *%b, <4 x i32> *%c) {
David Blaikiea79ac142015-02-27 21:17:42 +000018 %tmp = load <4 x i32>, <4 x i32>* %a
19 %tmp2 = load <4 x i32>, <4 x i32>* %b
20 %tmp3 = load <4 x i32>, <4 x i32>* %c
Tim Northover24979d82014-02-03 17:27:49 +000021 %scalar = extractelement <4 x i32> %tmp, i32 0
22 %resscalar = call i32 @llvm.arm.neon.sha1h(i32 %scalar)
23 %res1 = insertelement <4 x i32> undef, i32 %resscalar, i32 0
Amara Emerson33089092013-09-19 11:59:01 +000024 ; CHECK: sha1h.32 q{{[0-9]+}}, q{{[0-9]+}}
Tim Northover24979d82014-02-03 17:27:49 +000025 %res2 = call <4 x i32> @llvm.arm.neon.sha1c(<4 x i32> %tmp2, i32 %scalar, <4 x i32> %res1)
Amara Emerson33089092013-09-19 11:59:01 +000026 ; CHECK: sha1c.32 q{{[0-9]+}}, q{{[0-9]+}}, q{{[0-9]+}}
Tim Northover24979d82014-02-03 17:27:49 +000027 %res3 = call <4 x i32> @llvm.arm.neon.sha1m(<4 x i32> %res2, i32 %scalar, <4 x i32> %res1)
Amara Emerson33089092013-09-19 11:59:01 +000028 ; CHECK: sha1m.32 q{{[0-9]+}}, q{{[0-9]+}}, q{{[0-9]+}}
Tim Northover24979d82014-02-03 17:27:49 +000029 %res4 = call <4 x i32> @llvm.arm.neon.sha1p(<4 x i32> %res3, i32 %scalar, <4 x i32> %res1)
Amara Emerson33089092013-09-19 11:59:01 +000030 ; CHECK: sha1p.32 q{{[0-9]+}}, q{{[0-9]+}}, q{{[0-9]+}}
Tim Northover24979d82014-02-03 17:27:49 +000031 %res5 = call <4 x i32> @llvm.arm.neon.sha1su0(<4 x i32> %res4, <4 x i32> %tmp3, <4 x i32> %res1)
Amara Emerson33089092013-09-19 11:59:01 +000032 ; CHECK: sha1su0.32 q{{[0-9]+}}, q{{[0-9]+}}, q{{[0-9]+}}
Tim Northover24979d82014-02-03 17:27:49 +000033 %res6 = call <4 x i32> @llvm.arm.neon.sha1su1(<4 x i32> %res5, <4 x i32> %res1)
Amara Emerson33089092013-09-19 11:59:01 +000034 ; CHECK: sha1su1.32 q{{[0-9]+}}, q{{[0-9]+}}
Tim Northover24979d82014-02-03 17:27:49 +000035 %res7 = call <4 x i32> @llvm.arm.neon.sha256h(<4 x i32> %res6, <4 x i32> %tmp3, <4 x i32> %res1)
Amara Emerson33089092013-09-19 11:59:01 +000036 ; CHECK: sha256h.32 q{{[0-9]+}}, q{{[0-9]+}}, q{{[0-9]+}}
Tim Northover24979d82014-02-03 17:27:49 +000037 %res8 = call <4 x i32> @llvm.arm.neon.sha256h2(<4 x i32> %res7, <4 x i32> %tmp3, <4 x i32> %res1)
Amara Emerson33089092013-09-19 11:59:01 +000038 ; CHECK: sha256h2.32 q{{[0-9]+}}, q{{[0-9]+}}, q{{[0-9]+}}
Tim Northover24979d82014-02-03 17:27:49 +000039 %res9 = call <4 x i32> @llvm.arm.neon.sha256su1(<4 x i32> %res8, <4 x i32> %tmp3, <4 x i32> %res1)
Amara Emerson33089092013-09-19 11:59:01 +000040 ; CHECK: sha256su1.32 q{{[0-9]+}}, q{{[0-9]+}}, q{{[0-9]+}}
Tim Northover24979d82014-02-03 17:27:49 +000041 %res10 = call <4 x i32> @llvm.arm.neon.sha256su0(<4 x i32> %res9, <4 x i32> %tmp3)
Amara Emerson33089092013-09-19 11:59:01 +000042 ; CHECK: sha256su0.32 q{{[0-9]+}}, q{{[0-9]+}}
43 ret <4 x i32> %res10
44}
45
Tim Northover24979d82014-02-03 17:27:49 +000046declare <16 x i8> @llvm.arm.neon.aesd(<16 x i8>, <16 x i8>)
47declare <16 x i8> @llvm.arm.neon.aese(<16 x i8>, <16 x i8>)
48declare <16 x i8> @llvm.arm.neon.aesimc(<16 x i8>)
49declare <16 x i8> @llvm.arm.neon.aesmc(<16 x i8>)
50declare i32 @llvm.arm.neon.sha1h(i32)
51declare <4 x i32> @llvm.arm.neon.sha1c(<4 x i32>, i32, <4 x i32>)
52declare <4 x i32> @llvm.arm.neon.sha1m(<4 x i32>, i32, <4 x i32>)
53declare <4 x i32> @llvm.arm.neon.sha1p(<4 x i32>, i32, <4 x i32>)
54declare <4 x i32> @llvm.arm.neon.sha1su0(<4 x i32>, <4 x i32>, <4 x i32>)
55declare <4 x i32> @llvm.arm.neon.sha256h(<4 x i32>, <4 x i32>, <4 x i32>)
56declare <4 x i32> @llvm.arm.neon.sha256h2(<4 x i32>, <4 x i32>, <4 x i32>)
57declare <4 x i32> @llvm.arm.neon.sha256su1(<4 x i32>, <4 x i32>, <4 x i32>)
58declare <4 x i32> @llvm.arm.neon.sha256su0(<4 x i32>, <4 x i32>)
59declare <4 x i32> @llvm.arm.neon.sha1su1(<4 x i32>, <4 x i32>)