/*
 * Copyright (C) 2004, 2007-2010, 2011-2012 Synopsys, Inc. (www.synopsys.com)
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */

#include <linux/linkage.h>

/*
 * Register aliases used by memcmp below.
 *
 * WORD2: register that receives the second word of the first buffer in
 *        each 8-byte step of the word loop.
 * SHIFT: register that is scaled by 8 in the tail code and then used to
 *        locate the end of the valid bytes in the last word.
 *
 * memcmp tests r2 against zero for the empty case and computes
 * r3 = r2 - 1 on entry. The register that is not reused as WORD2 is the
 * one still intact when SHIFT is read, so SHIFT starts out as n - 1 on
 * little endian (r3) and as n on big endian (r2).
 */
#ifdef __LITTLE_ENDIAN__
#define WORD2 r2
#define SHIFT r3
#else /* BIG ENDIAN */
#define WORD2 r3
#define SHIFT r2
#endif

/*
 * memcmp: compare two byte ranges.
 *
 * Register usage as seen in this routine:
 *   r0, r1  base addresses of the two buffers (advanced by the .a loads)
 *   r2      byte count n on entry; n == 0 returns 0
 *   r0      result, written in the delay slot of each return
 *   blink   return address
 * Written without being saved here: r1-r5, r12, lp_count.
 * NOTE(review): this matches the usual ARC argument/return registers for
 * memcmp(s1, s2, n); confirm against the ABI document.
 *
 * Result: 0 when no difference is found within n bytes. Otherwise the
 * sign follows the first differing byte pair (first buffer relative to
 * second buffer): a plain byte difference in the byte loop, a scaled
 * difference in the little-endian word path, and 1 or (1 | bit 31) in
 * the big-endian word path.
 *
 * Structure: a word loop handling 8 bytes per iteration plus a tail of
 * 1..8 bytes, and a byte loop of the same shape (2 bytes per iteration
 * plus a tail of 1..2 bytes) used when either pointer is not 4-byte
 * aligned or n == 0.
 */
ENTRY(memcmp)
	/*
	 * r12 = (r0 | r1) << 30: non-zero iff either address has one of
	 * its two low bits set.
	 * r3  = n - 1.
	 * brls goes to the byte loop when n <= r12 (unsigned). With both
	 * pointers aligned r12 is 0, so only n == 0 takes the branch;
	 * otherwise r12 >= 0x40000000 and every n up to r12 takes it.
	 * NOTE(review): an n larger than r12 with unaligned pointers falls
	 * through to the word loop; confirm this is acceptable.
	 */
	or	r12,r0,r1
	asl_s	r12,r12,30
	sub	r3,r2,1
	brls	r2,r12,.Lbytewise

	/*
	 * Word path. r4/r5 hold the current "even" word of each buffer.
	 * lp_count = (n - 1) >> 3 is the number of 8-byte iterations.
	 * The flags of this lsr.f are consumed twice: by lpne (loop only
	 * when the count is non-zero) and, after the loop, by bhs_s.
	 */
	ld	r4,[r0,0]
	ld	r5,[r1,0]
	lsr.f	lp_count,r3,3
#ifdef CONFIG_ISA_ARCV2
	/* In ARCv2 a branch can't be the last instruction in a zero overhead
	 * loop.
	 * So we move the branch to the start of the loop, duplicate it
	 * after the end, and set up r12 so that the branch isn't taken
	 * initially.
	 */
	mov_s	r12,WORD2
	lpne	.Loop_end
	brne	WORD2,r12,.Lodd
	ld	WORD2,[r0,4]
#else
	lpne	.Loop_end
	ld_s	WORD2,[r0,4]
#endif
	/* "Odd" words at offset 4: WORD2 from the first buffer, r12 from
	 * the second. */
	ld_s	r12,[r1,4]
	/* The even words precede the odd ones in memory, so check them
	 * first. */
	brne	r4,r5,.Leven
	/* .a writes the address back: r0/r1 advance by 8 and r4/r5 become
	 * the next even words. */
	ld.a	r4,[r0,8]
	ld.a	r5,[r1,8]
#ifdef CONFIG_ISA_ARCV2
.Loop_end:
	brne	WORD2,r12,.Lodd
#else
	brne	WORD2,r12,.Lodd
.Loop_end:
#endif
	/*
	 * Tail of 1..8 bytes; r4/r5 hold its first word.
	 * SHIFT is turned into a bit count (x8). bhs_s tests carry, which
	 * is presumably still the last bit shifted out by the lsr.f above,
	 * i.e. bit 2 of n - 1 (no instruction in between has a .f suffix):
	 *   clear: at most 4 bytes remain, all of them already in r4/r5.
	 *   set:   r4/r5 are fully valid; compare them whole, then load
	 *          the following pair for the partial compare.
	 */
	asl_s	SHIFT,SHIFT,3
	bhs_s	.Last_cmp
	brne	r4,r5,.Leven
	ld	r4,[r0,4]
	ld	r5,[r1,4]
#ifdef __LITTLE_ENDIAN__
	nop_s
	; one more load latency cycle
.Last_cmp:
	/*
	 * r0 = differing bits plus a marker bit at position SHIFT
	 * (presumably taken modulo 32, which places it at bit 0 of the last
	 * byte to be compared), so bytes past the end are never selected.
	 * (r0 - 1) & ~r0 is the mask of bits below the lowest set bit;
	 * norm followed by "and 24" yields a left-shift count of 0, 8, 16
	 * or 24.
	 * NOTE(review): the count is meant to bring the first differing
	 * byte (or the last valid byte) to the top of the word; this relies
	 * on norm returning 31 - k for a value made of k low one bits.
	 */
	xor	r0,r4,r5
	bset	r0,r0,SHIFT
	sub_s	r1,r0,1
	bic_s	r1,r1,r0
	norm	r1,r1
	b.d	.Leven_cmp
	and	r1,r1,24
.Leven:
	/* Even words differ: same shift computation, without the end
	 * marker. */
	xor	r0,r4,r5
	sub_s	r1,r0,1
	bic_s	r1,r1,r0
	norm	r1,r1
	; slow track insn
	and	r1,r1,24
.Leven_cmp:
	/*
	 * Shift both words left by r1, halve them with lsr so that the
	 * subtraction of two 31-bit values cannot overflow, and return the
	 * difference (computed in the delay slot of the jump).
	 */
	asl	r2,r4,r1
	asl	r12,r5,r1
	lsr_s	r2,r2,1
	lsr_s	r12,r12,1
	j_s.d	[blink]
	sub	r0,r2,r12
	.balign	4
.Lodd:
	/*
	 * Odd words differ. Same computation as .Leven applied to WORD2
	 * (which is r2 in this little-endian build) and r12.
	 */
	xor	r0,WORD2,r12
	sub_s	r1,r0,1
	bic_s	r1,r1,r0
	norm	r1,r1
	; slow track insn
	and	r1,r1,24
	asl_s	r2,r2,r1
	asl_s	r12,r12,r1
	lsr_s	r2,r2,1
	lsr_s	r12,r12,1
	j_s.d	[blink]
	sub	r0,r2,r12
#else /* BIG ENDIAN */
.Last_cmp:
	/*
	 * SHIFT is 8 * n here. Shifting both words right by -SHIFT
	 * (presumably taken modulo 32) discards the bytes past the end.
	 */
	neg_s	SHIFT,SHIFT
	lsr	r4,r4,SHIFT
	lsr	r5,r5,SHIFT
	; slow track insn
.Leven:
	/*
	 * r0 = 0 when the words are equal, otherwise 1; bit 31 is set as
	 * well (in the delay slot) when the subtraction set carry,
	 * i.e. presumably when r4 is below r5 as unsigned values.
	 */
	sub.f	r0,r4,r5
	mov.ne	r0,1
	j_s.d	[blink]
	bset.cs	r0,r0,31
.Lodd:
	/* Odd words are known to differ: return 1, or 1 | bit 31 when the
	 * compare set carry. */
	cmp_s	WORD2,r12
	mov_s	r0,1
	j_s.d	[blink]
	bset.cs	r0,r0,31
#endif /* ENDIAN */
	.balign	4
.Lbytewise:
	/*
	 * Byte path, same shape as the word path with two bytes per
	 * iteration: r4/r5 are the even bytes, r3/r12 the odd bytes.
	 * n == 0 returns 0 straight away. lp_count = (n - 1) >> 1; r3 is
	 * free to be reused as a data register once lp_count is set.
	 */
	breq	r2,0,.Lnil
	ldb	r4,[r0,0]
	ldb	r5,[r1,0]
	lsr.f	lp_count,r3
#ifdef CONFIG_ISA_ARCV2
	/* Same ARCv2 restriction as in the word loop: the closing branch
	 * is moved to the loop head and r12 is preset equal to r3 so that
	 * it is not taken on the first pass. */
	mov	r12,r3
	lpne	.Lbyte_end
	brne	r3,r12,.Lbyte_odd
#else
	lpne	.Lbyte_end
#endif
	ldb_s	r3,[r0,1]
	ldb	r12,[r1,1]
	brne	r4,r5,.Lbyte_even
	/* .a writes the address back: r0/r1 advance by 2. */
	ldb.a	r4,[r0,2]
	ldb.a	r5,[r1,2]
#ifdef CONFIG_ISA_ARCV2
.Lbyte_end:
	brne	r3,r12,.Lbyte_odd
#else
	brne	r3,r12,.Lbyte_odd
.Lbyte_end:
#endif
	/*
	 * Tail of 1..2 bytes. Carry is presumably still the bit shifted
	 * out by the lsr.f above (bit 0 of n - 1):
	 *   clear: only the byte pair in r4/r5 remains.
	 *   set:   check r4/r5, then load and compare the final pair.
	 */
	bcc	.Lbyte_even
	brne	r4,r5,.Lbyte_even
	ldb_s	r3,[r0,1]
	ldb_s	r12,[r1,1]
.Lbyte_odd:
	/* Result = odd byte of first buffer minus odd byte of second. */
	j_s.d	[blink]
	sub	r0,r3,r12
.Lbyte_even:
	/* Result = even byte of first buffer minus even byte of second. */
	j_s.d	[blink]
	sub	r0,r4,r5
.Lnil:
	/* Zero-length compare: return 0. */
	j_s.d	[blink]
	mov	r0,0
END(memcmp)