1
2
3
4
5
6
7
8
9 #include <linux/linkage.h>
10 #include <asm/assembler.h>
11
12 .text
13 .fpu crypto-neon-fp-armv8
14
15 k0 .req q7
16 k1 .req q8
17 rk .req r3
18
19 ta0 .req q9
20 ta1 .req q10
21 tb0 .req q10
22 tb1 .req q9
23
24 dga .req q11
25 dgb .req q12
26
27 dg0 .req q13
28 dg1 .req q14
29 dg2 .req q15
30
31 .macro add_only, ev, s0
32 vmov dg2, dg0
33 .ifnb \s0
34 vld1.32 {k\ev}, [rk, :128]!
35 .endif
36 sha256h.32 dg0, dg1, tb\ev
37 sha256h2.32 dg1, dg2, tb\ev
38 .ifnb \s0
39 vadd.u32 ta\ev, q\s0, k\ev
40 .endif
41 .endm
42
43 .macro add_update, ev, s0, s1, s2, s3
44 sha256su0.32 q\s0, q\s1
45 add_only \ev, \s1
46 sha256su1.32 q\s0, q\s2, q\s3
47 .endm
48
49 .align 6
50 .Lsha256_rcon:
51 .word 0x428a2f98, 0x71374491, 0xb5c0fbcf, 0xe9b5dba5
52 .word 0x3956c25b, 0x59f111f1, 0x923f82a4, 0xab1c5ed5
53 .word 0xd807aa98, 0x12835b01, 0x243185be, 0x550c7dc3
54 .word 0x72be5d74, 0x80deb1fe, 0x9bdc06a7, 0xc19bf174
55 .word 0xe49b69c1, 0xefbe4786, 0x0fc19dc6, 0x240ca1cc
56 .word 0x2de92c6f, 0x4a7484aa, 0x5cb0a9dc, 0x76f988da
57 .word 0x983e5152, 0xa831c66d, 0xb00327c8, 0xbf597fc7
58 .word 0xc6e00bf3, 0xd5a79147, 0x06ca6351, 0x14292967
59 .word 0x27b70a85, 0x2e1b2138, 0x4d2c6dfc, 0x53380d13
60 .word 0x650a7354, 0x766a0abb, 0x81c2c92e, 0x92722c85
61 .word 0xa2bfe8a1, 0xa81a664b, 0xc24b8b70, 0xc76c51a3
62 .word 0xd192e819, 0xd6990624, 0xf40e3585, 0x106aa070
63 .word 0x19a4c116, 0x1e376c08, 0x2748774c, 0x34b0bcb5
64 .word 0x391c0cb3, 0x4ed8aa4a, 0x5b9cca4f, 0x682e6ff3
65 .word 0x748f82ee, 0x78a5636f, 0x84c87814, 0x8cc70208
66 .word 0x90befffa, 0xa4506ceb, 0xbef9a3f7, 0xc67178f2
67
68
69
70
71
72 ENTRY(sha2_ce_transform)
73
74 vld1.32 {dga-dgb}, [r0]
75
76
77 0: vld1.32 {q0-q1}, [r1]!
78 vld1.32 {q2-q3}, [r1]!
79 subs r2, r2, #1
80
81 #ifndef CONFIG_CPU_BIG_ENDIAN
82 vrev32.8 q0, q0
83 vrev32.8 q1, q1
84 vrev32.8 q2, q2
85 vrev32.8 q3, q3
86 #endif
87
88
89 adr rk, .Lsha256_rcon
90 vld1.32 {k0}, [rk, :128]!
91
92 vadd.u32 ta0, q0, k0
93 vmov dg0, dga
94 vmov dg1, dgb
95
96 add_update 1, 0, 1, 2, 3
97 add_update 0, 1, 2, 3, 0
98 add_update 1, 2, 3, 0, 1
99 add_update 0, 3, 0, 1, 2
100 add_update 1, 0, 1, 2, 3
101 add_update 0, 1, 2, 3, 0
102 add_update 1, 2, 3, 0, 1
103 add_update 0, 3, 0, 1, 2
104 add_update 1, 0, 1, 2, 3
105 add_update 0, 1, 2, 3, 0
106 add_update 1, 2, 3, 0, 1
107 add_update 0, 3, 0, 1, 2
108
109 add_only 1, 1
110 add_only 0, 2
111 add_only 1, 3
112 add_only 0
113
114
115 vadd.u32 dga, dga, dg0
116 vadd.u32 dgb, dgb, dg1
117 bne 0b
118
119
120 vst1.32 {dga-dgb}, [r0]
121 bx lr
122 ENDPROC(sha2_ce_transform)