1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
|
/*
 * _sha1block: SHA-1 block function, Plan 9 MIPS assembler syntax.
 *
 * Inputs as used by the code in this file:
 *	R1		pointer to the input bytes (used as DATAREG, never loaded)
 *	len+4(FP)	byte count; added to R1 to form the end pointer
 *	state+8(FP)	pointer to five 32-bit state words, read on entry and
 *			rewritten after every 64 input bytes
 *
 * $328 is the stack frame size; the 80-word message schedule is kept in
 * that frame (see WARRAY).
 * The macros and register names defined below are used only by this routine.
 */
TEXT _sha1block+0(SB),$328
/*
 * BODYX(off,FN,V,A,B,C,D,E): one SHA-1 round.
 * On entry TMP2 holds the message word x for this round.
 *
 *	wp[off] = x			wp is WREG, off is a byte offset
 *	E += FN(B,C,D) + V + x + ROTL(A,5)
 *	B  = ROTL(B,30)			i.e. B rotated right by 2
 *
 * V is the register holding the round constant.
 * FN leaves its result in TMP1; TMP3 and TMP4 are scratch here.
 * There is deliberately no ';' after FN(B,C,D): each FN macro ends
 * with its own ';'.
 */
#define BODYX(off,FN,V,A,B,C,D,E)\
	MOVW TMP2,off(WREG);\
	FN(B,C,D)\
	ADDU V,E;\
	ADDU TMP1,E;\
	ADDU TMP2,E;\
	SRL $27,A,TMP4;\
	SLL $5,A,TMP3;\
	OR TMP3,TMP4;\
	ADDU TMP4,E;\
	SLL $30,B,TMP4;\
	SRL $2,B;\
	OR TMP4,B
/*
 * BODY1(off,FN,V,A,B,C,D,E): round whose word comes straight from the input.
 *
 *	x = the four bytes at off(DATAREG) .. (off+3)(DATAREG), first byte
 *	    in the most significant position
 *	BODYX(off,...)		stores x at off(WREG) and performs the round
 *
 * Only byte loads (MOVBU) touch the input.
 * Uses TMP1-TMP4 as scratch; x is built in TMP2.
 */
#define BODY1(off,FN,V,A,B,C,D,E)\
	MOVBU off(DATAREG),TMP2;\
	SLL $24,TMP2;\
	MOVBU (off+1)(DATAREG),TMP3;\
	SLL $16,TMP3;\
	OR TMP3,TMP2;\
	MOVBU (off+2)(DATAREG),TMP1;\
	SLL $8,TMP1;\
	OR TMP1,TMP2;\
	MOVBU (off+3)(DATAREG),TMP4;\
	OR TMP4,TMP2;\
	BODYX(off,FN,V,A,B,C,D,E)
/*
 * BODY(off,FN,V,A,B,C,D,E): round whose word comes from the schedule.
 *
 *	x = ROTL(w[i-3] ^ w[i-8] ^ w[i-14] ^ w[i-16], 1)
 *	BODYX(off,...)		stores x as w[i] and performs the round
 *
 * w[i] is the word at off(WREG); the byte displacements -12, -32, -56
 * and -64 are 3, 8, 14 and 16 words back from it.
 * Uses TMP1-TMP4 as scratch; x is built in TMP2.
 */
#define BODY(off,FN,V,A,B,C,D,E)\
	MOVW (off-12)(WREG),TMP4;\
	MOVW (off-32)(WREG),TMP3;\
	MOVW (off-56)(WREG),TMP2;\
	MOVW (off-64)(WREG),TMP1;\
	XOR TMP4,TMP2;\
	XOR TMP3,TMP2;\
	XOR TMP1,TMP2;\
	SLL $1,TMP2,TMP1;\
	SRL $31,TMP2;\
	OR TMP1,TMP2;\
	BODYX(off,FN,V,A,B,C,D,E)
/*
 * FN1(B,C,D): TMP1 = ((C ^ D) & B) ^ D
 * Selects C where a bit of B is set and D where it is clear.
 * B, C and D are left unchanged.  The trailing ';' is required by BODYX.
 */
#define FN1(B,C,D)\
	XOR D,C,TMP1;\
	AND B,TMP1;\
	XOR D,TMP1;
/*
 * FN24(B,C,D): TMP1 = B ^ C ^ D
 * Shared by the second and fourth groups of rounds.
 * B, C and D are left unchanged.  The trailing ';' is required by BODYX.
 */
#define FN24(B,C,D)\
	XOR C,D,TMP1;\
	XOR B,TMP1;
/*
 * FN3(B,C,D): TMP1 = ((B ^ C) & (B ^ D)) ^ B
 * Each result bit is the majority of the corresponding bits of B, C and D.
 * Uses TMP4 as scratch (left holding B ^ D); B, C and D are unchanged.
 * The trailing ';' is required by BODYX.
 */
#define FN3(B,C,D)\
	XOR D,B,TMP4;\
	XOR C,B,TMP1;\
	AND TMP4,TMP1;\
	XOR B,TMP1;
/*
 * Argument offsets from FP.
 * LEN and STATE are used below as len+LEN(FP) and state+STATE(FP).
 * DATA is defined but not referenced by the code below: the data pointer
 * is taken from DATAREG (R1), which is used without ever being loaded.
 *
 * NOTE(review): these offsets imply the argument order (data, len, state).
 * The comment previously here gave the prototype
 *	void vtSha1Block(ulong *STATE, uchar *DATA, int LEN)
 * which matches neither the offsets nor the symbol name _sha1block;
 * confirm the real prototype against the C declaration.
 */
#define DATA 0
#define LEN 4
#define STATE 8
/*
 * Frame offset of the local array, and register assignments.
 *
 *	WARRAY		offset used as warray+WARRAY(SP): start of the
 *			80-word (80*4 byte) message schedule w[]
 *
 *	AREG..EREG	the five working variables a, b, c, d, e
 *	DATAREG		input pointer; advanced by 64 bytes per block
 *	STREG		pointer to the five state words
 *	WREG		cursor into w[]; macro offsets are relative to it
 *	W15REG		w + 15 words: end marker for loop1
 *	W40REG		w + 40 words: end marker for loop2
 *	W60REG		w + 60 words: end marker for loop3
 *	W80REG		w + 80 words: end marker for loop4
 *	EDREG		data + len: end of input
 *	VREG		round constant for the current group of rounds
 *	TMP1..TMP4	scratch used by the BODY and FN macros
 *	TMP5		extra scratch, used only in the final state update
 */
#define WARRAY (-4-(80*4))
#define AREG R5
#define BREG R6
#define CREG R7
#define DREG R8
#define EREG R9
#define DATAREG R1
#define STREG R11
#define WREG R12
#define W15REG R13
#define W60REG R14
#define W40REG R15
#define W80REG R16
#define EDREG R17
#define VREG R18
#define TMP1 R10
#define TMP2 R2
#define TMP3 R3
#define TMP4 R4
#define TMP5 R19
/*
 * Body of _sha1block.
 *
 * Preconditions: DATAREG (R1) holds the input pointer on entry, and len is
 * a multiple of 64.  The outer loop stops only when DATAREG equals EDREG
 * exactly, so any other non-zero length runs past the end of the input.
 *
 * len == 0 returns at once without touching the state.  Without this
 * check the do-while shaped loop would hash 64 bytes that are not part
 * of the input and then never see DATAREG == EDREG.
 */
	MOVW len+LEN(FP),TMP1
	MOVW state+STATE(FP),STREG
	ADDU DATAREG,TMP1,EDREG
	BEQ DATAREG,EDREG,done

	/* a..e = state[0..4] */
	MOVW 0(STREG),AREG
	MOVW 4(STREG),BREG
	MOVW 8(STREG),CREG
	MOVW 12(STREG),DREG
	MOVW 16(STREG),EREG

	/* loop end markers inside w[] */
	MOVW $warray+WARRAY(SP),WREG
	ADDU $(15*4),WREG,W15REG
	ADDU $(40*4),WREG,W40REG
	ADDU $(60*4),WREG,W60REG
	ADDU $(80*4),WREG,W80REG

/*
 * One iteration per 64-byte block.  Every group of five macro calls
 * rotates the roles of the a..e registers instead of moving values.
 */
mainloop:
	MOVW $warray+WARRAY(SP),WREG

	/* rounds 0-14: words read from the input, FN1 */
	MOVW $0x5a827999,VREG
loop1:
	BODY1(0,FN1,VREG,AREG,BREG,CREG,DREG,EREG)
	BODY1(4,FN1,VREG,EREG,AREG,BREG,CREG,DREG)
	BODY1(8,FN1,VREG,DREG,EREG,AREG,BREG,CREG)
	BODY1(12,FN1,VREG,CREG,DREG,EREG,AREG,BREG)
	BODY1(16,FN1,VREG,BREG,CREG,DREG,EREG,AREG)
	ADDU $20,DATAREG
	ADDU $20,WREG
	BNE WREG,W15REG,loop1

	/* round 15: last input word; DATAREG now points at the next block */
	BODY1(0,FN1,VREG,AREG,BREG,CREG,DREG,EREG)
	ADDU $4,DATAREG

	/* rounds 16-19: still FN1, words now come from the schedule */
	BODY(4,FN1,VREG,EREG,AREG,BREG,CREG,DREG)
	BODY(8,FN1,VREG,DREG,EREG,AREG,BREG,CREG)
	BODY(12,FN1,VREG,CREG,DREG,EREG,AREG,BREG)
	BODY(16,FN1,VREG,BREG,CREG,DREG,EREG,AREG)
	ADDU $20,WREG

	/* rounds 20-39: FN24 */
	MOVW $0x6ed9eba1,VREG
loop2:
	BODY(0,FN24,VREG,AREG,BREG,CREG,DREG,EREG)
	BODY(4,FN24,VREG,EREG,AREG,BREG,CREG,DREG)
	BODY(8,FN24,VREG,DREG,EREG,AREG,BREG,CREG)
	BODY(12,FN24,VREG,CREG,DREG,EREG,AREG,BREG)
	BODY(16,FN24,VREG,BREG,CREG,DREG,EREG,AREG)
	ADDU $20,WREG
	BNE WREG,W40REG,loop2

	/* rounds 40-59: FN3 */
	MOVW $0x8f1bbcdc,VREG
loop3:
	BODY(0,FN3,VREG,AREG,BREG,CREG,DREG,EREG)
	BODY(4,FN3,VREG,EREG,AREG,BREG,CREG,DREG)
	BODY(8,FN3,VREG,DREG,EREG,AREG,BREG,CREG)
	BODY(12,FN3,VREG,CREG,DREG,EREG,AREG,BREG)
	BODY(16,FN3,VREG,BREG,CREG,DREG,EREG,AREG)
	ADDU $20,WREG
	BNE WREG,W60REG,loop3

	/* rounds 60-79: FN24 again */
	MOVW $0xca62c1d6,VREG
loop4:
	BODY(0,FN24,VREG,AREG,BREG,CREG,DREG,EREG)
	BODY(4,FN24,VREG,EREG,AREG,BREG,CREG,DREG)
	BODY(8,FN24,VREG,DREG,EREG,AREG,BREG,CREG)
	BODY(12,FN24,VREG,CREG,DREG,EREG,AREG,BREG)
	BODY(16,FN24,VREG,BREG,CREG,DREG,EREG,AREG)
	ADDU $20,WREG
	BNE WREG,W80REG,loop4

	/* state[i] += a..e; the sums stay in AREG..EREG for the next block */
	MOVW 0(STREG),TMP1
	MOVW 4(STREG),TMP2
	MOVW 8(STREG),TMP3
	MOVW 12(STREG),TMP4
	MOVW 16(STREG),TMP5
	ADDU TMP1,AREG
	ADDU TMP2,BREG
	ADDU TMP3,CREG
	ADDU TMP4,DREG
	ADDU TMP5,EREG
	MOVW AREG,0(STREG)
	MOVW BREG,4(STREG)
	MOVW CREG,8(STREG)
	MOVW DREG,12(STREG)
	MOVW EREG,16(STREG)

	BNE DATAREG,EDREG,mainloop
done:
	RET
END
|