/*
 * SHA-1 block transform, Plan 9 MIPS assembler.
 *
 *	void _sha1block(uchar *data, ulong len, ulong *state)
 *
 * data		input bytes; read directly from DATAREG (R1), which is
 *		never loaded from the frame, so the first argument is
 *		expected to arrive in that register.
 * len		byte count, fetched from len+LEN(FP).  Must be a multiple
 *		of 64: the block loop exits only when the data pointer
 *		is exactly equal to data+len.  A len of 0 returns at once
 *		without touching state.
 * state	five 32-bit chaining words, read at entry and written
 *		back after every 64-byte block.
 *
 * Frame: $328 bytes, of which 80*4 hold the message schedule w[80]
 * addressed through WARRAY.
 */
TEXT	_sha1block+0(SB),$328

/*
 * One round, with the schedule word x already in TMP2 (FN leaves
 * its result in TMP1):
 *	E += FN(B,C,D);
 *	E += V;			V is the round constant of the current stage
 *	wp[off] = x;
 *	E += x;
 *	E += A <<< 5;
 *	B = B >>> 2;		i.e. B <<< 30
 * Clobbers TMP1, TMP3, TMP4.
 */
#define BODYX(off,FN,V,A,B,C,D,E)\
	FN(B,C,D)\
	ADDU TMP1,E;\
	ADDU V,E;\
	MOVW TMP2,off(WREG);\
	ADDU TMP2,E;\
	SLL $5,A,TMP3;\
	SRL $27,A,TMP4;\
	OR TMP3,TMP4;\
	ADDU TMP4,E;\
	SLL $30,B,TMP4;\
	SRL $2,B;\
	OR TMP4,B

/*
 * Rounds that take x straight from the input:
 *	x = data[off]<<24 | data[off+1]<<16 | data[off+2]<<8 | data[off+3];
 *	BODYX
 * The word is assembled from four byte loads, most significant
 * byte first.
 */
#define BODY1(off,FN,V,A,B,C,D,E)\
	MOVBU off(DATAREG),TMP2;\
	MOVBU (off+1)(DATAREG),TMP3;\
	MOVBU (off+2)(DATAREG),TMP1;\
	MOVBU (off+3)(DATAREG),TMP4;\
	SLL $24,TMP2;\
	SLL $16,TMP3;\
	OR TMP3,TMP2;\
	SLL $8,TMP1;\
	OR TMP1,TMP2;\
	OR TMP4,TMP2;\
	BODYX(off,FN,V,A,B,C,D,E)

/*
 * Rounds that derive x from earlier schedule words (indices in words,
 * the macro offsets are the same distances in bytes):
 *	x = (wp[off-3] ^ wp[off-8] ^ wp[off-14] ^ wp[off-16]) <<< 1;
 *	BODYX
 */
#define BODY(off,FN,V,A,B,C,D,E)\
	MOVW (off-64)(WREG),TMP1;\
	MOVW (off-56)(WREG),TMP2;\
	MOVW (off-32)(WREG),TMP3;\
	MOVW (off-12)(WREG),TMP4;\
	XOR TMP1,TMP2;\
	XOR TMP3,TMP2;\
	XOR TMP4,TMP2;\
	SLL $1,TMP2,TMP1;\
	SRL $31,TMP2;\
	OR TMP1,TMP2;\
	BODYX(off,FN,V,A,B,C,D,E)

/*
 * fn1 = (((C^D)&B)^D);		result in TMP1
 */
#define FN1(B,C,D)\
	XOR C,D,TMP1;\
	AND B,TMP1;\
	XOR D,TMP1;

/*
 * fn24 = B ^ C ^ D		result in TMP1
 */
#define FN24(B,C,D)\
	XOR B,C,TMP1;\
	XOR D,TMP1;

/*
 * fn3 = ((B ^ C) & (D ^ B)) ^ B	result in TMP1, also clobbers TMP4
 */
#define FN3(B,C,D)\
	XOR B,C,TMP1;\
	XOR B,D,TMP4;\
	AND TMP4,TMP1;\
	XOR B,TMP1;

/*
 * argument offsets from FP, in declaration order:
 *	void _sha1block(uchar *DATA, ulong LEN, ulong *STATE)
 * DATA is listed for completeness only; the code below uses DATAREG.
 */
#define	DATA	0
#define	LEN	4
#define	STATE	8

/*
 * stack offset of the only local kept in memory
 *	ulong w[80];
 */
#define	WARRAY	(-4-(80*4))

/*
 * register assignments
 *	AREG..EREG	working variables a, b, c, d, e
 *	DATAREG		current input pointer
 *	STREG		pointer to the caller's state words
 *	WREG		wp, cursor into w[]
 *	W15REG..W80REG	&w[15], &w[40], &w[60], &w[80]: loop end marks
 *	EDREG		edata = data + len
 *	VREG		round constant of the current stage
 *	TMP1..TMP5	scratch
 */
#define	AREG	R5
#define	BREG	R6
#define	CREG	R7
#define	DREG	R8
#define	EREG	R9
#define	DATAREG	R1
#define	STREG	R11
#define	WREG	R12
#define	W15REG	R13
#define	W60REG	R14
#define	W40REG	R15
#define	W80REG	R16
#define	EDREG	R17
#define	VREG	R18

#define	TMP1	R10
#define	TMP2	R2
#define	TMP3	R3
#define	TMP4	R4
#define	TMP5	R19

	MOVW	len+LEN(FP),TMP1
	MOVW	state+STATE(FP),STREG
	ADDU	DATAREG,TMP1,EDREG		/* edata = data + len */

	/*
	 * The block loop below tests its exit condition only after a
	 * block has been consumed, so an empty input has to be turned
	 * away here; otherwise 64 bytes would be hashed and the data
	 * pointer would already be past edata.
	 */
	BEQ	DATAREG,EDREG,done

	MOVW	0(STREG),AREG
	MOVW	4(STREG),BREG
	MOVW	8(STREG),CREG
	MOVW	12(STREG),DREG
	MOVW	16(STREG),EREG

	MOVW	$warray+WARRAY(SP),WREG
	ADDU	$(15*4),WREG,W15REG
	ADDU	$(40*4),WREG,W40REG
	ADDU	$(60*4),WREG,W60REG
	ADDU	$(80*4),WREG,W80REG

	/* one trip per 64-byte block; a..e carry over between blocks */
mainloop:
	MOVW	$warray+WARRAY(SP),WREG

	/* rounds 0-14: schedule words come straight from the input */
	MOVW	$0x5a827999,VREG
loop1:
	BODY1(0,FN1,VREG,AREG,BREG,CREG,DREG,EREG)
	BODY1(4,FN1,VREG,EREG,AREG,BREG,CREG,DREG)
	BODY1(8,FN1,VREG,DREG,EREG,AREG,BREG,CREG)
	BODY1(12,FN1,VREG,CREG,DREG,EREG,AREG,BREG)
	BODY1(16,FN1,VREG,BREG,CREG,DREG,EREG,AREG)

	ADDU	$20,DATAREG
	ADDU	$20,WREG
	BNE	WREG,W15REG,loop1

	/* round 15 takes the last input word, rounds 16-19 are derived */
	BODY1(0,FN1,VREG,AREG,BREG,CREG,DREG,EREG)
	ADDU	$4,DATAREG

	BODY(4,FN1,VREG,EREG,AREG,BREG,CREG,DREG)
	BODY(8,FN1,VREG,DREG,EREG,AREG,BREG,CREG)
	BODY(12,FN1,VREG,CREG,DREG,EREG,AREG,BREG)
	BODY(16,FN1,VREG,BREG,CREG,DREG,EREG,AREG)

	ADDU	$20,WREG

	/* rounds 20-39 */
	MOVW	$0x6ed9eba1,VREG
loop2:
	BODY(0,FN24,VREG,AREG,BREG,CREG,DREG,EREG)
	BODY(4,FN24,VREG,EREG,AREG,BREG,CREG,DREG)
	BODY(8,FN24,VREG,DREG,EREG,AREG,BREG,CREG)
	BODY(12,FN24,VREG,CREG,DREG,EREG,AREG,BREG)
	BODY(16,FN24,VREG,BREG,CREG,DREG,EREG,AREG)

	ADDU	$20,WREG
	BNE	WREG,W40REG,loop2

	/* rounds 40-59 */
	MOVW	$0x8f1bbcdc,VREG
loop3:
	BODY(0,FN3,VREG,AREG,BREG,CREG,DREG,EREG)
	BODY(4,FN3,VREG,EREG,AREG,BREG,CREG,DREG)
	BODY(8,FN3,VREG,DREG,EREG,AREG,BREG,CREG)
	BODY(12,FN3,VREG,CREG,DREG,EREG,AREG,BREG)
	BODY(16,FN3,VREG,BREG,CREG,DREG,EREG,AREG)

	ADDU	$20,WREG
	BNE	WREG,W60REG,loop3

	/* rounds 60-79 */
	MOVW	$0xca62c1d6,VREG
loop4:
	BODY(0,FN24,VREG,AREG,BREG,CREG,DREG,EREG)
	BODY(4,FN24,VREG,EREG,AREG,BREG,CREG,DREG)
	BODY(8,FN24,VREG,DREG,EREG,AREG,BREG,CREG)
	BODY(12,FN24,VREG,CREG,DREG,EREG,AREG,BREG)
	BODY(16,FN24,VREG,BREG,CREG,DREG,EREG,AREG)

	ADDU	$20,WREG
	BNE	WREG,W80REG,loop4

	/* fold this block into the caller's state and store it back */
	MOVW	0(STREG),TMP1
	MOVW	4(STREG),TMP2
	MOVW	8(STREG),TMP3
	MOVW	12(STREG),TMP4
	MOVW	16(STREG),TMP5

	ADDU	TMP1,AREG
	ADDU	TMP2,BREG
	ADDU	TMP3,CREG
	ADDU	TMP4,DREG
	ADDU	TMP5,EREG

	MOVW	AREG,0(STREG)
	MOVW	BREG,4(STREG)
	MOVW	CREG,8(STREG)
	MOVW	DREG,12(STREG)
	MOVW	EREG,16(STREG)

	BNE	DATAREG,EDREG,mainloop

done:
	RET

	END