evlwwsplat rK,0(rKP);
evlwwsplat rK,4(rKP);
evlwwsplat rK,8(rKP);
evlwwsplat rK,12(rKP);
stwu r1,-128(r1); \
evstdw r14,8(r1); \
evstdw r15,16(r1); \
evstdw r16,24(r1); \
evstdw r17,32(r1); \
evstdw r18,40(r1); \
evstdw r19,48(r1); \
evstdw r20,56(r1); \
evstdw r21,64(r1); \
evstdw r22,72(r1); \
evstdw r23,80(r1);
evldw r14,8(r1); \
evldw r15,16(r1); \
evldw r16,24(r1); \
evldw r17,32(r1); \
evldw r18,40(r1); \
evldw r19,48(r1); \
evldw r20,56(r1); \
evldw r21,64(r1); \
evldw r22,72(r1); \
evldw r23,80(r1); \
xor r0,r0,r0; \
stw r0,8(r1); \
stw r0,16(r1); \
stw r0,24(r1); \
stw r0,32(r1); \
stw r0,40(r1); \
stw r0,48(r1); \
stw r0,56(r1); \
stw r0,64(r1); \
stw r0,72(r1); \
stw r0,80(r1); \
addi r1,r1,128;
lwz reg,off(rWP);
addi rWP,rWP,64;
lwbrx reg,0,rWP; \
addi rWP,rWP,4;
LOAD_DATA(w0, off) \
and rT2,b,c; \
LOAD_K
andc rT1,d,b; \
rotrwi rT0,a,27; \
or rT2,rT2,rT1; \
add e,e,rT0; \
rotrwi b,b,2; \
add e,e,w0; \
LOAD_DATA(w1, off+4) \
add e,e,rT2; \
and rT1,a,b; \
add e,e,rK; \
andc rT2,c,a; \
add d,d,rK; \
or rT2,rT2,rT1; \
rotrwi rT0,e,27; \
add d,d,w1; \
rotrwi a,a,2; \
add d,d,rT0; \
evmergelo w1,w1,w0; \
add d,d,rT2
and rT2,b,c; \
evmergelohi rT0,w7,w6; \
andc rT1,d,b; \
evxor w0,w0,rT0; \
or rT1,rT1,rT2; \
evxor w0,w0,w4; \
add e,e,rT1; \
evxor w0,w0,w1; \
rotrwi rT2,a,27; \
evrlwi w0,w0,1; \
add e,e,rT2; \
evaddw rT0,w0,rK; \
rotrwi b,b,2; \
LOAD_K
evmergehi rT1,rT1,rT0; \
add e,e,rT0; \
add d,d,rT1; \
and rT2,a,b; \
andc rT1,c,a; \
rotrwi rT0,e,27; \
or rT1,rT1,rT2; \
add d,d,rT0; \
rotrwi a,a,2; \
add d,d,rT1
evmergelohi rT0,w7,w6; \
xor rT2,b,c; \
evxor w0,w0,rT0; \
xor rT2,rT2,d; \
evxor w0,w0,w4; \
add e,e,rT2; \
evxor w0,w0,w1; \
rotrwi rT2,a,27; \
evrlwi w0,w0,1; \
add e,e,rT2; \
evaddw rT0,w0,rK; \
rotrwi b,b,2; \
LOAD_K
evmergehi rT1,rT1,rT0; \
add e,e,rT0; \
xor rT2,a,b; \
add d,d,rT1; \
xor rT2,rT2,c; \
rotrwi rT0,e,27; \
add d,d,rT2; \
rotrwi a,a,2; \
add d,d,rT0
and rT2,b,c; \
evmergelohi rT0,w7,w6; \
or rT1,b,c; \
evxor w0,w0,rT0; \
and rT1,d,rT1; \
evxor w0,w0,w4; \
or rT2,rT2,rT1; \
evxor w0,w0,w1; \
add e,e,rT2; \
evrlwi w0,w0,1; \
rotrwi rT2,a,27; \
evaddw rT0,w0,rK; \
add e,e,rT2; \
LOAD_K
evmergehi rT1,rT1,rT0; \
rotrwi b,b,2; \
add e,e,rT0; \
and rT2,a,b; \
or rT0,a,b; \
add d,d,rT1; \
and rT0,c,rT0; \
rotrwi a,a,2; \
or rT2,rT2,rT0; \
rotrwi rT0,e,27; \
add d,d,rT2; \
add d,d,rT0
R_20_39(a, b, c, d, e, w0, w1, w4, w6, w7, k)
_GLOBAL(ppc_spe_sha1_transform)
INITIALIZE
lwz rH0,0(rHP)
lwz rH1,4(rHP)
mtctr r5
lwz rH2,8(rHP)
lis rKP,PPC_SPE_SHA1_K@h
lwz rH3,12(rHP)
ori rKP,rKP,PPC_SPE_SHA1_K@l
lwz rH4,16(rHP)
ppc_spe_sha1_main:
R_00_15(rH0, rH1, rH2, rH3, rH4, rW1, rW0, 1, 0)
R_00_15(rH3, rH4, rH0, rH1, rH2, rW2, rW1, 0, 8)
R_00_15(rH1, rH2, rH3, rH4, rH0, rW3, rW2, 0, 16)
R_00_15(rH4, rH0, rH1, rH2, rH3, rW4, rW3, 0, 24)
R_00_15(rH2, rH3, rH4, rH0, rH1, rW5, rW4, 0, 32)
R_00_15(rH0, rH1, rH2, rH3, rH4, rW6, rW5, 0, 40)
R_00_15(rH3, rH4, rH0, rH1, rH2, rT3, rW6, 0, 48)
R_00_15(rH1, rH2, rH3, rH4, rH0, rT3, rW7, 0, 56)
R_16_19(rH4, rH0, rH1, rH2, rH3, rW0, rW1, rW4, rW6, rW7, 0)
R_16_19(rH2, rH3, rH4, rH0, rH1, rW1, rW2, rW5, rW7, rW0, 2)
R_20_39(rH0, rH1, rH2, rH3, rH4, rW2, rW3, rW6, rW0, rW1, 0)
R_20_39(rH3, rH4, rH0, rH1, rH2, rW3, rW4, rW7, rW1, rW2, 0)
R_20_39(rH1, rH2, rH3, rH4, rH0, rW4, rW5, rW0, rW2, rW3, 0)
R_20_39(rH4, rH0, rH1, rH2, rH3, rW5, rW6, rW1, rW3, rW4, 0)
R_20_39(rH2, rH3, rH4, rH0, rH1, rW6, rW7, rW2, rW4, rW5, 0)
R_20_39(rH0, rH1, rH2, rH3, rH4, rW7, rW0, rW3, rW5, rW6, 0)
R_20_39(rH3, rH4, rH0, rH1, rH2, rW0, rW1, rW4, rW6, rW7, 0)
R_20_39(rH1, rH2, rH3, rH4, rH0, rW1, rW2, rW5, rW7, rW0, 0)
R_20_39(rH4, rH0, rH1, rH2, rH3, rW2, rW3, rW6, rW0, rW1, 0)
R_20_39(rH2, rH3, rH4, rH0, rH1, rW3, rW4, rW7, rW1, rW2, 3)
R_40_59(rH0, rH1, rH2, rH3, rH4, rW4, rW5, rW0, rW2, rW3, 0)
R_40_59(rH3, rH4, rH0, rH1, rH2, rW5, rW6, rW1, rW3, rW4, 0)
R_40_59(rH1, rH2, rH3, rH4, rH0, rW6, rW7, rW2, rW4, rW5, 0)
R_40_59(rH4, rH0, rH1, rH2, rH3, rW7, rW0, rW3, rW5, rW6, 0)
R_40_59(rH2, rH3, rH4, rH0, rH1, rW0, rW1, rW4, rW6, rW7, 0)
R_40_59(rH0, rH1, rH2, rH3, rH4, rW1, rW2, rW5, rW7, rW0, 0)
R_40_59(rH3, rH4, rH0, rH1, rH2, rW2, rW3, rW6, rW0, rW1, 0)
R_40_59(rH1, rH2, rH3, rH4, rH0, rW3, rW4, rW7, rW1, rW2, 0)
R_40_59(rH4, rH0, rH1, rH2, rH3, rW4, rW5, rW0, rW2, rW3, 0)
R_40_59(rH2, rH3, rH4, rH0, rH1, rW5, rW6, rW1, rW3, rW4, 4)
R_60_79(rH0, rH1, rH2, rH3, rH4, rW6, rW7, rW2, rW4, rW5, 0)
R_60_79(rH3, rH4, rH0, rH1, rH2, rW7, rW0, rW3, rW5, rW6, 0)
R_60_79(rH1, rH2, rH3, rH4, rH0, rW0, rW1, rW4, rW6, rW7, 0)
R_60_79(rH4, rH0, rH1, rH2, rH3, rW1, rW2, rW5, rW7, rW0, 0)
R_60_79(rH2, rH3, rH4, rH0, rH1, rW2, rW3, rW6, rW0, rW1, 0)
R_60_79(rH0, rH1, rH2, rH3, rH4, rW3, rW4, rW7, rW1, rW2, 0)
R_60_79(rH3, rH4, rH0, rH1, rH2, rW4, rW5, rW0, rW2, rW3, 0)
lwz rT3,0(rHP)
R_60_79(rH1, rH2, rH3, rH4, rH0, rW5, rW6, rW1, rW3, rW4, 0)
lwz rW1,4(rHP)
R_60_79(rH4, rH0, rH1, rH2, rH3, rW6, rW7, rW2, rW4, rW5, 0)
lwz rW2,8(rHP)
R_60_79(rH2, rH3, rH4, rH0, rH1, rW7, rW0, rW3, rW5, rW6, 0)
lwz rW3,12(rHP)
NEXT_BLOCK
lwz rW4,16(rHP)
add rH0,rH0,rT3
stw rH0,0(rHP)
add rH1,rH1,rW1
stw rH1,4(rHP)
add rH2,rH2,rW2
stw rH2,8(rHP)
add rH3,rH3,rW3
stw rH3,12(rHP)
add rH4,rH4,rW4
stw rH4,16(rHP)
bdnz ppc_spe_sha1_main
FINALIZE
blr
.data
.align 4
PPC_SPE_SHA1_K:
.long 0x5A827999,0x6ED9EBA1,0x8F1BBCDC,0xCA62C1D6