2778 lines
61 KiB
ArmAsm
2778 lines
61 KiB
ArmAsm
/* $FreeBSD$ */
|
|
/* Do not modify. This file is auto-generated from sha256-armv4.pl. */
|
|
|
|
@ ====================================================================
|
|
@ Written by Andy Polyakov <appro@openssl.org> for the OpenSSL
|
|
@ project. The module is, however, dual licensed under OpenSSL and
|
|
@ CRYPTOGAMS licenses depending on where you obtain it. For further
|
|
@ details see http://www.openssl.org/~appro/cryptogams/.
|
|
@
|
|
@ Permission to use under GPL terms is granted.
|
|
@ ====================================================================
|
|
|
|
@ SHA256 block procedure for ARMv4. May 2007.
|
|
|
|
@ Performance is ~2x better than gcc 3.4 generated code and in "abso-
|
|
@ lute" terms is ~2250 cycles per 64-byte block or ~35 cycles per
|
|
@ byte [on single-issue Xscale PXA250 core].
|
|
|
|
@ July 2010.
|
|
@
|
|
@ Rescheduling for dual-issue pipeline resulted in 22% improvement on
|
|
@ Cortex A8 core and ~20 cycles per processed byte.
|
|
|
|
@ February 2011.
|
|
@
|
|
@ Profiler-assisted and platform-specific optimization resulted in 16%
|
|
@ improvement on Cortex A8 core and ~15.4 cycles per processed byte.
|
|
|
|
@ September 2013.
|
|
@
|
|
@ Add NEON implementation. On Cortex A8 it was measured to process one
|
|
@ byte in 12.5 cycles or 23% faster than integer-only code. Snapdragon
|
|
@ S4 does it in 12.5 cycles too, but it's 50% faster than integer-only
|
|
@ code (meaning that latter performs sub-optimally, nothing was done
|
|
@ about it).
|
|
|
|
@ May 2014.
|
|
@
|
|
@ Add ARMv8 code path performing at 2.0 cpb on Apple A7.
|
|
|
|
#ifndef __KERNEL__
|
|
# include "arm_arch.h"
|
|
#else
|
|
# define __ARM_ARCH__ __LINUX_ARM_ARCH__
|
|
# define __ARM_MAX_ARCH__ 7
|
|
#endif
|
|
|
|
.text
|
|
#if __ARM_ARCH__<7
|
|
.code 32
|
|
#else
|
|
.syntax unified
|
|
# ifdef __thumb2__
|
|
.thumb
|
|
# else
|
|
.code 32
|
|
# endif
|
|
#endif
|
|
|
|
.type K256,%object
|
|
.align 5
|
|
K256:
|
|
.word 0x428a2f98,0x71374491,0xb5c0fbcf,0xe9b5dba5
|
|
.word 0x3956c25b,0x59f111f1,0x923f82a4,0xab1c5ed5
|
|
.word 0xd807aa98,0x12835b01,0x243185be,0x550c7dc3
|
|
.word 0x72be5d74,0x80deb1fe,0x9bdc06a7,0xc19bf174
|
|
.word 0xe49b69c1,0xefbe4786,0x0fc19dc6,0x240ca1cc
|
|
.word 0x2de92c6f,0x4a7484aa,0x5cb0a9dc,0x76f988da
|
|
.word 0x983e5152,0xa831c66d,0xb00327c8,0xbf597fc7
|
|
.word 0xc6e00bf3,0xd5a79147,0x06ca6351,0x14292967
|
|
.word 0x27b70a85,0x2e1b2138,0x4d2c6dfc,0x53380d13
|
|
.word 0x650a7354,0x766a0abb,0x81c2c92e,0x92722c85
|
|
.word 0xa2bfe8a1,0xa81a664b,0xc24b8b70,0xc76c51a3
|
|
.word 0xd192e819,0xd6990624,0xf40e3585,0x106aa070
|
|
.word 0x19a4c116,0x1e376c08,0x2748774c,0x34b0bcb5
|
|
.word 0x391c0cb3,0x4ed8aa4a,0x5b9cca4f,0x682e6ff3
|
|
.word 0x748f82ee,0x78a5636f,0x84c87814,0x8cc70208
|
|
.word 0x90befffa,0xa4506ceb,0xbef9a3f7,0xc67178f2
|
|
.size K256,.-K256
|
|
.word 0 @ terminator
|
|
#if __ARM_MAX_ARCH__>=7 && !defined(__KERNEL__)
|
|
.LOPENSSL_armcap:
|
|
.word OPENSSL_armcap_P-sha256_block_data_order
|
|
#endif
|
|
.align 5
|
|
|
|
.global sha256_block_data_order
|
|
.type sha256_block_data_order,%function
|
|
sha256_block_data_order:
|
|
#if __ARM_ARCH__<7
|
|
sub r3,pc,#8 @ sha256_block_data_order
|
|
#else
|
|
adr r3,.
|
|
#endif
|
|
#if __ARM_MAX_ARCH__>=7 && !defined(__KERNEL__)
|
|
ldr r12,.LOPENSSL_armcap
|
|
ldr r12,[r3,r12] @ OPENSSL_armcap_P
|
|
tst r12,#ARMV8_SHA256
|
|
bne .LARMv8
|
|
tst r12,#ARMV7_NEON
|
|
bne .LNEON
|
|
#endif
|
|
add r2,r1,r2,lsl#6 @ len to point at the end of inp
|
|
stmdb sp!,{r0,r1,r2,r4-r11,lr}
|
|
ldmia r0,{r4,r5,r6,r7,r8,r9,r10,r11}
|
|
sub r14,r3,#256+32 @ K256
|
|
sub sp,sp,#16*4 @ alloca(X[16])
|
|
.Loop:
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r5,r6 @ magic
|
|
eor r12,r12,r12
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 0
|
|
# if 0==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r8,r8,ror#5
|
|
add r4,r4,r12 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r8,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 0
|
|
add r4,r4,r12 @ h+=Maj(a,b,c) from the past
|
|
ldrb r12,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r12,lsl#8
|
|
ldrb r12,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 0==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r8,r8,ror#5
|
|
orr r2,r2,r12,lsl#24
|
|
eor r0,r0,r8,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r11,r11,r2 @ h+=X[i]
|
|
str r2,[sp,#0*4]
|
|
eor r2,r9,r10
|
|
add r11,r11,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r8
|
|
add r11,r11,r12 @ h+=K256[i]
|
|
eor r2,r2,r10 @ Ch(e,f,g)
|
|
eor r0,r4,r4,ror#11
|
|
add r11,r11,r2 @ h+=Ch(e,f,g)
|
|
#if 0==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 0<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r4,r5 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#2*4] @ from future BODY_16_xx
|
|
eor r12,r4,r5 @ a^b, b^c in next round
|
|
ldr r1,[sp,#15*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r4,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r7,r7,r11 @ d+=h
|
|
eor r3,r3,r5 @ Maj(a,b,c)
|
|
add r11,r11,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r11,r11,r3 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 1
|
|
# if 1==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r7,r7,ror#5
|
|
add r11,r11,r3 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r7,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 1
|
|
add r11,r11,r3 @ h+=Maj(a,b,c) from the past
|
|
ldrb r3,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r3,lsl#8
|
|
ldrb r3,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 1==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r7,r7,ror#5
|
|
orr r2,r2,r3,lsl#24
|
|
eor r0,r0,r7,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r10,r10,r2 @ h+=X[i]
|
|
str r2,[sp,#1*4]
|
|
eor r2,r8,r9
|
|
add r10,r10,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r7
|
|
add r10,r10,r3 @ h+=K256[i]
|
|
eor r2,r2,r9 @ Ch(e,f,g)
|
|
eor r0,r11,r11,ror#11
|
|
add r10,r10,r2 @ h+=Ch(e,f,g)
|
|
#if 1==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 1<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r11,r4 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#3*4] @ from future BODY_16_xx
|
|
eor r3,r11,r4 @ a^b, b^c in next round
|
|
ldr r1,[sp,#0*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r11,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r6,r6,r10 @ d+=h
|
|
eor r12,r12,r4 @ Maj(a,b,c)
|
|
add r10,r10,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r10,r10,r12 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 2
|
|
# if 2==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r6,r6,ror#5
|
|
add r10,r10,r12 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r6,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 2
|
|
add r10,r10,r12 @ h+=Maj(a,b,c) from the past
|
|
ldrb r12,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r12,lsl#8
|
|
ldrb r12,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 2==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r6,r6,ror#5
|
|
orr r2,r2,r12,lsl#24
|
|
eor r0,r0,r6,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r9,r9,r2 @ h+=X[i]
|
|
str r2,[sp,#2*4]
|
|
eor r2,r7,r8
|
|
add r9,r9,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r6
|
|
add r9,r9,r12 @ h+=K256[i]
|
|
eor r2,r2,r8 @ Ch(e,f,g)
|
|
eor r0,r10,r10,ror#11
|
|
add r9,r9,r2 @ h+=Ch(e,f,g)
|
|
#if 2==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 2<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r10,r11 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#4*4] @ from future BODY_16_xx
|
|
eor r12,r10,r11 @ a^b, b^c in next round
|
|
ldr r1,[sp,#1*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r10,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r5,r5,r9 @ d+=h
|
|
eor r3,r3,r11 @ Maj(a,b,c)
|
|
add r9,r9,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r9,r9,r3 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 3
|
|
# if 3==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r5,r5,ror#5
|
|
add r9,r9,r3 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r5,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 3
|
|
add r9,r9,r3 @ h+=Maj(a,b,c) from the past
|
|
ldrb r3,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r3,lsl#8
|
|
ldrb r3,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 3==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r5,r5,ror#5
|
|
orr r2,r2,r3,lsl#24
|
|
eor r0,r0,r5,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r8,r8,r2 @ h+=X[i]
|
|
str r2,[sp,#3*4]
|
|
eor r2,r6,r7
|
|
add r8,r8,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r5
|
|
add r8,r8,r3 @ h+=K256[i]
|
|
eor r2,r2,r7 @ Ch(e,f,g)
|
|
eor r0,r9,r9,ror#11
|
|
add r8,r8,r2 @ h+=Ch(e,f,g)
|
|
#if 3==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 3<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r9,r10 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#5*4] @ from future BODY_16_xx
|
|
eor r3,r9,r10 @ a^b, b^c in next round
|
|
ldr r1,[sp,#2*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r9,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r4,r4,r8 @ d+=h
|
|
eor r12,r12,r10 @ Maj(a,b,c)
|
|
add r8,r8,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r8,r8,r12 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 4
|
|
# if 4==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r4,r4,ror#5
|
|
add r8,r8,r12 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r4,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 4
|
|
add r8,r8,r12 @ h+=Maj(a,b,c) from the past
|
|
ldrb r12,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r12,lsl#8
|
|
ldrb r12,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 4==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r4,r4,ror#5
|
|
orr r2,r2,r12,lsl#24
|
|
eor r0,r0,r4,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r7,r7,r2 @ h+=X[i]
|
|
str r2,[sp,#4*4]
|
|
eor r2,r5,r6
|
|
add r7,r7,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r4
|
|
add r7,r7,r12 @ h+=K256[i]
|
|
eor r2,r2,r6 @ Ch(e,f,g)
|
|
eor r0,r8,r8,ror#11
|
|
add r7,r7,r2 @ h+=Ch(e,f,g)
|
|
#if 4==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 4<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r8,r9 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#6*4] @ from future BODY_16_xx
|
|
eor r12,r8,r9 @ a^b, b^c in next round
|
|
ldr r1,[sp,#3*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r8,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r11,r11,r7 @ d+=h
|
|
eor r3,r3,r9 @ Maj(a,b,c)
|
|
add r7,r7,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r7,r7,r3 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 5
|
|
# if 5==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r11,r11,ror#5
|
|
add r7,r7,r3 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r11,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 5
|
|
add r7,r7,r3 @ h+=Maj(a,b,c) from the past
|
|
ldrb r3,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r3,lsl#8
|
|
ldrb r3,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 5==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r11,r11,ror#5
|
|
orr r2,r2,r3,lsl#24
|
|
eor r0,r0,r11,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r6,r6,r2 @ h+=X[i]
|
|
str r2,[sp,#5*4]
|
|
eor r2,r4,r5
|
|
add r6,r6,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r11
|
|
add r6,r6,r3 @ h+=K256[i]
|
|
eor r2,r2,r5 @ Ch(e,f,g)
|
|
eor r0,r7,r7,ror#11
|
|
add r6,r6,r2 @ h+=Ch(e,f,g)
|
|
#if 5==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 5<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r7,r8 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#7*4] @ from future BODY_16_xx
|
|
eor r3,r7,r8 @ a^b, b^c in next round
|
|
ldr r1,[sp,#4*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r7,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r10,r10,r6 @ d+=h
|
|
eor r12,r12,r8 @ Maj(a,b,c)
|
|
add r6,r6,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r6,r6,r12 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 6
|
|
# if 6==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r10,r10,ror#5
|
|
add r6,r6,r12 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r10,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 6
|
|
add r6,r6,r12 @ h+=Maj(a,b,c) from the past
|
|
ldrb r12,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r12,lsl#8
|
|
ldrb r12,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 6==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r10,r10,ror#5
|
|
orr r2,r2,r12,lsl#24
|
|
eor r0,r0,r10,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r5,r5,r2 @ h+=X[i]
|
|
str r2,[sp,#6*4]
|
|
eor r2,r11,r4
|
|
add r5,r5,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r10
|
|
add r5,r5,r12 @ h+=K256[i]
|
|
eor r2,r2,r4 @ Ch(e,f,g)
|
|
eor r0,r6,r6,ror#11
|
|
add r5,r5,r2 @ h+=Ch(e,f,g)
|
|
#if 6==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 6<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r6,r7 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#8*4] @ from future BODY_16_xx
|
|
eor r12,r6,r7 @ a^b, b^c in next round
|
|
ldr r1,[sp,#5*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r6,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r9,r9,r5 @ d+=h
|
|
eor r3,r3,r7 @ Maj(a,b,c)
|
|
add r5,r5,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r5,r5,r3 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 7
|
|
# if 7==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r9,r9,ror#5
|
|
add r5,r5,r3 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r9,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 7
|
|
add r5,r5,r3 @ h+=Maj(a,b,c) from the past
|
|
ldrb r3,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r3,lsl#8
|
|
ldrb r3,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 7==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r9,r9,ror#5
|
|
orr r2,r2,r3,lsl#24
|
|
eor r0,r0,r9,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r4,r4,r2 @ h+=X[i]
|
|
str r2,[sp,#7*4]
|
|
eor r2,r10,r11
|
|
add r4,r4,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r9
|
|
add r4,r4,r3 @ h+=K256[i]
|
|
eor r2,r2,r11 @ Ch(e,f,g)
|
|
eor r0,r5,r5,ror#11
|
|
add r4,r4,r2 @ h+=Ch(e,f,g)
|
|
#if 7==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 7<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r5,r6 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#9*4] @ from future BODY_16_xx
|
|
eor r3,r5,r6 @ a^b, b^c in next round
|
|
ldr r1,[sp,#6*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r5,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r8,r8,r4 @ d+=h
|
|
eor r12,r12,r6 @ Maj(a,b,c)
|
|
add r4,r4,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r4,r4,r12 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 8
|
|
# if 8==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r8,r8,ror#5
|
|
add r4,r4,r12 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r8,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 8
|
|
add r4,r4,r12 @ h+=Maj(a,b,c) from the past
|
|
ldrb r12,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r12,lsl#8
|
|
ldrb r12,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 8==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r8,r8,ror#5
|
|
orr r2,r2,r12,lsl#24
|
|
eor r0,r0,r8,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r11,r11,r2 @ h+=X[i]
|
|
str r2,[sp,#8*4]
|
|
eor r2,r9,r10
|
|
add r11,r11,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r8
|
|
add r11,r11,r12 @ h+=K256[i]
|
|
eor r2,r2,r10 @ Ch(e,f,g)
|
|
eor r0,r4,r4,ror#11
|
|
add r11,r11,r2 @ h+=Ch(e,f,g)
|
|
#if 8==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 8<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r4,r5 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#10*4] @ from future BODY_16_xx
|
|
eor r12,r4,r5 @ a^b, b^c in next round
|
|
ldr r1,[sp,#7*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r4,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r7,r7,r11 @ d+=h
|
|
eor r3,r3,r5 @ Maj(a,b,c)
|
|
add r11,r11,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r11,r11,r3 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 9
|
|
# if 9==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r7,r7,ror#5
|
|
add r11,r11,r3 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r7,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 9
|
|
add r11,r11,r3 @ h+=Maj(a,b,c) from the past
|
|
ldrb r3,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r3,lsl#8
|
|
ldrb r3,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 9==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r7,r7,ror#5
|
|
orr r2,r2,r3,lsl#24
|
|
eor r0,r0,r7,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r10,r10,r2 @ h+=X[i]
|
|
str r2,[sp,#9*4]
|
|
eor r2,r8,r9
|
|
add r10,r10,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r7
|
|
add r10,r10,r3 @ h+=K256[i]
|
|
eor r2,r2,r9 @ Ch(e,f,g)
|
|
eor r0,r11,r11,ror#11
|
|
add r10,r10,r2 @ h+=Ch(e,f,g)
|
|
#if 9==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 9<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r11,r4 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#11*4] @ from future BODY_16_xx
|
|
eor r3,r11,r4 @ a^b, b^c in next round
|
|
ldr r1,[sp,#8*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r11,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r6,r6,r10 @ d+=h
|
|
eor r12,r12,r4 @ Maj(a,b,c)
|
|
add r10,r10,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r10,r10,r12 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 10
|
|
# if 10==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r6,r6,ror#5
|
|
add r10,r10,r12 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r6,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 10
|
|
add r10,r10,r12 @ h+=Maj(a,b,c) from the past
|
|
ldrb r12,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r12,lsl#8
|
|
ldrb r12,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 10==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r6,r6,ror#5
|
|
orr r2,r2,r12,lsl#24
|
|
eor r0,r0,r6,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r9,r9,r2 @ h+=X[i]
|
|
str r2,[sp,#10*4]
|
|
eor r2,r7,r8
|
|
add r9,r9,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r6
|
|
add r9,r9,r12 @ h+=K256[i]
|
|
eor r2,r2,r8 @ Ch(e,f,g)
|
|
eor r0,r10,r10,ror#11
|
|
add r9,r9,r2 @ h+=Ch(e,f,g)
|
|
#if 10==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 10<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r10,r11 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#12*4] @ from future BODY_16_xx
|
|
eor r12,r10,r11 @ a^b, b^c in next round
|
|
ldr r1,[sp,#9*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r10,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r5,r5,r9 @ d+=h
|
|
eor r3,r3,r11 @ Maj(a,b,c)
|
|
add r9,r9,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r9,r9,r3 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 11
|
|
# if 11==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r5,r5,ror#5
|
|
add r9,r9,r3 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r5,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 11
|
|
add r9,r9,r3 @ h+=Maj(a,b,c) from the past
|
|
ldrb r3,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r3,lsl#8
|
|
ldrb r3,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 11==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r5,r5,ror#5
|
|
orr r2,r2,r3,lsl#24
|
|
eor r0,r0,r5,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r8,r8,r2 @ h+=X[i]
|
|
str r2,[sp,#11*4]
|
|
eor r2,r6,r7
|
|
add r8,r8,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r5
|
|
add r8,r8,r3 @ h+=K256[i]
|
|
eor r2,r2,r7 @ Ch(e,f,g)
|
|
eor r0,r9,r9,ror#11
|
|
add r8,r8,r2 @ h+=Ch(e,f,g)
|
|
#if 11==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 11<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r9,r10 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#13*4] @ from future BODY_16_xx
|
|
eor r3,r9,r10 @ a^b, b^c in next round
|
|
ldr r1,[sp,#10*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r9,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r4,r4,r8 @ d+=h
|
|
eor r12,r12,r10 @ Maj(a,b,c)
|
|
add r8,r8,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r8,r8,r12 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 12
|
|
# if 12==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r4,r4,ror#5
|
|
add r8,r8,r12 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r4,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 12
|
|
add r8,r8,r12 @ h+=Maj(a,b,c) from the past
|
|
ldrb r12,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r12,lsl#8
|
|
ldrb r12,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 12==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r4,r4,ror#5
|
|
orr r2,r2,r12,lsl#24
|
|
eor r0,r0,r4,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r7,r7,r2 @ h+=X[i]
|
|
str r2,[sp,#12*4]
|
|
eor r2,r5,r6
|
|
add r7,r7,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r4
|
|
add r7,r7,r12 @ h+=K256[i]
|
|
eor r2,r2,r6 @ Ch(e,f,g)
|
|
eor r0,r8,r8,ror#11
|
|
add r7,r7,r2 @ h+=Ch(e,f,g)
|
|
#if 12==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 12<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r8,r9 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#14*4] @ from future BODY_16_xx
|
|
eor r12,r8,r9 @ a^b, b^c in next round
|
|
ldr r1,[sp,#11*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r8,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r11,r11,r7 @ d+=h
|
|
eor r3,r3,r9 @ Maj(a,b,c)
|
|
add r7,r7,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r7,r7,r3 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 13
|
|
# if 13==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r11,r11,ror#5
|
|
add r7,r7,r3 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r11,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 13
|
|
add r7,r7,r3 @ h+=Maj(a,b,c) from the past
|
|
ldrb r3,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r3,lsl#8
|
|
ldrb r3,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 13==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r11,r11,ror#5
|
|
orr r2,r2,r3,lsl#24
|
|
eor r0,r0,r11,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r6,r6,r2 @ h+=X[i]
|
|
str r2,[sp,#13*4]
|
|
eor r2,r4,r5
|
|
add r6,r6,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r11
|
|
add r6,r6,r3 @ h+=K256[i]
|
|
eor r2,r2,r5 @ Ch(e,f,g)
|
|
eor r0,r7,r7,ror#11
|
|
add r6,r6,r2 @ h+=Ch(e,f,g)
|
|
#if 13==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 13<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r7,r8 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#15*4] @ from future BODY_16_xx
|
|
eor r3,r7,r8 @ a^b, b^c in next round
|
|
ldr r1,[sp,#12*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r7,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r10,r10,r6 @ d+=h
|
|
eor r12,r12,r8 @ Maj(a,b,c)
|
|
add r6,r6,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r6,r6,r12 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 14
|
|
# if 14==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r10,r10,ror#5
|
|
add r6,r6,r12 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r10,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 14
|
|
add r6,r6,r12 @ h+=Maj(a,b,c) from the past
|
|
ldrb r12,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r12,lsl#8
|
|
ldrb r12,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 14==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r10,r10,ror#5
|
|
orr r2,r2,r12,lsl#24
|
|
eor r0,r0,r10,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r5,r5,r2 @ h+=X[i]
|
|
str r2,[sp,#14*4]
|
|
eor r2,r11,r4
|
|
add r5,r5,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r10
|
|
add r5,r5,r12 @ h+=K256[i]
|
|
eor r2,r2,r4 @ Ch(e,f,g)
|
|
eor r0,r6,r6,ror#11
|
|
add r5,r5,r2 @ h+=Ch(e,f,g)
|
|
#if 14==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 14<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r6,r7 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#0*4] @ from future BODY_16_xx
|
|
eor r12,r6,r7 @ a^b, b^c in next round
|
|
ldr r1,[sp,#13*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r6,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r9,r9,r5 @ d+=h
|
|
eor r3,r3,r7 @ Maj(a,b,c)
|
|
add r5,r5,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r5,r5,r3 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
@ ldr r2,[r1],#4 @ 15
|
|
# if 15==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r9,r9,ror#5
|
|
add r5,r5,r3 @ h+=Maj(a,b,c) from the past
|
|
eor r0,r0,r9,ror#19 @ Sigma1(e)
|
|
rev r2,r2
|
|
#else
|
|
@ ldrb r2,[r1,#3] @ 15
|
|
add r5,r5,r3 @ h+=Maj(a,b,c) from the past
|
|
ldrb r3,[r1,#2]
|
|
ldrb r0,[r1,#1]
|
|
orr r2,r2,r3,lsl#8
|
|
ldrb r3,[r1],#4
|
|
orr r2,r2,r0,lsl#16
|
|
# if 15==15
|
|
str r1,[sp,#17*4] @ make room for r1
|
|
# endif
|
|
eor r0,r9,r9,ror#5
|
|
orr r2,r2,r3,lsl#24
|
|
eor r0,r0,r9,ror#19 @ Sigma1(e)
|
|
#endif
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r4,r4,r2 @ h+=X[i]
|
|
str r2,[sp,#15*4]
|
|
eor r2,r10,r11
|
|
add r4,r4,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r9
|
|
add r4,r4,r3 @ h+=K256[i]
|
|
eor r2,r2,r11 @ Ch(e,f,g)
|
|
eor r0,r5,r5,ror#11
|
|
add r4,r4,r2 @ h+=Ch(e,f,g)
|
|
#if 15==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 15<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r5,r6 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#1*4] @ from future BODY_16_xx
|
|
eor r3,r5,r6 @ a^b, b^c in next round
|
|
ldr r1,[sp,#14*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r5,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r8,r8,r4 @ d+=h
|
|
eor r12,r12,r6 @ Maj(a,b,c)
|
|
add r4,r4,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r4,r4,r12 @ h+=Maj(a,b,c)
|
|
.Lrounds_16_xx:
|
|
@ ldr r2,[sp,#1*4] @ 16
|
|
@ ldr r1,[sp,#14*4]
|
|
mov r0,r2,ror#7
|
|
add r4,r4,r12 @ h+=Maj(a,b,c) from the past
|
|
mov r12,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r12,r12,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#0*4]
|
|
eor r12,r12,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#9*4]
|
|
|
|
add r12,r12,r0
|
|
eor r0,r8,r8,ror#5 @ from BODY_00_15
|
|
add r2,r2,r12
|
|
eor r0,r0,r8,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r11,r11,r2 @ h+=X[i]
|
|
str r2,[sp,#0*4]
|
|
eor r2,r9,r10
|
|
add r11,r11,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r8
|
|
add r11,r11,r12 @ h+=K256[i]
|
|
eor r2,r2,r10 @ Ch(e,f,g)
|
|
eor r0,r4,r4,ror#11
|
|
add r11,r11,r2 @ h+=Ch(e,f,g)
|
|
#if 16==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 16<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r4,r5 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#2*4] @ from future BODY_16_xx
|
|
eor r12,r4,r5 @ a^b, b^c in next round
|
|
ldr r1,[sp,#15*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r4,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r7,r7,r11 @ d+=h
|
|
eor r3,r3,r5 @ Maj(a,b,c)
|
|
add r11,r11,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r11,r11,r3 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#2*4] @ 17
|
|
@ ldr r1,[sp,#15*4]
|
|
mov r0,r2,ror#7
|
|
add r11,r11,r3 @ h+=Maj(a,b,c) from the past
|
|
mov r3,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r3,r3,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#1*4]
|
|
eor r3,r3,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#10*4]
|
|
|
|
add r3,r3,r0
|
|
eor r0,r7,r7,ror#5 @ from BODY_00_15
|
|
add r2,r2,r3
|
|
eor r0,r0,r7,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r10,r10,r2 @ h+=X[i]
|
|
str r2,[sp,#1*4]
|
|
eor r2,r8,r9
|
|
add r10,r10,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r7
|
|
add r10,r10,r3 @ h+=K256[i]
|
|
eor r2,r2,r9 @ Ch(e,f,g)
|
|
eor r0,r11,r11,ror#11
|
|
add r10,r10,r2 @ h+=Ch(e,f,g)
|
|
#if 17==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 17<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r11,r4 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#3*4] @ from future BODY_16_xx
|
|
eor r3,r11,r4 @ a^b, b^c in next round
|
|
ldr r1,[sp,#0*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r11,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r6,r6,r10 @ d+=h
|
|
eor r12,r12,r4 @ Maj(a,b,c)
|
|
add r10,r10,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r10,r10,r12 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#3*4] @ 18
|
|
@ ldr r1,[sp,#0*4]
|
|
mov r0,r2,ror#7
|
|
add r10,r10,r12 @ h+=Maj(a,b,c) from the past
|
|
mov r12,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r12,r12,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#2*4]
|
|
eor r12,r12,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#11*4]
|
|
|
|
add r12,r12,r0
|
|
eor r0,r6,r6,ror#5 @ from BODY_00_15
|
|
add r2,r2,r12
|
|
eor r0,r0,r6,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r9,r9,r2 @ h+=X[i]
|
|
str r2,[sp,#2*4]
|
|
eor r2,r7,r8
|
|
add r9,r9,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r6
|
|
add r9,r9,r12 @ h+=K256[i]
|
|
eor r2,r2,r8 @ Ch(e,f,g)
|
|
eor r0,r10,r10,ror#11
|
|
add r9,r9,r2 @ h+=Ch(e,f,g)
|
|
#if 18==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 18<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r10,r11 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#4*4] @ from future BODY_16_xx
|
|
eor r12,r10,r11 @ a^b, b^c in next round
|
|
ldr r1,[sp,#1*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r10,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r5,r5,r9 @ d+=h
|
|
eor r3,r3,r11 @ Maj(a,b,c)
|
|
add r9,r9,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r9,r9,r3 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#4*4] @ 19
|
|
@ ldr r1,[sp,#1*4]
|
|
mov r0,r2,ror#7
|
|
add r9,r9,r3 @ h+=Maj(a,b,c) from the past
|
|
mov r3,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r3,r3,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#3*4]
|
|
eor r3,r3,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#12*4]
|
|
|
|
add r3,r3,r0
|
|
eor r0,r5,r5,ror#5 @ from BODY_00_15
|
|
add r2,r2,r3
|
|
eor r0,r0,r5,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r8,r8,r2 @ h+=X[i]
|
|
str r2,[sp,#3*4]
|
|
eor r2,r6,r7
|
|
add r8,r8,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r5
|
|
add r8,r8,r3 @ h+=K256[i]
|
|
eor r2,r2,r7 @ Ch(e,f,g)
|
|
eor r0,r9,r9,ror#11
|
|
add r8,r8,r2 @ h+=Ch(e,f,g)
|
|
#if 19==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 19<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r9,r10 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#5*4] @ from future BODY_16_xx
|
|
eor r3,r9,r10 @ a^b, b^c in next round
|
|
ldr r1,[sp,#2*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r9,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r4,r4,r8 @ d+=h
|
|
eor r12,r12,r10 @ Maj(a,b,c)
|
|
add r8,r8,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r8,r8,r12 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#5*4] @ 20
|
|
@ ldr r1,[sp,#2*4]
|
|
mov r0,r2,ror#7
|
|
add r8,r8,r12 @ h+=Maj(a,b,c) from the past
|
|
mov r12,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r12,r12,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#4*4]
|
|
eor r12,r12,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#13*4]
|
|
|
|
add r12,r12,r0
|
|
eor r0,r4,r4,ror#5 @ from BODY_00_15
|
|
add r2,r2,r12
|
|
eor r0,r0,r4,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r7,r7,r2 @ h+=X[i]
|
|
str r2,[sp,#4*4]
|
|
eor r2,r5,r6
|
|
add r7,r7,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r4
|
|
add r7,r7,r12 @ h+=K256[i]
|
|
eor r2,r2,r6 @ Ch(e,f,g)
|
|
eor r0,r8,r8,ror#11
|
|
add r7,r7,r2 @ h+=Ch(e,f,g)
|
|
#if 20==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 20<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r8,r9 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#6*4] @ from future BODY_16_xx
|
|
eor r12,r8,r9 @ a^b, b^c in next round
|
|
ldr r1,[sp,#3*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r8,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r11,r11,r7 @ d+=h
|
|
eor r3,r3,r9 @ Maj(a,b,c)
|
|
add r7,r7,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r7,r7,r3 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#6*4] @ 21
|
|
@ ldr r1,[sp,#3*4]
|
|
mov r0,r2,ror#7
|
|
add r7,r7,r3 @ h+=Maj(a,b,c) from the past
|
|
mov r3,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r3,r3,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#5*4]
|
|
eor r3,r3,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#14*4]
|
|
|
|
add r3,r3,r0
|
|
eor r0,r11,r11,ror#5 @ from BODY_00_15
|
|
add r2,r2,r3
|
|
eor r0,r0,r11,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r6,r6,r2 @ h+=X[i]
|
|
str r2,[sp,#5*4]
|
|
eor r2,r4,r5
|
|
add r6,r6,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r11
|
|
add r6,r6,r3 @ h+=K256[i]
|
|
eor r2,r2,r5 @ Ch(e,f,g)
|
|
eor r0,r7,r7,ror#11
|
|
add r6,r6,r2 @ h+=Ch(e,f,g)
|
|
#if 21==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 21<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r7,r8 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#7*4] @ from future BODY_16_xx
|
|
eor r3,r7,r8 @ a^b, b^c in next round
|
|
ldr r1,[sp,#4*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r7,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r10,r10,r6 @ d+=h
|
|
eor r12,r12,r8 @ Maj(a,b,c)
|
|
add r6,r6,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r6,r6,r12 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#7*4] @ 22
|
|
@ ldr r1,[sp,#4*4]
|
|
mov r0,r2,ror#7
|
|
add r6,r6,r12 @ h+=Maj(a,b,c) from the past
|
|
mov r12,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r12,r12,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#6*4]
|
|
eor r12,r12,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#15*4]
|
|
|
|
add r12,r12,r0
|
|
eor r0,r10,r10,ror#5 @ from BODY_00_15
|
|
add r2,r2,r12
|
|
eor r0,r0,r10,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r5,r5,r2 @ h+=X[i]
|
|
str r2,[sp,#6*4]
|
|
eor r2,r11,r4
|
|
add r5,r5,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r10
|
|
add r5,r5,r12 @ h+=K256[i]
|
|
eor r2,r2,r4 @ Ch(e,f,g)
|
|
eor r0,r6,r6,ror#11
|
|
add r5,r5,r2 @ h+=Ch(e,f,g)
|
|
#if 22==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 22<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r6,r7 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#8*4] @ from future BODY_16_xx
|
|
eor r12,r6,r7 @ a^b, b^c in next round
|
|
ldr r1,[sp,#5*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r6,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r9,r9,r5 @ d+=h
|
|
eor r3,r3,r7 @ Maj(a,b,c)
|
|
add r5,r5,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r5,r5,r3 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#8*4] @ 23
|
|
@ ldr r1,[sp,#5*4]
|
|
mov r0,r2,ror#7
|
|
add r5,r5,r3 @ h+=Maj(a,b,c) from the past
|
|
mov r3,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r3,r3,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#7*4]
|
|
eor r3,r3,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#0*4]
|
|
|
|
add r3,r3,r0
|
|
eor r0,r9,r9,ror#5 @ from BODY_00_15
|
|
add r2,r2,r3
|
|
eor r0,r0,r9,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r4,r4,r2 @ h+=X[i]
|
|
str r2,[sp,#7*4]
|
|
eor r2,r10,r11
|
|
add r4,r4,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r9
|
|
add r4,r4,r3 @ h+=K256[i]
|
|
eor r2,r2,r11 @ Ch(e,f,g)
|
|
eor r0,r5,r5,ror#11
|
|
add r4,r4,r2 @ h+=Ch(e,f,g)
|
|
#if 23==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 23<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r5,r6 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#9*4] @ from future BODY_16_xx
|
|
eor r3,r5,r6 @ a^b, b^c in next round
|
|
ldr r1,[sp,#6*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r5,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r8,r8,r4 @ d+=h
|
|
eor r12,r12,r6 @ Maj(a,b,c)
|
|
add r4,r4,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r4,r4,r12 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#9*4] @ 24
|
|
@ ldr r1,[sp,#6*4]
|
|
mov r0,r2,ror#7
|
|
add r4,r4,r12 @ h+=Maj(a,b,c) from the past
|
|
mov r12,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r12,r12,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#8*4]
|
|
eor r12,r12,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#1*4]
|
|
|
|
add r12,r12,r0
|
|
eor r0,r8,r8,ror#5 @ from BODY_00_15
|
|
add r2,r2,r12
|
|
eor r0,r0,r8,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r11,r11,r2 @ h+=X[i]
|
|
str r2,[sp,#8*4]
|
|
eor r2,r9,r10
|
|
add r11,r11,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r8
|
|
add r11,r11,r12 @ h+=K256[i]
|
|
eor r2,r2,r10 @ Ch(e,f,g)
|
|
eor r0,r4,r4,ror#11
|
|
add r11,r11,r2 @ h+=Ch(e,f,g)
|
|
#if 24==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 24<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r4,r5 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#10*4] @ from future BODY_16_xx
|
|
eor r12,r4,r5 @ a^b, b^c in next round
|
|
ldr r1,[sp,#7*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r4,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r7,r7,r11 @ d+=h
|
|
eor r3,r3,r5 @ Maj(a,b,c)
|
|
add r11,r11,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r11,r11,r3 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#10*4] @ 25
|
|
@ ldr r1,[sp,#7*4]
|
|
mov r0,r2,ror#7
|
|
add r11,r11,r3 @ h+=Maj(a,b,c) from the past
|
|
mov r3,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r3,r3,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#9*4]
|
|
eor r3,r3,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#2*4]
|
|
|
|
add r3,r3,r0
|
|
eor r0,r7,r7,ror#5 @ from BODY_00_15
|
|
add r2,r2,r3
|
|
eor r0,r0,r7,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r10,r10,r2 @ h+=X[i]
|
|
str r2,[sp,#9*4]
|
|
eor r2,r8,r9
|
|
add r10,r10,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r7
|
|
add r10,r10,r3 @ h+=K256[i]
|
|
eor r2,r2,r9 @ Ch(e,f,g)
|
|
eor r0,r11,r11,ror#11
|
|
add r10,r10,r2 @ h+=Ch(e,f,g)
|
|
#if 25==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 25<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r11,r4 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#11*4] @ from future BODY_16_xx
|
|
eor r3,r11,r4 @ a^b, b^c in next round
|
|
ldr r1,[sp,#8*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r11,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r6,r6,r10 @ d+=h
|
|
eor r12,r12,r4 @ Maj(a,b,c)
|
|
add r10,r10,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r10,r10,r12 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#11*4] @ 26
|
|
@ ldr r1,[sp,#8*4]
|
|
mov r0,r2,ror#7
|
|
add r10,r10,r12 @ h+=Maj(a,b,c) from the past
|
|
mov r12,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r12,r12,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#10*4]
|
|
eor r12,r12,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#3*4]
|
|
|
|
add r12,r12,r0
|
|
eor r0,r6,r6,ror#5 @ from BODY_00_15
|
|
add r2,r2,r12
|
|
eor r0,r0,r6,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r9,r9,r2 @ h+=X[i]
|
|
str r2,[sp,#10*4]
|
|
eor r2,r7,r8
|
|
add r9,r9,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r6
|
|
add r9,r9,r12 @ h+=K256[i]
|
|
eor r2,r2,r8 @ Ch(e,f,g)
|
|
eor r0,r10,r10,ror#11
|
|
add r9,r9,r2 @ h+=Ch(e,f,g)
|
|
#if 26==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 26<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r10,r11 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#12*4] @ from future BODY_16_xx
|
|
eor r12,r10,r11 @ a^b, b^c in next round
|
|
ldr r1,[sp,#9*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r10,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r5,r5,r9 @ d+=h
|
|
eor r3,r3,r11 @ Maj(a,b,c)
|
|
add r9,r9,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r9,r9,r3 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#12*4] @ 27
|
|
@ ldr r1,[sp,#9*4]
|
|
mov r0,r2,ror#7
|
|
add r9,r9,r3 @ h+=Maj(a,b,c) from the past
|
|
mov r3,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r3,r3,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#11*4]
|
|
eor r3,r3,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#4*4]
|
|
|
|
add r3,r3,r0
|
|
eor r0,r5,r5,ror#5 @ from BODY_00_15
|
|
add r2,r2,r3
|
|
eor r0,r0,r5,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r8,r8,r2 @ h+=X[i]
|
|
str r2,[sp,#11*4]
|
|
eor r2,r6,r7
|
|
add r8,r8,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r5
|
|
add r8,r8,r3 @ h+=K256[i]
|
|
eor r2,r2,r7 @ Ch(e,f,g)
|
|
eor r0,r9,r9,ror#11
|
|
add r8,r8,r2 @ h+=Ch(e,f,g)
|
|
#if 27==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 27<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r9,r10 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#13*4] @ from future BODY_16_xx
|
|
eor r3,r9,r10 @ a^b, b^c in next round
|
|
ldr r1,[sp,#10*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r9,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r4,r4,r8 @ d+=h
|
|
eor r12,r12,r10 @ Maj(a,b,c)
|
|
add r8,r8,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r8,r8,r12 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#13*4] @ 28
|
|
@ ldr r1,[sp,#10*4]
|
|
mov r0,r2,ror#7
|
|
add r8,r8,r12 @ h+=Maj(a,b,c) from the past
|
|
mov r12,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r12,r12,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#12*4]
|
|
eor r12,r12,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#5*4]
|
|
|
|
add r12,r12,r0
|
|
eor r0,r4,r4,ror#5 @ from BODY_00_15
|
|
add r2,r2,r12
|
|
eor r0,r0,r4,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r7,r7,r2 @ h+=X[i]
|
|
str r2,[sp,#12*4]
|
|
eor r2,r5,r6
|
|
add r7,r7,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r4
|
|
add r7,r7,r12 @ h+=K256[i]
|
|
eor r2,r2,r6 @ Ch(e,f,g)
|
|
eor r0,r8,r8,ror#11
|
|
add r7,r7,r2 @ h+=Ch(e,f,g)
|
|
#if 28==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 28<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r8,r9 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#14*4] @ from future BODY_16_xx
|
|
eor r12,r8,r9 @ a^b, b^c in next round
|
|
ldr r1,[sp,#11*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r8,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r11,r11,r7 @ d+=h
|
|
eor r3,r3,r9 @ Maj(a,b,c)
|
|
add r7,r7,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r7,r7,r3 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#14*4] @ 29
|
|
@ ldr r1,[sp,#11*4]
|
|
mov r0,r2,ror#7
|
|
add r7,r7,r3 @ h+=Maj(a,b,c) from the past
|
|
mov r3,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r3,r3,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#13*4]
|
|
eor r3,r3,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#6*4]
|
|
|
|
add r3,r3,r0
|
|
eor r0,r11,r11,ror#5 @ from BODY_00_15
|
|
add r2,r2,r3
|
|
eor r0,r0,r11,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r6,r6,r2 @ h+=X[i]
|
|
str r2,[sp,#13*4]
|
|
eor r2,r4,r5
|
|
add r6,r6,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r11
|
|
add r6,r6,r3 @ h+=K256[i]
|
|
eor r2,r2,r5 @ Ch(e,f,g)
|
|
eor r0,r7,r7,ror#11
|
|
add r6,r6,r2 @ h+=Ch(e,f,g)
|
|
#if 29==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 29<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r7,r8 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#15*4] @ from future BODY_16_xx
|
|
eor r3,r7,r8 @ a^b, b^c in next round
|
|
ldr r1,[sp,#12*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r7,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r10,r10,r6 @ d+=h
|
|
eor r12,r12,r8 @ Maj(a,b,c)
|
|
add r6,r6,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r6,r6,r12 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#15*4] @ 30
|
|
@ ldr r1,[sp,#12*4]
|
|
mov r0,r2,ror#7
|
|
add r6,r6,r12 @ h+=Maj(a,b,c) from the past
|
|
mov r12,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r12,r12,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#14*4]
|
|
eor r12,r12,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#7*4]
|
|
|
|
add r12,r12,r0
|
|
eor r0,r10,r10,ror#5 @ from BODY_00_15
|
|
add r2,r2,r12
|
|
eor r0,r0,r10,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r12,[r14],#4 @ *K256++
|
|
add r5,r5,r2 @ h+=X[i]
|
|
str r2,[sp,#14*4]
|
|
eor r2,r11,r4
|
|
add r5,r5,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r10
|
|
add r5,r5,r12 @ h+=K256[i]
|
|
eor r2,r2,r4 @ Ch(e,f,g)
|
|
eor r0,r6,r6,ror#11
|
|
add r5,r5,r2 @ h+=Ch(e,f,g)
|
|
#if 30==31
|
|
and r12,r12,#0xff
|
|
cmp r12,#0xf2 @ done?
|
|
#endif
|
|
#if 30<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r12,r6,r7 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#0*4] @ from future BODY_16_xx
|
|
eor r12,r6,r7 @ a^b, b^c in next round
|
|
ldr r1,[sp,#13*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r6,ror#20 @ Sigma0(a)
|
|
and r3,r3,r12 @ (b^c)&=(a^b)
|
|
add r9,r9,r5 @ d+=h
|
|
eor r3,r3,r7 @ Maj(a,b,c)
|
|
add r5,r5,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r5,r5,r3 @ h+=Maj(a,b,c)
|
|
@ ldr r2,[sp,#0*4] @ 31
|
|
@ ldr r1,[sp,#13*4]
|
|
mov r0,r2,ror#7
|
|
add r5,r5,r3 @ h+=Maj(a,b,c) from the past
|
|
mov r3,r1,ror#17
|
|
eor r0,r0,r2,ror#18
|
|
eor r3,r3,r1,ror#19
|
|
eor r0,r0,r2,lsr#3 @ sigma0(X[i+1])
|
|
ldr r2,[sp,#15*4]
|
|
eor r3,r3,r1,lsr#10 @ sigma1(X[i+14])
|
|
ldr r1,[sp,#8*4]
|
|
|
|
add r3,r3,r0
|
|
eor r0,r9,r9,ror#5 @ from BODY_00_15
|
|
add r2,r2,r3
|
|
eor r0,r0,r9,ror#19 @ Sigma1(e)
|
|
add r2,r2,r1 @ X[i]
|
|
ldr r3,[r14],#4 @ *K256++
|
|
add r4,r4,r2 @ h+=X[i]
|
|
str r2,[sp,#15*4]
|
|
eor r2,r10,r11
|
|
add r4,r4,r0,ror#6 @ h+=Sigma1(e)
|
|
and r2,r2,r9
|
|
add r4,r4,r3 @ h+=K256[i]
|
|
eor r2,r2,r11 @ Ch(e,f,g)
|
|
eor r0,r5,r5,ror#11
|
|
add r4,r4,r2 @ h+=Ch(e,f,g)
|
|
#if 31==31
|
|
and r3,r3,#0xff
|
|
cmp r3,#0xf2 @ done?
|
|
#endif
|
|
#if 31<15
|
|
# if __ARM_ARCH__>=7
|
|
ldr r2,[r1],#4 @ prefetch
|
|
# else
|
|
ldrb r2,[r1,#3]
|
|
# endif
|
|
eor r3,r5,r6 @ a^b, b^c in next round
|
|
#else
|
|
ldr r2,[sp,#1*4] @ from future BODY_16_xx
|
|
eor r3,r5,r6 @ a^b, b^c in next round
|
|
ldr r1,[sp,#14*4] @ from future BODY_16_xx
|
|
#endif
|
|
eor r0,r0,r5,ror#20 @ Sigma0(a)
|
|
and r12,r12,r3 @ (b^c)&=(a^b)
|
|
add r8,r8,r4 @ d+=h
|
|
eor r12,r12,r6 @ Maj(a,b,c)
|
|
add r4,r4,r0,ror#2 @ h+=Sigma0(a)
|
|
@ add r4,r4,r12 @ h+=Maj(a,b,c)
|
|
#if __ARM_ARCH__>=7
|
|
ite eq @ Thumb2 thing, sanity check in ARM
|
|
#endif
|
|
ldreq r3,[sp,#16*4] @ pull ctx
|
|
bne .Lrounds_16_xx
|
|
|
|
add r4,r4,r12 @ h+=Maj(a,b,c) from the past
|
|
ldr r0,[r3,#0]
|
|
ldr r2,[r3,#4]
|
|
ldr r12,[r3,#8]
|
|
add r4,r4,r0
|
|
ldr r0,[r3,#12]
|
|
add r5,r5,r2
|
|
ldr r2,[r3,#16]
|
|
add r6,r6,r12
|
|
ldr r12,[r3,#20]
|
|
add r7,r7,r0
|
|
ldr r0,[r3,#24]
|
|
add r8,r8,r2
|
|
ldr r2,[r3,#28]
|
|
add r9,r9,r12
|
|
ldr r1,[sp,#17*4] @ pull inp
|
|
ldr r12,[sp,#18*4] @ pull inp+len
|
|
add r10,r10,r0
|
|
add r11,r11,r2
|
|
stmia r3,{r4,r5,r6,r7,r8,r9,r10,r11}
|
|
cmp r1,r12
|
|
sub r14,r14,#256 @ rewind Ktbl
|
|
bne .Loop
|
|
|
|
add sp,sp,#19*4 @ destroy frame
|
|
#if __ARM_ARCH__>=5
|
|
ldmia sp!,{r4-r11,pc}
|
|
#else
|
|
ldmia sp!,{r4-r11,lr}
|
|
tst lr,#1
|
|
moveq pc,lr @ be binary compatible with V4, yet
|
|
.word 0xe12fff1e @ interoperable with Thumb ISA:-)
|
|
#endif
|
|
.size sha256_block_data_order,.-sha256_block_data_order
|
|
#if __ARM_MAX_ARCH__>=7
|
|
.arch armv7-a
|
|
.fpu neon
|
|
|
|
.global sha256_block_data_order_neon
|
|
.type sha256_block_data_order_neon,%function
|
|
.align 4
|
|
sha256_block_data_order_neon:
|
|
.LNEON:
|
|
stmdb sp!,{r4-r12,lr}
|
|
|
|
sub r11,sp,#16*4+16
|
|
adr r14,K256
|
|
bic r11,r11,#15 @ align for 128-bit stores
|
|
mov r12,sp
|
|
mov sp,r11 @ alloca
|
|
add r2,r1,r2,lsl#6 @ len to point at the end of inp
|
|
|
|
vld1.8 {q0},[r1]!
|
|
vld1.8 {q1},[r1]!
|
|
vld1.8 {q2},[r1]!
|
|
vld1.8 {q3},[r1]!
|
|
vld1.32 {q8},[r14,:128]!
|
|
vld1.32 {q9},[r14,:128]!
|
|
vld1.32 {q10},[r14,:128]!
|
|
vld1.32 {q11},[r14,:128]!
|
|
vrev32.8 q0,q0 @ yes, even on
|
|
str r0,[sp,#64]
|
|
vrev32.8 q1,q1 @ big-endian
|
|
str r1,[sp,#68]
|
|
mov r1,sp
|
|
vrev32.8 q2,q2
|
|
str r2,[sp,#72]
|
|
vrev32.8 q3,q3
|
|
str r12,[sp,#76] @ save original sp
|
|
vadd.i32 q8,q8,q0
|
|
vadd.i32 q9,q9,q1
|
|
vst1.32 {q8},[r1,:128]!
|
|
vadd.i32 q10,q10,q2
|
|
vst1.32 {q9},[r1,:128]!
|
|
vadd.i32 q11,q11,q3
|
|
vst1.32 {q10},[r1,:128]!
|
|
vst1.32 {q11},[r1,:128]!
|
|
|
|
ldmia r0,{r4-r11}
|
|
sub r1,r1,#64
|
|
ldr r2,[sp,#0]
|
|
eor r12,r12,r12
|
|
eor r3,r5,r6
|
|
b .L_00_48
|
|
|
|
.align 4
|
|
.L_00_48:
|
|
vext.8 q8,q0,q1,#4
|
|
add r11,r11,r2
|
|
eor r2,r9,r10
|
|
eor r0,r8,r8,ror#5
|
|
vext.8 q9,q2,q3,#4
|
|
add r4,r4,r12
|
|
and r2,r2,r8
|
|
eor r12,r0,r8,ror#19
|
|
vshr.u32 q10,q8,#7
|
|
eor r0,r4,r4,ror#11
|
|
eor r2,r2,r10
|
|
vadd.i32 q0,q0,q9
|
|
add r11,r11,r12,ror#6
|
|
eor r12,r4,r5
|
|
vshr.u32 q9,q8,#3
|
|
eor r0,r0,r4,ror#20
|
|
add r11,r11,r2
|
|
vsli.32 q10,q8,#25
|
|
ldr r2,[sp,#4]
|
|
and r3,r3,r12
|
|
vshr.u32 q11,q8,#18
|
|
add r7,r7,r11
|
|
add r11,r11,r0,ror#2
|
|
eor r3,r3,r5
|
|
veor q9,q9,q10
|
|
add r10,r10,r2
|
|
vsli.32 q11,q8,#14
|
|
eor r2,r8,r9
|
|
eor r0,r7,r7,ror#5
|
|
vshr.u32 d24,d7,#17
|
|
add r11,r11,r3
|
|
and r2,r2,r7
|
|
veor q9,q9,q11
|
|
eor r3,r0,r7,ror#19
|
|
eor r0,r11,r11,ror#11
|
|
vsli.32 d24,d7,#15
|
|
eor r2,r2,r9
|
|
add r10,r10,r3,ror#6
|
|
vshr.u32 d25,d7,#10
|
|
eor r3,r11,r4
|
|
eor r0,r0,r11,ror#20
|
|
vadd.i32 q0,q0,q9
|
|
add r10,r10,r2
|
|
ldr r2,[sp,#8]
|
|
veor d25,d25,d24
|
|
and r12,r12,r3
|
|
add r6,r6,r10
|
|
vshr.u32 d24,d7,#19
|
|
add r10,r10,r0,ror#2
|
|
eor r12,r12,r4
|
|
vsli.32 d24,d7,#13
|
|
add r9,r9,r2
|
|
eor r2,r7,r8
|
|
veor d25,d25,d24
|
|
eor r0,r6,r6,ror#5
|
|
add r10,r10,r12
|
|
vadd.i32 d0,d0,d25
|
|
and r2,r2,r6
|
|
eor r12,r0,r6,ror#19
|
|
vshr.u32 d24,d0,#17
|
|
eor r0,r10,r10,ror#11
|
|
eor r2,r2,r8
|
|
vsli.32 d24,d0,#15
|
|
add r9,r9,r12,ror#6
|
|
eor r12,r10,r11
|
|
vshr.u32 d25,d0,#10
|
|
eor r0,r0,r10,ror#20
|
|
add r9,r9,r2
|
|
veor d25,d25,d24
|
|
ldr r2,[sp,#12]
|
|
and r3,r3,r12
|
|
vshr.u32 d24,d0,#19
|
|
add r5,r5,r9
|
|
add r9,r9,r0,ror#2
|
|
eor r3,r3,r11
|
|
vld1.32 {q8},[r14,:128]!
|
|
add r8,r8,r2
|
|
vsli.32 d24,d0,#13
|
|
eor r2,r6,r7
|
|
eor r0,r5,r5,ror#5
|
|
veor d25,d25,d24
|
|
add r9,r9,r3
|
|
and r2,r2,r5
|
|
vadd.i32 d1,d1,d25
|
|
eor r3,r0,r5,ror#19
|
|
eor r0,r9,r9,ror#11
|
|
vadd.i32 q8,q8,q0
|
|
eor r2,r2,r7
|
|
add r8,r8,r3,ror#6
|
|
eor r3,r9,r10
|
|
eor r0,r0,r9,ror#20
|
|
add r8,r8,r2
|
|
ldr r2,[sp,#16]
|
|
and r12,r12,r3
|
|
add r4,r4,r8
|
|
vst1.32 {q8},[r1,:128]!
|
|
add r8,r8,r0,ror#2
|
|
eor r12,r12,r10
|
|
vext.8 q8,q1,q2,#4
|
|
add r7,r7,r2
|
|
eor r2,r5,r6
|
|
eor r0,r4,r4,ror#5
|
|
vext.8 q9,q3,q0,#4
|
|
add r8,r8,r12
|
|
and r2,r2,r4
|
|
eor r12,r0,r4,ror#19
|
|
vshr.u32 q10,q8,#7
|
|
eor r0,r8,r8,ror#11
|
|
eor r2,r2,r6
|
|
vadd.i32 q1,q1,q9
|
|
add r7,r7,r12,ror#6
|
|
eor r12,r8,r9
|
|
vshr.u32 q9,q8,#3
|
|
eor r0,r0,r8,ror#20
|
|
add r7,r7,r2
|
|
vsli.32 q10,q8,#25
|
|
ldr r2,[sp,#20]
|
|
and r3,r3,r12
|
|
vshr.u32 q11,q8,#18
|
|
add r11,r11,r7
|
|
add r7,r7,r0,ror#2
|
|
eor r3,r3,r9
|
|
veor q9,q9,q10
|
|
add r6,r6,r2
|
|
vsli.32 q11,q8,#14
|
|
eor r2,r4,r5
|
|
eor r0,r11,r11,ror#5
|
|
vshr.u32 d24,d1,#17
|
|
add r7,r7,r3
|
|
and r2,r2,r11
|
|
veor q9,q9,q11
|
|
eor r3,r0,r11,ror#19
|
|
eor r0,r7,r7,ror#11
|
|
vsli.32 d24,d1,#15
|
|
eor r2,r2,r5
|
|
add r6,r6,r3,ror#6
|
|
vshr.u32 d25,d1,#10
|
|
eor r3,r7,r8
|
|
eor r0,r0,r7,ror#20
|
|
vadd.i32 q1,q1,q9
|
|
add r6,r6,r2
|
|
ldr r2,[sp,#24]
|
|
veor d25,d25,d24
|
|
and r12,r12,r3
|
|
add r10,r10,r6
|
|
vshr.u32 d24,d1,#19
|
|
add r6,r6,r0,ror#2
|
|
eor r12,r12,r8
|
|
vsli.32 d24,d1,#13
|
|
add r5,r5,r2
|
|
eor r2,r11,r4
|
|
veor d25,d25,d24
|
|
eor r0,r10,r10,ror#5
|
|
add r6,r6,r12
|
|
vadd.i32 d2,d2,d25
|
|
and r2,r2,r10
|
|
eor r12,r0,r10,ror#19
|
|
vshr.u32 d24,d2,#17
|
|
eor r0,r6,r6,ror#11
|
|
eor r2,r2,r4
|
|
vsli.32 d24,d2,#15
|
|
add r5,r5,r12,ror#6
|
|
eor r12,r6,r7
|
|
vshr.u32 d25,d2,#10
|
|
eor r0,r0,r6,ror#20
|
|
add r5,r5,r2
|
|
veor d25,d25,d24
|
|
ldr r2,[sp,#28]
|
|
and r3,r3,r12
|
|
vshr.u32 d24,d2,#19
|
|
add r9,r9,r5
|
|
add r5,r5,r0,ror#2
|
|
eor r3,r3,r7
|
|
vld1.32 {q8},[r14,:128]!
|
|
add r4,r4,r2
|
|
vsli.32 d24,d2,#13
|
|
eor r2,r10,r11
|
|
eor r0,r9,r9,ror#5
|
|
veor d25,d25,d24
|
|
add r5,r5,r3
|
|
and r2,r2,r9
|
|
vadd.i32 d3,d3,d25
|
|
eor r3,r0,r9,ror#19
|
|
eor r0,r5,r5,ror#11
|
|
vadd.i32 q8,q8,q1
|
|
eor r2,r2,r11
|
|
add r4,r4,r3,ror#6
|
|
eor r3,r5,r6
|
|
eor r0,r0,r5,ror#20
|
|
add r4,r4,r2
|
|
ldr r2,[sp,#32]
|
|
and r12,r12,r3
|
|
add r8,r8,r4
|
|
vst1.32 {q8},[r1,:128]!
|
|
add r4,r4,r0,ror#2
|
|
eor r12,r12,r6
|
|
vext.8 q8,q2,q3,#4
|
|
add r11,r11,r2
|
|
eor r2,r9,r10
|
|
eor r0,r8,r8,ror#5
|
|
vext.8 q9,q0,q1,#4
|
|
add r4,r4,r12
|
|
and r2,r2,r8
|
|
eor r12,r0,r8,ror#19
|
|
vshr.u32 q10,q8,#7
|
|
eor r0,r4,r4,ror#11
|
|
eor r2,r2,r10
|
|
vadd.i32 q2,q2,q9
|
|
add r11,r11,r12,ror#6
|
|
eor r12,r4,r5
|
|
vshr.u32 q9,q8,#3
|
|
eor r0,r0,r4,ror#20
|
|
add r11,r11,r2
|
|
vsli.32 q10,q8,#25
|
|
ldr r2,[sp,#36]
|
|
and r3,r3,r12
|
|
vshr.u32 q11,q8,#18
|
|
add r7,r7,r11
|
|
add r11,r11,r0,ror#2
|
|
eor r3,r3,r5
|
|
veor q9,q9,q10
|
|
add r10,r10,r2
|
|
vsli.32 q11,q8,#14
|
|
eor r2,r8,r9
|
|
eor r0,r7,r7,ror#5
|
|
vshr.u32 d24,d3,#17
|
|
add r11,r11,r3
|
|
and r2,r2,r7
|
|
veor q9,q9,q11
|
|
eor r3,r0,r7,ror#19
|
|
eor r0,r11,r11,ror#11
|
|
vsli.32 d24,d3,#15
|
|
eor r2,r2,r9
|
|
add r10,r10,r3,ror#6
|
|
vshr.u32 d25,d3,#10
|
|
eor r3,r11,r4
|
|
eor r0,r0,r11,ror#20
|
|
vadd.i32 q2,q2,q9
|
|
add r10,r10,r2
|
|
ldr r2,[sp,#40]
|
|
veor d25,d25,d24
|
|
and r12,r12,r3
|
|
add r6,r6,r10
|
|
vshr.u32 d24,d3,#19
|
|
add r10,r10,r0,ror#2
|
|
eor r12,r12,r4
|
|
vsli.32 d24,d3,#13
|
|
add r9,r9,r2
|
|
eor r2,r7,r8
|
|
veor d25,d25,d24
|
|
eor r0,r6,r6,ror#5
|
|
add r10,r10,r12
|
|
vadd.i32 d4,d4,d25
|
|
and r2,r2,r6
|
|
eor r12,r0,r6,ror#19
|
|
vshr.u32 d24,d4,#17
|
|
eor r0,r10,r10,ror#11
|
|
eor r2,r2,r8
|
|
vsli.32 d24,d4,#15
|
|
add r9,r9,r12,ror#6
|
|
eor r12,r10,r11
|
|
vshr.u32 d25,d4,#10
|
|
eor r0,r0,r10,ror#20
|
|
add r9,r9,r2
|
|
veor d25,d25,d24
|
|
ldr r2,[sp,#44]
|
|
and r3,r3,r12
|
|
vshr.u32 d24,d4,#19
|
|
add r5,r5,r9
|
|
add r9,r9,r0,ror#2
|
|
eor r3,r3,r11
|
|
vld1.32 {q8},[r14,:128]!
|
|
add r8,r8,r2
|
|
vsli.32 d24,d4,#13
|
|
eor r2,r6,r7
|
|
eor r0,r5,r5,ror#5
|
|
veor d25,d25,d24
|
|
add r9,r9,r3
|
|
and r2,r2,r5
|
|
vadd.i32 d5,d5,d25
|
|
eor r3,r0,r5,ror#19
|
|
eor r0,r9,r9,ror#11
|
|
vadd.i32 q8,q8,q2
|
|
eor r2,r2,r7
|
|
add r8,r8,r3,ror#6
|
|
eor r3,r9,r10
|
|
eor r0,r0,r9,ror#20
|
|
add r8,r8,r2
|
|
ldr r2,[sp,#48]
|
|
and r12,r12,r3
|
|
add r4,r4,r8
|
|
vst1.32 {q8},[r1,:128]!
|
|
add r8,r8,r0,ror#2
|
|
eor r12,r12,r10
|
|
vext.8 q8,q3,q0,#4
|
|
add r7,r7,r2
|
|
eor r2,r5,r6
|
|
eor r0,r4,r4,ror#5
|
|
vext.8 q9,q1,q2,#4
|
|
add r8,r8,r12
|
|
and r2,r2,r4
|
|
eor r12,r0,r4,ror#19
|
|
vshr.u32 q10,q8,#7
|
|
eor r0,r8,r8,ror#11
|
|
eor r2,r2,r6
|
|
vadd.i32 q3,q3,q9
|
|
add r7,r7,r12,ror#6
|
|
eor r12,r8,r9
|
|
vshr.u32 q9,q8,#3
|
|
eor r0,r0,r8,ror#20
|
|
add r7,r7,r2
|
|
vsli.32 q10,q8,#25
|
|
ldr r2,[sp,#52]
|
|
and r3,r3,r12
|
|
vshr.u32 q11,q8,#18
|
|
add r11,r11,r7
|
|
add r7,r7,r0,ror#2
|
|
eor r3,r3,r9
|
|
veor q9,q9,q10
|
|
add r6,r6,r2
|
|
vsli.32 q11,q8,#14
|
|
eor r2,r4,r5
|
|
eor r0,r11,r11,ror#5
|
|
vshr.u32 d24,d5,#17
|
|
add r7,r7,r3
|
|
and r2,r2,r11
|
|
veor q9,q9,q11
|
|
eor r3,r0,r11,ror#19
|
|
eor r0,r7,r7,ror#11
|
|
vsli.32 d24,d5,#15
|
|
eor r2,r2,r5
|
|
add r6,r6,r3,ror#6
|
|
vshr.u32 d25,d5,#10
|
|
eor r3,r7,r8
|
|
eor r0,r0,r7,ror#20
|
|
vadd.i32 q3,q3,q9
|
|
add r6,r6,r2
|
|
ldr r2,[sp,#56]
|
|
veor d25,d25,d24
|
|
and r12,r12,r3
|
|
add r10,r10,r6
|
|
vshr.u32 d24,d5,#19
|
|
add r6,r6,r0,ror#2
|
|
eor r12,r12,r8
|
|
vsli.32 d24,d5,#13
|
|
add r5,r5,r2
|
|
eor r2,r11,r4
|
|
veor d25,d25,d24
|
|
eor r0,r10,r10,ror#5
|
|
add r6,r6,r12
|
|
vadd.i32 d6,d6,d25
|
|
and r2,r2,r10
|
|
eor r12,r0,r10,ror#19
|
|
vshr.u32 d24,d6,#17
|
|
eor r0,r6,r6,ror#11
|
|
eor r2,r2,r4
|
|
vsli.32 d24,d6,#15
|
|
add r5,r5,r12,ror#6
|
|
eor r12,r6,r7
|
|
vshr.u32 d25,d6,#10
|
|
eor r0,r0,r6,ror#20
|
|
add r5,r5,r2
|
|
veor d25,d25,d24
|
|
ldr r2,[sp,#60]
|
|
and r3,r3,r12
|
|
vshr.u32 d24,d6,#19
|
|
add r9,r9,r5
|
|
add r5,r5,r0,ror#2
|
|
eor r3,r3,r7
|
|
vld1.32 {q8},[r14,:128]!
|
|
add r4,r4,r2
|
|
vsli.32 d24,d6,#13
|
|
eor r2,r10,r11
|
|
eor r0,r9,r9,ror#5
|
|
veor d25,d25,d24
|
|
add r5,r5,r3
|
|
and r2,r2,r9
|
|
vadd.i32 d7,d7,d25
|
|
eor r3,r0,r9,ror#19
|
|
eor r0,r5,r5,ror#11
|
|
vadd.i32 q8,q8,q3
|
|
eor r2,r2,r11
|
|
add r4,r4,r3,ror#6
|
|
eor r3,r5,r6
|
|
eor r0,r0,r5,ror#20
|
|
add r4,r4,r2
|
|
ldr r2,[r14]
|
|
and r12,r12,r3
|
|
add r8,r8,r4
|
|
vst1.32 {q8},[r1,:128]!
|
|
add r4,r4,r0,ror#2
|
|
eor r12,r12,r6
|
|
teq r2,#0 @ check for K256 terminator
|
|
ldr r2,[sp,#0]
|
|
sub r1,r1,#64
|
|
bne .L_00_48
|
|
|
|
ldr r1,[sp,#68]
|
|
ldr r0,[sp,#72]
|
|
sub r14,r14,#256 @ rewind r14
|
|
teq r1,r0
|
|
it eq
|
|
subeq r1,r1,#64 @ avoid SEGV
|
|
vld1.8 {q0},[r1]! @ load next input block
|
|
vld1.8 {q1},[r1]!
|
|
vld1.8 {q2},[r1]!
|
|
vld1.8 {q3},[r1]!
|
|
it ne
|
|
strne r1,[sp,#68]
|
|
mov r1,sp
|
|
add r11,r11,r2
|
|
eor r2,r9,r10
|
|
eor r0,r8,r8,ror#5
|
|
add r4,r4,r12
|
|
vld1.32 {q8},[r14,:128]!
|
|
and r2,r2,r8
|
|
eor r12,r0,r8,ror#19
|
|
eor r0,r4,r4,ror#11
|
|
eor r2,r2,r10
|
|
vrev32.8 q0,q0
|
|
add r11,r11,r12,ror#6
|
|
eor r12,r4,r5
|
|
eor r0,r0,r4,ror#20
|
|
add r11,r11,r2
|
|
vadd.i32 q8,q8,q0
|
|
ldr r2,[sp,#4]
|
|
and r3,r3,r12
|
|
add r7,r7,r11
|
|
add r11,r11,r0,ror#2
|
|
eor r3,r3,r5
|
|
add r10,r10,r2
|
|
eor r2,r8,r9
|
|
eor r0,r7,r7,ror#5
|
|
add r11,r11,r3
|
|
and r2,r2,r7
|
|
eor r3,r0,r7,ror#19
|
|
eor r0,r11,r11,ror#11
|
|
eor r2,r2,r9
|
|
add r10,r10,r3,ror#6
|
|
eor r3,r11,r4
|
|
eor r0,r0,r11,ror#20
|
|
add r10,r10,r2
|
|
ldr r2,[sp,#8]
|
|
and r12,r12,r3
|
|
add r6,r6,r10
|
|
add r10,r10,r0,ror#2
|
|
eor r12,r12,r4
|
|
add r9,r9,r2
|
|
eor r2,r7,r8
|
|
eor r0,r6,r6,ror#5
|
|
add r10,r10,r12
|
|
and r2,r2,r6
|
|
eor r12,r0,r6,ror#19
|
|
eor r0,r10,r10,ror#11
|
|
eor r2,r2,r8
|
|
add r9,r9,r12,ror#6
|
|
eor r12,r10,r11
|
|
eor r0,r0,r10,ror#20
|
|
add r9,r9,r2
|
|
ldr r2,[sp,#12]
|
|
and r3,r3,r12
|
|
add r5,r5,r9
|
|
add r9,r9,r0,ror#2
|
|
eor r3,r3,r11
|
|
add r8,r8,r2
|
|
eor r2,r6,r7
|
|
eor r0,r5,r5,ror#5
|
|
add r9,r9,r3
|
|
and r2,r2,r5
|
|
eor r3,r0,r5,ror#19
|
|
eor r0,r9,r9,ror#11
|
|
eor r2,r2,r7
|
|
add r8,r8,r3,ror#6
|
|
eor r3,r9,r10
|
|
eor r0,r0,r9,ror#20
|
|
add r8,r8,r2
|
|
ldr r2,[sp,#16]
|
|
and r12,r12,r3
|
|
add r4,r4,r8
|
|
add r8,r8,r0,ror#2
|
|
eor r12,r12,r10
|
|
vst1.32 {q8},[r1,:128]!
|
|
add r7,r7,r2
|
|
eor r2,r5,r6
|
|
eor r0,r4,r4,ror#5
|
|
add r8,r8,r12
|
|
vld1.32 {q8},[r14,:128]!
|
|
and r2,r2,r4
|
|
eor r12,r0,r4,ror#19
|
|
eor r0,r8,r8,ror#11
|
|
eor r2,r2,r6
|
|
vrev32.8 q1,q1
|
|
add r7,r7,r12,ror#6
|
|
eor r12,r8,r9
|
|
eor r0,r0,r8,ror#20
|
|
add r7,r7,r2
|
|
vadd.i32 q8,q8,q1
|
|
ldr r2,[sp,#20]
|
|
and r3,r3,r12
|
|
add r11,r11,r7
|
|
add r7,r7,r0,ror#2
|
|
eor r3,r3,r9
|
|
add r6,r6,r2
|
|
eor r2,r4,r5
|
|
eor r0,r11,r11,ror#5
|
|
add r7,r7,r3
|
|
and r2,r2,r11
|
|
eor r3,r0,r11,ror#19
|
|
eor r0,r7,r7,ror#11
|
|
eor r2,r2,r5
|
|
add r6,r6,r3,ror#6
|
|
eor r3,r7,r8
|
|
eor r0,r0,r7,ror#20
|
|
add r6,r6,r2
|
|
ldr r2,[sp,#24]
|
|
and r12,r12,r3
|
|
add r10,r10,r6
|
|
add r6,r6,r0,ror#2
|
|
eor r12,r12,r8
|
|
add r5,r5,r2
|
|
eor r2,r11,r4
|
|
eor r0,r10,r10,ror#5
|
|
add r6,r6,r12
|
|
and r2,r2,r10
|
|
eor r12,r0,r10,ror#19
|
|
eor r0,r6,r6,ror#11
|
|
eor r2,r2,r4
|
|
add r5,r5,r12,ror#6
|
|
eor r12,r6,r7
|
|
eor r0,r0,r6,ror#20
|
|
add r5,r5,r2
|
|
ldr r2,[sp,#28]
|
|
and r3,r3,r12
|
|
add r9,r9,r5
|
|
add r5,r5,r0,ror#2
|
|
eor r3,r3,r7
|
|
add r4,r4,r2
|
|
eor r2,r10,r11
|
|
eor r0,r9,r9,ror#5
|
|
add r5,r5,r3
|
|
and r2,r2,r9
|
|
eor r3,r0,r9,ror#19
|
|
eor r0,r5,r5,ror#11
|
|
eor r2,r2,r11
|
|
add r4,r4,r3,ror#6
|
|
eor r3,r5,r6
|
|
eor r0,r0,r5,ror#20
|
|
add r4,r4,r2
|
|
ldr r2,[sp,#32]
|
|
and r12,r12,r3
|
|
add r8,r8,r4
|
|
add r4,r4,r0,ror#2
|
|
eor r12,r12,r6
|
|
vst1.32 {q8},[r1,:128]!
|
|
add r11,r11,r2
|
|
eor r2,r9,r10
|
|
eor r0,r8,r8,ror#5
|
|
add r4,r4,r12
|
|
vld1.32 {q8},[r14,:128]!
|
|
and r2,r2,r8
|
|
eor r12,r0,r8,ror#19
|
|
eor r0,r4,r4,ror#11
|
|
eor r2,r2,r10
|
|
vrev32.8 q2,q2
|
|
add r11,r11,r12,ror#6
|
|
eor r12,r4,r5
|
|
eor r0,r0,r4,ror#20
|
|
add r11,r11,r2
|
|
vadd.i32 q8,q8,q2
|
|
ldr r2,[sp,#36]
|
|
and r3,r3,r12
|
|
add r7,r7,r11
|
|
add r11,r11,r0,ror#2
|
|
eor r3,r3,r5
|
|
add r10,r10,r2
|
|
eor r2,r8,r9
|
|
eor r0,r7,r7,ror#5
|
|
add r11,r11,r3
|
|
and r2,r2,r7
|
|
eor r3,r0,r7,ror#19
|
|
eor r0,r11,r11,ror#11
|
|
eor r2,r2,r9
|
|
add r10,r10,r3,ror#6
|
|
eor r3,r11,r4
|
|
eor r0,r0,r11,ror#20
|
|
add r10,r10,r2
|
|
ldr r2,[sp,#40]
|
|
and r12,r12,r3
|
|
add r6,r6,r10
|
|
add r10,r10,r0,ror#2
|
|
eor r12,r12,r4
|
|
add r9,r9,r2
|
|
eor r2,r7,r8
|
|
eor r0,r6,r6,ror#5
|
|
add r10,r10,r12
|
|
and r2,r2,r6
|
|
eor r12,r0,r6,ror#19
|
|
eor r0,r10,r10,ror#11
|
|
eor r2,r2,r8
|
|
add r9,r9,r12,ror#6
|
|
eor r12,r10,r11
|
|
eor r0,r0,r10,ror#20
|
|
add r9,r9,r2
|
|
ldr r2,[sp,#44]
|
|
and r3,r3,r12
|
|
add r5,r5,r9
|
|
add r9,r9,r0,ror#2
|
|
eor r3,r3,r11
|
|
add r8,r8,r2
|
|
eor r2,r6,r7
|
|
eor r0,r5,r5,ror#5
|
|
add r9,r9,r3
|
|
and r2,r2,r5
|
|
eor r3,r0,r5,ror#19
|
|
eor r0,r9,r9,ror#11
|
|
eor r2,r2,r7
|
|
add r8,r8,r3,ror#6
|
|
eor r3,r9,r10
|
|
eor r0,r0,r9,ror#20
|
|
add r8,r8,r2
|
|
ldr r2,[sp,#48]
|
|
and r12,r12,r3
|
|
add r4,r4,r8
|
|
add r8,r8,r0,ror#2
|
|
eor r12,r12,r10
|
|
vst1.32 {q8},[r1,:128]!
|
|
add r7,r7,r2
|
|
eor r2,r5,r6
|
|
eor r0,r4,r4,ror#5
|
|
add r8,r8,r12
|
|
vld1.32 {q8},[r14,:128]!
|
|
and r2,r2,r4
|
|
eor r12,r0,r4,ror#19
|
|
eor r0,r8,r8,ror#11
|
|
eor r2,r2,r6
|
|
vrev32.8 q3,q3
|
|
add r7,r7,r12,ror#6
|
|
eor r12,r8,r9
|
|
eor r0,r0,r8,ror#20
|
|
add r7,r7,r2
|
|
vadd.i32 q8,q8,q3
|
|
ldr r2,[sp,#52]
|
|
and r3,r3,r12
|
|
add r11,r11,r7
|
|
add r7,r7,r0,ror#2
|
|
eor r3,r3,r9
|
|
add r6,r6,r2
|
|
eor r2,r4,r5
|
|
eor r0,r11,r11,ror#5
|
|
add r7,r7,r3
|
|
and r2,r2,r11
|
|
eor r3,r0,r11,ror#19
|
|
eor r0,r7,r7,ror#11
|
|
eor r2,r2,r5
|
|
add r6,r6,r3,ror#6
|
|
eor r3,r7,r8
|
|
eor r0,r0,r7,ror#20
|
|
add r6,r6,r2
|
|
ldr r2,[sp,#56]
|
|
and r12,r12,r3
|
|
add r10,r10,r6
|
|
add r6,r6,r0,ror#2
|
|
eor r12,r12,r8
|
|
add r5,r5,r2
|
|
eor r2,r11,r4
|
|
eor r0,r10,r10,ror#5
|
|
add r6,r6,r12
|
|
and r2,r2,r10
|
|
eor r12,r0,r10,ror#19
|
|
eor r0,r6,r6,ror#11
|
|
eor r2,r2,r4
|
|
add r5,r5,r12,ror#6
|
|
eor r12,r6,r7
|
|
eor r0,r0,r6,ror#20
|
|
add r5,r5,r2
|
|
ldr r2,[sp,#60]
|
|
and r3,r3,r12
|
|
add r9,r9,r5
|
|
add r5,r5,r0,ror#2
|
|
eor r3,r3,r7
|
|
add r4,r4,r2
|
|
eor r2,r10,r11
|
|
eor r0,r9,r9,ror#5
|
|
add r5,r5,r3
|
|
and r2,r2,r9
|
|
eor r3,r0,r9,ror#19
|
|
eor r0,r5,r5,ror#11
|
|
eor r2,r2,r11
|
|
add r4,r4,r3,ror#6
|
|
eor r3,r5,r6
|
|
eor r0,r0,r5,ror#20
|
|
add r4,r4,r2
|
|
ldr r2,[sp,#64]
|
|
and r12,r12,r3
|
|
add r8,r8,r4
|
|
add r4,r4,r0,ror#2
|
|
eor r12,r12,r6
|
|
vst1.32 {q8},[r1,:128]!
|
|
ldr r0,[r2,#0]
|
|
add r4,r4,r12 @ h+=Maj(a,b,c) from the past
|
|
ldr r12,[r2,#4]
|
|
ldr r3,[r2,#8]
|
|
ldr r1,[r2,#12]
|
|
add r4,r4,r0 @ accumulate
|
|
ldr r0,[r2,#16]
|
|
add r5,r5,r12
|
|
ldr r12,[r2,#20]
|
|
add r6,r6,r3
|
|
ldr r3,[r2,#24]
|
|
add r7,r7,r1
|
|
ldr r1,[r2,#28]
|
|
add r8,r8,r0
|
|
str r4,[r2],#4
|
|
add r9,r9,r12
|
|
str r5,[r2],#4
|
|
add r10,r10,r3
|
|
str r6,[r2],#4
|
|
add r11,r11,r1
|
|
str r7,[r2],#4
|
|
stmia r2,{r8-r11}
|
|
|
|
ittte ne
|
|
movne r1,sp
|
|
ldrne r2,[sp,#0]
|
|
eorne r12,r12,r12
|
|
ldreq sp,[sp,#76] @ restore original sp
|
|
itt ne
|
|
eorne r3,r5,r6
|
|
bne .L_00_48
|
|
|
|
ldmia sp!,{r4-r12,pc}
|
|
.size sha256_block_data_order_neon,.-sha256_block_data_order_neon
|
|
#endif
|
|
#if __ARM_MAX_ARCH__>=7 && !defined(__KERNEL__)
|
|
|
|
# ifdef __thumb2__
|
|
# define INST(a,b,c,d) .byte c,d|0xc,a,b
|
|
# else
|
|
# define INST(a,b,c,d) .byte a,b,c,d
|
|
# endif
|
|
|
|
.type sha256_block_data_order_armv8,%function
|
|
.align 5
|
|
sha256_block_data_order_armv8:
|
|
.LARMv8:
|
|
vld1.32 {q0,q1},[r0]
|
|
# ifdef __thumb2__
|
|
adr r3,.LARMv8
|
|
sub r3,r3,#.LARMv8-K256
|
|
# else
|
|
sub r3,r3,#256+32
|
|
# endif
|
|
add r2,r1,r2,lsl#6 @ len to point at the end of inp
|
|
|
|
.Loop_v8:
|
|
vld1.8 {q8-q9},[r1]!
|
|
vld1.8 {q10-q11},[r1]!
|
|
vld1.32 {q12},[r3]!
|
|
vrev32.8 q8,q8
|
|
vrev32.8 q9,q9
|
|
vrev32.8 q10,q10
|
|
vrev32.8 q11,q11
|
|
vmov q14,q0 @ offload
|
|
vmov q15,q1
|
|
teq r1,r2
|
|
vld1.32 {q13},[r3]!
|
|
vadd.i32 q12,q12,q8
|
|
INST(0xe2,0x03,0xfa,0xf3) @ sha256su0 q8,q9
|
|
vmov q2,q0
|
|
INST(0x68,0x0c,0x02,0xf3) @ sha256h q0,q1,q12
|
|
INST(0x68,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q12
|
|
INST(0xe6,0x0c,0x64,0xf3) @ sha256su1 q8,q10,q11
|
|
vld1.32 {q12},[r3]!
|
|
vadd.i32 q13,q13,q9
|
|
INST(0xe4,0x23,0xfa,0xf3) @ sha256su0 q9,q10
|
|
vmov q2,q0
|
|
INST(0x6a,0x0c,0x02,0xf3) @ sha256h q0,q1,q13
|
|
INST(0x6a,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q13
|
|
INST(0xe0,0x2c,0x66,0xf3) @ sha256su1 q9,q11,q8
|
|
vld1.32 {q13},[r3]!
|
|
vadd.i32 q12,q12,q10
|
|
INST(0xe6,0x43,0xfa,0xf3) @ sha256su0 q10,q11
|
|
vmov q2,q0
|
|
INST(0x68,0x0c,0x02,0xf3) @ sha256h q0,q1,q12
|
|
INST(0x68,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q12
|
|
INST(0xe2,0x4c,0x60,0xf3) @ sha256su1 q10,q8,q9
|
|
vld1.32 {q12},[r3]!
|
|
vadd.i32 q13,q13,q11
|
|
INST(0xe0,0x63,0xfa,0xf3) @ sha256su0 q11,q8
|
|
vmov q2,q0
|
|
INST(0x6a,0x0c,0x02,0xf3) @ sha256h q0,q1,q13
|
|
INST(0x6a,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q13
|
|
INST(0xe4,0x6c,0x62,0xf3) @ sha256su1 q11,q9,q10
|
|
vld1.32 {q13},[r3]!
|
|
vadd.i32 q12,q12,q8
|
|
INST(0xe2,0x03,0xfa,0xf3) @ sha256su0 q8,q9
|
|
vmov q2,q0
|
|
INST(0x68,0x0c,0x02,0xf3) @ sha256h q0,q1,q12
|
|
INST(0x68,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q12
|
|
INST(0xe6,0x0c,0x64,0xf3) @ sha256su1 q8,q10,q11
|
|
vld1.32 {q12},[r3]!
|
|
vadd.i32 q13,q13,q9
|
|
INST(0xe4,0x23,0xfa,0xf3) @ sha256su0 q9,q10
|
|
vmov q2,q0
|
|
INST(0x6a,0x0c,0x02,0xf3) @ sha256h q0,q1,q13
|
|
INST(0x6a,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q13
|
|
INST(0xe0,0x2c,0x66,0xf3) @ sha256su1 q9,q11,q8
|
|
vld1.32 {q13},[r3]!
|
|
vadd.i32 q12,q12,q10
|
|
INST(0xe6,0x43,0xfa,0xf3) @ sha256su0 q10,q11
|
|
vmov q2,q0
|
|
INST(0x68,0x0c,0x02,0xf3) @ sha256h q0,q1,q12
|
|
INST(0x68,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q12
|
|
INST(0xe2,0x4c,0x60,0xf3) @ sha256su1 q10,q8,q9
|
|
vld1.32 {q12},[r3]!
|
|
vadd.i32 q13,q13,q11
|
|
INST(0xe0,0x63,0xfa,0xf3) @ sha256su0 q11,q8
|
|
vmov q2,q0
|
|
INST(0x6a,0x0c,0x02,0xf3) @ sha256h q0,q1,q13
|
|
INST(0x6a,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q13
|
|
INST(0xe4,0x6c,0x62,0xf3) @ sha256su1 q11,q9,q10
|
|
vld1.32 {q13},[r3]!
|
|
vadd.i32 q12,q12,q8
|
|
INST(0xe2,0x03,0xfa,0xf3) @ sha256su0 q8,q9
|
|
vmov q2,q0
|
|
INST(0x68,0x0c,0x02,0xf3) @ sha256h q0,q1,q12
|
|
INST(0x68,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q12
|
|
INST(0xe6,0x0c,0x64,0xf3) @ sha256su1 q8,q10,q11
|
|
vld1.32 {q12},[r3]!
|
|
vadd.i32 q13,q13,q9
|
|
INST(0xe4,0x23,0xfa,0xf3) @ sha256su0 q9,q10
|
|
vmov q2,q0
|
|
INST(0x6a,0x0c,0x02,0xf3) @ sha256h q0,q1,q13
|
|
INST(0x6a,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q13
|
|
INST(0xe0,0x2c,0x66,0xf3) @ sha256su1 q9,q11,q8
|
|
vld1.32 {q13},[r3]!
|
|
vadd.i32 q12,q12,q10
|
|
INST(0xe6,0x43,0xfa,0xf3) @ sha256su0 q10,q11
|
|
vmov q2,q0
|
|
INST(0x68,0x0c,0x02,0xf3) @ sha256h q0,q1,q12
|
|
INST(0x68,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q12
|
|
INST(0xe2,0x4c,0x60,0xf3) @ sha256su1 q10,q8,q9
|
|
vld1.32 {q12},[r3]!
|
|
vadd.i32 q13,q13,q11
|
|
INST(0xe0,0x63,0xfa,0xf3) @ sha256su0 q11,q8
|
|
vmov q2,q0
|
|
INST(0x6a,0x0c,0x02,0xf3) @ sha256h q0,q1,q13
|
|
INST(0x6a,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q13
|
|
INST(0xe4,0x6c,0x62,0xf3) @ sha256su1 q11,q9,q10
|
|
vld1.32 {q13},[r3]!
|
|
vadd.i32 q12,q12,q8
|
|
vmov q2,q0
|
|
INST(0x68,0x0c,0x02,0xf3) @ sha256h q0,q1,q12
|
|
INST(0x68,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q12
|
|
|
|
vld1.32 {q12},[r3]!
|
|
vadd.i32 q13,q13,q9
|
|
vmov q2,q0
|
|
INST(0x6a,0x0c,0x02,0xf3) @ sha256h q0,q1,q13
|
|
INST(0x6a,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q13
|
|
|
|
vld1.32 {q13},[r3]
|
|
vadd.i32 q12,q12,q10
|
|
sub r3,r3,#256-16 @ rewind
|
|
vmov q2,q0
|
|
INST(0x68,0x0c,0x02,0xf3) @ sha256h q0,q1,q12
|
|
INST(0x68,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q12
|
|
|
|
vadd.i32 q13,q13,q11
|
|
vmov q2,q0
|
|
INST(0x6a,0x0c,0x02,0xf3) @ sha256h q0,q1,q13
|
|
INST(0x6a,0x2c,0x14,0xf3) @ sha256h2 q1,q2,q13
|
|
|
|
vadd.i32 q0,q0,q14
|
|
vadd.i32 q1,q1,q15
|
|
it ne
|
|
bne .Loop_v8
|
|
|
|
vst1.32 {q0,q1},[r0]
|
|
|
|
bx lr @ bx lr
|
|
.size sha256_block_data_order_armv8,.-sha256_block_data_order_armv8
|
|
#endif
|
|
.asciz "SHA256 block transform for ARMv4/NEON/ARMv8, CRYPTOGAMS by <appro@openssl.org>"
|
|
.align 2
|
|
#if __ARM_MAX_ARCH__>=7 && !defined(__KERNEL__)
|
|
.comm OPENSSL_armcap_P,4,4
|
|
#endif
|