@ @ Implementation by Ronny Van Keer, hereby denoted as "the implementer". @ @ For more information, feedback or questions, please refer to our website: @ https://keccak.team/ @ @ To the extent possible under law, the implementer has waived all copyright @ and related or neighboring rights to the source code in this file. @ http://creativecommons.org/publicdomain/zero/1.0/ @ @ --- @ @ This file implements Keccak-p[400] in a SnP-compatible way. @ Please refer to SnP-documentation.h for more details. @ @ This implementation comes with KeccakP-400-SnP.h in the same folder. @ Please refer to LowLevel.build for the exact list of other files it must be combined with. @ @ WARNING: This implementation assumes a little endian CPU with ARMv7M architecture (e.g., Cortex-M3) and the GCC compiler. .thumb .syntax unified .text @---------------------------------------------------------------------------- .equ _ba , 0*2 .equ _be , 1*2 .equ _bi , 2*2 .equ _bo , 3*2 .equ _bu , 4*2 .equ _ga , 5*2 .equ _ge , 6*2 .equ _gi , 7*2 .equ _go , 8*2 .equ _gu , 9*2 .equ _ka , 10*2 .equ _ke , 11*2 .equ _ki , 12*2 .equ _ko , 13*2 .equ _ku , 14*2 .equ _ma , 15*2 .equ _me , 16*2 .equ _mi , 17*2 .equ _mo , 18*2 .equ _mu , 19*2 .equ _sa , 20*2 .equ _se , 21*2 .equ _si , 22*2 .equ _so , 23*2 .equ _su , 24*2 .macro xor5 result,ptr,b,g,k,m,rs ldrh \result, [\ptr, #\b] ldrh r6, [\ptr, #\g] eor \result, \result, \rs ldrh \rs, [\ptr, #\k] eor \result, \result, r6 ldrh r6, [\ptr, #\m] eor \result, \result, \rs eor \result, \result, r6 .endm .macro xor5D resultL,resultH,ptr,b,g,k,m,rsL,rsH bfi \rsL, \rsH, #16, #16 ldr \resultL, [\ptr, #\b] ldr r6, [\ptr, #\g] eor \resultL, \resultL, \rsL ldr \rsL, [\ptr, #\k] eor \resultL, \resultL, r6 ldr r6, [\ptr, #\m] eor \resultL, \resultL, \rsL eor \resultL, \resultL, r6 lsr \resultH, \resultL, #16 uxth \resultL, \resultL .endm .macro xorrol b, yy, rr eor \b, \b, \yy .if \rr != 8 lsl \b, \b, #\rr orr \b, \b, \b, LSR #16 .else rev16 \b, \b .endif .endm .macro rolxor d, a, b eor \d, \a, \b, LSL #1 eor \d, \d, \b, LSR #15 uxth \d, \d .endm .macro xandnot resptr, resofs, aa, bb, cc, temp bic \temp, \cc, \bb eor \temp, \temp, \aa strh \temp, [\resptr, #\resofs] .endm .macro xandnotRC resptr, resofs, aa, bb, cc ldrh r6, [r8], #2 bic \cc, \cc, \bb eor \cc, \cc, r6 eor \cc, \cc, \aa strh \cc, [\resptr, #\resofs] .endm .macro KeccakRound sOut, sIn @prepTheta xor5D r1, r2, \sIn, _ba, _ga, _ka, _ma, r9, r10 xor5D r3, r4, \sIn, _bi, _gi, _ki, _mi, r11, r12 rolxor r9, r7, r2 rolxor r10, r1, r3 rolxor r11, r2, r4 rolxor r12, r3, r7 rolxor lr, r4, r1 @thetaRhoPiChiIota ldrh r1, [\sIn, #_ba] ldrh r2, [\sIn, #_ge] ldrh r3, [\sIn, #_ki] ldrh r4, [\sIn, #_mo] eor r1, r1, r9 xorrol r2, r10, 12 xorrol r3, r11, 11 xorrol r4, r12, 5 xorrol r5, lr, 14 xandnot \sOut, _be, r2, r3, r4, r6 xandnot \sOut, _bi, r3, r4, r5, r6 xandnot \sOut, _bo, r4, r5, r1, r6 xandnot \sOut, _bu, r5, r1, r2, r7 xandnotRC \sOut, _ba, r1, r2, r3 ldrh r1, [\sIn, #_bo] ldrh r2, [\sIn, #_gu] ldrh r3, [\sIn, #_ka] ldrh r4, [\sIn, #_me] ldrh r5, [\sIn, #_si] xorrol r1, r12, 12 xorrol r2, lr, 4 xorrol r3, r9, 3 xorrol r4, r10, 13 xorrol r5, r11, 13 xandnot \sOut, _ga, r1, r2, r3, r6 xandnot \sOut, _ge, r2, r3, r4, r6 xandnot \sOut, _gi, r3, r4, r5, r6 xandnot \sOut, _go, r4, r5, r1, r6 xandnot \sOut, _gu, r5, r1, r2, r6 eor r7, r7, r6 ldrh r1, [\sIn, #_be] ldrh r2, [\sIn, #_gi] ldrh r3, [\sIn, #_ko] ldrh r4, [\sIn, #_mu] ldrh r5, [\sIn, #_sa] xorrol r1, r10, 1 xorrol r2, r11, 6 xorrol r3, r12, 9 xorrol r4, lr, 8 xorrol r5, r9, 2 xandnot \sOut, _ka, r1, r2, r3, r6 xandnot \sOut, _ke, r2, r3, r4, r6 xandnot \sOut, _ki, r3, r4, r5, r6 xandnot \sOut, _ko, r4, r5, r1, r6 xandnot \sOut, _ku, r5, r1, r2, r6 eor r7, r7, r6 ldrh r1, [\sIn, #_bu] ldrh r2, [\sIn, #_ga] ldrh r3, [\sIn, #_ke] ldrh r4, [\sIn, #_mi] ldrh r5, [\sIn, #_so] xorrol r1, lr, 11 xorrol r2, r9, 4 xorrol r3, r10, 10 xorrol r4, r11, 15 xorrol r5, r12, 8 xandnot \sOut, _ma, r1, r2, r3, r6 xandnot \sOut, _me, r2, r3, r4, r6 xandnot \sOut, _mi, r3, r4, r5, r6 xandnot \sOut, _mo, r4, r5, r1, r6 xandnot \sOut, _mu, r5, r1, r2, r6 eor r7, r7, r6 ldrh r1, [\sIn, #_bi] ldrh r2, [\sIn, #_go] ldrh r3, [\sIn, #_ku] ldrh r4, [\sIn, #_ma] ldrh r5, [\sIn, #_se] xorrol r1, r11, 14 xorrol r2, r12, 7 xorrol r3, lr, 7 xorrol r4, r9, 9 xorrol r5, r10, 2 xandnot \sOut, _sa, r1, r2, r3, r9 xandnot \sOut, _se, r2, r3, r4, r10 xandnot \sOut, _si, r3, r4, r5, r11 xandnot \sOut, _so, r4, r5, r1, r12 bic r1, r2, r1 eor r5, r5, r1 eor r7, r7, r5 uxth r7, r7 strh r5, [\sOut, #_su] uxth r5, r5 .endm @---------------------------------------------------------------------------- @ @ void KeccakP400_StaticInitialize( void ) @ .align 8 .global KeccakP400_StaticInitialize .type KeccakP400_StaticInitialize, %function; KeccakP400_StaticInitialize: bx lr @---------------------------------------------------------------------------- @ @ void KeccakP400_Initialize(void *state) @ .align 8 .global KeccakP400_Initialize .type KeccakP400_Initialize, %function; KeccakP400_Initialize: movs r1, #0 movs r2, #0 movs r3, #0 stmia r0!, { r1 - r3 } stmia r0!, { r1 - r3 } stmia r0!, { r1 - r3 } stmia r0!, { r1 - r3 } strh r1, [r0] bx lr @ ---------------------------------------------------------------------------- @ @ void KeccakP400_AddByte(void *state, unsigned char byte, unsigned int offset) @ .align 8 .global KeccakP400_AddByte .type KeccakP400_AddByte, %function; KeccakP400_AddByte: ldrb r3, [r0, r2] eors r3, r3, r1 strb r3, [r0, r2] bx lr @---------------------------------------------------------------------------- @ @ void KeccakP400_AddBytes(void *state, const unsigned char *data, unsigned int offset, unsigned int length) @ .align 8 .global KeccakP400_AddBytes .type KeccakP400_AddBytes, %function; KeccakP400_AddBytes: subs r3, r3, #1 bcc KeccakP400_AddBytes_Exit adds r0, r0, r2 push {r4,lr} KeccakP400_AddBytes_Loop: ldrb r2, [r1, r3] ldrb r4, [r0, r3] eors r2, r2, r4 strb r2, [r0, r3] subs r3, r3, #1 bcs KeccakP400_AddBytes_Loop pop {r4,pc} KeccakP400_AddBytes_Exit: bx lr @ ---------------------------------------------------------------------------- @ @ void KeccakP400_OverwriteBytes(void *state, const unsigned char *data, unsigned int offset, unsigned int length) @ .align 8 .global KeccakP400_OverwriteBytes .type KeccakP400_OverwriteBytes, %function; KeccakP400_OverwriteBytes: subs r3, r3, #1 bcc KeccakP400_OverwriteBytes_Exit adds r0, r0, r2 KeccakP400_OverwriteBytes_Loop: ldrb r2, [r1, r3] strb r2, [r0, r3] subs r3, r3, #1 bcs KeccakP400_OverwriteBytes_Loop KeccakP400_OverwriteBytes_Exit: bx lr @---------------------------------------------------------------------------- @ @ void KeccakP400_OverwriteWithZeroes(void *state, unsigned int byteCount) @ .align 8 .global KeccakP400_OverwriteWithZeroes .type KeccakP400_OverwriteWithZeroes, %function; KeccakP400_OverwriteWithZeroes: movs r3, #0 lsrs r2, r1, #2 beq KeccakP400_OverwriteWithZeroes_Bytes KeccakP400_OverwriteWithZeroes_Loop2Lanes: str r3, [r0], #4 subs r2, r2, #1 bne KeccakP400_OverwriteWithZeroes_Loop2Lanes KeccakP400_OverwriteWithZeroes_Bytes: ands r1, #3 beq KeccakP400_OverwriteWithZeroes_Exit KeccakP400_OverwriteWithZeroes_LoopBytes: strb r3, [r0], #1 subs r1, r1, #1 bne KeccakP400_OverwriteWithZeroes_LoopBytes KeccakP400_OverwriteWithZeroes_Exit: bx lr @ ---------------------------------------------------------------------------- @ @ void KeccakP400_ExtractBytes(void *state, const unsigned char *data, unsigned int offset, unsigned int length) @ .align 8 .global KeccakP400_ExtractBytes .type KeccakP400_ExtractBytes, %function; KeccakP400_ExtractBytes: subs r3, r3, #1 bcc KeccakP400_ExtractBytes_Exit adds r0, r0, r2 KeccakP400_ExtractBytes_Loop: ldrb r2, [r0, r3] strb r2, [r1, r3] subs r3, r3, #1 bcs KeccakP400_ExtractBytes_Loop KeccakP400_ExtractBytes_Exit: bx lr @ ---------------------------------------------------------------------------- @ @ void KeccakP400_ExtractAndAddBytes(void *state, const unsigned char *input, unsigned char *output, unsigned int offset, unsigned int length) @ .align 8 .global KeccakP400_ExtractAndAddBytes .type KeccakP400_ExtractAndAddBytes, %function; KeccakP400_ExtractAndAddBytes: push {r4,r5} adds r0, r0, r3 @ state += offset (offset register no longer needed, reuse for length) ldr r3, [sp, #8] @ get length argument from stack subs r3, r3, #1 @ .if length != 0 bcc KeccakP400_ExtractAndAddBytes_Exit KeccakP400_ExtractAndAddBytes_Loop: ldrb r5, [r0, r3] ldrb r4, [r1, r3] eors r5, r5, r4 strb r5, [r2, r3] subs r3, r3, #1 bcs KeccakP400_ExtractAndAddBytes_Loop KeccakP400_ExtractAndAddBytes_Exit: pop {r4,r5} bx lr @---------------------------------------------------------------------------- @ @ void KeccakP400_Permute_Nrounds( void *state, unsigned int nr ) @ .align 8 .global KeccakP400_Permute_Nrounds .type KeccakP400_Permute_Nrounds, %function; KeccakP400_Permute_Nrounds: push {r4-r12,lr} sub sp, sp, #2*25+6 adr r8, KeccakP400_Permute_RoundConstants sub r8, r8, r1, LSL #1 lsls r1, r1, #31 beq KeccakP400_PermuteIntern mov r1, sp @ odd number of rounds ldm r0!, { r2, r3, r4, r5, r11, r12 } @ copy state to stack stm r1!, { r2, r3, r4, r5, r11, r12 } ldm r0!, { r2, r3, r4, r5, r11, r12 } stm r1!, { r2, r3, r4, r5, r11, r12 } sub r0, r0, #2*24 ldrh lr, [r0, #_su] strh lr, [sp, #_su] uxth r9, r11 uxth r10, r11, ROR #16 uxth r11, r12 lsr r12, r12, #16 mov r5, lr xor5 r7, r0, _bu, _gu, _ku, _mu, lr b KeccakP400_Permute_RoundOdd @---------------------------------------------------------------------------- @ @ void KeccakP400_Permute_20rounds( void *state ) @ .align 8 .global KeccakP400_Permute_20rounds .type KeccakP400_Permute_20rounds, %function; KeccakP400_Permute_20rounds: push {r4-r12,lr} sub sp, sp, #2*25+6 adr r8, KeccakP400_Permute_RoundConstants20 KeccakP400_PermuteIntern: ldrh r9, [r0, #_sa] ldrh r10, [r0, #_se] ldrh r11, [r0, #_si] ldrh lr, [r0, #_su] ldrh r12, [r0, #_so] mov r5, lr xor5 r7, r0, _bu, _gu, _ku, _mu, lr KeccakP400_Permute_RoundLoop: KeccakRound sp, r0 KeccakP400_Permute_RoundOdd: KeccakRound r0, sp ldrh r3, [r8] cmp r3, #0 bne KeccakP400_Permute_RoundLoop add sp,sp,#2*25+6 pop {r4-r12,pc} .align 8 KeccakP400_Permute_RoundConstants20: .short 0x0001 .short 0x8082 .short 0x808a .short 0x8000 .short 0x808b .short 0x0001 .short 0x8081 .short 0x8009 .short 0x008a .short 0x0088 .short 0x8009 .short 0x000a .short 0x808b .short 0x008b .short 0x8089 .short 0x8003 .short 0x8002 .short 0x0080 .short 0x800a .short 0x000a KeccakP400_Permute_RoundConstants: .short 0 @ terminator