corecrypto/acceleratecrypto/Source/aes/arm64/encrypt_ecb.s

120 lines
2.8 KiB
ArmAsm
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

# Copyright (c) (2011-2016,2018-2020) Apple Inc. All rights reserved.
#
# corecrypto is licensed under Apple Inc.s Internal Use License Agreement (which
# is contained in the License.txt file distributed with corecrypto) and only to
# people who accept that license. IMPORTANT: Any license rights granted to you by
# Apple Inc. (if any) are limited to internal use within your organization only on
# devices and computers you own or control, for the sole purpose of verifying the
# security characteristics and correct functioning of the Apple Software. You may
# not, directly or indirectly, redistribute the Apple Software or any portions thereof.
#if defined(__arm64__)
#include "arm64_isa_compatibility.h"
#include "ccarm_pac_bti_macros.h"
#define key x0
#define nblocks w1
#define in x2
#define out x3
#define keylen x4
#define t x5
.subsections_via_symbols
.text
.p2align 4
.globl _AccelerateCrypto_ecb_AES_encrypt
_AccelerateCrypto_ecb_AES_encrypt:
BRANCH_TARGET_CALL
#if BUILDKERNEL
// save used vector registers
sub x4, sp, #6*16
sub sp, sp, #6*16
st1.4s {v0,v1,v2,v3}, [x4], #4*16
st1.4s {v4,v5}, [x4], #2*16
#endif
ldr w4, [key, #240] // keylength = 32-bit, 160/192/224
subs nblocks, nblocks, #4 // pre-decrement nblocks by 4
ldr q5, [key, keylen] // expanded key
b.lt 1f // if nblocks < 4, go to scalar loop
L_4blocks:
// handle 4 blocks per iteration
ldr q4, [key] // expanded key
mov t, #16
ld1.4s {v0,v1,v2,v3}, [in], #4*16
0:
AESE 0, 4
AESMC 0, 0
AESE 1, 4
AESMC 1, 1
AESE 2, 4
AESMC 2, 2
AESE 3, 4
AESMC 3, 3
ldr q4, [key, t] // expanded key
add t, t, #16
cmp t, keylen
b.lt 0b
AESE 0, 4
eor.16b v0, v0, v5
AESE 1, 4
eor.16b v1, v1, v5
AESE 2, 4
eor.16b v2, v2, v5
AESE 3, 4
eor.16b v3, v3, v5
st1.4s {v0,v1,v2,v3}, [out], #4*16
subs nblocks, nblocks, #4
b.ge L_4blocks
1: // handle 1 block per iteration
ands nblocks, nblocks, #3
b.eq 9f
L_1block:
ldr q4, [key] // expanded key
mov t, #16
ldr q0, [in], #16 // plain data
0:
AESE 0, 4
AESMC 0, 0
ldr q4, [key, t] // expanded key
add t, t, #16
cmp t, keylen
b.lt 0b
AESE 0, 4
eor.16b v0, v0, v5
str q0, [out], #16
subs nblocks, nblocks, #1
b.gt L_1block
9:
#if BUILDKERNEL
// restore used vector registers
ld1.4s {v0,v1,v2,v3}, [sp], #4*16
ld1.4s {v4,v5}, [sp], #2*16
#endif
mov x0, #0
ret lr
#undef in
#undef out
#undef key
#undef nblocks
#undef keylen
#endif