vaseboot/VasEBoot-core/lib/libgcrypt/cipher/rijndael-ppc.c

231 lines
6.1 KiB
C

/* Rijndael (AES) for GnuPG - PowerPC Vector Crypto AES implementation
* Copyright (C) 2019 Shawn Landden <shawn@git.icu>
* Copyright (C) 2019-2020, 2022 Jussi Kivilinna <jussi.kivilinna@iki.fi>
*
* This file is part of Libgcrypt.
*
* Libgcrypt is free software; you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License as
* published by the Free Software Foundation; either version 2.1 of
* the License, or (at your option) any later version.
*
* Libgcrypt is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this program; if not, see <http://www.gnu.org/licenses/>.
*
* Alternatively, this code may be used in OpenSSL from The OpenSSL Project,
* and Cryptogams by Andy Polyakov, and if made part of a release of either
* or both projects, is thereafter dual-licensed under the license said project
* is released under.
*/
#include <config.h>
#include "rijndael-internal.h"
#include "cipher-internal.h"
#include "bufhelp.h"
#ifdef USE_PPC_CRYPTO
#include "rijndael-ppc-common.h"
#ifdef HAVE_GCC_ATTRIBUTE_OPTIMIZE
# define FUNC_ATTR_OPT __attribute__((optimize("-O2")))
#else
# define FUNC_ATTR_OPT
#endif
#if defined(__clang__) && defined(HAVE_CLANG_ATTRIBUTE_PPC_TARGET)
# define PPC_OPT_ATTR __attribute__((target("arch=pwr8"))) FUNC_ATTR_OPT
#elif defined(HAVE_GCC_ATTRIBUTE_PPC_TARGET)
# define PPC_OPT_ATTR __attribute__((target("cpu=power8"))) FUNC_ATTR_OPT
#else
# define PPC_OPT_ATTR FUNC_ATTR_OPT
#endif
#ifndef WORDS_BIGENDIAN
static const block vec_bswap32_const_neg =
{ ~3, ~2, ~1, ~0, ~7, ~6, ~5, ~4, ~11, ~10, ~9, ~8, ~15, ~14, ~13, ~12 };
#endif
static ASM_FUNC_ATTR_INLINE block
asm_load_be_const(void)
{
#ifndef WORDS_BIGENDIAN
return ALIGNED_LOAD (&vec_bswap32_const_neg, 0);
#else
static const block vec_dummy = { 0 };
return vec_dummy;
#endif
}
static ASM_FUNC_ATTR_INLINE block
asm_be_swap(block vec, block be_bswap_const)
{
(void)be_bswap_const;
#ifndef WORDS_BIGENDIAN
return asm_vperm1 (vec, be_bswap_const);
#else
return vec;
#endif
}
static ASM_FUNC_ATTR_INLINE block
asm_load_be_noswap(unsigned long offset, const void *ptr)
{
block vec;
#if __GNUC__ >= 4
if (__builtin_constant_p (offset) && offset == 0)
__asm__ volatile ("lxvw4x %x0,0,%1\n\t"
: "=wa" (vec)
: "r" ((uintptr_t)ptr)
: "memory");
else
#endif
__asm__ volatile ("lxvw4x %x0,%1,%2\n\t"
: "=wa" (vec)
: "r" (offset), "r" ((uintptr_t)ptr)
: "memory", "r0");
/* NOTE: vec needs to be be-swapped using 'asm_be_swap' by caller */
return vec;
}
static ASM_FUNC_ATTR_INLINE void
asm_store_be_noswap(block vec, unsigned long offset, void *ptr)
{
/* NOTE: vec be-swapped using 'asm_be_swap' by caller */
#if __GNUC__ >= 4
if (__builtin_constant_p (offset) && offset == 0)
__asm__ volatile ("stxvw4x %x0,0,%1\n\t"
:
: "wa" (vec), "r" ((uintptr_t)ptr)
: "memory");
else
#endif
__asm__ volatile ("stxvw4x %x0,%1,%2\n\t"
:
: "wa" (vec), "r" (offset), "r" ((uintptr_t)ptr)
: "memory", "r0");
}
static ASM_FUNC_ATTR_INLINE unsigned int
keysched_idx(unsigned int in)
{
#ifdef WORDS_BIGENDIAN
return in;
#else
return (in & ~3U) | (3U - (in & 3U));
#endif
}
static ASM_FUNC_ATTR_INLINE vec_u32
bcast_u32_to_vec(u32 x)
{
vec_u32 v = { x, x, x, x };
return v;
}
static ASM_FUNC_ATTR_INLINE u32
u32_from_vec(vec_u32 x)
{
#ifdef WORDS_BIGENDIAN
return x[1];
#else
return x[2];
#endif
}
void PPC_OPT_ATTR
_gcry_aes_ppc8_setkey (RIJNDAEL_context *ctx, const byte *key)
{
static const vec_u32 rotate24 = { 24, 24, 24, 24 };
static const vec_u32 rcon_const = { 0x1b, 0x1b, 0x1b, 0x1b };
vec_u32 tk_vu32[MAXKC];
unsigned int rounds = ctx->rounds;
unsigned int KC = rounds - 6;
u32 *W_u32 = ctx->keyschenc32b;
unsigned int i, j;
vec_u32 tk_prev;
vec_u32 rcon = { 1, 1, 1, 1 };
for (i = 0; i < KC; i += 2)
{
unsigned int idx0 = keysched_idx(i + 0);
unsigned int idx1 = keysched_idx(i + 1);
tk_vu32[i + 0] = bcast_u32_to_vec(buf_get_le32(key + i * 4 + 0));
tk_vu32[i + 1] = bcast_u32_to_vec(buf_get_le32(key + i * 4 + 4));
W_u32[idx0] = u32_from_vec(vec_revb(tk_vu32[i + 0]));
W_u32[idx1] = u32_from_vec(vec_revb(tk_vu32[i + 1]));
}
for (i = KC, j = KC, tk_prev = tk_vu32[KC - 1];
i < 4 * (rounds + 1);
i += 2, j += 2)
{
unsigned int idx0 = keysched_idx(i + 0);
unsigned int idx1 = keysched_idx(i + 1);
vec_u32 temp0 = tk_prev;
vec_u32 temp1;
if (j == KC)
{
j = 0;
temp0 = (vec_u32)(asm_sbox_be((block)vec_rl(temp0, rotate24))) ^ rcon;
rcon = (vec_u32)(((block)rcon << 1)
^ (-((block)rcon >> 7) & (block)rcon_const));
}
else if (KC == 8 && j == 4)
{
temp0 = (vec_u32)asm_sbox_be((block)temp0);
}
temp1 = tk_vu32[j + 0];
tk_vu32[j + 0] = temp0 ^ temp1;
tk_vu32[j + 1] ^= temp0 ^ temp1;
tk_prev = tk_vu32[j + 1];
W_u32[idx0] = u32_from_vec(vec_revb(tk_vu32[j + 0]));
W_u32[idx1] = u32_from_vec(vec_revb(tk_vu32[j + 1]));
}
wipememory(tk_vu32, sizeof(tk_vu32));
}
void PPC_OPT_ATTR
_gcry_aes_ppc8_prepare_decryption (RIJNDAEL_context *ctx)
{
internal_aes_ppc_prepare_decryption (ctx);
}
#define GCRY_AES_PPC8 1
#define ENCRYPT_BLOCK_FUNC _gcry_aes_ppc8_encrypt
#define DECRYPT_BLOCK_FUNC _gcry_aes_ppc8_decrypt
#define ECB_CRYPT_FUNC _gcry_aes_ppc8_ecb_crypt
#define CFB_ENC_FUNC _gcry_aes_ppc8_cfb_enc
#define CFB_DEC_FUNC _gcry_aes_ppc8_cfb_dec
#define CBC_ENC_FUNC _gcry_aes_ppc8_cbc_enc
#define CBC_DEC_FUNC _gcry_aes_ppc8_cbc_dec
#define CTR_ENC_FUNC _gcry_aes_ppc8_ctr_enc
#define OCB_CRYPT_FUNC _gcry_aes_ppc8_ocb_crypt
#define OCB_AUTH_FUNC _gcry_aes_ppc8_ocb_auth
#define XTS_CRYPT_FUNC _gcry_aes_ppc8_xts_crypt
#define CTR32LE_ENC_FUNC _gcry_aes_ppc8_ctr32le_enc
#include <rijndael-ppc-functions.h>
#endif /* USE_PPC_CRYPTO */