mirror of
https://github.com/Atmosphere-NX/Atmosphere
synced 2025-01-05 11:58:00 +00:00
227 lines
7.6 KiB
C
227 lines
7.6 KiB
C
/*
|
|
* Copyright (c) 2018 Atmosphère-NX
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify it
|
|
* under the terms and conditions of the GNU General Public License,
|
|
* version 2, as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
|
* more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#include <stdint.h>
|
|
#include <string.h>
|
|
|
|
#include "arm.h"
|
|
#include "utils.h"
|
|
#include "fuse.h"
|
|
#include "gcm.h"
|
|
|
|
#include "sealedkeys.h"
|
|
#include "se.h"
|
|
|
|
/* Shifts right a little endian 128-bit value. */
|
|
static void shr_128(uint64_t *val) {
|
|
val[0] >>= 1;
|
|
val[0] |= (val[1] & 1) << 63;
|
|
val[1] >>= 1;
|
|
}
|
|
|
|
/* Shifts left a little endian 128-bit value. */
|
|
static void shl_128(uint64_t *val) {
|
|
val[1] <<= 1;
|
|
val[1] |= (val[0] & (1ull << 63)) >> 63;
|
|
val[0] <<= 1;
|
|
}
|
|
|
|
/* Multiplies two 128-bit numbers X,Y in the GF(128) Galois Field. */
|
|
static void gf128_mul(uint8_t *dst, const uint8_t *x, const uint8_t *y) {
|
|
uint8_t x_work[0x10];
|
|
uint8_t y_work[0x10];
|
|
uint8_t dst_work[0x10];
|
|
|
|
uint64_t *p_x = (uint64_t *)(&x_work[0]);
|
|
uint64_t *p_y = (uint64_t *)(&y_work[0]);
|
|
uint64_t *p_dst = (uint64_t *)(&dst_work[0]);
|
|
|
|
/* Initialize buffers. */
|
|
for (unsigned int i = 0; i < 0x10; i++) {
|
|
x_work[i] = x[0xF-i];
|
|
y_work[i] = y[0xF-i];
|
|
dst_work[i] = 0;
|
|
}
|
|
|
|
/* Perform operation for each bit in y. */
|
|
for (unsigned int round = 0; round < 0x80; round++) {
|
|
p_dst[0] ^= p_x[0] * ((y_work[0xF] & 0x80) >> 7);
|
|
p_dst[1] ^= p_x[1] * ((y_work[0xF] & 0x80) >> 7);
|
|
shl_128(p_y);
|
|
uint8_t xval = 0xE1 * (x_work[0] & 1);
|
|
shr_128(p_x);
|
|
x_work[0xF] ^= xval;
|
|
}
|
|
|
|
for (unsigned int i = 0; i < 0x10; i++) {
|
|
dst[i] = dst_work[0xF-i];
|
|
}
|
|
}
|
|
|
|
|
|
|
|
/* Performs an AES-GCM GHASH operation over the data into dst. */
|
|
static void ghash(void *dst, const void *data, size_t data_size, const void *j_block, bool encrypt) {
|
|
uint8_t x[0x10] = {0};
|
|
uint8_t h[0x10];
|
|
|
|
uint64_t *p_x = (uint64_t *)(&x[0]);
|
|
uint64_t *p_data = (uint64_t *)data;
|
|
|
|
/* H = aes_ecb_encrypt(zeroes) */
|
|
se_aes_128_ecb_encrypt_block(KEYSLOT_SWITCH_TEMPKEY, h, 0x10, x, 0x10);
|
|
|
|
size_t total_size = data_size;
|
|
|
|
while (data_size >= 0x10) {
|
|
/* X = (X ^ current_block) * H */
|
|
p_x[0] ^= p_data[0];
|
|
p_x[1] ^= p_data[1];
|
|
gf128_mul(x, x, h);
|
|
|
|
/* Increment p_data by 0x10 bytes. */
|
|
p_data += 2;
|
|
data_size -= 0x10;
|
|
}
|
|
|
|
/* Nintendo's code *discards all data in the last block* if unaligned. */
|
|
/* And treats that block as though it were all-zero. */
|
|
/* This is a bug, they just forget to XOR with the copy of the last block they save. */
|
|
if (data_size & 0xF) {
|
|
gf128_mul(x, x, h);
|
|
}
|
|
|
|
uint64_t xor_size = total_size << 3;
|
|
xor_size = __builtin_bswap64(xor_size);
|
|
|
|
/* Due to a Nintendo bug, the wrong QWORD gets XOR'd in the "final output block" case. */
|
|
if (encrypt) {
|
|
p_x[0] ^= xor_size;
|
|
} else {
|
|
p_x[1] ^= xor_size;
|
|
}
|
|
|
|
gf128_mul(x, x, h);
|
|
|
|
/* If final output block, XOR with encrypted J block. */
|
|
if (encrypt) {
|
|
se_aes_128_ecb_encrypt_block(KEYSLOT_SWITCH_TEMPKEY, h, 0x10, j_block, 0x10);
|
|
for (unsigned int i = 0; i < 0x10; i++) {
|
|
x[i] ^= h[i];
|
|
}
|
|
}
|
|
/* Copy output. */
|
|
memcpy(dst, x, 0x10);
|
|
}
|
|
|
|
|
|
/* This function is a doozy. It decrypts and validates a (non-standard) AES-GCM wrapped keypair. */
|
|
size_t gcm_decrypt_key(void *dst, size_t dst_size, const void *src, size_t src_size, const void *sealed_kek, size_t kek_size, const void *wrapped_key, size_t key_size, unsigned int usecase, bool is_personalized, uint8_t *out_deviceid_high) {
|
|
if (is_personalized == 0) {
|
|
/* Devkit keys use a different keyformat without a MAC/Device ID. */
|
|
if (src_size <= 0x10 || src_size - 0x10 > dst_size) {
|
|
generic_panic();
|
|
}
|
|
} else {
|
|
if (src_size <= 0x30 || src_size - 0x20 > dst_size) {
|
|
generic_panic();
|
|
}
|
|
}
|
|
|
|
uint8_t intermediate_buf[0x400] = {0};
|
|
|
|
/* Unwrap the key */
|
|
unseal_key(KEYSLOT_SWITCH_TEMPKEY, sealed_kek, kek_size, usecase);
|
|
decrypt_data_into_keyslot(KEYSLOT_SWITCH_TEMPKEY, KEYSLOT_SWITCH_TEMPKEY, wrapped_key, key_size);
|
|
|
|
/* Decrypt the GCM keypair, AES-CTR with CTR = blob[:0x10]. */
|
|
se_aes_ctr_crypt(KEYSLOT_SWITCH_TEMPKEY, intermediate_buf, dst_size, src + 0x10, src_size - 0x10, src, 0x10);
|
|
|
|
if (!is_personalized) {
|
|
/* Devkit non-personalized keys have no further authentication. */
|
|
memcpy(dst, intermediate_buf, src_size - 0x10);
|
|
memset(intermediate_buf, 0, sizeof(intermediate_buf));
|
|
return src_size - 0x10;
|
|
}
|
|
|
|
/* J = GHASH(CTR); */
|
|
uint8_t j_block[0x10];
|
|
ghash(j_block, src, 0x10, NULL, false);
|
|
|
|
/* MAC = GHASH(PLAINTEXT) ^ ENCRYPT(J) */
|
|
/* Note: That MAC is calculated over plaintext is non-standard. */
|
|
/* It is supposed to be over the ciphertext. */
|
|
uint8_t calc_mac[0x10];
|
|
ghash(calc_mac, intermediate_buf, src_size - 0x20, j_block, true);
|
|
|
|
/* Const-time memcmp. */
|
|
const uint8_t *src_bytes = src;
|
|
int different = 0;
|
|
for (unsigned int i = 0; i < 0x10; i++) {
|
|
different |= src_bytes[src_size - 0x10 + i] ^ calc_mac[i];
|
|
}
|
|
if (different) {
|
|
return 0;
|
|
}
|
|
|
|
if ((read64be(intermediate_buf, src_size - 0x28) & 0x00FFFFFFFFFFFFFFULL) != fuse_get_device_id()) {
|
|
return 0;
|
|
}
|
|
|
|
if (out_deviceid_high != NULL) {
|
|
*out_deviceid_high = intermediate_buf[src_size - 0x28];
|
|
}
|
|
|
|
memcpy(dst, intermediate_buf, src_size - 0x30);
|
|
memset(intermediate_buf, 0, sizeof(intermediate_buf));
|
|
return src_size - 0x30;
|
|
}
|
|
|
|
void gcm_encrypt_key(void *dst, size_t dst_size, const void *src, size_t src_size, const void *sealed_kek, size_t kek_size, const void *wrapped_key, size_t key_size, unsigned int usecase, uint64_t deviceid_high) {
|
|
uint8_t intermediate_buf[0x400] = {0};
|
|
if (src_size + 0x30 > dst_size) {
|
|
generic_panic();
|
|
}
|
|
|
|
/* Unwrap the key */
|
|
unseal_key(KEYSLOT_SWITCH_TEMPKEY, sealed_kek, kek_size, usecase);
|
|
decrypt_data_into_keyslot(KEYSLOT_SWITCH_TEMPKEY, KEYSLOT_SWITCH_TEMPKEY, wrapped_key, key_size);
|
|
|
|
/* Generate a random CTR. */
|
|
flush_dcache_range(intermediate_buf, intermediate_buf + 0x10);
|
|
se_generate_random(KEYSLOT_SWITCH_RNGKEY, intermediate_buf, 0x10);
|
|
flush_dcache_range(intermediate_buf, intermediate_buf + 0x10);
|
|
|
|
/* Write Device ID. */
|
|
write64be(intermediate_buf, src_size + 0x18, fuse_get_device_id() | (deviceid_high << 56));
|
|
|
|
|
|
/* J = GHASH(CTR); */
|
|
uint8_t j_block[0x10];
|
|
ghash(j_block, intermediate_buf, 0x10, NULL, false);
|
|
|
|
/* MAC = GHASH(PLAINTEXT) ^ ENCRYPT(J) */
|
|
/* Note: That MAC is calculated over plaintext is non-standard. */
|
|
/* It is supposed to be over the ciphertext. */
|
|
ghash(intermediate_buf + src_size + 0x20, intermediate_buf + 0x10, src_size + 0x10, j_block, true);
|
|
|
|
/* Encrypt the GCM keypair, AES-CTR with CTR = blob[:0x10]. */
|
|
se_aes_ctr_crypt(KEYSLOT_SWITCH_TEMPKEY, intermediate_buf + 0x10, src_size + 0x10, intermediate_buf + 0x10, src_size + 0x10, intermediate_buf, 0x10);
|
|
|
|
/* Copy the wrapped key out. */
|
|
memcpy(dst, intermediate_buf, src_size + 0x30);
|
|
memset(intermediate_buf, 0, sizeof(intermediate_buf));
|
|
}
|