| 1 | use super::{arch::*, utils::*}; |
| 2 | use crate::{Block, Block8}; |
| 3 | use cipher::inout::InOut; |
| 4 | use core::mem; |
| 5 | |
| 6 | /// AES-128 round keys |
| 7 | pub(super) type RoundKeys = [__m128i; 11]; |
| 8 | |
| 9 | #[inline ] |
| 10 | #[target_feature (enable = "aes" )] |
| 11 | pub(super) unsafe fn encrypt1(keys: &RoundKeys, block: InOut<'_, '_, Block>) { |
| 12 | let (in_ptr: *const GenericArray>, out_ptr: *mut GenericArray>) = block.into_raw(); |
| 13 | let mut b: __m128i = _mm_loadu_si128(mem_addr:in_ptr as *const __m128i); |
| 14 | b = _mm_xor_si128(a:b, b:keys[0]); |
| 15 | b = _mm_aesenc_si128(a:b, round_key:keys[1]); |
| 16 | b = _mm_aesenc_si128(a:b, round_key:keys[2]); |
| 17 | b = _mm_aesenc_si128(a:b, round_key:keys[3]); |
| 18 | b = _mm_aesenc_si128(a:b, round_key:keys[4]); |
| 19 | b = _mm_aesenc_si128(a:b, round_key:keys[5]); |
| 20 | b = _mm_aesenc_si128(a:b, round_key:keys[6]); |
| 21 | b = _mm_aesenc_si128(a:b, round_key:keys[7]); |
| 22 | b = _mm_aesenc_si128(a:b, round_key:keys[8]); |
| 23 | b = _mm_aesenc_si128(a:b, round_key:keys[9]); |
| 24 | b = _mm_aesenclast_si128(a:b, round_key:keys[10]); |
| 25 | _mm_storeu_si128(mem_addr:out_ptr as *mut __m128i, a:b); |
| 26 | } |
| 27 | |
| 28 | #[inline ] |
| 29 | #[target_feature (enable = "aes" )] |
| 30 | pub(super) unsafe fn encrypt8(keys: &RoundKeys, blocks: InOut<'_, '_, Block8>) { |
| 31 | let (in_ptr: *const GenericArray, …>, out_ptr: *mut GenericArray, …>) = blocks.into_raw(); |
| 32 | let mut b: [__m128i; 8] = load8(blocks:in_ptr); |
| 33 | xor8(&mut b, key:keys[0]); |
| 34 | aesenc8(&mut b, key:keys[1]); |
| 35 | aesenc8(&mut b, key:keys[2]); |
| 36 | aesenc8(&mut b, key:keys[3]); |
| 37 | aesenc8(&mut b, key:keys[4]); |
| 38 | aesenc8(&mut b, key:keys[5]); |
| 39 | aesenc8(&mut b, key:keys[6]); |
| 40 | aesenc8(&mut b, key:keys[7]); |
| 41 | aesenc8(&mut b, key:keys[8]); |
| 42 | aesenc8(&mut b, key:keys[9]); |
| 43 | aesenclast8(&mut b, key:keys[10]); |
| 44 | store8(blocks:out_ptr, b); |
| 45 | } |
| 46 | |
| 47 | #[inline ] |
| 48 | #[target_feature (enable = "aes" )] |
| 49 | pub(super) unsafe fn decrypt1(keys: &RoundKeys, block: InOut<'_, '_, Block>) { |
| 50 | let (in_ptr: *const GenericArray>, out_ptr: *mut GenericArray>) = block.into_raw(); |
| 51 | let mut b: __m128i = _mm_loadu_si128(mem_addr:in_ptr as *const __m128i); |
| 52 | b = _mm_xor_si128(a:b, b:keys[10]); |
| 53 | b = _mm_aesdec_si128(a:b, round_key:keys[9]); |
| 54 | b = _mm_aesdec_si128(a:b, round_key:keys[8]); |
| 55 | b = _mm_aesdec_si128(a:b, round_key:keys[7]); |
| 56 | b = _mm_aesdec_si128(a:b, round_key:keys[6]); |
| 57 | b = _mm_aesdec_si128(a:b, round_key:keys[5]); |
| 58 | b = _mm_aesdec_si128(a:b, round_key:keys[4]); |
| 59 | b = _mm_aesdec_si128(a:b, round_key:keys[3]); |
| 60 | b = _mm_aesdec_si128(a:b, round_key:keys[2]); |
| 61 | b = _mm_aesdec_si128(a:b, round_key:keys[1]); |
| 62 | b = _mm_aesdeclast_si128(a:b, round_key:keys[0]); |
| 63 | _mm_storeu_si128(mem_addr:out_ptr as *mut __m128i, a:b); |
| 64 | } |
| 65 | |
| 66 | #[inline ] |
| 67 | #[target_feature (enable = "aes" )] |
| 68 | pub(super) unsafe fn decrypt8(keys: &RoundKeys, blocks: InOut<'_, '_, Block8>) { |
| 69 | let (in_ptr: *const GenericArray, …>, out_ptr: *mut GenericArray, …>) = blocks.into_raw(); |
| 70 | let mut b: [__m128i; 8] = load8(blocks:in_ptr); |
| 71 | xor8(&mut b, key:keys[10]); |
| 72 | aesdec8(&mut b, key:keys[9]); |
| 73 | aesdec8(&mut b, key:keys[8]); |
| 74 | aesdec8(&mut b, key:keys[7]); |
| 75 | aesdec8(&mut b, key:keys[6]); |
| 76 | aesdec8(&mut b, key:keys[5]); |
| 77 | aesdec8(&mut b, key:keys[4]); |
| 78 | aesdec8(&mut b, key:keys[3]); |
| 79 | aesdec8(&mut b, key:keys[2]); |
| 80 | aesdec8(&mut b, key:keys[1]); |
| 81 | aesdeclast8(&mut b, key:keys[0]); |
| 82 | store8(blocks:out_ptr, b); |
| 83 | } |
| 84 | |
/// Computes round key `$pos` from round key `$pos - 1` and stores it in
/// `$keys[$pos]`.
///
/// `$round` is the round constant handed to `_mm_aeskeygenassist_si128`; it
/// must be a constant expression because the intrinsic takes it as an
/// immediate. The macro must be expanded inside an unsafe context where the
/// `aes` target feature is available.
macro_rules! expand_round {
    ($keys:expr, $pos:expr, $round:expr) => {{
        let prev = $keys[$pos - 1];

        // The shuffle immediate 0xff copies the highest 32-bit lane of the
        // key-generation assist result into all four lanes.
        let assist = _mm_shuffle_epi32(_mm_aeskeygenassist_si128(prev, $round), 0xff);

        // XOR the previous key with itself shifted left by 4, 8 and 12 bytes,
        // so each 32-bit lane ends up as the XOR of itself and all lower lanes.
        let shifted = _mm_slli_si128(prev, 0x4);
        let mut next = _mm_xor_si128(prev, shifted);
        let shifted = _mm_slli_si128(shifted, 0x4);
        next = _mm_xor_si128(next, shifted);
        let shifted = _mm_slli_si128(shifted, 0x4);
        next = _mm_xor_si128(next, shifted);

        // Mix the broadcast assist word into every lane.
        next = _mm_xor_si128(next, assist);

        $keys[$pos] = next;
    }};
}
| 104 | |
| 105 | #[inline ] |
| 106 | #[target_feature (enable = "aes" )] |
| 107 | pub(super) unsafe fn expand_key(key: &[u8; 16]) -> RoundKeys { |
| 108 | // SAFETY: `RoundKeys` is a `[__m128i; 11]` which can be initialized |
| 109 | // with all zeroes. |
| 110 | let mut keys: RoundKeys = mem::zeroed(); |
| 111 | |
| 112 | let k: __m128i = _mm_loadu_si128(mem_addr:key.as_ptr() as *const __m128i); |
| 113 | keys[0] = k; |
| 114 | |
| 115 | expand_round!(keys, 1, 0x01); |
| 116 | expand_round!(keys, 2, 0x02); |
| 117 | expand_round!(keys, 3, 0x04); |
| 118 | expand_round!(keys, 4, 0x08); |
| 119 | expand_round!(keys, 5, 0x10); |
| 120 | expand_round!(keys, 6, 0x20); |
| 121 | expand_round!(keys, 7, 0x40); |
| 122 | expand_round!(keys, 8, 0x80); |
| 123 | expand_round!(keys, 9, 0x1B); |
| 124 | expand_round!(keys, 10, 0x36); |
| 125 | |
| 126 | keys |
| 127 | } |
| 128 | |
| 129 | #[inline ] |
| 130 | #[target_feature (enable = "aes" )] |
| 131 | pub(super) unsafe fn inv_expanded_keys(keys: &RoundKeys) -> RoundKeys { |
| 132 | [ |
| 133 | keys[0], |
| 134 | _mm_aesimc_si128(keys[1]), |
| 135 | _mm_aesimc_si128(keys[2]), |
| 136 | _mm_aesimc_si128(keys[3]), |
| 137 | _mm_aesimc_si128(keys[4]), |
| 138 | _mm_aesimc_si128(keys[5]), |
| 139 | _mm_aesimc_si128(keys[6]), |
| 140 | _mm_aesimc_si128(keys[7]), |
| 141 | _mm_aesimc_si128(keys[8]), |
| 142 | _mm_aesimc_si128(keys[9]), |
| 143 | keys[10], |
| 144 | ] |
| 145 | } |
| 146 | |