2014-05-06 19:26:28 +02:00
|
|
|
#include <stdlib.h>
|
2014-05-06 18:22:22 +02:00
|
|
|
#include "aes.h"
|
|
|
|
|
|
|
|
namespace i2p
|
|
|
|
{
|
|
|
|
namespace crypto
|
|
|
|
{
|
2014-05-07 20:48:37 +02:00
|
|
|
|
|
|
|
#ifdef __x86_64__
|
2014-05-09 03:43:08 +02:00
|
|
|
|
|
|
|
// Selects the start of the key schedule inside m_UnalignedBuffer.
// The schedule is read and written with movaps, which needs a 16-byte
// aligned address, so the buffer start is rounded up to the next multiple
// of 16 when it is not already aligned.
ECBCryptoAESNI::ECBCryptoAESNI ()
{
    m_KeySchedule = m_UnalignedBuffer;
    // low four address bits = distance past the previous 16-byte boundary
    const uint8_t misalignment = reinterpret_cast<uint64_t>(m_KeySchedule) & 0x0f;
    if (misalignment != 0)
        m_KeySchedule += (16 - misalignment);
}
|
|
|
|
|
2014-05-13 17:03:33 +02:00
|
|
|
// Assembly text for one pair of AES-256 key schedule steps.
// On entry: xmm1 and xmm3 hold the two most recent round keys and xmm2 holds
// the aeskeygenassist result computed from xmm3. xmm4 is used as scratch.
// The updated xmm1 is stored at evenOffset(%[sched]) and the updated xmm3 at
// oddOffset(%[sched]); both stores use movaps, so %[sched] must be 16-byte
// aligned.
#define KeyExpansion256(evenOffset, oddOffset) \
    /* broadcast dword 3 of the keygen result */ \
    "pshufd $0xff, %%xmm2, %%xmm2 \n" \
    /* xor xmm1 with itself shifted left by 4, 8 and 12 bytes */ \
    "movaps %%xmm1, %%xmm4 \n" \
    "pslldq $4, %%xmm4 \n" \
    "pxor %%xmm4, %%xmm1 \n" \
    "pslldq $4, %%xmm4 \n" \
    "pxor %%xmm4, %%xmm1 \n" \
    "pslldq $4, %%xmm4 \n" \
    "pxor %%xmm4, %%xmm1 \n" \
    "pxor %%xmm2, %%xmm1 \n" \
    "movaps %%xmm1, " #evenOffset "(%[sched]) \n" \
    /* second half: keygen from the fresh xmm1, broadcast dword 2 */ \
    "aeskeygenassist $0, %%xmm1, %%xmm4 \n" \
    "pshufd $0xaa, %%xmm4, %%xmm2 \n" \
    /* same shift-and-xor chain applied to xmm3 */ \
    "movaps %%xmm3, %%xmm4 \n" \
    "pslldq $4, %%xmm4 \n" \
    "pxor %%xmm4, %%xmm3 \n" \
    "pslldq $4, %%xmm4 \n" \
    "pxor %%xmm4, %%xmm3 \n" \
    "pslldq $4, %%xmm4 \n" \
    "pxor %%xmm4, %%xmm3 \n" \
    "pxor %%xmm2, %%xmm3 \n" \
    "movaps %%xmm3, " #oddOffset "(%[sched]) \n"
|
2014-05-07 20:48:37 +02:00
|
|
|
|
2014-05-08 21:11:38 +02:00
|
|
|
void ECBCryptoAESNI::ExpandKey (const uint8_t * key)
|
2014-05-07 20:48:37 +02:00
|
|
|
{
|
|
|
|
__asm__
|
|
|
|
(
|
2014-05-09 20:11:05 +02:00
|
|
|
"movups (%[key]), %%xmm1 \n"
|
|
|
|
"movups 16(%[key]), %%xmm3 \n"
|
2014-05-13 04:51:59 +02:00
|
|
|
"movaps %%xmm1, (%[sched]) \n"
|
|
|
|
"movaps %%xmm3, 16(%[sched]) \n"
|
2014-05-07 20:48:37 +02:00
|
|
|
"aeskeygenassist $1, %%xmm3, %%xmm2 \n"
|
2014-05-13 17:03:33 +02:00
|
|
|
KeyExpansion256(32,48)
|
2014-05-07 20:48:37 +02:00
|
|
|
"aeskeygenassist $2, %%xmm3, %%xmm2 \n"
|
2014-05-13 17:03:33 +02:00
|
|
|
KeyExpansion256(64,80)
|
2014-05-07 20:48:37 +02:00
|
|
|
"aeskeygenassist $4, %%xmm3, %%xmm2 \n"
|
2014-05-13 17:03:33 +02:00
|
|
|
KeyExpansion256(96,112)
|
2014-05-07 20:48:37 +02:00
|
|
|
"aeskeygenassist $8, %%xmm3, %%xmm2 \n"
|
2014-05-13 17:03:33 +02:00
|
|
|
KeyExpansion256(128,144)
|
2014-05-08 17:53:54 +02:00
|
|
|
"aeskeygenassist $16, %%xmm3, %%xmm2 \n"
|
2014-05-13 17:03:33 +02:00
|
|
|
KeyExpansion256(160,176)
|
2014-05-08 17:53:54 +02:00
|
|
|
"aeskeygenassist $32, %%xmm3, %%xmm2 \n"
|
2014-05-13 17:03:33 +02:00
|
|
|
KeyExpansion256(192,208)
|
2014-05-08 17:53:54 +02:00
|
|
|
"aeskeygenassist $64, %%xmm3, %%xmm2 \n"
|
2014-05-07 20:48:37 +02:00
|
|
|
// key expansion final
|
|
|
|
"pshufd $0xff, %%xmm2, %%xmm2 \n"
|
|
|
|
"movaps %%xmm1, %%xmm4 \n"
|
|
|
|
"pslldq $4, %%xmm4 \n"
|
|
|
|
"pxor %%xmm4, %%xmm1 \n"
|
|
|
|
"pslldq $4, %%xmm4 \n"
|
|
|
|
"pxor %%xmm4, %%xmm1 \n"
|
|
|
|
"pslldq $4, %%xmm4 \n"
|
|
|
|
"pxor %%xmm4, %%xmm1 \n"
|
|
|
|
"pxor %%xmm2, %%xmm1 \n"
|
2014-05-13 17:03:33 +02:00
|
|
|
"movups %%xmm1, 224(%[sched]) \n"
|
2014-05-07 20:48:37 +02:00
|
|
|
: // output
|
2014-05-13 04:51:59 +02:00
|
|
|
: [key]"r"(key), [sched]"r"(m_KeySchedule) // input
|
2014-05-13 17:03:33 +02:00
|
|
|
: "%xmm1", "%xmm2", "%xmm3", "%xmm4" // clogged
|
2014-05-07 20:48:37 +02:00
|
|
|
);
|
|
|
|
}
|
|
|
|
|
2014-05-15 17:00:35 +02:00
|
|
|
// Assembly text that encrypts the block held in xmm0 with AES-256.
// `keys` is the name of the asm operand holding the key schedule pointer;
// round keys are read at offsets 0..224 as memory operands of pxor/aesenc.
#define EncryptAES256(keys) \
    /* initial whitening with round key 0 */ \
    "pxor (%[" #keys "]), %%xmm0 \n" \
    /* rounds 1..13 */ \
    "aesenc 16(%[" #keys "]), %%xmm0 \n" \
    "aesenc 32(%[" #keys "]), %%xmm0 \n" \
    "aesenc 48(%[" #keys "]), %%xmm0 \n" \
    "aesenc 64(%[" #keys "]), %%xmm0 \n" \
    "aesenc 80(%[" #keys "]), %%xmm0 \n" \
    "aesenc 96(%[" #keys "]), %%xmm0 \n" \
    "aesenc 112(%[" #keys "]), %%xmm0 \n" \
    "aesenc 128(%[" #keys "]), %%xmm0 \n" \
    "aesenc 144(%[" #keys "]), %%xmm0 \n" \
    "aesenc 160(%[" #keys "]), %%xmm0 \n" \
    "aesenc 176(%[" #keys "]), %%xmm0 \n" \
    "aesenc 192(%[" #keys "]), %%xmm0 \n" \
    "aesenc 208(%[" #keys "]), %%xmm0 \n" \
    /* final round 14 */ \
    "aesenclast 224(%[" #keys "]), %%xmm0 \n"
|
2014-05-13 04:51:59 +02:00
|
|
|
|
2014-05-08 21:11:38 +02:00
|
|
|
void ECBEncryptionAESNI::Encrypt (const ChipherBlock * in, ChipherBlock * out)
|
2014-05-07 21:39:30 +02:00
|
|
|
{
|
|
|
|
__asm__
|
|
|
|
(
|
2014-05-09 20:11:05 +02:00
|
|
|
"movups (%[in]), %%xmm0 \n"
|
2014-05-15 17:00:35 +02:00
|
|
|
EncryptAES256(sched)
|
2014-05-09 20:11:05 +02:00
|
|
|
"movups %%xmm0, (%[out]) \n"
|
2014-05-13 04:51:59 +02:00
|
|
|
: : [sched]"r"(m_KeySchedule), [in]"r"(in), [out]"r"(out) : "%xmm0"
|
2014-05-07 21:39:30 +02:00
|
|
|
);
|
2014-05-08 21:11:38 +02:00
|
|
|
}
|
2014-05-07 21:39:30 +02:00
|
|
|
|
2014-05-15 17:00:35 +02:00
|
|
|
// Assembly text that decrypts the block held in xmm0 with AES-256.
// `keys` is the name of the asm operand holding the key schedule pointer;
// round keys are consumed in reverse order, from offset 224 down to 0.
#define DecryptAES256(keys) \
    /* undo the last round key first */ \
    "pxor 224(%[" #keys "]), %%xmm0 \n" \
    /* rounds 13..1 */ \
    "aesdec 208(%[" #keys "]), %%xmm0 \n" \
    "aesdec 192(%[" #keys "]), %%xmm0 \n" \
    "aesdec 176(%[" #keys "]), %%xmm0 \n" \
    "aesdec 160(%[" #keys "]), %%xmm0 \n" \
    "aesdec 144(%[" #keys "]), %%xmm0 \n" \
    "aesdec 128(%[" #keys "]), %%xmm0 \n" \
    "aesdec 112(%[" #keys "]), %%xmm0 \n" \
    "aesdec 96(%[" #keys "]), %%xmm0 \n" \
    "aesdec 80(%[" #keys "]), %%xmm0 \n" \
    "aesdec 64(%[" #keys "]), %%xmm0 \n" \
    "aesdec 48(%[" #keys "]), %%xmm0 \n" \
    "aesdec 32(%[" #keys "]), %%xmm0 \n" \
    "aesdec 16(%[" #keys "]), %%xmm0 \n" \
    /* final step with round key 0 */ \
    "aesdeclast (%[" #keys "]), %%xmm0 \n"
|
2014-05-13 04:51:59 +02:00
|
|
|
|
2014-05-08 21:11:38 +02:00
|
|
|
void ECBDecryptionAESNI::Decrypt (const ChipherBlock * in, ChipherBlock * out)
|
2014-05-07 21:39:30 +02:00
|
|
|
{
|
|
|
|
__asm__
|
|
|
|
(
|
2014-05-09 20:11:05 +02:00
|
|
|
"movups (%[in]), %%xmm0 \n"
|
2014-05-15 17:00:35 +02:00
|
|
|
DecryptAES256(sched)
|
2014-05-09 20:11:05 +02:00
|
|
|
"movups %%xmm0, (%[out]) \n"
|
2014-05-13 04:51:59 +02:00
|
|
|
: : [sched]"r"(m_KeySchedule), [in]"r"(in), [out]"r"(out) : "%xmm0"
|
2014-05-07 21:39:30 +02:00
|
|
|
);
|
|
|
|
}
|
|
|
|
|
2014-05-08 21:11:38 +02:00
|
|
|
// Assembly text that applies aesimc in place to the 16-byte round key at
// byteOffset(%[shed]), going through xmm0. The asm statement using it must
// provide an operand named `shed` (sic) and list xmm0 as clobbered.
#define CallAESIMC(byteOffset) \
    "movaps " #byteOffset "(%[shed]), %%xmm0 \n" \
    "aesimc %%xmm0, %%xmm0 \n" \
    "movaps %%xmm0, " #byteOffset "(%[shed]) \n"
|
2014-05-08 21:11:38 +02:00
|
|
|
|
|
|
|
void ECBDecryptionAESNI::SetKey (const uint8_t * key)
|
|
|
|
{
|
|
|
|
ExpandKey (key); // expand encryption key first
|
|
|
|
// then invert it using aesimc
|
|
|
|
__asm__
|
|
|
|
(
|
|
|
|
CallAESIMC(16)
|
|
|
|
CallAESIMC(32)
|
|
|
|
CallAESIMC(48)
|
|
|
|
CallAESIMC(64)
|
|
|
|
CallAESIMC(80)
|
|
|
|
CallAESIMC(96)
|
|
|
|
CallAESIMC(112)
|
|
|
|
CallAESIMC(128)
|
|
|
|
CallAESIMC(144)
|
|
|
|
CallAESIMC(160)
|
|
|
|
CallAESIMC(176)
|
|
|
|
CallAESIMC(192)
|
|
|
|
CallAESIMC(208)
|
2014-05-09 20:11:05 +02:00
|
|
|
: : [shed]"r"(m_KeySchedule) : "%xmm0"
|
2014-05-08 21:11:38 +02:00
|
|
|
);
|
|
|
|
}
|
|
|
|
|
2014-05-07 20:48:37 +02:00
|
|
|
#endif
|
|
|
|
|
|
|
|
|
2014-05-06 18:22:22 +02:00
|
|
|
void CBCEncryption::Encrypt (int numBlocks, const ChipherBlock * in, ChipherBlock * out)
|
|
|
|
{
|
2014-05-13 04:51:59 +02:00
|
|
|
#ifdef __x86_64__
|
|
|
|
__asm__
|
|
|
|
(
|
|
|
|
"movups (%[iv]), %%xmm1 \n"
|
2014-05-13 19:43:07 +02:00
|
|
|
"block_e: \n"
|
2014-05-13 04:51:59 +02:00
|
|
|
"movups (%[in]), %%xmm0 \n"
|
|
|
|
"pxor %%xmm1, %%xmm0 \n"
|
2014-05-15 17:00:35 +02:00
|
|
|
EncryptAES256(sched)
|
2014-05-13 04:51:59 +02:00
|
|
|
"movaps %%xmm0, %%xmm1 \n"
|
|
|
|
"movups %%xmm0, (%[out]) \n"
|
|
|
|
"add $16, %[in] \n"
|
|
|
|
"add $16, %[out] \n"
|
|
|
|
"dec %[num] \n"
|
2014-05-13 19:43:07 +02:00
|
|
|
"jnz block_e; \n"
|
2014-05-13 04:51:59 +02:00
|
|
|
"movups %%xmm1, (%[iv]) \n"
|
|
|
|
:
|
|
|
|
: [iv]"r"(&m_LastBlock), [sched]"r"(m_ECBEncryption.GetKeySchedule ()),
|
|
|
|
[in]"r"(in), [out]"r"(out), [num]"r"(numBlocks)
|
|
|
|
: "%xmm0", "%xmm1", "cc", "memory"
|
|
|
|
);
|
|
|
|
#else
|
2014-05-06 18:22:22 +02:00
|
|
|
for (int i = 0; i < numBlocks; i++)
|
|
|
|
{
|
2014-05-09 18:05:04 +02:00
|
|
|
m_LastBlock ^= in[i];
|
2014-05-09 03:43:08 +02:00
|
|
|
m_ECBEncryption.Encrypt (&m_LastBlock, &m_LastBlock);
|
2014-05-06 18:22:22 +02:00
|
|
|
out[i] = m_LastBlock;
|
|
|
|
}
|
2014-05-13 04:51:59 +02:00
|
|
|
#endif
|
2014-05-06 18:22:22 +02:00
|
|
|
}
|
|
|
|
|
2014-05-06 19:26:28 +02:00
|
|
|
bool CBCEncryption::Encrypt (const uint8_t * in, std::size_t len, uint8_t * out)
|
|
|
|
{
|
|
|
|
div_t d = div (len, 16);
|
|
|
|
if (d.rem) return false; // len is not multipple of 16
|
|
|
|
Encrypt (d.quot, (const ChipherBlock *)in, (ChipherBlock *)out);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2014-05-14 20:54:01 +02:00
|
|
|
void CBCEncryption::Encrypt (const uint8_t * in, uint8_t * out)
|
|
|
|
{
|
|
|
|
#ifdef __x86_64__
|
|
|
|
__asm__
|
|
|
|
(
|
|
|
|
"movups (%[iv]), %%xmm1 \n"
|
|
|
|
"movups (%[in]), %%xmm0 \n"
|
|
|
|
"pxor %%xmm1, %%xmm0 \n"
|
2014-05-15 17:00:35 +02:00
|
|
|
EncryptAES256(sched)
|
2014-05-14 20:54:01 +02:00
|
|
|
"movups %%xmm0, (%[out]) \n"
|
|
|
|
"movups %%xmm0, (%[iv]) \n"
|
|
|
|
:
|
|
|
|
: [iv]"r"(&m_LastBlock), [sched]"r"(m_ECBEncryption.GetKeySchedule ()),
|
|
|
|
[in]"r"(in), [out]"r"(out)
|
|
|
|
: "%xmm0", "%xmm1", "memory"
|
|
|
|
);
|
|
|
|
#else
|
|
|
|
Encrypt (1, (const ChipherBlock *)in, (ChipherBlock *)out);
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2014-05-06 18:22:22 +02:00
|
|
|
void CBCDecryption::Decrypt (int numBlocks, const ChipherBlock * in, ChipherBlock * out)
|
|
|
|
{
|
2014-05-13 19:43:07 +02:00
|
|
|
#ifdef __x86_64__
|
|
|
|
__asm__
|
|
|
|
(
|
|
|
|
"movups (%[iv]), %%xmm1 \n"
|
|
|
|
"block_d: \n"
|
|
|
|
"movups (%[in]), %%xmm0 \n"
|
|
|
|
"movaps %%xmm0, %%xmm2 \n"
|
2014-05-15 17:00:35 +02:00
|
|
|
DecryptAES256(sched)
|
2014-05-13 19:43:07 +02:00
|
|
|
"pxor %%xmm1, %%xmm0 \n"
|
|
|
|
"movups %%xmm0, (%[out]) \n"
|
|
|
|
"movaps %%xmm2, %%xmm1 \n"
|
|
|
|
"add $16, %[in] \n"
|
|
|
|
"add $16, %[out] \n"
|
|
|
|
"dec %[num] \n"
|
|
|
|
"jnz block_d; \n"
|
|
|
|
"movups %%xmm1, (%[iv]) \n"
|
|
|
|
:
|
|
|
|
: [iv]"r"(&m_IV), [sched]"r"(m_ECBDecryption.GetKeySchedule ()),
|
|
|
|
[in]"r"(in), [out]"r"(out), [num]"r"(numBlocks)
|
|
|
|
: "%xmm0", "%xmm1", "%xmm2", "cc", "memory"
|
|
|
|
);
|
|
|
|
#else
|
2014-05-06 18:22:22 +02:00
|
|
|
for (int i = 0; i < numBlocks; i++)
|
|
|
|
{
|
2014-05-06 19:26:28 +02:00
|
|
|
ChipherBlock tmp = in[i];
|
2014-05-09 03:43:08 +02:00
|
|
|
m_ECBDecryption.Decrypt (in + i, out + i);
|
2014-05-09 18:05:04 +02:00
|
|
|
out[i] ^= m_IV;
|
2014-05-06 19:26:28 +02:00
|
|
|
m_IV = tmp;
|
2014-05-06 18:22:22 +02:00
|
|
|
}
|
2014-05-13 19:43:07 +02:00
|
|
|
#endif
|
2014-05-06 18:22:22 +02:00
|
|
|
}
|
2014-05-06 19:26:28 +02:00
|
|
|
|
|
|
|
bool CBCDecryption::Decrypt (const uint8_t * in, std::size_t len, uint8_t * out)
|
|
|
|
{
|
|
|
|
div_t d = div (len, 16);
|
2014-05-13 19:43:07 +02:00
|
|
|
if (d.rem) return false; // len is not multiple of 16
|
2014-05-06 19:26:28 +02:00
|
|
|
Decrypt (d.quot, (const ChipherBlock *)in, (ChipherBlock *)out);
|
|
|
|
return true;
|
|
|
|
}
|
2014-05-14 20:54:01 +02:00
|
|
|
|
|
|
|
void CBCDecryption::Decrypt (const uint8_t * in, uint8_t * out)
|
|
|
|
{
|
|
|
|
#ifdef __x86_64__
|
|
|
|
__asm__
|
|
|
|
(
|
|
|
|
"movups (%[iv]), %%xmm1 \n"
|
|
|
|
"movups (%[in]), %%xmm0 \n"
|
|
|
|
"movups %%xmm0, (%[iv]) \n"
|
2014-05-15 17:00:35 +02:00
|
|
|
DecryptAES256(sched)
|
2014-05-14 20:54:01 +02:00
|
|
|
"pxor %%xmm1, %%xmm0 \n"
|
|
|
|
"movups %%xmm0, (%[out]) \n"
|
|
|
|
:
|
|
|
|
: [iv]"r"(&m_IV), [sched]"r"(m_ECBDecryption.GetKeySchedule ()),
|
|
|
|
[in]"r"(in), [out]"r"(out)
|
|
|
|
: "%xmm0", "%xmm1", "memory"
|
|
|
|
);
|
|
|
|
#else
|
|
|
|
Decrypt (1, (const ChipherBlock *)in, (ChipherBlock *)out);
|
|
|
|
#endif
|
|
|
|
}
|
2014-05-06 18:22:22 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|