mirror of https://github.com/PurpleI2P/i2pd.git
EinMByte
9 years ago
9 changed files with 394 additions and 369 deletions
@ -0,0 +1,66 @@ |
|||||||
|
#ifndef AESNIMACROS_H__ |
||||||
|
#define AESNIMACROS_H__ |
||||||
|
|
||||||
|
// Inline-asm text for one double step of the AES-256 key schedule.
// Reads xmm1, xmm2 and xmm3; the callers visible in this change issue
// "aeskeygenassist $rcon, %%xmm3, %%xmm2" immediately before each use.
// Derives the next two round keys in xmm1 and xmm3 and stores them with
// movaps at byte offsets round0 and round1 from the asm operand named [sched].
// Overwrites xmm1, xmm2, xmm3 and xmm4, so the enclosing asm statement must
// list them as clobbers.
// round0/round1 are stringified, so pass plain integer literals.
#define KeyExpansion256(round0,round1) \
    "pshufd $0xff, %%xmm2, %%xmm2 \n" \
    "movaps %%xmm1, %%xmm4 \n" \
    "pslldq $4, %%xmm4 \n" \
    "pxor %%xmm4, %%xmm1 \n" \
    "pslldq $4, %%xmm4 \n" \
    "pxor %%xmm4, %%xmm1 \n" \
    "pslldq $4, %%xmm4 \n" \
    "pxor %%xmm4, %%xmm1 \n" \
    "pxor %%xmm2, %%xmm1 \n" \
    "movaps %%xmm1, "#round0"(%[sched]) \n" \
    "aeskeygenassist $0, %%xmm1, %%xmm4 \n" \
    "pshufd $0xaa, %%xmm4, %%xmm2 \n" \
    "movaps %%xmm3, %%xmm4 \n" \
    "pslldq $4, %%xmm4 \n" \
    "pxor %%xmm4, %%xmm3 \n" \
    "pslldq $4, %%xmm4 \n" \
    "pxor %%xmm4, %%xmm3 \n" \
    "pslldq $4, %%xmm4 \n" \
    "pxor %%xmm4, %%xmm3 \n" \
    "pxor %%xmm2, %%xmm3 \n" \
    "movaps %%xmm3, "#round1"(%[sched]) \n"
||||||
|
|
||||||
|
// Inline-asm text that encrypts the 16-byte block held in xmm0 in place.
// `sched` is the NAME of the asm operand (it is stringified, not evaluated)
// whose register holds the base address of the key schedule. The schedule is
// read as 15 round keys of 16 bytes each: offset 0 is XORed in, offsets
// 16..208 feed aesenc and offset 224 feeds aesenclast.
// Only xmm0 is modified.
#define EncryptAES256(sched) \
    "pxor (%["#sched"]), %%xmm0 \n" \
    "aesenc 16(%["#sched"]), %%xmm0 \n" \
    "aesenc 32(%["#sched"]), %%xmm0 \n" \
    "aesenc 48(%["#sched"]), %%xmm0 \n" \
    "aesenc 64(%["#sched"]), %%xmm0 \n" \
    "aesenc 80(%["#sched"]), %%xmm0 \n" \
    "aesenc 96(%["#sched"]), %%xmm0 \n" \
    "aesenc 112(%["#sched"]), %%xmm0 \n" \
    "aesenc 128(%["#sched"]), %%xmm0 \n" \
    "aesenc 144(%["#sched"]), %%xmm0 \n" \
    "aesenc 160(%["#sched"]), %%xmm0 \n" \
    "aesenc 176(%["#sched"]), %%xmm0 \n" \
    "aesenc 192(%["#sched"]), %%xmm0 \n" \
    "aesenc 208(%["#sched"]), %%xmm0 \n" \
    "aesenclast 224(%["#sched"]), %%xmm0 \n"
||||||
|
|
||||||
|
// Inline-asm text that decrypts the 16-byte block held in xmm0 in place.
// `sched` is the NAME of the asm operand (it is stringified, not evaluated)
// whose register holds the base address of the key schedule. The schedule is
// walked backwards: offset 224 is XORed in, offsets 208..16 feed aesdec and
// offset 0 feeds aesdeclast.
// NOTE(review): aesdec expects inverse-mix-column round keys; the SetKey shown
// in this change applies aesimc to offsets 16..208 before this macro is used.
// Only xmm0 is modified.
#define DecryptAES256(sched) \
    "pxor 224(%["#sched"]), %%xmm0 \n" \
    "aesdec 208(%["#sched"]), %%xmm0 \n" \
    "aesdec 192(%["#sched"]), %%xmm0 \n" \
    "aesdec 176(%["#sched"]), %%xmm0 \n" \
    "aesdec 160(%["#sched"]), %%xmm0 \n" \
    "aesdec 144(%["#sched"]), %%xmm0 \n" \
    "aesdec 128(%["#sched"]), %%xmm0 \n" \
    "aesdec 112(%["#sched"]), %%xmm0 \n" \
    "aesdec 96(%["#sched"]), %%xmm0 \n" \
    "aesdec 80(%["#sched"]), %%xmm0 \n" \
    "aesdec 64(%["#sched"]), %%xmm0 \n" \
    "aesdec 48(%["#sched"]), %%xmm0 \n" \
    "aesdec 32(%["#sched"]), %%xmm0 \n" \
    "aesdec 16(%["#sched"]), %%xmm0 \n" \
    "aesdeclast (%["#sched"]), %%xmm0 \n"
||||||
|
|
||||||
|
// Inline-asm text that applies aesimc in place to the 16-byte round key at
// byte offset `offset` of the key schedule: load into xmm0, transform, store
// back. Both accesses use movaps (aligned). Overwrites xmm0.
// The schedule base is taken from the asm operand named [shed] (sic); the
// spelling must match the operand name used by the enclosing asm statement.
// `offset` is stringified, so pass a plain integer literal.
#define CallAESIMC(offset) \
    "movaps "#offset"(%[shed]), %%xmm0 \n" \
    "aesimc %%xmm0, %%xmm0 \n" \
    "movaps %%xmm0, "#offset"(%[shed]) \n"
||||||
|
|
||||||
|
#endif |
@ -1,357 +1,222 @@ |
|||||||
#include <stdlib.h> |
#include <stdlib.h> |
||||||
#include "tunnel/TunnelBase.h" |
|
||||||
#include "aes.h" |
#include "aes.h" |
||||||
|
|
||||||
namespace i2p |
namespace i2p { |
||||||
{ |
namespace crypto { |
||||||
namespace crypto |
|
||||||
{ |
|
||||||
|
|
||||||
#ifdef AESNI |
#ifdef AESNI |
||||||
|
#include "AESNIMacros.h" |
||||||
|
|
||||||
#define KeyExpansion256(round0,round1) \ |
void ECBCryptoAESNI::ExpandKey (const AESKey& key) |
||||||
"pshufd $0xff, %%xmm2, %%xmm2 \n" \ |
{ |
||||||
"movaps %%xmm1, %%xmm4 \n" \ |
__asm__ |
||||||
"pslldq $4, %%xmm4 \n" \ |
( |
||||||
"pxor %%xmm4, %%xmm1 \n" \ |
"movups (%[key]), %%xmm1 \n" |
||||||
"pslldq $4, %%xmm4 \n" \ |
"movups 16(%[key]), %%xmm3 \n" |
||||||
"pxor %%xmm4, %%xmm1 \n" \ |
"movaps %%xmm1, (%[sched]) \n" |
||||||
"pslldq $4, %%xmm4 \n" \ |
"movaps %%xmm3, 16(%[sched]) \n" |
||||||
"pxor %%xmm4, %%xmm1 \n" \ |
"aeskeygenassist $1, %%xmm3, %%xmm2 \n" |
||||||
"pxor %%xmm2, %%xmm1 \n" \ |
KeyExpansion256(32,48) |
||||||
"movaps %%xmm1, "#round0"(%[sched]) \n" \ |
"aeskeygenassist $2, %%xmm3, %%xmm2 \n" |
||||||
"aeskeygenassist $0, %%xmm1, %%xmm4 \n" \ |
KeyExpansion256(64,80) |
||||||
"pshufd $0xaa, %%xmm4, %%xmm2 \n" \ |
"aeskeygenassist $4, %%xmm3, %%xmm2 \n" |
||||||
"movaps %%xmm3, %%xmm4 \n" \ |
KeyExpansion256(96,112) |
||||||
"pslldq $4, %%xmm4 \n" \ |
"aeskeygenassist $8, %%xmm3, %%xmm2 \n" |
||||||
"pxor %%xmm4, %%xmm3 \n" \ |
KeyExpansion256(128,144) |
||||||
"pslldq $4, %%xmm4 \n" \ |
"aeskeygenassist $16, %%xmm3, %%xmm2 \n" |
||||||
"pxor %%xmm4, %%xmm3 \n" \ |
KeyExpansion256(160,176) |
||||||
"pslldq $4, %%xmm4 \n" \ |
"aeskeygenassist $32, %%xmm3, %%xmm2 \n" |
||||||
"pxor %%xmm4, %%xmm3 \n" \ |
KeyExpansion256(192,208) |
||||||
"pxor %%xmm2, %%xmm3 \n" \ |
"aeskeygenassist $64, %%xmm3, %%xmm2 \n" |
||||||
"movaps %%xmm3, "#round1"(%[sched]) \n" |
// key expansion final
|
||||||
|
"pshufd $0xff, %%xmm2, %%xmm2 \n" |
||||||
void ECBCryptoAESNI::ExpandKey (const AESKey& key) |
"movaps %%xmm1, %%xmm4 \n" |
||||||
{ |
"pslldq $4, %%xmm4 \n" |
||||||
__asm__ |
"pxor %%xmm4, %%xmm1 \n" |
||||||
( |
"pslldq $4, %%xmm4 \n" |
||||||
"movups (%[key]), %%xmm1 \n" |
"pxor %%xmm4, %%xmm1 \n" |
||||||
"movups 16(%[key]), %%xmm3 \n" |
"pslldq $4, %%xmm4 \n" |
||||||
"movaps %%xmm1, (%[sched]) \n" |
"pxor %%xmm4, %%xmm1 \n" |
||||||
"movaps %%xmm3, 16(%[sched]) \n" |
"pxor %%xmm2, %%xmm1 \n" |
||||||
"aeskeygenassist $1, %%xmm3, %%xmm2 \n" |
"movups %%xmm1, 224(%[sched]) \n" |
||||||
KeyExpansion256(32,48) |
: // output
|
||||||
"aeskeygenassist $2, %%xmm3, %%xmm2 \n" |
: [key]"r"((const uint8_t *)key), [sched]"r"(GetKeySchedule ()) // input
|
||||||
KeyExpansion256(64,80) |
: "%xmm1", "%xmm2", "%xmm3", "%xmm4", "memory" // clogged
|
||||||
"aeskeygenassist $4, %%xmm3, %%xmm2 \n" |
); |
||||||
KeyExpansion256(96,112) |
} |
||||||
"aeskeygenassist $8, %%xmm3, %%xmm2 \n" |
|
||||||
KeyExpansion256(128,144) |
|
||||||
"aeskeygenassist $16, %%xmm3, %%xmm2 \n" |
|
||||||
KeyExpansion256(160,176) |
|
||||||
"aeskeygenassist $32, %%xmm3, %%xmm2 \n" |
|
||||||
KeyExpansion256(192,208) |
|
||||||
"aeskeygenassist $64, %%xmm3, %%xmm2 \n" |
|
||||||
// key expansion final
|
|
||||||
"pshufd $0xff, %%xmm2, %%xmm2 \n" |
|
||||||
"movaps %%xmm1, %%xmm4 \n" |
|
||||||
"pslldq $4, %%xmm4 \n" |
|
||||||
"pxor %%xmm4, %%xmm1 \n" |
|
||||||
"pslldq $4, %%xmm4 \n" |
|
||||||
"pxor %%xmm4, %%xmm1 \n" |
|
||||||
"pslldq $4, %%xmm4 \n" |
|
||||||
"pxor %%xmm4, %%xmm1 \n" |
|
||||||
"pxor %%xmm2, %%xmm1 \n" |
|
||||||
"movups %%xmm1, 224(%[sched]) \n" |
|
||||||
: // output
|
|
||||||
: [key]"r"((const uint8_t *)key), [sched]"r"(GetKeySchedule ()) // input
|
|
||||||
: "%xmm1", "%xmm2", "%xmm3", "%xmm4", "memory" // clogged
|
|
||||||
); |
|
||||||
} |
|
||||||
|
|
||||||
#define EncryptAES256(sched) \ |
|
||||||
"pxor (%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 16(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 32(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 48(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 64(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 80(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 96(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 112(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 128(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 144(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 160(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 176(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 192(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenc 208(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesenclast 224(%["#sched"]), %%xmm0 \n" |
|
||||||
|
|
||||||
void ECBEncryptionAESNI::Encrypt (const ChipherBlock * in, ChipherBlock * out) |
|
||||||
{ |
|
||||||
__asm__ |
|
||||||
( |
|
||||||
"movups (%[in]), %%xmm0 \n" |
|
||||||
EncryptAES256(sched) |
|
||||||
"movups %%xmm0, (%[out]) \n" |
|
||||||
: : [sched]"r"(GetKeySchedule ()), [in]"r"(in), [out]"r"(out) : "%xmm0", "memory" |
|
||||||
); |
|
||||||
} |
|
||||||
|
|
||||||
#define DecryptAES256(sched) \ |
void ECBEncryptionAESNI::Encrypt (const ChipherBlock * in, ChipherBlock * out) |
||||||
"pxor 224(%["#sched"]), %%xmm0 \n" \ |
{ |
||||||
"aesdec 208(%["#sched"]), %%xmm0 \n" \ |
__asm__ |
||||||
"aesdec 192(%["#sched"]), %%xmm0 \n" \ |
( |
||||||
"aesdec 176(%["#sched"]), %%xmm0 \n" \ |
"movups (%[in]), %%xmm0 \n" |
||||||
"aesdec 160(%["#sched"]), %%xmm0 \n" \ |
EncryptAES256(sched) |
||||||
"aesdec 144(%["#sched"]), %%xmm0 \n" \ |
"movups %%xmm0, (%[out]) \n" |
||||||
"aesdec 128(%["#sched"]), %%xmm0 \n" \ |
: : [sched]"r"(GetKeySchedule ()), [in]"r"(in), [out]"r"(out) : "%xmm0", "memory" |
||||||
"aesdec 112(%["#sched"]), %%xmm0 \n" \ |
); |
||||||
"aesdec 96(%["#sched"]), %%xmm0 \n" \ |
} |
||||||
"aesdec 80(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesdec 64(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesdec 48(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesdec 32(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesdec 16(%["#sched"]), %%xmm0 \n" \ |
|
||||||
"aesdeclast (%["#sched"]), %%xmm0 \n" |
|
||||||
|
|
||||||
void ECBDecryptionAESNI::Decrypt (const ChipherBlock * in, ChipherBlock * out) |
|
||||||
{ |
|
||||||
__asm__ |
|
||||||
( |
|
||||||
"movups (%[in]), %%xmm0 \n" |
|
||||||
DecryptAES256(sched) |
|
||||||
"movups %%xmm0, (%[out]) \n" |
|
||||||
: : [sched]"r"(GetKeySchedule ()), [in]"r"(in), [out]"r"(out) : "%xmm0", "memory" |
|
||||||
); |
|
||||||
} |
|
||||||
|
|
||||||
#define CallAESIMC(offset) \ |
void ECBDecryptionAESNI::Decrypt (const ChipherBlock * in, ChipherBlock * out) |
||||||
"movaps "#offset"(%[shed]), %%xmm0 \n" \ |
{ |
||||||
"aesimc %%xmm0, %%xmm0 \n" \ |
__asm__ |
||||||
"movaps %%xmm0, "#offset"(%[shed]) \n" |
( |
||||||
|
"movups (%[in]), %%xmm0 \n" |
||||||
|
DecryptAES256(sched) |
||||||
|
"movups %%xmm0, (%[out]) \n" |
||||||
|
: : [sched]"r"(GetKeySchedule ()), [in]"r"(in), [out]"r"(out) : "%xmm0", "memory" |
||||||
|
); |
||||||
|
} |
||||||
|
|
||||||
void ECBDecryptionAESNI::SetKey (const AESKey& key) |
void ECBDecryptionAESNI::SetKey (const AESKey& key) |
||||||
{ |
{ |
||||||
ExpandKey (key); // expand encryption key first
|
ExpandKey (key); // expand encryption key first
|
||||||
// then invert it using aesimc
|
// then invert it using aesimc
|
||||||
__asm__ |
__asm__ |
||||||
( |
( |
||||||
CallAESIMC(16) |
CallAESIMC(16) |
||||||
CallAESIMC(32) |
CallAESIMC(32) |
||||||
CallAESIMC(48) |
CallAESIMC(48) |
||||||
CallAESIMC(64) |
CallAESIMC(64) |
||||||
CallAESIMC(80) |
CallAESIMC(80) |
||||||
CallAESIMC(96) |
CallAESIMC(96) |
||||||
CallAESIMC(112) |
CallAESIMC(112) |
||||||
CallAESIMC(128) |
CallAESIMC(128) |
||||||
CallAESIMC(144) |
CallAESIMC(144) |
||||||
CallAESIMC(160) |
CallAESIMC(160) |
||||||
CallAESIMC(176) |
CallAESIMC(176) |
||||||
CallAESIMC(192) |
CallAESIMC(192) |
||||||
CallAESIMC(208) |
CallAESIMC(208) |
||||||
: : [shed]"r"(GetKeySchedule ()) : "%xmm0", "memory" |
: : [shed]"r"(GetKeySchedule ()) : "%xmm0", "memory" |
||||||
); |
); |
||||||
} |
} |
||||||
|
|
||||||
#endif |
#endif |
||||||
|
|
||||||
|
|
||||||
void CBCEncryption::Encrypt (int numBlocks, const ChipherBlock * in, ChipherBlock * out) |
void CBCEncryption::Encrypt (int numBlocks, const ChipherBlock * in, ChipherBlock * out) |
||||||
{ |
{ |
||||||
#ifdef AESNI |
#ifdef AESNI |
||||||
__asm__ |
__asm__ |
||||||
( |
( |
||||||
"movups (%[iv]), %%xmm1 \n" |
"movups (%[iv]), %%xmm1 \n" |
||||||
"1: \n" |
"1: \n" |
||||||
"movups (%[in]), %%xmm0 \n" |
"movups (%[in]), %%xmm0 \n" |
||||||
"pxor %%xmm1, %%xmm0 \n" |
"pxor %%xmm1, %%xmm0 \n" |
||||||
EncryptAES256(sched) |
EncryptAES256(sched) |
||||||
"movaps %%xmm0, %%xmm1 \n" |
"movaps %%xmm0, %%xmm1 \n" |
||||||
"movups %%xmm0, (%[out]) \n" |
"movups %%xmm0, (%[out]) \n" |
||||||
"add $16, %[in] \n" |
"add $16, %[in] \n" |
||||||
"add $16, %[out] \n" |
"add $16, %[out] \n" |
||||||
"dec %[num] \n" |
"dec %[num] \n" |
||||||
"jnz 1b \n" |
"jnz 1b \n" |
||||||
"movups %%xmm1, (%[iv]) \n" |
"movups %%xmm1, (%[iv]) \n" |
||||||
: |
: |
||||||
: [iv]"r"(&m_LastBlock), [sched]"r"(m_ECBEncryption.GetKeySchedule ()), |
: [iv]"r"(&m_LastBlock), [sched]"r"(m_ECBEncryption.GetKeySchedule ()), |
||||||
[in]"r"(in), [out]"r"(out), [num]"r"(numBlocks) |
[in]"r"(in), [out]"r"(out), [num]"r"(numBlocks) |
||||||
: "%xmm0", "%xmm1", "cc", "memory" |
: "%xmm0", "%xmm1", "cc", "memory" |
||||||
); |
); |
||||||
#else |
#else |
||||||
for (int i = 0; i < numBlocks; i++) |
for (int i = 0; i < numBlocks; i++) |
||||||
{ |
|
||||||
m_LastBlock ^= in[i]; |
|
||||||
m_ECBEncryption.Encrypt (&m_LastBlock, &m_LastBlock); |
|
||||||
out[i] = m_LastBlock; |
|
||||||
} |
|
||||||
#endif |
|
||||||
} |
|
||||||
|
|
||||||
void CBCEncryption::Encrypt (const uint8_t * in, std::size_t len, uint8_t * out) |
|
||||||
{ |
{ |
||||||
// len/16
|
m_LastBlock ^= in[i]; |
||||||
int numBlocks = len >> 4; |
m_ECBEncryption.Encrypt (&m_LastBlock, &m_LastBlock); |
||||||
if (numBlocks > 0) |
out[i] = m_LastBlock; |
||||||
Encrypt (numBlocks, (const ChipherBlock *)in, (ChipherBlock *)out); |
|
||||||
} |
} |
||||||
|
#endif |
||||||
|
} |
||||||
|
|
||||||
void CBCEncryption::Encrypt (const uint8_t * in, uint8_t * out) |
void CBCEncryption::Encrypt (const uint8_t * in, std::size_t len, uint8_t * out) |
||||||
{ |
{ |
||||||
|
// len/16
|
||||||
|
int numBlocks = len >> 4; |
||||||
|
if (numBlocks > 0) |
||||||
|
Encrypt (numBlocks, (const ChipherBlock *)in, (ChipherBlock *)out); |
||||||
|
} |
||||||
|
|
||||||
|
void CBCEncryption::Encrypt (const uint8_t * in, uint8_t * out) |
||||||
|
{ |
||||||
#ifdef AESNI |
#ifdef AESNI |
||||||
__asm__ |
__asm__ |
||||||
( |
( |
||||||
"movups (%[iv]), %%xmm1 \n" |
"movups (%[iv]), %%xmm1 \n" |
||||||
"movups (%[in]), %%xmm0 \n" |
"movups (%[in]), %%xmm0 \n" |
||||||
"pxor %%xmm1, %%xmm0 \n" |
"pxor %%xmm1, %%xmm0 \n" |
||||||
EncryptAES256(sched) |
EncryptAES256(sched) |
||||||
"movups %%xmm0, (%[out]) \n" |
"movups %%xmm0, (%[out]) \n" |
||||||
"movups %%xmm0, (%[iv]) \n" |
"movups %%xmm0, (%[iv]) \n" |
||||||
: |
: |
||||||
: [iv]"r"(&m_LastBlock), [sched]"r"(m_ECBEncryption.GetKeySchedule ()), |
: [iv]"r"(&m_LastBlock), [sched]"r"(m_ECBEncryption.GetKeySchedule ()), |
||||||
[in]"r"(in), [out]"r"(out) |
[in]"r"(in), [out]"r"(out) |
||||||
: "%xmm0", "%xmm1", "memory" |
: "%xmm0", "%xmm1", "memory" |
||||||
); |
); |
||||||
#else |
#else |
||||||
Encrypt (1, (const ChipherBlock *)in, (ChipherBlock *)out); |
Encrypt (1, (const ChipherBlock *)in, (ChipherBlock *)out); |
||||||
#endif |
#endif |
||||||
} |
} |
||||||
|
|
||||||
void CBCDecryption::Decrypt (int numBlocks, const ChipherBlock * in, ChipherBlock * out) |
void CBCDecryption::Decrypt (int numBlocks, const ChipherBlock * in, ChipherBlock * out) |
||||||
{ |
{ |
||||||
#ifdef AESNI |
#ifdef AESNI |
||||||
__asm__ |
__asm__ |
||||||
( |
( |
||||||
"movups (%[iv]), %%xmm1 \n" |
"movups (%[iv]), %%xmm1 \n" |
||||||
"1: \n" |
"1: \n" |
||||||
"movups (%[in]), %%xmm0 \n" |
"movups (%[in]), %%xmm0 \n" |
||||||
"movaps %%xmm0, %%xmm2 \n" |
"movaps %%xmm0, %%xmm2 \n" |
||||||
DecryptAES256(sched) |
DecryptAES256(sched) |
||||||
"pxor %%xmm1, %%xmm0 \n" |
"pxor %%xmm1, %%xmm0 \n" |
||||||
"movups %%xmm0, (%[out]) \n" |
"movups %%xmm0, (%[out]) \n" |
||||||
"movaps %%xmm2, %%xmm1 \n" |
"movaps %%xmm2, %%xmm1 \n" |
||||||
"add $16, %[in] \n" |
"add $16, %[in] \n" |
||||||
"add $16, %[out] \n" |
"add $16, %[out] \n" |
||||||
"dec %[num] \n" |
"dec %[num] \n" |
||||||
"jnz 1b \n" |
"jnz 1b \n" |
||||||
"movups %%xmm1, (%[iv]) \n" |
"movups %%xmm1, (%[iv]) \n" |
||||||
: |
: |
||||||
: [iv]"r"(&m_IV), [sched]"r"(m_ECBDecryption.GetKeySchedule ()), |
: [iv]"r"(&m_IV), [sched]"r"(m_ECBDecryption.GetKeySchedule ()), |
||||||
[in]"r"(in), [out]"r"(out), [num]"r"(numBlocks) |
[in]"r"(in), [out]"r"(out), [num]"r"(numBlocks) |
||||||
: "%xmm0", "%xmm1", "%xmm2", "cc", "memory" |
: "%xmm0", "%xmm1", "%xmm2", "cc", "memory" |
||||||
); |
); |
||||||
#else |
#else |
||||||
for (int i = 0; i < numBlocks; i++) |
for (int i = 0; i < numBlocks; i++) |
||||||
{ |
|
||||||
ChipherBlock tmp = in[i]; |
|
||||||
m_ECBDecryption.Decrypt (in + i, out + i); |
|
||||||
out[i] ^= m_IV; |
|
||||||
m_IV = tmp; |
|
||||||
} |
|
||||||
#endif |
|
||||||
} |
|
||||||
|
|
||||||
void CBCDecryption::Decrypt (const uint8_t * in, std::size_t len, uint8_t * out) |
|
||||||
{ |
{ |
||||||
int numBlocks = len >> 4; |
ChipherBlock tmp = in[i]; |
||||||
if (numBlocks > 0) |
m_ECBDecryption.Decrypt (in + i, out + i); |
||||||
Decrypt (numBlocks, (const ChipherBlock *)in, (ChipherBlock *)out); |
out[i] ^= m_IV; |
||||||
|
m_IV = tmp; |
||||||
} |
} |
||||||
|
|
||||||
void CBCDecryption::Decrypt (const uint8_t * in, uint8_t * out) |
|
||||||
{ |
|
||||||
#ifdef AESNI |
|
||||||
__asm__ |
|
||||||
( |
|
||||||
"movups (%[iv]), %%xmm1 \n" |
|
||||||
"movups (%[in]), %%xmm0 \n" |
|
||||||
"movups %%xmm0, (%[iv]) \n" |
|
||||||
DecryptAES256(sched) |
|
||||||
"pxor %%xmm1, %%xmm0 \n" |
|
||||||
"movups %%xmm0, (%[out]) \n" |
|
||||||
: |
|
||||||
: [iv]"r"(&m_IV), [sched]"r"(m_ECBDecryption.GetKeySchedule ()), |
|
||||||
[in]"r"(in), [out]"r"(out) |
|
||||||
: "%xmm0", "%xmm1", "memory" |
|
||||||
); |
|
||||||
#else |
|
||||||
Decrypt (1, (const ChipherBlock *)in, (ChipherBlock *)out); |
|
||||||
#endif |
#endif |
||||||
} |
} |
||||||
|
|
||||||
void TunnelEncryption::Encrypt (const uint8_t * in, uint8_t * out) |
void CBCDecryption::Decrypt (const uint8_t * in, std::size_t len, uint8_t * out) |
||||||
{ |
{ |
||||||
#ifdef AESNI |
int numBlocks = len >> 4; |
||||||
__asm__ |
if (numBlocks > 0) |
||||||
( |
Decrypt (numBlocks, (const ChipherBlock *)in, (ChipherBlock *)out); |
||||||
// encrypt IV
|
} |
||||||
"movups (%[in]), %%xmm0 \n" |
|
||||||
EncryptAES256(sched_iv) |
|
||||||
"movaps %%xmm0, %%xmm1 \n" |
|
||||||
// double IV encryption
|
|
||||||
EncryptAES256(sched_iv) |
|
||||||
"movups %%xmm0, (%[out]) \n" |
|
||||||
// encrypt data, IV is xmm1
|
|
||||||
"1: \n" |
|
||||||
"add $16, %[in] \n" |
|
||||||
"add $16, %[out] \n" |
|
||||||
"movups (%[in]), %%xmm0 \n" |
|
||||||
"pxor %%xmm1, %%xmm0 \n" |
|
||||||
EncryptAES256(sched_l) |
|
||||||
"movaps %%xmm0, %%xmm1 \n" |
|
||||||
"movups %%xmm0, (%[out]) \n" |
|
||||||
"dec %[num] \n" |
|
||||||
"jnz 1b \n" |
|
||||||
: |
|
||||||
: [sched_iv]"r"(m_IVEncryption.GetKeySchedule ()), [sched_l]"r"(m_LayerEncryption.GetKeySchedule ()), |
|
||||||
[in]"r"(in), [out]"r"(out), [num]"r"(63) // 63 blocks = 1008 bytes
|
|
||||||
: "%xmm0", "%xmm1", "cc", "memory" |
|
||||||
); |
|
||||||
#else |
|
||||||
m_IVEncryption.Encrypt ((const ChipherBlock *)in, (ChipherBlock *)out); // iv
|
|
||||||
m_LayerEncryption.SetIV (out); |
|
||||||
m_LayerEncryption.Encrypt (in + 16, i2p::tunnel::TUNNEL_DATA_ENCRYPTED_SIZE, out + 16); // data
|
|
||||||
m_IVEncryption.Encrypt ((ChipherBlock *)out, (ChipherBlock *)out); // double iv
|
|
||||||
#endif |
|
||||||
} |
|
||||||
|
|
||||||
void TunnelDecryption::Decrypt (const uint8_t * in, uint8_t * out) |
void CBCDecryption::Decrypt (const uint8_t * in, uint8_t * out) |
||||||
{ |
{ |
||||||
#ifdef AESNI |
#ifdef AESNI |
||||||
__asm__ |
__asm__ |
||||||
( |
( |
||||||
// decrypt IV
|
"movups (%[iv]), %%xmm1 \n" |
||||||
"movups (%[in]), %%xmm0 \n" |
"movups (%[in]), %%xmm0 \n" |
||||||
DecryptAES256(sched_iv) |
"movups %%xmm0, (%[iv]) \n" |
||||||
"movaps %%xmm0, %%xmm1 \n" |
DecryptAES256(sched) |
||||||
// double IV encryption
|
"pxor %%xmm1, %%xmm0 \n" |
||||||
DecryptAES256(sched_iv) |
"movups %%xmm0, (%[out]) \n" |
||||||
"movups %%xmm0, (%[out]) \n" |
: |
||||||
// decrypt data, IV is xmm1
|
: [iv]"r"(&m_IV), [sched]"r"(m_ECBDecryption.GetKeySchedule ()), |
||||||
"1: \n" |
[in]"r"(in), [out]"r"(out) |
||||||
"add $16, %[in] \n" |
: "%xmm0", "%xmm1", "memory" |
||||||
"add $16, %[out] \n" |
); |
||||||
"movups (%[in]), %%xmm0 \n" |
|
||||||
"movaps %%xmm0, %%xmm2 \n" |
|
||||||
DecryptAES256(sched_l) |
|
||||||
"pxor %%xmm1, %%xmm0 \n" |
|
||||||
"movups %%xmm0, (%[out]) \n" |
|
||||||
"movaps %%xmm2, %%xmm1 \n" |
|
||||||
"dec %[num] \n" |
|
||||||
"jnz 1b \n" |
|
||||||
: |
|
||||||
: [sched_iv]"r"(m_IVDecryption.GetKeySchedule ()), [sched_l]"r"(m_LayerDecryption.GetKeySchedule ()), |
|
||||||
[in]"r"(in), [out]"r"(out), [num]"r"(63) // 63 blocks = 1008 bytes
|
|
||||||
: "%xmm0", "%xmm1", "%xmm2", "cc", "memory" |
|
||||||
); |
|
||||||
#else |
#else |
||||||
m_IVDecryption.Decrypt ((const ChipherBlock *)in, (ChipherBlock *)out); // iv
|
Decrypt (1, (const ChipherBlock *)in, (ChipherBlock *)out); |
||||||
m_LayerDecryption.SetIV (out); |
|
||||||
m_LayerDecryption.Decrypt (in + 16, i2p::tunnel::TUNNEL_DATA_ENCRYPTED_SIZE, out + 16); // data
|
|
||||||
m_IVDecryption.Decrypt ((ChipherBlock *)out, (ChipherBlock *)out); // double iv
|
|
||||||
#endif |
#endif |
||||||
} |
|
||||||
} |
|
||||||
} |
} |
||||||
|
|
||||||
|
} // crypto
|
||||||
|
} // i2p
|
||||||
|
|
||||||
|
@ -0,0 +1,88 @@ |
|||||||
|
#include "TunnelCrypto.h" |
||||||
|
#include "TunnelBase.h" |
||||||
|
#include "AESNIMacros.h" |
||||||
|
|
||||||
|
namespace i2p { |
||||||
|
namespace crypto { |
||||||
|
|
||||||
|
void TunnelEncryption::SetKeys (const AESKey& layerKey, const AESKey& ivKey) |
||||||
|
{ |
||||||
|
m_LayerEncryption.SetKey (layerKey); |
||||||
|
m_IVEncryption.SetKey (ivKey); |
||||||
|
} |
||||||
|
|
||||||
|
void TunnelEncryption::Encrypt (const uint8_t * in, uint8_t * out) |
||||||
|
{ |
||||||
|
#ifdef AESNI |
||||||
|
__asm__ |
||||||
|
( |
||||||
|
// encrypt IV
|
||||||
|
"movups (%[in]), %%xmm0 \n" |
||||||
|
EncryptAES256(sched_iv) |
||||||
|
"movaps %%xmm0, %%xmm1 \n" |
||||||
|
// double IV encryption
|
||||||
|
EncryptAES256(sched_iv) |
||||||
|
"movups %%xmm0, (%[out]) \n" |
||||||
|
// encrypt data, IV is xmm1
|
||||||
|
"1: \n" |
||||||
|
"add $16, %[in] \n" |
||||||
|
"add $16, %[out] \n" |
||||||
|
"movups (%[in]), %%xmm0 \n" |
||||||
|
"pxor %%xmm1, %%xmm0 \n" |
||||||
|
EncryptAES256(sched_l) |
||||||
|
"movaps %%xmm0, %%xmm1 \n" |
||||||
|
"movups %%xmm0, (%[out]) \n" |
||||||
|
"dec %[num] \n" |
||||||
|
"jnz 1b \n" |
||||||
|
: |
||||||
|
: [sched_iv]"r"(m_IVEncryption.GetKeySchedule ()), [sched_l]"r"(m_LayerEncryption.GetKeySchedule ()), |
||||||
|
[in]"r"(in), [out]"r"(out), [num]"r"(63) // 63 blocks = 1008 bytes
|
||||||
|
: "%xmm0", "%xmm1", "cc", "memory" |
||||||
|
); |
||||||
|
#else |
||||||
|
m_IVEncryption.Encrypt ((const ChipherBlock *)in, (ChipherBlock *)out); // iv
|
||||||
|
m_LayerEncryption.SetIV (out); |
||||||
|
m_LayerEncryption.Encrypt (in + 16, i2p::tunnel::TUNNEL_DATA_ENCRYPTED_SIZE, out + 16); // data
|
||||||
|
m_IVEncryption.Encrypt ((ChipherBlock *)out, (ChipherBlock *)out); // double iv
|
||||||
|
#endif |
||||||
|
} |
||||||
|
|
||||||
|
void TunnelDecryption::Decrypt (const uint8_t * in, uint8_t * out) |
||||||
|
{ |
||||||
|
#ifdef AESNI |
||||||
|
__asm__ |
||||||
|
( |
||||||
|
// decrypt IV
|
||||||
|
"movups (%[in]), %%xmm0 \n" |
||||||
|
DecryptAES256(sched_iv) |
||||||
|
"movaps %%xmm0, %%xmm1 \n" |
||||||
|
// double IV encryption
|
||||||
|
DecryptAES256(sched_iv) |
||||||
|
"movups %%xmm0, (%[out]) \n" |
||||||
|
// decrypt data, IV is xmm1
|
||||||
|
"1: \n" |
||||||
|
"add $16, %[in] \n" |
||||||
|
"add $16, %[out] \n" |
||||||
|
"movups (%[in]), %%xmm0 \n" |
||||||
|
"movaps %%xmm0, %%xmm2 \n" |
||||||
|
DecryptAES256(sched_l) |
||||||
|
"pxor %%xmm1, %%xmm0 \n" |
||||||
|
"movups %%xmm0, (%[out]) \n" |
||||||
|
"movaps %%xmm2, %%xmm1 \n" |
||||||
|
"dec %[num] \n" |
||||||
|
"jnz 1b \n" |
||||||
|
: |
||||||
|
: [sched_iv]"r"(m_IVDecryption.GetKeySchedule ()), [sched_l]"r"(m_LayerDecryption.GetKeySchedule ()), |
||||||
|
[in]"r"(in), [out]"r"(out), [num]"r"(63) // 63 blocks = 1008 bytes
|
||||||
|
: "%xmm0", "%xmm1", "%xmm2", "cc", "memory" |
||||||
|
); |
||||||
|
#else |
||||||
|
m_IVDecryption.Decrypt ((const ChipherBlock *)in, (ChipherBlock *)out); // iv
|
||||||
|
m_LayerDecryption.SetIV (out); |
||||||
|
m_LayerDecryption.Decrypt (in + 16, i2p::tunnel::TUNNEL_DATA_ENCRYPTED_SIZE, out + 16); // data
|
||||||
|
m_IVDecryption.Decrypt ((ChipherBlock *)out, (ChipherBlock *)out); // double iv
|
||||||
|
#endif |
||||||
|
} |
||||||
|
|
||||||
|
} // crypto
|
||||||
|
} // i2p
|
@ -0,0 +1,49 @@ |
|||||||
|
#ifndef TUNNEL_CRYPTO_H__ |
||||||
|
#define TUNNEL_CRYPTO_H__ |
||||||
|
|
||||||
|
#include "crypto/aes.h" |
||||||
|
|
||||||
|
namespace i2p { |
||||||
|
namespace crypto { |
||||||
|
|
||||||
|
class TunnelEncryption { // with double IV encryption
|
||||||
|
public: |
||||||
|
void SetKeys (const AESKey& layerKey, const AESKey& ivKey); |
||||||
|
|
||||||
|
void Encrypt (const uint8_t * in, uint8_t * out); // 1024 bytes (16 IV + 1008 data)
|
||||||
|
|
||||||
|
private: |
||||||
|
|
||||||
|
ECBEncryption m_IVEncryption; |
||||||
|
#ifdef AESNI |
||||||
|
ECBEncryption m_LayerEncryption; |
||||||
|
#else |
||||||
|
CBCEncryption m_LayerEncryption; |
||||||
|
#endif |
||||||
|
}; |
||||||
|
|
||||||
|
class TunnelDecryption { // with double IV encryption
|
||||||
|
public: |
||||||
|
|
||||||
|
void SetKeys (const AESKey& layerKey, const AESKey& ivKey) |
||||||
|
{ |
||||||
|
m_LayerDecryption.SetKey (layerKey); |
||||||
|
m_IVDecryption.SetKey (ivKey); |
||||||
|
} |
||||||
|
|
||||||
|
void Decrypt (const uint8_t * in, uint8_t * out); // 1024 bytes (16 IV + 1008 data)
|
||||||
|
|
||||||
|
private: |
||||||
|
|
||||||
|
ECBDecryption m_IVDecryption; |
||||||
|
#ifdef AESNI |
||||||
|
ECBDecryption m_LayerDecryption; |
||||||
|
#else |
||||||
|
CBCDecryption m_LayerDecryption; |
||||||
|
#endif |
||||||
|
}; |
||||||
|
|
||||||
|
} // crypto
|
||||||
|
} // i2p
|
||||||
|
|
||||||
|
#endif |
Loading…
Reference in new issue