avr-crypto-lib/serpent.c

231 lines
4.9 KiB
C

/* serpent.c
* a bitsliced implementation of the serpent cipher for avr microcontrollers
* author: Daniel Otte
* email: daniel.otte@rub.de
* license: GPLv3
*/
#include <stdint.h>
#include <string.h> /* memset() */
#include <avr/pgmspace.h>
#include "serpent.h"
uint8_t sbox[] PROGMEM = {
0x38, 0xF1, 0xA6, 0x5B, 0xED, 0x42, 0x70, 0x9C,
0xFC, 0x27, 0x90, 0x5A, 0x1B, 0xE8, 0x6D, 0x34,
0x86, 0x79, 0x3C, 0xAF, 0xD1, 0xE4, 0x0B, 0x52,
0x0F, 0xB8, 0xC9, 0x63, 0xD1, 0x24, 0xA7, 0x5E,
0x1F, 0x83, 0xC0, 0xB6, 0x25, 0x4A, 0x9E, 0x7D,
0xF5, 0x2B, 0x4A, 0x9C, 0x03, 0xE8, 0xD6, 0x71,
0x72, 0xC5, 0x84, 0x6B, 0xE9, 0x1F, 0xD3, 0xA0,
0x1D, 0xF0, 0xE8, 0x2B, 0x74, 0xCA, 0x93, 0x56,
/* now the inverted sboxes */
0xD3, 0xB0, 0xA6, 0x5C, 0x1E, 0x47, 0xF9, 0x82,
0x58, 0x2E, 0xF6, 0xC3, 0xB4, 0x79, 0x1D, 0xA0,
0xC9, 0xF4, 0xBE, 0x12, 0x03, 0x6D, 0x58, 0xA7,
0x09, 0xA7, 0xBE, 0x6D, 0x35, 0xC2, 0x48, 0xF1,
0x50, 0x83, 0xA9, 0x7E, 0x2C, 0xB6, 0x4F, 0xD1,
0x8F, 0x29, 0x41, 0xDE, 0xB6, 0x53, 0x7C, 0xA0,
0xFA, 0x1D, 0x53, 0x60, 0x49, 0xE7, 0x2C, 0x8B,
0x30, 0x6D, 0x9E, 0xF8, 0x5C, 0xB7, 0xA1, 0x42
};
#define SHR_O(a) c=(a)&1; ((a) = (a)>>1)
#define SHR_I(a) ((a) = (c?0x80:0x00)| ((a)>>1))
static void ip(uint8_t *o, uint32_t *i){
uint8_t c; // carry
uint8_t n,m;
memset(o, 0, 16);
for(n=0; n<16; ++n){
for(m=0; m<2; ++m){
SHR_O(i[0]);
SHR_I(o[n]);
SHR_O(i[1]);
SHR_I(o[n]);
SHR_O(i[2]);
SHR_I(o[n]);
SHR_O(i[3]);
SHR_I(o[n]);
}
}
}
#undef SHR_I
#define SHR_I(a) ((a) = (c?0x80000000L:0x00L)| ((a)>>1)) /* we use 32-bit words here */
static void fp(uint32_t *o, uint32_t *i){
uint8_t c; // carry
uint8_t n,m;
memset(o, 0, 16);
for(n=0; n<4; ++n){
for(m=0; m<8; ++m){
SHR_O(i[n]);
SHR_I(o[0]);
SHR_O(i[n]);
SHR_I(o[1]);
SHR_O(i[n]);
SHR_I(o[2]);
SHR_O(i[n]);
SHR_I(o[3]);
}
}
}
/******************************************************************************/
static void sbox128x(uint8_t box, void* w){
uint8_t sb[16];
uint8_t i,t,x;
box &= 0x0f;
/* load sbox */
for(i=0; i<8; ++i){
t = pgm_read_byte(sbox + box*8 + i);
sb[2*i+0]=t>>4;
sb[2*i+1]=t&0xf;
}
uint8_t o[16];
ip(o, w);
for(i=0; i<16; ++i){
t = ((uint8_t*)o)[i];
x = sb[t>>4];
x <<= 4;
x |= sb[t&0xf];
((uint8_t*)o)[i] = x;
}
fp(w, (uint32_t*)o);
}
static void sbox128(void * w, uint8_t box){
sbox128x(box&0x7, w);
}
static void inv_sbox128(void * w, uint8_t box){
sbox128x(((box&0x7)|0x8), w);
}
/******************************************************************************/
void memxor(void * dest, void * src, uint8_t size){
while(size--){
*((uint8_t*)dest) ^= *((uint8_t*)src);
dest = (uint8_t*)dest +1;
src = (uint8_t*)src +1;
}
}
/******************************************************************************/
uint32_t rotl32(uint32_t a, uint8_t n){
return ((a<<n) | (a>>(32-n)));
}
uint32_t rotr32(uint32_t a, uint8_t n){
return ((a>>n) | (a<<(32-n)));
}
#define X0 (((uint32_t*)b)[0])
#define X1 (((uint32_t*)b)[1])
#define X2 (((uint32_t*)b)[2])
#define X3 (((uint32_t*)b)[3])
static void lt(uint8_t *b){
X0 = rotl32(X0, 13);
X2 = rotl32(X2, 3);
X1 ^= X0 ^ X2;
X3 ^= X2 ^ (X0 << 3);
X1 = rotl32(X1, 1);
X3 = rotl32(X3, 7);
X0 ^= X1 ^ X3;
X2 ^= X3 ^ (X1 << 7);
X0 = rotl32(X0, 5);
X2 = rotr32(X2, 10);
}
static void inv_lt(uint8_t *b){
X2 = rotl32(X2, 10);
X0 = rotr32(X0, 5);
X2 ^= X3 ^ (X1 << 7);
X0 ^= X1 ^ X3;
X3 = rotr32(X3, 7);
X1 = rotr32(X1, 1);
X3 ^= X2 ^ (X0 << 3);
X1 ^= X0 ^ X2;
X2 = rotr32(X2, 3);
X0 = rotr32(X0, 13);
}
#define GOLDEN_RATIO 0x9e3779b9l
static uint32_t gen_w(uint32_t * b, uint8_t i){
uint32_t ret;
ret = b[0] ^ b[3] ^ b[5] ^ b[7] ^ GOLDEN_RATIO ^ (uint32_t)i;
ret = rotl32(ret, 11);
return ret;
}
/* key must be 256bit (32 byte) large! */
void serpent_genctx(void * key, uint8_t keysize, serpent_ctx_t * ctx){
uint32_t buffer[8];
uint8_t i,j;
if(keysize){
/* keysize is less than 256 bit, padding needed */
memset(buffer, 0, 32);
memcpy(buffer, key, (keysize+7)/8);
((uint8_t*)buffer)[keysize/8] |= 1<<(keysize%8);
} else {
/* keysize is 256 bit */
memcpy(buffer, key, 32);
}
for(i=0; i<33; ++i){
for(j=0; j<4; ++j){
ctx->k[i][j] = gen_w(buffer, i*4+j);
memmove(buffer, &(buffer[1]), 7*4); /* shift buffer one to the "left" */
buffer[7] = ctx->k[i][j];
}
}
for(i=0; i<33; ++i){
sbox128(ctx->k[i],3-i);
}
}
void serpent_enc(void* buffer, serpent_ctx_t * ctx){
uint8_t i;
for(i=0; i<31; ++i){
memxor((uint8_t*)buffer, ctx->k[i], 16);
sbox128(buffer, i);
lt((uint8_t*)buffer);
}
memxor((uint8_t*)buffer, ctx->k[i], 16);
sbox128(buffer, i);
++i;
memxor((uint8_t*)buffer, ctx->k[i], 16);
}
void serpent_dec(void* buffer, serpent_ctx_t * ctx){
int8_t i=32;
memxor((uint8_t*)buffer, ctx->k[i], 16);
--i;
inv_sbox128(buffer, i);
memxor((uint8_t*)buffer, ctx->k[i], 16);
--i;
for(; i>=0; --i){
inv_lt((uint8_t*)buffer);
inv_sbox128(buffer, i);
memxor((uint8_t*)buffer, ctx->k[i], 16);
}
}