/**
* The Whirlpool hashing function.
*
*
* References
*
*
* The Whirlpool algorithm was developed by
* Paulo S. L. M. Barreto and
* Vincent Rijmen.
*
* See
* P.S.L.M. Barreto, V. Rijmen,
* ``The Whirlpool hashing function,''
* NESSIE submission, 2000.
*
* @author Paulo S.L.M. Barreto
* @author Vincent Rijmen.
*
* @version 2.0 (2000.05.19)
*
* Differences from version 1.0:
*
* - Original S-box replaced by the tweaked, hardware-efficient version.
*
* =============================================================================
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHORS ''AS IS'' AND ANY EXPRESS
* OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
* WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
* WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
* OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
* EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
*/
#include
#include
#include
#include
#include "nessie.h"
/*
* The number of rounds of the internal dedicated block cipher.
*/
#define R 10
/*
* Though Whirlpool is endianness-neutral, the encryption tables are listed
* in BIG-ENDIAN format, which is adopted throughout this implementation
* (but little-endian notation would be equally suitable if consistently
* employed).
*/
#include "64bit_tables.h"
/**
* The core Whirlpool transform.
*/
static void processBuffer(struct NESSIEstruct * const structpointer) {
int i, r;
u64 K[8]; /* the round key */
u64 block[8]; /* mu(buffer) */
u64 state[8]; /* the cipher state */
u64 L[8];
u8 *buffer = structpointer->buffer;
/*
* map the buffer to a block:
*/
for (i = 0; i < 8; i++, buffer += 8) {
block[i] =
(((u64)buffer[0] ) << 56) ^
(((u64)buffer[1] & 0xffL) << 48) ^
(((u64)buffer[2] & 0xffL) << 40) ^
(((u64)buffer[3] & 0xffL) << 32) ^
(((u64)buffer[4] & 0xffL) << 24) ^
(((u64)buffer[5] & 0xffL) << 16) ^
(((u64)buffer[6] & 0xffL) << 8) ^
(((u64)buffer[7] & 0xffL) );
}
/*
* compute and apply K^0 to the cipher state:
*/
state[0] = block[0] ^ (K[0] = structpointer->hash[0]);
state[1] = block[1] ^ (K[1] = structpointer->hash[1]);
state[2] = block[2] ^ (K[2] = structpointer->hash[2]);
state[3] = block[3] ^ (K[3] = structpointer->hash[3]);
state[4] = block[4] ^ (K[4] = structpointer->hash[4]);
state[5] = block[5] ^ (K[5] = structpointer->hash[5]);
state[6] = block[6] ^ (K[6] = structpointer->hash[6]);
state[7] = block[7] ^ (K[7] = structpointer->hash[7]);
/*
* iterate over all rounds:
*/
for (r = 1; r <= R; r++) {
/*
* compute K^r from K^{r-1}:
*/
L[0] =
C0[(int)(K[0] >> 56) ] ^
C1[(int)(K[7] >> 48) & 0xff] ^
C2[(int)(K[6] >> 40) & 0xff] ^
C3[(int)(K[5] >> 32) & 0xff] ^
C4[(int)(K[4] >> 24) & 0xff] ^
C5[(int)(K[3] >> 16) & 0xff] ^
C6[(int)(K[2] >> 8) & 0xff] ^
C7[(int)(K[1] ) & 0xff] ^
rc[r];
L[1] =
C0[(int)(K[1] >> 56) ] ^
C1[(int)(K[0] >> 48) & 0xff] ^
C2[(int)(K[7] >> 40) & 0xff] ^
C3[(int)(K[6] >> 32) & 0xff] ^
C4[(int)(K[5] >> 24) & 0xff] ^
C5[(int)(K[4] >> 16) & 0xff] ^
C6[(int)(K[3] >> 8) & 0xff] ^
C7[(int)(K[2] ) & 0xff];
L[2] =
C0[(int)(K[2] >> 56) ] ^
C1[(int)(K[1] >> 48) & 0xff] ^
C2[(int)(K[0] >> 40) & 0xff] ^
C3[(int)(K[7] >> 32) & 0xff] ^
C4[(int)(K[6] >> 24) & 0xff] ^
C5[(int)(K[5] >> 16) & 0xff] ^
C6[(int)(K[4] >> 8) & 0xff] ^
C7[(int)(K[3] ) & 0xff];
L[3] =
C0[(int)(K[3] >> 56) ] ^
C1[(int)(K[2] >> 48) & 0xff] ^
C2[(int)(K[1] >> 40) & 0xff] ^
C3[(int)(K[0] >> 32) & 0xff] ^
C4[(int)(K[7] >> 24) & 0xff] ^
C5[(int)(K[6] >> 16) & 0xff] ^
C6[(int)(K[5] >> 8) & 0xff] ^
C7[(int)(K[4] ) & 0xff];
L[4] =
C0[(int)(K[4] >> 56) ] ^
C1[(int)(K[3] >> 48) & 0xff] ^
C2[(int)(K[2] >> 40) & 0xff] ^
C3[(int)(K[1] >> 32) & 0xff] ^
C4[(int)(K[0] >> 24) & 0xff] ^
C5[(int)(K[7] >> 16) & 0xff] ^
C6[(int)(K[6] >> 8) & 0xff] ^
C7[(int)(K[5] ) & 0xff];
L[5] =
C0[(int)(K[5] >> 56) ] ^
C1[(int)(K[4] >> 48) & 0xff] ^
C2[(int)(K[3] >> 40) & 0xff] ^
C3[(int)(K[2] >> 32) & 0xff] ^
C4[(int)(K[1] >> 24) & 0xff] ^
C5[(int)(K[0] >> 16) & 0xff] ^
C6[(int)(K[7] >> 8) & 0xff] ^
C7[(int)(K[6] ) & 0xff];
L[6] =
C0[(int)(K[6] >> 56) ] ^
C1[(int)(K[5] >> 48) & 0xff] ^
C2[(int)(K[4] >> 40) & 0xff] ^
C3[(int)(K[3] >> 32) & 0xff] ^
C4[(int)(K[2] >> 24) & 0xff] ^
C5[(int)(K[1] >> 16) & 0xff] ^
C6[(int)(K[0] >> 8) & 0xff] ^
C7[(int)(K[7] ) & 0xff];
L[7] =
C0[(int)(K[7] >> 56) ] ^
C1[(int)(K[6] >> 48) & 0xff] ^
C2[(int)(K[5] >> 40) & 0xff] ^
C3[(int)(K[4] >> 32) & 0xff] ^
C4[(int)(K[3] >> 24) & 0xff] ^
C5[(int)(K[2] >> 16) & 0xff] ^
C6[(int)(K[1] >> 8) & 0xff] ^
C7[(int)(K[0] ) & 0xff];
K[0] = L[0];
K[1] = L[1];
K[2] = L[2];
K[3] = L[3];
K[4] = L[4];
K[5] = L[5];
K[6] = L[6];
K[7] = L[7];
/*
* apply the r-th round transformation:
*/
L[0] =
C0[(int)(state[0] >> 56) ] ^
C1[(int)(state[7] >> 48) & 0xff] ^
C2[(int)(state[6] >> 40) & 0xff] ^
C3[(int)(state[5] >> 32) & 0xff] ^
C4[(int)(state[4] >> 24) & 0xff] ^
C5[(int)(state[3] >> 16) & 0xff] ^
C6[(int)(state[2] >> 8) & 0xff] ^
C7[(int)(state[1] ) & 0xff] ^
K[0];
L[1] =
C0[(int)(state[1] >> 56) ] ^
C1[(int)(state[0] >> 48) & 0xff] ^
C2[(int)(state[7] >> 40) & 0xff] ^
C3[(int)(state[6] >> 32) & 0xff] ^
C4[(int)(state[5] >> 24) & 0xff] ^
C5[(int)(state[4] >> 16) & 0xff] ^
C6[(int)(state[3] >> 8) & 0xff] ^
C7[(int)(state[2] ) & 0xff] ^
K[1];
L[2] =
C0[(int)(state[2] >> 56) ] ^
C1[(int)(state[1] >> 48) & 0xff] ^
C2[(int)(state[0] >> 40) & 0xff] ^
C3[(int)(state[7] >> 32) & 0xff] ^
C4[(int)(state[6] >> 24) & 0xff] ^
C5[(int)(state[5] >> 16) & 0xff] ^
C6[(int)(state[4] >> 8) & 0xff] ^
C7[(int)(state[3] ) & 0xff] ^
K[2];
L[3] =
C0[(int)(state[3] >> 56) ] ^
C1[(int)(state[2] >> 48) & 0xff] ^
C2[(int)(state[1] >> 40) & 0xff] ^
C3[(int)(state[0] >> 32) & 0xff] ^
C4[(int)(state[7] >> 24) & 0xff] ^
C5[(int)(state[6] >> 16) & 0xff] ^
C6[(int)(state[5] >> 8) & 0xff] ^
C7[(int)(state[4] ) & 0xff] ^
K[3];
L[4] =
C0[(int)(state[4] >> 56) ] ^
C1[(int)(state[3] >> 48) & 0xff] ^
C2[(int)(state[2] >> 40) & 0xff] ^
C3[(int)(state[1] >> 32) & 0xff] ^
C4[(int)(state[0] >> 24) & 0xff] ^
C5[(int)(state[7] >> 16) & 0xff] ^
C6[(int)(state[6] >> 8) & 0xff] ^
C7[(int)(state[5] ) & 0xff] ^
K[4];
L[5] =
C0[(int)(state[5] >> 56) ] ^
C1[(int)(state[4] >> 48) & 0xff] ^
C2[(int)(state[3] >> 40) & 0xff] ^
C3[(int)(state[2] >> 32) & 0xff] ^
C4[(int)(state[1] >> 24) & 0xff] ^
C5[(int)(state[0] >> 16) & 0xff] ^
C6[(int)(state[7] >> 8) & 0xff] ^
C7[(int)(state[6] ) & 0xff] ^
K[5];
L[6] =
C0[(int)(state[6] >> 56) ] ^
C1[(int)(state[5] >> 48) & 0xff] ^
C2[(int)(state[4] >> 40) & 0xff] ^
C3[(int)(state[3] >> 32) & 0xff] ^
C4[(int)(state[2] >> 24) & 0xff] ^
C5[(int)(state[1] >> 16) & 0xff] ^
C6[(int)(state[0] >> 8) & 0xff] ^
C7[(int)(state[7] ) & 0xff] ^
K[6];
L[7] =
C0[(int)(state[7] >> 56) ] ^
C1[(int)(state[6] >> 48) & 0xff] ^
C2[(int)(state[5] >> 40) & 0xff] ^
C3[(int)(state[4] >> 32) & 0xff] ^
C4[(int)(state[3] >> 24) & 0xff] ^
C5[(int)(state[2] >> 16) & 0xff] ^
C6[(int)(state[1] >> 8) & 0xff] ^
C7[(int)(state[0] ) & 0xff] ^
K[7];
state[0] = L[0];
state[1] = L[1];
state[2] = L[2];
state[3] = L[3];
state[4] = L[4];
state[5] = L[5];
state[6] = L[6];
state[7] = L[7];
}
/*
* apply the Miyaguchi-Preneel compression function:
*/
structpointer->hash[0] ^= state[0] ^ block[0];
structpointer->hash[1] ^= state[1] ^ block[1];
structpointer->hash[2] ^= state[2] ^ block[2];
structpointer->hash[3] ^= state[3] ^ block[3];
structpointer->hash[4] ^= state[4] ^ block[4];
structpointer->hash[5] ^= state[5] ^ block[5];
structpointer->hash[6] ^= state[6] ^ block[6];
structpointer->hash[7] ^= state[7] ^ block[7];
}
/**
* Initialize the hashing state.
*/
void NESSIEinit(struct NESSIEstruct * const structpointer) {
int i;
memset(structpointer->bitLength, 0, 32);
structpointer->bufferBits = structpointer->bufferPos = 0;
structpointer->buffer[0] = 0; /* it's only necessary to cleanup buffer[bufferPos] */
for (i = 0; i < 8; i++) {
structpointer->hash[i] = 0L; /* initial value */
}
}
/**
* Delivers input data to the hashing algorithm.
*
* @param source plaintext data to hash.
* @param sourceBits how many bits of plaintext to process.
*
* This method maintains the invariant: bufferBits < 512
*/
void NESSIEadd(const unsigned char * const source,
unsigned long sourceBits,
struct NESSIEstruct * const structpointer) {
/*
sourcePos
|
+-------+-------+-------
||||||||||||||||||||| source
+-------+-------+-------
+-------+-------+-------+-------+-------+-------
|||||||||||||||||||||| buffer
+-------+-------+-------+-------+-------+-------
|
bufferPos
*/
int sourcePos = 0; /* index of leftmost source u8 containing data (1 to 8 bits). */
int sourceGap = (8 - ((int)sourceBits & 7)) & 7; /* space on source[sourcePos]. */
int bufferRem = structpointer->bufferBits & 7; /* occupied bits on buffer[bufferPos]. */
int i;
u32 b, carry;
u8 *buffer = structpointer->buffer;
u8 *bitLength = structpointer->bitLength;
int bufferBits = structpointer->bufferBits;
int bufferPos = structpointer->bufferPos;
/*
* tally the length of the added data:
*/
u64 value = sourceBits;
for (i = 31, carry = 0; i >= 0 && value != 0LL; i--) {
carry += bitLength[i] + ((u32)value & 0xff);
bitLength[i] = (u8)carry;
carry >>= 8;
value >>= 8;
}
/*
* process data in chunks of 8 bits (a more efficient approach would be to take whole-word chunks):
*/
while (sourceBits > 8) {
/* N.B. at least source[sourcePos] and source[sourcePos+1] contain data. */
/*
* take a byte from the source:
*/
b = ((source[sourcePos] << sourceGap) & 0xff) |
((source[sourcePos + 1] & 0xff) >> (8 - sourceGap));
/*
* process this byte:
*/
buffer[bufferPos++] |= (u8)(b >> bufferRem);
bufferBits += 8 - bufferRem; /* bufferBits = 8*bufferPos; */
if (bufferBits == 512) {
/*
* process data block:
*/
processBuffer(structpointer);
/*
* reset buffer:
*/
bufferBits = bufferPos = 0;
}
buffer[bufferPos] = b << (8 - bufferRem);
bufferBits += bufferRem;
/*
* proceed to remaining data:
*/
sourceBits -= 8;
sourcePos++;
}
/* now 0 < sourceBits <= 8; furthermore, all data is in source[sourcePos]. */
b = (source[sourcePos] << sourceGap) & 0xff; /* bits are left-justified on b. */
/*
* process the remaining bits:
*/
buffer[bufferPos] |= b >> bufferRem;
if (bufferRem + sourceBits < 8) {
/*
* all remaining data fits on buffer[bufferPos],
* and there still remains some space.
*/
bufferBits += sourceBits;
} else {
/*
* buffer[bufferPos] is full:
*/
bufferPos++;
bufferBits += 8 - bufferRem; /* bufferBits = 8*bufferPos; */
sourceBits -= 8 - bufferRem;
/* now 0 <= sourceBits < 8; furthermore, all data is in source[sourcePos]. */
if (bufferBits == 512) {
/*
* process data block:
*/
processBuffer(structpointer);
/*
* reset buffer:
*/
bufferBits = bufferPos = 0;
}
buffer[bufferPos] = b << (8 - bufferRem);
bufferBits += (int)sourceBits;
}
structpointer->bufferBits = bufferBits;
structpointer->bufferPos = bufferPos;
}
/**
* Get the hash value from the hashing state.
*
* This method uses the invariant: bufferBits < 512
*/
void NESSIEfinalize(struct NESSIEstruct * const structpointer,
unsigned char * const result) {
int i;
u8 *buffer = structpointer->buffer;
u8 *bitLength = structpointer->bitLength;
int bufferBits = structpointer->bufferBits;
int bufferPos = structpointer->bufferPos;
u8 *digest = result;
/*
* append a '1'-bit:
*/
buffer[bufferPos] |= 0x80U >> (bufferBits & 7);
bufferPos++; /* all remaining bits on the current u8 are set to zero. */
/*
* pad with zero bits to complete 512N + 256 bits:
*/
if (bufferPos > 32) {
if (bufferPos < 64) {
memset(&buffer[bufferPos], 0, 64 - bufferPos);
}
/*
* process data block:
*/
processBuffer(structpointer);
/*
* reset buffer:
*/
bufferPos = 0;
}
if (bufferPos < 32) {
memset(&buffer[bufferPos], 0, 32 - bufferPos);
}
bufferPos = 32;
/*
* append bit length of hashed data:
*/
memcpy(&buffer[32], bitLength, 32);
/*
* process data block:
*/
processBuffer(structpointer);
/*
* return the completed message digest:
*/
for (i = 0; i < 8; i++) {
digest[0] = (u8)(structpointer->hash[i] >> 56);
digest[1] = (u8)(structpointer->hash[i] >> 48);
digest[2] = (u8)(structpointer->hash[i] >> 40);
digest[3] = (u8)(structpointer->hash[i] >> 32);
digest[4] = (u8)(structpointer->hash[i] >> 24);
digest[5] = (u8)(structpointer->hash[i] >> 16);
digest[6] = (u8)(structpointer->hash[i] >> 8);
digest[7] = (u8)(structpointer->hash[i] );
digest += 8;
}
structpointer->bufferBits = bufferBits;
structpointer->bufferPos = bufferPos;
}
static void display(const u8 array[], int length) {
int i;
for (i = 0; i < length; i++) {
printf("%02X", array[i]);
}
}
#define LONG_ITERATION 100000000
/**
* Generate the test vector set for Whirlpool.
*
* The test consists of:
* 1. hashing all bit strings containing only zero bits
* for all lengths from 0 to 1023;
* 2. hashing all 512-bit strings containing a single set bit;
* 3. the iterated hashing of the 512-bit string of zero bits a large number of times.
*/
void makeTestVectors() {
int i;
struct NESSIEstruct w;
u8 digest[DIGESTBYTES];
u8 data[128];
memset(data, 0, sizeof(data));
printf("Message digests of strings of 0-bits and length L:\n");
for (i = 0; i < 1024; i++) {
NESSIEinit(&w);
NESSIEadd(data, i, &w);
NESSIEfinalize(&w, digest);
printf(" L = %4d: ", i); display(digest, DIGESTBYTES); printf("\n");
}
printf("Message digests of all 512-bit strings S containing a single 1-bit:\n");
memset(data, 0, sizeof(data));
for (i = 0; i < 512; i++) {
/* set bit i: */
data[i/8] |= 0x80U >> (i % 8);
NESSIEinit(&w);
NESSIEadd(data, 512, &w);
NESSIEfinalize(&w, digest);
printf(" S = "); display(data, 512/8); printf(": ");
display(digest, DIGESTBYTES); printf("\n");
/* reset bit i: */
data[i/8] = 0;
}
memset(digest, 0, sizeof(digest));
for (i = 0; i < LONG_ITERATION; i++) {
NESSIEinit(&w);
NESSIEadd(digest, 512, &w);
NESSIEfinalize(&w, digest);
}
fflush(stdout);
printf("Iterated message digest computation (%d times): ", LONG_ITERATION);
display(digest, DIGESTBYTES); printf("\n");
}
/*
#define TIMING_ITERATIONS 100000
static void timing() {
int i;
NESSIEstruct w;
u8 digest[DIGESTBYTES];
u8 data[1024];
clock_t elapsed;
float sec;
memset(data, 0, sizeof(data));
printf("Overall timing...");
elapsed = -clock();
for (i = 0; i < TIMING_ITERATIONS; i++) {
NESSIEinit(&w);
NESSIEadd(data, 8*sizeof(data), &w);
NESSIEfinalize(&w, digest);
}
elapsed += clock();
sec = (float)elapsed/CLOCKS_PER_SEC;
printf(" %.1f s, %.1f Mbit/s, %.1f cycles/byte.\n",
sec,
(float)8*sizeof(data)*TIMING_ITERATIONS/sec/1000000,
(float)550e6*sec/(sizeof(data)*TIMING_ITERATIONS));
printf("Compression function timing...");
NESSIEinit(&w);
elapsed = -clock();
for (i = 0; i < TIMING_ITERATIONS; i++) {
processBuffer(&w);
}
elapsed += clock();
NESSIEfinalize(&w, digest);
sec = (float)elapsed/CLOCKS_PER_SEC;
printf(" %.1f s, %.1f Mbit/s, %.1f cycles/byte.\n",
sec,
(float)512*TIMING_ITERATIONS/sec/1000000,
(float)550e6*sec/(64*TIMING_ITERATIONS));
}
*/
/*
int main(int argc, char *argv[]) {
makeTestVectors();
/* timing(); *//* Comment this line out *//*
return 0;
}
*/