/* $Id: sph_simd.h 154 2010-04-26 17:00:24Z tp $ */
/**
 * SIMD interface. SIMD is a family of functions which differ by
 * their output size; this implementation defines SIMD for output
 * sizes 224, 256, 384 and 512 bits.
 *
 * ==========================(LICENSE BEGIN)============================
 *
 * Copyright (c) 2007-2010  Projet RNRT SAPHIR
 * 
 * Permission is hereby granted, free of charge, to any person obtaining
 * a copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sublicense, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 * 
 * The above copyright notice and this permission notice shall be
 * included in all copies or substantial portions of the Software.
 * 
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
 * IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
 * CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 * ===========================(LICENSE END)=============================
 *
 * @file     sph_simd.h
 * @author   Thomas Pornin <thomas.pornin@cryptolog.com>
 */

#ifndef SPH_SIMD_H__
#define SPH_SIMD_H__

#include <stddef.h>
#include "sph_types.h"

/**
 * Output size (in bits) for SIMD-224.
 */
#define SPH_SIZE_simd224   224

/**
 * Output size (in bits) for SIMD-256.
 */
#define SPH_SIZE_simd256   256

/**
 * Output size (in bits) for SIMD-384.
 */
#define SPH_SIZE_simd384   384

/**
 * Output size (in bits) for SIMD-512.
 */
#define SPH_SIZE_simd512   512

/**
 * This structure is a context for SIMD computations: it contains the
 * intermediate values and some data from the last entered block. Once
 * an SIMD computation has been performed, the context can be reused for
 * another computation. This specific structure is used for SIMD-224
 * and SIMD-256.
 *
 * The contents of this structure are private. A running SIMD computation
 * can be cloned by copying the context (e.g. with a simple
 * <code>memcpy()</code>).
 */
typedef struct {
#ifndef DOXYGEN_IGNORE
	unsigned char buf[64];    /* first field, for alignment */
	size_t ptr;
	sph_u32 state[16];
	sph_u32 count_low, count_high;
#endif
} sph_simd_small_context;

/**
 * This structure is a context for SIMD computations: it contains the
 * intermediate values and some data from the last entered block. Once
 * an SIMD computation has been performed, the context can be reused for
 * another computation. This specific structure is used for SIMD-384
 * and SIMD-512.
 *
 * The contents of this structure are private. A running SIMD computation
 * can be cloned by copying the context (e.g. with a simple
 * <code>memcpy()</code>).
 */
typedef struct {
#ifndef DOXYGEN_IGNORE
	unsigned char buf[128];    /* first field, for alignment */
	size_t ptr;
	sph_u32 state[32];
	sph_u32 count_low, count_high;
#endif
} sph_simd_big_context;

/**
 * Type for a SIMD-224 context (identical to the common "small" context).
 */
typedef sph_simd_small_context sph_simd224_context;

/**
 * Type for a SIMD-256 context (identical to the common "small" context).
 */
typedef sph_simd_small_context sph_simd256_context;

/**
 * Type for a SIMD-384 context (identical to the common "big" context).
 */
typedef sph_simd_big_context sph_simd384_context;

/**
 * Type for a SIMD-512 context (identical to the common "big" context).
 */
typedef sph_simd_big_context sph_simd512_context;

/**
 * Initialize an SIMD-224 context. This process performs no memory allocation.
 *
 * @param cc   the SIMD-224 context (pointer to a
 *             <code>sph_simd224_context</code>)
 */
void sph_simd224_init(void *cc);

/**
 * Process some data bytes. It is acceptable that <code>len</code> is zero
 * (in which case this function does nothing).
 *
 * @param cc     the SIMD-224 context
 * @param data   the input data
 * @param len    the input data length (in bytes)
 */
void sph_simd224(void *cc, const void *data, size_t len);

/**
 * Terminate the current SIMD-224 computation and output the result into
 * the provided buffer. The destination buffer must be wide enough to
 * accomodate the result (28 bytes). The context is automatically
 * reinitialized.
 *
 * @param cc    the SIMD-224 context
 * @param dst   the destination buffer
 */
void sph_simd224_close(void *cc, void *dst);

/**
 * Add a few additional bits (0 to 7) to the current computation, then
 * terminate it and output the result in the provided buffer, which must
 * be wide enough to accomodate the result (28 bytes). If bit number i
 * in <code>ub</code> has value 2^i, then the extra bits are those
 * numbered 7 downto 8-n (this is the big-endian convention at the byte
 * level). The context is automatically reinitialized.
 *
 * @param cc    the SIMD-224 context
 * @param ub    the extra bits
 * @param n     the number of extra bits (0 to 7)
 * @param dst   the destination buffer
 */
void sph_simd224_addbits_and_close(
	void *cc, unsigned ub, unsigned n, void *dst);

/**
 * Initialize an SIMD-256 context. This process performs no memory allocation.
 *
 * @param cc   the SIMD-256 context (pointer to a
 *             <code>sph_simd256_context</code>)
 */
void sph_simd256_init(void *cc);

/**
 * Process some data bytes. It is acceptable that <code>len</code> is zero
 * (in which case this function does nothing).
 *
 * @param cc     the SIMD-256 context
 * @param data   the input data
 * @param len    the input data length (in bytes)
 */
void sph_simd256(void *cc, const void *data, size_t len);

/**
 * Terminate the current SIMD-256 computation and output the result into
 * the provided buffer. The destination buffer must be wide enough to
 * accomodate the result (32 bytes). The context is automatically
 * reinitialized.
 *
 * @param cc    the SIMD-256 context
 * @param dst   the destination buffer
 */
void sph_simd256_close(void *cc, void *dst);

/**
 * Add a few additional bits (0 to 7) to the current computation, then
 * terminate it and output the result in the provided buffer, which must
 * be wide enough to accomodate the result (32 bytes). If bit number i
 * in <code>ub</code> has value 2^i, then the extra bits are those
 * numbered 7 downto 8-n (this is the big-endian convention at the byte
 * level). The context is automatically reinitialized.
 *
 * @param cc    the SIMD-256 context
 * @param ub    the extra bits
 * @param n     the number of extra bits (0 to 7)
 * @param dst   the destination buffer
 */
void sph_simd256_addbits_and_close(
	void *cc, unsigned ub, unsigned n, void *dst);

/**
 * Initialize an SIMD-384 context. This process performs no memory allocation.
 *
 * @param cc   the SIMD-384 context (pointer to a
 *             <code>sph_simd384_context</code>)
 */
void sph_simd384_init(void *cc);

/**
 * Process some data bytes. It is acceptable that <code>len</code> is zero
 * (in which case this function does nothing).
 *
 * @param cc     the SIMD-384 context
 * @param data   the input data
 * @param len    the input data length (in bytes)
 */
void sph_simd384(void *cc, const void *data, size_t len);

/**
 * Terminate the current SIMD-384 computation and output the result into
 * the provided buffer. The destination buffer must be wide enough to
 * accomodate the result (48 bytes). The context is automatically
 * reinitialized.
 *
 * @param cc    the SIMD-384 context
 * @param dst   the destination buffer
 */
void sph_simd384_close(void *cc, void *dst);

/**
 * Add a few additional bits (0 to 7) to the current computation, then
 * terminate it and output the result in the provided buffer, which must
 * be wide enough to accomodate the result (48 bytes). If bit number i
 * in <code>ub</code> has value 2^i, then the extra bits are those
 * numbered 7 downto 8-n (this is the big-endian convention at the byte
 * level). The context is automatically reinitialized.
 *
 * @param cc    the SIMD-384 context
 * @param ub    the extra bits
 * @param n     the number of extra bits (0 to 7)
 * @param dst   the destination buffer
 */
void sph_simd384_addbits_and_close(
	void *cc, unsigned ub, unsigned n, void *dst);

/**
 * Initialize an SIMD-512 context. This process performs no memory allocation.
 *
 * @param cc   the SIMD-512 context (pointer to a
 *             <code>sph_simd512_context</code>)
 */
void sph_simd512_init(void *cc);

/**
 * Process some data bytes. It is acceptable that <code>len</code> is zero
 * (in which case this function does nothing).
 *
 * @param cc     the SIMD-512 context
 * @param data   the input data
 * @param len    the input data length (in bytes)
 */
void sph_simd512(void *cc, const void *data, size_t len);

/**
 * Terminate the current SIMD-512 computation and output the result into
 * the provided buffer. The destination buffer must be wide enough to
 * accomodate the result (64 bytes). The context is automatically
 * reinitialized.
 *
 * @param cc    the SIMD-512 context
 * @param dst   the destination buffer
 */
void sph_simd512_close(void *cc, void *dst);

/**
 * Add a few additional bits (0 to 7) to the current computation, then
 * terminate it and output the result in the provided buffer, which must
 * be wide enough to accomodate the result (64 bytes). If bit number i
 * in <code>ub</code> has value 2^i, then the extra bits are those
 * numbered 7 downto 8-n (this is the big-endian convention at the byte
 * level). The context is automatically reinitialized.
 *
 * @param cc    the SIMD-512 context
 * @param ub    the extra bits
 * @param n     the number of extra bits (0 to 7)
 * @param dst   the destination buffer
 */
void sph_simd512_addbits_and_close(
	void *cc, unsigned ub, unsigned n, void *dst);

#endif