/**********************************************************************
Copyright(c) 2011-2016 Intel Corporation All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions
are met:
* Redistributions of source code must retain the above copyright
notice, this list of conditions and the following disclaimer.
* Redistributions in binary form must reproduce the above copyright
notice, this list of conditions and the following disclaimer in
the documentation and/or other materials provided with the
distribution.
* Neither the name of Intel Corporation nor the names of its
contributors may be used to endorse or promote products derived
from this software without specific prior written permission.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
**********************************************************************/
#ifndef _SHA512_MB_H_
#define _SHA512_MB_H_
/**
* @file sha512_mb.h
* @brief Single/Multi-buffer CTX API SHA512 function prototypes and structures
*
* Interface for single and multi-buffer SHA512 functions
*
* Single/Multi-buffer SHA512 Entire or First-Update..Update-Last
*
* The interface to this single/multi-buffer hashing code is carried out through the
* context-level (CTX) init, submit and flush functions and the SHA512_HASH_CTX_MGR and
* SHA512_HASH_CTX objects. Numerous SHA512_HASH_CTX objects may be instantiated by the
* application for use with a single SHA512_HASH_CTX_MGR.
*
* The CTX interface functions carry out the initialization and padding of the jobs
* entered by the user and add them to the multi-buffer manager. The lower level "scheduler"
* layer then processes the jobs in an out-of-order manner. The scheduler layer functions
* are internal and are not intended to be invoked directly. Jobs can be submitted
* to a CTX as a complete buffer to be hashed, using the HASH_ENTIRE flag, or as partial
* jobs which can be started using the HASH_FIRST flag, and later resumed or finished
* using the HASH_UPDATE and HASH_LAST flags respectively.
*
* Note: The submit function does not require data buffers to be block sized.
*
* The SHA512 CTX interface functions are available for 5 architectures: multi-buffer SSE,
* AVX, AVX2, AVX512 and single-buffer SSE4 (which is used in the same way as the
* multi-buffer code). In addition, a multibinary interface is provided, which selects the
* appropriate architecture-specific function at runtime. This multibinary interface
* selects the single buffer SSE4 functions when the platform is detected to be Silvermont.
*
* Usage: The application creates a SHA512_HASH_CTX_MGR object and initializes it
* with a call to sha512_ctx_mgr_init*() function, where henceforth "*" stands for the
* relevant suffix for each architecture; _sse, _avx, _avx2, _avx512(or no suffix for the
* multibinary version). The SHA512_HASH_CTX_MGR object will be used to schedule processor
* resources, with up to 2 SHA512_HASH_CTX objects (or 4 in the AVX2 case, 8 in the AVX512
* case) being processed at a time.
*
* Each SHA512_HASH_CTX must be initialized before first use by the hash_ctx_init macro
* defined in multi_buffer.h. After initialization, the application may begin computing
* a hash by giving the SHA512_HASH_CTX to a SHA512_HASH_CTX_MGR using the submit functions
* sha512_ctx_mgr_submit*() with the HASH_FIRST flag set. When the SHA512_HASH_CTX is
* returned to the application (via this or a later call to sha512_ctx_mgr_submit*() or
* sha512_ctx_mgr_flush*()), the application can then re-submit it with another call to
* sha512_ctx_mgr_submit*(), but without the HASH_FIRST flag set.
*
* Ideally, on the last buffer for that hash, sha512_ctx_mgr_submit_sse is called with
* HASH_LAST, although it is also possible to submit the hash with HASH_LAST and a zero
* length if necessary. When a SHA512_HASH_CTX is returned after having been submitted with
* HASH_LAST, it will contain a valid hash. The SHA512_HASH_CTX can be reused immediately
* by submitting with HASH_FIRST.
*
* For example, you would submit hashes with the following flags for the following numbers
* of buffers:
*
* - one buffer: HASH_FIRST | HASH_LAST (or, equivalently, HASH_ENTIRE)
*
- two buffers: HASH_FIRST, HASH_LAST
*
- three buffers: HASH_FIRST, HASH_UPDATE, HASH_LAST
* etc.
*
*
* The order in which SHA512_CTX objects are returned is in general different from the order
* in which they are submitted.
*
* A few possible error conditions exist:
*
* - Submitting flags other than the allowed entire/first/update/last values
*
- Submitting a context that is currently being managed by a SHA512_HASH_CTX_MGR. (Note:
* This error case is not applicable to the single buffer SSE4 version)
*
- Submitting a context after HASH_LAST is used but before HASH_FIRST is set.
*
*
* These error conditions are reported by returning the SHA512_HASH_CTX immediately after
* a submit with its error member set to a non-zero error code (defined in
* multi_buffer.h). No changes are made to the SHA512_HASH_CTX_MGR in the case of an
* error; no processing is done for other hashes.
*
*/
#include
#include "multi_buffer.h"
#include "types.h"
#ifndef _MSC_VER
#include
#endif
#ifdef __cplusplus
extern "C" {
#endif
// Hash Constants and Typedefs
#define SHA512_DIGEST_NWORDS 8
#define SHA512_MAX_LANES 8
#define SHA512_X4_LANES 4
#define SHA512_MIN_LANES 2
#define SHA512_BLOCK_SIZE 128
#define SHA512_LOG2_BLOCK_SIZE 7
#define SHA512_PADLENGTHFIELD_SIZE 16
#define SHA512_INITIAL_DIGEST \
0x6a09e667f3bcc908,0xbb67ae8584caa73b,0x3c6ef372fe94f82b,0xa54ff53a5f1d36f1, \
0x510e527fade682d1,0x9b05688c2b3e6c1f,0x1f83d9abfb41bd6b,0x5be0cd19137e2179
typedef uint64_t sha512_digest_array[SHA512_DIGEST_NWORDS][SHA512_MAX_LANES];
typedef uint64_t SHA512_WORD_T;
/** @brief Scheduler layer - Holds info describing a single SHA512 job for the multi-buffer manager */
typedef struct {
uint8_t* buffer; //!< pointer to data buffer for this job
uint64_t len; //!< length of buffer for this job in blocks.
DECLARE_ALIGNED(uint64_t result_digest[SHA512_DIGEST_NWORDS], 64);
JOB_STS status; //!< output job status
void* user_data; //!< pointer for user's job-related data
} SHA512_JOB;
/** @brief Scheduler layer - Holds arguments for submitted SHA512 job */
typedef struct {
sha512_digest_array digest;
uint8_t* data_ptr[SHA512_MAX_LANES];
} SHA512_MB_ARGS_X8;
/** @brief Scheduler layer - Lane data */
typedef struct {
SHA512_JOB *job_in_lane;
} SHA512_LANE_DATA;
/** @brief Scheduler layer - Holds state for multi-buffer SHA512 jobs */
typedef struct {
SHA512_MB_ARGS_X8 args;
uint64_t lens[SHA512_MAX_LANES];
uint64_t unused_lanes; //!< each byte is index (00, 01 or 00...03) of unused lanes, byte 2 or 4 is set to FF as a flag
SHA512_LANE_DATA ldata[SHA512_MAX_LANES];
uint32_t num_lanes_inuse;
} SHA512_MB_JOB_MGR;
/** @brief Context layer - Holds state for multi-buffer SHA512 jobs */
typedef struct {
SHA512_MB_JOB_MGR mgr;
} SHA512_HASH_CTX_MGR;
/** @brief Context layer - Holds info describing a single SHA512 job for the multi-buffer CTX manager */
typedef struct {
SHA512_JOB job; // Must be at struct offset 0.
HASH_CTX_STS status; //!< Context status flag
HASH_CTX_ERROR error; //!< Context error flag
uint32_t total_length; //!< Running counter of length processed for this CTX's job
const void* incoming_buffer; //!< pointer to data input buffer for this CTX's job
uint32_t incoming_buffer_length; //!< length of buffer for this job in bytes.
uint8_t partial_block_buffer[SHA512_BLOCK_SIZE * 2]; //!< CTX partial blocks
uint32_t partial_block_buffer_length;
void* user_data; //!< pointer for user to keep any job-related data
} SHA512_HASH_CTX;
/*******************************************************************
* Context level API function prototypes
******************************************************************/
/**
* @brief Initialize the context level SHA512 multi-buffer manager structure.
* @requires SSE4.1
*
* @param mgr Structure holding context level state info
* @returns void
*/
void sha512_ctx_mgr_init_sse (SHA512_HASH_CTX_MGR* mgr);
/**
* @brief Submit a new SHA512 job to the context level multi-buffer manager.
* @requires SSE4.1
*
* @param mgr Structure holding context level state info
* @param ctx Structure holding ctx job info
* @param buffer Pointer to buffer to be processed
* @param len Length of buffer (in bytes) to be processed
* @param flags Input flag specifying job type (first, update, last or entire)
* @returns NULL if no jobs complete or pointer to jobs structure.
*/
SHA512_HASH_CTX* sha512_ctx_mgr_submit_sse (SHA512_HASH_CTX_MGR* mgr, SHA512_HASH_CTX* ctx,
const void* buffer, uint32_t len, HASH_CTX_FLAG flags);
/**
* @brief Finish all submitted SHA512 jobs and return when complete.
* @requires SSE4.1
*
* @param mgr Structure holding context level state info
* @returns NULL if no jobs to complete or pointer to jobs structure.
*/
SHA512_HASH_CTX* sha512_ctx_mgr_flush_sse (SHA512_HASH_CTX_MGR* mgr);
/**
* @brief Initialize the SHA512 multi-buffer manager structure.
* @requires AVX
*
* @param mgr Structure holding context level state info
* @returns void
*/
void sha512_ctx_mgr_init_avx (SHA512_HASH_CTX_MGR* mgr);
/**
* @brief Submit a new SHA512 job to the multi-buffer manager.
* @requires AVX
*
* @param mgr Structure holding context level state info
* @param ctx Structure holding ctx job info
* @param buffer Pointer to buffer to be processed
* @param len Length of buffer (in bytes) to be processed
* @param flags Input flag specifying job type (first, update, last or entire)
* @returns NULL if no jobs complete or pointer to jobs structure.
*/
SHA512_HASH_CTX* sha512_ctx_mgr_submit_avx (SHA512_HASH_CTX_MGR* mgr, SHA512_HASH_CTX* ctx,
const void* buffer, uint32_t len, HASH_CTX_FLAG flags);
/**
* @brief Finish all submitted SHA512 jobs and return when complete.
* @requires AVX
*
* @param mgr Structure holding context level state info
* @returns NULL if no jobs to complete or pointer to jobs structure.
*/
SHA512_HASH_CTX* sha512_ctx_mgr_flush_avx (SHA512_HASH_CTX_MGR* mgr);
/**
* @brief Initialize the SHA512 multi-buffer manager structure.
* @requires AVX2
*
* @param mgr Structure holding context level state info
* @returns void
*/
void sha512_ctx_mgr_init_avx2 (SHA512_HASH_CTX_MGR* mgr);
/**
* @brief Submit a new SHA512 job to the multi-buffer manager.
* @requires AVX2
*
* @param mgr Structure holding context level state info
* @param ctx Structure holding ctx job info
* @param buffer Pointer to buffer to be processed
* @param len Length of buffer (in bytes) to be processed
* @param flags Input flag specifying job type (first, update, last or entire)
* @returns NULL if no jobs complete or pointer to jobs structure.
*/
SHA512_HASH_CTX* sha512_ctx_mgr_submit_avx2 (SHA512_HASH_CTX_MGR* mgr, SHA512_HASH_CTX* ctx,
const void* buffer, uint32_t len, HASH_CTX_FLAG flags);
/**
* @brief Finish all submitted SHA512 jobs and return when complete.
* @requires AVX2
*
* @param mgr Structure holding context level state info
* @returns NULL if no jobs to complete or pointer to jobs structure.
*/
SHA512_HASH_CTX* sha512_ctx_mgr_flush_avx2 (SHA512_HASH_CTX_MGR* mgr);
/**
* @brief Initialize the SHA512 multi-buffer manager structure.
* @requires AVX512
*
* @param mgr Structure holding context level state info
* @returns void
*/
void sha512_ctx_mgr_init_avx512 (SHA512_HASH_CTX_MGR* mgr);
/**
* @brief Submit a new SHA512 job to the multi-buffer manager.
* @requires AVX512
*
* @param mgr Structure holding context level state info
* @param ctx Structure holding ctx job info
* @param buffer Pointer to buffer to be processed
* @param len Length of buffer (in bytes) to be processed
* @param flags Input flag specifying job type (first, update, last or entire)
* @returns NULL if no jobs complete or pointer to jobs structure.
*/
SHA512_HASH_CTX* sha512_ctx_mgr_submit_avx512 (SHA512_HASH_CTX_MGR* mgr, SHA512_HASH_CTX* ctx,
const void* buffer, uint32_t len, HASH_CTX_FLAG flags);
/**
* @brief Finish all submitted SHA512 jobs and return when complete.
* @requires AVX512
*
* @param mgr Structure holding context level state info
* @returns NULL if no jobs to complete or pointer to jobs structure.
*/
SHA512_HASH_CTX* sha512_ctx_mgr_flush_avx512 (SHA512_HASH_CTX_MGR* mgr);
/**
* @brief Initialize the SHA512 multi-buffer manager structure.
* @requires SSE4
*
* @param mgr Structure holding context level state info
* @returns void
*/
void sha512_ctx_mgr_init_sb_sse4 (SHA512_HASH_CTX_MGR* mgr);
/**
* @brief Submit a new SHA512 job to the multi-buffer manager.
* @requires SSE4
*
* @param mgr Structure holding context level state info
* @param ctx Structure holding ctx job info
* @param buffer Pointer to buffer to be processed
* @param len Length of buffer (in bytes) to be processed
* @param flags Input flag specifying job type (first, update, last or entire)
* @returns NULL if no jobs complete or pointer to jobs structure.
*/
SHA512_HASH_CTX* sha512_ctx_mgr_submit_sb_sse4 (SHA512_HASH_CTX_MGR* mgr, SHA512_HASH_CTX* ctx,
const void* buffer, uint32_t len, HASH_CTX_FLAG flags);
/**
* @brief Finish all submitted SHA512 jobs and return when complete.
* @requires SSE4
*
* @param mgr Structure holding context level state info
* @returns NULL if no jobs to complete or pointer to jobs structure.
*/
SHA512_HASH_CTX* sha512_ctx_mgr_flush_sb_sse4 (SHA512_HASH_CTX_MGR* mgr);
/******************** multibinary function prototypes **********************/
/**
* @brief Initialize the SHA512 multi-buffer manager structure.
* @requires SSE4.1 or AVX or AVX2 or AVX512
*
* @param mgr Structure holding context level state info
* @returns void
*/
void sha512_ctx_mgr_init (SHA512_HASH_CTX_MGR* mgr);
/**
* @brief Submit a new SHA512 job to the multi-buffer manager.
* @requires SSE4.1 or AVX or AVX2 or AVX512
*
* @param mgr Structure holding context level state info
* @param ctx Structure holding ctx job info
* @param buffer Pointer to buffer to be processed
* @param len Length of buffer (in bytes) to be processed
* @param flags Input flag specifying job type (first, update, last or entire)
* @returns NULL if no jobs complete or pointer to jobs structure.
*/
SHA512_HASH_CTX* sha512_ctx_mgr_submit (SHA512_HASH_CTX_MGR* mgr, SHA512_HASH_CTX* ctx,
const void* buffer, uint32_t len, HASH_CTX_FLAG flags);
/**
* @brief Finish all submitted SHA512 jobs and return when complete.
* @requires SSE4.1 or AVX or AVX2 or AVX512
*
* @param mgr Structure holding context level state info
* @returns NULL if no jobs to complete or pointer to jobs structure.
*/
SHA512_HASH_CTX* sha512_ctx_mgr_flush (SHA512_HASH_CTX_MGR* mgr);
/*******************************************************************
* Scheduler (internal) level out-of-order function prototypes
******************************************************************/
void sha512_mb_mgr_init_sse (SHA512_MB_JOB_MGR *state);
SHA512_JOB* sha512_mb_mgr_submit_sse (SHA512_MB_JOB_MGR *state, SHA512_JOB* job);
SHA512_JOB* sha512_mb_mgr_flush_sse (SHA512_MB_JOB_MGR *state);
#define sha512_mb_mgr_init_avx sha512_mb_mgr_init_sse
SHA512_JOB* sha512_mb_mgr_submit_avx (SHA512_MB_JOB_MGR *state, SHA512_JOB* job);
SHA512_JOB* sha512_mb_mgr_flush_avx (SHA512_MB_JOB_MGR *state);
void sha512_mb_mgr_init_avx2 (SHA512_MB_JOB_MGR *state);
SHA512_JOB* sha512_mb_mgr_submit_avx2 (SHA512_MB_JOB_MGR *state, SHA512_JOB* job);
SHA512_JOB* sha512_mb_mgr_flush_avx2 (SHA512_MB_JOB_MGR *state);
void sha512_mb_mgr_init_avx512 (SHA512_MB_JOB_MGR *state);
SHA512_JOB* sha512_mb_mgr_submit_avx512 (SHA512_MB_JOB_MGR *state, SHA512_JOB* job);
SHA512_JOB* sha512_mb_mgr_flush_avx512 (SHA512_MB_JOB_MGR *state);
// Single buffer SHA512 APIs, optimized for SLM.
void sha512_sse4 (const void* M, void* D, uint64_t L);
// Note that these APIs comply with multi-buffer APIs' high level usage
void sha512_sb_mgr_init_sse4 (SHA512_MB_JOB_MGR *state);
SHA512_JOB* sha512_sb_mgr_submit_sse4 (SHA512_MB_JOB_MGR *state, SHA512_JOB* job);
SHA512_JOB* sha512_sb_mgr_flush_sse4 (SHA512_MB_JOB_MGR *state);
#ifdef __cplusplus
}
#endif
#endif // _SHA512_MB_H_