summaryrefslogtreecommitdiffstats
path: root/lib/sm3.c
diff options
context:
space:
mode:
Diffstat (limited to 'lib/sm3.c')
-rw-r--r--lib/sm3.c415
1 files changed, 415 insertions, 0 deletions
diff --git a/lib/sm3.c b/lib/sm3.c
new file mode 100644
index 0000000..dc12802
--- /dev/null
+++ b/lib/sm3.c
@@ -0,0 +1,415 @@
+/* sm3.c - Functions to compute SM3 message digest of files or memory blocks
+ according to the specification GM/T 004-2012 Cryptographic Hash Algorithm
+ SM3, published by State Encryption Management Bureau, China.
+
+ SM3 cryptographic hash algorithm.
+ <http://www.sca.gov.cn/sca/xwdt/2010-12/17/content_1002389.shtml>
+
+ Copyright (C) 2017-2023 Free Software Foundation, Inc.
+
+ This file is free software: you can redistribute it and/or modify
+ it under the terms of the GNU Lesser General Public License as
+ published by the Free Software Foundation; either version 2.1 of the
+ License, or (at your option) any later version.
+
+ This file is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ GNU Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public License
+ along with this program. If not, see <https://www.gnu.org/licenses/>. */
+
+/* Written by Jia Zhang <qianyue.zj@alibaba-inc.com>, 2017,
+ considerably copypasting from David Madore's sha256.c */
+
+#include <config.h>
+
+/* Specification. */
+#if HAVE_OPENSSL_SM3
+# define GL_OPENSSL_INLINE _GL_EXTERN_INLINE
+#endif
+#include "sm3.h"
+
+#include <stdint.h>
+#include <string.h>
+
+#include <byteswap.h>
+#ifdef WORDS_BIGENDIAN
+# define SWAP(n) (n)
+#else
+# define SWAP(n) bswap_32 (n)
+#endif
+
+#ifndef DEBUG_SM3
+# define DEBUG_SM3 0
+#endif
+
+#if ! DEBUG_SM3
+# define dbg_printf(fmt, ...) do { } while (0)
+#else
+# define dbg_printf printf
+#endif
+
+#if ! HAVE_OPENSSL_SM3
+
+/* This array contains the bytes used to pad the buffer to the next
+ 64-byte boundary. */
+static const unsigned char fillbuf[64] = { 0x80, 0 /* , 0, 0, ... */ };
+
+
+/*
+ Takes a pointer to a 256 bit block of data (eight 32 bit ints) and
+ initializes it to the start constants of the SM3 algorithm. This
+ must be called before using hash in the call to sm3_hash
+*/
+void
+sm3_init_ctx (struct sm3_ctx *ctx)
+{
+ ctx->state[0] = 0x7380166fUL;
+ ctx->state[1] = 0x4914b2b9UL;
+ ctx->state[2] = 0x172442d7UL;
+ ctx->state[3] = 0xda8a0600UL;
+ ctx->state[4] = 0xa96f30bcUL;
+ ctx->state[5] = 0x163138aaUL;
+ ctx->state[6] = 0xe38dee4dUL;
+ ctx->state[7] = 0xb0fb0e4eUL;
+
+ ctx->total[0] = ctx->total[1] = 0;
+ ctx->buflen = 0;
+}
+
+/* Copy the value from v into the memory location pointed to by *cp,
+ If your architecture allows unaligned access this is equivalent to
+ * (uint32_t *) cp = v */
+static void
+set_uint32 (char *cp, uint32_t v)
+{
+ memcpy (cp, &v, sizeof v);
+}
+
+/* Put result from CTX in first 32 bytes following RESBUF. The result
+ must be in little endian byte order. */
+void *
+sm3_read_ctx (const struct sm3_ctx *ctx, void *resbuf)
+{
+ int i;
+ char *r = resbuf;
+
+ for (i = 0; i < 8; i++)
+ set_uint32 (r + i * sizeof ctx->state[0], SWAP (ctx->state[i]));
+
+ return resbuf;
+}
+
+/* Process the remaining bytes in the internal buffer and the usual
+ prolog according to the standard and write the result to RESBUF. */
+static void
+sm3_conclude_ctx (struct sm3_ctx *ctx)
+{
+ /* Take yet unprocessed bytes into account. */
+ size_t bytes = ctx->buflen;
+ size_t size = (bytes < 56) ? 64 / 4 : 64 * 2 / 4;
+
+ /* Now count remaining bytes. */
+ ctx->total[0] += bytes;
+ if (ctx->total[0] < bytes)
+ ++ctx->total[1];
+
+ /* Put the 64-bit file length in *bits* at the end of the buffer.
+ Use set_uint32 rather than a simple assignment, to avoid risk of
+ unaligned access. */
+ set_uint32 ((char *) &ctx->buffer[size - 2],
+ SWAP ((ctx->total[1] << 3) | (ctx->total[0] >> 29)));
+ set_uint32 ((char *) &ctx->buffer[size - 1],
+ SWAP (ctx->total[0] << 3));
+
+ memcpy (&((char *) ctx->buffer)[bytes], fillbuf, (size - 2) * 4 - bytes);
+
+ /* Process last bytes. */
+ sm3_process_block (ctx->buffer, size * 4, ctx);
+}
+
+void *
+sm3_finish_ctx (struct sm3_ctx *ctx, void *resbuf)
+{
+ sm3_conclude_ctx (ctx);
+ return sm3_read_ctx (ctx, resbuf);
+}
+
+/* Compute SM3 message digest for LEN bytes beginning at BUFFER. The
+ result is always in little endian byte order, so that a byte-wise
+ output yields to the wanted ASCII representation of the message
+ digest. */
+void *
+sm3_buffer (const char *buffer, size_t len, void *resblock)
+{
+ struct sm3_ctx ctx;
+
+ /* Initialize the computation context. */
+ sm3_init_ctx (&ctx);
+
+ /* Process whole buffer but last len % 64 bytes. */
+ sm3_process_bytes (buffer, len, &ctx);
+
+ /* Put result in desired memory area. */
+ return sm3_finish_ctx (&ctx, resblock);
+}
+
+void
+sm3_process_bytes (const void *buffer, size_t len, struct sm3_ctx *ctx)
+{
+ /* When we already have some bits in our internal buffer concatenate
+ both inputs first. */
+ if (ctx->buflen != 0)
+ {
+ size_t left_over = ctx->buflen;
+ size_t add = 128 - left_over > len ? len : 128 - left_over;
+
+ memcpy (&((char *) ctx->buffer)[left_over], buffer, add);
+ ctx->buflen += add;
+
+ if (ctx->buflen > 64)
+ {
+ sm3_process_block (ctx->buffer, ctx->buflen & ~63, ctx);
+
+ ctx->buflen &= 63;
+ /* The regions in the following copy operation cannot overlap,
+ because ctx->buflen < 64 ≤ (left_over + add) & ~63. */
+ memcpy (ctx->buffer,
+ &((char *) ctx->buffer)[(left_over + add) & ~63],
+ ctx->buflen);
+ }
+
+ buffer = (const char *) buffer + add;
+ len -= add;
+ }
+
+ /* Process available complete blocks. */
+ if (len >= 64)
+ {
+#if !(_STRING_ARCH_unaligned || _STRING_INLINE_unaligned)
+# define UNALIGNED_P(p) ((uintptr_t) (p) % alignof (uint32_t) != 0)
+ if (UNALIGNED_P (buffer))
+ while (len > 64)
+ {
+ sm3_process_block (memcpy (ctx->buffer, buffer, 64), 64, ctx);
+ buffer = (const char *) buffer + 64;
+ len -= 64;
+ }
+ else
+#endif
+ {
+ sm3_process_block (buffer, len & ~63, ctx);
+ buffer = (const char *) buffer + (len & ~63);
+ len &= 63;
+ }
+ }
+
+ /* Move remaining bytes in internal buffer. */
+ if (len > 0)
+ {
+ size_t left_over = ctx->buflen;
+
+ memcpy (&((char *) ctx->buffer)[left_over], buffer, len);
+ left_over += len;
+ if (left_over >= 64)
+ {
+ sm3_process_block (ctx->buffer, 64, ctx);
+ left_over -= 64;
+ /* The regions in the following copy operation cannot overlap,
+ because left_over ≤ 64. */
+ memcpy (ctx->buffer, &ctx->buffer[16], left_over);
+ }
+ ctx->buflen = left_over;
+ }
+}
+
+/* --- Code below is the primary difference between sha256.c and sm3.c --- */
+
+/* SM3 round constants */
+#define T(j) sm3_round_constants[j]
+static const uint32_t sm3_round_constants[64] = {
+ 0x79cc4519UL, 0xf3988a32UL, 0xe7311465UL, 0xce6228cbUL,
+ 0x9cc45197UL, 0x3988a32fUL, 0x7311465eUL, 0xe6228cbcUL,
+ 0xcc451979UL, 0x988a32f3UL, 0x311465e7UL, 0x6228cbceUL,
+ 0xc451979cUL, 0x88a32f39UL, 0x11465e73UL, 0x228cbce6UL,
+ 0x9d8a7a87UL, 0x3b14f50fUL, 0x7629ea1eUL, 0xec53d43cUL,
+ 0xd8a7a879UL, 0xb14f50f3UL, 0x629ea1e7UL, 0xc53d43ceUL,
+ 0x8a7a879dUL, 0x14f50f3bUL, 0x29ea1e76UL, 0x53d43cecUL,
+ 0xa7a879d8UL, 0x4f50f3b1UL, 0x9ea1e762UL, 0x3d43cec5UL,
+ 0x7a879d8aUL, 0xf50f3b14UL, 0xea1e7629UL, 0xd43cec53UL,
+ 0xa879d8a7UL, 0x50f3b14fUL, 0xa1e7629eUL, 0x43cec53dUL,
+ 0x879d8a7aUL, 0x0f3b14f5UL, 0x1e7629eaUL, 0x3cec53d4UL,
+ 0x79d8a7a8UL, 0xf3b14f50UL, 0xe7629ea1UL, 0xcec53d43UL,
+ 0x9d8a7a87UL, 0x3b14f50fUL, 0x7629ea1eUL, 0xec53d43cUL,
+ 0xd8a7a879UL, 0xb14f50f3UL, 0x629ea1e7UL, 0xc53d43ceUL,
+ 0x8a7a879dUL, 0x14f50f3bUL, 0x29ea1e76UL, 0x53d43cecUL,
+ 0xa7a879d8UL, 0x4f50f3b1UL, 0x9ea1e762UL, 0x3d43cec5UL,
+};
+
+/* Round functions. */
+#define FF1(X,Y,Z) ( X ^ Y ^ Z )
+#define FF2(X,Y,Z) ( ( X & Y ) | ( X & Z ) | ( Y & Z ) )
+#define GG1(X,Y,Z) ( X ^ Y ^ Z )
+#define GG2(X,Y,Z) ( ( X & Y ) | ( ~X & Z ) )
+
+/* Process LEN bytes of BUFFER, accumulating context into CTX.
+ It is assumed that LEN % 64 == 0.
+ Most of this code comes from David Madore's sha256.c. */
+
+void
+sm3_process_block (const void *buffer, size_t len, struct sm3_ctx *ctx)
+{
+ const uint32_t *words = buffer;
+ size_t nwords = len / sizeof (uint32_t);
+ const uint32_t *endp = words + nwords;
+ uint32_t x[16];
+ uint32_t a = ctx->state[0];
+ uint32_t b = ctx->state[1];
+ uint32_t c = ctx->state[2];
+ uint32_t d = ctx->state[3];
+ uint32_t e = ctx->state[4];
+ uint32_t f = ctx->state[5];
+ uint32_t g = ctx->state[6];
+ uint32_t h = ctx->state[7];
+ uint32_t lolen = len;
+
+ /* First increment the byte count. GM/T 004-2012 specifies the possible
+ length of the file up to 2^64 bits. Here we only compute the
+ number of bytes. Do a double word increment. */
+ ctx->total[0] += lolen;
+ ctx->total[1] += (len >> 31 >> 1) + (ctx->total[0] < lolen);
+
+#define rol(x, n) (((x) << ((n) & 31)) | ((x) >> ((32 - (n)) & 31)))
+#define P0(x) ((x)^rol(x,9)^rol(x,17))
+#define P1(x) ((x)^rol(x,15)^rol(x,23))
+
+#define W1(I) ( x[I&0x0f] )
+#define W2(I) ( tw = P1(x[I&0x0f]^x[(I-9)&0x0f]^rol(x[(I-3)&0x0f],15)) \
+ ^ rol(x[(I-13)&0x0f],7) ^ x[(I-6)&0x0f] \
+ , x[I&0x0f] = tw )
+
+#define R(i,A,B,C,D,E,F,G,H,T,W1,W2) \
+ do { \
+ if (++j) \
+ dbg_printf("%2d %08x %08x %08x %08x %08x %08x %08x %08x\n", \
+ j-1, A, B, C, D, E, F, G, H); \
+ ss1 = rol(rol(A,12) + E + T,7); \
+ ss2 = ss1 ^ rol(A,12); \
+ D += FF##i(A,B,C) + ss2 + (W1 ^ W2); \
+ H += GG##i(E,F,G) + ss1 + W1; \
+ B = rol(B,9); \
+ F = rol(F,19); \
+ H = P0(H); \
+ } while(0)
+
+#define R1(A,B,C,D,E,F,G,H,T,W1,W2) R(1,A,B,C,D,E,F,G,H,T,W1,W2)
+#define R2(A,B,C,D,E,F,G,H,T,W1,W2) R(2,A,B,C,D,E,F,G,H,T,W1,W2)
+
+ while (words < endp)
+ {
+ uint32_t tw;
+ uint32_t ss1, ss2;
+ int j;
+
+ for (j = 0; j < 16; j++)
+ {
+ x[j] = SWAP (*words);
+ words++;
+ }
+
+ j = -1;
+
+ dbg_printf (" j A B C D E "
+ " F G H\n"
+ " %08x %08x %08x %08x %08x %08x %08x %08x\n",
+ a, b, c, d, e, f, g, h);
+
+ R1( a, b, c, d, e, f, g, h, T( 0), W1( 0), W1( 4) );
+ R1( d, a, b, c, h, e, f, g, T( 1), W1( 1), W1( 5) );
+ R1( c, d, a, b, g, h, e, f, T( 2), W1( 2), W1( 6) );
+ R1( b, c, d, a, f, g, h, e, T( 3), W1( 3), W1( 7) );
+ R1( a, b, c, d, e, f, g, h, T( 4), W1( 4), W1( 8) );
+ R1( d, a, b, c, h, e, f, g, T( 5), W1( 5), W1( 9) );
+ R1( c, d, a, b, g, h, e, f, T( 6), W1( 6), W1(10) );
+ R1( b, c, d, a, f, g, h, e, T( 7), W1( 7), W1(11) );
+ R1( a, b, c, d, e, f, g, h, T( 8), W1( 8), W1(12) );
+ R1( d, a, b, c, h, e, f, g, T( 9), W1( 9), W1(13) );
+ R1( c, d, a, b, g, h, e, f, T(10), W1(10), W1(14) );
+ R1( b, c, d, a, f, g, h, e, T(11), W1(11), W1(15) );
+ R1( a, b, c, d, e, f, g, h, T(12), W1(12), W2(16) );
+ R1( d, a, b, c, h, e, f, g, T(13), W1(13), W2(17) );
+ R1( c, d, a, b, g, h, e, f, T(14), W1(14), W2(18) );
+ R1( b, c, d, a, f, g, h, e, T(15), W1(15), W2(19) );
+ R2( a, b, c, d, e, f, g, h, T(16), W1(16), W2(20) );
+ R2( d, a, b, c, h, e, f, g, T(17), W1(17), W2(21) );
+ R2( c, d, a, b, g, h, e, f, T(18), W1(18), W2(22) );
+ R2( b, c, d, a, f, g, h, e, T(19), W1(19), W2(23) );
+ R2( a, b, c, d, e, f, g, h, T(20), W1(20), W2(24) );
+ R2( d, a, b, c, h, e, f, g, T(21), W1(21), W2(25) );
+ R2( c, d, a, b, g, h, e, f, T(22), W1(22), W2(26) );
+ R2( b, c, d, a, f, g, h, e, T(23), W1(23), W2(27) );
+ R2( a, b, c, d, e, f, g, h, T(24), W1(24), W2(28) );
+ R2( d, a, b, c, h, e, f, g, T(25), W1(25), W2(29) );
+ R2( c, d, a, b, g, h, e, f, T(26), W1(26), W2(30) );
+ R2( b, c, d, a, f, g, h, e, T(27), W1(27), W2(31) );
+ R2( a, b, c, d, e, f, g, h, T(28), W1(28), W2(32) );
+ R2( d, a, b, c, h, e, f, g, T(29), W1(29), W2(33) );
+ R2( c, d, a, b, g, h, e, f, T(30), W1(30), W2(34) );
+ R2( b, c, d, a, f, g, h, e, T(31), W1(31), W2(35) );
+ R2( a, b, c, d, e, f, g, h, T(32), W1(32), W2(36) );
+ R2( d, a, b, c, h, e, f, g, T(33), W1(33), W2(37) );
+ R2( c, d, a, b, g, h, e, f, T(34), W1(34), W2(38) );
+ R2( b, c, d, a, f, g, h, e, T(35), W1(35), W2(39) );
+ R2( a, b, c, d, e, f, g, h, T(36), W1(36), W2(40) );
+ R2( d, a, b, c, h, e, f, g, T(37), W1(37), W2(41) );
+ R2( c, d, a, b, g, h, e, f, T(38), W1(38), W2(42) );
+ R2( b, c, d, a, f, g, h, e, T(39), W1(39), W2(43) );
+ R2( a, b, c, d, e, f, g, h, T(40), W1(40), W2(44) );
+ R2( d, a, b, c, h, e, f, g, T(41), W1(41), W2(45) );
+ R2( c, d, a, b, g, h, e, f, T(42), W1(42), W2(46) );
+ R2( b, c, d, a, f, g, h, e, T(43), W1(43), W2(47) );
+ R2( a, b, c, d, e, f, g, h, T(44), W1(44), W2(48) );
+ R2( d, a, b, c, h, e, f, g, T(45), W1(45), W2(49) );
+ R2( c, d, a, b, g, h, e, f, T(46), W1(46), W2(50) );
+ R2( b, c, d, a, f, g, h, e, T(47), W1(47), W2(51) );
+ R2( a, b, c, d, e, f, g, h, T(48), W1(48), W2(52) );
+ R2( d, a, b, c, h, e, f, g, T(49), W1(49), W2(53) );
+ R2( c, d, a, b, g, h, e, f, T(50), W1(50), W2(54) );
+ R2( b, c, d, a, f, g, h, e, T(51), W1(51), W2(55) );
+ R2( a, b, c, d, e, f, g, h, T(52), W1(52), W2(56) );
+ R2( d, a, b, c, h, e, f, g, T(53), W1(53), W2(57) );
+ R2( c, d, a, b, g, h, e, f, T(54), W1(54), W2(58) );
+ R2( b, c, d, a, f, g, h, e, T(55), W1(55), W2(59) );
+ R2( a, b, c, d, e, f, g, h, T(56), W1(56), W2(60) );
+ R2( d, a, b, c, h, e, f, g, T(57), W1(57), W2(61) );
+ R2( c, d, a, b, g, h, e, f, T(58), W1(58), W2(62) );
+ R2( b, c, d, a, f, g, h, e, T(59), W1(59), W2(63) );
+ R2( a, b, c, d, e, f, g, h, T(60), W1(60), W2(64) );
+ R2( d, a, b, c, h, e, f, g, T(61), W1(61), W2(65) );
+ R2( c, d, a, b, g, h, e, f, T(62), W1(62), W2(66) );
+ R2( b, c, d, a, f, g, h, e, T(63), W1(63), W2(67) );
+
+ dbg_printf("%2d %08x %08x %08x %08x %08x %08x %08x %08x\n",
+ j, a, b, c, d, e, f, g, h);
+
+ a = ctx->state[0] ^= a;
+ b = ctx->state[1] ^= b;
+ c = ctx->state[2] ^= c;
+ d = ctx->state[3] ^= d;
+ e = ctx->state[4] ^= e;
+ f = ctx->state[5] ^= f;
+ g = ctx->state[6] ^= g;
+ h = ctx->state[7] ^= h;
+ }
+}
+
+#endif
+
+/*
+ * Hey Emacs!
+ * Local Variables:
+ * coding: utf-8
+ * End:
+ */