andre@0: /* This Source Code Form is subject to the terms of the Mozilla Public andre@0: * License, v. 2.0. If a copy of the MPL was not distributed with this andre@0: * file, You can obtain one at http://mozilla.org/MPL/2.0/. */ andre@0: andre@0: #ifdef FREEBL_NO_DEPEND andre@0: #include "stubs.h" andre@0: #endif andre@0: #include "blapii.h" andre@0: #include "blapit.h" andre@0: #include "gcm.h" andre@0: #include "ctr.h" andre@0: #include "secerr.h" andre@0: #include "prtypes.h" andre@0: #include "pkcs11t.h" andre@0: andre@0: #include andre@0: andre@0: /************************************************************************** andre@0: * First implement the Galois hash function of GCM (gcmHash) * andre@0: **************************************************************************/ andre@0: #define GCM_HASH_LEN_LEN 8 /* gcm hash defines lengths to be 64 bits */ andre@0: andre@0: typedef struct gcmHashContextStr gcmHashContext; andre@0: andre@0: static SECStatus gcmHash_InitContext(gcmHashContext *hash, andre@0: const unsigned char *H, andre@0: unsigned int blocksize); andre@0: static void gcmHash_DestroyContext(gcmHashContext *ghash, PRBool freeit); andre@0: static SECStatus gcmHash_Update(gcmHashContext *ghash, andre@0: const unsigned char *buf, unsigned int len, andre@0: unsigned int blocksize); andre@0: static SECStatus gcmHash_Sync(gcmHashContext *ghash, unsigned int blocksize); andre@0: static SECStatus gcmHash_Final(gcmHashContext *gcm, unsigned char *outbuf, andre@0: unsigned int *outlen, unsigned int maxout, andre@0: unsigned int blocksize); andre@0: static SECStatus gcmHash_Reset(gcmHashContext *ghash, andre@0: const unsigned char *inbuf, andre@0: unsigned int inbufLen, unsigned int blocksize); andre@0: andre@0: /* compile time defines to select how the GF2 multiply is calculated. andre@0: * There are currently 2 algorithms implemented here: MPI and ALGORITHM_1. andre@0: * andre@0: * MPI uses the GF2m implemented in mpi to support GF2 ECC. andre@0: * ALGORITHM_1 is the Algorithm 1 in both NIST SP 800-38D and andre@0: * "The Galois/Counter Mode of Operation (GCM)", McGrew & Viega. andre@0: */ andre@0: #if !defined(GCM_USE_ALGORITHM_1) && !defined(GCM_USE_MPI) andre@0: #define GCM_USE_MPI 1 /* MPI is about 5x faster with the andre@0: * same or less complexity. It's possible to use andre@0: * tables to speed things up even more */ andre@0: #endif andre@0: andre@0: /* GCM defines the bit string to be LSB first, which is exactly andre@0: * opposite everyone else, including hardware. build array andre@0: * to reverse everything. */ andre@0: static const unsigned char gcm_byte_rev[256] = { andre@0: 0x00, 0x80, 0x40, 0xc0, 0x20, 0xa0, 0x60, 0xe0, andre@0: 0x10, 0x90, 0x50, 0xd0, 0x30, 0xb0, 0x70, 0xf0, andre@0: 0x08, 0x88, 0x48, 0xc8, 0x28, 0xa8, 0x68, 0xe8, andre@0: 0x18, 0x98, 0x58, 0xd8, 0x38, 0xb8, 0x78, 0xf8, andre@0: 0x04, 0x84, 0x44, 0xc4, 0x24, 0xa4, 0x64, 0xe4, andre@0: 0x14, 0x94, 0x54, 0xd4, 0x34, 0xb4, 0x74, 0xf4, andre@0: 0x0c, 0x8c, 0x4c, 0xcc, 0x2c, 0xac, 0x6c, 0xec, andre@0: 0x1c, 0x9c, 0x5c, 0xdc, 0x3c, 0xbc, 0x7c, 0xfc, andre@0: 0x02, 0x82, 0x42, 0xc2, 0x22, 0xa2, 0x62, 0xe2, andre@0: 0x12, 0x92, 0x52, 0xd2, 0x32, 0xb2, 0x72, 0xf2, andre@0: 0x0a, 0x8a, 0x4a, 0xca, 0x2a, 0xaa, 0x6a, 0xea, andre@0: 0x1a, 0x9a, 0x5a, 0xda, 0x3a, 0xba, 0x7a, 0xfa, andre@0: 0x06, 0x86, 0x46, 0xc6, 0x26, 0xa6, 0x66, 0xe6, andre@0: 0x16, 0x96, 0x56, 0xd6, 0x36, 0xb6, 0x76, 0xf6, andre@0: 0x0e, 0x8e, 0x4e, 0xce, 0x2e, 0xae, 0x6e, 0xee, andre@0: 0x1e, 0x9e, 0x5e, 0xde, 0x3e, 0xbe, 0x7e, 0xfe, andre@0: 0x01, 0x81, 0x41, 0xc1, 0x21, 0xa1, 0x61, 0xe1, andre@0: 0x11, 0x91, 0x51, 0xd1, 0x31, 0xb1, 0x71, 0xf1, andre@0: 0x09, 0x89, 0x49, 0xc9, 0x29, 0xa9, 0x69, 0xe9, andre@0: 0x19, 0x99, 0x59, 0xd9, 0x39, 0xb9, 0x79, 0xf9, andre@0: 0x05, 0x85, 0x45, 0xc5, 0x25, 0xa5, 0x65, 0xe5, andre@0: 0x15, 0x95, 0x55, 0xd5, 0x35, 0xb5, 0x75, 0xf5, andre@0: 0x0d, 0x8d, 0x4d, 0xcd, 0x2d, 0xad, 0x6d, 0xed, andre@0: 0x1d, 0x9d, 0x5d, 0xdd, 0x3d, 0xbd, 0x7d, 0xfd, andre@0: 0x03, 0x83, 0x43, 0xc3, 0x23, 0xa3, 0x63, 0xe3, andre@0: 0x13, 0x93, 0x53, 0xd3, 0x33, 0xb3, 0x73, 0xf3, andre@0: 0x0b, 0x8b, 0x4b, 0xcb, 0x2b, 0xab, 0x6b, 0xeb, andre@0: 0x1b, 0x9b, 0x5b, 0xdb, 0x3b, 0xbb, 0x7b, 0xfb, andre@0: 0x07, 0x87, 0x47, 0xc7, 0x27, 0xa7, 0x67, 0xe7, andre@0: 0x17, 0x97, 0x57, 0xd7, 0x37, 0xb7, 0x77, 0xf7, andre@0: 0x0f, 0x8f, 0x4f, 0xcf, 0x2f, 0xaf, 0x6f, 0xef, andre@0: 0x1f, 0x9f, 0x5f, 0xdf, 0x3f, 0xbf, 0x7f, 0xff andre@0: }; andre@0: andre@0: andre@0: #ifdef GCM_TRACE andre@0: #include andre@0: andre@0: #define GCM_TRACE_X(ghash,label) { \ andre@0: unsigned char _X[MAX_BLOCK_SIZE]; int i; \ andre@0: gcm_getX(ghash, _X, blocksize); \ andre@0: printf(label,(ghash)->m); \ andre@0: for (i=0; i < blocksize; i++) printf("%02x",_X[i]); \ andre@0: printf("\n"); } andre@0: #define GCM_TRACE_BLOCK(label,buf,blocksize) {\ andre@0: printf(label); \ andre@0: for (i=0; i < blocksize; i++) printf("%02x",buf[i]); \ andre@0: printf("\n"); } andre@0: #else andre@0: #define GCM_TRACE_X(ghash,label) andre@0: #define GCM_TRACE_BLOCK(label,buf,blocksize) andre@0: #endif andre@0: andre@0: #ifdef GCM_USE_MPI andre@0: andre@0: #ifdef GCM_USE_ALGORITHM_1 andre@0: #error "Only define one of GCM_USE_MPI, GCM_USE_ALGORITHM_1" andre@0: #endif andre@0: /* use the MPI functions to calculate Xn = (Xn-1^C_i)*H mod poly */ andre@0: #include "mpi.h" andre@0: #include "secmpi.h" andre@0: #include "mplogic.h" andre@0: #include "mp_gf2m.h" andre@0: andre@0: /* state needed to handle GCM Hash function */ andre@0: struct gcmHashContextStr { andre@0: mp_int H; andre@0: mp_int X; andre@0: mp_int C_i; andre@0: const unsigned int *poly; andre@0: unsigned char buffer[MAX_BLOCK_SIZE]; andre@0: unsigned int bufLen; andre@0: int m; /* XXX what is m? */ andre@0: unsigned char counterBuf[2*GCM_HASH_LEN_LEN]; andre@0: PRUint64 cLen; andre@0: }; andre@0: andre@0: /* f = x^128 + x^7 + x^2 + x + 1 */ andre@0: static const unsigned int poly_128[] = { 128, 7, 2, 1, 0 }; andre@0: andre@0: /* sigh, GCM defines the bit strings exactly backwards from everything else */ andre@0: static void andre@0: gcm_reverse(unsigned char *target, const unsigned char *src, andre@0: unsigned int blocksize) andre@0: { andre@0: unsigned int i; andre@0: for (i=0; i < blocksize; i++) { andre@0: target[blocksize-i-1] = gcm_byte_rev[src[i]]; andre@0: } andre@0: } andre@0: andre@0: /* Initialize a gcmHashContext */ andre@0: static SECStatus andre@0: gcmHash_InitContext(gcmHashContext *ghash, const unsigned char *H, andre@0: unsigned int blocksize) andre@0: { andre@0: mp_err err = MP_OKAY; andre@0: unsigned char H_rev[MAX_BLOCK_SIZE]; andre@0: andre@0: MP_DIGITS(&ghash->H) = 0; andre@0: MP_DIGITS(&ghash->X) = 0; andre@0: MP_DIGITS(&ghash->C_i) = 0; andre@0: CHECK_MPI_OK( mp_init(&ghash->H) ); andre@0: CHECK_MPI_OK( mp_init(&ghash->X) ); andre@0: CHECK_MPI_OK( mp_init(&ghash->C_i) ); andre@0: andre@0: mp_zero(&ghash->X); andre@0: gcm_reverse(H_rev, H, blocksize); andre@0: CHECK_MPI_OK( mp_read_unsigned_octets(&ghash->H, H_rev, blocksize) ); andre@0: andre@0: /* set the irreducible polynomial. Each blocksize has its own polynomial. andre@0: * for now only blocksize 16 (=128 bits) is defined */ andre@0: switch (blocksize) { andre@0: case 16: /* 128 bits */ andre@0: ghash->poly = poly_128; andre@0: break; andre@0: default: andre@0: PORT_SetError(SEC_ERROR_INVALID_ARGS); andre@0: goto cleanup; andre@0: } andre@0: ghash->cLen = 0; andre@0: ghash->bufLen = 0; andre@0: ghash->m = 0; andre@0: PORT_Memset(ghash->counterBuf, 0, sizeof(ghash->counterBuf)); andre@0: return SECSuccess; andre@0: cleanup: andre@0: gcmHash_DestroyContext(ghash, PR_FALSE); andre@0: return SECFailure; andre@0: } andre@0: andre@0: /* Destroy a HashContext (Note we zero the digits so this function andre@0: * is idempotent if called with freeit == PR_FALSE */ andre@0: static void andre@0: gcmHash_DestroyContext(gcmHashContext *ghash, PRBool freeit) andre@0: { andre@0: mp_clear(&ghash->H); andre@0: mp_clear(&ghash->X); andre@0: mp_clear(&ghash->C_i); andre@0: MP_DIGITS(&ghash->H) = 0; andre@0: MP_DIGITS(&ghash->X) = 0; andre@0: MP_DIGITS(&ghash->C_i) = 0; andre@0: if (freeit) { andre@0: PORT_Free(ghash); andre@0: } andre@0: } andre@0: andre@0: static SECStatus andre@0: gcm_getX(gcmHashContext *ghash, unsigned char *T, unsigned int blocksize) andre@0: { andre@0: int len; andre@0: mp_err err; andre@0: unsigned char tmp_buf[MAX_BLOCK_SIZE]; andre@0: unsigned char *X; andre@0: andre@0: len = mp_unsigned_octet_size(&ghash->X); andre@0: if (len <= 0) { andre@0: PORT_SetError(SEC_ERROR_LIBRARY_FAILURE); andre@0: return SECFailure; andre@0: } andre@0: X = tmp_buf; andre@0: PORT_Assert((unsigned int)len <= blocksize); andre@0: if ((unsigned int)len > blocksize) { andre@0: PORT_SetError(SEC_ERROR_LIBRARY_FAILURE); andre@0: return SECFailure; andre@0: } andre@0: /* zero pad the result */ andre@0: if (len != blocksize) { andre@0: PORT_Memset(X,0,blocksize-len); andre@0: X += blocksize-len; andre@0: } andre@0: andre@0: err = mp_to_unsigned_octets(&ghash->X, X, len); andre@0: if (err < 0) { andre@0: PORT_SetError(SEC_ERROR_LIBRARY_FAILURE); andre@0: return SECFailure; andre@0: } andre@0: gcm_reverse(T, tmp_buf, blocksize); andre@0: return SECSuccess; andre@0: } andre@0: andre@0: static SECStatus andre@0: gcm_HashMult(gcmHashContext *ghash, const unsigned char *buf, andre@0: unsigned int count, unsigned int blocksize) andre@0: { andre@0: SECStatus rv = SECFailure; andre@0: mp_err err = MP_OKAY; andre@0: unsigned char tmp_buf[MAX_BLOCK_SIZE]; andre@0: unsigned int i; andre@0: andre@0: for (i=0; i < count; i++, buf += blocksize) { andre@0: ghash->m++; andre@0: gcm_reverse(tmp_buf, buf, blocksize); andre@0: CHECK_MPI_OK(mp_read_unsigned_octets(&ghash->C_i, tmp_buf, blocksize)); andre@0: CHECK_MPI_OK(mp_badd(&ghash->X, &ghash->C_i, &ghash->C_i)); andre@0: /* andre@0: * Looking to speed up GCM, this the the place to do it. andre@0: * There are two areas that can be exploited to speed up this code. andre@0: * andre@0: * 1) H is a constant in this multiply. We can precompute H * (0 - 255) andre@0: * at init time and this becomes an blockize xors of our table lookup. andre@0: * andre@0: * 2) poly is a constant for each blocksize. We can calculate the andre@0: * modulo reduction by a series of adds and shifts. andre@0: * andre@0: * For now we are after functionality, so we will go ahead and use andre@0: * the builtin bmulmod from mpi andre@0: */ andre@0: CHECK_MPI_OK(mp_bmulmod(&ghash->C_i, &ghash->H, andre@0: ghash->poly, &ghash->X)); andre@0: GCM_TRACE_X(ghash, "X%d = ") andre@0: } andre@0: rv = SECSuccess; andre@0: cleanup: andre@0: if (rv != SECSuccess) { andre@0: MP_TO_SEC_ERROR(err); andre@0: } andre@0: return rv; andre@0: } andre@0: andre@0: static void andre@0: gcm_zeroX(gcmHashContext *ghash) andre@0: { andre@0: mp_zero(&ghash->X); andre@0: ghash->m = 0; andre@0: } andre@0: andre@0: #endif andre@0: andre@0: #ifdef GCM_USE_ALGORITHM_1 andre@0: /* use algorithm 1 of McGrew & Viega "The Galois/Counter Mode of Operation" */ andre@0: andre@0: #define GCM_ARRAY_SIZE (MAX_BLOCK_SIZE/sizeof(unsigned long)) andre@0: andre@0: struct gcmHashContextStr { andre@0: unsigned long H[GCM_ARRAY_SIZE]; andre@0: unsigned long X[GCM_ARRAY_SIZE]; andre@0: unsigned long R; andre@0: unsigned char buffer[MAX_BLOCK_SIZE]; andre@0: unsigned int bufLen; andre@0: int m; andre@0: unsigned char counterBuf[2*GCM_HASH_LEN_LEN]; andre@0: PRUint64 cLen; andre@0: }; andre@0: andre@0: static void andre@0: gcm_bytes_to_longs(unsigned long *l, const unsigned char *c, unsigned int len) andre@0: { andre@0: int i,j; andre@0: int array_size = len/sizeof(unsigned long); andre@0: andre@0: PORT_Assert(len % sizeof(unsigned long) == 0); andre@0: for (i=0; i < array_size; i++) { andre@0: unsigned long tmp = 0; andre@0: int byte_offset = i * sizeof(unsigned long); andre@0: for (j=sizeof(unsigned long)-1; j >= 0; j--) { andre@0: tmp = (tmp << PR_BITS_PER_BYTE) | gcm_byte_rev[c[byte_offset+j]]; andre@0: } andre@0: l[i] = tmp; andre@0: } andre@0: } andre@0: andre@0: static void andre@0: gcm_longs_to_bytes(const unsigned long *l, unsigned char *c, unsigned int len) andre@0: { andre@0: int i,j; andre@0: int array_size = len/sizeof(unsigned long); andre@0: andre@0: PORT_Assert(len % sizeof(unsigned long) == 0); andre@0: for (i=0; i < array_size; i++) { andre@0: unsigned long tmp = l[i]; andre@0: int byte_offset = i * sizeof(unsigned long); andre@0: for (j=0; j < sizeof(unsigned long); j++) { andre@0: c[byte_offset+j] = gcm_byte_rev[tmp & 0xff]; andre@0: tmp = (tmp >> PR_BITS_PER_BYTE); andre@0: } andre@0: } andre@0: } andre@0: andre@0: andre@0: /* Initialize a gcmHashContext */ andre@0: static SECStatus andre@0: gcmHash_InitContext(gcmHashContext *ghash, const unsigned char *H, andre@0: unsigned int blocksize) andre@0: { andre@0: PORT_Memset(ghash->X, 0, sizeof(ghash->X)); andre@0: PORT_Memset(ghash->H, 0, sizeof(ghash->H)); andre@0: gcm_bytes_to_longs(ghash->H, H, blocksize); andre@0: andre@0: /* set the irreducible polynomial. Each blocksize has its own polynommial andre@0: * for now only blocksize 16 (=128 bits) is defined */ andre@0: switch (blocksize) { andre@0: case 16: /* 128 bits */ andre@0: ghash->R = (unsigned long) 0x87; /* x^7 + x^2 + x +1 */ andre@0: break; andre@0: default: andre@0: PORT_SetError(SEC_ERROR_INVALID_ARGS); andre@0: goto cleanup; andre@0: } andre@0: ghash->cLen = 0; andre@0: ghash->bufLen = 0; andre@0: ghash->m = 0; andre@0: PORT_Memset(ghash->counterBuf, 0, sizeof(ghash->counterBuf)); andre@0: return SECSuccess; andre@0: cleanup: andre@0: return SECFailure; andre@0: } andre@0: andre@0: /* Destroy a HashContext (Note we zero the digits so this function andre@0: * is idempotent if called with freeit == PR_FALSE */ andre@0: static void andre@0: gcmHash_DestroyContext(gcmHashContext *ghash, PRBool freeit) andre@0: { andre@0: if (freeit) { andre@0: PORT_Free(ghash); andre@0: } andre@0: } andre@0: andre@0: static unsigned long andre@0: gcm_shift_one(unsigned long *t, unsigned int count) andre@0: { andre@0: unsigned long carry = 0; andre@0: unsigned long nextcarry = 0; andre@0: unsigned int i; andre@0: for (i=0; i < count; i++) { andre@0: nextcarry = t[i] >> ((sizeof(unsigned long)*PR_BITS_PER_BYTE)-1); andre@0: t[i] = (t[i] << 1) | carry; andre@0: carry = nextcarry; andre@0: } andre@0: return carry; andre@0: } andre@0: andre@0: static SECStatus andre@0: gcm_getX(gcmHashContext *ghash, unsigned char *T, unsigned int blocksize) andre@0: { andre@0: gcm_longs_to_bytes(ghash->X, T, blocksize); andre@0: return SECSuccess; andre@0: } andre@0: andre@0: #define GCM_XOR(t, s, len) \ andre@0: for (l=0; l < len; l++) t[l] ^= s[l] andre@0: andre@0: static SECStatus andre@0: gcm_HashMult(gcmHashContext *ghash, const unsigned char *buf, andre@0: unsigned int count, unsigned int blocksize) andre@0: { andre@0: unsigned long C_i[GCM_ARRAY_SIZE]; andre@0: unsigned int arraysize = blocksize/sizeof(unsigned long); andre@0: unsigned int i, j, k, l; andre@0: andre@0: for (i=0; i < count; i++, buf += blocksize) { andre@0: ghash->m++; andre@0: gcm_bytes_to_longs(C_i, buf, blocksize); andre@0: GCM_XOR(C_i, ghash->X, arraysize); andre@0: /* multiply X = C_i * H */ andre@0: PORT_Memset(ghash->X, 0, sizeof(ghash->X)); andre@0: for (j=0; j < arraysize; j++) { andre@0: unsigned long H = ghash->H[j]; andre@0: for (k=0; k < sizeof(unsigned long)*PR_BITS_PER_BYTE; k++) { andre@0: if (H & 1) { andre@0: GCM_XOR(ghash->X, C_i, arraysize); andre@0: } andre@0: if (gcm_shift_one(C_i, arraysize)) { andre@0: C_i[0] = C_i[0] ^ ghash->R; andre@0: } andre@0: H = H >> 1; andre@0: } andre@0: } andre@0: GCM_TRACE_X(ghash, "X%d = ") andre@0: } andre@0: return SECSuccess; andre@0: } andre@0: andre@0: andre@0: static void andre@0: gcm_zeroX(gcmHashContext *ghash) andre@0: { andre@0: PORT_Memset(ghash->X, 0, sizeof(ghash->X)); andre@0: ghash->m = 0; andre@0: } andre@0: #endif andre@0: andre@0: /* andre@0: * implement GCM GHASH using the freebl GHASH function. The gcm_HashMult andre@0: * function always takes blocksize lengths of data. gcmHash_Update will andre@0: * format the data properly. andre@0: */ andre@0: static SECStatus andre@0: gcmHash_Update(gcmHashContext *ghash, const unsigned char *buf, andre@0: unsigned int len, unsigned int blocksize) andre@0: { andre@0: unsigned int blocks; andre@0: SECStatus rv; andre@0: andre@0: ghash->cLen += (len*PR_BITS_PER_BYTE); andre@0: andre@0: /* first deal with the current buffer of data. Try to fill it out so andre@0: * we can hash it */ andre@0: if (ghash->bufLen) { andre@0: unsigned int needed = PR_MIN(len, blocksize - ghash->bufLen); andre@0: if (needed != 0) { andre@0: PORT_Memcpy(ghash->buffer+ghash->bufLen, buf, needed); andre@0: } andre@0: buf += needed; andre@0: len -= needed; andre@0: ghash->bufLen += needed; andre@0: if (len == 0) { andre@0: /* didn't add enough to hash the data, nothing more do do */ andre@0: return SECSuccess; andre@0: } andre@0: PORT_Assert(ghash->bufLen == blocksize); andre@0: /* hash the buffer and clear it */ andre@0: rv = gcm_HashMult(ghash, ghash->buffer, 1, blocksize); andre@0: PORT_Memset(ghash->buffer, 0, blocksize); andre@0: ghash->bufLen = 0; andre@0: if (rv != SECSuccess) { andre@0: return SECFailure; andre@0: } andre@0: } andre@0: /* now hash any full blocks remaining in the data stream */ andre@0: blocks = len/blocksize; andre@0: if (blocks) { andre@0: rv = gcm_HashMult(ghash, buf, blocks, blocksize); andre@0: if (rv != SECSuccess) { andre@0: return SECFailure; andre@0: } andre@0: buf += blocks*blocksize; andre@0: len -= blocks*blocksize; andre@0: } andre@0: andre@0: /* save any remainder in the buffer to be hashed with the next call */ andre@0: if (len != 0) { andre@0: PORT_Memcpy(ghash->buffer, buf, len); andre@0: ghash->bufLen = len; andre@0: } andre@0: return SECSuccess; andre@0: } andre@0: andre@0: /* andre@0: * write out any partial blocks zero padded through the GHASH engine, andre@0: * save the lengths for the final completion of the hash andre@0: */ andre@0: static SECStatus andre@0: gcmHash_Sync(gcmHashContext *ghash, unsigned int blocksize) andre@0: { andre@0: int i; andre@0: SECStatus rv; andre@0: andre@0: /* copy the previous counter to the upper block */ andre@0: PORT_Memcpy(ghash->counterBuf, &ghash->counterBuf[GCM_HASH_LEN_LEN], andre@0: GCM_HASH_LEN_LEN); andre@0: /* copy the current counter in the lower block */ andre@0: for (i=0; i < GCM_HASH_LEN_LEN; i++) { andre@0: ghash->counterBuf[GCM_HASH_LEN_LEN+i] = andre@0: (ghash->cLen >> ((GCM_HASH_LEN_LEN-1-i)*PR_BITS_PER_BYTE)) & 0xff; andre@0: } andre@0: ghash->cLen = 0; andre@0: andre@0: /* now zero fill the buffer and hash the last block */ andre@0: if (ghash->bufLen) { andre@0: PORT_Memset(ghash->buffer+ghash->bufLen, 0, blocksize - ghash->bufLen); andre@0: rv = gcm_HashMult(ghash, ghash->buffer, 1, blocksize); andre@0: PORT_Memset(ghash->buffer, 0, blocksize); andre@0: ghash->bufLen = 0; andre@0: if (rv != SECSuccess) { andre@0: return SECFailure; andre@0: } andre@0: } andre@0: return SECSuccess; andre@0: } andre@0: andre@0: /* andre@0: * This does the final sync, hashes the lengths, then returns andre@0: * "T", the hashed output. andre@0: */ andre@0: static SECStatus andre@0: gcmHash_Final(gcmHashContext *ghash, unsigned char *outbuf, andre@0: unsigned int *outlen, unsigned int maxout, andre@0: unsigned int blocksize) andre@0: { andre@0: unsigned char T[MAX_BLOCK_SIZE]; andre@0: SECStatus rv; andre@0: andre@0: rv = gcmHash_Sync(ghash, blocksize); andre@0: if (rv != SECSuccess) { andre@0: return SECFailure; andre@0: } andre@0: andre@0: rv = gcm_HashMult(ghash, ghash->counterBuf, (GCM_HASH_LEN_LEN*2)/blocksize, andre@0: blocksize); andre@0: if (rv != SECSuccess) { andre@0: return SECFailure; andre@0: } andre@0: andre@0: GCM_TRACE_X(ghash, "GHASH(H,A,C) = ") andre@0: andre@0: rv = gcm_getX(ghash, T, blocksize); andre@0: if (rv != SECSuccess) { andre@0: return SECFailure; andre@0: } andre@0: andre@0: if (maxout > blocksize) maxout = blocksize; andre@0: PORT_Memcpy(outbuf, T, maxout); andre@0: *outlen = maxout; andre@0: return SECSuccess; andre@0: } andre@0: andre@0: SECStatus andre@0: gcmHash_Reset(gcmHashContext *ghash, const unsigned char *AAD, andre@0: unsigned int AADLen, unsigned int blocksize) andre@0: { andre@0: SECStatus rv; andre@0: andre@0: ghash->cLen = 0; andre@0: PORT_Memset(ghash->counterBuf, 0, GCM_HASH_LEN_LEN*2); andre@0: ghash->bufLen = 0; andre@0: gcm_zeroX(ghash); andre@0: andre@0: /* now kick things off by hashing the Additional Authenticated Data */ andre@0: if (AADLen != 0) { andre@0: rv = gcmHash_Update(ghash, AAD, AADLen, blocksize); andre@0: if (rv != SECSuccess) { andre@0: return SECFailure; andre@0: } andre@0: rv = gcmHash_Sync(ghash, blocksize); andre@0: if (rv != SECSuccess) { andre@0: return SECFailure; andre@0: } andre@0: } andre@0: return SECSuccess; andre@0: } andre@0: andre@0: /************************************************************************** andre@0: * Now implement the GCM using gcmHash and CTR * andre@0: **************************************************************************/ andre@0: andre@0: /* state to handle the full GCM operation (hash and counter) */ andre@0: struct GCMContextStr { andre@0: gcmHashContext ghash_context; andre@0: CTRContext ctr_context; andre@0: unsigned long tagBits; andre@0: unsigned char tagKey[MAX_BLOCK_SIZE]; andre@0: }; andre@0: andre@0: GCMContext * andre@0: GCM_CreateContext(void *context, freeblCipherFunc cipher, andre@0: const unsigned char *params, unsigned int blocksize) andre@0: { andre@0: GCMContext *gcm = NULL; andre@0: gcmHashContext *ghash; andre@0: unsigned char H[MAX_BLOCK_SIZE]; andre@0: unsigned int tmp; andre@0: PRBool freeCtr = PR_FALSE; andre@0: PRBool freeHash = PR_FALSE; andre@0: const CK_GCM_PARAMS *gcmParams = (const CK_GCM_PARAMS *)params; andre@0: CK_AES_CTR_PARAMS ctrParams; andre@0: SECStatus rv; andre@0: andre@0: if (blocksize > MAX_BLOCK_SIZE || blocksize > sizeof(ctrParams.cb)) { andre@0: PORT_SetError(SEC_ERROR_LIBRARY_FAILURE); andre@0: return NULL; andre@0: } andre@0: gcm = PORT_ZNew(GCMContext); andre@0: if (gcm == NULL) { andre@0: return NULL; andre@0: } andre@0: /* first fill in the ghash context */ andre@0: ghash = &gcm->ghash_context; andre@0: PORT_Memset(H, 0, blocksize); andre@0: rv = (*cipher)(context, H, &tmp, blocksize, H, blocksize, blocksize); andre@0: if (rv != SECSuccess) { andre@0: goto loser; andre@0: } andre@0: rv = gcmHash_InitContext(ghash, H, blocksize); andre@0: if (rv != SECSuccess) { andre@0: goto loser; andre@0: } andre@0: freeHash = PR_TRUE; andre@0: andre@0: /* fill in the Counter context */ andre@0: ctrParams.ulCounterBits = 32; andre@0: PORT_Memset(ctrParams.cb, 0, sizeof(ctrParams.cb)); andre@0: if ((blocksize == 16) && (gcmParams->ulIvLen == 12)) { andre@0: PORT_Memcpy(ctrParams.cb, gcmParams->pIv, gcmParams->ulIvLen); andre@0: ctrParams.cb[blocksize-1] = 1; andre@0: } else { andre@0: rv = gcmHash_Update(ghash, gcmParams->pIv, gcmParams->ulIvLen, andre@0: blocksize); andre@0: if (rv != SECSuccess) { andre@0: goto loser; andre@0: } andre@0: rv = gcmHash_Final(ghash, ctrParams.cb, &tmp, blocksize, blocksize); andre@0: if (rv != SECSuccess) { andre@0: goto loser; andre@0: } andre@0: } andre@0: rv = CTR_InitContext(&gcm->ctr_context, context, cipher, andre@0: (unsigned char *)&ctrParams, blocksize); andre@0: if (rv != SECSuccess) { andre@0: goto loser; andre@0: } andre@0: freeCtr = PR_TRUE; andre@0: andre@0: /* fill in the gcm structure */ andre@0: gcm->tagBits = gcmParams->ulTagBits; /* save for final step */ andre@0: /* calculate the final tag key. NOTE: gcm->tagKey is zero to start with. andre@0: * if this assumption changes, we would need to explicitly clear it here */ andre@0: rv = CTR_Update(&gcm->ctr_context, gcm->tagKey, &tmp, blocksize, andre@0: gcm->tagKey, blocksize, blocksize); andre@0: if (rv != SECSuccess) { andre@0: goto loser; andre@0: } andre@0: andre@0: /* finally mix in the AAD data */ andre@0: rv = gcmHash_Reset(ghash, gcmParams->pAAD, gcmParams->ulAADLen, blocksize); andre@0: if (rv != SECSuccess) { andre@0: goto loser; andre@0: } andre@0: andre@0: return gcm; andre@0: andre@0: loser: andre@0: if (freeCtr) { andre@0: CTR_DestroyContext(&gcm->ctr_context, PR_FALSE); andre@0: } andre@0: if (freeHash) { andre@0: gcmHash_DestroyContext(&gcm->ghash_context, PR_FALSE); andre@0: } andre@0: if (gcm) { andre@0: PORT_Free(gcm); andre@0: } andre@0: return NULL; andre@0: } andre@0: andre@0: void andre@0: GCM_DestroyContext(GCMContext *gcm, PRBool freeit) andre@0: { andre@0: /* these two are statically allocated and will be freed when we free andre@0: * gcm. call their destroy functions to free up any locally andre@0: * allocated data (like mp_int's) */ andre@0: CTR_DestroyContext(&gcm->ctr_context, PR_FALSE); andre@0: gcmHash_DestroyContext(&gcm->ghash_context, PR_FALSE); andre@0: if (freeit) { andre@0: PORT_Free(gcm); andre@0: } andre@0: } andre@0: andre@0: static SECStatus andre@0: gcm_GetTag(GCMContext *gcm, unsigned char *outbuf, andre@0: unsigned int *outlen, unsigned int maxout, andre@0: unsigned int blocksize) andre@0: { andre@0: unsigned int tagBytes; andre@0: unsigned int extra; andre@0: unsigned int i; andre@0: SECStatus rv; andre@0: andre@0: tagBytes = (gcm->tagBits + (PR_BITS_PER_BYTE-1)) / PR_BITS_PER_BYTE; andre@0: extra = tagBytes*PR_BITS_PER_BYTE - gcm->tagBits; andre@0: andre@0: if (outbuf == NULL) { andre@0: *outlen = tagBytes; andre@0: PORT_SetError(SEC_ERROR_OUTPUT_LEN); andre@0: return SECFailure; andre@0: } andre@0: andre@0: if (maxout < tagBytes) { andre@0: *outlen = tagBytes; andre@0: PORT_SetError(SEC_ERROR_OUTPUT_LEN); andre@0: return SECFailure; andre@0: } andre@0: maxout = tagBytes; andre@0: rv = gcmHash_Final(&gcm->ghash_context, outbuf, outlen, maxout, blocksize); andre@0: if (rv != SECSuccess) { andre@0: return SECFailure; andre@0: } andre@0: andre@0: GCM_TRACE_BLOCK("GHASH=", outbuf, blocksize); andre@0: GCM_TRACE_BLOCK("Y0=", gcm->tagKey, blocksize); andre@0: for (i=0; i < *outlen; i++) { andre@0: outbuf[i] ^= gcm->tagKey[i]; andre@0: } andre@0: GCM_TRACE_BLOCK("Y0=", gcm->tagKey, blocksize); andre@0: GCM_TRACE_BLOCK("T=", outbuf, blocksize); andre@0: /* mask off any extra bits we got */ andre@0: if (extra) { andre@0: outbuf[tagBytes-1] &= ~((1 << extra)-1); andre@0: } andre@0: return SECSuccess; andre@0: } andre@0: andre@0: andre@0: /* andre@0: * See The Galois/Counter Mode of Operation, McGrew and Viega. andre@0: * GCM is basically counter mode with a specific initialization and andre@0: * built in macing operation. andre@0: */ andre@0: SECStatus andre@0: GCM_EncryptUpdate(GCMContext *gcm, unsigned char *outbuf, andre@0: unsigned int *outlen, unsigned int maxout, andre@0: const unsigned char *inbuf, unsigned int inlen, andre@0: unsigned int blocksize) andre@0: { andre@0: SECStatus rv; andre@0: unsigned int tagBytes; andre@0: unsigned int len; andre@0: andre@0: tagBytes = (gcm->tagBits + (PR_BITS_PER_BYTE-1)) / PR_BITS_PER_BYTE; andre@0: if (UINT_MAX - inlen < tagBytes) { andre@0: PORT_SetError(SEC_ERROR_INPUT_LEN); andre@0: return SECFailure; andre@0: } andre@0: if (maxout < inlen + tagBytes) { andre@0: *outlen = inlen + tagBytes; andre@0: PORT_SetError(SEC_ERROR_OUTPUT_LEN); andre@0: return SECFailure; andre@0: } andre@0: andre@0: rv = CTR_Update(&gcm->ctr_context, outbuf, outlen, maxout, andre@0: inbuf, inlen, blocksize); andre@0: if (rv != SECSuccess) { andre@0: return SECFailure; andre@0: } andre@0: rv = gcmHash_Update(&gcm->ghash_context, outbuf, *outlen, blocksize); andre@0: if (rv != SECSuccess) { andre@0: PORT_Memset(outbuf, 0, *outlen); /* clear the output buffer */ andre@0: *outlen = 0; andre@0: return SECFailure; andre@0: } andre@0: rv = gcm_GetTag(gcm, outbuf + *outlen, &len, maxout - *outlen, blocksize); andre@0: if (rv != SECSuccess) { andre@0: PORT_Memset(outbuf, 0, *outlen); /* clear the output buffer */ andre@0: *outlen = 0; andre@0: return SECFailure; andre@0: }; andre@0: *outlen += len; andre@0: return SECSuccess; andre@0: } andre@0: andre@0: /* andre@0: * See The Galois/Counter Mode of Operation, McGrew and Viega. andre@0: * GCM is basically counter mode with a specific initialization and andre@0: * built in macing operation. NOTE: the only difference between Encrypt andre@0: * and Decrypt is when we calculate the mac. That is because the mac must andre@0: * always be calculated on the cipher text, not the plain text, so for andre@0: * encrypt, we do the CTR update first and for decrypt we do the mac first. andre@0: */ andre@0: SECStatus andre@0: GCM_DecryptUpdate(GCMContext *gcm, unsigned char *outbuf, andre@0: unsigned int *outlen, unsigned int maxout, andre@0: const unsigned char *inbuf, unsigned int inlen, andre@0: unsigned int blocksize) andre@0: { andre@0: SECStatus rv; andre@0: unsigned int tagBytes; andre@0: unsigned char tag[MAX_BLOCK_SIZE]; andre@0: const unsigned char *intag; andre@0: unsigned int len; andre@0: andre@0: tagBytes = (gcm->tagBits + (PR_BITS_PER_BYTE-1)) / PR_BITS_PER_BYTE; andre@0: andre@0: /* get the authentication block */ andre@0: if (inlen < tagBytes) { andre@0: PORT_SetError(SEC_ERROR_INPUT_LEN); andre@0: return SECFailure; andre@0: } andre@0: andre@0: inlen -= tagBytes; andre@0: intag = inbuf + inlen; andre@0: andre@0: /* verify the block */ andre@0: rv = gcmHash_Update(&gcm->ghash_context, inbuf, inlen, blocksize); andre@0: if (rv != SECSuccess) { andre@0: return SECFailure; andre@0: } andre@0: rv = gcm_GetTag(gcm, tag, &len, blocksize, blocksize); andre@0: if (rv != SECSuccess) { andre@0: return SECFailure; andre@0: } andre@0: /* Don't decrypt if we can't authenticate the encrypted data! andre@0: * This assumes that if tagBits is not a multiple of 8, intag will andre@0: * preserve the masked off missing bits. */ andre@0: if (NSS_SecureMemcmp(tag, intag, tagBytes) != 0) { andre@0: /* force a CKR_ENCRYPTED_DATA_INVALID error at in softoken */ andre@0: PORT_SetError(SEC_ERROR_BAD_DATA); andre@0: return SECFailure; andre@0: } andre@0: /* finish the decryption */ andre@0: return CTR_Update(&gcm->ctr_context, outbuf, outlen, maxout, andre@0: inbuf, inlen, blocksize); andre@0: }