* imported implementation of NLS-v2.
/* $Id: nlsfast.c 444 2006-05-17 07:41:23Z mwp $ */
/* nlsfast: NLS stream cipher and Mundja MAC -- fast implementation */
/* This is "tweaked" to support non-word-multiple keys and
* variable "Konst" to address Joe Cho's attack.
*/
/*
THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE AND AGAINST
INFRINGEMENT ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR
CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
/* interface, multiplication table and SBox */
#include <stdlib.h>
#include <string.h>
#include "nls.h"
#include "nlssbox.h"
#include "nlsmultab.h"
/*
* FOLD is how many register cycles need to be performed after combining the
* last byte of key and non-linear feedback, before every byte depends on every
* byte of the key. This depends on the feedback and nonlinear functions, and
* on where they are combined into the register.
*/
#define FOLD N /* how many iterations of folding to do */
#define INITKONST 0x6996c53a /* value of KONST to use during key loading */
#define KEYP 15 /* where to insert key words */
#define FOLDP 4 /* where to insert non-linear feedback */
#if NLS_LONG_OUTPUT
#define CTRP 2 /* where to insert counter to avoid small cycles */
#endif /*NLS_LONG_OUTPUT*/
#define Byte(x,i) ((UCHAR)(((x) >> (8*i)) & 0xFF))
/* define IS_LITTLE_ENDIAN for faster operation when appropriate */
#ifdef IS_LITTLE_ENDIAN
/* Useful macros -- little endian words on a little endian machine */
#define BYTE2WORD(b) (*(WORD *)(b))
#define WORD2BYTE(w, b) ((*(WORD *)(b)) = w)
#define XORWORD(w, b) ((*(WORD *)(b)) ^= w)
#else
/* Useful macros -- machine independent little-endian version */
#define BYTE2WORD(b) ( \
(((WORD)(b)[3] & 0xFF)<<24) | \
(((WORD)(b)[2] & 0xFF)<<16) | \
(((WORD)(b)[1] & 0xFF)<<8) | \
(((WORD)(b)[0] & 0xFF)) \
)
#define WORD2BYTE(w, b) { \
(b)[3] = Byte(w,3); \
(b)[2] = Byte(w,2); \
(b)[1] = Byte(w,1); \
(b)[0] = Byte(w,0); \
}
#define XORWORD(w, b) { \
(b)[3] ^= Byte(w,3); \
(b)[2] ^= Byte(w,2); \
(b)[1] ^= Byte(w,1); \
(b)[0] ^= Byte(w,0); \
}
#endif
#if NLS_LONG_OUTPUT
#define ZEROCOUNTER(c) c->CtrModF16 = c->CtrMod232 = 0
#else
#define ZEROCOUNTER(c) /* nothing */
#endif /*NLS_LONG_OUTPUT*/
/* give correct offset for the current position of the register,
* where logically R[0] is at position "zero".
*/
#define OFF(zero, i) (((zero)+(i)) % N)
/* Return a non-linear function of some parts of the register.
*/
#define NLFUNC(c,z) \
(c->R[OFF(z,0)] + c->R[OFF(z,16)]) \
^ (c->R[OFF(z,1)] + c->R[OFF(z,13)]) \
^ (c->R[OFF(z,6)] + c->konst)
#if NLS_LONG_OUTPUT
/* Increment counter and mix into register every so often */
#define FIXCTR(c,z) \
{ \
if (++c->CtrModF16 == F16) { \
c->CtrMod232 += c->CtrModF16; \
c->R[OFF(z,CTRP)] += c->CtrMod232; \
c->CtrModF16 = 0; /* account for konst generation */ \
c->konst = NLFUNC(c,z); \
cycle(c); \
} \
}
#endif /*NLS_LONG_OUTPUT*/
static WORD
nltap(nls_ctx *c)
{
return NLFUNC(c, 0);
}
/* step the shift register */
/* After stepping, "zero" moves right one place */
#define STEP(c,z) \
{ register WORD t; \
t = ROTL(c->R[OFF(z,0)],19) + ROTL(c->R[OFF(z,15)],9) + c->konst; \
t ^= Sbox[(t >> 24) & 0xFF]; \
c->R[OFF(z,0)] = t ^ c->R[OFF(z,4)]; \
}
static void
cycle(nls_ctx *c)
{
WORD t;
int i;
/* nonlinear feedback function */
STEP(c,0);
/* shift register */
t = c->R[0];
for (i = 1; i < N; ++i)
c->R[i-1] = c->R[i];
c->R[N-1] = t;
#if NLS_LONG_OUTPUT
FIXCTR(c,0);
#endif /*NLS_LONG_OUTPUT*/
}
/* The Mundja MAC function is modelled after the round function of SHA-256.
* The following lines establish aliases for the MAC accumulator, just
* so that the definition of that function looks more like FIPS-180-2.
*/
#define A c->M[0]
#define B c->M[1]
#define C c->M[2]
#define D c->M[3]
#define E c->M[4]
#define F c->M[5]
#define G c->M[6]
#define H c->M[7]
#define SIGMA0(x) (ROTR((x), 2) ^ ROTR((x), 13) ^ ROTR((x), 22))
#define SIGMA1(x) (ROTR((x), 6) ^ ROTR((x), 11) ^ ROTR((x), 25))
#define CHOOSE(x,y,z) (z ^ (x & (y ^ z)))
#define MAJORITY(x,y,z) ((x & y) | (z & (x | y)))
/* Accumulate a nonlinear function of a register word and an input word for MAC.
* Except for the added S-Box and SOBER LFSR input instead of constants,
* this is exactly a round of SHA-256.
*/
#define SHAFUNC(c,i,k,A,B,C,D,E,F,G,H) \
{ \
WORD t1; \
t1 = H + k + i; \
t1 ^= Sbox[(t1 >> 24) & 0xFF]; \
t1 += SIGMA1(E) + CHOOSE(E, F, G); \
D += t1; \
t1 += SIGMA0(A) + MAJORITY(A, B, C); \
H = t1; \
}
static void
shafunc(nls_ctx *c, WORD i)
{
WORD t;
SHAFUNC(c, i, c->R[MACKONST], A, B, C, D, E, F, G, H);
/* now correct alignment of MAC accumulator */
t = c->M[NMAC-1];
for (i = NMAC-1; i > 0; --i)
c->M[i] = c->M[i-1];
c->M[0] = t;
}
/* Accumulate a CRC of input words, later to be fed into MAC.
*/
#define CRCFUNC(c,i,zero,five) \
{ \
WORD t1; \
t1 = (c->CRC[zero] << 8) ^ Multab[(c->CRC[zero] >> 24) & 0xFF] \
^ c->CRC[five] ^ i; \
c->CRC[zero] = t1; \
}
static void
crcfunc(nls_ctx *c, WORD i)
{
WORD t;
CRCFUNC(c, i, 0, 5);
/* now correct alignment of CRC accumulator */
t = c->CRC[0];
for (i = 1; i < NMAC; ++i)
c->CRC[i-1] = c->CRC[i];
c->CRC[NMAC-1] = t;
}
/* Normal MAC word processing: do both SHA and CRC.
*/
static void
macfunc(nls_ctx *c, WORD i)
{
crcfunc(c, i);
shafunc(c, i);
}
/* initialise to known state
*/
static void
nls_initstate(nls_ctx *c)
{
int i;
/* Register initialised to Fibonacci numbers */
c->R[0] = 1;
c->R[1] = 1;
for (i = 2; i < N; ++i)
c->R[i] = c->R[i-1] + c->R[i-2];
c->konst = INITKONST;
ZEROCOUNTER(c);
}
/* Save the current register state
*/
static void
nls_savestate(nls_ctx *c)
{
int i;
for (i = 0; i < N; ++i)
c->initR[i] = c->R[i];
}
/* initialise to previously saved register state
*/
static void
nls_reloadstate(nls_ctx *c)
{
int i;
for (i = 0; i < N; ++i)
c->R[i] = c->initR[i];
ZEROCOUNTER(c);
}
/* Initialise "konst"
* Tweak -- since Konst now changes regularly, there is no reason
* to avoid a zero high byte.
*/
static void
nls_genkonst(nls_ctx *c)
{
cycle(c);
c->konst = nltap(c);
}
/* Load key material into the register
*/
#define ADDKEY(k) \
c->R[KEYP] += (k);
#define XORNL(nl) \
c->R[FOLDP] ^= (nl);
/* nonlinear diffusion of register for key and MAC */
#define DROUND(z) STEP(c,z); c->R[OFF((z+1),FOLDP)] ^= NLFUNC(c,(z+1));
static void
nls_diffuse(nls_ctx *c)
{
/* relies on FOLD == N! */
DROUND(0);
DROUND(1);
DROUND(2);
DROUND(3);
DROUND(4);
DROUND(5);
DROUND(6);
DROUND(7);
DROUND(8);
DROUND(9);
DROUND(10);
DROUND(11);
DROUND(12);
DROUND(13);
DROUND(14);
DROUND(15);
DROUND(16);
}
/* common actions for loading key material */
/* Tweak: allow non-word-multiple key and nonce materianl
*/
static void
nls_loadkey(nls_ctx *c, UCHAR key[], int keylen)
{
int i, j;
WORD k;
UCHAR xtra[4];
/* start folding in key */
for (i = 0; i < (keylen & ~0x3); i += 4)
{
k = BYTE2WORD(&key[i]);
ADDKEY(k);
cycle(c);
XORNL(nltap(c));
}
/* if there were any extra key bytes, zero pad to a word */
if (i < keylen) {
for (j = 0 /* i unchanged */; i < keylen; ++i)
xtra[j++] = key[i];
for (/* j unchanged */; j < 4; ++j)
xtra[j] = 0;
k = BYTE2WORD(xtra);
ADDKEY(k);
cycle(c);
XORNL(nltap(c));
}
/* also fold in the length of the key */
ADDKEY(keylen);
/* now diffuse */
nls_diffuse(c);
}
/* initialise MAC related registers
*/
void
nls_macinit(nls_ctx *c)
{
int i;
for (i = 0; i < NMAC; ++i) {
c->M[i] = c->R[i];
c->CRC[i] = c->R[i+NMAC];
}
}
/* Published "key" interface
*/
void
nls_key(nls_ctx *c, UCHAR key[], int keylen)
{
nls_initstate(c);
nls_loadkey(c, key, keylen);
nls_genkonst(c);
nls_savestate(c);
nls_macinit(c);
c->nbuf = 0;
ZEROCOUNTER(c);
}
/* Published "nonce" interface
*/
void
nls_nonce(nls_ctx *c, UCHAR nonce[], int noncelen)
{
nls_reloadstate(c);
c->konst = INITKONST; /* TWEAK */
nls_loadkey(c, nonce, noncelen);
nls_genkonst(c); /* TWEAK */
nls_macinit(c);
c->nbuf = 0;
ZEROCOUNTER(c);
}
/* XOR pseudo-random bytes into buffer
* Note: doesn't play well with MAC functions.
*/
#define SROUND(z) STEP(c,z); t = NLFUNC(c,(z+1)); XORWORD(t, buf+(z*4));
void
nls_stream(nls_ctx *c, UCHAR *buf, int nbytes)
{
WORD t = 0;
/* handle any previously buffered bytes */
while (c->nbuf != 0 && nbytes != 0) {
*buf++ ^= c->sbuf & 0xFF;
c->sbuf >>= 8;
c->nbuf -= 8;
--nbytes;
}
/* do lots at a time, if there's enough to do */
while (nbytes >= N*4)
{
#if NLS_LONG_OUTPUT
if (c->CtrModF16 < (F16-18)) {
#endif /*NLS_LONG_OUTPUT*/
SROUND(0);
SROUND(1);
SROUND(2);
SROUND(3);
SROUND(4);
SROUND(5);
SROUND(6);
SROUND(7);
SROUND(8);
SROUND(9);
SROUND(10);
SROUND(11);
SROUND(12);
SROUND(13);
SROUND(14);
SROUND(15);
SROUND(16);
buf += 4*N;
nbytes -= N*4;
#if NLS_LONG_OUTPUT
c->CtrModF16 += 17;
}
else {
do {
cycle(c);
t = nltap(c);
XORWORD(t, buf);
buf += 4;
nbytes -= 4;
} while (F16-18 < c->CtrModF16);
}
#endif /*NLS_LONG_OUTPUT*/
}
/* do small or odd size buffers the slow way */
while (4 <= nbytes) {
cycle(c);
t = nltap(c);
XORWORD(t, buf);
buf += 4;
nbytes -= 4;
}
/* handle any trailing bytes */
if (nbytes != 0) {
cycle(c);
c->sbuf = nltap(c);
c->nbuf = 32;
while (c->nbuf != 0 && nbytes != 0) {
*buf++ ^= c->sbuf & 0xFF;
c->sbuf >>= 8;
c->nbuf -= 8;
--nbytes;
}
}
}
/* accumulate words into MAC without encryption
* Note that plaintext is accumulated for MAC.
*/
#define MROUND(z,A,B,C,D,E,F,G,H) \
t = BYTE2WORD(buf+(z*4)); \
STEP(c,z); \
CRCFUNC(c,t,((z)&0x7),(((z)+5)&0x7)); \
SHAFUNC(c,t,c->R[OFF(z+1,MACKONST)],A,B,C,D,E,F,G,H);
void
nls_maconly(nls_ctx *c, UCHAR *buf, int nbytes)
{
int i;
WORD t = 0;
/* handle any previously buffered bytes */
if (c->nbuf != 0) {
while (c->nbuf != 0 && nbytes != 0) {
c->mbuf ^= (*buf++) << (32 - c->nbuf);
c->nbuf -= 8;
--nbytes;
}
if (c->nbuf != 0) /* not a whole word yet */
return;
/* LFSR already cycled */
macfunc(c, c->mbuf);
}
/* do lots at a time, if there's enough to do */
while (4*N <= nbytes)
{
#if NLS_LONG_OUTPUT
if (c->CtrModF16 < (F16-18)) {
#endif /*NLS_LONG_OUTPUT*/
MROUND( 0,A,B,C,D,E,F,G,H);
MROUND( 1,H,A,B,C,D,E,F,G);
MROUND( 2,G,H,A,B,C,D,E,F);
MROUND( 3,F,G,H,A,B,C,D,E);
MROUND( 4,E,F,G,H,A,B,C,D);
MROUND( 5,D,E,F,G,H,A,B,C);
MROUND( 6,C,D,E,F,G,H,A,B);
MROUND( 7,B,C,D,E,F,G,H,A);
MROUND( 8,A,B,C,D,E,F,G,H);
MROUND( 9,H,A,B,C,D,E,F,G);
MROUND(10,G,H,A,B,C,D,E,F);
MROUND(11,F,G,H,A,B,C,D,E);
MROUND(12,E,F,G,H,A,B,C,D);
MROUND(13,D,E,F,G,H,A,B,C);
MROUND(14,C,D,E,F,G,H,A,B);
MROUND(15,B,C,D,E,F,G,H,A);
MROUND(16,A,B,C,D,E,F,G,H);
buf += 4*N;
nbytes -= 4*N;
/* fix alignment of MAC buffer */
t = c->M[NMAC-1];
for (i = NMAC-1; i > 0; --i)
c->M[i] = c->M[i-1];
c->M[0] = t;
/* fix alignment of CRC buffer */
t = c->CRC[0];
for (i = 1; i < NMAC; ++i)
c->CRC[i-1] = c->CRC[i];
c->CRC[NMAC-1] = t;
#if NLS_LONG_OUTPUT
c->CtrModF16 += 17;
}
else {
do {
cycle(c);
macfunc(c, BYTE2WORD(buf));
buf += 4;
nbytes -= 4;
} while (F16-18 < c->CtrModF16);
}
#endif /*NLS_LONG_OUTPUT*/
}
/* do small or odd size buffers the slow way */
while (4 <= nbytes) {
cycle(c);
macfunc(c, BYTE2WORD(buf));
buf += 4;
nbytes -= 4;
}
/* handle any trailing bytes */
if (nbytes != 0) {
cycle(c);
c->sbuf = nltap(c);
c->mbuf = 0;
c->nbuf = 32;
while (nbytes != 0) {
c->mbuf ^= (*buf++) << (32 - c->nbuf);
c->nbuf -= 8;
--nbytes;
}
}
}
/* Combined MAC and encryption.
* Note that plaintext is accumulated for MAC.
*/
#define EROUND(z,A,B,C,D,E,F,G,H) \
STEP(c,z); \
t3 = BYTE2WORD(buf+(z*4)); \
CRCFUNC(c,t3,((z)&0x7),(((z)+5)&0x7)); \
SHAFUNC(c,t3,c->R[OFF(z+1,MACKONST)],A,B,C,D,E,F,G,H); \
t = NLFUNC(c,(z+1)); \
t ^= t3; \
WORD2BYTE(t,buf+(z*4));
void
nls_encrypt(nls_ctx *c, UCHAR *buf, int nbytes)
{
WORD t = 0, t3 = 0;
int i;
/* handle any previously buffered bytes */
if (c->nbuf != 0) {
while (c->nbuf != 0 && nbytes != 0) {
c->mbuf ^= *buf << (32 - c->nbuf);
*buf ^= (c->sbuf >> (32 - c->nbuf)) & 0xFF;
++buf;
c->nbuf -= 8;
--nbytes;
}
if (c->nbuf != 0) /* not a whole word yet */
return;
/* LFSR already cycled */
macfunc(c, c->mbuf);
}
/* do lots at a time, if there's enough to do */
while (4*N <= nbytes)
{
#if NLS_LONG_OUTPUT
if (c->CtrModF16 < (F16-18)) {
#endif /*NLS_LONG_OUTPUT*/
EROUND( 0,A,B,C,D,E,F,G,H);
EROUND( 1,H,A,B,C,D,E,F,G);
EROUND( 2,G,H,A,B,C,D,E,F);
EROUND( 3,F,G,H,A,B,C,D,E);
EROUND( 4,E,F,G,H,A,B,C,D);
EROUND( 5,D,E,F,G,H,A,B,C);
EROUND( 6,C,D,E,F,G,H,A,B);
EROUND( 7,B,C,D,E,F,G,H,A);
EROUND( 8,A,B,C,D,E,F,G,H);
EROUND( 9,H,A,B,C,D,E,F,G);
EROUND(10,G,H,A,B,C,D,E,F);
EROUND(11,F,G,H,A,B,C,D,E);
EROUND(12,E,F,G,H,A,B,C,D);
EROUND(13,D,E,F,G,H,A,B,C);
EROUND(14,C,D,E,F,G,H,A,B);
EROUND(15,B,C,D,E,F,G,H,A);
EROUND(16,A,B,C,D,E,F,G,H);
buf += 4*N;
nbytes -= 4*N;
/* fix alignment of MAC buffer */
t = c->M[7];
for (i = NMAC-1; i > 0; --i)
c->M[i] = c->M[i-1];
c->M[0] = t;
/* fix alignment of CRC buffer */
t = c->CRC[0];
for (i = 1; i < NMAC; ++i)
c->CRC[i-1] = c->CRC[i];
c->CRC[NMAC-1] = t;
#if NLS_LONG_OUTPUT
c->CtrModF16 += 17;
}
else {
do {
cycle(c);
t = BYTE2WORD(buf);
macfunc(c, t);
t ^= nltap(c);
WORD2BYTE(t, buf);
buf += 4;
nbytes -= 4;
} while (F16-18 < c->CtrModF16);
}
#endif /*NLS_LONG_OUTPUT*/
}
/* do small or odd size buffers the slow way */
while (4 <= nbytes) {
cycle(c);
t = BYTE2WORD(buf);
macfunc(c, t);
t ^= nltap(c);
WORD2BYTE(t, buf);
nbytes -= 4;
buf += 4;
}
/* handle any trailing bytes */
if (nbytes != 0) {
cycle(c);
c->sbuf = nltap(c);
c->mbuf = 0;
c->nbuf = 32;
while (c->nbuf != 0 && nbytes != 0) {
c->mbuf ^= *buf << (32 - c->nbuf);
*buf ^= (c->sbuf >> (32 - c->nbuf)) & 0xFF;
++buf;
c->nbuf -= 8;
--nbytes;
}
}
}
/* Combined MAC and decryption.
* Note that plaintext is accumulated for MAC.
*/
#undef DROUND
#define DROUND(z,A,B,C,D,E,F,G,H) \
STEP(c,z); \
t = NLFUNC(c,(z+1)); \
t3 = BYTE2WORD(buf+(z*4)); \
t ^= t3; \
CRCFUNC(c,t,((z)&0x7),(((z)+5)&0x7)); \
SHAFUNC(c,t,c->R[OFF(z+1,MACKONST)],A,B,C,D,E,F,G,H); \
WORD2BYTE(t, buf+(z*4));
void
nls_decrypt(nls_ctx *c, UCHAR *buf, int nbytes)
{
WORD t = 0, t3 = 0;
int i;
/* handle any previously buffered bytes */
if (c->nbuf != 0) {
while (c->nbuf != 0 && nbytes != 0) {
*buf ^= (c->sbuf >> (32 - c->nbuf)) & 0xFF;
c->mbuf ^= *buf << (32 - c->nbuf);
++buf;
c->nbuf -= 8;
--nbytes;
}
if (c->nbuf != 0) /* not a whole word yet */
return;
/* LFSR already cycled */
macfunc(c, c->mbuf);
}
/* now do lots at a time, if there's enough */
while (4*N <= nbytes)
{
#if NLS_LONG_OUTPUT
if (c->CtrModF16 < (F16-18)) {
#endif /*NLS_LONG_OUTPUT*/
DROUND( 0,A,B,C,D,E,F,G,H);
DROUND( 1,H,A,B,C,D,E,F,G);
DROUND( 2,G,H,A,B,C,D,E,F);
DROUND( 3,F,G,H,A,B,C,D,E);
DROUND( 4,E,F,G,H,A,B,C,D);
DROUND( 5,D,E,F,G,H,A,B,C);
DROUND( 6,C,D,E,F,G,H,A,B);
DROUND( 7,B,C,D,E,F,G,H,A);
DROUND( 8,A,B,C,D,E,F,G,H);
DROUND( 9,H,A,B,C,D,E,F,G);
DROUND(10,G,H,A,B,C,D,E,F);
DROUND(11,F,G,H,A,B,C,D,E);
DROUND(12,E,F,G,H,A,B,C,D);
DROUND(13,D,E,F,G,H,A,B,C);
DROUND(14,C,D,E,F,G,H,A,B);
DROUND(15,B,C,D,E,F,G,H,A);
DROUND(16,A,B,C,D,E,F,G,H);
buf += 4*N;
nbytes -= 4*N;
/* fix alignment of MAC buffer */
t = c->M[7];
for (i = NMAC-1; i > 0; --i)
c->M[i] = c->M[i-1];
c->M[0] = t;
/* fix alignment of CRC buffer */
t = c->CRC[0];
for (i = 1; i < NMAC; ++i)
c->CRC[i-1] = c->CRC[i];
c->CRC[NMAC-1] = t;
#if NLS_LONG_OUTPUT
c->CtrModF16 += 17;
}
else {
do {
cycle(c);
t = nltap(c);
t3 = BYTE2WORD(buf);
t ^= t3;
macfunc(c, t);
WORD2BYTE(t, buf);
buf += 4;
nbytes -= 4;
} while (F16-18 < c->CtrModF16);
}
#endif /*NLS_LONG_OUTPUT*/
}
/* do small or odd size buffers the slow way */
while (4 <= nbytes) {
cycle(c);
t = nltap(c);
t3 = BYTE2WORD(buf);
t ^= t3;
macfunc(c, t);
WORD2BYTE(t, buf);
nbytes -= 4;
buf += 4;
}
/* handle any trailing bytes */
if (nbytes != 0) {
cycle(c);
c->sbuf = nltap(c);
c->mbuf = 0;
c->nbuf = 32;
while (c->nbuf != 0 && nbytes != 0) {
*buf ^= (c->sbuf >> (32 - c->nbuf)) & 0xFF;
c->mbuf ^= *buf << (32 - c->nbuf);
++buf;
c->nbuf -= 8;
--nbytes;
}
}
}
/* Having accumulated a MAC, finish processing and return it.
* Note that any unprocessed bytes are treated as if
* they were encrypted zero bytes, so plaintext (zero) is accumulated.
*/
void
nls_finish(nls_ctx *c, UCHAR *buf, int nbytes)
{
int i;
/* handle any previously buffered bytes */
if (c->nbuf != 0) {
/* LFSR already cycled */
macfunc(c, c->mbuf);
}
/* perturb the MAC to mark end of input.
* Note that only the SHA part is updated, not the CRC. This is an
* action that can't be duplicated by passing in plaintext, hence
* defeating any kind of extension attack.
*/
cycle(c);
shafunc(c, INITKONST + (c->nbuf << 24));
c->nbuf = 0;
/* now add the CRC to the MAC like input material */
for (i = 0; i < NMAC; ++i) {
cycle(c);
crcfunc(c, 0);
shafunc(c, c->CRC[7]);
}
/* continue that process, producing output from the MAC buffer */
while (nbytes > 0) {
cycle(c);
crcfunc(c, 0);
shafunc(c, c->CRC[7]);
if (nbytes >= 4) {
WORD2BYTE(A, buf);
nbytes -= 4;
buf += 4;
}
else {
for (i = 0; i < nbytes; ++i)
buf[i] = Byte(A, i);
break;
}
}
}
|
eSTREAM Project Powered by ViewCVS 1.0-dev |
ViewCVS and CVS Help |