错误的 SHA-1 哈希答案

【问题标题】：Wrong SHA-1 hash错误的 SHA-1 哈希
【发布时间】：2016-02-03 13:28:20
【问题描述】：

我计划将 AVR-Crypto 的 SHA-1 implementation 用于 HMAC。但是，我似乎无法生成正确的 SHA-1 总和。

例如，如果我用以下方式调用函数

  unsigned char sha1sum[20];
  char *msg = "FFFFFFFFFF";

  sha1( sha1sum, msg, strlen(msg));

我得到000000000000000000002C002312290000000029，而不是预期的c1bb92851109fe950a2655fa1d4ba1d04719f6fb。有谁知道可能出了什么问题？这是 AVR-Crypto 的实现

#include <string.h> /* memcpy & co */
#include <stdint.h>
#include "config.h"
#include "debug.h"
#include "sha1.h"

#ifdef DEBUG
#  undef DEBUG
#endif

#include "cli.h"

#define LITTLE_ENDIAN

/********************************************************************************************************/

/**
 * \brief initialises given SHA-1 context
 *
 */
void sha1_init(sha1_ctx_t *state){
    DEBUG_S("\r\nSHA1_INIT");
    state->h[0] = 0x67452301;
    state->h[1] = 0xefcdab89;
    state->h[2] = 0x98badcfe;
    state->h[3] = 0x10325476;
    state->h[4] = 0xc3d2e1f0;
    state->length = 0;
}

/********************************************************************************************************/
/* some helping functions */
uint32_t rotl32(uint32_t n, uint8_t bits){
    return ((n<<bits) | (n>>(32-bits)));
}

uint32_t change_endian32(uint32_t x){
    return (((x)<<24) | ((x)>>24) | (((x)& 0x0000ff00)<<8) | (((x)& 0x00ff0000)>>8));
}


/* three SHA-1 inner functions */
uint32_t ch(uint32_t x, uint32_t y, uint32_t z){
    DEBUG_S("\r\nCH");
    return ((x&y)^((~x)&z));
}

uint32_t maj(uint32_t x, uint32_t y, uint32_t z){
    DEBUG_S("\r\nMAJ");
    return ((x&y)^(x&z)^(y&z));
}

uint32_t parity(uint32_t x, uint32_t y, uint32_t z){
    DEBUG_S("\r\nPARITY");
    return ((x^y)^z);
}

/********************************************************************************************************/
/**
 * \brief "add" a block to the hash
 * This is the core function of the hash algorithm. To understand how it's working
 * and what thoese variables do, take a look at FIPS-182. This is an "alternativ" implementation
 */

#define MASK 0x0000000f

typedef uint32_t (*pf_t)(uint32_t x, uint32_t y, uint32_t z);

void sha1_nextBlock (sha1_ctx_t *state, const void *block){
    uint32_t a[5];
    uint32_t w[16];
    uint32_t temp;
    uint8_t t,s,fi, fib;
    pf_t f[] = {ch,parity,maj,parity};
    uint32_t k[4]={ 0x5a827999,
                    0x6ed9eba1,
                    0x8f1bbcdc,
                    0xca62c1d6};

    /* load the w array (changing the endian and so) */
    for(t=0; t<16; ++t){
        w[t] = change_endian32(((uint32_t*)block)[t]);
    }

#if DEBUG
    uint8_t dbgi;
    for(dbgi=0; dbgi<16; ++dbgi){
        /*
        DEBUG_S("\n\rBlock:");
        DEBUG_B(dbgi);
        DEBUG_C(':');
        */
        cli_putstr_P(PSTR("\r\nBlock:"));
        cli_hexdump(&dbgi, 1);
        cli_putc(':');
        cli_hexdump(&(w[dbgi]) ,4);
    }
#endif

    /* load the state */
    memcpy(a, state->h, 5*sizeof(uint32_t));


    /* the fun stuff */
    for(fi=0,fib=0,t=0; t<=79; ++t){
        s = t & MASK;
        if(t>=16){
            #if DEBUG
             DEBUG_S("\r\n ws = "); cli_hexdump(&(w[s]), 4);
            #endif
            w[s] = rotl32( w[(s+13)&MASK] ^ w[(s+8)&MASK] ^
                 w[(s+ 2)&MASK] ^ w[s] ,1);
            #ifdef DEBUG
             DEBUG_S(" --> ws = "); cli_hexdump(&(w[s]), 4);
            #endif
        }

        uint32_t dtemp;
        temp = rotl32(a[0],5) + (dtemp=f[fi](a[1],a[2],a[3])) + a[4] + k[fi] + w[s];
        memmove(&(a[1]), &(a[0]), 4*sizeof(uint32_t)); /* e=d; d=c; c=b; b=a; */
        a[0] = temp;
        a[2] = rotl32(a[2],30); /* we might also do rotr32(c,2) */
        fib++;
        if(fib==20){
            fib=0;
            fi = (fi+1)%4;
        }
        #if DEBUG
        /* debug dump */
        DEBUG_S("\r\nt = "); DEBUG_B(t);
        DEBUG_S("; a[]: ");
         cli_hexdump(a, 5*4);
        DEBUG_S("; k = ");
         cli_hexdump(&(k[t/20]), 4);
        DEBUG_S("; f(b,c,d) = ");
         cli_hexdump(&dtemp, 4);
        #endif
    }

    /* update the state */
    for(t=0; t<5; ++t){
        state->h[t] += a[t];
    }
    state->length += 512;
}

/********************************************************************************************************/

void sha1_lastBlock(sha1_ctx_t *state, const void *block, uint16_t length){
    uint8_t lb[SHA1_BLOCK_BYTES]; /* local block */
    while(length>=SHA1_BLOCK_BITS){
        sha1_nextBlock(state, block);
        length -= SHA1_BLOCK_BITS;
        block = (uint8_t*)block + SHA1_BLOCK_BYTES;
    }
    state->length += length;
    memset(lb, 0, SHA1_BLOCK_BYTES);
    memcpy (lb, block, (length+7)>>3);

    /* set the final one bit */
    lb[length>>3] |= 0x80>>(length & 0x07);

    if (length>512-64-1){ /* not enouth space for 64bit length value */
        sha1_nextBlock(state, lb);
        state->length -= 512;
        memset(lb, 0, SHA1_BLOCK_BYTES);
    }
    /* store the 64bit length value */
#if defined LITTLE_ENDIAN
        /* this is now rolled up */
    uint8_t i;
    for (i=0; i<8; ++i){
        lb[56+i] = ((uint8_t*)&(state->length))[7-i];
    }
#elif defined BIG_ENDIAN
    *((uint64_t)&(lb[56])) = state->length;
#endif
    sha1_nextBlock(state, lb);
}

/********************************************************************************************************/

void sha1_ctx2hash (void *dest, sha1_ctx_t *state){
#if defined LITTLE_ENDIAN
    uint8_t i;
    for(i=0; i<5; ++i){
        ((uint32_t*)dest)[i] = change_endian32(state->h[i]);
    }
#elif BIG_ENDIAN
    if (dest != state->h)
        memcpy(dest, state->h, SHA1_HASH_BITS/8);
#else
# error unsupported endian type!
#endif
}

/********************************************************************************************************/
/**
 *
 *
 */
void sha1 (void *dest, const void *msg, uint32_t length){
    sha1_ctx_t s;
    DEBUG_S("\r\nBLA BLUB");
    sha1_init(&s);
    while(length & (~0x0001ff)){ /* length>=512 */
        DEBUG_S("\r\none block");
        sha1_nextBlock(&s, msg);
        msg = (uint8_t*)msg + SHA1_BLOCK_BITS/8; /* increment pointer to next block */
        length -= SHA1_BLOCK_BITS;
    }
    sha1_lastBlock(&s, msg, length);
    sha1_ctx2hash(dest, &s);
}

这是标题：

#ifndef SHA1_H_
#define SHA1_H_

#include "stdint.h"
/** \def SHA1_HASH_BITS
 * definees the size of a SHA-1 hash in bits 
 */

/** \def SHA1_HASH_BYTES
 * definees the size of a SHA-1 hash in bytes 
 */

/** \def SHA1_BLOCK_BITS
 * definees the size of a SHA-1 input block in bits 
 */

/** \def SHA1_BLOCK_BYTES
 * definees the size of a SHA-1 input block in bytes 
 */
#define SHA1_HASH_BITS  160
#define SHA1_HASH_BYTES (SHA1_HASH_BITS/8)
#define SHA1_BLOCK_BITS 512
#define SHA1_BLOCK_BYTES (SHA1_BLOCK_BITS/8)

/** \typedef sha1_ctx_t
 * \brief SHA-1 context type
 * 
 * A vatiable of this type may hold the state of a SHA-1 hashing process
 */
typedef struct {
    uint32_t h[5];
//  uint64_t length;
    uint8_t length;
} sha1_ctx_t;

/** \typedef sha1_hash_t
 * \brief hash value type
 * A variable of this type may hold a SHA-1 hash value 
 */
/*
typedef uint8_t sha1_hash_t[SHA1_HASH_BITS/8];
*/

/** \fn sha1_init(sha1_ctx_t *state)
 * \brief initializes a SHA-1 context
 * This function sets a ::sha1_ctx_t variable to the initialization vector
 * for SHA-1 hashing.
 * \param state pointer to the SHA-1 context variable
 */
void sha1_init(sha1_ctx_t *state);

/** \fn sha1_nextBlock(sha1_ctx_t *state, const void *block)
 *  \brief process one input block
 * This function processes one input block and updates the hash context 
 * accordingly
 * \param state pointer to the state variable to update
 * \param block pointer to the message block to process
 */
void sha1_nextBlock (sha1_ctx_t *state, const void *block);

/** \fn sha1_lastBlock(sha1_ctx_t *state, const void *block, uint16_t length_b)
 * \brief processes the given block and finalizes the context
 * This function processes the last block in a SHA-1 hashing process.
 * The block should have a maximum length of a single input block.
 * \param state pointer to the state variable to update and finalize
 * \param block pointer to themessage block to process
 * \param length_b length of the message block in bits  
 */
void sha1_lastBlock (sha1_ctx_t *state, const void *block, uint16_t length_b);

/** \fn sha1_ctx2hash(sha1_hash_t *dest, sha1_ctx_t *state)
 * \brief convert a state variable into an actual hash value
 * Writes the hash value corresponding to the state to the memory pointed by dest.
 * \param dest pointer to the hash value destination
 * \param state pointer to the hash context
 */ 
void sha1_ctx2hash (void *dest, sha1_ctx_t *state);

/** \fn sha1(sha1_hash_t *dest, const void *msg, uint32_t length_b)
 * \brief hashing a message which in located entirely in RAM
 * This function automatically hashes a message which is entirely in RAM with
 * the SHA-1 hashing algorithm.
 * \param dest pointer to the hash value destination
 * \param msg  pointer to the message which should be hashed
 * \param length_b length of the message in bits
 */ 
void sha1(void *dest, const void *msg, uint32_t length_b);



#endif /*SHA1_H_*/

更新如果我用unsigned char sha1sum[20] = 0; 初始化sha1sum，结果总和都是0x00。

【问题讨论】：

你使用char sha1sum[20]，而你的预期输出长度是40字节，为什么？
我的意思是，你打印结果的方式可能有问题，你能不能提交输出000000000000000000002C002312290000000029的代码，我可以看到正确答案应该是46464646464646464646025580DA53484131，而不是c1bb92851109fe950a2655fa1d4ba1d04719f6fb
是吗？我正在使用这个site 来生成（参考）哈希。我输入FFFFFFFFFF，它给了我c1bb92851109fe950a2655fa1d4ba1d04719f6fb。这不是正确的哈希吗？
@user1034749 预期的输出实际上是 20 个字节
while(length & (~0x0001ff)){ /* length>=512 */ .*摇头*

标签： c encryption cryptography sha

【解决方案1】：

问题代码中至少有两个错误（详细如下），但都无法解释显示的结果，以及调用代码中的unsigned char sha1sum[20] = {0} 的附加事实改变了结果。从我们读到的 C 源代码翻译成机器代码有问题！很可能，sha1_ctx2hash 没有写到应该写的地方。

问题可能出在标题中，而不是问题中，编译器错误...由于我们在 8051 上，这可能是/曾经是 pointer types 的问题，尤其是在必须指向相同大小的指针。

另外，确定 8051 编译器是 little-endian 的吗？这似乎是常见的Keil C51 uses big-endian convention。这是编译器+支持库的任意选择，因为在原始的 8051 上没有与多字节数据相关的指令，最接近的是 LCALL，它的堆栈推送是 little-endian，但 LJMP 和 MOV DPTR,# 代码很大-字节序。更新：我们被告知编译器是由 IAR 提供的。根据IAR's documentation 的说法，版本 5 是 big-endian，而在版本 6 中更改为 little-endian。

更新：我们发现了另一个严重问题（除了可能不安全的指针转换和下面讨论的两个错误）。在搜索的某个时刻，将代码替换为没有字节序依赖或指针转换的单个过程，输出变为0000eb1700007f3d000004f0000059290000fc21，并且建议的将是 32 位的值被截断为 16 位。事实上，OP 透露：

我的stdint.h 中有这个：typedef unsigned uint32_t;

这仅在 unsigned int 是 32 位 的编译器上是正确的，而 C 标准给出的唯一保证是它至少是 16 位 >，并且该最小值被大多数 C 编译器用于小于 32 位的 CPU（出于效率原因；有些甚至可以选择禁用将字节操作数提升为整数，甚至对 80+80+96 是 @987654331 感到满意@)。

测试代码中的Bug：sha1( sha1sum, msg, strlen(msg))应该是sha1( sha1sum, msg, strlen(msg)*8)之类的，因为长度参数是以位为单位的。

sha1_lastBlock w.r.t 中的错误。头文件：代码读取

for (i=0; i<8; ++i){
    lb[56+i] = ((uint8_t*)&(state->length))[7-i];
}

假设state->length 是8 个字节，而实际上不是，因为uint64_t length 在标头中已更改为uint8_t length（通常uint64_t 在8051 编译器上不可用）。 big-endian 案例的代码（目前未编译）也受到影响。

如果确实是uint8_t length，因此最多可以接受 31 个字节的长度限制，那么 little-endian 和 big-endian 的情况都会减少到 lb[SHA1_BLOCK_BYTES-1] = state->length;（没有循环）。

或者，对于length 可能使用的任何无符号类型和字节序：

for (i = SHA1_BLOCK_BYTES; state->length != 0; state->length >>= 8)
    lb[--i] = (uint8_t)(state->length);

注意：代码*((uint64_t*)&(lb[56])) = state->length 将length 的8 个字节写入数组lb[] 的末尾，但仅在具有正确uint64_t 的大端机器上才是正确的。

代码在(length+7)%8 < 6 时存在潜在的额外问题：要散列的最后一个字节中的至少一个位未被屏蔽，如果设置它进入散列并使其出错。在对完整字节进行哈希处理的用例中，这不会造成伤害。

原始代码可能是正确的（除了上述潜在的额外问题），但考虑到目标是通过单个调用散列内存中的数据（sha1 所做的），并且既不紧凑也不可读.除其他问题外：

sha1_lastBlock 中（正确地）存在块循环，因此不存在标题中的限制块应具有单个输入块的最大长度；
这使得sha1 中的另一个块循环变得多余；
如果使用uint8_t length，或者散列小于56字节，这两个循环都可以删除；
循环循环可能会因 16 字节的 memmove 和索引表中的向量中的函数调用而减慢；
小端情况下的字节顺序转换效率相当低；
在sha1_ctx2hash 中，#elif BIG_ENDIAN 在我的心理编译器中触发了一个错误，因为BIG_ENDIAN 似乎未定义并且#elif 应该有一个参数；应该是#elif defined BIG_ENDIAN（如上面几行所用）；
pf_t f[] = {ch,parity,maj,parity}; 是 const 的一个很好的候选者，也许是 static：我曾经使用过的每个 8051 的 C 编译器都不会认识到数组在设置后没有改变，因此可以在代码中雕刻；
对于此类编译器，不必要地使用函数指针（如上）是一种会损害性能甚至更糟的久经考验的方法；至少它阻止了调用树的分析，需要在静态地址上通过覆盖分配自动变量，从而显着提高性能和代码大小。

如果你追求速度，你开始的代码是不够的，没有什么能比得上汇编语言。就像二十年前一样，我为一些 8051 工具链编写了 SHA-1，与仅 C 相比，汇编调整节省了大量资金（IIRC：主要是因为从性能角度来看，32 位旋转非常糟糕）。

更新：这里是散列短消息的说明性代码，以字节序中立的方式，没有任何指针转换，并且不依赖于<stdint.h>（事实证明这对于使用的编译器）。请注意length 参数以字节（而不是位）为单位，限制为 55 个字节，不允许在顶部实现 HMAC-SHA-1。这是为了保持代码简单：超过这个限制，我们需要多次迭代压缩函数，因此要么是大量的代码重复，要么至少有两个函数，要么是某种状态机。

#include <limits.h> // for UCHAR_MAX, UINT_MAX, ULONG_MAX

// Compute the SHA-1 hash of a short msg, of length at most 55 bytes
// Result hash must be 20 bytes; it can overlap msg.
// CAUTION: if length>55 the result is wrong, and if length>59
// we loose second-preimage resistance, thus collision-resistance.
void sha1upto55bytes(
          unsigned char *hash,  // result, 20 bytes
    const unsigned char *msg,   // bytes to hash
          unsigned char length  // length of msg in bytes, maximum 55
    )
    {
    // We locally (re)define uint8_t and uint32_t so as not to depend of <stdint.h>
    // which is not available on some old C compilers for embedded systems.
#if 255==UCHAR_MAX
    typedef unsigned char uint8_t;
#endif
#if 16383==UINT_MAX>>9>>9
    typedef unsigned int uint32_t;
#elif  16383==ULONG_MAX>>9>>9
    typedef unsigned long uint32_t;
#endif

    // Internal buffer (64 bytes)
    // We require 8-bit uint8_t, 32-bit uint32_t, and integer promotion; otherwise,
    // we try to abort compilation on the following declaration.
    uint32_t w[
        99==(uint8_t)355              &&  // check uint8_t
        4303==(uint32_t)(-1)/999u/999 &&  // check uint32_t
        440==(uint8_t)55<<3               // check integer promotion
        ? 16 : -1];                       // negative index if error

    // Type for state, so that we can use struct copy for that
    typedef struct state_t { uint32_t q[5]; } state_t;

    // Initial state; use single quotes if the compiler barks
    const state_t s = {{ 0x67452301,0xefcdab89,0x98badcfe,0x10325476,0xc3d2e1f0 }};

    // Active state (20 bytes); on 8051 should be in internal RAM for best performance
    state_t h = s;  // initialize the state using a struct copy

   // Workhorse temporary; on 8051 should be in internal RAM for best performance
    uint32_t x;

    // Workhorse index; on 8051 should be a register for performance
    uint8_t  j;

    // Prepare the single block to hash; this code works regardless of endianness,
    // and does not perform misaligned memory accesses if msg is misaligned.
    x = 0;  // This is only to prevent a bogus compiler warning
    j = 0;
    do
        {   // for each block byte, up to and including high 4 bytes of length
        x <<= 8;
        if (j < length)
            x |= *msg++;    // message byte
        else
            if (j == length)
                x |= 0x80;  // padding byte
        if ((j&3)==3)
            w[j >> 2] = x;
        }
    while (++j!=60);
    w[15] = length << 3;    // length in bits, needs integer promotion for length>31

    // Hash that block
    j = 0;
    do {        // round loop, run 80 times
        do {        // dummy loop (avoid a goto)
            if (j<40) {
                if (j<20) {             // for rounds 0..19
                    x = (((h.q[2] ^ h.q[3])&h.q[1]) ^ h.q[3]) + 0x5A827999;
                    break;  // out of dummy loop
                    }
                else
                    x = 0x6ED9EBA1;     // for rounds 20..39
                }
            else {
                if (j<60) {             // for rounds 40..59
                    x = (h.q[1] | h.q[2])&h.q[3];
                    x |= h.q[1] & h.q[2];
                    x += 0x8F1BBCDC;
                    break;
                    }
                else
                    x = 0xCA62C1D6;     // for rounds 60..79
                }
            // for rounds 20..39 and 60..79
            x += h.q[1] ^ h.q[2] ^ h.q[3];
            }
        while (0);      // end of of dummy loop
        // for all rounds
        x += (h.q[0] << 5) | (h.q[0] >> 27);
        x += h.q[4];
        h.q[4] = h.q[3];
        h.q[3] = h.q[2];
        h.q[2] = (h.q[1] << 30) | (h.q[1] >> 2);
        h.q[1] = h.q[0];
        h.q[0] = x;
        x = w[j & 15];
        if (j>=16) {    // rounds 16..79
            x ^= w[(j + 2) & 15];
            x ^= w[(j + 8) & 15];
            x ^= w[(j + 13) & 15];
            w[j & 15] = x = (x << 1) | (x >> 31);
            }
        h.q[0] += x;    // for all rounds
        }
    while (++j != 80);
    // The five final 32-bit modular additions are made in the next loop, and
    // reuse the constants (rather than a RAM copy), saving code and RAM.

    // Final addition and store result; this code works regardless of endianness,
    // and does not perform misaligned memory accesses if hash is misaligned.
    j = 0;
    do
        {
        x = h.q[j] + s.q[j];    // final 32-bit modular additions
        *hash++ = (uint8_t)(x>>24);
        *hash++ = (uint8_t)(x>>16);
        *hash++ = (uint8_t)(x>> 8);
        *hash++ = (uint8_t)(x    );
        }
    while (++j != 5);
    }

【讨论】：

如果您的输入是 8 个字节或更少，那么首先使用 SHA-1 对其进行散列有什么意义？如果那是为了隐藏该输入（例如密码），从加密/安全的角度来看，SHA-1 是一个非常糟糕的选择，您需要盐（例如用户名、设备序列号..）和基于密码的密钥派生函数，基线是 PBKDF2，最先进的（至少几年前）是 scrypt。
谢谢。你说“小端和大端都减少到lb[63] = state->length;”怎么会是lb[63]？小端大小写的索引不会增加吗？为什么特别是63？确实，如果有可用的程序集实现，那就太好了，但不幸的是，我似乎找不到。
但要迁移到字节序中立，两种字节序类型都可以在sha1_ctx2hash() 中使用if (dest != state->h) memcpy(dest, state->h, SHA1_HASH_BITS/8); 吗？
@Kar：不。您上一条评论中的代码依赖于大端。我将在几分钟内发布整个 shebang 的工作代码。
非常感谢。我已经尝试了您提供的代码，但是对于"FFFFFFFFFF"，我得到了哈希0000eb1700007f3d000004f0000059290000fc21。我不认为这是正确的哈希，但我错过了什么吗？