C:为hexdump格式化字符串(从char *到另一个char *)

时间:2019-01-17 14:13:09

标签: c hex hexdump

我想将一个this.props.onRouteChange('home')指针的十六进制转储写入另一个char*中。

为此,我采取了this code snippet

char*

并像这样修改它:

#include <stdio.h>

void DumpHex(const void* data, size_t size) {
    char ascii[17];
    size_t i, j;
    ascii[16] = '\0';
    for (i = 0; i < size; ++i) {
        printf("%02X ", ((unsigned char*)data)[i]);
        if (((unsigned char*)data)[i] >= ' ' && ((unsigned char*)data)[i] <= '~') {
            ascii[i % 16] = ((unsigned char*)data)[i];
        } else {
            ascii[i % 16] = '.';
        }
        if ((i+1) % 8 == 0 || i+1 == size) {
            printf(" ");
            if ((i+1) % 16 == 0) {
                printf("|  %s \n", ascii);
            } else if (i+1 == size) {
                ascii[(i+1) % 16] = '\0';
                if ((i+1) % 16 <= 8) {
                    printf(" ");
                }
                for (j = (i+1) % 16; j < 16; ++j) {
                    printf("   ");
                }
                printf("|  %s \n", ascii);
            }
        }
    }
}

它工作并返回相同的输出:

#include <stdio.h>

char* DumpHex2(const void* data, size_t size) {
    const int symbolSize = 100;
    char* buffer = calloc(10*size, sizeof(char));
    char* symbol = calloc(symbolSize, sizeof(char));

    char ascii[17];
    size_t i, j;
    ascii[16] = '\0';
    for (i = 0; i < size; ++i) {
        snprintf(symbol, symbolSize, "%02X ", ((unsigned char*)data)[i]);
        strcat(buffer, symbol);
        memset(symbol,0,strlen(symbol));
        if (((unsigned char*)data)[i] >= ' ' && ((unsigned char*)data)[i] <= '~') {
            ascii[i % 16] = ((unsigned char*)data)[i];
        } else {
            ascii[i % 16] = '.';
        }
        if ((i+1) % 8 == 0 || i+1 == size) {
            strcat(buffer, " ");
            if ((i+1) % 16 == 0) {
                snprintf(symbol, symbolSize, "|  %s \n", ascii);
                strcat(buffer, symbol);
                memset(symbol,0,strlen(symbol));
            } else if (i+1 == size) {
                ascii[(i+1) % 16] = '\0';
                if ((i+1) % 16 <= 8) {
                    strcat(buffer, " ");
                }
                for (j = (i+1) % 16; j < 16; ++j) {
                    strcat(buffer, "   ");
                }
                snprintf(symbol, symbolSize, "|  %s \n", ascii);
                strcat(buffer, symbol);
                memset(symbol,0,strlen(symbol));
            }
        }
    }

    free(symbol);

    return buffer;
}

输出:

int main(int argc, char **argv) {
    char* text = "Hello World! é";

    DumpHex(text, strlen(text));

    char* dump = DumpHex2(text, strlen(text));
    printf("%s", dump);
    free(dump);

    return EXIT_SUCCESS;
}

但是,我的修改是:

48 65 6C 6C 6F 20 57 6F  72 6C 64 21 20 C3 A9     |  Hello World! .. 
48 65 6C 6C 6F 20 57 6F  72 6C 64 21 20 C3 A9     |  Hello World! .. 

对我不好(我是C的新手)。有没有一种更容易格式化和附加字符串的方法?

1 个答案:

答案 0 :(得分:2)

您不能在未初始化的数据上使用strlen()

char* buffer = malloc(1000000);
memset(buffer,0,strlen(buffer));

strlen()无法找出分配的内存大小,因为它依赖于终止空字符(0'\0'),而终止空字符可能是也可能不是缓冲区指向的内存中的某个位置。在memset()中指定分配的内存大小:

memset(buffer, 0, 1000000);

或使用calloc()将分配的内存初始化为零:

char buffer = calloc(1000000, sizeof(char));  // or calloc(1000000, 1) since sizeof(char) is 1 by definition.

您的代码中可能仍然存在其他问题。例如,您在DumpHex2()中调用main() 两次,但是从不释放函数分配的内存。为symbol分配的内存也泄漏了。

如果您更新问题以包含您要DumpHex2()生成的文本的确切格式,则答案会更容易。

您应该使用isprint()来确定字符是否可打印。

Shorter和IMHO更易于阅读和理解:

#include <ctype.h>   // isprint()
#include <stddef.h>  // size_t
#include <stdlib.h>  // malloc(), free()
#include <string.h>  // strcat()
#include <stdio.h>   // sprintf()

enum {
    DUMP_BYTES_PER_LINE = 16,
    DUMP_BYTES_GROUP = 8,
    DUMP_CHARS_PER_LINE = DUMP_BYTES_PER_LINE * 4 + DUMP_BYTES_PER_LINE / DUMP_BYTES_GROUP + 4
};

char* DumpHex(const void* data, size_t size)
{
    size_t const num_lines = size / DUMP_BYTES_PER_LINE + ((size % DUMP_BYTES_PER_LINE) > 0);
    size_t const result_length = num_lines * DUMP_CHARS_PER_LINE;

    char *result = malloc((result_length + 1) * sizeof(*result));
    if (!result)
        return NULL;

    memset(result, ' ', result_length);
    result[result_length] = '\0';

    char *dump_pos = result;
    char *plain_pos = result + DUMP_BYTES_PER_LINE * 3 + DUMP_BYTES_PER_LINE / DUMP_BYTES_GROUP + 3;
    char unsigned const *src = data;

    for (size_t i = 0; i < size; ++i, dump_pos += 3, ++plain_pos) {

        sprintf(dump_pos, "%02x ", (int)src[i]);
        dump_pos[3] = ' ';
        *plain_pos = isprint(src[i]) ? src[i] : '.';

        if ((i + 1) % DUMP_BYTES_PER_LINE == 0 || i + 1 == size) {
            *++plain_pos = '\n';

            size_t const bytes_per_line_left = (i + 1) % DUMP_BYTES_PER_LINE;
            plain_pos[bytes_per_line_left ? -(long long)bytes_per_line_left - 3 : -DUMP_BYTES_PER_LINE - 3] = '|';

            dump_pos = plain_pos + 1 - 3;
            plain_pos = dump_pos + DUMP_BYTES_PER_LINE * 3 + DUMP_BYTES_PER_LINE / DUMP_BYTES_GROUP + 5;
        }
        else if ((i + 1) % DUMP_BYTES_GROUP == 0) {
            ++dump_pos;
        }
    }

    return result;
}