从numpy的二进制文件中读取uint32_t

时间:2016-07-13 21:05:33

标签: python c++ numpy fstream

numpy数组的tofile()方法用于将无符号32位整数数组写为二进制文件(test.bin)。然后,使用c ++从文件中读取uint32_t。问题是c ++程序没有读取正确的值。如何解决?

十六进制编辑器显示test.bin是正确的,因为值按预期逐个增加。

fileio.py:

import numpy as np
x = np.arange(20)+65536
y = x.astype(np.uint32)
print(y)
with open("test.bin", "wb+") as f:
    y.tofile(f)

fileio.py的输出:

[65536 65537 65538 65539 65540 65541 65542 65543 65544 65545 65546 65547
 65548 65549 65550 65551 65552 65553 65554 65555]

test.bin :(在十六进制编辑器中.vim与%!xxd命令)

0000000: 0000 0100 0100 0100 0200 0100 0300 0100  ................
0000010: 0400 0100 0500 0100 0600 0100 0700 0100  ................
0000020: 0800 0100 0900 0100 0a00 0100 0b00 0100  ................
0000030: 0c00 0100 0d00 0100 0e00 0100 0f00 0100  ................
0000040: 1000 0100 1100 0100 1200 0100 1300 0100  ................
0000050: 0a                                       .   

fileio.cpp:

#include <iostream>
#include <vector>
#include <string>
#include <fstream>
#include <byteswap.h>

using namespace std;

int main(void){
    vector<char> arr;
    char n;
    int i;
    int num_char=0;
    //ifstream f("test.bin");
    fstream f;
    f.open("test.bin", ios::in | ios::binary);

    while(f>>n){
        cout << int(n) << ' ';
        arr.push_back(n);
        num_char++;
    }
    cout << endl;
    cout << "number of characters: " << num_char << endl;
    size_t uint32t_size = arr.size() * sizeof(char) / sizeof(uint32_t);
    uint32_t* ptr_arr0 = (uint32_t*)arr.data();

    cout << "uint32_t size: " << uint32t_size << endl;
    cout << "uint32_t interpretatin:" << endl;
    for (i = 0; i < uint32t_size; i++){
        cout << ptr_arr0[i] << ' ';
    }
    cout << endl;

    cout << "32bit byteswap: " << endl;
    for (i=0; i < uint32t_size; i++){
        ptr_arr0[i] = bswap_32(ptr_arr0[i]);
        cout << ptr_arr0[i] << ' ';
    }
    cout << endl;
    cout << "characters after byte swap: " << endl;
    for (i=0; i < num_char; i++){
        cout << int(arr[i]) << ' ';
    }
    cout << endl;

}   

fileio.cpp的输出:

0 0 1 0 1 0 1 0 2 0 1 0 3 0 1 0 4 0 1 0 5 0 1 0 6 0 1 0 7 0 1 0 8 0 1 0 0 1 0 0 1 0 0 1 0 0 1 0 0 1 0 14 0 1 0 15 0 1 0 16 0 1 0 17 0 1 0 18 0 1 0 19 0 1 0 
number of characters: 75
uint32_t size: 18
uint32_t interpretatin:
65536 65537 65538 65539 65540 65541 65542 65543 65544 256 16777217 65536 234881280 251658496 268435712 285212928 301990144 318767360 
32bit byteswap: 
256 16777472 33554688 50331904 67109120 83886336 100663552 117440768 134217984 65536 16777217 256 65550 65551 65552 65553 65554 65555 
characters after byte swap: 
0 1 0 0 0 1 0 1 0 1 0 2 0 1 0 3 0 1 0 4 0 1 0 5 0 1 0 6 0 1 0 7 0 1 0 8 0 0 1 0 1 0 0 1 0 1 0 0 14 0 1 0 15 0 1 0 16 0 1 0 17 0 1 0 18 0 1 0 19 0 1 0 0 1 0 

似乎字节交换不是唯一的问题。 c ++程序甚至没有正确读取所有8位整数,如:

... 1 0 8 0 1 0 0 1 0 0 1 0 0 1 0 0 1 0 0 1 0 14 ...

没有数字9,10,11,12,13,尽管test.bin的十六进制编辑器视图中存在这些数字。

可能相关的问题:

更新

readbinary.cpp 它来自reading the binary file into the vector of unsigned chars

#include <iostream>
#include <vector>
#include <string>
#include <fstream>
#include <byteswap.h>
#include <iterator>
using namespace std;

typedef unsigned char BYTE;
std::vector<BYTE> readFile(const char* filename)
{
    // open the file:
    std::ifstream file(filename, std::ios::binary);

    // Stop eating new lines in binary mode!!!
    file.unsetf(std::ios::skipws);

    // get its size:
    std::streampos fileSize;

    file.seekg(0, std::ios::end);
    fileSize = file.tellg();
    file.seekg(0, std::ios::beg);

    // reserve capacity
    std::vector<BYTE> vec;
    vec.reserve(fileSize);

    // read the data:
    vec.insert(vec.begin(),
               std::istream_iterator<BYTE>(file),
               std::istream_iterator<BYTE>());

    return vec;
}


int main(void){
    std::vector<BYTE>  arr = readFile("test.bin");
    int i;
    for (i=0;i<arr.size();i++){
        cout << int(arr[i]) << ' ';
    }
} 

readbinary.cpp的输出(它有9,10,11,12)。

0 0 1 0 1 0 1 0 2 0 1 0 3 0 1 0 4 0 1 0 5 0 1 0 6 0 1 0 7 0 1 0 8 0 1 0 9 0 1 0 10 0 1 0 11 0 1 0 12 0 1 0 13 0 1 0 14 0 1 0 15 0 1 0 16 0 1 0 17 0 1 0 18 0 1 0 19 0 1 0

0 个答案:

没有答案