我需要编写一个程序来解析C中的大型CSV文件(大约2000 * 2000)并以double [] []数组的形式存储。我写了一个程序,它似乎适用于小文件(我检查了4 * 4 csv文件),但对于大文件,它给我不正确的结果。(因为行数和列数错误,程序崩溃后这一点)。
这是代码:
#include<stdio.h>
#include<stdlib.h>
#include<string.h>
int main (void)
{
int rowMaxIndex,columnMaxIndex;
double **mat;
double *matc;
int i,j,idx,len;
char part[5000];
char *token;
char *temp;
char *delim = ",";
double var;
{
FILE *fp;
fp = fopen("X1_CR2_new1.csv","r");
if(fp == NULL)
{
perror("Error while opening the file.\n");
exit(EXIT_FAILURE);
}
// count loop
rowMaxIndex = 0;
columnMaxIndex = 0;
while(fgets(part,5000,fp) != NULL){
token = NULL;
token=strtok(part,delim);
while(token != NULL){
if(rowMaxIndex==0)
{
columnMaxIndex++;}
token=strtok(NULL,delim);
}
rowMaxIndex++;
}
fclose(fp);
printf("Number of rows is %d, and Number of columns is %d", rowMaxIndex, columnMaxIndex);
// allocate the matrix
mat = malloc(rowMaxIndex * sizeof(double*));
for (i = 0; i < rowMaxIndex; i++)
{
mat[i] = malloc(columnMaxIndex * sizeof(double));
}
fclose(fp);
}
// rewind the file to the beginning. The rewind(fp) wasnt working so closed and reopened file.
{
FILE *fp;
fp = fopen("X1_CR2_new1.csv","r");
if(fp == NULL)
{
perror("Error while opening the file.\n");
exit(EXIT_FAILURE);
}
// read loop
i = j = 0;
while(fgets(part,5000,fp)!=NULL)
{
token=strtok(part,delim);
j=0;
while (token != NULL){
mat[i][j]=atof(token);
//printf("\n %f", mat[i][j]);
token=strtok(NULL,delim);
j++;
}
i++;
}
printf("\n The value of mat 1, 2 is %f", mat[1][0]); //print some element to check
free(mat);
fclose(fp);
}
return 0;
}
答案 0 :(得分:2)
您说数据有2000列但您的fgets()
最多可读取4999个字符。您的数据是否有可能超过4999个字符?您可能应该检查读取的每一行是否以换行符结尾(可能是文件中的最后一行)。
顺便说一下,你不需要重新打开文件 - 只需rewind()
。