如何在链接列表中存储CSV文件的内容？

Saby 发表于 Dev

萨比

我正在尝试使用C将csv文件中的内容插入到链接列表中。但是，我得到了很多垃圾输出。源代码如下。

#include<stdio.h>
#include<stdlib.h>
#include<string.h>
struct product *customer_head;

struct customer
{
    long long int c_id;//first 6 characters=date & next 6 characters=time & next characters=counter no & city code

    /*Compulsory Fields (Cannot be Skipped)*/
    char name[57];
    long long int ph_no;//10 digit phone number

    /*Non Compulsory Fields (Can be Skipped)*/
    char address[58];
    char city[25];
    char state_code[2];
    char pin[6];
    char email[60];

    struct customer *next;
};
struct customer * load()
{
    FILE * cust=fopen("customer_db.csv","r");
    struct customer *temp,*ptr;
    customer_head=NULL;
    char str[208];
    char *token,*eptr1,*eptr2;
    int line_cnt=0,i=0;

    while(fgets(str,234,cust)!=NULL)
    {
        line_cnt=0;
        i=0;
        ptr=(struct customer *)malloc(sizeof(struct customer));
        for(;str[i];i++)
        {
            if(str[i]=='\n')
            {
                str[i]='\0';
                i=0;
                break;
            }
        }
        token=strtok(str,",");

        while(token!=NULL)
        {

            if(line_cnt==0)
            ptr->c_id=strtoll(token,&eptr1,10);

            else if(line_cnt==1)
            ptr->ph_no=strtoll(token,&eptr2,10);

            else if(line_cnt==2)
            sprintf(ptr->name,"%s",token);

            else if(line_cnt==3)
            sprintf(ptr->address,"%s",token);

            else if(line_cnt==4)
            sprintf(ptr->city,"%s",token);

            else if(line_cnt==5)
            sprintf(ptr->state_code,"%s",token);

            else if(line_cnt==6)
            sprintf(ptr->pin,"%s",token);

            else
            sprintf(ptr->email,"%s",token);

            line_cnt++;

            token=strtok(NULL,",");

        }
        if(customer_head==NULL)
        customer_head=ptr;
        else
        temp->next=ptr;
        temp=ptr;


    }
}
int print(struct customer *h)
{

    while(h->next!=NULL)
    {
        printf("\nCustomer ID: ");
        printf("%lld",h->c_id);
        printf("\nName: ");
        puts(h->name);
        printf("Phone Number: ");
        printf("%lld",h->ph_no);
        printf("\nAddress: ");
        puts(h->address);
        printf("City: ");
        puts(h->city);
        printf("State Code: ");
        puts(h->state_code);
        printf("PIN: ");
        puts(h->pin);
        printf("Email: ");
        puts(h->email);
        h=h->next;
    }
        printf("\nCustomer ID: ");
        printf("%lld",h->c_id);
        printf("\nName: ");
        puts(h->name);
        printf("Phone Number: ");
        printf("%ld",h->ph_no);
        printf("\nAddress: ");
        puts(h->address);
        printf("City: ");
        puts(h->city);
        printf("State Code: ");
        puts(h->state_code);
        printf("PIN: ");
        puts(h->pin);
        printf("Email: ");
        puts(h->email);

    return 1;
}
int main()
{
    load();
    print(customer_head);
}

我也在这里附加了csv文件。为了使程序更简单，我从csv文件中删除了标题。他们按顺序

客户编号，电话号码，姓名，地址，城市，州代码，PIN码，电子邮件

1403201156540201,2226179183,Katherine_Hamilton,87_Thompson_St.,Fremont,IA,502645,[email protected]
2204201532220103,8023631298,Marc_Knight,-,-,-,-,-
0305201423120305,8025595163,Albie_Rowland,-,Hamburg,NY,140752,-
0607201232220901,4055218053,Grant_Phelps,-,-,-,-,-

破折号（-）表示这些字段应保持为空。

输出如下：

Customer ID: 1403201156540201
Name: Katherine_Hamilton
Phone Number: 2226179183
Address: 87_Thompson_St.
City: Fremont
State Code: [email protected]
PIN: [email protected]
Email: [email protected]

Customer ID: 2204201532220103
Name: Marc_Knight
Phone Number: 8023631298
Address: -
City: -
State Code: -
PIN: -
Email: -

Customer ID: 305201423120305
Name: Albie_Rowland
Phone Number: 8025595163
Address: -
City: Hamburg
State Code: NY140752-
PIN: 140752-
Email: -

Customer ID: 607201232220901
Name: Grant_Phelps
Phone Number: 4055218053
Address: -
City: -
State Code: -
PIN: -
Email: -

如您所见，内容在很多地方都已合并。我不明白为什么。

大卫·兰金

由于从注释中您知道字符数组的声明受字符太少的影响，至少在char state_code[2];使数组不包含导致未定义行为的n终止字符的情况下，应确保对您所有的输入。（不要跳过缓冲区大小）

通常，您会使自己的工作变得比实际需要的要难。您没有固定的输入字段，而没有尝试使用strtok()和计算字段并处理的8部分链中的每个if, else if ...字段，因此只需解析数据sscanf()并验证转换次数以确认解析成功即可，例如

/** fill list from csv file */
list_t *list_from_csv (list_t *list, FILE *fp)
{
    char buf[MAXC];
    node_t data = { .c_id = 0, .next = NULL };

    while (fgets (buf, MAXC, fp)) { /* read each line in file */
        /* parse and VALIDATE values from line */
        if (sscanf (buf, "%lld,%lld,%63[^,],%63[^,],%31[^,],%7[^,],%7[^,],%63[^,\n]",
                    &data.c_id, &data.ph_no, data.name, data.address, data.city,
                    data.state_code, data.pin, data.email) == 8) {
            if (!add (list, &data)) /* validate add to list or break */
                break;
        }
    }

    return list;
}

在这里，list_t只是一个附加的“包装器”结构，该结构为链接列表保留head和tail指针。这使您可以在所需范围内声明多个列表，并通过使tail指针始终指向列表中的最后一个节点（your temp）来允许相同的O（1）插入。在这里，head和tail只是包装器的一部分，并作为参数传递，而不必将列表指针声明为全局（不好的做法）。列表中的每个节点和包装器结构均可编写为：

#define BYTE8   8           /* if you need a constant, #define one (or more) */
#define BYTE32 32
#define BYTE64 64
#define MAXC 1024

typedef struct node_t {     /* list node */
    /* 6 characters=date & 6 characters=time & counter no & city code */
    long long int c_id;

    /*Compulsory Fields (Cannot be Skipped)*/
    char name[BYTE64];
    long long int ph_no;    //10 digit phone number

    /*Non Compulsory Fields (Can be Skipped)*/
    char address[BYTE64];
    char city[BYTE32];
    char state_code[BYTE8];
    char pin[BYTE8];
    char email[BYTE64];

    struct node_t *next;
} node_t;

typedef struct {            /* list wrapper with head & tail pointers */
    node_t *head, *tail;
} list_t;

然后，不要将您的列表写成load()同时包含FILE和列表操作，而是将列表操作分开。只需创建一个add()函数即可将节点添加到列表中，例如

/** add node at end of list, update tail to end */
node_t *add (list_t *l, node_t *data)
{
    node_t *node = malloc (sizeof *node);   /* allocate node */
    if (!node) {                            /* validate allocation */
        perror ("malloc-node");
        return NULL;
    }

    *node = *data;                      /* initialize members values */

    if (!l->head)                       /* if 1st node, node is head/tail */
        l->head = l->tail = node;
    else {                              /* otherwise */
        l->tail->next = node;           /* add at end, update tail pointer */
        l->tail = node;
    }

    return node;    /* return new node */
}

现在，您的加载函数只需要从文件中读取每一行并解析该行，然后调用add()传递指向数据结构的指针以及列表指针作为参数即可。您的load()功能减少为：

/** fill list from csv file */
list_t *list_from_csv (list_t *list, FILE *fp)
{
    char buf[MAXC];
    node_t data = { .c_id = 0, .next = NULL };

    while (fgets (buf, MAXC, fp)) { /* read each line in file */
        /* parse and VALIDATE values from line */
        if (sscanf (buf, "%lld,%lld,%63[^,],%63[^,],%31[^,],%7[^,],%7[^,],%63[^,\n]",
                    &data.c_id, &data.ph_no, data.name, data.address, data.city,
                    data.state_code, data.pin, data.email) == 8) {
            if (!add (list, &data)) /* validate add to list or break */
                break;
        }
    }

    return list;
}

（注意：使用strtok()或时sscanf()，无需'\n'从输入字符串中删除尾随-只需将其作为定界符包含在内即可，strtok()或使用排除在转换之外sscanf()）

此外，您无需多次调用puts()，并printf()在你的清单打印数据的每个节点的价值。查看您进行了多少次函数调用以打印数据。您只需打一个电话printf()，例如

/** print all nodes in list */
void prn_list (list_t *l)
{
    if (!l->head) {
        puts ("list-empty");
        return;
    }

    for (node_t *n = l->head; n; n = n->next)
        printf ("\nCustomer ID: %lld\n"
                "Name: %s\n"
                "Phone Number: %lld\n"
                "Address: %s\n"
                "City: %s\n"
                "State Code: %s\n"
                "PIN: %s\n"
                "Email: %s\n", n->c_id, n->name, n->ph_no, n->address, n->city,
                                n->state_code, n->pin, n->email);
}

在main()简单地声明list_t包装器的实例中，打开/验证您的包装器，FILE然后将指针传递到列表，并将文件流传递到您的list_from_csv()（您的load()），然后打印该列表，最后释放所有您已分配的内存，然后完成。（是的，内存将在退出时被释放，但是会提早养成良好的习惯-不久之后，您将在函数中使用分配内存，否则在释放之前会return导致内存泄漏）

int main (int argc, char **argv) {

    list_t list = { .head = NULL, .tail = NULL };
    /* use filename provided as 1st argument (stdin by default) */
    FILE *fp = argc > 1 ? fopen (argv[1], "r") : stdin;

    if (!fp) {  /* validate file open for reading */
        perror ("file open failed");
        return 1;
    }

    if (!list_from_csv (&list, fp))
        return 1;

    if (fp != stdin)   /* close file if not stdin */
        fclose (fp);

    prn_list (&list);
    del_list (&list);
}

综上所述，您将获得类似于以下内容的内容：

#include <stdio.h>
#include <stdlib.h>
#include <string.h>

#define BYTE8   8           /* if you need a constant, #define one (or more) */
#define BYTE32 32
#define BYTE64 64
#define MAXC 1024

typedef struct node_t {     /* list node */
    /* 6 characters=date & 6 characters=time & counter no & city code */
    long long int c_id;

    /*Compulsory Fields (Cannot be Skipped)*/
    char name[BYTE64];
    long long int ph_no;    //10 digit phone number

    /*Non Compulsory Fields (Can be Skipped)*/
    char address[BYTE64];
    char city[BYTE32];
    char state_code[BYTE8];
    char pin[BYTE8];
    char email[BYTE64];

    struct node_t *next;
} node_t;

typedef struct {            /* list wrapper with head & tail pointers */
    node_t *head, *tail;
} list_t;


/** add node at end of list, update tail to end */
node_t *add (list_t *l, node_t *data)
{
    node_t *node = malloc (sizeof *node);   /* allocate node */
    if (!node) {                            /* validate allocation */
        perror ("malloc-node");
        return NULL;
    }

    *node = *data;                      /* initialize members values */

    if (!l->head)                       /* if 1st node, node is head/tail */
        l->head = l->tail = node;
    else {                              /* otherwise */
        l->tail->next = node;           /* add at end, update tail pointer */
        l->tail = node;
    }

    return node;    /* return new node */
}

/** print all nodes in list */
void prn_list (list_t *l)
{
    if (!l->head) {
        puts ("list-empty");
        return;
    }

    for (node_t *n = l->head; n; n = n->next)
        printf ("\nCustomer ID: %lld\n"
                "Name: %s\n"
                "Phone Number: %lld\n"
                "Address: %s\n"
                "City: %s\n"
                "State Code: %s\n"
                "PIN: %s\n"
                "Email: %s\n", n->c_id, n->name, n->ph_no, n->address, n->city,
                                n->state_code, n->pin, n->email);
}

/** delete all nodes in list */
void del_list (list_t *l)
{
    node_t *n = l->head;

    while (n) {
        node_t *victim = n;
        n = n->next;
        free (victim);
    }
}

/** fill list from csv file */
list_t *list_from_csv (list_t *list, FILE *fp)
{
    char buf[MAXC];
    node_t data = { .c_id = 0, .next = NULL };

    while (fgets (buf, MAXC, fp)) { /* read each line in file */
        /* parse and VALIDATE values from line */
        if (sscanf (buf, "%lld,%lld,%63[^,],%63[^,],%31[^,],%7[^,],%7[^,],%63[^,\n]",
                    &data.c_id, &data.ph_no, data.name, data.address, data.city,
                    data.state_code, data.pin, data.email) == 8) {
            if (!add (list, &data)) /* validate add to list or break */
                break;
        }
    }

    return list;
}

int main (int argc, char **argv) {

    list_t list = { .head = NULL, .tail = NULL };
    /* use filename provided as 1st argument (stdin by default) */
    FILE *fp = argc > 1 ? fopen (argv[1], "r") : stdin;

    if (!fp) {  /* validate file open for reading */
        perror ("file open failed");
        return 1;
    }

    if (!list_from_csv (&list, fp))
        return 1;

    if (fp != stdin)   /* close file if not stdin */
        fclose (fp);

    prn_list (&list);
    del_list (&list);
}

使用/输出示例

将输入文件放在中dat/customer_list.txt，运行该程序，您将收到：

$ ./bin/customer_list dat/customer_list.txt

Customer ID: 1403201156540201
Name: Katherine_Hamilton
Phone Number: 2226179183
Address: 87_Thompson_St.
City: Fremont
State Code: IA
PIN: 502645
Email: [email protected]

Customer ID: 2204201532220103
Name: Marc_Knight
Phone Number: 8023631298
Address: -
City: -
State Code: -
PIN: -
Email: -

Customer ID: 305201423120305
Name: Albie_Rowland
Phone Number: 8025595163
Address: -
City: Hamburg
State Code: NY
PIN: 140752
Email: -

Customer ID: 607201232220901
Name: Grant_Phelps
Phone Number: 4055218053
Address: -
City: -
State Code: -
PIN: -
Email: -

内存使用/错误检查

在您编写的任何动态分配内存的代码中，对于任何分配的内存块，您都有2个责任：（1）始终保留指向该内存块的起始地址的指针，因此，（2）在没有内存块时可以将其释放需要更长的时间。

必须使用一个内存错误检查程序来确保您不尝试访问内存或不要在已分配的块的边界之外/之外写，尝试读取或基于未初始化的值进行条件跳转，最后确认您可以释放已分配的所有内存。

对于Linuxvalgrind是正常的选择。每个平台都有类似的内存检查器。它们都很容易使用，只需通过它运行程序即可。

$ valgrind ./bin/customer_list dat/customer_list.txt
==14823== Memcheck, a memory error detector
==14823== Copyright (C) 2002-2017, and GNU GPL'd, by Julian Seward et al.
==14823== Using Valgrind-3.13.0 and LibVEX; rerun with -h for copyright info
==14823== Command: ./bin/customer_list dat/customer_list.txt
==14823==

Customer ID: 1403201156540201
Name: Katherine_Hamilton
Phone Number: 2226179183
Address: 87_Thompson_St.
City: Fremont
State Code: IA
PIN: 502645
Email: [email protected]

<snipped rest>

==14823==
==14823== HEAP SUMMARY:
==14823==     in use at exit: 0 bytes in 0 blocks
==14823==   total heap usage: 7 allocs, 7 frees, 6,728 bytes allocated
==14823==
==14823== All heap blocks were freed -- no leaks are possible
==14823==
==14823== For counts of detected and suppressed errors, rerun with: -v
==14823== ERROR SUMMARY: 0 errors from 0 contexts (suppressed: 0 from 0)

始终确认已释放已分配的所有内存，并且没有内存错误。

尽管仅通过确保每个字符串都有足够的存储空间就可以解决问题的很大一部分，但是请花一些时间思考使用sscanf()和进行值解析的方法，并且由于您控制了转换，因此无需删除路径中的尾部'\n'。行从文件中读取。（只是不要在从输入字符串解析的值中包含换行符）如果您确实想'\n'从头开始解析，则应使用，例如

    str[strcspn (str, "\n")] = 0;

最后，使用sscanf()和一起使用的格式字符串strcspn()，请确保您完全了解它们的工作原理，请参见man 3 scanf和man 3 strspn

如果您还有其他问题，请告诉我。

本文收集自互联网，转载请注明来源。

如有侵权，请联系 [email protected] 删除。

编辑于 2021-01-27

我来说两句

0 条评论

登录后参与评论

上一篇：PHP中的RESTful API，$。ajax方法无法获取GET返回的数据

TOP 榜单

文章

如何在链接列表中存储CSV文件的内容？

如何在链接列表中存储CSV文件的内容？

Android Studio Kotlin：提取为常量

计算数据帧R中的字符串频率

如何使用Redux-Toolkit重置Redux Store

http：// localhost：3000 /＃！/为什么我在localhost链接中得到“＃！/”。

如何使用tweepy流式传输来自指定用户的推文（仅在该用户发布推文时流式传输）

TreeMap中的自定义排序

TYPO3：将 Formhandler 添加到新闻扩展

遍历元素数组以每X秒在浏览器上显示

在Ubuntu和Windows中，触摸板有时会滞后。硬件问题？

警告消息：在matrix（unlist（drop.item），ncol = 10，byrow = TRUE）中：数据长度[16]不是列数的倍数[10]>？

无法连接网络并在Ubuntu 14.04中找到eth0

将辅助轴原点与主要轴对齐

我可以ping IPv6但不能ping IPv4

在Jenkins服务器中使用Selenium和Ruby进行的黄瓜测试失败，但在本地计算机中通过

提交html表单时为空

使用C ++ 11将数组设置为零

如果从DB接收到的值为空，则JMeter JDBC调用将返回该值作为参数名称

尝试在Dell XPS13 9360上安装Windows 7时出错

如何在R中转置数据

无法使用 envoy 访问 .ssh/config

未捕获的SyntaxError：带有Ajax帖子的意外令牌u