zoukankan      html  css  js  c++  java
  • pandas(七):列表转字典、map使用、为csv加表头

    一、代码

    def clean():
        """Re-encode the string labels of the raw dataset splits as integer ids.

        Reads the tab-separated, header-less files ``train.txt``, ``val.txt``
        and ``test.txt`` from the ``raw`` directory (two columns: sentence,
        label), builds one label -> id mapping over all three splits, and
        writes to the ``data`` directory:

        * ``class.txt`` -- one label per line; the line index is the label id.
        * ``train.txt``, ``dev.txt``, ``test.txt`` -- tab-separated
          ``sentence<TAB>label_id`` rows, without header or index column.

        ``raw``, ``data``, ``pd`` and ``os`` are expected to be defined at
        module level; they are not part of this function.

        Returns:
            None. The results are written to disk and echoed with ``print``.
        """
        # (file name under ``raw``, file name under ``data``); the validation
        # split is renamed from "val" to "dev" on output.
        splits = [
            ("train.txt", "train.txt"),
            ("val.txt", "dev.txt"),
            ("test.txt", "test.txt"),
        ]

        frames = [
            pd.read_csv(
                os.path.join(raw, source_name),
                sep="\t",
                header=None,
                names=["s", "l"],
            )
            for source_name, _ in splits
        ]

        # Collect the labels of every split so the mapping covers all of them.
        all_labels = set()
        for frame in frames:
            all_labels.update(frame["l"].tolist())

        # Sort so that the ids (and class.txt) are identical on every run;
        # plain set iteration order varies with string hash randomisation.
        label_list = sorted(all_labels)
        label_dict = {label: index for index, label in enumerate(label_list)}
        print(label_list)
        print(label_dict)

        with open(os.path.join(data, "class.txt"), "w", encoding="utf8") as f:
            f.writelines(f"{label}\n" for label in label_list)

        for (_, target_name), frame in zip(splits, frames):
            label_ids = [label_dict[label] for label in frame["l"].tolist()]
            print(label_ids)

            # Column names are never written out (header=False); they only
            # fix the column order: sentence first, label id second.
            encoded = pd.DataFrame({"setence": frame["s"].tolist(), "label": label_ids})
            encoded.to_csv(
                os.path.join(data, target_name),
                sep="\t",
                encoding="utf8",
                header=False,
                index=False,
            )
  • 相关阅读:
    svn ------ 在服务器上创建项目并提交程序到服务器
    攀岩墙
    群晖docker安装sqli-lab
    win10 hyper-v与VMware冲突解决
    vue3 封装仿antd-vue的Table组件基本实现
    vue3自定义Table组件源码
    idea怎样修改tomcat启动的初始页面
    解决用java代码导入数据到mysql乱码问题
    day01-Markdown语法详解
    windows 10 如何管理自己的磁盘
  • 原文地址:https://www.cnblogs.com/zhangxianrong/p/15258001.html
Copyright © 2011-2022 走看看