summaryrefslogtreecommitdiff
path: root/test.py
blob: f4d1e1856d5f7db36d10d54e98d7efcf5e9b3f51 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
import csv
import pandas as pd
import _pickle as pkl


def trans_csv_to_pickle(filename):
    """Parse the ``features`` column of a CSV and save it as CSV and pickle.

    Each ``features`` cell is read as text, every occurrence of ``inf`` in it
    is replaced by ``100000000.0``, and the text is then evaluated as a Python
    expression (presumably a list of floats -- confirm against the producer of
    the CSV). Rows whose text references an unknown name (for example ``nan``)
    are printed and skipped. The kept rows, i.e. the parsed features together
    with the label cast to ``int``, keep their original row index.

    The resulting table is written back to ``filename`` (overwriting the input
    CSV) and pickled next to it under the same name with a ``.pkl`` extension.

    Args:
        filename: Path of the CSV file to read. It must contain ``features``
            and ``label`` columns.

    Raises:
        ValueError: If the CSV has no ``features`` column.
        KeyError: If the CSV has no ``label`` column.
    """
    import os  # local import: only needed to derive the pickle path

    df = pd.read_csv(filename)
    if "features" not in df.columns:
        raise ValueError("'features' column not found in " + str(filename))
    print(df)

    kept_index = []
    rows = []
    for i, raw, label in zip(df.index, df["features"], df["label"]):
        text = raw.replace("inf", str(100000000.0))
        try:
            # NOTE(security): eval() executes arbitrary code found in the CSV.
            # Only run this on trusted files.
            features = eval(text)
        except NameError:
            # The text uses a name eval() cannot resolve; report the offending
            # row and skip it instead of evaluating it a second time.
            print(text)
            continue
        # Diagnostic only: report any element that is not a float.
        for feature in features:
            if not isinstance(feature, float):
                print(features)
                print(feature)
        kept_index.append(i)
        rows.append([features, int(label)])

    # Build the table once instead of growing it row by row.
    save_df = pd.DataFrame(rows, columns=["features", "label"], index=kept_index)
    print(save_df)
    if not save_df.empty:
        # Use the first kept row; row 0 may have been skipped.
        print(type(save_df.iloc[0]["features"]))

    # NOTE: this overwrites the input CSV with the parsed table (index included).
    save_df.to_csv(filename)

    # Swap only the file extension; a plain str.replace would also rewrite
    # "csv" inside directory names or the file stem.
    pkl_name = os.path.splitext(filename)[0] + ".pkl"
    with open(pkl_name, "wb") as f_pkl:
        pkl.dump(save_df, f_pkl)


# Script entry point: when executed directly, convert the default feature CSV.
if "__main__" == __name__:
    trans_csv_to_pickle(filename="result/ow_doh_features.csv")