forked from ZuowenWang0000/GRUBERT-A-GRU-Based-Method-to-Fuse-BERT-Hidden-Layers-for-Twitter-sentiment-analysis
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathmake_data.py
More file actions
20 lines (15 loc) · 692 Bytes
/
make_data.py
File metadata and controls
20 lines (15 loc) · 692 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
import pandas as pd
from collections import namedtuple
import os
from sklearn.model_selection import train_test_split
import numpy
import sys
def make_training_validation_split(path):
train_df = pd.read_csv(os.path.join(path, "train_split.csv"))
val_df = pd.read_csv(os.path.join(path, "val_split.csv"))
main_df = train_df.append(val_df)
train , val = train_test_split(main_df,stratify=main_df['label'],test_size=0.3,shuffle=True)
train.to_csv(os.path.join(path, "train_split_new.csv"), header=True,index=False)
val.to_csv(os.path.join(path, "val_split_new.csv"),header=True,index=False)
if __name__ == '__main__':
make_training_validation_split(sys.argv[1])