gagan3012 committed on
Commit
dd353f6
·
1 Parent(s): fc96e58

split added

Browse files
Files changed (1) hide show
  1. src/data/process_data.py +1 -1
src/data/process_data.py CHANGED
@@ -11,7 +11,7 @@ def process_data(split='train'):
11
  df = pd.read_csv('data/raw/{}.csv'.format(split))
12
  df.columns = ['Unnamed: 0', 'input_text', 'output_text']
13
  df = df.sample(frac=params['split'], replace=True, random_state=1)
14
- if os.path.exists("data/raw/{}.csv"):
15
  os.remove("data/raw/{}.csv".format(split))
16
  df.to_csv('data/processed/{}.csv'.format(split))
17
 
 
11
  df = pd.read_csv('data/raw/{}.csv'.format(split))
12
  df.columns = ['Unnamed: 0', 'input_text', 'output_text']
13
  df = df.sample(frac=params['split'], replace=True, random_state=1)
14
+ if os.path.exists("data/raw/{}.csv".format(split)):
15
  os.remove("data/raw/{}.csv".format(split))
16
  df.to_csv('data/processed/{}.csv'.format(split))
17