Yehor Smoliakov committed on
Commit
32ee84e
·
1 Parent(s): 11961e0

Add a check for consistency

Browse files
Files changed (1) hide show
  1. app.py +26 -2
app.py CHANGED
@@ -107,12 +107,31 @@ def inference(file_name, _clear_punctuation, _show_chars, _batch_mode):
107
 
108
  df = pl.read_ndjson(file_name)
109
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
110
  inference_seconds = df["inference_total"].sum()
111
 
112
  if _batch_mode:
113
- if "durations" not in df.columns:
114
  raise gr.Error(
115
- "Please use a JSONL file with 'durations' column for batch mode."
116
  )
117
 
118
  duration_seconds = 0
@@ -138,6 +157,11 @@ def inference(file_name, _clear_punctuation, _show_chars, _batch_mode):
138
  for reference in references_batch:
139
  references.extend(reference)
140
  else:
 
 
 
 
 
141
  duration_seconds = df["duration"].sum()
142
 
143
  rtf = inference_seconds / duration_seconds
 
107
 
108
  df = pl.read_ndjson(file_name)
109
 
110
+ required_columns = [
111
+ "filename",
112
+ "inference_start",
113
+ "inference_end",
114
+ "inference_total",
115
+ "duration",
116
+ "reference",
117
+ "prediction",
118
+ ]
119
+ required_columns_batch = [
120
+ "inference_start",
121
+ "inference_end",
122
+ "inference_total",
123
+ "filenames",
124
+ "durations",
125
+ "references",
126
+ "predictions",
127
+ ]
128
+
129
  inference_seconds = df["inference_total"].sum()
130
 
131
  if _batch_mode:
132
+ if not all(col in df.columns for col in required_columns_batch):
133
  raise gr.Error(
134
+ f"Please provide a JSONL file with the following columns: {required_columns_batch}"
135
  )
136
 
137
  duration_seconds = 0
 
157
  for reference in references_batch:
158
  references.extend(reference)
159
  else:
160
+ if not all(col in df.columns for col in required_columns):
161
+ raise gr.Error(
162
+ f"Please provide a JSONL file with the following columns: {required_columns}"
163
+ )
164
+
165
  duration_seconds = df["duration"].sum()
166
 
167
  rtf = inference_seconds / duration_seconds