Spaces:
Running
Running
Yehor Smoliakov
committed on
Commit
·
32ee84e
1
Parent(s):
11961e0
Add a check for consistency
Browse files
app.py
CHANGED
@@ -107,12 +107,31 @@ def inference(file_name, _clear_punctuation, _show_chars, _batch_mode):
|
|
107 |
|
108 |
df = pl.read_ndjson(file_name)
|
109 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
110 |
inference_seconds = df["inference_total"].sum()
|
111 |
|
112 |
if _batch_mode:
|
113 |
-
if
|
114 |
raise gr.Error(
|
115 |
-
"Please
|
116 |
)
|
117 |
|
118 |
duration_seconds = 0
|
@@ -138,6 +157,11 @@ def inference(file_name, _clear_punctuation, _show_chars, _batch_mode):
|
|
138 |
for reference in references_batch:
|
139 |
references.extend(reference)
|
140 |
else:
|
|
|
|
|
|
|
|
|
|
|
141 |
duration_seconds = df["duration"].sum()
|
142 |
|
143 |
rtf = inference_seconds / duration_seconds
|
|
|
107 |
|
108 |
df = pl.read_ndjson(file_name)
|
109 |
|
110 |
+
required_columns = [
|
111 |
+
"filename",
|
112 |
+
"inference_start",
|
113 |
+
"inference_end",
|
114 |
+
"inference_total",
|
115 |
+
"duration",
|
116 |
+
"reference",
|
117 |
+
"prediction",
|
118 |
+
]
|
119 |
+
required_columns_batch = [
|
120 |
+
"inference_start",
|
121 |
+
"inference_end",
|
122 |
+
"inference_total",
|
123 |
+
"filenames",
|
124 |
+
"durations",
|
125 |
+
"references",
|
126 |
+
"predictions",
|
127 |
+
]
|
128 |
+
|
129 |
inference_seconds = df["inference_total"].sum()
|
130 |
|
131 |
if _batch_mode:
|
132 |
+
if not all(col in df.columns for col in required_columns_batch):
|
133 |
raise gr.Error(
|
134 |
+
f"Please provide a JSONL file with the following columns: {required_columns_batch}"
|
135 |
)
|
136 |
|
137 |
duration_seconds = 0
|
|
|
157 |
for reference in references_batch:
|
158 |
references.extend(reference)
|
159 |
else:
|
160 |
+
if not all(col in df.columns for col in required_columns):
|
161 |
+
raise gr.Error(
|
162 |
+
f"Please provide a JSONL file with the following columns: {required_columns}"
|
163 |
+
)
|
164 |
+
|
165 |
duration_seconds = df["duration"].sum()
|
166 |
|
167 |
rtf = inference_seconds / duration_seconds
|