Spaces:
Sleeping
Sleeping
Update tasks/audio.py
Browse files
- tasks/audio.py +2 -2
tasks/audio.py
CHANGED
@@ -35,7 +35,7 @@ async def evaluate_audio(request: AudioEvaluationRequest):
|
|
35 |
|
36 |
# Load dataset
|
37 |
logging.info("Chargement des données")
|
38 |
-
dataset = load_dataset(request.dataset_name, token=os.getenv("HF_TOKEN"))
|
39 |
logging.info("Données chargées")
|
40 |
|
41 |
test_dataset = dataset["test"]
|
@@ -51,7 +51,7 @@ async def evaluate_audio(request: AudioEvaluationRequest):
|
|
51 |
audio_arrays = [x["array"] for x in examples["audio"]]
|
52 |
return feature_extractor(audio_arrays, sampling_rate=feature_extractor.sampling_rate, padding="longest", max_length=16000, truncation=True, return_tensors="pt")
|
53 |
|
54 |
-
encoded_data_test = test_dataset.map(preprocess_function, remove_columns="audio", batched=True,
|
55 |
del feature_extractor
|
56 |
del audio_arrays
|
57 |
# Pipeline de classification
|
|
|
35 |
|
36 |
# Load dataset
|
37 |
logging.info("Chargement des données")
|
38 |
+
dataset = load_dataset(request.dataset_name, streaming=True,token=os.getenv("HF_TOKEN"))
|
39 |
logging.info("Données chargées")
|
40 |
|
41 |
test_dataset = dataset["test"]
|
|
|
51 |
audio_arrays = [x["array"] for x in examples["audio"]]
|
52 |
return feature_extractor(audio_arrays, sampling_rate=feature_extractor.sampling_rate, padding="longest", max_length=16000, truncation=True, return_tensors="pt")
|
53 |
|
54 |
+
encoded_data_test = test_dataset.map(preprocess_function, remove_columns="audio", batched=True, keep_in_memory=False)
|
55 |
del feature_extractor
|
56 |
del audio_arrays
|
57 |
# Pipeline de classification
|