CindyDelage committed on
Commit
8111552
·
verified ·
1 Parent(s): 80a180c

Update tasks/audio.py

Browse files
Files changed (1) hide show
  1. tasks/audio.py +2 -2
tasks/audio.py CHANGED
@@ -35,7 +35,7 @@ async def evaluate_audio(request: AudioEvaluationRequest):
35
 
36
  # Load dataset
37
  logging.info("Chargement des données")
38
- dataset = load_dataset(request.dataset_name, token=os.getenv("HF_TOKEN"))
39
  logging.info("Données chargées")
40
 
41
  test_dataset = dataset["test"]
@@ -51,7 +51,7 @@ async def evaluate_audio(request: AudioEvaluationRequest):
51
  audio_arrays = [x["array"] for x in examples["audio"]]
52
  return feature_extractor(audio_arrays, sampling_rate=feature_extractor.sampling_rate, padding="longest", max_length=16000, truncation=True, return_tensors="pt")
53
 
54
- encoded_data_test = test_dataset.map(preprocess_function, remove_columns="audio", batched=True, streaming=True, keep_in_memory=False)
55
  del feature_extractor
56
  del audio_arrays
57
  # Pipeline de classification
 
35
 
36
  # Load dataset
37
  logging.info("Chargement des données")
38
+ dataset = load_dataset(request.dataset_name, streaming=True,token=os.getenv("HF_TOKEN"))
39
  logging.info("Données chargées")
40
 
41
  test_dataset = dataset["test"]
 
51
  audio_arrays = [x["array"] for x in examples["audio"]]
52
  return feature_extractor(audio_arrays, sampling_rate=feature_extractor.sampling_rate, padding="longest", max_length=16000, truncation=True, return_tensors="pt")
53
 
54
+ encoded_data_test = test_dataset.map(preprocess_function, remove_columns="audio", batched=True, keep_in_memory=False)
55
  del feature_extractor
56
  del audio_arrays
57
  # Pipeline de classification