datascienceharp committed on
Commit
d650f60
·
1 Parent(s): e3c4fa8
Files changed (2) hide show
  1. data_curation.py +2 -3
  2. script.py +5 -5
data_curation.py CHANGED
@@ -21,7 +21,7 @@ def take_random_sample(dataset):
21
  """Take a sample from the dataset"""
22
  return dataset.take(size=10,seed=51)
23
 
24
- def prepare_dataset(name):
25
  """
26
  Prepare the dataset for model training.
27
 
@@ -57,5 +57,4 @@ def prepare_dataset(name):
57
  dataset = take_random_sample(dataset)
58
 
59
  # Return the curated dataset
60
- curated_dataset = dataset.clone()
61
- return curated_dataset
 
21
  """Take a sample from the dataset"""
22
  return dataset.take(size=10,seed=51)
23
 
24
+ def prepare_dataset(name="Voxel51/Data-Centric-Visual-AI-Challenge-Train-Set"):
25
  """
26
  Prepare the dataset for model training.
27
 
 
57
  dataset = take_random_sample(dataset)
58
 
59
  # Return the curated dataset
60
+ curated_dataset = dataset.clone(name="curated_dataset")
 
script.py CHANGED
@@ -12,16 +12,13 @@ Your predictions must be in a label_field called "predictions" in the dataset.
12
  See here for more details about hyperparameters for this model: https://docs.ultralytics.com/modes/train/#train-settings
13
  """
14
  import os
15
- from datetime import datetime
16
- from math import log
17
  import yaml
18
 
19
  import fiftyone as fo
20
  import fiftyone.utils.random as four
21
  import fiftyone.utils.huggingface as fouh
22
 
23
- from ultralytics import YOLO
24
-
25
  from data_curation import prepare_dataset
26
 
27
  def export_to_yolo_format(
@@ -68,7 +65,10 @@ def train_model(training_dataset, training_config):
68
  """
69
  Train the YOLO model on the given dataset using the provided configuration.
70
  """
71
- print("Starting the training process...")
 
 
 
72
 
73
  print("Splitting the dataset...")
74
  four.random_split(training_dataset, {"train": training_config['train_split'], "val": training_config['val_split']})
 
12
  See here for more details about hyperparameters for this model: https://docs.ultralytics.com/modes/train/#train-settings
13
  """
14
  import os
15
+
 
16
  import yaml
17
 
18
  import fiftyone as fo
19
  import fiftyone.utils.random as four
20
  import fiftyone.utils.huggingface as fouh
21
 
 
 
22
  from data_curation import prepare_dataset
23
 
24
  def export_to_yolo_format(
 
65
  """
66
  Train the YOLO model on the given dataset using the provided configuration.
67
  """
68
+ training_dataset = fouh.load_from_hub(
69
+ "Voxel51/Data-Centric-Visual-AI-Challenge-Train-Set",
70
+ max_samples=100 #for testing remove this later
71
+ )
72
 
73
  print("Splitting the dataset...")
74
  four.random_split(training_dataset, {"train": training_config['train_split'], "val": training_config['val_split']})