Spaces:
Running
Running
adds packing argument to gpt oss custom config
Browse files
config/train_gpt_oss_custom.py
CHANGED
@@ -92,6 +92,9 @@ class GPTOSSEnhancedCustomConfig:
|
|
92 |
save_steps: int = 500 # Save checkpoint every N steps
|
93 |
save_total_limit: Optional[int] = 3 # Keep only N best checkpoints
|
94 |
save_only_model: bool = False # Save only model weights
|
|
|
|
|
|
|
95 |
|
96 |
# Model Selection
|
97 |
metric_for_best_model: str = "eval_loss"
|
|
|
92 |
save_steps: int = 500 # Save checkpoint every N steps
|
93 |
save_total_limit: Optional[int] = 3 # Keep only N best checkpoints
|
94 |
save_only_model: bool = False # Save only model weights
|
95 |
+
# TRL packing (token packing of multiple samples into a single sequence)
|
96 |
+
# Some configs (e.g., openhermes_fr_memory_optimized) set this to True
|
97 |
+
packing: bool = False
|
98 |
|
99 |
# Model Selection
|
100 |
metric_for_best_model: str = "eval_loss"
|