W&B: Improve resume stability (#6611)
Browse files
* log best.pt metrics at train end
* update
* Update __init__.py
* flush callbacks when using evolve
* remember batch size on resuming
* Update train.py
* improve stability of resume
Co-authored-by: Glenn Jocher <[email protected]>
utils/loggers/wandb/wandb_utils.py
CHANGED
@@ -225,9 +225,9 @@ class WandbLogger():
|
|
225 |
if modeldir:
|
226 |
self.weights = Path(modeldir) / "last.pt"
|
227 |
config = self.wandb_run.config
|
228 |
-
opt.weights, opt.save_period, opt.batch_size, opt.bbox_interval, opt.epochs, opt.hyp = str(
|
229 |
-
self.weights), config.save_period, config.batch_size, config.bbox_interval, config.epochs
|
230 |
-
|
231 |
data_dict = self.data_dict
|
232 |
if self.val_artifact is None: # If --upload_dataset is set, use the existing artifact, don't download
|
233 |
self.train_artifact_path, self.train_artifact = self.download_dataset_artifact(data_dict.get('train'),
|
|
|
225 |
if modeldir:
|
226 |
self.weights = Path(modeldir) / "last.pt"
|
227 |
config = self.wandb_run.config
|
228 |
+
opt.weights, opt.save_period, opt.batch_size, opt.bbox_interval, opt.epochs, opt.hyp, opt.imgsz = str(
|
229 |
+
self.weights), config.save_period, config.batch_size, config.bbox_interval, config.epochs,\
|
230 |
+
config.hyp, config.imgsz
|
231 |
data_dict = self.data_dict
|
232 |
if self.val_artifact is None: # If --upload_dataset is set, use the existing artifact, don't download
|
233 |
self.train_artifact_path, self.train_artifact = self.download_dataset_artifact(data_dict.get('train'),
|