vit-base-brain-tumor-detection2 / trainer_state.json

dhritic99/model99123

3644836 verified 6 months ago

7.98 kB

	{
	"best_metric": 0.38773971796035767,
	"best_model_checkpoint": "./vit-base-brain-tumor-detection2/checkpoint-1500",
	"epoch": 30.0,
	"eval_steps": 500,
	"global_step": 1920,
	"is_hyper_param_search": false,
	"is_local_process_zero": true,
	"is_world_process_zero": true,
	"log_history": [
	{
	"epoch": 0.78125,
	"grad_norm": 1.7783442735671997,
	"learning_rate": 2.5000000000000004e-07,
	"loss": 1.3686,
	"step": 50
	},
	{
	"epoch": 1.5625,
	"grad_norm": 1.8243844509124756,
	"learning_rate": 5.000000000000001e-07,
	"loss": 1.3468,
	"step": 100
	},
	{
	"epoch": 2.34375,
	"grad_norm": 2.272806167602539,
	"learning_rate": 7.5e-07,
	"loss": 1.2931,
	"step": 150
	},
	{
	"epoch": 3.125,
	"grad_norm": 1.0346544981002808,
	"learning_rate": 1.0000000000000002e-06,
	"loss": 1.1861,
	"step": 200
	},
	{
	"epoch": 3.90625,
	"grad_norm": 0.897363007068634,
	"learning_rate": 1.25e-06,
	"loss": 1.092,
	"step": 250
	},
	{
	"epoch": 4.6875,
	"grad_norm": 1.0376484394073486,
	"learning_rate": 1.5e-06,
	"loss": 1.0504,
	"step": 300
	},
	{
	"epoch": 5.46875,
	"grad_norm": 1.2069748640060425,
	"learning_rate": 1.75e-06,
	"loss": 0.993,
	"step": 350
	},
	{
	"epoch": 6.25,
	"grad_norm": 1.41449773311615,
	"learning_rate": 2.0000000000000003e-06,
	"loss": 0.9428,
	"step": 400
	},
	{
	"epoch": 7.03125,
	"grad_norm": 3.5506372451782227,
	"learning_rate": 2.25e-06,
	"loss": 0.9065,
	"step": 450
	},
	{
	"epoch": 7.8125,
	"grad_norm": 2.408358573913574,
	"learning_rate": 2.5e-06,
	"loss": 0.8758,
	"step": 500
	},
	{
	"epoch": 7.8125,
	"eval_accuracy": 0.6181640625,
	"eval_loss": 0.891155481338501,
	"eval_runtime": 5.9944,
	"eval_samples_per_second": 170.826,
	"eval_steps_per_second": 21.353,
	"step": 500
	},
	{
	"epoch": 8.59375,
	"grad_norm": 4.127248764038086,
	"learning_rate": 2.7500000000000004e-06,
	"loss": 0.8371,
	"step": 550
	},
	{
	"epoch": 9.375,
	"grad_norm": 4.548064231872559,
	"learning_rate": 3e-06,
	"loss": 0.7951,
	"step": 600
	},
	{
	"epoch": 10.15625,
	"grad_norm": 7.226322174072266,
	"learning_rate": 3.2500000000000002e-06,
	"loss": 0.7666,
	"step": 650
	},
	{
	"epoch": 10.9375,
	"grad_norm": 4.653890132904053,
	"learning_rate": 3.5e-06,
	"loss": 0.7219,
	"step": 700
	},
	{
	"epoch": 11.71875,
	"grad_norm": 3.7779295444488525,
	"learning_rate": 3.7500000000000005e-06,
	"loss": 0.6926,
	"step": 750
	},
	{
	"epoch": 12.5,
	"grad_norm": 3.6519362926483154,
	"learning_rate": 4.000000000000001e-06,
	"loss": 0.646,
	"step": 800
	},
	{
	"epoch": 13.28125,
	"grad_norm": 24.227773666381836,
	"learning_rate": 4.25e-06,
	"loss": 0.6269,
	"step": 850
	},
	{
	"epoch": 14.0625,
	"grad_norm": 8.960350036621094,
	"learning_rate": 4.5e-06,
	"loss": 0.5882,
	"step": 900
	},
	{
	"epoch": 14.84375,
	"grad_norm": 6.60162878036499,
	"learning_rate": 4.75e-06,
	"loss": 0.544,
	"step": 950
	},
	{
	"epoch": 15.625,
	"grad_norm": 10.583850860595703,
	"learning_rate": 5e-06,
	"loss": 0.5256,
	"step": 1000
	},
	{
	"epoch": 15.625,
	"eval_accuracy": 0.7607421875,
	"eval_loss": 0.6331567764282227,
	"eval_runtime": 5.4782,
	"eval_samples_per_second": 186.924,
	"eval_steps_per_second": 23.365,
	"step": 1000
	},
	{
	"epoch": 16.40625,
	"grad_norm": 3.9983010292053223,
	"learning_rate": 4.999850432733413e-06,
	"loss": 0.4768,
	"step": 1050
	},
	{
	"epoch": 17.1875,
	"grad_norm": 12.768200874328613,
	"learning_rate": 4.999401748829942e-06,
	"loss": 0.4863,
	"step": 1100
	},
	{
	"epoch": 17.96875,
	"grad_norm": 14.71330451965332,
	"learning_rate": 4.9986540019763296e-06,
	"loss": 0.4181,
	"step": 1150
	},
	{
	"epoch": 18.75,
	"grad_norm": 9.602484703063965,
	"learning_rate": 4.997607281643338e-06,
	"loss": 0.3901,
	"step": 1200
	},
	{
	"epoch": 19.53125,
	"grad_norm": 27.293039321899414,
	"learning_rate": 4.996261713075046e-06,
	"loss": 0.3496,
	"step": 1250
	},
	{
	"epoch": 20.3125,
	"grad_norm": 3.6233201026916504,
	"learning_rate": 4.994617457273862e-06,
	"loss": 0.3312,
	"step": 1300
	},
	{
	"epoch": 21.09375,
	"grad_norm": 11.52304458618164,
	"learning_rate": 4.992674710981266e-06,
	"loss": 0.2929,
	"step": 1350
	},
	{
	"epoch": 21.875,
	"grad_norm": 6.805290222167969,
	"learning_rate": 4.990433706654258e-06,
	"loss": 0.2653,
	"step": 1400
	},
	{
	"epoch": 22.65625,
	"grad_norm": 15.234956741333008,
	"learning_rate": 4.987894712437552e-06,
	"loss": 0.2635,
	"step": 1450
	},
	{
	"epoch": 23.4375,
	"grad_norm": 3.9582715034484863,
	"learning_rate": 4.985058032131488e-06,
	"loss": 0.2247,
	"step": 1500
	},
	{
	"epoch": 23.4375,
	"eval_accuracy": 0.8935546875,
	"eval_loss": 0.38773971796035767,
	"eval_runtime": 5.9931,
	"eval_samples_per_second": 170.863,
	"eval_steps_per_second": 21.358,
	"step": 1500
	},
	{
	"epoch": 24.21875,
	"grad_norm": 3.0134124755859375,
	"learning_rate": 4.98192400515568e-06,
	"loss": 0.1965,
	"step": 1550
	},
	{
	"epoch": 25.0,
	"grad_norm": 5.4471540451049805,
	"learning_rate": 4.978564534206973e-06,
	"loss": 0.193,
	"step": 1600
	},
	{
	"epoch": 25.78125,
	"grad_norm": 11.847530364990234,
	"learning_rate": 4.974842901390282e-06,
	"loss": 0.1709,
	"step": 1650
	},
	{
	"epoch": 26.5625,
	"grad_norm": 4.015501022338867,
	"learning_rate": 4.970825144183195e-06,
	"loss": 0.158,
	"step": 1700
	},
	{
	"epoch": 27.34375,
	"grad_norm": 4.216943264007568,
	"learning_rate": 4.966511743325682e-06,
	"loss": 0.1452,
	"step": 1750
	},
	{
	"epoch": 28.125,
	"grad_norm": 23.560443878173828,
	"learning_rate": 4.961903214932604e-06,
	"loss": 0.1288,
	"step": 1800
	},
	{
	"epoch": 28.90625,
	"grad_norm": 0.9162831902503967,
	"learning_rate": 4.957000110431956e-06,
	"loss": 0.1195,
	"step": 1850
	},
	{
	"epoch": 29.6875,
	"grad_norm": 2.046557664871216,
	"learning_rate": 4.95180301649889e-06,
	"loss": 0.1002,
	"step": 1900
	},
	{
	"epoch": 30.0,
	"step": 1920,
	"total_flos": 9.52238637305561e+18,
	"train_loss": 0.5872499863306682,
	"train_runtime": 1494.2494,
	"train_samples_per_second": 82.235,
	"train_steps_per_second": 1.285
	}
	],
	"logging_steps": 50,
	"max_steps": 1920,
	"num_input_tokens_seen": 0,
	"num_train_epochs": 30,
	"save_steps": 500,
	"stateful_callbacks": {
	"EarlyStoppingCallback": {
	"args": {
	"early_stopping_patience": 5,
	"early_stopping_threshold": 0.0
	},
	"attributes": {
	"early_stopping_patience_counter": 0
	}
	},
	"TrainerControl": {
	"args": {
	"should_epoch_stop": false,
	"should_evaluate": false,
	"should_log": false,
	"should_save": true,
	"should_training_stop": true
	},
	"attributes": {}
	}
	},
	"total_flos": 9.52238637305561e+18,
	"train_batch_size": 8,
	"trial_name": null,
	"trial_params": null
	}