flan-t5-small-gigatrue / coreconfig.json
Plasmoxy's picture
End of training
be98ce6 verified
raw
history blame contribute delete
689 Bytes
{
"out_name": "flan-t5-small-gigatrue",
"model_archetype": "flan-t5",
"model_name": "google/flan-t5-small",
"tokenizer_name": "google/flan-t5-small",
"model_torch_dtype": "bfloat16",
"dataset_lang": "en",
"dataset_name": "Plasmoxy/gigatrue",
"dataset_tokenized_cache_name": "gigatrue_tokenized_flan_t5_110-35",
"use_half_val_dataset": true,
"max_input_length": 110,
"max_target_length": 35,
"batch_size": 256,
"learning_rate": 0.0003,
"num_train_epochs": 3,
"pkg_versions": {
"optimum": "1.23.3",
"transformers": "4.45.2",
"openvino": "2024.6.0",
"nncf": "2.14.1",
"torch": "2.5.1",
"datasets": "3.2.0",
"peft": "0.13.3.dev0"
}
}