CoderCowMoo
committed on
Commit
·
950d2dd
1
Parent(s):
d015833
Upload model, config, vocab and training log
Browse files
- best_model.pth +3 -0
- config.json +159 -0
- trainer_0_log.txt +211 -0
- vocab.json +0 -0
best_model.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd02035aa2815b805f1db26f4cce42a2cfbe30ca0c4825f432961bc74aa4b420
|
3 |
+
size 5607926869
|
config.json
ADDED
@@ -0,0 +1,159 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"output_path": "output",
|
3 |
+
"logger_uri": null,
|
4 |
+
"run_name": "run",
|
5 |
+
"project_name": null,
|
6 |
+
"run_description": "\ud83d\udc38Coqui trainer run.",
|
7 |
+
"print_step": 25,
|
8 |
+
"plot_step": 100,
|
9 |
+
"model_param_stats": false,
|
10 |
+
"wandb_entity": null,
|
11 |
+
"dashboard_logger": "tensorboard",
|
12 |
+
"save_on_interrupt": true,
|
13 |
+
"log_model_step": null,
|
14 |
+
"save_step": 10000,
|
15 |
+
"save_n_checkpoints": 5,
|
16 |
+
"save_checkpoints": true,
|
17 |
+
"save_all_best": false,
|
18 |
+
"save_best_after": 10000,
|
19 |
+
"target_loss": null,
|
20 |
+
"print_eval": false,
|
21 |
+
"test_delay_epochs": 0,
|
22 |
+
"run_eval": true,
|
23 |
+
"run_eval_steps": null,
|
24 |
+
"distributed_backend": "nccl",
|
25 |
+
"distributed_url": "tcp://localhost:54321",
|
26 |
+
"mixed_precision": false,
|
27 |
+
"precision": "fp16",
|
28 |
+
"epochs": 1000,
|
29 |
+
"batch_size": 32,
|
30 |
+
"eval_batch_size": 16,
|
31 |
+
"grad_clip": 0.0,
|
32 |
+
"scheduler_after_epoch": true,
|
33 |
+
"lr": 0.001,
|
34 |
+
"optimizer": "radam",
|
35 |
+
"optimizer_params": null,
|
36 |
+
"lr_scheduler": null,
|
37 |
+
"lr_scheduler_params": {},
|
38 |
+
"use_grad_scaler": false,
|
39 |
+
"allow_tf32": false,
|
40 |
+
"cudnn_enable": true,
|
41 |
+
"cudnn_deterministic": false,
|
42 |
+
"cudnn_benchmark": false,
|
43 |
+
"training_seed": 54321,
|
44 |
+
"model": "xtts",
|
45 |
+
"num_loader_workers": 0,
|
46 |
+
"num_eval_loader_workers": 0,
|
47 |
+
"use_noise_augment": false,
|
48 |
+
"audio": {
|
49 |
+
"sample_rate": 22050,
|
50 |
+
"output_sample_rate": 24000
|
51 |
+
},
|
52 |
+
"use_phonemes": false,
|
53 |
+
"phonemizer": null,
|
54 |
+
"phoneme_language": null,
|
55 |
+
"compute_input_seq_cache": false,
|
56 |
+
"text_cleaner": null,
|
57 |
+
"enable_eos_bos_chars": false,
|
58 |
+
"test_sentences_file": "",
|
59 |
+
"phoneme_cache_path": null,
|
60 |
+
"characters": null,
|
61 |
+
"add_blank": false,
|
62 |
+
"batch_group_size": 0,
|
63 |
+
"loss_masking": null,
|
64 |
+
"min_audio_len": 1,
|
65 |
+
"max_audio_len": Infinity,
|
66 |
+
"min_text_len": 1,
|
67 |
+
"max_text_len": Infinity,
|
68 |
+
"compute_f0": false,
|
69 |
+
"compute_energy": false,
|
70 |
+
"compute_linear_spec": false,
|
71 |
+
"precompute_num_workers": 0,
|
72 |
+
"start_by_longest": false,
|
73 |
+
"shuffle": false,
|
74 |
+
"drop_last": false,
|
75 |
+
"datasets": [
|
76 |
+
{
|
77 |
+
"formatter": "",
|
78 |
+
"dataset_name": "",
|
79 |
+
"path": "",
|
80 |
+
"meta_file_train": "",
|
81 |
+
"ignored_speakers": null,
|
82 |
+
"language": "",
|
83 |
+
"phonemizer": "",
|
84 |
+
"meta_file_val": "",
|
85 |
+
"meta_file_attn_mask": ""
|
86 |
+
}
|
87 |
+
],
|
88 |
+
"test_sentences": [],
|
89 |
+
"eval_split_max_size": null,
|
90 |
+
"eval_split_size": 0.01,
|
91 |
+
"use_speaker_weighted_sampler": false,
|
92 |
+
"speaker_weighted_sampler_alpha": 1.0,
|
93 |
+
"use_language_weighted_sampler": false,
|
94 |
+
"language_weighted_sampler_alpha": 1.0,
|
95 |
+
"use_length_weighted_sampler": false,
|
96 |
+
"length_weighted_sampler_alpha": 1.0,
|
97 |
+
"model_args": {
|
98 |
+
"gpt_batch_size": 1,
|
99 |
+
"enable_redaction": false,
|
100 |
+
"kv_cache": true,
|
101 |
+
"gpt_checkpoint": null,
|
102 |
+
"clvp_checkpoint": null,
|
103 |
+
"decoder_checkpoint": null,
|
104 |
+
"num_chars": 255,
|
105 |
+
"tokenizer_file": "",
|
106 |
+
"gpt_max_audio_tokens": 605,
|
107 |
+
"gpt_max_text_tokens": 402,
|
108 |
+
"gpt_max_prompt_tokens": 70,
|
109 |
+
"gpt_layers": 30,
|
110 |
+
"gpt_n_model_channels": 1024,
|
111 |
+
"gpt_n_heads": 16,
|
112 |
+
"gpt_number_text_tokens": 6681,
|
113 |
+
"gpt_start_text_token": null,
|
114 |
+
"gpt_stop_text_token": null,
|
115 |
+
"gpt_num_audio_tokens": 1026,
|
116 |
+
"gpt_start_audio_token": 1024,
|
117 |
+
"gpt_stop_audio_token": 1025,
|
118 |
+
"gpt_code_stride_len": 1024,
|
119 |
+
"gpt_use_masking_gt_prompt_approach": true,
|
120 |
+
"gpt_use_perceiver_resampler": true,
|
121 |
+
"input_sample_rate": 22050,
|
122 |
+
"output_sample_rate": 24000,
|
123 |
+
"output_hop_length": 256,
|
124 |
+
"decoder_input_dim": 1024,
|
125 |
+
"d_vector_dim": 512,
|
126 |
+
"cond_d_vector_in_each_upsampling_layer": true,
|
127 |
+
"duration_const": 102400
|
128 |
+
},
|
129 |
+
"model_dir": null,
|
130 |
+
"languages": [
|
131 |
+
"en",
|
132 |
+
"es",
|
133 |
+
"fr",
|
134 |
+
"de",
|
135 |
+
"it",
|
136 |
+
"pt",
|
137 |
+
"pl",
|
138 |
+
"tr",
|
139 |
+
"ru",
|
140 |
+
"nl",
|
141 |
+
"cs",
|
142 |
+
"ar",
|
143 |
+
"zh-cn",
|
144 |
+
"hu",
|
145 |
+
"ko",
|
146 |
+
"ja",
|
147 |
+
"hi"
|
148 |
+
],
|
149 |
+
"temperature": 0.75,
|
150 |
+
"length_penalty": 1.0,
|
151 |
+
"repetition_penalty": 5.0,
|
152 |
+
"top_k": 50,
|
153 |
+
"top_p": 0.85,
|
154 |
+
"num_gpt_outputs": 1,
|
155 |
+
"gpt_cond_len": 30,
|
156 |
+
"gpt_cond_chunk_len": 4,
|
157 |
+
"max_ref_len": 30,
|
158 |
+
"sound_norm_refs": false
|
159 |
+
}
|
trainer_0_log.txt
ADDED
@@ -0,0 +1,211 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
> Training Environment:
|
2 |
+
| > Backend: Torch
|
3 |
+
| > Mixed precision: False
|
4 |
+
| > Precision: float32
|
5 |
+
| > Current device: 0
|
6 |
+
| > Num. of GPUs: 1
|
7 |
+
| > Num. of CPUs: 2
|
8 |
+
| > Num. of Torch Threads: 1
|
9 |
+
| > Torch seed: 1
|
10 |
+
| > Torch CUDNN: True
|
11 |
+
| > Torch CUDNN deterministic: False
|
12 |
+
| > Torch CUDNN benchmark: False
|
13 |
+
| > Torch TF32 MatMul: False
|
14 |
+
> Start Tensorboard: tensorboard --logdir=/tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000
|
15 |
+
|
16 |
+
> Model has 518442047 parameters
|
17 |
+
|
18 |
+
[4m[1m > EPOCH: 0/8[0m
|
19 |
+
--> /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000
|
20 |
+
|
21 |
+
[1m > TRAINING (2023-12-04 15:00:11) [0m
|
22 |
+
|
23 |
+
[1m --> TIME: 2023-12-04 15:00:19 -- STEP: 0/40 -- GLOBAL_STEP: 0[0m
|
24 |
+
| > loss_text_ce: 0.021964602172374725 (0.021964602172374725)
|
25 |
+
| > loss_mel_ce: 4.907757759094238 (4.907757759094238)
|
26 |
+
| > loss: 4.929722309112549 (4.929722309112549)
|
27 |
+
| > grad_norm: 0 (0)
|
28 |
+
| > current_lr: 5e-06
|
29 |
+
| > step_time: 1.4868 (1.4868354797363281)
|
30 |
+
| > loader_time: 6.5441 (6.544092655181885)
|
31 |
+
|
32 |
+
|
33 |
+
[1m > EVALUATION [0m
|
34 |
+
|
35 |
+
|
36 |
+
[1m--> EVAL PERFORMANCE[0m
|
37 |
+
| > avg_loader_time: 0.07195439338684081 [0m(+0)
|
38 |
+
| > avg_loss_text_ce: 0.021994752064347266 [0m(+0)
|
39 |
+
| > avg_loss_mel_ce: 3.3762893676757812 [0m(+0)
|
40 |
+
| > avg_loss: 3.398284101486206 [0m(+0)
|
41 |
+
|
42 |
+
> BEST MODEL : /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000/best_model_40.pth
|
43 |
+
|
44 |
+
[4m[1m > EPOCH: 1/8[0m
|
45 |
+
--> /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000
|
46 |
+
|
47 |
+
[1m > TRAINING (2023-12-04 15:02:56) [0m
|
48 |
+
|
49 |
+
[1m --> TIME: 2023-12-04 15:03:03 -- STEP: 10/40 -- GLOBAL_STEP: 50[0m
|
50 |
+
| > loss_text_ce: 0.023661285638809204 (0.023023789189755915)
|
51 |
+
| > loss_mel_ce: 3.8315794467926025 (3.305363488197327)
|
52 |
+
| > loss: 3.855240821838379 (3.328387236595154)
|
53 |
+
| > grad_norm: 0 (0.0)
|
54 |
+
| > current_lr: 5e-06
|
55 |
+
| > step_time: 0.2479 (0.20201985836029052)
|
56 |
+
| > loader_time: 0.0221 (0.017214274406433104)
|
57 |
+
|
58 |
+
|
59 |
+
[1m > EVALUATION [0m
|
60 |
+
|
61 |
+
|
62 |
+
[1m--> EVAL PERFORMANCE[0m
|
63 |
+
| > avg_loader_time:[91m 0.1108086109161377 [0m(+0.03885421752929688)
|
64 |
+
| > avg_loss_text_ce:[92m 0.021816403046250342 [0m(-0.00017834901809692452)
|
65 |
+
| > avg_loss_mel_ce:[92m 3.2666261196136475 [0m(-0.10966324806213379)
|
66 |
+
| > avg_loss:[92m 3.288442516326904 [0m(-0.10984158515930176)
|
67 |
+
|
68 |
+
> BEST MODEL : /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000/best_model_80.pth
|
69 |
+
|
70 |
+
[4m[1m > EPOCH: 2/8[0m
|
71 |
+
--> /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000
|
72 |
+
|
73 |
+
[1m > TRAINING (2023-12-04 15:06:18) [0m
|
74 |
+
|
75 |
+
[1m --> TIME: 2023-12-04 15:06:33 -- STEP: 20/40 -- GLOBAL_STEP: 100[0m
|
76 |
+
| > loss_text_ce: 0.017979152500629425 (0.02109259101562202)
|
77 |
+
| > loss_mel_ce: 3.1569440364837646 (2.9896609008312227)
|
78 |
+
| > loss: 3.1749231815338135 (3.0107534766197204)
|
79 |
+
| > grad_norm: 0 (0.0)
|
80 |
+
| > current_lr: 5e-06
|
81 |
+
| > step_time: 0.1982 (0.25715711116790774)
|
82 |
+
| > loader_time: 0.0208 (0.015216124057769776)
|
83 |
+
|
84 |
+
|
85 |
+
[1m > EVALUATION [0m
|
86 |
+
|
87 |
+
|
88 |
+
[1m--> EVAL PERFORMANCE[0m
|
89 |
+
| > avg_loader_time:[92m 0.06513414382934571 [0m(-0.04567446708679199)
|
90 |
+
| > avg_loss_text_ce:[92m 0.021773791685700417 [0m(-4.2611360549924676e-05)
|
91 |
+
| > avg_loss_mel_ce:[92m 3.2272082805633544 [0m(-0.03941783905029306)
|
92 |
+
| > avg_loss:[92m 3.248982048034668 [0m(-0.03946046829223615)
|
93 |
+
|
94 |
+
> BEST MODEL : /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000/best_model_120.pth
|
95 |
+
|
96 |
+
[4m[1m > EPOCH: 3/8[0m
|
97 |
+
--> /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000
|
98 |
+
|
99 |
+
[1m > TRAINING (2023-12-04 15:10:08) [0m
|
100 |
+
|
101 |
+
[1m --> TIME: 2023-12-04 15:10:26 -- STEP: 30/40 -- GLOBAL_STEP: 150[0m
|
102 |
+
| > loss_text_ce: 0.021550316363573074 (0.020829477223257224)
|
103 |
+
| > loss_mel_ce: 3.5817322731018066 (2.8207703987757364)
|
104 |
+
| > loss: 3.6032826900482178 (2.8415998578071595)
|
105 |
+
| > grad_norm: 0 (0.0)
|
106 |
+
| > current_lr: 5e-06
|
107 |
+
| > step_time: 0.2316 (0.26780527432759604)
|
108 |
+
| > loader_time: 0.0088 (0.015432175000508625)
|
109 |
+
|
110 |
+
|
111 |
+
[1m > EVALUATION [0m
|
112 |
+
|
113 |
+
|
114 |
+
[1m--> EVAL PERFORMANCE[0m
|
115 |
+
| > avg_loader_time:[91m 0.12182736396789551 [0m(+0.0566932201385498)
|
116 |
+
| > avg_loss_text_ce:[92m 0.021623440831899644 [0m(-0.00015035085380077362)
|
117 |
+
| > avg_loss_mel_ce:[92m 3.205338716506958 [0m(-0.021869564056396396)
|
118 |
+
| > avg_loss:[92m 3.226962184906006 [0m(-0.02201986312866211)
|
119 |
+
|
120 |
+
> BEST MODEL : /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000/best_model_160.pth
|
121 |
+
|
122 |
+
[4m[1m > EPOCH: 4/8[0m
|
123 |
+
--> /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000
|
124 |
+
|
125 |
+
[1m > TRAINING (2023-12-04 15:13:43) [0m
|
126 |
+
|
127 |
+
[1m > EVALUATION [0m
|
128 |
+
|
129 |
+
|
130 |
+
[1m--> EVAL PERFORMANCE[0m
|
131 |
+
| > avg_loader_time:[92m 0.06858286857604981 [0m(-0.0532444953918457)
|
132 |
+
| > avg_loss_text_ce:[92m 0.021538139879703523 [0m(-8.530095219612052e-05)
|
133 |
+
| > avg_loss_mel_ce:[92m 3.19382529258728 [0m(-0.011513423919677912)
|
134 |
+
| > avg_loss:[92m 3.2153634548187258 [0m(-0.011598730087280185)
|
135 |
+
|
136 |
+
> BEST MODEL : /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000/best_model_200.pth
|
137 |
+
|
138 |
+
[4m[1m > EPOCH: 5/8[0m
|
139 |
+
--> /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000
|
140 |
+
|
141 |
+
[1m > TRAINING (2023-12-04 15:17:08) [0m
|
142 |
+
|
143 |
+
[1m --> TIME: 2023-12-04 15:17:10 -- STEP: 0/40 -- GLOBAL_STEP: 200[0m
|
144 |
+
| > loss_text_ce: 0.023776765912771225 (0.023776765912771225)
|
145 |
+
| > loss_mel_ce: 2.0250589847564697 (2.0250589847564697)
|
146 |
+
| > loss: 2.0488357543945312 (2.0488357543945312)
|
147 |
+
| > grad_norm: 0 (0)
|
148 |
+
| > current_lr: 5e-06
|
149 |
+
| > step_time: 0.9392 (0.9391729831695557)
|
150 |
+
| > loader_time: 1.0643 (1.0642502307891846)
|
151 |
+
|
152 |
+
|
153 |
+
[1m > EVALUATION [0m
|
154 |
+
|
155 |
+
|
156 |
+
[1m--> EVAL PERFORMANCE[0m
|
157 |
+
| > avg_loader_time:[92m 0.06770339012145996 [0m(-0.0008794784545898549)
|
158 |
+
| > avg_loss_text_ce:[92m 0.02152172140777111 [0m(-1.641847193241397e-05)
|
159 |
+
| > avg_loss_mel_ce:[91m 3.21250319480896 [0m(+0.018677902221679865)
|
160 |
+
| > avg_loss:[91m 3.234024906158447 [0m(+0.018661451339721413)
|
161 |
+
|
162 |
+
|
163 |
+
[4m[1m > EPOCH: 6/8[0m
|
164 |
+
--> /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000
|
165 |
+
|
166 |
+
[1m > TRAINING (2023-12-04 15:17:31) [0m
|
167 |
+
|
168 |
+
[1m --> TIME: 2023-12-04 15:17:40 -- STEP: 10/40 -- GLOBAL_STEP: 250[0m
|
169 |
+
| > loss_text_ce: 0.018674146384000778 (0.021112211793661118)
|
170 |
+
| > loss_mel_ce: 2.7348833084106445 (2.436060166358948)
|
171 |
+
| > loss: 2.7535574436187744 (2.457172393798828)
|
172 |
+
| > grad_norm: 0 (0.0)
|
173 |
+
| > current_lr: 5e-06
|
174 |
+
| > step_time: 0.1765 (0.2836411952972412)
|
175 |
+
| > loader_time: 0.0086 (0.01687464714050293)
|
176 |
+
|
177 |
+
|
178 |
+
[1m > EVALUATION [0m
|
179 |
+
|
180 |
+
|
181 |
+
[1m--> EVAL PERFORMANCE[0m
|
182 |
+
| > avg_loader_time:[92m 0.06701068878173828 [0m(-0.0006927013397216714)
|
183 |
+
| > avg_loss_text_ce:[92m 0.021476111933588983 [0m(-4.560947418212613e-05)
|
184 |
+
| > avg_loss_mel_ce:[92m 3.206305408477783 [0m(-0.006197786331176847)
|
185 |
+
| > avg_loss:[92m 3.2277815341949463 [0m(-0.006243371963500888)
|
186 |
+
|
187 |
+
|
188 |
+
[4m[1m > EPOCH: 7/8[0m
|
189 |
+
--> /tmp/xtts_ft/run/training/GPT_XTTS_FT-December-04-2023_03+00PM-0000000
|
190 |
+
|
191 |
+
[1m > TRAINING (2023-12-04 15:17:57) [0m
|
192 |
+
|
193 |
+
[1m --> TIME: 2023-12-04 15:18:11 -- STEP: 20/40 -- GLOBAL_STEP: 300[0m
|
194 |
+
| > loss_text_ce: 0.023174753412604332 (0.019879171112552285)
|
195 |
+
| > loss_mel_ce: 3.1051435470581055 (2.4108093440532685)
|
196 |
+
| > loss: 3.1283183097839355 (2.430688518285751)
|
197 |
+
| > grad_norm: 0 (0.0)
|
198 |
+
| > current_lr: 5e-06
|
199 |
+
| > step_time: 0.27 (0.29051125049591064)
|
200 |
+
| > loader_time: 0.0138 (0.01517837047576904)
|
201 |
+
|
202 |
+
|
203 |
+
[1m > EVALUATION [0m
|
204 |
+
|
205 |
+
|
206 |
+
[1m--> EVAL PERFORMANCE[0m
|
207 |
+
| > avg_loader_time:[91m 0.11030998229980468 [0m(+0.0432992935180664)
|
208 |
+
| > avg_loss_text_ce:[91m 0.02148539908230305 [0m(+9.287148714065552e-06)
|
209 |
+
| > avg_loss_mel_ce:[91m 3.223378849029541 [0m(+0.01707344055175808)
|
210 |
+
| > avg_loss:[91m 3.244864273071289 [0m(+0.017082738876342596)
|
211 |
+
|
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|