# File size: 1,617 Bytes
# 9552c2b (presumably the revision id shown by the file viewer)
---
# Video fine-tuning run configuration.
#
# Structure note: `width` and `height` appear under both `train_data` and
# `validation_data`, so these two sections must remain separate nested
# mappings. Flattening them to the top level yields duplicate keys and an
# unparseable multi-line prompt.

pretrained_model_path: checkpoints/CompVis/stable-diffusion-v1-4
output_dir: /home/user/app/experiments/talking-man

train_data:
  # NOTE(review): the path lives under /tmp/gradio - presumably a transient
  # upload; confirm the file still exists before re-running with this config.
  # Quoted because the file name contains a space.
  video_path: '/tmp/gradio/f79f070ba10b1b7872faa157ada00e09644ef2f2/Untitled Video.mp4'
  # Folded scalar: line breaks below are joined with single spaces and no
  # trailing newline is added, so the value is one single-line string.
  prompt: >-
    A person of East Asian ethnicity standing in a well-lit office environment
    with large windows, speaking directly to the camera, wearing a white shirt, and
    conveying a calm and professional demeanor. The background is slightly blurred,
    showcasing greenery and modern office decor, with minimal distractions
  n_sample_frames: 8
  width: 512
  height: 512
  sample_start_idx: 0
  sample_frame_rate: 1

validation_data:
  # A list, even though it currently holds a single prompt.
  prompts:
    - >-
      A person of East Asian descent is standing in a bright office setting with large
      windows, addressing the camera directly. They are dressed in a white shirt and
      project a calm, professional demeanor. The background is slightly out of focus,
      highlighting greenery and modern office furnishings, with minimal visual distractions
  # Same value as train_data.n_sample_frames (8).
  video_length: 8
  width: 512
  height: 512
  num_inference_steps: 50
  guidance_scale: 7.5

validation_steps: 100

trainable_modules:
  - attn1.to_q
  - attn2.to_q
  - attn_temp

train_batch_size: 1
max_train_steps: 300
learning_rate: 3.5e-05
scale_lr: false
lr_scheduler: constant
lr_warmup_steps: 0

adam_beta1: 0.9
adam_beta2: 0.999
adam_weight_decay: 0.01
adam_epsilon: 1.0e-08
max_grad_norm: 1.0

gradient_accumulation_steps: 1
gradient_checkpointing: true
# NOTE(review): checkpointing_steps (1000) is larger than max_train_steps
# (300). If checkpoints are written every `checkpointing_steps` steps, none
# would be saved mid-run - confirm this is intended.
checkpointing_steps: 1000
resume_from_checkpoint: null

mixed_precision: fp16
use_8bit_adam: false
enable_xformers_memory_efficient_attention: true
seed: 31118
...