# Page header captured together with this file (not part of the configuration):
# tmp_rc / infer_config.yaml
# Dongchao's picture
# Upload v_new
# acd6d71 verified
# Flat key/value configuration: every setting is a top-level key, there is no nesting.
# NOTE(review): the keys below mix training-style settings (n_epoch, learning_rate,
# warmup_steps, ...) with checkpoint paths; which of them the consuming code
# actually reads cannot be determined from this file alone - confirm against the loader.

# --- Seed / determinism ---
seed: 999
cudnn_deterministic: true

# --- Model selection and regularisation ---
model: diffusion_transformer_1D
# NOTE(review): `dropout_p` here and `dropout` further down are two separate keys
# with different values (0.1 vs 0.0); confirm which one each component consumes.
dropout_p: 0.1
token_dropout_p: 0.1
num_output_layer: 2
drop_path_rate: 0.0

# --- Batching / data ---
batch_size: 16
# NOTE(review): units of max_length / min_length (frames, tokens, samples?) are
# not stated in this file - TODO confirm.
max_length: 8000
min_length: 100
n_worker: 4
minibatch_debug: -1
# NOTE(review): presumably seconds - confirm against the consumer.
segment_duration: 12.0
n_epoch: 5
grad_accum: 1
fine_decoder: false

# --- Optimisation / distributed settings ---
learning_rate: 0.0001
grad_clip: 2.0
warmup_steps: 1000
data_parallel: fsdp
# Both precision settings are fp32.
mixed_precision: fp32
grad_precision: fp32
activation_checkpointing: true
weight_decay: 0.05

# --- Transformer shape ---
n_layer: 16
# n_embd / n_head = 768 / 12 = 64.
n_head: 12
n_embd: 768
dropout: 0.0
bias: false
# block_size (8192) is larger than max_length (8000) above.
# NOTE(review): whether the two are related is not visible here.
block_size: 8192
prefix_lm: false
num_codebooks: 1
num_channels: 32
# NOTE(review): `model` above is diffusion_transformer_1D while this name says
# transformer-2d; confirm the combination is intended.
unet_model_name: transformer-2d

# --- Checkpoint / resource paths ---
# All paths are absolute and share the prefix
# /turing_music_fs/music_data/ydc/exp2/reason_ckpt/.
# NOTE(review): presumably these must be adjusted when running on another machine.
transformer_diffusion_config: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/model_config.json
sq_config: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/sqcodec_config.yaml
sq_resume: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/sqcodec.pth
whisper_path: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/whisper-medium
reason_lm_path: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/audiothinker.pth
llm_path: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/Llama-3.2-3B
reconstruction_path: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/semantic.checkpoint
prompt_path: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/prompt.json
best_rq_ckpt: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/music_ssl.pt
wav_lm_path: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/wavlm

# --- Logging / checkpointing / process ---
# NOTE(review): print_freq and save_interval are presumably counted in steps - confirm.
print_freq: 100
save_interval: 5000
# Explicit null: no resume target is set.
resume: null
rank: 0