| seed: 999 | |
| cudnn_deterministic: true | |
| model: diffusion_transformer_1D | |
| dropout_p: 0.1 | |
| token_dropout_p: 0.1 | |
| num_output_layer: 2 | |
| drop_path_rate: 0.0 | |
| batch_size: 16 | |
| max_length: 8000 | |
| min_length: 100 | |
| n_worker: 4 | |
| minibatch_debug: -1 | |
| segment_duration: 12.0 | |
| n_epoch: 5 | |
| grad_accum: 1 | |
| fine_decoder: false | |
| learning_rate: 0.0001 | |
| grad_clip: 2.0 | |
| warmup_steps: 1000 | |
| data_parallel: fsdp | |
| mixed_precision: fp32 | |
| grad_precision: fp32 | |
| activation_checkpointing: true | |
| weight_decay: 0.05 | |
| n_layer: 16 | |
| n_head: 12 | |
| n_embd: 768 | |
| dropout: 0.0 | |
| bias: false | |
| block_size: 8192 | |
| prefix_lm: false | |
| num_codebooks: 1 | |
| num_channels: 32 | |
| unet_model_name: transformer-2d | |
| transformer_diffusion_config: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/model_config.json | |
| sq_config: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/sqcodec_config.yaml | |
| sq_resume: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/sqcodec.pth | |
| whisper_path: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/whisper-medium | |
| reason_lm_path: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/audiothinker.pth | |
| llm_path: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/Llama-3.2-3B | |
| reconstruction_path: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/semantic.checkpoint | |
| prompt_path: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/prompt.json | |
| best_rq_ckpt: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/music_ssl.pt | |
| wav_lm_path: /turing_music_fs/music_data/ydc/exp2/reason_ckpt/wavlm | |
| print_freq: 100 | |
| save_interval: 5000 | |
| resume: null | |
| rank: 0 | |