{
  "dfloat11_config": {
    "version": "0.5.0",
    "threads_per_block": [
      512
    ],
    "bytes_per_thread": 8,
    "pattern_dict": {
      "model\\.visual\\.blocks\\.\\d+": [
        "attn.qkv",
        "attn.proj",
        "mlp.linear_fc1",
        "mlp.linear_fc2"
      ],
      "model\\.visual\\.merger": [
        "linear_fc1",
        "linear_fc2"
      ],
      "model\\.visual\\.deepstack_merger_list\\.\\d+": [
        "linear_fc1",
        "linear_fc2"
      ],
      "model\\.language_model\\.embed_tokens": [],
      "model\\.language_model\\.layers\\.\\d+": [
        "self_attn.q_proj",
        "self_attn.k_proj",
        "self_attn.v_proj",
        "self_attn.o_proj",
        "mlp.gate_proj",
        "mlp.up_proj",
        "mlp.down_proj"
      ],
      "lm_head": []
    }
  }
}