lmg-lora / training_log.json
llama-anon's picture
Upload 5 files
c9497dc
raw
history blame contribute delete
449 Bytes
{
"base_model_name": "Llama2-13B-GPTQ",
"base_model_class": "LlamaForCausalLM",
"base_loaded_in_4bit": false,
"base_loaded_in_8bit": false,
"projections": "q, v",
"loss": 1.7585,
"learning_rate": 1.333858168224178e-07,
"epoch": 0.99,
"current_steps": 2879,
"train_runtime": 2372.2653,
"train_samples_per_second": 2.461,
"train_steps_per_second": 0.019,
"total_flos": 2380933575475200.0,
"train_loss": 1.8855021370781793
}