Elad1 / training_log.json
erave02's picture
Upload folder using huggingface_hub
09156d5
raw
history blame contribute delete
No virus
459 Bytes
{
"base_model_name": "lmsys_vicuna-13b-v1.5",
"base_model_class": "LlamaForCausalLM",
"base_loaded_in_4bit": true,
"base_loaded_in_8bit": false,
"projections": "q, v",
"loss": 1.5336,
"learning_rate": 2.553191489361702e-05,
"epoch": 2.99,
"current_steps": 1629,
"train_runtime": 11129.9267,
"train_samples_per_second": 0.587,
"train_steps_per_second": 0.005,
"total_flos": 1.2901151682330624e+17,
"train_loss": 1.7797385243808521
}