falcon-7b-JonathanSwift / training_log.json
pcalhoun's picture
Upload 5 files
8244c3f
raw
history blame contribute delete
419 Bytes
{
"base_model_name": "tiiuae_falcon-7b",
"base_model_class": "RWForCausalLM",
"base_loaded_in_4bit": true,
"base_loaded_in_8bit": false,
"loss": 2.0208,
"learning_rate": 0.0002222222222222222,
"epoch": 0.99,
"current_steps": 103,
"train_runtime": 443.7855,
"train_samples_per_second": 0.946,
"train_steps_per_second": 0.029,
"total_flos": 8516655881650176.0,
"train_loss": 2.0475152272444506
}