Climate-Education-QA-Chatbot / comprehensive_results.json
Climi's picture
upload everything about the climate education chatbot
74b76c0 verified
{
"experiment_info": {
"name": "Climate Education Chatbot - Optimal Model",
"version": "Experiment 4c - Balanced",
"description": "Best performing model across all experiments",
"timestamp": "2025-06-17T00:58:29.482424"
},
"model_performance": {
"training_loss": 0.5757,
"validation_loss": 0.8844,
"bleu_score": 0.0549,
"average_generation_time": 17.3,
"performance_grade": "OPTIMAL"
},
"experiment_progression": {
"baseline": {
"learning_rate": 2e-05,
"batch_size": 16,
"epochs": 5,
"train_loss": 9.04,
"val_loss": 9.79,
"bleu": 0.0001,
"notes": "Severe underfitting"
},
"experiment_2": {
"learning_rate": 0.0005,
"batch_size": 8,
"epochs": 10,
"train_loss": 0.93,
"val_loss": 0.93,
"bleu": 0.0012,
"notes": "Major leap in text quality"
},
"experiment_3": {
"learning_rate": 0.0003,
"batch_size": 4,
"epochs": 15,
"train_loss": 1.2623,
"val_loss": 1.3637,
"bleu": 0.0392,
"notes": "Smooth fluency; minor factual errors"
},
"experiment_4": {
"learning_rate": 0.0001,
"batch_size": 8,
"epochs": 20,
"train_loss": 0.5757,
"val_loss": 0.8844,
"bleu": 0.0392,
"notes": "Best factual grounding, improved conciseness"
},
"experiment_4b": {
"description": "Speed-up variant",
"bleu": 0.034,
"generation_time": 16.7,
"notes": "Speed-up variant; less repetition but BLEU dropped"
},
"experiment_4c": {
"description": "OPTIMAL - Balanced version",
"bleu": 0.0549,
"generation_time": 17.3,
"notes": "BEST: Stable quality + fast generation"
}
},
"optimal_parameters": {
"max_length": 70,
"min_length": 18,
"temperature": 0.5,
"top_p": 0.8,
"top_k": 40,
"repetition_penalty": 2.0,
"no_repeat_ngram_size": 3,
"num_beams": 1
},
"dataset_info": {
"training_samples": 60,
"validation_samples": 13,
"test_samples": 13,
"domain": "Climate Education",
"model_type": "T5-small generative QA"
},
"achievements": [
"93% reduction in training loss (9.04 \u2192 0.5757)",
"549x improvement in BLEU score (0.0001 \u2192 0.0549)",
"30% speed improvement from baseline",
"Balanced quality and performance",
"Functional interactive chatbot"
]
}