Spaces:
Sleeping
Sleeping
Upload 2 files
Browse files
- app.py +8 -9
- evaluation.py +1 -1
app.py
CHANGED
@@ -144,8 +144,8 @@ st.text_area("Generated Response:", value=st.session_state.response, height=150,
|
|
144 |
col1, col2 = st.columns([1, 3]) # Creating two columns for button and metrics display
|
145 |
|
146 |
# Calculate Metrics Button
|
147 |
-
|
148 |
-
|
149 |
st.session_state.metrics = calculate_metrics(question, st.session_state.query_dataset, st.session_state.response, st.session_state.retrieved_documents, st.session_state.time_taken_for_response)
|
150 |
for q in st.session_state.recent_questions:
|
151 |
if q["question"] == st.session_state.last_question:
|
@@ -153,13 +153,12 @@ if st.button("Show Metrics"):
|
|
153 |
|
154 |
# Save updated data to file
|
155 |
save_recent_questions(st.session_state.recent_questions)
|
156 |
-
|
157 |
-
|
158 |
-
|
159 |
-
|
160 |
-
|
161 |
-
|
162 |
-
st.text_area("Metrics:", value=metrics_, height=100, disabled=True)
|
163 |
|
164 |
|
165 |
|
|
|
144 |
col1, col2 = st.columns([1, 3]) # Creating two columns for button and metrics display
|
145 |
|
146 |
# Calculate Metrics Button
|
147 |
+
with col1:
|
148 |
+
if st.button("Show Metrics"):
|
149 |
st.session_state.metrics = calculate_metrics(question, st.session_state.query_dataset, st.session_state.response, st.session_state.retrieved_documents, st.session_state.time_taken_for_response)
|
150 |
for q in st.session_state.recent_questions:
|
151 |
if q["question"] == st.session_state.last_question:
|
|
|
153 |
|
154 |
# Save updated data to file
|
155 |
save_recent_questions(st.session_state.recent_questions)
|
156 |
+
with col2:
|
157 |
+
if st.session_state.metrics is not None:
|
158 |
+
metrics_ = st.session_state.metrics
|
159 |
+
else:
|
160 |
+
metrics_ ={}
|
161 |
+
st.json(metrics_)
|
|
|
162 |
|
163 |
|
164 |
|
evaluation.py
CHANGED
@@ -113,7 +113,7 @@ def calculate_metrics(question, q_dataset, response, docs, time_taken):
|
|
113 |
|
114 |
metrics = {
|
115 |
"RMSE": rmse,
|
116 |
-
"
|
117 |
"response_time": time_taken,
|
118 |
"ground_truth": ground_truth_answer,
|
119 |
"RAG_model_response": response,
|
|
|
113 |
|
114 |
metrics = {
|
115 |
"RMSE": rmse,
|
116 |
+
"predicted_metrics":predicted_metrics,
|
117 |
"response_time": time_taken,
|
118 |
"ground_truth": ground_truth_answer,
|
119 |
"RAG_model_response": response,
|