Spaces:
Runtime error
Runtime error
shlomihod
committed on
Commit
·
afd9d5d
1
Parent(s):
8b90d81
improve captions
Browse files
app.py
CHANGED
@@ -916,12 +916,19 @@ def main():
|
|
916 |
st.metric("MCC", f"{evaluation['mcc']:.2f}")
|
917 |
|
918 |
st.markdown("## Detailed Evaluation")
|
|
|
|
|
|
|
|
|
|
|
919 |
st.caption(
|
920 |
-
"A
|
921 |
-
"
|
922 |
-
" A hit is a correct inference (*inference* is the same as *annotation*), a miss is an incorrect inference (otherwise)."
|
923 |
-
" If the inference could not be determined based on the model output, the *inference* is 'unknown'."
|
924 |
)
|
|
|
|
|
|
|
|
|
925 |
st.dataframe(evaluation["hit_miss"])
|
926 |
|
927 |
with st.expander("Additional Information", expanded=False):
|
|
|
916 |
st.metric("MCC", f"{evaluation['mcc']:.2f}")
|
917 |
|
918 |
st.markdown("## Detailed Evaluation")
|
919 |
+
|
920 |
+
st.caption(
|
921 |
+
"This table showcases all examples (input and output pairs) that were leveraged for the evaluation of the prompt template with the model (for instance, accuracy)."
|
922 |
+
" It comprises the input placeholder values, the unmodified model *output*, the deduced *inference*, and the ground-truth *annotation*."
|
923 |
+
)
|
924 |
st.caption(
|
925 |
+
"A 'hit' signifies a correct inference (when *inference* coincides with *annotation*), while a 'miss' denotes an incorrect inference."
|
926 |
+
" If the *inference* cannot be determined based on the model output, it is labeled as 'unknown'."
|
|
|
|
|
927 |
)
|
928 |
+
st.caption(
|
929 |
+
"The *prompt* column features the complete prompt that the model was prompted to complete, i.e., your prompt template filled with the input placeholders you have used."
|
930 |
+
)
|
931 |
+
|
932 |
st.dataframe(evaluation["hit_miss"])
|
933 |
|
934 |
with st.expander("Additional Information", expanded=False):
|