shlomihod committed on
Commit
afd9d5d
·
1 Parent(s): 8b90d81

improve captions

Browse files
Files changed (1) hide show
  1. app.py +11 -4
app.py CHANGED
@@ -916,12 +916,19 @@ def main():
916
  st.metric("MCC", f"{evaluation['mcc']:.2f}")
917
 
918
  st.markdown("## Detailed Evaluation")
 
 
 
 
 
919
  st.caption(
920
- "A table of all examples (input and output pairs) used to evaluate the prompt template with the model (e.g., accuracy)."
921
- " It consists of the input placeholder values, the model *output* as-is, the *inference*, and the 'ground-truth' *annotation*."
922
- " A hit is a correct inference (*inference* is the same as *annotation*), a miss is an incorrect inference (otherwise)."
923
- " If the inference could not be determined based on the model output, the *inference* is 'unknown'."
924
  )
 
 
 
 
925
  st.dataframe(evaluation["hit_miss"])
926
 
927
  with st.expander("Additional Information", expanded=False):
 
916
  st.metric("MCC", f"{evaluation['mcc']:.2f}")
917
 
918
  st.markdown("## Detailed Evaluation")
919
+
920
+ st.caption(
921
+ "This table showcases all examples (input and output pairs) that were leveraged for the evaluation of the prompt template with the model (for instance, accuracy)."
922
+ " It comprises the input placeholder values, the unmodified model *output*, the deduced *inference*, and the ground-truth *annotation*."
923
+ )
924
  st.caption(
925
+ "A 'hit' signifies a correct inference (when *inference* coincides with *annotation*), while a 'miss' denotes an incorrect inference."
926
+ " If the *inference* cannot be determined based on the model output, it is labeled as 'unknown'."
 
 
927
  )
928
+ st.caption(
929
+ "The *prompt* column features the complete prompt that the model was prompted to complete, i.e., your prompt template filled with the input placeholders you have used."
930
+ )
931
+
932
  st.dataframe(evaluation["hit_miss"])
933
 
934
  with st.expander("Additional Information", expanded=False):