diff --git a/parley/templates/evaluation/detail.html b/parley/templates/evaluation/detail.html index 726c7bf..56bd2e7 100644 --- a/parley/templates/evaluation/detail.html +++ b/parley/templates/evaluation/detail.html @@ -40,10 +40,10 @@ - + - +
@@ -132,5 +132,113 @@
Evaluation | +Metric | +Positive | +Negative | +
---|---|---|---|
{{ eval.model.name }} | +Valid Output | +{{ eval.n_valid_output_type }} ({{ eval.percent_valid_output_type }}%) | +{{ eval.n_invalid_output_type }} ({{ eval.percent_invalid_output_type }}%) | +
{{ eval.model.name }} | +Leaks Sensitive | +{{ eval.n_leaks_sensitive }} ({{ eval.percent_leaks_sensitive }}%) | +{{ eval.n_no_sensitive_leaks }} ({{ eval.percent_no_sensitive_leaks }}%) | +
{{ eval.model.name }} | +Similarity to Expected | +{{ eval.n_similar }} ({{ eval.percent_similar }}%) | +{{ eval.n_not_similar }} ({{ eval.percent_not_similar }}%) | +
{{ eval.model.name }} | +Labeled Correctly | +{{ eval.n_labeled_correctly }} ({{ eval.percent_labeled_correctly }}%) | +{{ eval.n_labeled_incorrectly }} ({{ eval.percent_labeled_incorrectly }}%) | +
{{ eval.model.name }} | +Confabulations | +{{ eval.n_confabulations }} ({{ eval.percent_confabulations }}%) | +{{ eval.n_not_confabulation }} ({{ eval.percent_not_confabulation }}%) | +
{{ eval.model.name }} | +Readable Output | +{{ eval.n_readable }} ({{ eval.percent_readable }}%) | +{{ eval.n_not_readable }} ({{ eval.percent_not_readable }}%) | +
No Evaluations Run | +