run_id	topic_id	metric	value
ag_sel_new_prompt	1001	sentence_support_opt	0.8181818181818182
ag_sel_new_prompt	1001	sentence_support_pes	0.8181818181818182
ag_sel_new_prompt	1001	sentence_support_llmfilled	0.8181818181818182
ag_sel_new_prompt	1001	nugget_mentioned	0.45
ag_sel_new_prompt	1001	nugget_coverage	0.3
ag_sel_new_prompt	1003	sentence_support_opt	0.375
ag_sel_new_prompt	1003	sentence_support_pes	0.375
ag_sel_new_prompt	1003	sentence_support_llmfilled	0.375
ag_sel_new_prompt	1003	nugget_mentioned	0.2
ag_sel_new_prompt	1003	nugget_coverage	0.15
ag_sel_new_prompt	1005	sentence_support_opt	1.0
ag_sel_new_prompt	1005	sentence_support_pes	0.0
ag_sel_new_prompt	1005	sentence_support_llmfilled	0.0
ag_sel_new_prompt	1005	nugget_mentioned	0.4
ag_sel_new_prompt	1005	nugget_coverage	0.0
ag_sel_new_prompt	1007	sentence_support_opt	0.1111111111111111
ag_sel_new_prompt	1007	sentence_support_pes	0.1111111111111111
ag_sel_new_prompt	1007	sentence_support_llmfilled	0.1111111111111111
ag_sel_new_prompt	1007	nugget_mentioned	0.631578947368421
ag_sel_new_prompt	1007	nugget_coverage	0.21052631578947367
ag_sel_new_prompt	1009	sentence_support_opt	0.7333333333333333
ag_sel_new_prompt	1009	sentence_support_pes	0.06666666666666667
ag_sel_new_prompt	1009	sentence_support_llmfilled	0.06666666666666667
ag_sel_new_prompt	1009	nugget_mentioned	0.6666666666666666
ag_sel_new_prompt	1009	nugget_coverage	0.08333333333333333
ag_sel_new_prompt	1011	sentence_support_opt	0.35714285714285715
ag_sel_new_prompt	1011	sentence_support_pes	0.35714285714285715
ag_sel_new_prompt	1011	sentence_support_llmfilled	0.35714285714285715
ag_sel_new_prompt	1011	nugget_mentioned	0.3684210526315789
ag_sel_new_prompt	1011	nugget_coverage	0.15789473684210525
ag_sel_new_prompt	1013	sentence_support_opt	0.4
ag_sel_new_prompt	1013	sentence_support_pes	0.2
ag_sel_new_prompt	1013	sentence_support_llmfilled	0.2
ag_sel_new_prompt	1013	nugget_mentioned	0.4375
ag_sel_new_prompt	1013	nugget_coverage	0.125
ag_sel_new_prompt	1015	sentence_support_opt	0.3333333333333333
ag_sel_new_prompt	1015	sentence_support_pes	0.3333333333333333
ag_sel_new_prompt	1015	sentence_support_llmfilled	0.3333333333333333
ag_sel_new_prompt	1015	nugget_mentioned	0.16666666666666666
ag_sel_new_prompt	1015	nugget_coverage	0.08333333333333333
ag_sel_new_prompt	1017	sentence_support_opt	0.3333333333333333
ag_sel_new_prompt	1017	sentence_support_pes	0.16666666666666666
ag_sel_new_prompt	1017	sentence_support_llmfilled	0.16666666666666666
ag_sel_new_prompt	1017	nugget_mentioned	0.2
ag_sel_new_prompt	1017	nugget_coverage	0.0
ag_sel_new_prompt	1019	sentence_support_opt	0.5384615384615384
ag_sel_new_prompt	1019	sentence_support_pes	0.3076923076923077
ag_sel_new_prompt	1019	sentence_support_llmfilled	0.3076923076923077
ag_sel_new_prompt	1019	nugget_mentioned	0.3125
ag_sel_new_prompt	1019	nugget_coverage	0.1875
ag_sel_new_prompt	1021	sentence_support_opt	1.0
ag_sel_new_prompt	1021	sentence_support_pes	0.0
ag_sel_new_prompt	1021	sentence_support_llmfilled	0.0
ag_sel_new_prompt	1021	nugget_mentioned	0.17647058823529413
ag_sel_new_prompt	1021	nugget_coverage	0.0
ag_sel_new_prompt	1023	sentence_support_opt	0.6666666666666666
ag_sel_new_prompt	1023	sentence_support_pes	0.13333333333333333
ag_sel_new_prompt	1023	sentence_support_llmfilled	0.13333333333333333
ag_sel_new_prompt	1023	nugget_mentioned	0.10526315789473684
ag_sel_new_prompt	1023	nugget_coverage	0.0
ag_sel_new_prompt	1025	sentence_support_opt	0.5294117647058824
ag_sel_new_prompt	1025	sentence_support_pes	0.5294117647058824
ag_sel_new_prompt	1025	sentence_support_llmfilled	0.5294117647058824
ag_sel_new_prompt	1025	nugget_mentioned	0.7777777777777778
ag_sel_new_prompt	1025	nugget_coverage	0.5555555555555556
ag_sel_new_prompt	1027	sentence_support_opt	1.0
ag_sel_new_prompt	1027	sentence_support_pes	0.0
ag_sel_new_prompt	1027	sentence_support_llmfilled	0.0
ag_sel_new_prompt	1027	nugget_mentioned	0.5
ag_sel_new_prompt	1027	nugget_coverage	0.0
ag_sel_new_prompt	1029	sentence_support_opt	0.7
ag_sel_new_prompt	1029	sentence_support_pes	0.3
ag_sel_new_prompt	1029	sentence_support_llmfilled	0.3
ag_sel_new_prompt	1029	nugget_mentioned	0.3
ag_sel_new_prompt	1029	nugget_coverage	0.25
ag_sel_new_prompt	1031	sentence_support_opt	0.875
ag_sel_new_prompt	1031	sentence_support_pes	0.1875
ag_sel_new_prompt	1031	sentence_support_llmfilled	0.1875
ag_sel_new_prompt	1031	nugget_mentioned	0.15
ag_sel_new_prompt	1031	nugget_coverage	0.0
ag_sel_new_prompt	1033	sentence_support_opt	0.7272727272727273
ag_sel_new_prompt	1033	sentence_support_pes	0.36363636363636365
ag_sel_new_prompt	1033	sentence_support_llmfilled	0.36363636363636365
ag_sel_new_prompt	1033	nugget_mentioned	0.2631578947368421
ag_sel_new_prompt	1033	nugget_coverage	0.05263157894736842
ag_sel_new_prompt	1035	sentence_support_opt	0.2857142857142857
ag_sel_new_prompt	1035	sentence_support_pes	0.2857142857142857
ag_sel_new_prompt	1035	sentence_support_llmfilled	0.2857142857142857
ag_sel_new_prompt	1035	nugget_mentioned	0.0
ag_sel_new_prompt	1035	nugget_coverage	0.0
ag_sel_new_prompt	1037	sentence_support_opt	0.5
ag_sel_new_prompt	1037	sentence_support_pes	0.5
ag_sel_new_prompt	1037	sentence_support_llmfilled	0.5
ag_sel_new_prompt	1037	nugget_mentioned	0.3333333333333333
ag_sel_new_prompt	1037	nugget_coverage	0.06666666666666667
ag_sel_new_prompt	1039	sentence_support_opt	1.0
ag_sel_new_prompt	1039	sentence_support_pes	0.0
ag_sel_new_prompt	1039	sentence_support_llmfilled	0.0
ag_sel_new_prompt	1039	nugget_mentioned	0.4
ag_sel_new_prompt	1039	nugget_coverage	0.0
ag_sel_new_prompt	1041	sentence_support_opt	1.0
ag_sel_new_prompt	1041	sentence_support_pes	0.08333333333333333
ag_sel_new_prompt	1041	sentence_support_llmfilled	0.08333333333333333
ag_sel_new_prompt	1041	nugget_mentioned	0.2777777777777778
ag_sel_new_prompt	1041	nugget_coverage	0.05555555555555555
ag_sel_new_prompt	1047	sentence_support_opt	0.2727272727272727
ag_sel_new_prompt	1047	sentence_support_pes	0.18181818181818182
ag_sel_new_prompt	1047	sentence_support_llmfilled	0.18181818181818182
ag_sel_new_prompt	1047	nugget_mentioned	0.35294117647058826
ag_sel_new_prompt	1047	nugget_coverage	0.11764705882352941
ag_sel_new_prompt	1053	sentence_support_opt	0.5833333333333334
ag_sel_new_prompt	1053	sentence_support_pes	0.25
ag_sel_new_prompt	1053	sentence_support_llmfilled	0.25
ag_sel_new_prompt	1053	nugget_mentioned	0.5833333333333334
ag_sel_new_prompt	1053	nugget_coverage	0.08333333333333333
ag_sel_new_prompt	1055	sentence_support_opt	0.3
ag_sel_new_prompt	1055	sentence_support_pes	0.3
ag_sel_new_prompt	1055	sentence_support_llmfilled	0.3
ag_sel_new_prompt	1055	nugget_mentioned	0.125
ag_sel_new_prompt	1055	nugget_coverage	0.125
ag_sel_new_prompt	1065	sentence_support_opt	0.18181818181818182
ag_sel_new_prompt	1065	sentence_support_pes	0.18181818181818182
ag_sel_new_prompt	1065	sentence_support_llmfilled	0.18181818181818182
ag_sel_new_prompt	1065	nugget_mentioned	0.25
ag_sel_new_prompt	1065	nugget_coverage	0.05
ag_sel_new_prompt	1067	sentence_support_opt	0.7142857142857143
ag_sel_new_prompt	1067	sentence_support_pes	0.07142857142857142
ag_sel_new_prompt	1067	sentence_support_llmfilled	0.07142857142857142
ag_sel_new_prompt	1067	nugget_mentioned	0.2
ag_sel_new_prompt	1067	nugget_coverage	0.05
ag_sel_new_prompt	1069	sentence_support_opt	0.0
ag_sel_new_prompt	1069	sentence_support_pes	0.0
ag_sel_new_prompt	1069	sentence_support_llmfilled	0.0
ag_sel_new_prompt	1069	nugget_mentioned	0.0
ag_sel_new_prompt	1069	nugget_coverage	0.0
ag_sel_new_prompt	1075	sentence_support_opt	0.42857142857142855
ag_sel_new_prompt	1075	sentence_support_pes	0.42857142857142855
ag_sel_new_prompt	1075	sentence_support_llmfilled	0.42857142857142855
ag_sel_new_prompt	1075	nugget_mentioned	0.1875
ag_sel_new_prompt	1075	nugget_coverage	0.125
ag_sel_new_prompt	1077	sentence_support_opt	0.8
ag_sel_new_prompt	1077	sentence_support_pes	0.8
ag_sel_new_prompt	1077	sentence_support_llmfilled	0.8
ag_sel_new_prompt	1077	nugget_mentioned	0.2
ag_sel_new_prompt	1077	nugget_coverage	0.15
ag_sel_new_prompt	1079	sentence_support_opt	0.4166666666666667
ag_sel_new_prompt	1079	sentence_support_pes	0.3333333333333333
ag_sel_new_prompt	1079	sentence_support_llmfilled	0.3333333333333333
ag_sel_new_prompt	1079	nugget_mentioned	0.1
ag_sel_new_prompt	1079	nugget_coverage	0.1
ag_sel_new_prompt	1081	sentence_support_opt	0.5
ag_sel_new_prompt	1081	sentence_support_pes	0.3333333333333333
ag_sel_new_prompt	1081	sentence_support_llmfilled	0.3333333333333333
ag_sel_new_prompt	1081	nugget_mentioned	0.6666666666666666
ag_sel_new_prompt	1081	nugget_coverage	0.5833333333333334
ag_sel_new_prompt	1083	sentence_support_opt	0.4444444444444444
ag_sel_new_prompt	1083	sentence_support_pes	0.4444444444444444
ag_sel_new_prompt	1083	sentence_support_llmfilled	0.4444444444444444
ag_sel_new_prompt	1083	nugget_mentioned	0.5454545454545454
ag_sel_new_prompt	1083	nugget_coverage	0.45454545454545453
ag_sel_new_prompt	1085	sentence_support_opt	0.46153846153846156
ag_sel_new_prompt	1085	sentence_support_pes	0.46153846153846156
ag_sel_new_prompt	1085	sentence_support_llmfilled	0.46153846153846156
ag_sel_new_prompt	1085	nugget_mentioned	0.16666666666666666
ag_sel_new_prompt	1085	nugget_coverage	0.1111111111111111
ag_sel_new_prompt	1087	sentence_support_opt	0.4
ag_sel_new_prompt	1087	sentence_support_pes	0.4
ag_sel_new_prompt	1087	sentence_support_llmfilled	0.4
ag_sel_new_prompt	1087	nugget_mentioned	0.5833333333333334
ag_sel_new_prompt	1087	nugget_coverage	0.16666666666666666
ag_sel_new_prompt	all	sentence_support_opt	0.5525690668424231
ag_sel_new_prompt	all	sentence_support_pes	0.2736767581707028
ag_sel_new_prompt	all	sentence_support_llmfilled	0.27367675817070275
ag_sel_new_prompt	all	nugget_mentioned	0.3258238113239479
ag_sel_new_prompt	all	nugget_coverage	0.1292539421716712
