run_id	request_id	metric	value
gptr_ka_q3d3_natv	all	sentences	142.0
gptr_ka_q3d3_natv	all	sentences_with_citations_or_requiring_citations	142.0
gptr_ka_q3d3_natv	all	correctly_cited_sentences	113.0
gptr_ka_q3d3_natv	all	first_instance_sentences_missing_citation	3.0
gptr_ka_q3d3_natv	all	nuggets	815.0
gptr_ka_q3d3_natv	all	nuggets_weighted	477.0
gptr_ka_q3d3_natv	all	correct_nuggets	216.0
gptr_ka_q3d3_natv	all	correct_nuggets_weighted	144.0
gptr_ka_q3d3_natv	all	citations	139.0
gptr_ka_q3d3_natv	all	relevant_citations	71.0
gptr_ka_q3d3_natv	all	supporting_citations	113.0
gptr_ka_q3d3_natv	all	character_count_median	1564.0
gptr_ka_q3d3_natv	all	character_count_max	1882.0
gptr_ka_q3d3_natv	all	citation_relevance_micro	0.5107913669064749
gptr_ka_q3d3_natv	all	citation_relevance_macro	0.5131200396825397
gptr_ka_q3d3_natv	all	citation_support_micro	0.8129496402877698
gptr_ka_q3d3_natv	all	citation_support_macro	0.8138392857142858
gptr_ka_q3d3_natv	all	sentence_support_micro	0.795774647887324
gptr_ka_q3d3_natv	all	sentence_support_macro	0.8006200396825397
gptr_ka_q3d3_natv	all	nugget_coverage_micro	0.2650306748466258
gptr_ka_q3d3_natv	all	nugget_coverage_macro	0.3406706829806848
gptr_ka_q3d3_natv	all	nugget_coverage_weighted_micro	0.3018867924528302
gptr_ka_q3d3_natv	all	nugget_coverage_weighted_macro	0.37470074911415985
gptr_ka_q3d3_natv	all	f1_micro	0.3976312852802464
gptr_ka_q3d3_natv	all	f1_macro	0.45656958655527785
gptr_ka_q3d3_natv	all	f1_weighted_micro	0.43771940443045637
gptr_ka_q3d3_natv	all	f1_weighted_macro	0.4588700220310734
gptr_ka_q3d3_natv	1001	sentences	10.0
gptr_ka_q3d3_natv	1001	character_count	1516.0
gptr_ka_q3d3_natv	1001	sentences_with_citations_or_requiring_citations	10.0
gptr_ka_q3d3_natv	1001	correctly_cited_sentences	9.0
gptr_ka_q3d3_natv	1001	nuggets	101.0
gptr_ka_q3d3_natv	1001	nuggets_weighted	110.0
gptr_ka_q3d3_natv	1001	correct_nuggets	32.0
gptr_ka_q3d3_natv	1001	correct_nuggets_weighted	34.0
gptr_ka_q3d3_natv	1001	citations	10.0
gptr_ka_q3d3_natv	1001	relevant_citations	3.0
gptr_ka_q3d3_natv	1001	supporting_citations	9.0
gptr_ka_q3d3_natv	1001	citation_relevance	0.3
gptr_ka_q3d3_natv	1001	citation_support	0.9
gptr_ka_q3d3_natv	1001	sentence_support	0.9
gptr_ka_q3d3_natv	1001	nugget_coverage	0.31683168316831684
gptr_ka_q3d3_natv	1001	nugget_coverage_weighted	0.3090909090909091
gptr_ka_q3d3_natv	1001	f1	0.4686737184703011
gptr_ka_q3d3_natv	1001	f1_weighted	0.4601503759398497
gptr_ka_q3d3_natv	1003	sentences	9.0
gptr_ka_q3d3_natv	1003	character_count	1833.0
gptr_ka_q3d3_natv	1003	sentences_with_citations_or_requiring_citations	9.0
gptr_ka_q3d3_natv	1003	correctly_cited_sentences	7.0
gptr_ka_q3d3_natv	1003	nuggets	103.0
gptr_ka_q3d3_natv	1003	nuggets_weighted	26.0
gptr_ka_q3d3_natv	1003	correct_nuggets	21.0
gptr_ka_q3d3_natv	1003	correct_nuggets_weighted	6.0
gptr_ka_q3d3_natv	1003	citations	9.0
gptr_ka_q3d3_natv	1003	relevant_citations	4.0
gptr_ka_q3d3_natv	1003	supporting_citations	7.0
gptr_ka_q3d3_natv	1003	citation_relevance	0.4444444444444444
gptr_ka_q3d3_natv	1003	citation_support	0.7777777777777778
gptr_ka_q3d3_natv	1003	sentence_support	0.7777777777777778
gptr_ka_q3d3_natv	1003	nugget_coverage	0.20388349514563106
gptr_ka_q3d3_natv	1003	nugget_coverage_weighted	0.23076923076923078
gptr_ka_q3d3_natv	1003	f1	0.3230769230769231
gptr_ka_q3d3_natv	1003	f1_weighted	0.3559322033898305
gptr_ka_q3d3_natv	1005	sentences	9.0
gptr_ka_q3d3_natv	1005	character_count	1647.0
gptr_ka_q3d3_natv	1005	sentences_with_citations_or_requiring_citations	9.0
gptr_ka_q3d3_natv	1005	correctly_cited_sentences	8.0
gptr_ka_q3d3_natv	1005	nuggets	111.0
gptr_ka_q3d3_natv	1005	nuggets_weighted	32.0
gptr_ka_q3d3_natv	1005	correct_nuggets	20.0
gptr_ka_q3d3_natv	1005	correct_nuggets_weighted	2.0
gptr_ka_q3d3_natv	1005	citations	9.0
gptr_ka_q3d3_natv	1005	relevant_citations	5.0
gptr_ka_q3d3_natv	1005	supporting_citations	8.0
gptr_ka_q3d3_natv	1005	citation_relevance	0.5555555555555556
gptr_ka_q3d3_natv	1005	citation_support	0.8888888888888888
gptr_ka_q3d3_natv	1005	sentence_support	0.8888888888888888
gptr_ka_q3d3_natv	1005	nugget_coverage	0.18018018018018017
gptr_ka_q3d3_natv	1005	nugget_coverage_weighted	0.0625
gptr_ka_q3d3_natv	1005	f1	0.29962546816479396
gptr_ka_q3d3_natv	1005	f1_weighted	0.11678832116788321
gptr_ka_q3d3_natv	1007	sentences	8.0
gptr_ka_q3d3_natv	1007	character_count	1258.0
gptr_ka_q3d3_natv	1007	sentences_with_citations_or_requiring_citations	8.0
gptr_ka_q3d3_natv	1007	correctly_cited_sentences	5.0
gptr_ka_q3d3_natv	1007	first_instance_sentences_missing_citation	1.0
gptr_ka_q3d3_natv	1007	nuggets	22.0
gptr_ka_q3d3_natv	1007	nuggets_weighted	6.0
gptr_ka_q3d3_natv	1007	correct_nuggets	8.0
gptr_ka_q3d3_natv	1007	correct_nuggets_weighted	2.0
gptr_ka_q3d3_natv	1007	citations	7.0
gptr_ka_q3d3_natv	1007	relevant_citations	7.0
gptr_ka_q3d3_natv	1007	supporting_citations	5.0
gptr_ka_q3d3_natv	1007	citation_relevance	1.0
gptr_ka_q3d3_natv	1007	citation_support	0.7142857142857143
gptr_ka_q3d3_natv	1007	sentence_support	0.625
gptr_ka_q3d3_natv	1007	nugget_coverage	0.36363636363636365
gptr_ka_q3d3_natv	1007	nugget_coverage_weighted	0.3333333333333333
gptr_ka_q3d3_natv	1007	f1	0.4597701149425288
gptr_ka_q3d3_natv	1007	f1_weighted	0.43478260869565216
gptr_ka_q3d3_natv	1009	sentences	10.0
gptr_ka_q3d3_natv	1009	character_count	1615.0
gptr_ka_q3d3_natv	1009	sentences_with_citations_or_requiring_citations	10.0
gptr_ka_q3d3_natv	1009	correctly_cited_sentences	10.0
gptr_ka_q3d3_natv	1009	nuggets	15.0
gptr_ka_q3d3_natv	1009	nuggets_weighted	8.0
gptr_ka_q3d3_natv	1009	correct_nuggets	8.0
gptr_ka_q3d3_natv	1009	correct_nuggets_weighted	8.0
gptr_ka_q3d3_natv	1009	citations	10.0
gptr_ka_q3d3_natv	1009	relevant_citations	5.0
gptr_ka_q3d3_natv	1009	supporting_citations	10.0
gptr_ka_q3d3_natv	1009	citation_relevance	0.5
gptr_ka_q3d3_natv	1009	citation_support	1.0
gptr_ka_q3d3_natv	1009	sentence_support	1.0
gptr_ka_q3d3_natv	1009	nugget_coverage	0.5333333333333333
gptr_ka_q3d3_natv	1009	nugget_coverage_weighted	1.0
gptr_ka_q3d3_natv	1009	f1	0.6956521739130436
gptr_ka_q3d3_natv	1009	f1_weighted	1.0
gptr_ka_q3d3_natv	1011	sentences	8.0
gptr_ka_q3d3_natv	1011	character_count	1537.0
gptr_ka_q3d3_natv	1011	sentences_with_citations_or_requiring_citations	8.0
gptr_ka_q3d3_natv	1011	correctly_cited_sentences	7.0
gptr_ka_q3d3_natv	1011	nuggets	63.0
gptr_ka_q3d3_natv	1011	nuggets_weighted	40.0
gptr_ka_q3d3_natv	1011	correct_nuggets	21.0
gptr_ka_q3d3_natv	1011	correct_nuggets_weighted	14.0
gptr_ka_q3d3_natv	1011	citations	8.0
gptr_ka_q3d3_natv	1011	relevant_citations	0.0
gptr_ka_q3d3_natv	1011	supporting_citations	7.0
gptr_ka_q3d3_natv	1011	citation_relevance	0.0
gptr_ka_q3d3_natv	1011	citation_support	0.875
gptr_ka_q3d3_natv	1011	sentence_support	0.875
gptr_ka_q3d3_natv	1011	nugget_coverage	0.3333333333333333
gptr_ka_q3d3_natv	1011	nugget_coverage_weighted	0.35
gptr_ka_q3d3_natv	1011	f1	0.48275862068965514
gptr_ka_q3d3_natv	1011	f1_weighted	0.4999999999999999
gptr_ka_q3d3_natv	1013	sentences	7.0
gptr_ka_q3d3_natv	1013	character_count	1591.0
gptr_ka_q3d3_natv	1013	sentences_with_citations_or_requiring_citations	7.0
gptr_ka_q3d3_natv	1013	correctly_cited_sentences	6.0
gptr_ka_q3d3_natv	1013	nuggets	26.0
gptr_ka_q3d3_natv	1013	nuggets_weighted	12.0
gptr_ka_q3d3_natv	1013	correct_nuggets	16.0
gptr_ka_q3d3_natv	1013	correct_nuggets_weighted	12.0
gptr_ka_q3d3_natv	1013	citations	7.0
gptr_ka_q3d3_natv	1013	relevant_citations	4.0
gptr_ka_q3d3_natv	1013	supporting_citations	6.0
gptr_ka_q3d3_natv	1013	citation_relevance	0.5714285714285714
gptr_ka_q3d3_natv	1013	citation_support	0.8571428571428571
gptr_ka_q3d3_natv	1013	sentence_support	0.8571428571428571
gptr_ka_q3d3_natv	1013	nugget_coverage	0.6153846153846154
gptr_ka_q3d3_natv	1013	nugget_coverage_weighted	1.0
gptr_ka_q3d3_natv	1013	f1	0.7164179104477612
gptr_ka_q3d3_natv	1013	f1_weighted	0.923076923076923
gptr_ka_q3d3_natv	1017	sentences	10.0
gptr_ka_q3d3_natv	1017	character_count	1855.0
gptr_ka_q3d3_natv	1017	sentences_with_citations_or_requiring_citations	10.0
gptr_ka_q3d3_natv	1017	correctly_cited_sentences	8.0
gptr_ka_q3d3_natv	1017	nuggets	109.0
gptr_ka_q3d3_natv	1017	nuggets_weighted	62.0
gptr_ka_q3d3_natv	1017	correct_nuggets	30.0
gptr_ka_q3d3_natv	1017	correct_nuggets_weighted	22.0
gptr_ka_q3d3_natv	1017	citations	10.0
gptr_ka_q3d3_natv	1017	relevant_citations	9.0
gptr_ka_q3d3_natv	1017	supporting_citations	8.0
gptr_ka_q3d3_natv	1017	citation_relevance	0.9
gptr_ka_q3d3_natv	1017	citation_support	0.8
gptr_ka_q3d3_natv	1017	sentence_support	0.8
gptr_ka_q3d3_natv	1017	nugget_coverage	0.27522935779816515
gptr_ka_q3d3_natv	1017	nugget_coverage_weighted	0.3548387096774194
gptr_ka_q3d3_natv	1017	f1	0.4095563139931741
gptr_ka_q3d3_natv	1017	f1_weighted	0.4916201117318436
gptr_ka_q3d3_natv	1025	sentences	7.0
gptr_ka_q3d3_natv	1025	character_count	1446.0
gptr_ka_q3d3_natv	1025	sentences_with_citations_or_requiring_citations	7.0
gptr_ka_q3d3_natv	1025	correctly_cited_sentences	7.0
gptr_ka_q3d3_natv	1025	nuggets	12.0
gptr_ka_q3d3_natv	1025	nuggets_weighted	20.0
gptr_ka_q3d3_natv	1025	correct_nuggets	6.0
gptr_ka_q3d3_natv	1025	correct_nuggets_weighted	10.0
gptr_ka_q3d3_natv	1025	citations	7.0
gptr_ka_q3d3_natv	1025	relevant_citations	2.0
gptr_ka_q3d3_natv	1025	supporting_citations	7.0
gptr_ka_q3d3_natv	1025	citation_relevance	0.2857142857142857
gptr_ka_q3d3_natv	1025	citation_support	1.0
gptr_ka_q3d3_natv	1025	sentence_support	1.0
gptr_ka_q3d3_natv	1025	nugget_coverage	0.5
gptr_ka_q3d3_natv	1025	nugget_coverage_weighted	0.5
gptr_ka_q3d3_natv	1025	f1	0.6666666666666666
gptr_ka_q3d3_natv	1025	f1_weighted	0.6666666666666666
gptr_ka_q3d3_natv	1027	sentences	9.0
gptr_ka_q3d3_natv	1027	character_count	1849.0
gptr_ka_q3d3_natv	1027	sentences_with_citations_or_requiring_citations	9.0
gptr_ka_q3d3_natv	1027	correctly_cited_sentences	9.0
gptr_ka_q3d3_natv	1027	nuggets	7.0
gptr_ka_q3d3_natv	1027	nuggets_weighted	10.0
gptr_ka_q3d3_natv	1027	correct_nuggets	6.0
gptr_ka_q3d3_natv	1027	correct_nuggets_weighted	8.0
gptr_ka_q3d3_natv	1027	citations	9.0
gptr_ka_q3d3_natv	1027	relevant_citations	3.0
gptr_ka_q3d3_natv	1027	supporting_citations	9.0
gptr_ka_q3d3_natv	1027	citation_relevance	0.3333333333333333
gptr_ka_q3d3_natv	1027	citation_support	1.0
gptr_ka_q3d3_natv	1027	sentence_support	1.0
gptr_ka_q3d3_natv	1027	nugget_coverage	0.8571428571428571
gptr_ka_q3d3_natv	1027	nugget_coverage_weighted	0.8
gptr_ka_q3d3_natv	1027	f1	0.923076923076923
gptr_ka_q3d3_natv	1027	f1_weighted	0.888888888888889
gptr_ka_q3d3_natv	1029	sentences	9.0
gptr_ka_q3d3_natv	1029	character_count	1483.0
gptr_ka_q3d3_natv	1029	sentences_with_citations_or_requiring_citations	9.0
gptr_ka_q3d3_natv	1029	correctly_cited_sentences	6.0
gptr_ka_q3d3_natv	1029	nuggets	106.0
gptr_ka_q3d3_natv	1029	nuggets_weighted	58.0
gptr_ka_q3d3_natv	1029	correct_nuggets	13.0
gptr_ka_q3d3_natv	1029	correct_nuggets_weighted	4.0
gptr_ka_q3d3_natv	1029	citations	9.0
gptr_ka_q3d3_natv	1029	relevant_citations	9.0
gptr_ka_q3d3_natv	1029	supporting_citations	6.0
gptr_ka_q3d3_natv	1029	citation_relevance	1.0
gptr_ka_q3d3_natv	1029	citation_support	0.6666666666666666
gptr_ka_q3d3_natv	1029	sentence_support	0.6666666666666666
gptr_ka_q3d3_natv	1029	nugget_coverage	0.12264150943396226
gptr_ka_q3d3_natv	1029	nugget_coverage_weighted	0.06896551724137931
gptr_ka_q3d3_natv	1029	f1	0.20717131474103587
gptr_ka_q3d3_natv	1029	f1_weighted	0.125
gptr_ka_q3d3_natv	1033	sentences	9.0
gptr_ka_q3d3_natv	1033	character_count	1761.0
gptr_ka_q3d3_natv	1033	sentences_with_citations_or_requiring_citations	9.0
gptr_ka_q3d3_natv	1033	correctly_cited_sentences	8.0
gptr_ka_q3d3_natv	1033	nuggets	56.0
gptr_ka_q3d3_natv	1033	nuggets_weighted	28.0
gptr_ka_q3d3_natv	1033	correct_nuggets	14.0
gptr_ka_q3d3_natv	1033	correct_nuggets_weighted	10.0
gptr_ka_q3d3_natv	1033	citations	9.0
gptr_ka_q3d3_natv	1033	relevant_citations	6.0
gptr_ka_q3d3_natv	1033	supporting_citations	8.0
gptr_ka_q3d3_natv	1033	citation_relevance	0.6666666666666666
gptr_ka_q3d3_natv	1033	citation_support	0.8888888888888888
gptr_ka_q3d3_natv	1033	sentence_support	0.8888888888888888
gptr_ka_q3d3_natv	1033	nugget_coverage	0.25
gptr_ka_q3d3_natv	1033	nugget_coverage_weighted	0.35714285714285715
gptr_ka_q3d3_natv	1033	f1	0.3902439024390244
gptr_ka_q3d3_natv	1033	f1_weighted	0.5095541401273885
gptr_ka_q3d3_natv	1041	sentences	10.0
gptr_ka_q3d3_natv	1041	character_count	1882.0
gptr_ka_q3d3_natv	1041	sentences_with_citations_or_requiring_citations	10.0
gptr_ka_q3d3_natv	1041	correctly_cited_sentences	7.0
gptr_ka_q3d3_natv	1041	first_instance_sentences_missing_citation	1.0
gptr_ka_q3d3_natv	1041	nuggets	22.0
gptr_ka_q3d3_natv	1041	nuggets_weighted	10.0
gptr_ka_q3d3_natv	1041	correct_nuggets	7.0
gptr_ka_q3d3_natv	1041	correct_nuggets_weighted	0.0
gptr_ka_q3d3_natv	1041	citations	9.0
gptr_ka_q3d3_natv	1041	relevant_citations	3.0
gptr_ka_q3d3_natv	1041	supporting_citations	7.0
gptr_ka_q3d3_natv	1041	citation_relevance	0.3333333333333333
gptr_ka_q3d3_natv	1041	citation_support	0.7777777777777778
gptr_ka_q3d3_natv	1041	sentence_support	0.7
gptr_ka_q3d3_natv	1041	nugget_coverage	0.3181818181818182
gptr_ka_q3d3_natv	1041	nugget_coverage_weighted	0.0
gptr_ka_q3d3_natv	1041	f1	0.4375
gptr_ka_q3d3_natv	1041	f1_weighted	0.0
gptr_ka_q3d3_natv	1053	sentences	8.0
gptr_ka_q3d3_natv	1053	character_count	1405.0
gptr_ka_q3d3_natv	1053	sentences_with_citations_or_requiring_citations	8.0
gptr_ka_q3d3_natv	1053	correctly_cited_sentences	7.0
gptr_ka_q3d3_natv	1053	nuggets	21.0
gptr_ka_q3d3_natv	1053	nuggets_weighted	14.0
gptr_ka_q3d3_natv	1053	correct_nuggets	8.0
gptr_ka_q3d3_natv	1053	correct_nuggets_weighted	6.0
gptr_ka_q3d3_natv	1053	citations	8.0
gptr_ka_q3d3_natv	1053	relevant_citations	7.0
gptr_ka_q3d3_natv	1053	supporting_citations	7.0
gptr_ka_q3d3_natv	1053	citation_relevance	0.875
gptr_ka_q3d3_natv	1053	citation_support	0.875
gptr_ka_q3d3_natv	1053	sentence_support	0.875
gptr_ka_q3d3_natv	1053	nugget_coverage	0.38095238095238093
gptr_ka_q3d3_natv	1053	nugget_coverage_weighted	0.42857142857142855
gptr_ka_q3d3_natv	1053	f1	0.5308056872037914
gptr_ka_q3d3_natv	1053	f1_weighted	0.5753424657534246
gptr_ka_q3d3_natv	1065	sentences	9.0
gptr_ka_q3d3_natv	1065	character_count	1391.0
gptr_ka_q3d3_natv	1065	sentences_with_citations_or_requiring_citations	9.0
gptr_ka_q3d3_natv	1065	correctly_cited_sentences	5.0
gptr_ka_q3d3_natv	1065	nuggets	30.0
gptr_ka_q3d3_natv	1065	nuggets_weighted	30.0
gptr_ka_q3d3_natv	1065	correct_nuggets	6.0
gptr_ka_q3d3_natv	1065	correct_nuggets_weighted	6.0
gptr_ka_q3d3_natv	1065	citations	9.0
gptr_ka_q3d3_natv	1065	relevant_citations	4.0
gptr_ka_q3d3_natv	1065	supporting_citations	5.0
gptr_ka_q3d3_natv	1065	citation_relevance	0.4444444444444444
gptr_ka_q3d3_natv	1065	citation_support	0.5555555555555556
gptr_ka_q3d3_natv	1065	sentence_support	0.5555555555555556
gptr_ka_q3d3_natv	1065	nugget_coverage	0.2
gptr_ka_q3d3_natv	1065	nugget_coverage_weighted	0.2
gptr_ka_q3d3_natv	1065	f1	0.29411764705882354
gptr_ka_q3d3_natv	1065	f1_weighted	0.29411764705882354
gptr_ka_q3d3_natv	1069	sentences	10.0
gptr_ka_q3d3_natv	1069	character_count	1472.0
gptr_ka_q3d3_natv	1069	sentences_with_citations_or_requiring_citations	10.0
gptr_ka_q3d3_natv	1069	correctly_cited_sentences	4.0
gptr_ka_q3d3_natv	1069	first_instance_sentences_missing_citation	1.0
gptr_ka_q3d3_natv	1069	nuggets	11.0
gptr_ka_q3d3_natv	1069	nuggets_weighted	11.0
gptr_ka_q3d3_natv	1069	correct_nuggets	0.0
gptr_ka_q3d3_natv	1069	correct_nuggets_weighted	0.0
gptr_ka_q3d3_natv	1069	citations	9.0
gptr_ka_q3d3_natv	1069	relevant_citations	0.0
gptr_ka_q3d3_natv	1069	supporting_citations	4.0
gptr_ka_q3d3_natv	1069	citation_relevance	0.0
gptr_ka_q3d3_natv	1069	citation_support	0.4444444444444444
gptr_ka_q3d3_natv	1069	sentence_support	0.4
gptr_ka_q3d3_natv	1069	nugget_coverage	0.0
gptr_ka_q3d3_natv	1069	nugget_coverage_weighted	0.0
gptr_ka_q3d3_natv	1069	f1	0.0
gptr_ka_q3d3_natv	1069	f1_weighted	0.0
