run_id	request_id	metric	value
auto_swarm_mt	all	sentences	219.0
auto_swarm_mt	all	sentences_with_citations_or_requiring_citations	212.0
auto_swarm_mt	all	correctly_cited_sentences	199.0
auto_swarm_mt	all	first_instance_sentences_missing_citation	5.0
auto_swarm_mt	all	nuggets	815.0
auto_swarm_mt	all	nuggets_weighted	477.0
auto_swarm_mt	all	correct_nuggets	224.0
auto_swarm_mt	all	correct_nuggets_weighted	179.0
auto_swarm_mt	all	citations	238.0
auto_swarm_mt	all	relevant_citations	115.0
auto_swarm_mt	all	supporting_citations	228.0
auto_swarm_mt	all	character_count_median	1802.0
auto_swarm_mt	all	character_count_max	2000.0
auto_swarm_mt	all	citation_relevance_micro	0.4831932773109244
auto_swarm_mt	all	citation_relevance_macro	0.5158704932408493
auto_swarm_mt	all	citation_support_micro	0.957983193277311
auto_swarm_mt	all	citation_support_macro	0.961853138691374
auto_swarm_mt	all	sentence_support_micro	0.9386792452830188
auto_swarm_mt	all	sentence_support_macro	0.943660480654966
auto_swarm_mt	all	nugget_coverage_micro	0.2748466257668712
auto_swarm_mt	all	nugget_coverage_macro	0.3602472006674814
auto_swarm_mt	all	nugget_coverage_weighted_micro	0.3752620545073375
auto_swarm_mt	all	nugget_coverage_weighted_macro	0.4060331142601374
auto_swarm_mt	all	f1_micro	0.42519542334969224
auto_swarm_mt	all	f1_macro	0.4791931515329992
auto_swarm_mt	all	f1_weighted_micro	0.5361741839829609
auto_swarm_mt	all	f1_weighted_macro	0.5089427637045885
auto_swarm_mt	1001	sentences	18.0
auto_swarm_mt	1001	character_count	1822.0
auto_swarm_mt	1001	sentences_with_citations_or_requiring_citations	18.0
auto_swarm_mt	1001	correctly_cited_sentences	16.0
auto_swarm_mt	1001	nuggets	101.0
auto_swarm_mt	1001	nuggets_weighted	110.0
auto_swarm_mt	1001	correct_nuggets	50.0
auto_swarm_mt	1001	correct_nuggets_weighted	58.0
auto_swarm_mt	1001	citations	35.0
auto_swarm_mt	1001	relevant_citations	10.0
auto_swarm_mt	1001	supporting_citations	32.0
auto_swarm_mt	1001	citation_relevance	0.2857142857142857
auto_swarm_mt	1001	citation_support	0.9142857142857143
auto_swarm_mt	1001	sentence_support	0.8888888888888888
auto_swarm_mt	1001	nugget_coverage	0.49504950495049505
auto_swarm_mt	1001	nugget_coverage_weighted	0.5272727272727272
auto_swarm_mt	1001	f1	0.6359300476947536
auto_swarm_mt	1001	f1_weighted	0.6619115549215405
auto_swarm_mt	1003	sentences	12.0
auto_swarm_mt	1003	character_count	1782.0
auto_swarm_mt	1003	sentences_with_citations_or_requiring_citations	12.0
auto_swarm_mt	1003	correctly_cited_sentences	11.0
auto_swarm_mt	1003	first_instance_sentences_missing_citation	1.0
auto_swarm_mt	1003	nuggets	103.0
auto_swarm_mt	1003	nuggets_weighted	26.0
auto_swarm_mt	1003	correct_nuggets	16.0
auto_swarm_mt	1003	correct_nuggets_weighted	6.0
auto_swarm_mt	1003	citations	13.0
auto_swarm_mt	1003	relevant_citations	4.0
auto_swarm_mt	1003	supporting_citations	13.0
auto_swarm_mt	1003	citation_relevance	0.3076923076923077
auto_swarm_mt	1003	citation_support	1.0
auto_swarm_mt	1003	sentence_support	0.9166666666666666
auto_swarm_mt	1003	nugget_coverage	0.1553398058252427
auto_swarm_mt	1003	nugget_coverage_weighted	0.23076923076923078
auto_swarm_mt	1003	f1	0.2656603773584905
auto_swarm_mt	1003	f1_weighted	0.3687150837988827
auto_swarm_mt	1005	sentences	17.0
auto_swarm_mt	1005	character_count	1867.0
auto_swarm_mt	1005	sentences_with_citations_or_requiring_citations	17.0
auto_swarm_mt	1005	correctly_cited_sentences	16.0
auto_swarm_mt	1005	nuggets	111.0
auto_swarm_mt	1005	nuggets_weighted	32.0
auto_swarm_mt	1005	correct_nuggets	13.0
auto_swarm_mt	1005	correct_nuggets_weighted	6.0
auto_swarm_mt	1005	citations	18.0
auto_swarm_mt	1005	relevant_citations	11.0
auto_swarm_mt	1005	supporting_citations	17.0
auto_swarm_mt	1005	citation_relevance	0.6111111111111112
auto_swarm_mt	1005	citation_support	0.9444444444444444
auto_swarm_mt	1005	sentence_support	0.9411764705882353
auto_swarm_mt	1005	nugget_coverage	0.11711711711711711
auto_swarm_mt	1005	nugget_coverage_weighted	0.1875
auto_swarm_mt	1005	f1	0.2083124687030546
auto_swarm_mt	1005	f1_weighted	0.3127035830618892
auto_swarm_mt	1007	sentences	10.0
auto_swarm_mt	1007	character_count	1340.0
auto_swarm_mt	1007	sentences_with_citations_or_requiring_citations	10.0
auto_swarm_mt	1007	correctly_cited_sentences	10.0
auto_swarm_mt	1007	nuggets	22.0
auto_swarm_mt	1007	nuggets_weighted	6.0
auto_swarm_mt	1007	correct_nuggets	10.0
auto_swarm_mt	1007	correct_nuggets_weighted	2.0
auto_swarm_mt	1007	citations	10.0
auto_swarm_mt	1007	relevant_citations	10.0
auto_swarm_mt	1007	supporting_citations	10.0
auto_swarm_mt	1007	citation_relevance	1.0
auto_swarm_mt	1007	citation_support	1.0
auto_swarm_mt	1007	sentence_support	1.0
auto_swarm_mt	1007	nugget_coverage	0.45454545454545453
auto_swarm_mt	1007	nugget_coverage_weighted	0.3333333333333333
auto_swarm_mt	1007	f1	0.625
auto_swarm_mt	1007	f1_weighted	0.5
auto_swarm_mt	1009	sentences	22.0
auto_swarm_mt	1009	character_count	2000.0
auto_swarm_mt	1009	sentences_with_citations_or_requiring_citations	21.0
auto_swarm_mt	1009	correctly_cited_sentences	21.0
auto_swarm_mt	1009	nuggets	15.0
auto_swarm_mt	1009	nuggets_weighted	8.0
auto_swarm_mt	1009	correct_nuggets	10.0
auto_swarm_mt	1009	correct_nuggets_weighted	8.0
auto_swarm_mt	1009	citations	21.0
auto_swarm_mt	1009	relevant_citations	20.0
auto_swarm_mt	1009	supporting_citations	21.0
auto_swarm_mt	1009	citation_relevance	0.9523809523809523
auto_swarm_mt	1009	citation_support	1.0
auto_swarm_mt	1009	sentence_support	1.0
auto_swarm_mt	1009	nugget_coverage	0.6666666666666666
auto_swarm_mt	1009	nugget_coverage_weighted	1.0
auto_swarm_mt	1009	f1	0.8
auto_swarm_mt	1009	f1_weighted	1.0
auto_swarm_mt	1011	sentences	10.0
auto_swarm_mt	1011	character_count	1734.0
auto_swarm_mt	1011	sentences_with_citations_or_requiring_citations	10.0
auto_swarm_mt	1011	correctly_cited_sentences	10.0
auto_swarm_mt	1011	nuggets	63.0
auto_swarm_mt	1011	nuggets_weighted	40.0
auto_swarm_mt	1011	correct_nuggets	19.0
auto_swarm_mt	1011	correct_nuggets_weighted	12.0
auto_swarm_mt	1011	citations	10.0
auto_swarm_mt	1011	relevant_citations	0.0
auto_swarm_mt	1011	supporting_citations	10.0
auto_swarm_mt	1011	citation_relevance	0.0
auto_swarm_mt	1011	citation_support	1.0
auto_swarm_mt	1011	sentence_support	1.0
auto_swarm_mt	1011	nugget_coverage	0.30158730158730157
auto_swarm_mt	1011	nugget_coverage_weighted	0.3
auto_swarm_mt	1011	f1	0.46341463414634143
auto_swarm_mt	1011	f1_weighted	0.4615384615384615
auto_swarm_mt	1013	sentences	3.0
auto_swarm_mt	1013	character_count	1405.0
auto_swarm_mt	1013	sentences_with_citations_or_requiring_citations	2.0
auto_swarm_mt	1013	correctly_cited_sentences	2.0
auto_swarm_mt	1013	nuggets	26.0
auto_swarm_mt	1013	nuggets_weighted	12.0
auto_swarm_mt	1013	correct_nuggets	6.0
auto_swarm_mt	1013	correct_nuggets_weighted	6.0
auto_swarm_mt	1013	citations	3.0
auto_swarm_mt	1013	relevant_citations	3.0
auto_swarm_mt	1013	supporting_citations	3.0
auto_swarm_mt	1013	citation_relevance	1.0
auto_swarm_mt	1013	citation_support	1.0
auto_swarm_mt	1013	sentence_support	1.0
auto_swarm_mt	1013	nugget_coverage	0.23076923076923078
auto_swarm_mt	1013	nugget_coverage_weighted	0.5
auto_swarm_mt	1013	f1	0.375
auto_swarm_mt	1013	f1_weighted	0.6666666666666666
auto_swarm_mt	1017	sentences	11.0
auto_swarm_mt	1017	character_count	1968.0
auto_swarm_mt	1017	sentences_with_citations_or_requiring_citations	11.0
auto_swarm_mt	1017	correctly_cited_sentences	11.0
auto_swarm_mt	1017	nuggets	109.0
auto_swarm_mt	1017	nuggets_weighted	62.0
auto_swarm_mt	1017	correct_nuggets	24.0
auto_swarm_mt	1017	correct_nuggets_weighted	20.0
auto_swarm_mt	1017	citations	11.0
auto_swarm_mt	1017	relevant_citations	4.0
auto_swarm_mt	1017	supporting_citations	11.0
auto_swarm_mt	1017	citation_relevance	0.36363636363636365
auto_swarm_mt	1017	citation_support	1.0
auto_swarm_mt	1017	sentence_support	1.0
auto_swarm_mt	1017	nugget_coverage	0.22018348623853212
auto_swarm_mt	1017	nugget_coverage_weighted	0.3225806451612903
auto_swarm_mt	1017	f1	0.3609022556390978
auto_swarm_mt	1017	f1_weighted	0.4878048780487805
auto_swarm_mt	1025	sentences	14.0
auto_swarm_mt	1025	character_count	1942.0
auto_swarm_mt	1025	sentences_with_citations_or_requiring_citations	13.0
auto_swarm_mt	1025	correctly_cited_sentences	12.0
auto_swarm_mt	1025	nuggets	12.0
auto_swarm_mt	1025	nuggets_weighted	20.0
auto_swarm_mt	1025	correct_nuggets	8.0
auto_swarm_mt	1025	correct_nuggets_weighted	14.0
auto_swarm_mt	1025	citations	17.0
auto_swarm_mt	1025	relevant_citations	9.0
auto_swarm_mt	1025	supporting_citations	16.0
auto_swarm_mt	1025	citation_relevance	0.5294117647058824
auto_swarm_mt	1025	citation_support	0.9411764705882353
auto_swarm_mt	1025	sentence_support	0.9230769230769231
auto_swarm_mt	1025	nugget_coverage	0.6666666666666666
auto_swarm_mt	1025	nugget_coverage_weighted	0.7
auto_swarm_mt	1025	f1	0.7741935483870968
auto_swarm_mt	1025	f1_weighted	0.7962085308056872
auto_swarm_mt	1027	sentences	15.0
auto_swarm_mt	1027	character_count	1434.0
auto_swarm_mt	1027	sentences_with_citations_or_requiring_citations	15.0
auto_swarm_mt	1027	correctly_cited_sentences	15.0
auto_swarm_mt	1027	nuggets	7.0
auto_swarm_mt	1027	nuggets_weighted	10.0
auto_swarm_mt	1027	correct_nuggets	6.0
auto_swarm_mt	1027	correct_nuggets_weighted	8.0
auto_swarm_mt	1027	citations	15.0
auto_swarm_mt	1027	relevant_citations	5.0
auto_swarm_mt	1027	supporting_citations	15.0
auto_swarm_mt	1027	citation_relevance	0.3333333333333333
auto_swarm_mt	1027	citation_support	1.0
auto_swarm_mt	1027	sentence_support	1.0
auto_swarm_mt	1027	nugget_coverage	0.8571428571428571
auto_swarm_mt	1027	nugget_coverage_weighted	0.8
auto_swarm_mt	1027	f1	0.923076923076923
auto_swarm_mt	1027	f1_weighted	0.888888888888889
auto_swarm_mt	1029	sentences	11.0
auto_swarm_mt	1029	character_count	1609.0
auto_swarm_mt	1029	sentences_with_citations_or_requiring_citations	11.0
auto_swarm_mt	1029	correctly_cited_sentences	9.0
auto_swarm_mt	1029	nuggets	106.0
auto_swarm_mt	1029	nuggets_weighted	58.0
auto_swarm_mt	1029	correct_nuggets	16.0
auto_swarm_mt	1029	correct_nuggets_weighted	8.0
auto_swarm_mt	1029	citations	12.0
auto_swarm_mt	1029	relevant_citations	11.0
auto_swarm_mt	1029	supporting_citations	9.0
auto_swarm_mt	1029	citation_relevance	0.9166666666666666
auto_swarm_mt	1029	citation_support	0.75
auto_swarm_mt	1029	sentence_support	0.8181818181818182
auto_swarm_mt	1029	nugget_coverage	0.1509433962264151
auto_swarm_mt	1029	nugget_coverage_weighted	0.13793103448275862
auto_swarm_mt	1029	f1	0.25486725663716814
auto_swarm_mt	1029	f1_weighted	0.2360655737704918
auto_swarm_mt	1033	sentences	16.0
auto_swarm_mt	1033	character_count	2000.0
auto_swarm_mt	1033	sentences_with_citations_or_requiring_citations	15.0
auto_swarm_mt	1033	correctly_cited_sentences	15.0
auto_swarm_mt	1033	nuggets	56.0
auto_swarm_mt	1033	nuggets_weighted	28.0
auto_swarm_mt	1033	correct_nuggets	23.0
auto_swarm_mt	1033	correct_nuggets_weighted	18.0
auto_swarm_mt	1033	citations	20.0
auto_swarm_mt	1033	relevant_citations	8.0
auto_swarm_mt	1033	supporting_citations	20.0
auto_swarm_mt	1033	citation_relevance	0.4
auto_swarm_mt	1033	citation_support	1.0
auto_swarm_mt	1033	sentence_support	1.0
auto_swarm_mt	1033	nugget_coverage	0.4107142857142857
auto_swarm_mt	1033	nugget_coverage_weighted	0.6428571428571429
auto_swarm_mt	1033	f1	0.5822784810126582
auto_swarm_mt	1033	f1_weighted	0.782608695652174
auto_swarm_mt	1041	sentences	19.0
auto_swarm_mt	1041	character_count	1979.0
auto_swarm_mt	1041	sentences_with_citations_or_requiring_citations	19.0
auto_swarm_mt	1041	correctly_cited_sentences	19.0
auto_swarm_mt	1041	nuggets	22.0
auto_swarm_mt	1041	nuggets_weighted	10.0
auto_swarm_mt	1041	correct_nuggets	7.0
auto_swarm_mt	1041	correct_nuggets_weighted	0.0
auto_swarm_mt	1041	citations	19.0
auto_swarm_mt	1041	relevant_citations	2.0
auto_swarm_mt	1041	supporting_citations	19.0
auto_swarm_mt	1041	citation_relevance	0.10526315789473684
auto_swarm_mt	1041	citation_support	1.0
auto_swarm_mt	1041	sentence_support	1.0
auto_swarm_mt	1041	nugget_coverage	0.3181818181818182
auto_swarm_mt	1041	nugget_coverage_weighted	0.0
auto_swarm_mt	1041	f1	0.4827586206896552
auto_swarm_mt	1041	f1_weighted	0.0
auto_swarm_mt	1053	sentences	13.0
auto_swarm_mt	1053	character_count	1834.0
auto_swarm_mt	1053	sentences_with_citations_or_requiring_citations	13.0
auto_swarm_mt	1053	correctly_cited_sentences	12.0
auto_swarm_mt	1053	nuggets	21.0
auto_swarm_mt	1053	nuggets_weighted	14.0
auto_swarm_mt	1053	correct_nuggets	13.0
auto_swarm_mt	1053	correct_nuggets_weighted	10.0
auto_swarm_mt	1053	citations	13.0
auto_swarm_mt	1053	relevant_citations	8.0
auto_swarm_mt	1053	supporting_citations	12.0
auto_swarm_mt	1053	citation_relevance	0.6153846153846154
auto_swarm_mt	1053	citation_support	0.9230769230769231
auto_swarm_mt	1053	sentence_support	0.9230769230769231
auto_swarm_mt	1053	nugget_coverage	0.6190476190476191
auto_swarm_mt	1053	nugget_coverage_weighted	0.7142857142857143
auto_swarm_mt	1053	f1	0.7410926365795725
auto_swarm_mt	1053	f1_weighted	0.8053691275167787
auto_swarm_mt	1065	sentences	16.0
auto_swarm_mt	1065	character_count	1619.0
auto_swarm_mt	1065	sentences_with_citations_or_requiring_citations	16.0
auto_swarm_mt	1065	correctly_cited_sentences	11.0
auto_swarm_mt	1065	first_instance_sentences_missing_citation	4.0
auto_swarm_mt	1065	nuggets	30.0
auto_swarm_mt	1065	nuggets_weighted	30.0
auto_swarm_mt	1065	correct_nuggets	3.0
auto_swarm_mt	1065	correct_nuggets_weighted	3.0
auto_swarm_mt	1065	citations	12.0
auto_swarm_mt	1065	relevant_citations	10.0
auto_swarm_mt	1065	supporting_citations	11.0
auto_swarm_mt	1065	citation_relevance	0.8333333333333334
auto_swarm_mt	1065	citation_support	0.9166666666666666
auto_swarm_mt	1065	sentence_support	0.6875
auto_swarm_mt	1065	nugget_coverage	0.1
auto_swarm_mt	1065	nugget_coverage_weighted	0.1
auto_swarm_mt	1065	f1	0.17460317460317462
auto_swarm_mt	1065	f1_weighted	0.17460317460317462
auto_swarm_mt	1069	sentences	12.0
auto_swarm_mt	1069	character_count	1559.0
auto_swarm_mt	1069	sentences_with_citations_or_requiring_citations	9.0
auto_swarm_mt	1069	correctly_cited_sentences	9.0
auto_swarm_mt	1069	nuggets	11.0
auto_swarm_mt	1069	nuggets_weighted	11.0
auto_swarm_mt	1069	correct_nuggets	0.0
auto_swarm_mt	1069	correct_nuggets_weighted	0.0
auto_swarm_mt	1069	citations	9.0
auto_swarm_mt	1069	relevant_citations	0.0
auto_swarm_mt	1069	supporting_citations	9.0
auto_swarm_mt	1069	citation_relevance	0.0
auto_swarm_mt	1069	citation_support	1.0
auto_swarm_mt	1069	sentence_support	1.0
auto_swarm_mt	1069	nugget_coverage	0.0
auto_swarm_mt	1069	nugget_coverage_weighted	0.0
auto_swarm_mt	1069	f1	0.0
auto_swarm_mt	1069	f1_weighted	0.0
