run_id	topic_id	sent_id	annotation_job	judge	annotation
v1_qwen	1001	0	nugget_mentioned	human	"[[""Which AI system demonstrates the foundation laid by Hinton\u2019s pioneering research in deep learning and neural networks?"", ""ChatGPT""]]"
v1_qwen	1001	0	sentence_support	human	True
v1_qwen	1001	1	nugget_mentioned	human	"[[""Which AI system demonstrates the foundation laid by Hinton\u2019s pioneering research in deep learning and neural networks?"", ""ChatGPT""]]"
v1_qwen	1001	1	sentence_support	human	False
v1_qwen	1001	2	nugget_mentioned	human	"[[""Why did Hinton leave Google when he helped develop AI but later grew concerned about its dangers?"", ""To speak out freely about AI dangers.""]]"
v1_qwen	1001	2	sentence_support	gpt-5-mini	False
v1_qwen	1001	3	sentence_support	gpt-5-mini	False
v1_qwen	1001	4	sentence_support	gpt-5-mini	False
v1_qwen	1001	5	nugget_mentioned	human	"[[""Which AI system demonstrates the foundation laid by Hinton\u2019s pioneering research in deep learning and neural networks?"", ""ChatGPT""]]"
v1_qwen	1001	5	sentence_support	human	False
v1_qwen	1001	6	nugget_mentioned	human	"[[""What breakthroughs has Hinton achieved through his 40+ years of work on artificial neural networks?"", ""Breakthroughs that mimic biological brains""]]"
v1_qwen	1001	6	sentence_support	human	False
v1_qwen	1001	7	nugget_mentioned	human	"[[""What breakthroughs has Hinton achieved through his 40+ years of work on artificial neural networks?"", ""Breakthroughs that mimic biological brains""]]"
v1_qwen	1001	7	sentence_support	human	False
v1_qwen	1001	8	sentence_support	human	False
v1_qwen	1003	0	sentence_support	gpt-5-mini	False
v1_qwen	1003	1	sentence_support	human	False
v1_qwen	1003	2	sentence_support	human	False
v1_qwen	1003	3	sentence_support	gpt-5-mini	False
v1_qwen	1003	4	sentence_support	gpt-5-mini	False
v1_qwen	1003	5	nugget_mentioned	human	"[[""What are the criteria of the top 20 digital nomad locations?"", ""A digital nomad visa program or the equivalent""]]"
v1_qwen	1003	5	sentence_support	gpt-5-mini	False
v1_qwen	1005	0	sentence_support	gpt-5-mini	False
v1_qwen	1005	1	sentence_support	gpt-5-mini	False
v1_qwen	1005	2	sentence_support	gpt-5-mini	False
v1_qwen	1005	3	sentence_support	gpt-5-mini	False
v1_qwen	1005	4	nugget_mentioned	human	"[[""what non-EU countries have started issuing digital nomad visas?"", ""Malaysia""], [""What countries does \""Visa Guide\"" rank as the top destinations for remote work? "", ""UAE - 4""]]"
v1_qwen	1005	4	sentence_support	gpt-5-mini	False
v1_qwen	1007	0	sentence_support	human	False
v1_qwen	1007	1	sentence_support	human	False
v1_qwen	1007	2	nugget_mentioned	human	"[[""Which countries' airforces are the purchasers of China's J-10 FIghter?"", ""The Pakistan Air Force""], [""How many J-10 Fighters has Pakistan imported from China?"", "" 36 J-10CE Fighters. ""], [""How many J-10 fighters has Pakistan imported from China in total since its initial purchase?"", ""other""]]"
v1_qwen	1007	2	sentence_support	human	False
v1_qwen	1007	3	nugget_mentioned	human	"[[""Which countries' airforces are the purchasers of China's J-10 FIghter?"", ""The Pakistan Air Force""], [""How many J-10 Fighters has Pakistan imported from China?"", ""other""], [""How many J-10 fighters has Pakistan imported from China in total since its initial purchase?"", ""other""], [""What may some improvements made in China's J-10 Fighter help Pakistan Airforce?"", ""Enable Pakistan Air Force to carry more missiles to perform combat missions""]]"
v1_qwen	1007	3	sentence_support	human	False
v1_qwen	1007	4	nugget_mentioned	human	"[[""Which countries' airforces are the purchasers of China's J-10 FIghter?"", ""The Pakistan Air Force""], [""How many J-10 Fighters has Pakistan imported from China?"", ""other""], [""How many J-10 fighters has Pakistan imported from China in total since its initial purchase?"", ""Increased to 60""]]"
v1_qwen	1007	4	sentence_support	human	False
v1_qwen	1007	5	sentence_support	human	False
v1_qwen	1007	6	sentence_support	human	False
v1_qwen	1009	0	sentence_support	human	False
v1_qwen	1009	1	sentence_support	human	False
v1_qwen	1009	2	sentence_support	human	False
v1_qwen	1009	3	sentence_support	human	False
v1_qwen	1009	4	nugget_mentioned	human	"[[""How does Saharan dust affect immediate weather?"", ""lowers air quality""], [""What are the negative effects of Saharan dust storm on infrastructure?"", ""Worsens visibility on roads""]]"
v1_qwen	1009	4	sentence_support	gpt-5-mini	False
v1_qwen	1009	5	sentence_support	human	False
v1_qwen	1009	6	sentence_support	human	False
v1_qwen	1011	0	sentence_support	human	False
v1_qwen	1011	1	sentence_support	human	False
v1_qwen	1011	2	nugget_mentioned	human	"[[""What are MBS\u2019s goals under Vision 2030?"", ""To reduce Saudi Arabia\u2019s oil dependence  ""], [""What are some of the key goals of Vision 2030 for society and economy?"", ""Diversify the economy from oil""], [""What are the main goals of the 2016- launched Vision 2030?"", ""To diversify Saudi Arabia\u2019s economy ""], [""What are the main goals of the 2016- launched Vision 2030?"", ""To lessen reliance on oil.""]]"
v1_qwen	1011	2	sentence_support	human	False
v1_qwen	1011	3	sentence_support	human	False
v1_qwen	1011	4	sentence_support	human	False
v1_qwen	1013	0	sentence_support	human	False
v1_qwen	1013	1	sentence_support	human	False
v1_qwen	1013	2	nugget_mentioned	human	"[[""What happened after the opening of McDonald's restaurants in Rome opened?"", ""Slow Food Movement formed.""], [""Who is founder of the Slow Food Movement?"", ""Carlo Petrini""], [""When did Carlo Petrini launch the Slow Food Movement?"", ""other""], [""What is the birthplace of the slow food movement?"", ""other""]]"
v1_qwen	1013	2	sentence_support	gpt-5-mini	False
v1_qwen	1013	3	nugget_mentioned	human	"[[""What happened after the opening of McDonald's restaurants in Rome opened?"", ""Slow Food Movement formed.""], [""Who is founder of the Slow Food Movement?"", ""Carlo Petrini""], [""What did Carlo Petrini think was the reason for the disconnection between farmers and consumers? "", "" Large retail stores and fast-food restaurants saturated the city center""]]"
v1_qwen	1013	3	sentence_support	human	False
v1_qwen	1013	4	sentence_support	human	False
v1_qwen	1013	5	sentence_support	gpt-5-mini	False
v1_qwen	1015	0	sentence_support	human	False
v1_qwen	1015	1	sentence_support	human	False
v1_qwen	1015	2	sentence_support	human	False
v1_qwen	1017	0	sentence_support	human	False
v1_qwen	1017	1	sentence_support	human	False
v1_qwen	1017	2	nugget_mentioned	human	"[[""According to John Musker, why does Disney rely on live-action remakes rather than producing new stories?"", ""As a risk-reduction strategy""], [""What motivates Disney to keep producing live-action remakes despite mixed reviews?"", ""Box office success.""]]"
v1_qwen	1017	2	sentence_support	human	False
v1_qwen	1019	0	sentence_support	human	False
v1_qwen	1019	1	sentence_support	human	False
v1_qwen	1019	2	sentence_support	human	False
v1_qwen	1019	3	nugget_mentioned	human	"[[""What is the concept of Tai Chi?"", ""other""]]"
v1_qwen	1019	3	sentence_support	human	False
v1_qwen	1021	0	sentence_support	gpt-5-mini	False
v1_qwen	1021	1	sentence_support	gpt-5-mini	False
v1_qwen	1021	2	sentence_support	gpt-5-mini	False
v1_qwen	1021	3	sentence_support	gpt-5-mini	False
v1_qwen	1021	4	sentence_support	gpt-5-mini	False
v1_qwen	1021	5	sentence_support	gpt-5-mini	False
v1_qwen	1023	0	sentence_support	human	False
v1_qwen	1023	1	sentence_support	gpt-5-mini	False
v1_qwen	1023	2	sentence_support	human	False
v1_qwen	1023	3	sentence_support	gpt-5-mini	False
v1_qwen	1023	4	sentence_support	gpt-5-mini	False
v1_qwen	1023	5	sentence_support	gpt-5-mini	False
v1_qwen	1023	6	sentence_support	human	False
v1_qwen	1023	7	sentence_support	gpt-5-mini	False
v1_qwen	1025	0	nugget_mentioned	human	"[[""How has the gender balance in the construction and maritime industries changed over recent decades?"", ""number of female employees increased""], [""Why are construction and maritime industries more popular with women nowadays?"", ""changing social norms""]]"
v1_qwen	1025	0	sentence_support	human	False
v1_qwen	1025	1	nugget_mentioned	human	"[[""Why are construction and maritime industries more popular with women nowadays?"", ""changing social norms""], [""Why are construction and maritime industries more popular with women nowadays?"", ""variety of opportunities available""], [""What are governments doing to promote and aid women in construction or maritime industries?"", ""inclusive policies""]]"
v1_qwen	1025	1	sentence_support	human	False
v1_qwen	1025	2	nugget_mentioned	human	"[[""How has the gender balance in the construction and maritime industries changed over recent decades?"", ""number of female employees increased""], [""Why are construction and maritime industries more popular with women nowadays?"", ""changing social norms""]]"
v1_qwen	1025	2	sentence_support	human	False
v1_qwen	1025	3	nugget_mentioned	human	"[[""How has the gender balance in the construction and maritime industries changed over recent decades?"", ""number of female employees increased""]]"
v1_qwen	1025	3	sentence_support	human	False
v1_qwen	1025	4	nugget_mentioned	human	"[[""How has the gender balance in the construction and maritime industries changed over recent decades?"", ""number of female employees increased""]]"
v1_qwen	1025	4	sentence_support	gpt-5-mini	False
v1_qwen	1025	5	nugget_mentioned	human	"[[""What are governments doing to promote and aid women in construction or maritime industries?"", ""inclusive policies""]]"
v1_qwen	1025	5	sentence_support	gpt-5-mini	False
v1_qwen	1025	6	sentence_support	human	False
v1_qwen	1027	0	nugget_mentioned	human	"[[""How has the gender balance in the construction and maritime industries changed over recent decades?"", ""number of female employees increased""]]"
v1_qwen	1027	0	sentence_support	gpt-5-mini	False
v1_qwen	1027	1	sentence_support	gpt-5-mini	False
v1_qwen	1027	2	nugget_mentioned	human	"[[""How has the gender balance in the construction and maritime industries changed over recent decades?"", ""number of female employees increased""]]"
v1_qwen	1027	2	sentence_support	gpt-5-mini	False
v1_qwen	1027	3	nugget_mentioned	human	"[[""How has the gender balance in the construction and maritime industries changed over recent decades?"", ""number of female employees increased""]]"
v1_qwen	1027	3	sentence_support	gpt-5-mini	False
v1_qwen	1027	4	sentence_support	gpt-5-mini	False
v1_qwen	1027	5	sentence_support	gpt-5-mini	False
v1_qwen	1027	6	sentence_support	gpt-5-mini	False
v1_qwen	1029	0	sentence_support	gpt-5-mini	False
v1_qwen	1029	1	sentence_support	human	False
v1_qwen	1029	2	sentence_support	gpt-5-mini	False
v1_qwen	1029	3	sentence_support	human	False
v1_qwen	1029	4	sentence_support	human	False
v1_qwen	1029	5	sentence_support	human	False
v1_qwen	1029	6	sentence_support	gpt-5-mini	False
v1_qwen	1029	7	sentence_support	human	False
v1_qwen	1029	8	sentence_support	gpt-5-mini	False
v1_qwen	1029	9	nugget_mentioned	human	"[[""What is science fiction based on?"", ""Speculative scientific discoveries""], [""What is science fiction based on?"", ""Life on other planets""]]"
v1_qwen	1029	9	sentence_support	gpt-5-mini	False
v1_qwen	1031	0	sentence_support	gpt-5-mini	False
v1_qwen	1031	1	sentence_support	gpt-5-mini	False
v1_qwen	1031	2	sentence_support	gpt-5-mini	False
v1_qwen	1031	3	sentence_support	human	False
v1_qwen	1031	4	sentence_support	human	False
v1_qwen	1031	5	sentence_support	human	False
v1_qwen	1033	0	sentence_support	gpt-5-mini	False
v1_qwen	1033	1	sentence_support	human	False
v1_qwen	1033	2	sentence_support	gpt-5-mini	False
v1_qwen	1033	3	sentence_support	human	False
v1_qwen	1033	4	sentence_support	human	False
v1_qwen	1033	5	sentence_support	gpt-5-mini	False
v1_qwen	1033	6	sentence_support	human	False
v1_qwen	1035	0	sentence_support	human	False
v1_qwen	1035	1	sentence_support	human	True
v1_qwen	1035	2	sentence_support	human	False
v1_qwen	1035	3	sentence_support	human	False
v1_qwen	1035	4	sentence_support	human	False
v1_qwen	1035	5	sentence_support	human	True
v1_qwen	1035	6	sentence_support	human	False
v1_qwen	1037	0	sentence_support	human	False
v1_qwen	1039	0	sentence_support	gpt-5-mini	False
v1_qwen	1041	0	sentence_support	gpt-5-mini	False
v1_qwen	1047	0	sentence_support	gpt-5-mini	False
v1_qwen	1047	1	sentence_support	gpt-5-mini	False
v1_qwen	1047	2	sentence_support	human	False
v1_qwen	1047	3	nugget_mentioned	human	"[[""What is the main cause of ocean acidification?"", ""other""], [""What is the main cause of ocean acidification?"", ""water absorbs carbon dioxide from the atmosphere""]]"
v1_qwen	1047	3	sentence_support	human	False
v1_qwen	1047	4	nugget_mentioned	human	"[[""What is the main cause of ocean acidification?"", ""other""]]"
v1_qwen	1047	4	sentence_support	human	False
v1_qwen	1047	5	nugget_mentioned	human	"[[""What do shellfish use to build their shells?"", ""calcium carbonate ""], [""Which ocean creatures have trouble forming shells due to ocean acidification?"", ""other""], [""Which marine organism is vulnerable to increased levels of ocean acidification?"", ""cephalopods""]]"
v1_qwen	1047	5	sentence_support	human	False
v1_qwen	1047	6	sentence_support	gpt-5-mini	False
v1_qwen	1053	0	sentence_support	human	False
v1_qwen	1053	1	sentence_support	human	False
v1_qwen	1053	2	sentence_support	human	False
v1_qwen	1053	3	nugget_mentioned	human	"[[""How has avocado consumption changed in recent years?"", ""increased""]]"
v1_qwen	1053	3	sentence_support	gpt-5-mini	False
v1_qwen	1053	4	nugget_mentioned	human	"[[""How has avocado consumption changed in recent years?"", ""increased""]]"
v1_qwen	1053	4	sentence_support	gpt-5-mini	False
v1_qwen	1053	5	nugget_mentioned	human	"[[""What are the countries and regions that produce and export avocados?"", ""other""], [""What are the countries and regions that produce and export avocados?"", ""Mexico""], [""What are the countries and regions that import avocados?"", ""other""], [""What are the countries and regions that import avocados?"", ""North America""], [""What are the countries and regions that import avocados?"", ""Europe""]]"
v1_qwen	1053	5	sentence_support	human	False
v1_qwen	1053	6	sentence_support	human	False
v1_qwen	1053	7	nugget_mentioned	human	"[[""What are the positive effects of the global demand for avocados on the countries and regions that produce and export them?"", ""other""]]"
v1_qwen	1053	7	sentence_support	human	False
v1_qwen	1053	8	nugget_mentioned	human	"[[""What are the countries and regions that produce and export avocados?"", ""Mexico""]]"
v1_qwen	1053	8	sentence_support	human	False
v1_qwen	1053	9	sentence_support	human	False
v1_qwen	1053	10	nugget_mentioned	human	"[[""What are the positive effects of the global demand for avocados on the countries and regions that produce and export them?"", ""new jobs""]]"
v1_qwen	1053	10	sentence_support	human	False
v1_qwen	1055	0	sentence_support	human	False
v1_qwen	1065	0	sentence_support	human	False
v1_qwen	1065	1	nugget_mentioned	human	"[[""Which designers does Pop Mart collaborate with?"", ""Kasing Lung""]]"
v1_qwen	1065	1	sentence_support	human	False
v1_qwen	1065	2	sentence_support	gpt-5-mini	False
v1_qwen	1065	3	sentence_support	gpt-5-mini	False
v1_qwen	1065	4	sentence_support	gpt-5-mini	False
v1_qwen	1065	5	sentence_support	human	False
v1_qwen	1065	6	nugget_mentioned	human	"[[""Consumers mainly buy blind boxes for what purpose?"", ""seeking surprise""]]"
v1_qwen	1065	6	sentence_support	human	True
v1_qwen	1065	7	sentence_support	human	False
v1_qwen	1067	0	sentence_support	gpt-5-mini	False
v1_qwen	1067	1	sentence_support	human	False
v1_qwen	1067	2	sentence_support	human	False
v1_qwen	1067	3	sentence_support	gpt-5-mini	False
v1_qwen	1067	4	nugget_mentioned	human	"[[""For whom would robotic animal dolls make a big difference?"", ""those with Alzheimer's or dementia, struggling with isolation""]]"
v1_qwen	1067	4	sentence_support	human	False
v1_qwen	1067	5	sentence_support	human	False
v1_qwen	1067	6	sentence_support	human	False
v1_qwen	1067	7	sentence_support	gpt-5-mini	False
v1_qwen	1067	8	sentence_support	human	False
v1_qwen	1067	9	sentence_support	human	False
v1_qwen	1069	0	sentence_support	gpt-5-mini	False
v1_qwen	1069	1	sentence_support	human	False
v1_qwen	1069	2	sentence_support	human	False
v1_qwen	1069	3	sentence_support	human	False
v1_qwen	1069	4	sentence_support	human	False
v1_qwen	1069	5	sentence_support	human	False
v1_qwen	1069	6	sentence_support	gpt-5-mini	False
v1_qwen	1069	7	sentence_support	gpt-5-mini	False
v1_qwen	1069	8	sentence_support	human	False
v1_qwen	1075	0	sentence_support	human	False
v1_qwen	1075	1	sentence_support	human	False
v1_qwen	1075	2	sentence_support	human	False
v1_qwen	1075	3	nugget_mentioned	human	"[[""What is necessary for voice cloning to work?"", ""recordings of the individual""]]"
v1_qwen	1075	3	sentence_support	human	False
v1_qwen	1075	4	nugget_mentioned	human	"[[""What program needs only 5 seconds of voice to create an acceptable replica?"", ""other""]]"
v1_qwen	1075	4	sentence_support	human	True
v1_qwen	1075	5	sentence_support	human	False
v1_qwen	1075	6	sentence_support	human	True
v1_qwen	1077	0	sentence_support	human	True
v1_qwen	1077	1	sentence_support	human	True
v1_qwen	1077	2	sentence_support	gpt-5-mini	False
v1_qwen	1077	3	sentence_support	gpt-5-mini	False
v1_qwen	1077	4	nugget_mentioned	human	"[[""As of 2024, what are the statistics regarding poverty?"", ""40% of Argentinians live in poverty""]]"
v1_qwen	1077	4	sentence_support	gpt-5-mini	False
v1_qwen	1077	5	sentence_support	human	True
v1_qwen	1079	0	sentence_support	gpt-5-mini	False
v1_qwen	1079	1	sentence_support	human	False
v1_qwen	1079	2	sentence_support	human	False
v1_qwen	1079	3	nugget_mentioned	human	"[[""How far has Dr. Goodall's Roots & Shoots program spread? "", ""other""]]"
v1_qwen	1079	3	sentence_support	human	False
v1_qwen	1079	4	nugget_mentioned	human	"[[""What difference does Dr. Goodall believe every individual is capable of?"", ""other""]]"
v1_qwen	1079	4	sentence_support	human	False
v1_qwen	1079	5	sentence_support	human	False
v1_qwen	1081	0	sentence_support	human	False
v1_qwen	1081	1	sentence_support	gpt-5-mini	False
v1_qwen	1081	2	nugget_mentioned	human	"[[""What are important areas in quantum research?"", ""other""], [""What countries and blocs are leading in developing quantum computing?"", ""EU""], [""What countries and blocs are leading in developing quantum computing?"", ""US""], [""What countries and blocs are leading in developing quantum computing?"", ""China""], [""What companies are leading in developing quantum computing?"", ""other""], [""What companies are leading in developing quantum computing?"", ""IBM""], [""What companies are leading in developing quantum computing?"", ""Google""], [""What companies are leading in developing quantum computing?"", ""Microsoft""]]"
v1_qwen	1081	2	sentence_support	human	False
v1_qwen	1083	0	sentence_support	human	False
v1_qwen	1083	1	sentence_support	human	False
v1_qwen	1083	2	nugget_mentioned	human	"[[""What are the causes of the wooly mammoth extinction?"", ""climate change""], [""What environmental factors contributed to the wooly mammoth extinction?"", ""climate change""]]"
v1_qwen	1083	2	sentence_support	human	False
v1_qwen	1083	3	nugget_mentioned	human	"[[""What are the causes of the wooly mammoth extinction?"", ""climate change""], [""What environmental factors contributed to the wooly mammoth extinction?"", ""climate change""], [""What aspects of climate change contributed to the wooly mammoth extinction?"", ""rising temperatures""]]"
v1_qwen	1083	3	sentence_support	human	False
v1_qwen	1083	4	nugget_mentioned	human	"[[""What are the causes of the wooly mammoth extinction?"", ""climate change""], [""What environmental factors contributed to the wooly mammoth extinction?"", ""climate change""], [""What aspects of climate change contributed to the wooly mammoth extinction?"", ""rising temperatures""], [""How did climate change affect mammoth' habitat?"", ""shrank grassland""], [""How did climate change affect mammoth' habitat?"", ""restricted habitat""], [""How did climate change affect mammoth' habitat?"", ""food sources disappearing""]]"
v1_qwen	1083	4	sentence_support	human	False
v1_qwen	1083	5	nugget_mentioned	human	"[[""What are the causes of the wooly mammoth extinction?"", ""changing vegetation""], [""How did climate change affect mammoth' habitat?"", ""shrank grassland""], [""How did climate change affect mammoth' habitat?"", ""restricted habitat""], [""How did climate change affect mammoth' habitat?"", ""pastures becoming swampy""], [""How did climate change affect mammoth' habitat?"", ""food sources disappearing""]]"
v1_qwen	1083	5	sentence_support	human	False
v1_qwen	1083	6	nugget_mentioned	human	"[[""How did climate change affect mammoth' habitat?"", ""shrank grassland""]]"
v1_qwen	1083	6	sentence_support	human	False
v1_qwen	1085	0	sentence_support	human	False
v1_qwen	1085	1	sentence_support	human	False
v1_qwen	1085	2	sentence_support	human	False
v1_qwen	1085	3	sentence_support	human	False
v1_qwen	1085	4	sentence_support	human	False
v1_qwen	1085	5	sentence_support	human	False
v1_qwen	1087	0	sentence_support	human	False
v1_qwen	1087	1	nugget_mentioned	human	"[[""What do Putin and Modi officially characterize Russia/ India relationship as?"", ""special strategic partnership""]]"
v1_qwen	1087	1	sentence_support	human	False
v1_qwen	1087	2	nugget_mentioned	human	"[[""Why is maintaining a relationship with Russia important for India?"", ""leverage against China""]]"
v1_qwen	1087	2	sentence_support	human	False
v1_qwen	1087	3	sentence_support	human	False
v1_qwen	1087	4	nugget_mentioned	human	"[[""In what fields are India and Russia cooperating?"", ""security & military""], [""What do Putin and Modi officially characterize Russia/ India relationship as?"", ""special strategic partnership""]]"
v1_qwen	1087	4	sentence_support	human	False
v1_qwen	1087	5	nugget_mentioned	human	"[[""What do Putin and Modi officially characterize Russia/ India relationship as?"", ""special strategic partnership""]]"
v1_qwen	1087	5	sentence_support	human	False
v1_qwen	1087	6	sentence_support	human	False
