{"id":"https:\/\/openalex.org\/W4416081507","doi":"https:\/\/doi.org\/10.48550\/arxiv.2506.21763","title":"THE-Tree: Can Tracing Historical Evolution Enhance Scientific Verification and Reasoning?","display_name":"THE-Tree: Can Tracing Historical Evolution Enhance Scientific Verification and Reasoning?","publication_year":2025,"publication_date":"2025-06-26","ids":{"openalex":"https:\/\/openalex.org\/W4416081507","doi":"https:\/\/doi.org\/10.48550\/arxiv.2506.21763"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2506.21763","is_oa":true,"landing_page_url":"http:\/\/arxiv.org\/abs\/2506.21763","pdf_url":"https:\/\/arxiv.org\/pdf\/2506.21763","source":{"id":"https:\/\/openalex.org\/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https:\/\/arxiv.org\/pdf\/2506.21763","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https:\/\/openalex.org\/A5100327843","display_name":"Xin Wang","orcid":"https:\/\/orcid.org\/0000-0001-8512-9003"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Liu, Jiyao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Jiyao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Xiao, Yulong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Yulong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Ning, Junzhi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ning, Junzhi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5085801450","display_name":"Lihao Liu","orcid":"https:\/\/orcid.org\/0000-0002-7091-7119"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Lihao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5056327997","display_name":"Junjun He","orcid":"https:\/\/orcid.org\/0000-0002-1813-1784"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Junjun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5058342038","display_name":"Botian Shi","orcid":"https:\/\/orcid.org\/0000-0003-3677-7252"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Botian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https:\/\/openalex.org\/A5101195156","display_name":"Kaicheng Yu","orcid":"https:\/\/orcid.org\/0009-0006-5695-1317"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Kaicheng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https:\/\/openalex.org\/A5100327843"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https:\/\/openalex.org\/T11948","display_name":"Machine Learning in Materials Science","score":0.35339999198913574,"subfield":{"id":"https:\/\/openalex.org\/subfields\/2505","display_name":"Materials Chemistry"},"field":{"id":"https:\/\/openalex.org\/fields\/25","display_name":"Materials Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},"topics":[{"id":"https:\/\/openalex.org\/T11948","display_name":"Machine Learning in Materials Science","score":0.35339999198913574,"subfield":{"id":"https:\/\/openalex.org\/subfields\/2505","display_name":"Materials Chemistry"},"field":{"id":"https:\/\/openalex.org\/fields\/25","display_name":"Materials Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},{"id":"https:\/\/openalex.org\/T13910","display_name":"Computational and Text Analysis Methods","score":0.09749999642372131,"subfield":{"id":"https:\/\/openalex.org\/subfields\/3300","display_name":"General Social Sciences"},"field":{"id":"https:\/\/openalex.org\/fields\/33","display_name":"Social Sciences"},"domain":{"id":"https:\/\/openalex.org\/domains\/2","display_name":"Social Sciences"}},{"id":"https:\/\/openalex.org\/T11273","display_name":"Advanced Graph Neural Networks","score":0.08789999783039093,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1702","display_name":"Artificial Intelligence"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https:\/\/openalex.org\/keywords\/inference","display_name":"Inference","score":0.48890000581741333},{"id":"https:\/\/openalex.org\/keywords\/haystack","display_name":"Haystack","score":0.4171000123023987},{"id":"https:\/\/openalex.org\/keywords\/novelty","display_name":"Novelty","score":0.40860000252723694},{"id":"https:\/\/openalex.org\/keywords\/tracing","display_name":"Tracing","score":0.4032999873161316},{"id":"https:\/\/openalex.org\/keywords\/benchmark","display_name":"Benchmark (surveying)","score":0.38499999046325684},{"id":"https:\/\/openalex.org\/keywords\/domain","display_name":"Domain (mathematical analysis)","score":0.3752000033855438},{"id":"https:\/\/openalex.org\/keywords\/construct","display_name":"Construct (python library)","score":0.3441999852657318},{"id":"https:\/\/openalex.org\/keywords\/graph","display_name":"Graph","score":0.32429999113082886},{"id":"https:\/\/openalex.org\/keywords\/natural-language","display_name":"Natural language","score":0.31290000677108765}],"concepts":[{"id":"https:\/\/openalex.org\/C41008148","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q21198","display_name":"Computer science","level":0,"score":0.7324000000953674},{"id":"https:\/\/openalex.org\/C2776214188","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q408386","display_name":"Inference","level":2,"score":0.48890000581741333},{"id":"https:\/\/openalex.org\/C2522767166","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q2374463","display_name":"Data science","level":1,"score":0.4602000117301941},{"id":"https:\/\/openalex.org\/C13424479","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q5687237","display_name":"Haystack","level":2,"score":0.4171000123023987},{"id":"https:\/\/openalex.org\/C2778738651","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q16546687","display_name":"Novelty","level":2,"score":0.40860000252723694},{"id":"https:\/\/openalex.org\/C138673069","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q322229","display_name":"Tracing","level":2,"score":0.4032999873161316},{"id":"https:\/\/openalex.org\/C185798385","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.38499999046325684},{"id":"https:\/\/openalex.org\/C36503486","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.3752000033855438},{"id":"https:\/\/openalex.org\/C154945302","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q11660","display_name":"Artificial intelligence","level":1,"score":0.364300012588501},{"id":"https:\/\/openalex.org\/C2780801425","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q5164392","display_name":"Construct (python library)","level":2,"score":0.3441999852657318},{"id":"https:\/\/openalex.org\/C132525143","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q141488","display_name":"Graph","level":2,"score":0.32429999113082886},{"id":"https:\/\/openalex.org\/C195324797","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q33742","display_name":"Natural language","level":2,"score":0.31290000677108765},{"id":"https:\/\/openalex.org\/C176147130","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q909622","display_name":"Evolvability","level":2,"score":0.3125},{"id":"https:\/\/openalex.org\/C206588197","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q846574","display_name":"Reuse","level":2,"score":0.31139999628067017},{"id":"https:\/\/openalex.org\/C197947376","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q5155608","display_name":"Comparability","level":2,"score":0.3028999865055084},{"id":"https:\/\/openalex.org\/C138379479","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1116876","display_name":"Scientific modelling","level":2,"score":0.2980000078678131},{"id":"https:\/\/openalex.org\/C2778583558","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q771245","display_name":"Code reuse","level":3,"score":0.2973000109195709},{"id":"https:\/\/openalex.org\/C80444323","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2897000014781952},{"id":"https:\/\/openalex.org\/C119857082","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q2539","display_name":"Machine learning","level":1,"score":0.2897000014781952},{"id":"https:\/\/openalex.org\/C2778805511","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1713","display_name":"Citation","level":2,"score":0.28949999809265137},{"id":"https:\/\/openalex.org\/C4554734","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q593744","display_name":"Knowledge base","level":2,"score":0.2802000045776367},{"id":"https:\/\/openalex.org\/C137293760","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q3621696","display_name":"Language model","level":2,"score":0.2800000011920929},{"id":"https:\/\/openalex.org\/C2780522230","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1140419","display_name":"Ambiguity","level":2,"score":0.2671999931335449},{"id":"https:\/\/openalex.org\/C176217482","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q860554","display_name":"Metric (unit)","level":2,"score":0.26409998536109924},{"id":"https:\/\/openalex.org\/C2781181686","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.2619999945163727},{"id":"https:\/\/openalex.org\/C189430467","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.26019999384880066},{"id":"https:\/\/openalex.org\/C159149176","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.2599000036716461},{"id":"https:\/\/openalex.org\/C166088908","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q308495","display_name":"Abductive reasoning","level":2,"score":0.25519999861717224},{"id":"https:\/\/openalex.org\/C2164484","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.2529999911785126},{"id":"https:\/\/openalex.org\/C183115368","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q856577","display_name":"Weighting","level":2,"score":0.25189998745918274},{"id":"https:\/\/openalex.org\/C2776760102","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q5139990","display_name":"Code (set theory)","level":3,"score":0.25029999017715454}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2506.21763","is_oa":true,"landing_page_url":"http:\/\/arxiv.org\/abs\/2506.21763","pdf_url":"https:\/\/arxiv.org\/pdf\/2506.21763","source":{"id":"https:\/\/openalex.org\/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550\/arxiv.2506.21763","is_oa":true,"landing_page_url":"https:\/\/doi.org\/10.48550\/arxiv.2506.21763","pdf_url":null,"source":{"id":"https:\/\/openalex.org\/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https:\/\/openalex.org\/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https:\/\/openalex.org\/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2506.21763","is_oa":true,"landing_page_url":"http:\/\/arxiv.org\/abs\/2506.21763","pdf_url":"https:\/\/arxiv.org\/pdf\/2506.21763","source":{"id":"https:\/\/openalex.org\/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"are":[4,34,67],"accelerating":[5],"scientific":[6,83,103,216,239],"idea":[7],"generation,":[8],"but":[9],"rigorously":[10],"evaluating":[11,237],"these":[12],"numerous,":[13],"often":[14],"superficial,":[15],"AI-generated":[16],"propositions":[17],"for":[18,140,213],"novelty":[19],"and":[20,42,64,78,128,143,165,172,225],"factual":[21],"accuracy":[22],"is":[23,29,137,162],"a":[24,70,93,106,119,147,174],"critical":[25],"bottleneck;":[26],"manual":[27],"verification":[28],"too":[30],"slow.Existing":[31],"validation":[32],"methods":[33],"inadequate:":[35],"LLMs":[36],"as":[37],"standalone":[38],"verifiers":[39],"may":[40],"hallucinate":[41],"lack":[43,61],"domain":[44],"knowledge":[45],"(our":[46],"findings":[47],"show":[48],"~60\\%":[49],"unawareness":[50],"of":[51,75,82,236],"relevant":[52],"papers":[53,185,240],"in":[54,193],"specific":[55],"domains),":[56],"while":[57],"traditional":[58,209],"citation":[59,210],"networks":[60],"explicit":[62],"causality":[63],"narrative":[65],"surveys":[66],"unstructured.This":[68],"underscores":[69],"core":[71],"challenge:":[72],"the":[73,155,234],"absence":[74],"structured,":[76],"verifiable,":[77],"causally-linked":[79],"historical":[80],"data":[81],"evolution.To":[84],"address":[85],"this,we":[86],"introduce":[87],"\\textbf{THE-Tree}":[88],"(\\textbf{T}echnology":[89],"\\textbf{H}istory":[90],"\\textbf{E}volution":[91],"Tree),":[92],"computational":[94],"framework":[95],"that":[96,153,159,191],"constructs":[97],"such":[98],"domain-specific":[99],"evolution":[100],"trees":[101],"from":[102],"literature.THE-Tree":[104],"employs":[105],"search":[107],"algorithm":[108],"to":[109,179,186,202,208],"explore":[110],"evolutionary":[111,135],"paths.":[112],"During":[113],"its":[114],"node":[115],"expansion,":[116],"it":[117,218,232],"utilizes":[118],"novel":[120],"\"Think-Verbalize-Cite-Verify\"":[121],"process:":[122],"an":[123],"LLM":[124],"proposes":[125],"potential":[126],"advancements":[127],"cites":[129],"supporting":[130],"literature.":[131],"Critically,":[132],"each":[133,160],"proposed":[134],"link":[136],"then":[138],"validated":[139],"logical":[141],"coherence":[142],"evidential":[144],"support":[145],"by":[146,200,222,241],"recovered":[148],"natural":[149],"language":[150],"inference":[151],"mechanism":[152],"interrogates":[154],"cited":[156],"literature,":[157],"ensuring":[158],"step":[161],"grounded.We":[163],"construct":[164],"validate":[166],"88":[167],"THE-Trees":[168],"across":[169,204],"diverse":[170],"domains":[171],"release":[173],"benchmark":[175],"dataset":[176],"including":[177],"up":[178],"71k":[180],"fact":[181],"verifications":[182],"covering":[183],"27k":[184],"foster":[187],"further":[188],"research.Experiments":[189],"demonstrate":[190],"i)":[192],"graph":[194],"completion,":[195],"our":[196],"THE-Tree":[197],"improves":[198,219],"hit@1":[199,220],"8\\%":[201],"14\\%":[203],"multiple":[205],"models":[206],"compared":[207],"networks;":[211],"ii)":[212],"predicting":[214],"future":[215],"developments,":[217],"metric":[221],"nearly":[223],"10\\%;":[224],"iii)":[226],"when":[227],"combined":[228],"with":[229],"other":[230],"methods,":[231],"boosts":[233],"performance":[235],"important":[238],"almost":[242],"100\\%.":[243]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}