{"id":"https:\/\/openalex.org\/W4416188354","doi":"https:\/\/doi.org\/10.48550\/arxiv.2511.07473","title":"RELEAP: Reinforcement-Enhanced Label-Efficient Active Phenotyping for Electronic Health Records","display_name":"RELEAP: Reinforcement-Enhanced Label-Efficient Active Phenotyping for Electronic Health Records","publication_year":2025,"publication_date":"2025-11-08","ids":{"openalex":"https:\/\/openalex.org\/W4416188354","doi":"https:\/\/doi.org\/10.48550\/arxiv.2511.07473"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2511.07473","is_oa":true,"landing_page_url":"http:\/\/arxiv.org\/abs\/2511.07473","pdf_url":"https:\/\/arxiv.org\/pdf\/2511.07473","source":{"id":"https:\/\/openalex.org\/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https:\/\/arxiv.org\/pdf\/2511.07473","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https:\/\/openalex.org\/A5100397647","display_name":"Yang Yang","orcid":"https:\/\/orcid.org\/0000-0002-6417-3483"},"institutions":[{"id":"https:\/\/openalex.org\/I170897317","display_name":"Duke University","ror":"https:\/\/ror.org\/00py81415","country_code":"US","type":"education","lineage":["https:\/\/openalex.org\/I170897317"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yang, Yang","raw_affiliation_strings":["Department of Biostatistics and Bioinformatics, Duke University, Durham, USA"],"affiliations":[{"raw_affiliation_string":"Department of Biostatistics and Bioinformatics, Duke University, Durham, USA","institution_ids":["https:\/\/openalex.org\/I170897317"]}]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5084752371","display_name":"Kathryn I. Pollak","orcid":"https:\/\/orcid.org\/0000-0002-5559-2416"},"institutions":[{"id":"https:\/\/openalex.org\/I4390039326","display_name":"Duke Cancer Institute","ror":"https:\/\/ror.org\/04vt65461","country_code":null,"type":"healthcare","lineage":["https:\/\/openalex.org\/I4210126298","https:\/\/openalex.org\/I4210144876","https:\/\/openalex.org\/I4390039326"]},{"id":"https:\/\/openalex.org\/I170897317","display_name":"Duke University","ror":"https:\/\/ror.org\/00py81415","country_code":"US","type":"education","lineage":["https:\/\/openalex.org\/I170897317"]},{"id":"https:\/\/openalex.org\/I4210124077","display_name":"Duke Institute for Health Innovation","ror":"https:\/\/ror.org\/031n1rn61","country_code":"US","type":"other","lineage":["https:\/\/openalex.org\/I4210124077"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pollak, Kathryn I.","raw_affiliation_strings":["Duke Cancer Institute, Durham, USA","Department of Population Health Sciences, Duke University School of Medicine, Durham, USA"],"affiliations":[{"raw_affiliation_string":"Duke Cancer Institute, Durham, USA","institution_ids":["https:\/\/openalex.org\/I4210124077","https:\/\/openalex.org\/I4390039326"]},{"raw_affiliation_string":"Department of Population Health Sciences, Duke University School of Medicine, Durham, USA","institution_ids":["https:\/\/openalex.org\/I170897317"]}]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5036008511","display_name":"Bibhas Chakraborty","orcid":"https:\/\/orcid.org\/0000-0002-7366-0478"},"institutions":[{"id":"https:\/\/openalex.org\/I170897317","display_name":"Duke University","ror":"https:\/\/ror.org\/00py81415","country_code":"US","type":"education","lineage":["https:\/\/openalex.org\/I170897317"]},{"id":"https:\/\/openalex.org\/I165932596","display_name":"National University of Singapore","ror":"https:\/\/ror.org\/01tgyzw49","country_code":"SG","type":"education","lineage":["https:\/\/openalex.org\/I165932596"]},{"id":"https:\/\/openalex.org\/I4210126319","display_name":"Duke-NUS Medical School","ror":"https:\/\/ror.org\/02j1m6098","country_code":"SG","type":"education","lineage":["https:\/\/openalex.org\/I165932596","https:\/\/openalex.org\/I170897317","https:\/\/openalex.org\/I4210126319"]}],"countries":["SG","US"],"is_corresponding":false,"raw_author_name":"Chakraborty, Bibhas","raw_affiliation_strings":["Department of Biostatistics and Bioinformatics, Duke University, Durham, USA","Centre for Quantitative Medicine, Duke-NUS Medical School, Singapore","Programme in Health Services and Systems Research, Duke-NUS Medical School, Singapore","Department of Statistics and Data Science, National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Department of Biostatistics and Bioinformatics, Duke University, Durham, USA","institution_ids":["https:\/\/openalex.org\/I170897317"]},{"raw_affiliation_string":"Centre for Quantitative Medicine, Duke-NUS Medical School, Singapore","institution_ids":["https:\/\/openalex.org\/I4210126319"]},{"raw_affiliation_string":"Programme in Health Services and Systems Research, Duke-NUS Medical School, Singapore","institution_ids":["https:\/\/openalex.org\/I4210126319"]},{"raw_affiliation_string":"Department of Statistics and Data Science, National University of Singapore, Singapore","institution_ids":["https:\/\/openalex.org\/I165932596"]}]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5000308638","display_name":"Molei Liu","orcid":"https:\/\/orcid.org\/0000-0003-1890-4449"},"institutions":[{"id":"https:\/\/openalex.org\/I4210133846","display_name":"Peking University International Hospital","ror":"https:\/\/ror.org\/03jxhcr96","country_code":"CN","type":"healthcare","lineage":["https:\/\/openalex.org\/I4210133846"]},{"id":"https:\/\/openalex.org\/I20231570","display_name":"Peking University","ror":"https:\/\/ror.org\/02v51f717","country_code":"CN","type":"education","lineage":["https:\/\/openalex.org\/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liu, Molei","raw_affiliation_strings":["Department of Biostatistics, Peking University Health Science Center, Beijing, China","Beijing International Center for Mathematical Research, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Biostatistics, Peking University Health Science Center, Beijing, China","institution_ids":["https:\/\/openalex.org\/I20231570"]},{"raw_affiliation_string":"Beijing International Center for Mathematical Research, Peking University, Beijing, China","institution_ids":["https:\/\/openalex.org\/I20231570","https:\/\/openalex.org\/I4210133846"]}]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5004052573","display_name":"Doudou Zhou","orcid":"https:\/\/orcid.org\/0000-0002-0830-2287"},"institutions":[{"id":"https:\/\/openalex.org\/I165932596","display_name":"National University of Singapore","ror":"https:\/\/ror.org\/01tgyzw49","country_code":"SG","type":"education","lineage":["https:\/\/openalex.org\/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Zhou, Doudou","raw_affiliation_strings":["Department of Statistics and Data Science, National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Department of Statistics and Data Science, National University of Singapore, Singapore","institution_ids":["https:\/\/openalex.org\/I165932596"]}]},{"author_position":"last","author":{"id":"https:\/\/openalex.org\/A5052512997","display_name":"Chuan Hong","orcid":"https:\/\/orcid.org\/0000-0001-7056-9559"},"institutions":[{"id":"https:\/\/openalex.org\/I170897317","display_name":"Duke University","ror":"https:\/\/ror.org\/00py81415","country_code":"US","type":"education","lineage":["https:\/\/openalex.org\/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hong, Chuan","raw_affiliation_strings":["Department of Biostatistics and Bioinformatics, Duke University, Durham, USA"],"affiliations":[{"raw_affiliation_string":"Department of Biostatistics and Bioinformatics, Duke University, Durham, USA","institution_ids":["https:\/\/openalex.org\/I170897317"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https:\/\/openalex.org\/A5100397647"],"corresponding_institution_ids":["https:\/\/openalex.org\/I170897317"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https:\/\/openalex.org\/T13702","display_name":"Machine Learning in Healthcare","score":0.5486999750137329,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1702","display_name":"Artificial Intelligence"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},"topics":[{"id":"https:\/\/openalex.org\/T13702","display_name":"Machine Learning in Healthcare","score":0.5486999750137329,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1702","display_name":"Artificial Intelligence"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},{"id":"https:\/\/openalex.org\/T12072","display_name":"Machine Learning and Algorithms","score":0.07320000231266022,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1702","display_name":"Artificial Intelligence"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},{"id":"https:\/\/openalex.org\/T10350","display_name":"Electronic Health Records Systems","score":0.04879999905824661,"subfield":{"id":"https:\/\/openalex.org\/subfields\/3605","display_name":"Health Information Management"},"field":{"id":"https:\/\/openalex.org\/fields\/36","display_name":"Health Professions"},"domain":{"id":"https:\/\/openalex.org\/domains\/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https:\/\/openalex.org\/keywords\/heuristics","display_name":"Heuristics","score":0.6579999923706055},{"id":"https:\/\/openalex.org\/keywords\/downstream","display_name":"Downstream (manufacturing)","score":0.6291999816894531},{"id":"https:\/\/openalex.org\/keywords\/annotation","display_name":"Annotation","score":0.5246000289916992},{"id":"https:\/\/openalex.org\/keywords\/reliability","display_name":"Reliability (semiconductor)","score":0.4952000081539154},{"id":"https:\/\/openalex.org\/keywords\/proxy","display_name":"Proxy (statistics)","score":0.4772999882698059},{"id":"https:\/\/openalex.org\/keywords\/heuristic","display_name":"Heuristic","score":0.4593000113964081},{"id":"https:\/\/openalex.org\/keywords\/chart","display_name":"Chart","score":0.4553999900817871}],"concepts":[{"id":"https:\/\/openalex.org\/C127705205","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q5748245","display_name":"Heuristics","level":2,"score":0.6579999923706055},{"id":"https:\/\/openalex.org\/C41008148","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q21198","display_name":"Computer science","level":0,"score":0.6556000113487244},{"id":"https:\/\/openalex.org\/C2776207758","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q5303302","display_name":"Downstream (manufacturing)","level":2,"score":0.6291999816894531},{"id":"https:\/\/openalex.org\/C119857082","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q2539","display_name":"Machine learning","level":1,"score":0.5471000075340271},{"id":"https:\/\/openalex.org\/C2776321320","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q857525","display_name":"Annotation","level":2,"score":0.5246000289916992},{"id":"https:\/\/openalex.org\/C43214815","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.4952000081539154},{"id":"https:\/\/openalex.org\/C154945302","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48069998621940613},{"id":"https:\/\/openalex.org\/C2780148112","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1432581","display_name":"Proxy (statistics)","level":2,"score":0.4772999882698059},{"id":"https:\/\/openalex.org\/C173801870","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q201413","display_name":"Heuristic","level":2,"score":0.4593000113964081},{"id":"https:\/\/openalex.org\/C190812933","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q28923","display_name":"Chart","level":2,"score":0.4553999900817871},{"id":"https:\/\/openalex.org\/C151956035","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1132755","display_name":"Logistic regression","level":2,"score":0.4426000118255615},{"id":"https:\/\/openalex.org\/C77967617","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.4146000146865845},{"id":"https:\/\/openalex.org\/C124101348","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q172491","display_name":"Data mining","level":1,"score":0.3675999939441681},{"id":"https:\/\/openalex.org\/C81917197","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.35100001096725464},{"id":"https:\/\/openalex.org\/C95623464","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.29350000619888306},{"id":"https:\/\/openalex.org\/C3020144179","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q10871684","display_name":"Electronic health record","level":3,"score":0.2822999954223633},{"id":"https:\/\/openalex.org\/C136389625","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q334384","display_name":"Supervised learning","level":3,"score":0.28029999136924744},{"id":"https:\/\/openalex.org\/C83546350","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1139051","display_name":"Regression","level":2,"score":0.26080000400543213}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2511.07473","is_oa":true,"landing_page_url":"http:\/\/arxiv.org\/abs\/2511.07473","pdf_url":"https:\/\/arxiv.org\/pdf\/2511.07473","source":{"id":"https:\/\/openalex.org\/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550\/arxiv.2511.07473","is_oa":true,"landing_page_url":"https:\/\/doi.org\/10.48550\/arxiv.2511.07473","pdf_url":null,"source":{"id":"https:\/\/openalex.org\/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https:\/\/openalex.org\/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https:\/\/openalex.org\/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2511.07473","is_oa":true,"landing_page_url":"http:\/\/arxiv.org\/abs\/2511.07473","pdf_url":"https:\/\/arxiv.org\/pdf\/2511.07473","source":{"id":"https:\/\/openalex.org\/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Objective:":[0],"Electronic":[1],"health":[2],"record":[3],"(EHR)":[4],"phenotyping":[5],"often":[6],"relies":[7],"on":[8,29,98,106],"noisy":[9],"proxy":[10],"labels,":[11],"which":[12,190],"undermine":[13],"the":[14,176,228],"reliability":[15,229],"of":[16,230],"downstream":[17,52,101,161,194,214],"risk":[18,120,232],"prediction.":[19,233],"Active":[20,75],"learning":[21,82,206],"can":[22],"reduce":[23],"annotation":[24],"costs,":[25],"but":[26],"most":[27,192],"rely":[28],"fixed":[30,204],"heuristics":[31],"and":[32,61,69,125,136,153,168,196,226],"do":[33],"not":[34],"ensure":[35],"that":[36,49,221],"phenotype":[37,59,183,211],"refinement":[38,184],"improves":[39],"prediction":[40,53,186],"performance.":[41],"Our":[42],"goal":[43],"was":[44,131],"to":[45,57,151,158,185,203],"develop":[46],"a":[47,78,107,199,217],"framework":[48],"directly":[50],"uses":[51],"performance":[54,162],"as":[55,163],"feedback":[56,99],"guide":[58],"correction":[60,212],"sample":[62],"selection":[63],"under":[64,175],"constrained":[65],"labeling":[66,178],"budgets.":[67],"Materials":[68],"Methods:":[70],"We":[71,103],"propose":[72],"Reinforcement-Enhanced":[73],"Label-Efficient":[74],"Phenotyping":[76],"(RELEAP),":[77],"reinforcement":[79],"learning-based":[80],"active":[81,138,205],"framework.":[83],"RELEAP":[84,105,141,165,188,209],"adaptively":[85],"integrates":[86],"multiple":[87],"querying":[88],"strategies":[89],"and,":[90],"unlike":[91],"prior":[92],"methods,":[93],"updates":[94],"its":[95],"policy":[96],"based":[97],"from":[100,149,156],"models.":[102,129],"evaluated":[104],"de-identified":[108],"Duke":[109],"University":[110],"Health":[111],"System":[112],"(DUHS)":[113],"cohort":[114],"(2014-2024)":[115],"for":[116],"incident":[117],"lung":[118],"cancer":[119],"prediction,":[121],"using":[122],"logistic":[123],"regression":[124],"penalized":[126],"Cox":[127],"survival":[128,154],"Performance":[130],"benchmarked":[132],"against":[133],"noisy-label":[134],"baselines":[135],"single-strategy":[137],"learning.":[139],"Results:":[140],"consistently":[142],"outperformed":[143],"all":[144],"baselines.":[145],"Logistic":[146],"AUC":[147],"increased":[148],"0.774":[150],"0.805":[152],"C-index":[155],"0.718":[157],"0.752.":[159],"Using":[160],"feedback,":[164,215],"produced":[166],"smoother":[167],"more":[169,200],"stable":[170],"gains":[171],"than":[172],"heuristic":[173],"methods":[174],"same":[177],"budget.":[179],"Discussion:":[180],"By":[181],"linking":[182],"outcomes,":[187],"learns":[189],"samples":[191],"improve":[193],"discrimination":[195],"calibration,":[197],"offering":[198,216],"principled":[201],"alternative":[202],"rules.":[207],"Conclusion:":[208],"optimizes":[210],"through":[213],"scalable,":[218],"label-efficient":[219],"paradigm":[220],"reduces":[222],"manual":[223],"chart":[224],"review":[225],"enhances":[227],"EHR-based":[231]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-13T00:00:00"}