{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T11:07:15Z","timestamp":1775214435186,"version":"3.50.1"},"reference-count":47,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2020,10,1]],"date-time":"2020-10-01T00:00:00Z","timestamp":1601510400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2020,10,1]],"date-time":"2020-10-01T00:00:00Z","timestamp":1601510400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2021,10,1]],"date-time":"2021-10-01T00:00:00Z","timestamp":1633046400000},"content-version":"vor","delay-in-days":365,"URL":"http:\/\/www.elsevier.com\/open-access\/userlicense\/1.0\/"}],"funder":[{"DOI":"10.13039\/501100004826","name":"Natural Science Foundation of Beijing Municipality","doi-asserted-by":"publisher","award":["Z190024"],"award-info":[{"award-number":["Z190024"]}],"id":[{"id":"10.13039\/501100004826","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012166","name":"National Key Research and Development Program of China","doi-asserted-by":"publisher","award":["2018YFC0910404"],"award-info":[{"award-number":["2018YFC0910404"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["11801301"],"award-info":[{"award-number":["11801301"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004147","name":"Tsinghua University","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100004147","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Journal of Biomedical Informatics"],"published-print":{"date-parts":[[2020,10]]},"DOI":"10.1016\/j.jbi.2020.103542","type":"journal-article","created":{"date-parts":[[2020,8,24]],"date-time":"2020-08-24T11:43:30Z","timestamp":1598269410000},"page":"103542","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":22,"special_numbering":"C","title":["Unsupervised multi-granular Chinese word segmentation and term discovery via graph partition"],"prefix":"10.1016","volume":"110","author":[{"given":"Zheng","family":"Yuan","sequence":"first","affiliation":[]},{"given":"Yuanhao","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Qiuyang","family":"Yin","sequence":"additional","affiliation":[]},{"given":"Boyao","family":"Li","sequence":"additional","affiliation":[]},{"given":"Xiaobin","family":"Feng","sequence":"additional","affiliation":[]},{"given":"Guoming","family":"Zhang","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6347-0507","authenticated-orcid":false,"given":"Sheng","family":"Yu","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.jbi.2020.103542_b0005","doi-asserted-by":"crossref","first-page":"993","DOI":"10.1093\/jamia\/ocv034","article-title":"Toward high-throughput phenotyping: Unbiased automated feature extraction and selection from knowledge sources","volume":"22","author":"Yu","year":"2015","journal-title":"J. Am. Med. Informatics Assoc."},{"key":"10.1016\/j.jbi.2020.103542_b0010","doi-asserted-by":"crossref","first-page":"e143","DOI":"10.1093\/jamia\/ocw135","article-title":"Surrogate-assisted feature extraction for high-throughput phenotyping","volume":"24","author":"Yu","year":"2017","journal-title":"J. Am. Med. Informatics Assoc."},{"key":"10.1016\/j.jbi.2020.103542_b0015","doi-asserted-by":"crossref","first-page":"54","DOI":"10.1093\/jamia\/ocx111","article-title":"Enabling phenotypic big data with PheNorm","volume":"25","author":"Yu","year":"2018","journal-title":"J. Am. Med. Informatics Assoc."},{"key":"10.1016\/j.jbi.2020.103542_b0020","doi-asserted-by":"crossref","first-page":"417","DOI":"10.1038\/nrg2999","article-title":"Using electronic health records to drive discovery in disease genomics","volume":"12","author":"Kohane","year":"2011","journal-title":"Nat. Rev. Genet."},{"key":"10.1016\/j.jbi.2020.103542_b0025","doi-asserted-by":"crossref","first-page":"1255","DOI":"10.1093\/jamia\/ocz066","article-title":"High-throughput multimodal automated phenotyping (MAP) with application to PheWAS","volume":"26","author":"Liao","year":"2019","journal-title":"J. Am. Med. Informatics Assoc."},{"key":"10.1016\/j.jbi.2020.103542_b0030","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1038\/srep26094","article-title":"Deep patient: an unsupervised representation to predict the future of patients from the electronic health records","volume":"6","author":"Miotto","year":"2016","journal-title":"Sci. Rep."},{"key":"10.1016\/j.jbi.2020.103542_b0035","doi-asserted-by":"crossref","first-page":"433","DOI":"10.1038\/s41591-018-0335-9","article-title":"Evaluation and accurate diagnoses of pediatric diseases using artificial intelligence","volume":"25","author":"Liang","year":"2019","journal-title":"Nat. Med."},{"key":"10.1016\/j.jbi.2020.103542_b0040","doi-asserted-by":"crossref","first-page":"229","DOI":"10.1136\/jamia.2009.002733","article-title":"An overview of MetaMap: Historical perspective and recent advances","volume":"17","author":"Aronson","year":"2010","journal-title":"J. Am. Med. Informatics Assoc."},{"key":"10.1016\/j.jbi.2020.103542_b0045","doi-asserted-by":"crossref","first-page":"507","DOI":"10.1136\/jamia.2009.001560","article-title":"Mayo clinical Text Analysis and Knowledge Extraction System (cTAKES): architecture, component evaluation and applications","volume":"17","author":"Savova","year":"2010","journal-title":"J. Am. Med. Informatics Assoc."},{"key":"10.1016\/j.jbi.2020.103542_b0050","doi-asserted-by":"crossref","first-page":"331","DOI":"10.1093\/jamia\/ocx132","article-title":"CLAMP - a toolkit for efficiently building customized clinical natural language processing pipelines","volume":"25","author":"Soysal","year":"2018","journal-title":"J. Am. Med. Informatics Assoc."},{"key":"10.1016\/j.jbi.2020.103542_b0055","doi-asserted-by":"crossref","first-page":"267D","DOI":"10.1093\/nar\/gkh061","article-title":"The unified medical language system (UMLS): integrating biomedical terminology","volume":"32","author":"Bodenreider","year":"2004","journal-title":"Nucleic Acids Res."},{"key":"10.1016\/j.jbi.2020.103542_b0060","first-page":"1","article-title":"IsoQuest Inc.: description of the netowl (TM) extractor system as used for MUC-7","author":"Krupka","year":"1998","journal-title":"Proc. Seventh Messag. Underst. Conf."},{"key":"10.1016\/j.jbi.2020.103542_b0065","first-page":"1977","article-title":"Definition, dictionaries and tagger for extended named entity hierarchy","author":"Sekine","year":"2004","journal-title":"Proc. 4th Int Conf. Lang. Resour. Eval. Lr."},{"key":"10.1016\/j.jbi.2020.103542_b0070","doi-asserted-by":"crossref","first-page":"808","DOI":"10.1136\/amiajnl-2013-002381","article-title":"A comprehensive study of named entity recognition in Chinese clinical text","volume":"21","author":"Lei","year":"2014","journal-title":"J. Am. Med. Informatics Assoc."},{"key":"10.1016\/j.jbi.2020.103542_b0075","doi-asserted-by":"crossref","DOI":"10.1136\/amiajnl-2013-001806","article-title":"Joint segmentation and named entity recognition using dual decomposition in Chinese discharge summaries","volume":"21","author":"Xu","year":"2014","journal-title":"J. Am. Med. Informatics Assoc."},{"key":"10.1016\/j.jbi.2020.103542_b0080","doi-asserted-by":"crossref","unstructured":"A. McCallum, W. Li, Early results for named entity recognition with conditional random fields, feature induction and web-enhanced lexicons, (2003) 188\u2013191. https:\/\/doi.org\/10.3115\/1119176.1119206.","DOI":"10.3115\/1119176.1119206"},{"key":"10.1016\/j.jbi.2020.103542_b0085","unstructured":"A. Borthwick, A maximum entropy approach to named entity recognition, (1999). http:\/\/www.cs.nyu.edu\/web\/Research\/Theses\/borthwick_andrew.pdf."},{"key":"10.1016\/j.jbi.2020.103542_b0090","first-page":"1064","article-title":"End-to-end sequence labeling via bi-directional LSTM-CNNs-CRF","volume":"2","author":"Ma","year":"2016","journal-title":"54th Annu Meet. Assoc. Comput. Linguist. ACL 2016 - Long Pap."},{"key":"10.1016\/j.jbi.2020.103542_b0095","doi-asserted-by":"crossref","unstructured":"G. Lample, M. Ballesteros, S. Subramanian, K. Kawakami, C. Dyer, Neural architectures for named entity recognition, 2016 Conf. North Am. Chapter Assoc. Comput. Linguist. Hum. Lang. Technol. NAACL HLT 2016 - Proc. Conf. (2016) 260\u2013270. https:\/\/doi.org\/10.18653\/v1\/n16-1030.","DOI":"10.18653\/v1\/N16-1030"},{"key":"10.1016\/j.jbi.2020.103542_b0100","first-page":"624","article-title":"Named entity recognition in chinese clinical text using deep neural network","volume":"216","author":"Wu","year":"2015","journal-title":"Stud. Health Technol. Inform."},{"key":"10.1016\/j.jbi.2020.103542_b0105","doi-asserted-by":"crossref","first-page":"1554","DOI":"10.18653\/v1\/P18-1144","article-title":"Chinese NER using lattice LSTM, ACL 2018","author":"Zhang","year":"2018","journal-title":"56th Annu Meet. Assoc. Comput. Linguist. Proc. Conf. (Long Pap. 1)"},{"key":"10.1016\/j.jbi.2020.103542_b0110","unstructured":"J. Devlin, M.-W. Chang, K. Lee, K. Toutanova, BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding, (2018). http:\/\/arxiv.org\/abs\/1810.04805."},{"key":"10.1016\/j.jbi.2020.103542_b0115","first-page":"1","article-title":"BioBERT: a pre-trained biomedical language representation model for biomedical text mining","author":"Lee","year":"2019","journal-title":"Bioinformatics"},{"key":"10.1016\/j.jbi.2020.103542_b0120","doi-asserted-by":"crossref","unstructured":"K.-J. Chen, S.-H. Liu, Word identification for Mandarin Chinese sentences, in: Proc. 14th Conf. Comput. Linguist. -, Association for Computational Linguistics, Morristown, NJ, USA, 1992: p. 101. https:\/\/doi.org\/10.3115\/992066.992085.","DOI":"10.3115\/992066.992085"},{"key":"10.1016\/j.jbi.2020.103542_b0125","doi-asserted-by":"crossref","unstructured":"F. Peng, F. Feng, A. McCallum, Chinese segmentation and new word detection using conditional random fields, (2004) 562-es. https:\/\/doi.org\/10.3115\/1220355.1220436.","DOI":"10.3115\/1220355.1220436"},{"key":"10.1016\/j.jbi.2020.103542_b0130","doi-asserted-by":"crossref","first-page":"133","DOI":"10.1007\/978-981-13-1927-3_14","article-title":"Effective neural solution for multi-criteria word segmentation","volume":"105","author":"He","year":"2019","journal-title":"Smart Innov. Syst. Technol."},{"key":"10.1016\/j.jbi.2020.103542_b0135","unstructured":"W. Sun, J. Xu, Enhancing Chinese word segmentation using unlabeled data, EMNLP 2011 - Conf. Empir. Methods Nat. Lang. Process. Proc. Conf. (2011) 970\u2013979."},{"key":"10.1016\/j.jbi.2020.103542_b0140","unstructured":"R. Luo, J. Xu, Y. Zhang, X. Ren, X. Sun, PKUSEG: A Toolkit for Multi-Domain Chinese Word Segmentation, (2019). http:\/\/arxiv.org\/abs\/1906.11455."},{"key":"10.1016\/j.jbi.2020.103542_b0145","doi-asserted-by":"crossref","unstructured":"N. Xue, L. Shen, Chinese word segmentation as LMR tagging, in: Proc. Second SIGHAN Work. Chinese Lang. Process. -, Association for Computational Linguistics, Morristown, NJ, USA, 2003: pp. 176\u2013179. https:\/\/doi.org\/10.3115\/1119250.1119278.","DOI":"10.3115\/1119250.1119278"},{"key":"10.1016\/j.jbi.2020.103542_b0150","doi-asserted-by":"crossref","first-page":"647","DOI":"10.18653\/v1\/D13-1061","article-title":"Deep learning for Chinese word segmentation and POS tagging, EMNLP 2013","author":"Zheng","year":"2013","journal-title":"2013 Conf. Empir. Methods Nat. Lang. Process. Proc. Conf."},{"key":"10.1016\/j.jbi.2020.103542_b0155","doi-asserted-by":"crossref","unstructured":"X. Chen, X. Qiu, C. Zhu, P. Liu, X. Huang, Long Short-Term Memory Neural Networks for Chinese Word Segmentation, in: Proc. 2015 Conf. Empir. Methods Nat. Lang. Process., Association for Computational Linguistics, Stroudsburg, PA, USA, 2015: pp. 1197\u20131206. https:\/\/doi.org\/10.18653\/v1\/D15-1141.","DOI":"10.18653\/v1\/D15-1141"},{"key":"10.1016\/j.jbi.2020.103542_b0160","author":"Huang","year":"2015","journal-title":"Bidirectional LSTM-CRF Models for Sequence Tagging"},{"key":"10.1016\/j.jbi.2020.103542_b0165","unstructured":"W. Huang, X. Cheng, K. Chen, T. Wang, W. Chu, Toward Fast and Accurate Neural Chinese Word Segmentation with Multi-Criteria Learning, (2019). http:\/\/arxiv.org\/abs\/1903.04190."},{"key":"10.1016\/j.jbi.2020.103542_b0170","doi-asserted-by":"crossref","first-page":"395","DOI":"10.1007\/s11222-007-9033-z","article-title":"A tutorial on spectral clustering","volume":"17","author":"von Luxburg","year":"2007","journal-title":"Stat. Comput."},{"key":"10.1016\/j.jbi.2020.103542_b0175","doi-asserted-by":"crossref","first-page":"1074","DOI":"10.1109\/43.159993","article-title":"New spectral methods for ratio cut partitioning and clustering","volume":"11","author":"Hagen","year":"1992","journal-title":"IEEE Trans. Comput. Des. Integr. Circuits Syst."},{"key":"10.1016\/j.jbi.2020.103542_b0180","first-page":"888","article-title":"Normalized cuts and image segmentation part of the electrical and computer engineering commons recommended citation normalized cuts and image segmentation normalized cuts and image segmentation","volume":"22","author":"Shi","year":"2000","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.jbi.2020.103542_b0185","author":"Wagner","year":"1991","journal-title":"Between Min Cut and Graph Bisection Technische Universit\u00e4t Berlin Between Min Cut and Graph Bisection"},{"key":"10.1016\/j.jbi.2020.103542_b0190","doi-asserted-by":"crossref","unstructured":"C. Zhang, S. Xia, K-means clustering algorithm with improved initial center, Proc. - 2009 2nd Int. Work. Knowl. Discov. Data Mining, WKKD 2009. 1 (2009) 790\u2013792. https:\/\/doi.org\/10.1109\/WKDD.2009.210.","DOI":"10.1109\/WKDD.2009.210"},{"key":"10.1016\/j.jbi.2020.103542_b0195","unstructured":"J. Sun, Jieba chinese word segmentation tool, (2012)."},{"key":"10.1016\/j.jbi.2020.103542_b0200","unstructured":"M. Sun, X. Chen, K. Zhang, Z. Guo, Z. Liu, THULAC: An Efficient Lexical Analyzer for Chinese., (2016)."},{"key":"10.1016\/j.jbi.2020.103542_b0205","doi-asserted-by":"crossref","unstructured":"H.-P. Zhang, H.-K. Yu, D.-Y. Xiong, Q. Liu, HHMM-based Chinese lexical analyzer ICTCLAS, in: Proc. Second SIGHAN Work. Chinese Lang. Process. -, Association for Computational Linguistics, Morristown, NJ, USA, 2003: pp. 184\u2013187. https:\/\/doi.org\/10.3115\/1119250.1119280.","DOI":"10.3115\/1119250.1119280"},{"key":"10.1016\/j.jbi.2020.103542_b0210","first-page":"123","article-title":"The Second International Chinese Word Segmentation Bakeoff","volume":"2005","author":"Emerson","year":"2005","journal-title":"Proc. Fourth SIGHAN Work. Chinese Lang. Process."},{"key":"10.1016\/j.jbi.2020.103542_b0215","doi-asserted-by":"crossref","unstructured":"Z. Sun, Z.-H. Deng, Unsupervised Neural Word Segmentation for Chinese via Segmental Language Modeling, in: Proc. 2018 Conf. Empir. Methods Nat. Lang. Process., Association for Computational Linguistics, Stroudsburg, PA, USA, 2018: pp. 4915\u20134920. https:\/\/doi.org\/10.18653\/v1\/D18-1531.","DOI":"10.18653\/v1\/D18-1531"},{"key":"10.1016\/j.jbi.2020.103542_b0220","doi-asserted-by":"crossref","first-page":"21","DOI":"10.1016\/j.cognition.2009.03.008","article-title":"A Bayesian framework for word segmentation: exploring the effects of context","volume":"112","author":"Goldwater","year":"2009","journal-title":"Cognition"},{"key":"10.1016\/j.jbi.2020.103542_b0225","doi-asserted-by":"crossref","unstructured":"W. Jiang, L. Huang, Q. Liu, Automatic adaptation of annotation standards: Chinese word segmentation and POS tagging - A case study, ACL-IJCNLP 2009 - Jt. Conf. 47th Annu. Meet. Assoc. Comput. Linguist. 4th Int. Jt. Conf. Nat. Lang. Process. AFNLP, Proc. Conf. (2009) 522\u2013530. https:\/\/doi.org\/10.3115\/1687878.1687952.","DOI":"10.3115\/1687878.1687952"},{"key":"10.1016\/j.jbi.2020.103542_b0230","first-page":"27","article-title":"Unknown word detection for chinese by a corpus-based learning method","volume":"3","author":"Chen","year":"1998","journal-title":"Comput. Linguist. Chinese Lang. Lang. Process."},{"key":"10.1016\/j.jbi.2020.103542_b0235","doi-asserted-by":"crossref","unstructured":"K.-J. Chen, W.-Y. Ma, Unknown word extraction for Chinese documents, in: Proc. 19th Int. Conf. Comput. Linguist. -, Association for Computational Linguistics, Morristown, NJ, USA, 2002: pp. 1\u20137. https:\/\/doi.org\/10.3115\/1072228.1072277.","DOI":"10.3115\/1072228.1072277"}],"container-title":["Journal of Biomedical Informatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1532046420301702?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1532046420301702?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2025,10,26]],"date-time":"2025-10-26T22:44:08Z","timestamp":1761518648000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1532046420301702"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,10]]},"references-count":47,"alternative-id":["S1532046420301702"],"URL":"https:\/\/doi.org\/10.1016\/j.jbi.2020.103542","relation":{},"ISSN":["1532-0464"],"issn-type":[{"value":"1532-0464","type":"print"}],"subject":[],"published":{"date-parts":[[2020,10]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Unsupervised multi-granular Chinese word segmentation and term discovery via graph partition","name":"articletitle","label":"Article Title"},{"value":"Journal of Biomedical Informatics","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.jbi.2020.103542","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2020 Elsevier Inc.","name":"copyright","label":"Copyright"}],"article-number":"103542"}}