{"id":"https:\/\/openalex.org\/W4403792185","doi":"https:\/\/doi.org\/10.1145\/3664647.3681053","title":"CT <sup>2<\/sup> C-QA: Multimodal Question Answering over Chinese Text, Table and Chart","display_name":"CT <sup>2<\/sup> C-QA: Multimodal Question Answering over Chinese Text, Table and Chart","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https:\/\/openalex.org\/W4403792185","doi":"https:\/\/doi.org\/10.1145\/3664647.3681053"},"language":"en","primary_location":{"id":"doi:10.1145\/3664647.3681053","is_oa":false,"landing_page_url":"https:\/\/doi.org\/10.1145\/3664647.3681053","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https:\/\/arxiv.org\/pdf\/2410.21414","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Bowen Zhao","orcid":"https:\/\/orcid.org\/0009-0000-0544-0062"},"institutions":[{"id":"https:\/\/openalex.org\/I24943067","display_name":"Fudan University","ror":"https:\/\/ror.org\/013q1eq08","country_code":"CN","type":"education","lineage":["https:\/\/openalex.org\/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Bowen Zhao","raw_affiliation_strings":["School of Computer Science, Shanghai Key Laboratory of Intelligent Information Processing, Fudan University &amp; Shanghai Collaborative Innovation Center of Intelligent Visual Computing, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Shanghai Key Laboratory of Intelligent Information Processing, Fudan University &amp; Shanghai Collaborative Innovation Center of Intelligent Visual Computing, Fudan University, Shanghai, China","institution_ids":["https:\/\/openalex.org\/I24943067"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Tianhao Cheng","orcid":"https:\/\/orcid.org\/0009-0005-4654-9896"},"institutions":[{"id":"https:\/\/openalex.org\/I24943067","display_name":"Fudan University","ror":"https:\/\/ror.org\/013q1eq08","country_code":"CN","type":"education","lineage":["https:\/\/openalex.org\/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianhao Cheng","raw_affiliation_strings":["School of Computer Science, Shanghai Key Laboratory of Intelligent Information Processing, Fudan University &amp; Shanghai Collaborative Innovation Center of Intelligent Visual Computing, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Shanghai Key Laboratory of Intelligent Information Processing, Fudan University &amp; Shanghai Collaborative Innovation Center of Intelligent Visual Computing, Fudan University, Shanghai, China","institution_ids":["https:\/\/openalex.org\/I24943067"]}]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5070073283","display_name":"Yuejie Zhang","orcid":"https:\/\/orcid.org\/0000-0001-7993-7223"},"institutions":[{"id":"https:\/\/openalex.org\/I24943067","display_name":"Fudan University","ror":"https:\/\/ror.org\/013q1eq08","country_code":"CN","type":"education","lineage":["https:\/\/openalex.org\/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuejie Zhang","raw_affiliation_strings":["School of Computer Science, Shanghai Key Laboratory of Intelligent Information Processing, Fudan University &amp; Shanghai Collaborative Innovation Center of Intelligent Visual Computing, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Shanghai Key Laboratory of Intelligent Information Processing, Fudan University &amp; Shanghai Collaborative Innovation Center of Intelligent Visual Computing, Fudan University, Shanghai, China","institution_ids":["https:\/\/openalex.org\/I24943067"]}]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5114859513","display_name":"Ying Cheng","orcid":"https:\/\/orcid.org\/0000-0002-8964-3998"},"institutions":[{"id":"https:\/\/openalex.org\/I24943067","display_name":"Fudan University","ror":"https:\/\/ror.org\/013q1eq08","country_code":"CN","type":"education","lineage":["https:\/\/openalex.org\/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ying Cheng","raw_affiliation_strings":["School of Computer Science, Shanghai Key Laboratory of Intelligent Information Processing, Fudan University &amp; Shanghai Collaborative Innovation Center of Intelligent Visual Computing, Fudan University, Shanghai, China","Fudan University Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Shanghai Key Laboratory of Intelligent Information Processing, Fudan University &amp; Shanghai Collaborative Innovation Center of Intelligent Visual Computing, Fudan University, Shanghai, China","institution_ids":["https:\/\/openalex.org\/I24943067"]},{"raw_affiliation_string":"Fudan University Shanghai, China","institution_ids":["https:\/\/openalex.org\/I24943067"]}]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5100680617","display_name":"Rui Feng","orcid":"https:\/\/orcid.org\/0000-0002-4747-0574"},"institutions":[{"id":"https:\/\/openalex.org\/I24943067","display_name":"Fudan University","ror":"https:\/\/ror.org\/013q1eq08","country_code":"CN","type":"education","lineage":["https:\/\/openalex.org\/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rui Feng","raw_affiliation_strings":["School of Computer Science, Shanghai Key Laboratory of Intelligent Information Processing, Fudan University &amp; Shanghai Collaborative Innovation Center of Intelligent Visual Computing, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Shanghai Key Laboratory of Intelligent Information Processing, Fudan University &amp; Shanghai Collaborative Innovation Center of Intelligent Visual Computing, Fudan University, Shanghai, China","institution_ids":["https:\/\/openalex.org\/I24943067"]}]},{"author_position":"last","author":{"id":"https:\/\/openalex.org\/A5100462481","display_name":"Xiaobo Zhang","orcid":"https:\/\/orcid.org\/0000-0002-8645-5414"},"institutions":[{"id":"https:\/\/openalex.org\/I4210159329","display_name":"Children's Hospital of Fudan University","ror":"https:\/\/ror.org\/05n13be63","country_code":"CN","type":"healthcare","lineage":["https:\/\/openalex.org\/I4210159329"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaobo Zhang","raw_affiliation_strings":["Children's Hospital of Fudan University &amp; National Children's Medical Center, Shanghai, China","Shanghai Collaborative Innovation Center of Intelligent Visual Computing. Fudan Zhangjiang Institute, Shanghai"],"affiliations":[{"raw_affiliation_string":"Children's Hospital of Fudan University &amp; National Children's Medical Center, Shanghai, China","institution_ids":["https:\/\/openalex.org\/I4210159329"]},{"raw_affiliation_string":"Shanghai Collaborative Innovation Center of Intelligent Visual Computing. Fudan Zhangjiang Institute, Shanghai","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https:\/\/openalex.org\/I24943067"],"apc_list":null,"apc_paid":null,"fwci":0.669,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.75982968,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"3897","last_page":"3906"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https:\/\/openalex.org\/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1702","display_name":"Artificial Intelligence"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},"topics":[{"id":"https:\/\/openalex.org\/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1702","display_name":"Artificial Intelligence"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},{"id":"https:\/\/openalex.org\/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},{"id":"https:\/\/openalex.org\/T10181","display_name":"Natural Language Processing Techniques","score":0.9991999864578247,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1702","display_name":"Artificial Intelligence"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https:\/\/openalex.org\/keywords\/question-answering","display_name":"Question answering","score":0.7849620580673218},{"id":"https:\/\/openalex.org\/keywords\/computer-science","display_name":"Computer science","score":0.7017611861228943},{"id":"https:\/\/openalex.org\/keywords\/table","display_name":"Table (database)","score":0.6746561527252197},{"id":"https:\/\/openalex.org\/keywords\/information-retrieval","display_name":"Information retrieval","score":0.5970926880836487},{"id":"https:\/\/openalex.org\/keywords\/chart","display_name":"Chart","score":0.5280186533927917},{"id":"https:\/\/openalex.org\/keywords\/natural-language-processing","display_name":"Natural language processing","score":0.5187987685203552},{"id":"https:\/\/openalex.org\/keywords\/artificial-intelligence","display_name":"Artificial intelligence","score":0.3786836862564087},{"id":"https:\/\/openalex.org\/keywords\/database","display_name":"Database","score":0.18219676613807678},{"id":"https:\/\/openalex.org\/keywords\/statistics","display_name":"Statistics","score":0.13182857632637024},{"id":"https:\/\/openalex.org\/keywords\/mathematics","display_name":"Mathematics","score":0.11444699764251709}],"concepts":[{"id":"https:\/\/openalex.org\/C44291984","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1074173","display_name":"Question answering","level":2,"score":0.7849620580673218},{"id":"https:\/\/openalex.org\/C41008148","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q21198","display_name":"Computer science","level":0,"score":0.7017611861228943},{"id":"https:\/\/openalex.org\/C45235069","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q278425","display_name":"Table (database)","level":2,"score":0.6746561527252197},{"id":"https:\/\/openalex.org\/C23123220","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q816826","display_name":"Information retrieval","level":1,"score":0.5970926880836487},{"id":"https:\/\/openalex.org\/C190812933","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q28923","display_name":"Chart","level":2,"score":0.5280186533927917},{"id":"https:\/\/openalex.org\/C204321447","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q30642","display_name":"Natural language processing","level":1,"score":0.5187987685203552},{"id":"https:\/\/openalex.org\/C154945302","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3786836862564087},{"id":"https:\/\/openalex.org\/C77088390","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q8513","display_name":"Database","level":1,"score":0.18219676613807678},{"id":"https:\/\/openalex.org\/C105795698","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q12483","display_name":"Statistics","level":1,"score":0.13182857632637024},{"id":"https:\/\/openalex.org\/C33923547","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q395","display_name":"Mathematics","level":0,"score":0.11444699764251709}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145\/3664647.3681053","is_oa":false,"landing_page_url":"https:\/\/doi.org\/10.1145\/3664647.3681053","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2410.21414","is_oa":true,"landing_page_url":"http:\/\/arxiv.org\/abs\/2410.21414","pdf_url":"https:\/\/arxiv.org\/pdf\/2410.21414","source":{"id":"https:\/\/openalex.org\/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https:\/\/openalex.org\/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https:\/\/openalex.org\/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2410.21414","is_oa":true,"landing_page_url":"http:\/\/arxiv.org\/abs\/2410.21414","pdf_url":"https:\/\/arxiv.org\/pdf\/2410.21414","source":{"id":"https:\/\/openalex.org\/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https:\/\/openalex.org\/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https:\/\/openalex.org\/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https:\/\/openalex.org\/G5464079932","display_name":null,"funder_award_id":"62172101","funder_id":"https:\/\/openalex.org\/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https:\/\/openalex.org\/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https:\/\/ror.org\/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https:\/\/content.openalex.org\/works\/W4403792185.pdf"},"referenced_works_count":24,"referenced_works":["https:\/\/openalex.org\/W178970520","https:\/\/openalex.org\/W2022074610","https:\/\/openalex.org\/W2123260696","https:\/\/openalex.org\/W2277195237","https:\/\/openalex.org\/W2290551858","https:\/\/openalex.org\/W2396147015","https:\/\/openalex.org\/W2533128854","https:\/\/openalex.org\/W2606982687","https:\/\/openalex.org\/W2772633765","https:\/\/openalex.org\/W2963710346","https:\/\/openalex.org\/W2963890755","https:\/\/openalex.org\/W2963899988","https:\/\/openalex.org\/W2998536339","https:\/\/openalex.org\/W3009260245","https:\/\/openalex.org\/W3009518609","https:\/\/openalex.org\/W3108367078","https:\/\/openalex.org\/W3118916233","https:\/\/openalex.org\/W4256316689","https:\/\/openalex.org\/W4297499129","https:\/\/openalex.org\/W4389520044","https:\/\/openalex.org\/W4389520499","https:\/\/openalex.org\/W4389524107","https:\/\/openalex.org\/W4392384439","https:\/\/openalex.org\/W4393178509"],"related_works":["https:\/\/openalex.org\/W2384605597","https:\/\/openalex.org\/W2387743295","https:\/\/openalex.org\/W3082787378","https:\/\/openalex.org\/W2136007095","https:\/\/openalex.org\/W2366230879","https:\/\/openalex.org\/W3208425359","https:\/\/openalex.org\/W2349927912","https:\/\/openalex.org\/W3159777597","https:\/\/openalex.org\/W4212839359","https:\/\/openalex.org\/W2115758952"],"abstract_inverted_index":{"Multimodal":[0],"Question":[1],"Answering":[2],"(MMQA)":[3],"is":[4,162],"crucial":[5],"as":[6,22,38,100],"it":[7],"enables":[8],"comprehensive":[9,203],"understanding":[10],"and":[11,25,43,46,62,84,98,112,141,152,167,177],"accurate":[12],"responses":[13],"by":[14,196,231],"integrating":[15],"insights":[16,194],"from":[17,88],"diverse":[18],"data":[19],"representations":[20],"such":[21,37],"tables,":[23,61,83,176],"charts,":[24,85],"text.":[26],"Most":[27],"existing":[28],"researches":[29],"in":[30,52,125,163,174,211],"MMQA":[31],"only":[32],"focus":[33],"on":[34],"two":[35],"modalities":[36],"image-text":[39],"QA,":[40,45],"table-text":[41],"QA":[42,74],"chart-text":[44],"there":[47],"remains":[48],"a":[49,70,101,121,143,202],"notable":[50],"scarcity":[51],"studies":[53],"that":[54,76,219],"investigate":[55],"the":[56,105,108,118,159,183,187,192,228],"joint":[57],"analysis":[58],"of":[59,81,107,165,185],"text,":[60,82,175],"charts.":[63,178],"In":[64],"this":[65],"paper,":[66],"we":[67,136],"present":[68,137],"CT2C-QA,":[69],"pioneering":[71],"Chinese":[72],"reasoning-based":[73],"dataset":[75,94],"includes":[77],"an":[78],"extensive":[79],"collection":[80],"meticulously":[86],"compiled":[87],"200":[89],"selectively":[90],"sourced":[91],"webpages.":[92],"Our":[93],"simulates":[95],"real":[96],"webpages":[97],"serves":[99],"great":[102],"test":[103],"for":[104],"capability":[106],"model":[109],"to":[110,120,226],"analyze":[111],"reason":[113],"with":[114,207],"multimodal":[115],"data,":[116],"because":[117],"answer":[119],"question":[122],"could":[123],"appear":[124],"various":[126,208],"modalities,":[127],"or":[128],"even":[129],"potentially":[130],"not":[131],"exist":[132],"at":[133],"all.":[134],"Additionally,":[135],"AED":[138,206],"(Allocating,":[139],"Expert":[140],"Decision),":[142],"multi-agent":[144],"system":[145],"implemented":[146],"through":[147],"collaborative":[148],"deployment,":[149],"information":[150],"interaction,":[151],"collective":[153],"decision-making":[154],"among":[155],"different":[156],"agents.":[157,199],"Specifically,":[158],"Assignment":[160],"Agent":[161,181],"charge":[164],"selecting":[166],"activating":[168],"expert":[169,198],"agents,":[170],"including":[171,213,222],"those":[172],"proficient":[173],"The":[179,215],"Decision":[180],"bears":[182],"responsibility":[184],"delivering":[186],"final":[188],"verdict,":[189],"drawing":[190],"upon":[191],"analytical":[193],"provided":[195],"these":[197],"We":[200],"execute":[201],"analysis,":[204],"comparing":[205],"state-of-the-art":[209],"models":[210],"MMQA,":[212],"GPT-4.":[214],"experimental":[216],"outcomes":[217],"demonstrate":[218],"current":[220],"methodologies,":[221],"GPT-4,":[223],"are":[224],"yet":[225],"meet":[227],"benchmarks":[229],"set":[230],"our":[232],"dataset.":[233]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2024-10-27T00:00:00"}