{"id":"https:\/\/openalex.org\/W4408520950","doi":"https:\/\/doi.org\/10.1109\/cw64301.2024.00058","title":"Benchmarking Geospatial Visual Reasoning over Street Map Images","display_name":"Benchmarking Geospatial Visual Reasoning over Street Map Images","publication_year":2024,"publication_date":"2024-10-29","ids":{"openalex":"https:\/\/openalex.org\/W4408520950","doi":"https:\/\/doi.org\/10.1109\/cw64301.2024.00058"},"language":"en","primary_location":{"id":"doi:10.1109\/cw64301.2024.00058","is_oa":false,"landing_page_url":"https:\/\/doi.org\/10.1109\/cw64301.2024.00058","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Conference on Cyberworlds (CW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https:\/\/openalex.org\/A5083331541","display_name":"Haiting Zhou","orcid":"https:\/\/orcid.org\/0000-0002-1071-7131"},"institutions":[{"id":"https:\/\/openalex.org\/I50760025","display_name":"Hangzhou Dianzi University","ror":"https:\/\/ror.org\/0576gt767","country_code":"CN","type":"education","lineage":["https:\/\/openalex.org\/I50760025"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haiting Zhou","raw_affiliation_strings":["Hangzhou Dianzi University,School of Computer Science,Hangzhou,China"],"affiliations":[{"raw_affiliation_string":"Hangzhou Dianzi University,School of Computer Science,Hangzhou,China","institution_ids":["https:\/\/openalex.org\/I50760025"]}]},{"author_position":"last","author":{"id":"https:\/\/openalex.org\/A5100581509","display_name":"Zhou Yu","orcid":null},"institutions":[{"id":"https:\/\/openalex.org\/I50760025","display_name":"Hangzhou Dianzi University","ror":"https:\/\/ror.org\/0576gt767","country_code":"CN","type":"education","lineage":["https:\/\/openalex.org\/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhou Yu","raw_affiliation_strings":["Hangzhou Dianzi University,School of Computer Science,Hangzhou,China"],"affiliations":[{"raw_affiliation_string":"Hangzhou Dianzi University,School of Computer Science,Hangzhou,China","institution_ids":["https:\/\/openalex.org\/I50760025"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https:\/\/openalex.org\/A5083331541"],"corresponding_institution_ids":["https:\/\/openalex.org\/I50760025"],"apc_list":null,"apc_paid":null,"fwci":0.3735,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.63334583,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"330","last_page":"331"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https:\/\/openalex.org\/T11106","display_name":"Data Management and Algorithms","score":0.9868999719619751,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1711","display_name":"Signal Processing"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},"topics":[{"id":"https:\/\/openalex.org\/T11106","display_name":"Data Management and Algorithms","score":0.9868999719619751,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1711","display_name":"Signal Processing"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},{"id":"https:\/\/openalex.org\/T10757","display_name":"Geographic Information Systems Studies","score":0.9821000099182129,"subfield":{"id":"https:\/\/openalex.org\/subfields\/3305","display_name":"Geography, Planning and Development"},"field":{"id":"https:\/\/openalex.org\/fields\/33","display_name":"Social Sciences"},"domain":{"id":"https:\/\/openalex.org\/domains\/2","display_name":"Social Sciences"}},{"id":"https:\/\/openalex.org\/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.98089998960495,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https:\/\/openalex.org\/keywords\/geospatial-analysis","display_name":"Geospatial analysis","score":0.8917144536972046},{"id":"https:\/\/openalex.org\/keywords\/benchmarking","display_name":"Benchmarking","score":0.8823658227920532},{"id":"https:\/\/openalex.org\/keywords\/computer-science","display_name":"Computer science","score":0.6448414921760559},{"id":"https:\/\/openalex.org\/keywords\/artificial-intelligence","display_name":"Artificial intelligence","score":0.5037843585014343},{"id":"https:\/\/openalex.org\/keywords\/visualization","display_name":"Visualization","score":0.4407652020454407},{"id":"https:\/\/openalex.org\/keywords\/spatial-intelligence","display_name":"Spatial intelligence","score":0.4158773422241211},{"id":"https:\/\/openalex.org\/keywords\/computer-vision","display_name":"Computer vision","score":0.3798682689666748},{"id":"https:\/\/openalex.org\/keywords\/data-science","display_name":"Data science","score":0.33208298683166504},{"id":"https:\/\/openalex.org\/keywords\/geography","display_name":"Geography","score":0.28208863735198975},{"id":"https:\/\/openalex.org\/keywords\/cartography","display_name":"Cartography","score":0.23993739485740662},{"id":"https:\/\/openalex.org\/keywords\/business","display_name":"Business","score":0.06493964791297913}],"concepts":[{"id":"https:\/\/openalex.org\/C9770341","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1938983","display_name":"Geospatial analysis","level":2,"score":0.8917144536972046},{"id":"https:\/\/openalex.org\/C86251818","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q816754","display_name":"Benchmarking","level":2,"score":0.8823658227920532},{"id":"https:\/\/openalex.org\/C41008148","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q21198","display_name":"Computer science","level":0,"score":0.6448414921760559},{"id":"https:\/\/openalex.org\/C154945302","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5037843585014343},{"id":"https:\/\/openalex.org\/C36464697","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q451553","display_name":"Visualization","level":2,"score":0.4407652020454407},{"id":"https:\/\/openalex.org\/C155911833","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q3817354","display_name":"Spatial intelligence","level":2,"score":0.4158773422241211},{"id":"https:\/\/openalex.org\/C31972630","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q844240","display_name":"Computer vision","level":1,"score":0.3798682689666748},{"id":"https:\/\/openalex.org\/C2522767166","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q2374463","display_name":"Data science","level":1,"score":0.33208298683166504},{"id":"https:\/\/openalex.org\/C205649164","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1071","display_name":"Geography","level":0,"score":0.28208863735198975},{"id":"https:\/\/openalex.org\/C58640448","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q42515","display_name":"Cartography","level":1,"score":0.23993739485740662},{"id":"https:\/\/openalex.org\/C144133560","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q4830453","display_name":"Business","level":0,"score":0.06493964791297913},{"id":"https:\/\/openalex.org\/C162853370","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q39809","display_name":"Marketing","level":1,"score":0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109\/cw64301.2024.00058","is_oa":false,"landing_page_url":"https:\/\/doi.org\/10.1109\/cw64301.2024.00058","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Conference on Cyberworlds (CW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":3,"referenced_works":["https:\/\/openalex.org\/W2947312908","https:\/\/openalex.org\/W2979382951","https:\/\/openalex.org\/W6843405348"],"related_works":["https:\/\/openalex.org\/W4238897586","https:\/\/openalex.org\/W435179959","https:\/\/openalex.org\/W2619091065","https:\/\/openalex.org\/W2059640416","https:\/\/openalex.org\/W1490753184","https:\/\/openalex.org\/W2284465472","https:\/\/openalex.org\/W2291782699","https:\/\/openalex.org\/W1993948687","https:\/\/openalex.org\/W2000169967","https:\/\/openalex.org\/W2112883198"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3],"present":[4],"a":[5],"novel":[6],"VQA":[7],"benchmark":[8],"SM-VQA,":[9],"which":[10],"is":[11,37],"built":[12],"upon":[13],"street":[14,23],"map":[15,24],"images.":[16],"Specifically,":[17],"SM-VQA":[18,36],"contains":[19],"about":[20],"9.5K":[21],"real-world":[22],"images":[25],"collected":[26],"from":[27],"the":[28,65,72],"open":[29],"geospatial":[30,42,59],"database":[31],"OpenStreetMap.":[32],"Each":[33],"image":[34],"in":[35],"also":[38],"associated":[39],"with":[40],"detailed":[41],"annotations,":[43],"enabling":[44],"it":[45],"to":[46,50],"automatically":[47],"generate":[48],"up":[49],"50K":[51],"distinctive":[52],"QA":[53],"pairs":[54],"of":[55,58,64,87],"five":[56],"types":[57],"reasoning":[60],"abilities.":[61],"The":[62,78],"evaluation":[63],"state-of-the-art":[66],"open-source":[67],"and":[68,81,89],"commercial":[69],"LMMs":[70],"reflects":[71],"great":[73],"challenge":[74],"posed":[75],"by":[76],"SM-VQA.":[77],"cutting-edge":[79],"Phi-3V":[80],"GPT-4o":[82],"models":[83],"merely":[84],"achieve":[85],"accuracies":[86],"45.3%":[88],"46.7%":[90],"respectively.":[91]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-19T19:40:27.379048","created_date":"2025-10-10T00:00:00"}