{"id":"https:\/\/openalex.org\/W4378446399","doi":"https:\/\/doi.org\/10.48550\/arxiv.2305.13758","title":"A study of audio mixing methods for piano transcription in violin-piano ensembles","display_name":"A study of audio mixing methods for piano transcription in violin-piano ensembles","publication_year":2023,"publication_date":"2023-05-23","ids":{"openalex":"https:\/\/openalex.org\/W4378446399","doi":"https:\/\/doi.org\/10.48550\/arxiv.2305.13758"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2305.13758","is_oa":true,"landing_page_url":"http:\/\/arxiv.org\/abs\/2305.13758","pdf_url":"https:\/\/arxiv.org\/pdf\/2305.13758","source":{"id":"https:\/\/openalex.org\/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https:\/\/openalex.org\/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https:\/\/openalex.org\/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https:\/\/openalex.org\/licenses\/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https:\/\/arxiv.org\/pdf\/2305.13758","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https:\/\/openalex.org\/A5076443181","display_name":"Hyemi Kim","orcid":"https:\/\/orcid.org\/0000-0003-4713-4658"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kim, Hyemi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5034257985","display_name":"Jiyun Park","orcid":"https:\/\/orcid.org\/0000-0001-6105-0691"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Jiyun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5115444778","display_name":"Taegyun Kwon","orcid":"https:\/\/orcid.org\/0009-0004-8510-872X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kwon, Taegyun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https:\/\/openalex.org\/A5055794128","display_name":"Dasaem Jeong","orcid":"https:\/\/orcid.org\/0009-0002-3655-1181"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jeong, Dasaem","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https:\/\/openalex.org\/A5056437111","display_name":"Juhan Nam","orcid":"https:\/\/orcid.org\/0000-0003-2664-2119"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nam, Juhan","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https:\/\/openalex.org\/A5076443181"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https:\/\/openalex.org\/T11309","display_name":"Music and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1711","display_name":"Signal Processing"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},"topics":[{"id":"https:\/\/openalex.org\/T11309","display_name":"Music and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1711","display_name":"Signal Processing"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},{"id":"https:\/\/openalex.org\/T11349","display_name":"Music Technology and Sound Studies","score":0.9959999918937683,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},{"id":"https:\/\/openalex.org\/T13996","display_name":"Diverse Musicological Studies","score":0.9750000238418579,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1210","display_name":"Music"},"field":{"id":"https:\/\/openalex.org\/fields\/12","display_name":"Arts and Humanities"},"domain":{"id":"https:\/\/openalex.org\/domains\/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https:\/\/openalex.org\/keywords\/piano","display_name":"Piano","score":0.9750196933746338},{"id":"https:\/\/openalex.org\/keywords\/violin","display_name":"Violin","score":0.9030637741088867},{"id":"https:\/\/openalex.org\/keywords\/midi","display_name":"MIDI","score":0.7796701788902283},{"id":"https:\/\/openalex.org\/keywords\/transcription","display_name":"Transcription (linguistics)","score":0.6717211008071899},{"id":"https:\/\/openalex.org\/keywords\/computer-science","display_name":"Computer science","score":0.6140310764312744},{"id":"https:\/\/openalex.org\/keywords\/rendering","display_name":"Rendering (computer graphics)","score":0.5799924731254578},{"id":"https:\/\/openalex.org\/keywords\/speech-recognition","display_name":"Speech recognition","score":0.5622614622116089},{"id":"https:\/\/openalex.org\/keywords\/mixing","display_name":"Mixing (physics)","score":0.471193790435791},{"id":"https:\/\/openalex.org\/keywords\/acoustics","display_name":"Acoustics","score":0.3704288899898529},{"id":"https:\/\/openalex.org\/keywords\/artificial-intelligence","display_name":"Artificial intelligence","score":0.2487620711326599},{"id":"https:\/\/openalex.org\/keywords\/physics","display_name":"Physics","score":0.09878590703010559}],"concepts":[{"id":"https:\/\/openalex.org\/C124086623","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q5994","display_name":"Piano","level":2,"score":0.9750196933746338},{"id":"https:\/\/openalex.org\/C129554576","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q8355","display_name":"Violin","level":2,"score":0.9030637741088867},{"id":"https:\/\/openalex.org\/C8112396","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q80535","display_name":"MIDI","level":2,"score":0.7796701788902283},{"id":"https:\/\/openalex.org\/C179926584","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q207714","display_name":"Transcription (linguistics)","level":2,"score":0.6717211008071899},{"id":"https:\/\/openalex.org\/C41008148","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q21198","display_name":"Computer science","level":0,"score":0.6140310764312744},{"id":"https:\/\/openalex.org\/C205711294","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.5799924731254578},{"id":"https:\/\/openalex.org\/C28490314","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q189436","display_name":"Speech recognition","level":1,"score":0.5622614622116089},{"id":"https:\/\/openalex.org\/C138777275","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q6884054","display_name":"Mixing (physics)","level":2,"score":0.471193790435791},{"id":"https:\/\/openalex.org\/C24890656","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q82811","display_name":"Acoustics","level":1,"score":0.3704288899898529},{"id":"https:\/\/openalex.org\/C154945302","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2487620711326599},{"id":"https:\/\/openalex.org\/C121332964","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q413","display_name":"Physics","level":0,"score":0.09878590703010559},{"id":"https:\/\/openalex.org\/C41895202","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q8162","display_name":"Linguistics","level":1,"score":0},{"id":"https:\/\/openalex.org\/C62520636","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q944","display_name":"Quantum mechanics","level":1,"score":0},{"id":"https:\/\/openalex.org\/C138885662","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q5891","display_name":"Philosophy","level":0,"score":0},{"id":"https:\/\/openalex.org\/C111919701","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q9135","display_name":"Operating system","level":1,"score":0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2305.13758","is_oa":true,"landing_page_url":"http:\/\/arxiv.org\/abs\/2305.13758","pdf_url":"https:\/\/arxiv.org\/pdf\/2305.13758","source":{"id":"https:\/\/openalex.org\/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https:\/\/openalex.org\/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https:\/\/openalex.org\/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https:\/\/openalex.org\/licenses\/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550\/arxiv.2305.13758","is_oa":true,"landing_page_url":"https:\/\/doi.org\/10.48550\/arxiv.2305.13758","pdf_url":null,"source":{"id":"https:\/\/openalex.org\/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https:\/\/openalex.org\/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https:\/\/openalex.org\/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https:\/\/openalex.org\/licenses\/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2305.13758","is_oa":true,"landing_page_url":"http:\/\/arxiv.org\/abs\/2305.13758","pdf_url":"https:\/\/arxiv.org\/pdf\/2305.13758","source":{"id":"https:\/\/openalex.org\/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https:\/\/openalex.org\/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https:\/\/openalex.org\/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https:\/\/openalex.org\/licenses\/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https:\/\/content.openalex.org\/works\/W4378446399.pdf","grobid_xml":"https:\/\/content.openalex.org\/works\/W4378446399.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https:\/\/openalex.org\/W3133630535","https:\/\/openalex.org\/W2096042855","https:\/\/openalex.org\/W2064626218","https:\/\/openalex.org\/W3086552306","https:\/\/openalex.org\/W619251161","https:\/\/openalex.org\/W599311743","https:\/\/openalex.org\/W589781765","https:\/\/openalex.org\/W4301398814","https:\/\/openalex.org\/W3093121331","https:\/\/openalex.org\/W1797486849"],"abstract_inverted_index":{"While":[0],"piano":[1,11,34],"music":[2],"transcription":[3,35,102],"models":[4],"have":[5],"shown":[6],"high":[7],"performance":[8,14],"for":[9,63],"solo":[10],"recordings,":[12],"their":[13],"degrades":[15],"when":[16],"applied":[17,42],"to":[18,24,43],"ensemble":[19,77],"recordings.":[20],"This":[21],"study":[22],"aims":[23],"analyze":[25],"the":[26,58,68,96,101],"impact":[27],"of":[28,57,75],"different":[29],"data":[30],"augmentation":[31],"methods":[32,49],"on":[33,39,104],"performance,":[36],"specifically":[37],"focusing":[38],"mixing":[40,48],"techniques":[41],"violin-piano":[44,76],"ensembles.":[45],"We":[46,99],"apply":[47],"that":[50],"consider":[51],"both":[52,105],"harmonic":[53],"and":[54,83,86,92,107],"temporal":[55],"characteristics":[56],"audio.":[59],"To":[60],"create":[61],"datasets":[62],"this":[64],"study,":[65],"we":[66],"generated":[67],"PFVN-synth":[69],"dataset,":[70],"which":[71],"contains":[72],"7":[73],"hours":[74],"audio":[78,109],"by":[79],"rendering":[80],"MIDI":[81],"files":[82],"corresponding":[84],"labels,":[85],"also":[87],"collected":[88],"unaccompanied":[89],"violin":[90],"recordings":[91,110],"mixed":[93],"them":[94],"with":[95],"MAESTRO":[97],"dataset.":[98],"evaluated":[100],"results":[103],"synthesized":[106],"real":[108],"datasets.":[111]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}