{"id":"https://openalex.org/W2910231838","doi":"https://doi.org/10.1109/aivr.2018.00030","title":"A Perceptual Evaluation of Generative Adversarial Network Real-Time Synthesized Drum Sounds in a Virtual Environment","display_name":"A Perceptual Evaluation of Generative Adversarial Network Real-Time Synthesized Drum Sounds in a Virtual Environment","publication_year":2018,"publication_date":"2018-12-01","ids":{"openalex":"https://openalex.org/W2910231838","doi":"https://doi.org/10.1109/aivr.2018.00030","mag":"2910231838"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/aivr.2018.00030","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108254805","display_name":"Minwook Chang","orcid":"https://orcid.org/0000-0003-0525-052X"},"institutions":[{"id":"https://openalex.org/I197347611","display_name":"Korea University","ror":"https://ror.org/047dqcg40","country_code":"KR","type":"education","lineage":["https://openalex.org/I197347611"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Minwook Chang","raw_affiliation_strings":["Korea University, Seoul, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Korea University, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I197347611"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022209092","display_name":"Youngwon Ryan Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I197347611","display_name":"Korea University","ror":"https://ror.org/047dqcg40","country_code":"KR","type":"education","lineage":["https://openalex.org/I197347611"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Youngwon Ryan Kim","raw_affiliation_strings":["Korea University, Seoul, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Korea University, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I197347611"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022834069","display_name":"Gerard J. Kim","orcid":"https://orcid.org/0000-0001-9880-8021"},"institutions":[{"id":"https://openalex.org/I197347611","display_name":"Korea University","ror":"https://ror.org/047dqcg40","country_code":"KR","type":"education","lineage":["https://openalex.org/I197347611"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Gerard Jounghyun Kim","raw_affiliation_strings":["Korea University, Seoul, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Korea University, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I197347611"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.072,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":4,"citation_normalized_percentile":{"value":0.524954,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":77,"max":79},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9982,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9981,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/environmental-sound-recognition","display_name":"Environmental Sound Recognition","score":0.55915},{"id":"https://openalex.org/keywords/audio-event-detection","display_name":"Audio Event Detection","score":0.552128},{"id":"https://openalex.org/keywords/sound-synthesis","display_name":"Sound Synthesis","score":0.550517},{"id":"https://openalex.org/keywords/audio-visual-speech-recognition","display_name":"Audio-Visual Speech Recognition","score":0.523796},{"id":"https://openalex.org/keywords/music-generation","display_name":"Music Generation","score":0.5127}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7898989},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5781019},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.55716705},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.54339576},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.506676},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.48800364},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.48528168},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.41034526},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.37780672},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34605232},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/aivr.2018.00030","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":20,"referenced_works":["https://openalex.org/W1510561091","https://openalex.org/W2078118823","https://openalex.org/W2089556706","https://openalex.org/W2099471712","https://openalex.org/W2102003408","https://openalex.org/W2120847449","https://openalex.org/W2145720264","https://openalex.org/W2146187185","https://openalex.org/W2173520492","https://openalex.org/W2316878502","https://openalex.org/W2519091744","https://openalex.org/W2584032004","https://openalex.org/W2604184139","https://openalex.org/W2606176153","https://openalex.org/W2773196778","https://openalex.org/W2786254735","https://openalex.org/W2951535099","https://openalex.org/W2962879692","https://openalex.org/W4295521014","https://openalex.org/W4320013936"],"related_works":["https://openalex.org/W4390718435","https://openalex.org/W4390549206","https://openalex.org/W4386984417","https://openalex.org/W4385572368","https://openalex.org/W4237784285","https://openalex.org/W3137171911","https://openalex.org/W3005996785","https://openalex.org/W2476099471","https://openalex.org/W2380075625","https://openalex.org/W2374712251"],"abstract_inverted_index":{"Conventional":[0],"methods":[1],"of":[2,21,35,123],"real":[3,107],"time":[4,22,108],"sound":[5],"effects":[6],"in":[7],"3D":[8],"graphical":[9],"and":[10,23,46,90,102,105,126],"virtual":[11,135],"environments":[12],"relied":[13],"upon":[14,161],"preparing":[15],"all":[16],"the":[17,43,56,63,76,86,128,131,144,149,153,162],"needed":[18,77,95],"samples":[19,36],"ahead":[20],"simply":[24],"replaying":[25],"them":[26],"as":[27,42],"needed,":[28],"or":[29],"parametrically":[30],"modifying":[31],"a":[32,116,134],"basic":[33],"set":[34],"using":[37],"physically":[38],"based":[39],"techniques":[40],"such":[41],"spring-damper":[44],"simulation":[45],"modal":[47],"analysis/synthesis.":[48],"In":[49],"this":[50],"work,":[51],"we":[52],"propose":[53],"to":[54,62,74,96],"apply":[55],"generative":[57],"adversarial":[58],"network":[59],"(GAN)":[60],"approach":[61],"problem":[64],"at":[65],"hand,":[66],"with":[67,80,85,98,121],"which":[68],"only":[69],"one":[70],"generator":[71],"is":[72],"trained":[73],"produce":[75],"sounds":[78,122,129,151],"fast":[79],"perceptually":[81],"indifferent":[82],"quality.":[83],"Otherwise,":[84],"conventional":[87],"methods,":[88],"separate":[89],"approximate":[91],"models":[92],"would":[93],"be":[94],"deal":[97],"different":[99,124],"material":[100],"properties":[101],"contact":[103],"types,":[104],"manage":[106],"performance.":[109],"We":[110],"demonstrate":[111],"our":[112],"claim":[113],"by":[114],"training":[115],"GAN":[117],"(more":[118],"specifically":[119],"WaveGAN)":[120],"drums":[125],"synthesizing":[127],"on":[130],"fly":[132],"for":[133],"drum":[136],"playing":[137],"environment.":[138],"The":[139],"perceptual":[140],"test":[141],"revealed":[142],"that":[143],"subjects":[145],"could":[146],"not":[147],"discern":[148],"synthesized":[150],"from":[152],"ground":[154],"truth":[155],"nor":[156],"perceived":[157],"any":[158],"noticeable":[159],"delay":[160],"corresponding":[163],"physical":[164],"event.":[165]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2910231838","counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":1}],"updated_date":"2024-12-04T19:52:34.175257","created_date":"2019-01-25"}