{"id":"https://openalex.org/W4375869031","doi":"https://doi.org/10.1109/icassp49357.2023.10096899","title":"Decoupled Non-Parametric Knowledge Distillation for end-to-End Speech Translation","display_name":"Decoupled Non-Parametric Knowledge Distillation for end-to-End Speech Translation","publication_year":2023,"publication_date":"2023-05-05","ids":{"openalex":"https://openalex.org/W4375869031","doi":"https://doi.org/10.1109/icassp49357.2023.10096899"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10096899","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":"https://doi.org/10.1109/icassp49357.2023.10096899","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092339699","display_name":"Hao Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Zhang","raw_affiliation_strings":["University of Information Engineering, Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"University of Information Engineering, Zhengzhou, China","institution_ids":["https://openalex.org/I169689159"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024319575","display_name":"Nianwen Si","orcid":"https://orcid.org/0000-0003-4619-4325"},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nianwen Si","raw_affiliation_strings":["Department of Electronic Engineering, Tsinghua University, Beijing, China","University of Information Engineering, Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"University of Information Engineering, Zhengzhou, China","institution_ids":["https://openalex.org/I169689159"]},{"raw_affiliation_string":"Department of Electronic Engineering, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101560152","display_name":"Yaqi Chen","orcid":"https://orcid.org/0000-0001-6301-802X"},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaqi Chen","raw_affiliation_strings":["University of Information Engineering, Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"University of Information Engineering, Zhengzhou, China","institution_ids":["https://openalex.org/I169689159"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100635256","display_name":"Wenlin Zhang","orcid":"https://orcid.org/0000-0002-6842-9722"},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenlin Zhang","raw_affiliation_strings":["University of Information Engineering, Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"University of Information Engineering, Zhengzhou, China","institution_ids":["https://openalex.org/I169689159"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041343362","display_name":"Xukui Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xukui Yang","raw_affiliation_strings":["University of Information Engineering, Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"University of Information Engineering, Zhengzhou, China","institution_ids":["https://openalex.org/I169689159"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001488518","display_name":"Dan Qu","orcid":"https://orcid.org/0000-0001-9917-7794"},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dan Qu","raw_affiliation_strings":["University of Information Engineering, Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"University of Information Engineering, Zhengzhou, China","institution_ids":["https://openalex.org/I169689159"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100680995","display_name":"Zhen Li","orcid":"https://orcid.org/0000-0001-5093-4221"},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhen Li","raw_affiliation_strings":["University of Information Engineering, Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"University of Information Engineering, Zhengzhou, China","institution_ids":["https://openalex.org/I169689159"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.403,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.626095,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":69,"max":80},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Statistical Machine Translation and Natural Language Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Statistical Machine Translation and Natural Language Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Natural Language Processing","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition Technology","score":0.9981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transcription","display_name":"Transcription (linguistics)","score":0.6063093},{"id":"https://openalex.org/keywords/neural-machine-translation","display_name":"Neural Machine Translation","score":0.565019},{"id":"https://openalex.org/keywords/syntax-based-translation-models","display_name":"Syntax-based Translation Models","score":0.54256},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine Translation","score":0.542353},{"id":"https://openalex.org/keywords/end-to-end-speech-recognition","display_name":"End-to-End Speech Recognition","score":0.539295},{"id":"https://openalex.org/keywords/statistical-machine-translation","display_name":"Statistical Machine Translation","score":0.533839}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8161176},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.775274},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.61855567},{"id":"https://openalex.org/C179926584","wikidata":"https://www.wikidata.org/wiki/Q207714","display_name":"Transcription (linguistics)","level":2,"score":0.6063093},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5198265},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.45680967},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36628377},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.34847862},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07447329},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.061838776},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10096899","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10096899","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"display_name":"Quality education","score":0.73,"id":"https://metadata.un.org/sdg/4"}],"grants":[{"funder":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China","award_id":null}],"datasets":[],"versions":[],"referenced_works_count":26,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W1522301498","https://openalex.org/W1821462560","https://openalex.org/W2183341477","https://openalex.org/W222053410","https://openalex.org/W2962784628","https://openalex.org/W2963532001","https://openalex.org/W2998702515","https://openalex.org/W3036601975","https://openalex.org/W3037217258","https://openalex.org/W3097301532","https://openalex.org/W3113908264","https://openalex.org/W3143377973","https://openalex.org/W3171641923","https://openalex.org/W3172862365","https://openalex.org/W3176455679","https://openalex.org/W4206468798","https://openalex.org/W4221163209","https://openalex.org/W4225388806","https://openalex.org/W4226426325","https://openalex.org/W4281982771","https://openalex.org/W4287649493","https://openalex.org/W4287890956","https://openalex.org/W4300558631","https://openalex.org/W4322577229","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W3026162553","https://openalex.org/W2953684491","https://openalex.org/W2768175398","https://openalex.org/W2505877856","https://openalex.org/W2412887479","https://openalex.org/W2344382886","https://openalex.org/W2080290893","https://openalex.org/W2028097510","https://openalex.org/W2015158429","https://openalex.org/W19111321"],"abstract_inverted_index":{"Existing":[0],"techniques":[1],"often":[2,24],"attempt":[3],"to":[4,14,40,71,128],"make":[5],"knowledge":[6,80,120,134],"transfer":[7],"from":[8,68,90,98],"a":[9,91,99],"powerful":[10],"machine":[11],"translation":[12,16],"(MT)":[13],"speech":[15],"(ST)":[17],"model":[18,44],"with":[19],"some":[20],"elaborate":[21],"techniques,":[22],"which":[23,106,138],"requires":[25],"transcription":[26,111],"as":[27],"extra":[28],"input":[29],"during":[30],"training.":[31],"However,":[32,83],"transcriptions":[33],"are":[34],"not":[35],"always":[36],"available,":[37],"and":[38,112,125],"how":[39],"improve":[41,72],"the":[42,56,73,79,87,108,118,130,133,140,150,158],"ST":[43],"performance":[45],"without":[46,161],"transcription,":[47],"i.e.,":[48],"data":[49,69,74],"efficiency,":[50],"has":[51],"rarely":[52],"been":[53],"studied":[54],"in":[55],"literature.":[57],"In":[58],"this":[59],"paper,":[60],"we":[61,95,116],"propose":[62],"Decoupled":[63],"Non-parametric":[64],"Knowledge":[65],"Distillation":[66],"(DNKD)":[67],"perspective":[70],"efficiency.":[75],"Our":[76],"method":[77,152],"follows":[78],"distillation":[81,121,127],"paradigm.":[82],"instead":[84],"of":[85,132],"obtaining":[86],"teacher":[88],"distribution":[89],"sophisticated":[92],"MT":[93,113],"model,":[94],"construct":[96],"it":[97],"non-parametric":[100],"datastore":[101],"via":[102],"k-Nearest-Neighbor":[103],"(kNN)":[104],"retrieval,":[105],"removes":[107],"dependence":[109],"on":[110,145],"model.":[114],"Then":[115],"decouple":[117],"classic":[119],"loss":[122],"into":[123],"target":[124],"non-target":[126,136],"enhance":[129],"effect":[131],"among":[135],"logits,":[137],"is":[139],"prominent":[141],"\"dark":[142],"knowledge\".":[143],"Experiments":[144],"MuST-C":[146],"corpus":[147],"show":[148],"that,":[149],"proposed":[151],"can":[153],"achieve":[154],"consistent":[155],"improvement":[156],"over":[157],"strong":[159],"baseline":[160],"requiring":[162],"any":[163],"transcription.":[164]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4375869031","counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2024-12-02T20:38:32.832619","created_date":"2023-05-10"}