{"id":"https://openalex.org/W4362689902","doi":"https://doi.org/10.1109/tvlsi.2023.3262787","title":"ACBN: Approximate Calculated Batch Normalization for Efficient DNN On-Device Training Processor","display_name":"ACBN: Approximate Calculated Batch Normalization for Efficient DNN On-Device Training Processor","publication_year":2023,"publication_date":"2023-04-06","ids":{"openalex":"https://openalex.org/W4362689902","doi":"https://doi.org/10.1109/tvlsi.2023.3262787"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvlsi.2023.3262787","pdf_url":null,"source":{"id":"https://openalex.org/S37538908","display_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","issn_l":"1063-8210","issn":["1063-8210","1557-9999"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058256501","display_name":"Baoting Li","orcid":"https://orcid.org/0009-0008-4807-3731"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Baoting Li","raw_affiliation_strings":["School of Microelectronics, Xi’an Jiaotong University, Shaanxi, Xi\u2019an, China"],"affiliations":[{"raw_affiliation_string":"School of Microelectronics, Xi’an Jiaotong University, Shaanxi, Xi\u2019an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055913406","display_name":"Hang Wang","orcid":"https://orcid.org/0000-0002-2714-0703"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hang Wang","raw_affiliation_strings":["School of Microelectronics, Xi’an Jiaotong University, Shaanxi, Xi\u2019an, China"],"affiliations":[{"raw_affiliation_string":"School of Microelectronics, Xi’an Jiaotong University, Shaanxi, Xi\u2019an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012446464","display_name":"Fujie Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fujie Luo","raw_affiliation_strings":["Institute of Artificial Intelligence and Robotics,College of Artificial Intelligence, Xi’an Jiaotong University, Shaanxi, Xi\u2019an, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence and Robotics,College of Artificial Intelligence, Xi’an Jiaotong University, Shaanxi, Xi\u2019an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044561987","display_name":"Xuchong Zhang","orcid":"https://orcid.org/0000-0003-2772-2700"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuchong Zhang","raw_affiliation_strings":["Institute of Artificial Intelligence and Robotics,College of Artificial Intelligence, Xi’an Jiaotong University, Shaanxi, Xi\u2019an, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence and Robotics,College of Artificial Intelligence, Xi’an Jiaotong University, Shaanxi, Xi\u2019an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100706029","display_name":"Hongbin Sun","orcid":"https://orcid.org/0000-0003-2153-2906"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongbin Sun","raw_affiliation_strings":["Institute of Artificial Intelligence and Robotics,College of Artificial Intelligence, Xi’an Jiaotong University, Shaanxi, Xi\u2019an, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence and Robotics,College of Artificial Intelligence, Xi’an Jiaotong University, Shaanxi, Xi\u2019an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047405956","display_name":"Nanning Zheng","orcid":"https://orcid.org/0000-0003-1608-8257"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nanning Zheng","raw_affiliation_strings":["Institute of Artificial Intelligence and Robotics,College of Artificial Intelligence, Xi’an Jiaotong University, Shaanxi, Xi\u2019an, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence and Robotics,College of Artificial Intelligence, Xi’an Jiaotong University, Shaanxi, Xi\u2019an, China","institution_ids":["https://openalex.org/I87445476"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.557,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.712313,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":80,"max":86},"biblio":{"volume":"31","issue":"6","first_page":"738","last_page":"748"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12676","display_name":"Theory and Applications of Extreme Learning Machines","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12676","display_name":"Theory and Applications of Extreme Learning Machines","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Deep Learning in Computer Vision and Image Recognition","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Advances in Transfer Learning and Domain Adaptation","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/lookup-table","display_name":"Lookup table","score":0.6631157},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.59675056},{"id":"https://openalex.org/keywords/transfer-learning","display_name":"Transfer Learning","score":0.52573},{"id":"https://openalex.org/keywords/semi-supervised-learning","display_name":"Semi-Supervised Learning","score":0.518632},{"id":"https://openalex.org/keywords/representation-learning","display_name":"Representation Learning","score":0.507554},{"id":"https://openalex.org/keywords/unsupervised-learning","display_name":"Unsupervised Learning","score":0.501097}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.76666665},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.7065848},{"id":"https://openalex.org/C134835016","wikidata":"https://www.wikidata.org/wiki/Q690265","display_name":"Lookup table","level":2,"score":0.6631157},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.59675056},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.5749551},{"id":"https://openalex.org/C84462506","wikidata":"https://www.wikidata.org/wiki/Q173142","display_name":"Digital signal processing","level":2,"score":0.51482433},{"id":"https://openalex.org/C84211073","wikidata":"https://www.wikidata.org/wiki/Q117879","display_name":"Floating point","level":2,"score":0.51143545},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4250276},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.42340308},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.39037257},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.34326088},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.21133351},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.20494586},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvlsi.2023.3262787","pdf_url":null,"source":{"id":"https://openalex.org/S37538908","display_name":"IEEE Transactions on Very Large Scale Integration (VLSI) Systems","issn_l":"1063-8210","issn":["1063-8210","1557-9999"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[{"funder":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China","award_id":"62204200"},{"funder":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China","award_id":"62004157"},{"funder":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China","award_id":"2017YFA0700800"},{"funder":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities","award_id":"xtr072022001"}],"datasets":[],"versions":[],"referenced_works_count":39,"referenced_works":["https://openalex.org/W1836465849","https://openalex.org/W2165698076","https://openalex.org/W2285660444","https://openalex.org/W2289252105","https://openalex.org/W2606722458","https://openalex.org/W2625457103","https://openalex.org/W2724189024","https://openalex.org/W2734572653","https://openalex.org/W2773339846","https://openalex.org/W2789027062","https://openalex.org/W2794141774","https://openalex.org/W2803113791","https://openalex.org/W2902138814","https://openalex.org/W2920954974","https://openalex.org/W2921918777","https://openalex.org/W2935524202","https://openalex.org/W2949469598","https://openalex.org/W2951771281","https://openalex.org/W2971734772","https://openalex.org/W2990865680","https://openalex.org/W3004766715","https://openalex.org/W3007895486","https://openalex.org/W3015764133","https://openalex.org/W3040850704","https://openalex.org/W3048705738","https://openalex.org/W3048842964","https://openalex.org/W3091592563","https://openalex.org/W3117204317","https://openalex.org/W3137841151","https://openalex.org/W3157114665","https://openalex.org/W3157174059","https://openalex.org/W3174469560","https://openalex.org/W3185047697","https://openalex.org/W3193784739","https://openalex.org/W4240168186","https://openalex.org/W4285117917","https://openalex.org/W4286571873","https://openalex.org/W4293195632","https://openalex.org/W4297097444"],"related_works":["https://openalex.org/W4321441197","https://openalex.org/W4285261042","https://openalex.org/W3011538607","https://openalex.org/W2990962948","https://openalex.org/W2953716828","https://openalex.org/W2944728705","https://openalex.org/W2904857019","https://openalex.org/W2904022177","https://openalex.org/W2591697403","https://openalex.org/W2359348847"],"abstract_inverted_index":{"Batch":[0],"normalization":[1],"(BN)":[2],"has":[3,29],"been":[4,99],"established":[5],"as":[6],"a":[7,75],"very":[8],"effective":[9],"component":[10],"in":[11,34,59],"deep":[12,20],"learning,":[13],"largely":[14],"helping":[15],"accelerate":[16],"the":[17,35,95,109,113,118,140,148,159,166,173,195,199,220,226],"convergence":[18,92],"of":[19,37,61,94,151,154,161,176,201],"neural":[21],"network":[22],"(DNN)":[23],"training.":[24],"Nevertheless,":[25],"its":[26],"hardware":[27,62,80,114,203],"architecture":[28],"not":[30],"received":[31],"much":[32,76],"attention":[33],"field":[36],"DNN":[38,85,105],"on-device":[39,86],"training":[40,87],"processors.":[41,88],"Several":[42],"previous":[43],"designs":[44],"incur":[45],"either":[46],"high":[47,52],"off-chip":[48],"memory":[49,133],"traffic":[50],"or":[51],"circuit":[53],"complexity,":[54],"and":[55,64,82,91,130,194,218],"hence":[56],"have":[57,98],"deficiencies":[58],"terms":[60],"efficiency":[63,81],"performance.":[65,232],"This":[66],"article":[67],"proposes":[68],"approximately":[69],"calculated":[70],"BN":[71,152,177],"(ACBN)":[72],"to":[73,168],"achieve":[74],"better":[77,231],"tradeoff":[78],"between":[79],"performance":[83],"for":[84,147,172],"The":[89,179],"accuracy":[90],"rate":[93],"proposed":[96,119,141],"ACBN":[97,120,142,180,202],"extensively":[100],"evaluated":[101],"using":[102],"four":[103],"typical":[104],"models.":[106],"Compared":[107],"with":[108,225],"state-of-the-art":[110],"reference":[111,227],"design,":[112],"simulation":[115],"results":[116,196],"show":[117,197],"can":[121],"at":[122],"least":[123],"reduce":[124],"floating":[125],"point":[126],"operations":[127],"by":[128,135,222],"22.2%":[129],"save":[131],"external":[132],"access":[134],"33.3%":[136],"on":[137,156,184],"average.":[138,157],"Moreover,":[139],"introduces":[143],"63.6%":[144],"data":[145,170],"sparsity":[146,171],"backward":[149,174],"propagation":[150,175],"layers":[153],"VGG16":[155],"To":[158],"best":[160],"our":[162],"knowledge,":[163],"we":[164],"are":[165],"first":[167],"introduce":[169],"layers.":[178],"module":[181,204],"is":[182],"implemented":[183],"Zynq":[185],"UltraScale+":[186],"ZCU102":[187],"system-on-chip":[188],"(SoC)":[189],"field-programmable":[190],"gate":[191],"array":[192],"(FPGA),":[193],"that":[198],"implementation":[200],"saves":[205],"33.9%":[206],"look-up":[207],"table":[208],"(LUT),":[209],"49.4%":[210],"flip-flop":[211],"(FF),":[212],"75%":[213],"digital":[214],"signal":[215],"processor":[216],"(DSP),":[217],"reduces":[219],"power":[221],"12.4%":[223],"compared":[224],"design":[228],"while":[229],"achieving":[230]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4362689902","counts_by_year":[{"year":2024,"cited_by_count":2}],"updated_date":"2024-11-07T22:51:13.206741","created_date":"2023-04-08"}