iBet uBet web content aggregator. Adding the entire web to your favor.
iBet uBet web content aggregator. Adding the entire web to your favor.



Link to original content: https://api.openalex.org/works/doi:10.21437/EUROSPEECH.2003-723
{"id":"https://openalex.org/W170533338","doi":"https://doi.org/10.21437/eurospeech.2003-723","title":"syncpitch: a pseudo pitch synchronous algorithm for speaker recognition","display_name":"syncpitch: a pseudo pitch synchronous algorithm for speaker recognition","publication_year":2003,"publication_date":"2003-09-01","ids":{"openalex":"https://openalex.org/W170533338","doi":"https://doi.org/10.21437/eurospeech.2003-723","mag":"170533338"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.2003-723","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050001246","display_name":"Ran D. Zilca","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ran D. Zilca","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039085741","display_name":"Ji\u0159\u00ed Navr\u00e1til","orcid":"https://orcid.org/0000-0001-6348-0812"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiri Navratil","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5111944718","display_name":"Ganesh N. Ramaswamy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ganesh N. Ramaswamy","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.913,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.635881,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":74,"max":76},"biblio":{"volume":null,"issue":null,"first_page":"2649","last_page":"2652"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition Technology","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition Technology","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech Enhancement Techniques","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Audio Signal Classification and Analysis","score":0.9942,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pitch-detection-algorithm","display_name":"Pitch detection algorithm","score":0.7083651},{"id":"https://openalex.org/keywords/nist","display_name":"NIST","score":0.6999881},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.6421143},{"id":"https://openalex.org/keywords/speaker-verification","display_name":"Speaker Verification","score":0.591888},{"id":"https://openalex.org/keywords/audio-event-detection","display_name":"Audio Event Detection","score":0.553102},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.55076146},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.54343927},{"id":"https://openalex.org/keywords/automatic-speech-recognition","display_name":"Automatic Speech Recognition","score":0.534461},{"id":"https://openalex.org/keywords/speaker-diarization","display_name":"Speaker Diarization","score":0.531456},{"id":"https://openalex.org/keywords/audio-visual-speech-recognition","display_name":"Audio-Visual Speech Recognition","score":0.530001},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.5016146},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.4686586}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.79055953},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7454867},{"id":"https://openalex.org/C135622632","wikidata":"https://www.wikidata.org/wiki/Q7198851","display_name":"Pitch detection algorithm","level":3,"score":0.7083651},{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.6999881},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.6421143},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.5963661},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.55076146},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.54343927},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5201567},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.5016146},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.48760882},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.4686586},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.4169107},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37618124},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3015227},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.27745196},{"id":"https://openalex.org/C84462506","wikidata":"https://www.wikidata.org/wiki/Q173142","display_name":"Digital signal processing","level":2,"score":0.1435869},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.2003-723","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality education","id":"https://metadata.un.org/sdg/4","score":0.8}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":10,"referenced_works":["https://openalex.org/W1503442377","https://openalex.org/W1997873121","https://openalex.org/W2014181881","https://openalex.org/W2078953162","https://openalex.org/W2113810833","https://openalex.org/W2139037446","https://openalex.org/W2153408936","https://openalex.org/W2167768673","https://openalex.org/W2397634864","https://openalex.org/W86348706"],"related_works":["https://openalex.org/W4385672897","https://openalex.org/W3146151004","https://openalex.org/W2387604097","https://openalex.org/W2373675101","https://openalex.org/W2206035908","https://openalex.org/W2141992701","https://openalex.org/W2018086531","https://openalex.org/W1980297060","https://openalex.org/W1963976507","https://openalex.org/W106160982"],"abstract_inverted_index":{"Pitch":[0],"mismatch":[1],"between":[2],"enrollment":[3],"and":[4,47,83],"testing":[5],"is":[6,15,132],"a":[7,58,85,92,116,129],"common":[8],"problem":[9],"in":[10,29,41,51,139],"speaker":[11,35,136],"recognition":[12],"systems.":[13],"It":[14],"well":[16],"known":[17],"that":[18,64,100],"the":[19,44,71,95,109,121,143],"fine":[20],"spectral":[21],"structure":[22],"related":[23],"to":[24,66,79,134],"fundamental":[25],"frequency":[26],"manifests":[27],"itself":[28],"Mel":[30],"cepstral":[31],"features":[32],"used":[33],"for":[34],"recognition.":[36],"Therefore":[37],"pitch":[38,68,81,87,103,110],"variations":[39],"result":[40],"variation":[42],"of":[43,94,126],"acoustic":[45],"features,":[46],"potentially":[48],"an":[49],"increase":[50],"error":[52],"rate.":[53],"A":[54],"previous":[55],"study":[56],"introduced":[57],"signal":[59,73],"processing":[60,105],"procedure":[61],"termed":[62,98],"depitch":[63,96],"attempts":[65],"remove":[67],"information":[69],"from":[70],"speech":[72,77,122],"by":[74],"forcing":[75],"every":[76],"frame":[78],"be":[80],"synchronous":[82,104],"include":[84],"single":[86],"cycle.":[88],"This":[89],"paper":[90],"presents":[91],"modification":[93],"algorithm,":[97],"syncpitch,":[99],"performs":[101],"pseudo":[102],"while":[106],"still":[107],"preserving":[108],"information.":[111],"The":[112],"new":[113],"algorithm":[114],"has":[115],"relatively":[117],"moderate":[118],"effect":[119],"on":[120,142],"signal.":[123],"System":[124],"combination":[125],"syncpitch":[127],"with":[128],"baseline":[130],"system":[131],"shown":[133],"improve":[135],"verification":[137],"accuracy":[138],"experiments":[140],"conducted":[141],"2002":[144],"NIST":[145],"Speaker":[146],"Recognition":[147],"Evaluation":[148],"data.":[149]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W170533338","counts_by_year":[{"year":2014,"cited_by_count":1}],"updated_date":"2024-10-23T07:50:40.776751","created_date":"2016-06-24"}