{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,7,11]],"date-time":"2024-07-11T17:30:53Z","timestamp":1720719053265},"reference-count":32,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2018,10,28]],"date-time":"2018-10-28T00:00:00Z","timestamp":1540684800000},"content-version":"vor","delay-in-days":300,"URL":"http:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Procedia Computer Science"],"published-print":{"date-parts":[[2018]]},"DOI":"10.1016\/j.procs.2018.10.485","type":"journal-article","created":{"date-parts":[[2018,11,15]],"date-time":"2018-11-15T06:01:14Z","timestamp":1542261674000},"page":"339-346","update-policy":"http:\/\/dx.doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":1,"special_numbering":"C","title":["Automated Sentence Boundary Detection in Modern Standard Arabic Transcripts using Deep Neural Networks"],"prefix":"10.1016","volume":"142","author":[{"given":"Carlos-Emiliano","family":"Gonz\u00e1lez-Gallardo","sequence":"first","affiliation":[]},{"given":"Elvys Linhares","family":"Pontes","sequence":"additional","affiliation":[]},{"given":"Fatiha","family":"Sadat","sequence":"additional","affiliation":[]},{"given":"Juan-Manuel","family":"Torres-Moreno","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.procs.2018.10.485_bib0001","unstructured":"Alotaiby, F., Foda, S., Alkharashi, I., 2010. Clitics in arabic language: a statistical study, in: 24th Pacific Asia Conference on Language, Information and Computation."},{"key":"10.1016\/j.procs.2018.10.485_bib0002","unstructured":"Althobaiti, M., Kruschwitz, U., Poesio, M., 2014. Aranlp: A java-based library for the processing of arabic text, in: LREC."},{"key":"10.1016\/j.procs.2018.10.485_bib0003","series-title":"Handling Arabic morphological and syntactic ambiguity within the LFG framework with a view to machine translation","author":"Attia","year":"2008"},{"key":"10.1016\/j.procs.2018.10.485_bib0004","unstructured":"Bahdanau, D., Cho, K., Bengio, Y., 2014. Neural machine translation by jointly learning to align and translate. CoRR abs\/1409.0473."},{"key":"10.1016\/j.procs.2018.10.485_bib0005","unstructured":"Baldridge, J., 2005. The OpenNLP project. http:\/\/opennlp.apache.org\/."},{"key":"10.1016\/j.procs.2018.10.485_bib0006","doi-asserted-by":"crossref","unstructured":"Bojanowski, P., Grave, E., Joulin, A., Mikolov, T., 2016. Enriching word vectors with subword information. preprint arXiv:1607.04606.","DOI":"10.1162\/tacl_a_00051"},{"key":"10.1016\/j.procs.2018.10.485_bib0007","unstructured":"Diab, M., 2009. Second generation amira tools for arabic processing: Fast and robust tokenization, pos tagging, and base phrase chunking, in: 2nd International Conference on Arabic Language Resources and Tools."},{"key":"10.1016\/j.procs.2018.10.485_bib0008","doi-asserted-by":"crossref","first-page":"38","DOI":"10.1016\/j.procs.2017.10.092","article-title":"A web-based tool for arabic sentiment analysis","volume":"117","author":"El-Masri","year":"2017","journal-title":"Procedia Computer Science"},{"key":"10.1016\/j.procs.2018.10.485_bib0009","doi-asserted-by":"crossref","first-page":"14","DOI":"10.1145\/1644879.1644881","article-title":"Arabic natural language processing: Challenges and solutions","volume":"8","author":"Farghaly","year":"2009","journal-title":"ACM Transactions on Asian Language Information Processing (TALIP)"},{"key":"10.1016\/j.procs.2018.10.485_bib00010","doi-asserted-by":"crossref","first-page":"327","DOI":"10.1017\/S1351324904003523","article-title":"UIMA: An Architectural Approach to Unstructured Information Processing in the Corporate Research Environment","volume":"10","author":"Ferrucci","year":"2004","journal-title":"Natural Language Engineering"},{"key":"10.1016\/j.procs.2018.10.485_bib00011","unstructured":"Gonz\u00e1lez-Gallardo, C.E., Torres-Moreno, J.M., 2018. Sentence Boundary Detection for French with Subword-Level Information Vectors and Convolutional Neural Networks. preprint arXiv:1802.04559."},{"key":"10.1016\/j.procs.2018.10.485_bib00012","unstructured":"Gotoh, Y., Renals, S., 2000. Sentence boundary detection in broadcast speech transcripts, in: ASR2000-Automatic Speech Recognition: Challenges for the new Millenium ISCA Tutorial and Research Workshop (ITRW)."},{"key":"10.1016\/j.procs.2018.10.485_bib00013","unstructured":"Habash, N., Rambow, O., Roth, R., 2009. Mada+ tokan: A toolkit for arabic tokenization, diacritization, morphological disambiguation, pos tagging, stemming and lemmatization, in: 2nd International Conference on Arabic language resources and tools (MEDAR), Cairo, Egypt, p. 62."},{"key":"10.1016\/j.procs.2018.10.485_bib00014","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/978-3-031-02139-8","article-title":"Introduction to arabic natural language processing","volume":"3","author":"Habash","year":"2010","journal-title":"Synthesis Lectures on Human Language Technologies"},{"key":"10.1016\/j.procs.2018.10.485_bib00015","unstructured":"Hadrich, L.B., Baccour, L., Mourad, G., 2005. Star: un syst\u00e8me de segmentation de textes arabes bas\u00e9 sur lanalyse contextuelle des signes de ponctuations et de certaines particules, in: TALN\u201905."},{"key":"10.1016\/j.procs.2018.10.485_bib00016","doi-asserted-by":"crossref","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","article-title":"Long short-term memory","volume":"9","author":"Hochreiter","year":"1997","journal-title":"Neural Computation"},{"key":"10.1016\/j.procs.2018.10.485_bib00017","series-title":"A survey and comparative study of arabic nlp architectures, in: Intelligent Natural Language Processing: Trends and Applications","first-page":"585","author":"Jaafar","year":"2018"},{"key":"10.1016\/j.procs.2018.10.485_bib00018","series-title":"Natural Language Processing and Information Systems","first-page":"467","article-title":"Cross-language text summarization using sentence and multi-sentence compression","author":"Linhares Pontes","year":"2018"},{"key":"10.1016\/j.procs.2018.10.485_bib00019","doi-asserted-by":"crossref","first-page":"468","DOI":"10.1016\/j.csl.2005.06.002","article-title":"A study in machine learning from imbalanced data for sentence boundary detection in speech","volume":"20","author":"Liu","year":"2006","journal-title":"Computer Speech & Language"},{"key":"10.1016\/j.procs.2018.10.485_bib00020","series-title":"Intelligent Natural Language Processing: Trends and Applications","first-page":"101","article-title":"Automatic machine translation for arabic tweets","author":"Mallek","year":"2018"},{"key":"10.1016\/j.procs.2018.10.485_bib00021","doi-asserted-by":"crossref","unstructured":"Menacer, M.A., Mella, O., Fohr, D., Jouvet, D., Langlois, D., Smaili, K., 2017. An enhanced automatic speech recognition system for arabic, in: Third Arabic Natural Language Processing Workshop, pp. 157-165.","DOI":"10.18653\/v1\/W17-1319"},{"key":"10.1016\/j.procs.2018.10.485_bib00022","unstructured":"Mikolov, T., Chen, K., Corrado, G., Dean, J., 2013. Efficient estimation of word representations in vector space. preprint arXiv:1301.3781."},{"key":"10.1016\/j.procs.2018.10.485_bib00023","unstructured":"Pasha, A., Al-Badrashiny, M., Diab, M.T., El Kholy, A., Eskander, R., Habash, N., Pooleery, M., Rambow, O., Roth, R., 2014. Madamira: A fast, comprehensive tool for morphological analysis and disambiguation of arabic., in: LREC, pp. 1094\u20131101."},{"key":"10.1016\/j.procs.2018.10.485_bib00024","doi-asserted-by":"crossref","unstructured":"Pennington, J., Socher, R., Manning, C., 2014. Glove: Global vectors for word representation, in: Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 1532\u20131543.","DOI":"10.3115\/v1\/D14-1162"},{"key":"10.1016\/j.procs.2018.10.485_bib00025","series-title":"IEEE 2011 Workshop on Automatic Speech Recognition and Understanding","article-title":"The Kaldi speech recognition toolkit","author":"Povey","year":"2011"},{"key":"10.1016\/j.procs.2018.10.485_bib00026","doi-asserted-by":"crossref","unstructured":"Silberztein, M., 2005. Nooj: a linguistic annotation system for corpus processing, in: HLT\/EMNLP on Interactive Demonstrations, Association for Computational Linguistics. pp. 10-11.","DOI":"10.3115\/1225733.1225739"},{"key":"10.1016\/j.procs.2018.10.485_bib00027","unstructured":"Souteh, Y., Bouzoubaa, K., 2011. Safar platform and its morphological layer, in: Eleventh Conference on Language Engineering ESOLEC, pp. 14\u201315."},{"key":"10.1016\/j.procs.2018.10.485_bib00028","series-title":"in: Spoken Language Technology Workshop (SLT)","first-page":"285","article-title":"Lium asr systems for the 2016 multi-genre broadcast arabic challenge","author":"Tomashenko","year":"2016"},{"key":"10.1016\/j.procs.2018.10.485_bib00029","series-title":"Automatic Text Summarization","author":"Torres-Moreno","year":"2014"},{"key":"10.1016\/j.procs.2018.10.485_bib00030","doi-asserted-by":"crossref","unstructured":"Tran, N.T., Luong, V.T., Nguyen, N.L.T., Nghiem, M.Q., 2016. Effective attention-based neural architectures for sentence compression with bidirectional long short-term memory, in: Seventh Symposium on Information and Communication Technology, ACM, New York, NY, USA. pp. 123-130. URL: http:\/\/doi.acm.org\/10.1145\/3011077.3011111, doi:10.1145\/3011077.3011111.","DOI":"10.1145\/3011077.3011111"},{"key":"10.1016\/j.procs.2018.10.485_bib00031","series-title":"Automatic Speech Recognition","author":"Yu","year":"2016"},{"key":"10.1016\/j.procs.2018.10.485_bib00032","unstructured":"Zribi, I., Kammoun, I., Ellouze, M., Belguith, L., Blache, P., 2016. Sentence boundary detection for transcribed tunisian arabic, in: 13th Conference on Natural Language Processing (KONVENS 2016), pp. 323\u2013331."}],"container-title":["Procedia Computer Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1877050918321896?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1877050918321896?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2022,7,30]],"date-time":"2022-07-30T19:57:50Z","timestamp":1659211070000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1877050918321896"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"references-count":32,"alternative-id":["S1877050918321896"],"URL":"https:\/\/doi.org\/10.1016\/j.procs.2018.10.485","relation":{},"ISSN":["1877-0509"],"issn-type":[{"value":"1877-0509","type":"print"}],"subject":[],"published":{"date-parts":[[2018]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Automated Sentence Boundary Detection in Modern Standard Arabic Transcripts using Deep Neural Networks","name":"articletitle","label":"Article Title"},{"value":"Procedia Computer Science","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.procs.2018.10.485","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2018 The Author(s). Published by Elsevier B.V.","name":"copyright","label":"Copyright"}]}}