% Bibliography exported from MTMT (citation keys are the MTMT record ids and
% must stay unchanged, since documents cite by them).
%
% Conventions used in this file:
%   - one field per line, author/title first, identifiers last;
%   - names in "Last, First" form, initials separated by a space;
%   - page ranges written with a double hyphen;
%   - acronyms and proper nouns in titles protected with braces;
%   - the non-standard fields journal-iso, unique-id, eissn and orcid-numbers
%     are kept from the export and are ignored by standard styles.
%
% NOTE(review): several records lack fields that their entry type requires
% (booktitle for MTMT:34543490, school for the four theses). The export does
% not contain them, so they are left out rather than guessed.

% NOTE(review): booktitle is missing from the export for this record.
@inproceedings{MTMT:34543490,
  author        = {Mehra, P. and Verma, S. Kant},
  title         = {Comparing Classifiers for Recognizing the Emotions by Extracting the Spectral Features of Speech Using Machine Learning},
  year          = {2023},
  pages         = {387--391},
  doi           = {10.1109/DICCT56244.2023.10110282},
  url           = {https://m2.mtmt.hu/api/publication/34543490},
  unique-id     = {34543490},
}

@article{MTMT:33634015,
  author        = {Bhatia, S. and Devi, A. and Alsuwailem, R. I. and Mashat, A.},
  title         = {Convolutional Neural Network Based Real Time {Arabic} Speech Recognition to {Arabic} {Braille} for Hearing and Visually Impaired},
  journal       = {Frontiers in Public Health},
  journal-iso   = {FRONT PUBLIC HEALTH},
  volume        = {10},
  year          = {2022},
  doi           = {10.3389/fpubh.2022.898355},
  url           = {https://m2.mtmt.hu/api/publication/33634015},
  eissn         = {2296-2565},
  unique-id     = {33634015},
}

@article{MTMT:33634014,
  author        = {Mehra, P. and Jain, P.},
  title         = {{ERIL}: An Algorithm for Emotion Recognition from {Indian} Languages Using Machine Learning},
  journal       = {Wireless Personal Communications},
  journal-iso   = {WIRELESS PERS COMMUN},
  volume        = {126},
  year          = {2022},
  pages         = {2557--2577},
  doi           = {10.1007/s11277-022-09829-1},
  url           = {https://m2.mtmt.hu/api/publication/33634014},
  issn          = {0929-6212},
  eissn         = {1572-834X},
  unique-id     = {33634014},
}

@article{MTMT:33634027,
  author        = {Mehra, Pramod and Verma, Shashi Kant},
  title         = {{BERIS}: An {mBERT}-based Emotion Recognition Algorithm from {Indian} Speech},
  journal       = {ACM Transactions on Asian and Low-Resource Language Information Processing},
  journal-iso   = {ACM T ASIAN LOW-RESO},
  volume        = {21},
  year          = {2022},
  pages         = {1--19},
  doi           = {10.1145/3517195},
  url           = {https://m2.mtmt.hu/api/publication/33634027},
  issn          = {2375-4699},
  eissn         = {2375-4702},
  unique-id     = {33634027},
  orcid-numbers = {Mehra, Pramod/0000-0003-2329-2547},
  abstract      = {Emotions, the building blocks of the human intellect, play a vital role in Artificial Intelligence (AI). For a robust AI-based machine, it is important that the machine understands human emotions. COVID-19 has introduced the world to no-touch intelligent systems. With an influx of users, it is critical to create devices that can communicate in a local dialect. A multilingual system is required in countries like India, which has a large population and a diverse range of languages. Given the importance of multilingual emotion recognition, this research introduces BERIS, an Indian language emotion detection system. From the Indian sound recording, BERIS estimates both acoustic and textual characteristics. To extract the textual features, we used Multilingual Bidirectional Encoder Representations from Transformers. For acoustics, BERIS computes the Mel Frequency Cepstral Coefficients and Linear Prediction coefficients, and Pitch. The features extracted are merged in a linear array. Since the dialogues are of varied lengths, the data are normalized to have arrays of equal length. Finally, we split the data into training and validated set to construct a predictive model. The model can predict emotions from the new input. On all the datasets presented, quantitative and qualitative evaluations show that the proposed algorithm outperforms state-of-the-art approaches.},
}

@inproceedings{MTMT:33634018,
  author        = {Choudhary, H. and Sadhya, D. and Patel, V.},
  title         = {Automatic Speaker Verification using Gammatone Frequency Cepstral Coefficients},
  booktitle     = {2021 8th International Conference on Signal Processing and Integrated Networks (SPIN)},
  year          = {2021},
  pages         = {424--428},
  doi           = {10.1109/SPIN52536.2021.9566150},
  url           = {https://m2.mtmt.hu/api/publication/33634018},
  unique-id     = {33634018},
}

@article{MTMT:33634017,
  author        = {Malik, M. and Malik, M. K. and Mehmood, K. and Makhdoom, I.},
  title         = {Automatic speech recognition: a survey},
  journal       = {Multimedia Tools and Applications: An International Journal},
  journal-iso   = {MULTIMED TOOLS APPL},
  volume        = {80},
  year          = {2021},
  pages         = {9411--9457},
  doi           = {10.1007/s11042-020-10073-7},
  url           = {https://m2.mtmt.hu/api/publication/33634017},
  issn          = {1380-7501},
  eissn         = {1573-7721},
  unique-id     = {33634017},
}

% Author names were exported as "Given, Family"; the family-name-first form
% below matches "Kadyan, Virender" as used in MTMT:27393751.
@misc{MTMT:33634055,
  author        = {Bawa, Puneet and Kadyan, Virender and Kumar, Vaibhav and Raghuwanshi, Ghanshyam},
  title         = {Spectral-warping based noise-robust enhanced children {ASR} system},
  year          = {2021},
  doi           = {10.21203/rs.3.rs-976955/v1},
  url           = {https://m2.mtmt.hu/api/publication/33634055},
  unique-id     = {33634055},
}

@article{MTMT:33634016,
  author        = {Raj, P. P.},
  title         = {Real-time pre-processing for improved feature extraction of noisy speech},
  journal       = {International Journal of Speech Technology},
  journal-iso   = {INT J SPEECH TECH},
  volume        = {24},
  year          = {2021},
  pages         = {715--728},
  doi           = {10.1007/s10772-021-09835-x},
  url           = {https://m2.mtmt.hu/api/publication/33634016},
  issn          = {1381-2416},
  eissn         = {1572-8110},
  unique-id     = {33634016},
}

@article{MTMT:33634105,
  author        = {Sadeghi, Mohsen and Marvi, Hossein and Ahmadyfard, Ali Reza},
  title         = {A New and Efficient Feature Extraction Method for Robust Speech Recognition Based on Fractional {Fourier} Transform and Differential Evolution Optimizer},
  journal       = {Journal of Modeling in Engineering},
  journal-iso   = {J MODEL ENG},
  volume        = {18},
  year          = {2020},
  pages         = {85--96},
  doi           = {10.22075/JME.2020.19267.1821},
  url           = {https://m2.mtmt.hu/api/publication/33634105},
  issn          = {2008-4854},
  unique-id     = {33634105},
}

@article{MTMT:33634019,
  author        = {Ouisaadane, A. and Safi, S. and Frikel, M.},
  title         = {{Arabic} digits speech recognition and speaker identification in noisy environment using a hybrid model of {VQ} and {GMM}},
  journal       = {TELKOMNIKA},
  journal-iso   = {TELKOMNIKA},
  volume        = {18},
  year          = {2020},
  pages         = {2193--2204},
  doi           = {10.12928/TELKOMNIKA.V18I4.14215},
  url           = {https://m2.mtmt.hu/api/publication/33634019},
  issn          = {1693-6930},
  eissn         = {2302-9293},
  unique-id     = {33634019},
}

% NOTE(review): school is missing from the export for this thesis.
@mastersthesis{MTMT:33634181,
  author        = {Arcos Gordillo, Christian Dayan},
  title         = {Realce e Reconhecimento de Voz Contínua em Ambientes Adversos},
  year          = {2018},
  url           = {https://m2.mtmt.hu/api/publication/33634181},
  unique-id     = {33634181},
}

% NOTE(review): school is missing from the export for this thesis. The name is
% braced as a single unit so that it is printed in its original order; confirm
% against the thesis title page.
@mastersthesis{MTMT:33634195,
  author        = {{Nan Phyu Phyu Hsan}},
  title         = {A Study on Isolated-Word {Myanmar} Speech Recognition via Artificial Neural Networks},
  year          = {2018},
  url           = {https://m2.mtmt.hu/api/publication/33634195},
  unique-id     = {33634195},
}

@article{MTMT:27393749,
  author        = {Chenchah, Farah and Lachiri, Zied},
  title         = {A bio-inspired emotion recognition system under real-life conditions},
  journal       = {Applied Acoustics},
  journal-iso   = {APPL ACOUST},
  volume        = {115},
  year          = {2017},
  pages         = {6--14},
  doi           = {10.1016/j.apacoust.2016.06.020},
  url           = {https://m2.mtmt.hu/api/publication/27393749},
  issn          = {0003-682X},
  eissn         = {1872-910X},
  unique-id     = {27393749},
}

@article{MTMT:27393752,
  author        = {Pardede, Hilman Ferdinandus},
  title         = {Teknik Normalisasi Fitur Secara Adaptif untuk Sistem Pengenalan Ucapan Tahan Terhadap Gema},
  journal       = {Inkom. Jurnal Informatika, Sistem Kendali, dan Komputer},
  journal-iso   = {Inkom. Jurnal Informatika, Sistem Kendali, dan Komputer},
  volume        = {10},
  year          = {2017},
  pages         = {47--56},
  url           = {https://m2.mtmt.hu/api/publication/27393752},
  eissn         = {2302-6146},
  unique-id     = {27393752},
}

% NOTE(review): this record was exported without an entry type, which BibTeX
% rejects. It is typed as misc because the export gives no venue; publisher and
% pages suggest a conference paper, so switch to inproceedings once the
% booktitle is confirmed.
@misc{MTMT:27393751,
  author        = {Kaur, Arshpreet and Singh, Amitoj and Kadyan, Virender},
  title         = {Correlative consideration concerning feature extraction techniques for speech recognition—A review},
  publisher     = {Institute of Electrical and Electronics Engineers},
  year          = {2016},
  pages         = {1--4},
  url           = {https://m2.mtmt.hu/api/publication/27393751},
  unique-id     = {27393751},
}

@article{MTMT:31993097,
  author        = {Kim, Chanwoo and Stern, Richard M.},
  title         = {Power-Normalized Cepstral Coefficients ({PNCC}) for Robust Speech Recognition},
  journal       = {IEEE-ACM Transactions on Audio Speech and Language Processing},
  journal-iso   = {IEEE-ACM T AUDIO SPE},
  volume        = {24},
  year          = {2016},
  pages         = {1315--1329},
  doi           = {10.1109/TASLP.2016.2545928},
  url           = {https://m2.mtmt.hu/api/publication/31993097},
  issn          = {2329-9290},
  eissn         = {2329-9304},
  unique-id     = {31993097},
  orcid-numbers = {Stern, Richard M./0000-0003-0557-7282},
}

@article{MTMT:27393748,
  author        = {Eringis, Deividas and Tamulevicius, Gintautas},
  title         = {Modified Filterbank Analysis Features for Speech Recognition},
  journal       = {Baltic Journal of Modern Computing},
  journal-iso   = {BJMC},
  volume        = {3},
  year          = {2015},
  pages         = {29},
  url           = {https://m2.mtmt.hu/api/publication/27393748},
  issn          = {2255-8942},
  eissn         = {2255-8950},
  unique-id     = {27393748},
}

% NOTE(review): school is missing from the export for this thesis. Author name
% reordered from the all-caps export; confirm against the thesis title page.
@mastersthesis{MTMT:33634211,
  author        = {Asís López, Maximiliano Epifanio},
  title         = {Creación de software de reconocimiento de voz para escritura de expresiones algebraicas y su nivel de eficiencia con el estándar {WER}-2015},
  year          = {2015},
  url           = {https://m2.mtmt.hu/api/publication/33634211},
  unique-id     = {33634211},
}

@article{MTMT:27393744,
  author        = {Cutajar, Michelle and Gatt, Edward and Grech, Ivan and Casha, Owen and Micallef, Joseph},
  title         = {Comparative study of automatic speech recognition techniques},
  journal       = {IET Signal Processing},
  journal-iso   = {IET SIGNAL PROCESS},
  volume        = {7},
  year          = {2013},
  pages         = {25--46},
  doi           = {10.1049/iet-spr.2012.0151},
  url           = {https://m2.mtmt.hu/api/publication/27393744},
  issn          = {1751-9675},
  eissn         = {1751-9683},
  unique-id     = {27393744},
}

% NOTE(review): this record was exported without an entry type, which BibTeX
% rejects. It is typed as misc because the export gives no venue; publisher and
% pages suggest a conference paper, so switch to inproceedings once the
% booktitle is confirmed.
@misc{MTMT:27393747,
  author        = {Anand, Anu V and Devi, P Shobana and Stephen, Jose and Bhadran, V. K.},
  title         = {{Malayalam} Speech Recognition system and its application for visually impaired people},
  publisher     = {Institute of Electrical and Electronics Engineers},
  year          = {2012},
  pages         = {619--624},
  url           = {https://m2.mtmt.hu/api/publication/27393747},
  unique-id     = {27393747},
}

% NOTE(review): school is missing from the export for this thesis.
@mastersthesis{MTMT:27393750,
  author        = {Andersstuen, Runar and Marcussen, Christoffer Jun},
  title         = {{TaleTUC}: Automatic Speech Recognition for a Bus Route Information System},
  year          = {2012},
  url           = {https://m2.mtmt.hu/api/publication/27393750},
  unique-id     = {27393750},
}

@inproceedings{MTMT:27393743,
  author        = {Kim, Chanwoo and Stern, Richard M.},
  title         = {Power-normalized cepstral coefficients ({PNCC}) for robust speech recognition},
  booktitle     = {2012 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2012},
  publisher     = {Institute of Electrical and Electronics Engineers},
  year          = {2012},
  pages         = {4101--4104},
  doi           = {10.1109/ICASSP.2012.6288820},
  url           = {https://m2.mtmt.hu/api/publication/27393743},
  unique-id     = {27393743},
}

% The export stored the series inside the volume field ("6800 LNCS"); it is
% split into series and volume here.
@inproceedings{MTMT:33634022,
  author        = {Sárosi, G. and Mozsolics, T. and Tarján, B. and Balog, A. and Mihajlik, P. and Fegyó, T.},
  title         = {Recognition of multiple language voice navigation queries in traffic situations},
  booktitle     = {Analysis of Verbal and Nonverbal Communication and Enactment. The Processing Issues},
  series        = {Lecture Notes in Computer Science},
  volume        = {6800},
  year          = {2011},
  pages         = {199--213},
  doi           = {10.1007/978-3-642-25775-9_20},
  url           = {https://m2.mtmt.hu/api/publication/33634022},
  unique-id     = {33634022},
}