@ARTICLE{Pondel-Sycz_K._System_Early, author={Pondel-Sycz, K. and Bilski, P.}, journal={Bulletin of the Polish Academy of Sciences Technical Sciences}, pages={e149818}, howpublished={online}, year={Early Access}, abstract={The paper presents the analysis of modern Artificial Intelligence algorithms for the automated system supporting human beings during their conversation in Polish language. Their task is to perform Automatic Speech Recognition (ASR) and process it further, for instance fill the computer-based form or perform the Natural Language Processing (NLP) to assign the conversation to one of predefined categories. The State-of-the-Art review is required to select the optimal set of tools to process speech in the difficult conditions, which degrade accuracy of ASR. The paper presents the top-level architecture of the system applicable for the task. Characteristics of Polish language are discussed. Next, existing ASR solutions and architectures with the End-To-End (E2E) deep neural network (DNN) based ASR models are presented in detail. Differences between Recurrent Neural Networks (RNN), Convolutional Neural Networks (CNN) and Transformers in the context of ASR technology are also discussed.}, type={Article}, title={System dedicated to Polish Automatic Speech Recognition - overview of solutions}, URL={http://www.journals.pan.pl/Content/130882/PDF-MASTER/BPASTS-04016-EA.pdf}, doi={10.24425/bpasts.2024.149818}, keywords={automatic speech recognition, deep neural networks, transformer, conformer}, }