dc.contributor.author | Mamyrbayev, Orken | en |
dc.contributor.author | Pavlov, Sergii | en |
dc.contributor.author | Bekarystankyzy, Akbayan | en |
dc.contributor.author | Oralbekova, Dina | en |
dc.contributor.author | Zhumazhanov, Bagashar | en |
dc.contributor.author | Azarova, Larysa | en |
dc.contributor.author | Mussayeva, Dinara | en |
dc.contributor.author | Koval, Tetiana | en |
dc.contributor.author | Gromaszek, Konrad | en |
dc.contributor.author | Issimov, Nurdaulet | en |
dc.contributor.author | Shiyapov, Kadrzhan | en |
dc.contributor.author | Павлов, С. В. | uk |
dc.contributor.author | Азарова, Л. Є. | uk |
dc.date.accessioned | 2024-04-11T09:58:44Z | |
dc.date.available | 2024-04-11T09:58:44Z | |
dc.date.issued | 2023 | |
dc.identifier.citation | Mamyrbayev O., Pavlov S., Bekarystankyzy A., Oralbekova D., Zhumazhanov B., Azarova L., Mussayeva D., Koval T., Gromaszek K., Issimov N., Shiyapov K. Neurorecognition visualization in multitask end-to-end speech. Proc. SPIE 12985. Optical Fibers and Their Applications 2023. Vol. 12985. 129850G1-8. DOI: https://doi.org/10.1117/12.3022727. | en |
dc.identifier.issn | 0277-786X | |
dc.identifier.uri | http://ir.lib.vntu.edu.ua//handle/123456789/41441 | |
dc.description.abstract | Nowadays, speech-processing technologies with different language systems are successfully used in mobile and stationary
devices. Kazakh is considered a low-resource language, which poses various challenges for conventional speech
recognition methods. This paper proposes a model capable of multitasking and handling concurrent speech
recognition, dialect identification, and speaker identification, all in an end-to-end framework. The developed multitask
model enables training three different tasks within a single model. A multitask recognition system is created based on the
WaveNet-CTC model. Experiments show that, for the specific task, the end-to-end multitask model performs better
than other models. | en |
dc.language.iso | en | en |
dc.publisher | Society of Photo-Optical Instrumentation Engineers | en |
dc.relation.ispartof | Proc. SPIE 12985. Optical Fibers and Their Applications 2023. Vol. 12985. 129850G1-8. | en |
dc.subject | end-to-end | en |
dc.subject | multitask training | en |
dc.subject | speech recognition | en |
dc.subject | speaker identification | en |
dc.subject | dialect identification | en |
dc.title | Neurorecognition visualization in multitask end-to-end speech | en |
dc.type | Article | |
dc.identifier.doi | https://doi.org/10.1117/12.3022727 | |