%Aigaion2 BibTeX export from Idiap Publications
%Thursday 21 November 2024 01:10:59 PM

% Idiap research report on subword segmentation for open-vocabulary German ASR.
% NOTE(review): the institution and number fields below were derived from the
% citation key, the projects field and the export header -- confirm them against
% the report's cover page. The label formerly stored in booktitle now lives in
% the type field, which is the field report styles actually read.
@techreport{Khosravani_Idiap-RR-06-2020,
  author      = {Khosravani, Abbas and Musat, Claudiu and Garner, Philip N. and Lazaridis, Alexandros},
  title       = {Comparison of Subword Segmentation Methods for Open-vocabulary {ASR} using a Difficulty Metric},
  type        = {Technical Report},
  number      = {Idiap-RR-06-2020},
  institution = {Idiap},
  month       = apr,
  year        = {2020},
  keywords    = {end-to-end, German language, open vocabulary, speech recognition, subword segmentation},
  projects    = {Idiap},
  abstract    = {We experiment with subword segmentation approaches that are widely used to address the open vocabulary problem in the context of end-to-end automatic speech recognition (ASR). For morphologically rich languages such as German which has many rare words mainly due to compound words, there is an increasing interest in subword-level word representation based on, e.g., byte-pair encoding and unigram language model. However, we are not aware of any systematic comparative analysis of different approaches. To this end, we propose a framework which estimates a difficulty score of a test utterance for the ASR model based on an out-of-vocabulary metric. Using this framework we run experiments on several subword segmentation approaches, which provides us with comparative analysis on the strengths and weaknesses of them. For the ASR model, we employ a fully convolutional sequence-to-sequence encoder architecture using time-depth separable convolution blocks and a lexicon-free beam search decoding with n-grams subword language model. Additionally, we leverage multiple models with different word representations to investigate their impact on ASR performance.},
  pdf         = {https://publications.idiap.ch/attachments/reports/2020/Khosravani_Idiap-RR_06-2020.pdf},
}