<?xml version="1.0" encoding="UTF-8"?><?xml-stylesheet type="text/xsl" href="static/style.xsl"?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd"><responseDate>2026-04-14T04:44:41Z</responseDate><request verb="GetRecord" identifier="oai:www.recercat.cat:2117/429991" metadataPrefix="oai_dc">https://recercat.cat/oai/request</request><GetRecord><record><header><identifier>oai:recercat.cat:2117/429991</identifier><datestamp>2025-07-22T18:44:00Z</datestamp><setSpec>com_2072_1033</setSpec><setSpec>col_2072_452951</setSpec></header><metadata><oai_dc:dc xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:doc="http://www.lyncode.com/xoai" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">
   <dc:title>Analysis of Catalan-Castilian Code-Switching in Automatic Speech Recognition</dc:title>
   <dc:creator>Serra i Montes, Pol</dc:creator>
   <dc:contributor>Universitat Politècnica de Catalunya. Departament de Teoria del Senyal i Comunicacions</dc:contributor>
   <dc:contributor>Barcelona Supercomputing Center</dc:contributor>
   <dc:contributor>Hernando Pericás, Francisco Javier</dc:contributor>
   <dc:subject>Àrees temàtiques de la UPC::Enginyeria de la telecomunicació::Processament del senyal::Processament de la parla i del senyal acústic</dc:subject>
   <dc:subject>Automatic speech recognition</dc:subject>
   <dc:subject>Deep learning (Machine learning)</dc:subject>
   <dc:subject>Code switching (Linguistics))</dc:subject>
   <dc:subject>ASR</dc:subject>
   <dc:subject>Deep Learning</dc:subject>
   <dc:subject>Transformers</dc:subject>
   <dc:subject>Code-Switching</dc:subject>
   <dc:subject>Reconeixement automàtic de la parla</dc:subject>
   <dc:subject>Aprenentatge profund</dc:subject>
   <dc:subject>Alternança de codi (Lingüística)</dc:subject>
   <dc:description>This Master’s Thesis addresses the challenge of Catalan–Castilian code-switching in speech recognition. It develops synthetic corpora by combining machine-translated text chunks, large language model prompts, and semi-structured dialogues, then uses text-to-speech to produce audio samples. After fine-tuning ASR models, results indicate better recognition of artificially generated code-switching data but highlight limitations in real-world scenarios, such as emergency calls. The research underscores the need to incorporate more authentic recordings for stronger generalization, offering a practical framework to improve code-switching handling in multilingual ASR systems.</dc:description>
   <dc:date>2025-02-11</dc:date>
   <dc:type>Master thesis</dc:type>
   <dc:identifier>https://hdl.handle.net/2117/429991</dc:identifier>
   <dc:identifier>ETSETB-230.193669</dc:identifier>
   <dc:language>eng</dc:language>
   <dc:rights>S'autoritza la difusiÃ³ de l'obra mitjanÃ§ant la llicÃ¨ncia Creative Commons o similar 'Reconeixement-NoComercial- SenseObraDerivada'</dc:rights>
   <dc:rights>Open Access</dc:rights>
   <dc:format>application/pdf</dc:format>
   <dc:publisher>Universitat Politècnica de Catalunya</dc:publisher>
</oai_dc:dc></metadata></record></GetRecord></OAI-PMH>