<?xml version="1.0" encoding="UTF-8"?><?xml-stylesheet type="text/xsl" href="static/style.xsl"?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd"><responseDate>2026-04-14T06:55:54Z</responseDate><request verb="GetRecord" identifier="oai:www.recercat.cat:2117/112988" metadataPrefix="oai_dc">https://recercat.cat/oai/request</request><GetRecord><record><header><identifier>oai:recercat.cat:2117/112988</identifier><datestamp>2026-01-14T05:51:24Z</datestamp><setSpec>com_2072_1033</setSpec><setSpec>col_2072_452950</setSpec></header><metadata><oai_dc:dc xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:doc="http://www.lyncode.com/xoai" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">
   <dc:title>LSTM neural network-based speaker segmentation using acoustic and language modelling</dc:title>
   <dc:creator>India Massana, Miquel Àngel</dc:creator>
   <dc:creator>Rodríguez Fonollosa, José Adrián</dc:creator>
   <dc:creator>Hernando Pericás, Francisco Javier</dc:creator>
   <dc:contributor>Universitat Politècnica de Catalunya. Departament de Teoria del Senyal i Comunicacions</dc:contributor>
   <dc:contributor>Universitat Politècnica de Catalunya. VEU - Grup de Tractament de la Parla</dc:contributor>
   <dc:subject>Àrees temàtiques de la UPC::Enginyeria de la telecomunicació::Processament del senyal::Processament de la parla i del senyal acústic</dc:subject>
   <dc:subject>Automatic speech recognition</dc:subject>
   <dc:subject>Neural networks (Neurobiology)</dc:subject>
   <dc:subject>Speaker segmentation</dc:subject>
   <dc:subject>Neural language modelling</dc:subject>
   <dc:subject>I-vectors</dc:subject>
   <dc:subject>Speaker factors</dc:subject>
   <dc:subject>LSTM neural networks</dc:subject>
   <dc:subject>Reconeixement automàtic de la parla</dc:subject>
   <dc:subject>Xarxes neuronals (Neurobiologia)</dc:subject>
   <dc:description>This  paper  presents  a  new  speaker  change  detection  system based on Long Short-Term Memory (LSTM) neural networks  using  acoustic  data  and  linguistic  content.   Language modelling is combined with two different Joint Factor Analysis (JFA) acoustic approaches: i-vectors and speaker factors.  Both of them are compared with a baseline algorithm that uses cosine distance to detect speaker turn changes. LSTM neural networks with both linguistic and acoustic features have been able to produce a robust speaker segmentation.  The experimental results show that our proposal clearly outperforms the baseline system.</dc:description>
   <dc:description>Peer Reviewed</dc:description>
   <dc:description>Postprint (published version)</dc:description>
   <dc:date>2017</dc:date>
   <dc:type>Conference lecture</dc:type>
   <dc:identifier>India, M., Fonollosa, José A. R., Hernando, J. LSTM neural network-based speaker segmentation using acoustic and language modelling. A: Annual Conference of the International Speech Communication Association. "INTERSPEECH 2017: 20-24 August 2017: Stockholm". Stockholm: International Speech Communication Association (ISCA), 2017, p. 2834-2838.</dc:identifier>
   <dc:identifier>1990-9772</dc:identifier>
   <dc:identifier>https://hdl.handle.net/2117/112988</dc:identifier>
   <dc:identifier>10.21437/Interspeech.2017</dc:identifier>
   <dc:language>eng</dc:language>
   <dc:relation>http://www.isca-speech.org/archive/Interspeech_2017/pdfs/0407.PDF</dc:relation>
   <dc:relation>info:eu-repo/grantAgreement/EC/H2020/115902/EU/Remote Assessment of Disease and Relapse in Central Nervous System Disorders/RADAR-CNS</dc:relation>
   <dc:rights>Open Access</dc:rights>
   <dc:format>5 p.</dc:format>
   <dc:format>application/pdf</dc:format>
   <dc:publisher>International Speech Communication Association (ISCA)</dc:publisher>
</oai_dc:dc></metadata></record></GetRecord></OAI-PMH>