<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" href="static/style.xsl"?>
<OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/"
         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
         xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd">
<responseDate>2026-04-13T07:14:45Z</responseDate>
<request verb="GetRecord" identifier="oai:www.recercat.cat:2117/22969" metadataPrefix="mets">https://recercat.cat/oai/request</request>
<GetRecord>
<record>
<header>
<identifier>oai:recercat.cat:2117/22969</identifier>
<datestamp>2025-07-17T13:52:18Z</datestamp>
<setSpec>com_2072_1033</setSpec>
<setSpec>col_2072_452950</setSpec>
</header>
<metadata>
<mets xmlns="http://www.loc.gov/METS/"
      xmlns:xlink="http://www.w3.org/1999/xlink"
      xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
      xmlns:doc="http://www.lyncode.com/xoai"
      ID="DSpace_ITEM_2117-22969"
      OBJID="hdl:2117/22969"
      TYPE="DSpace ITEM"
      PROFILE="DSpace METS SIP Profile 1.0"
      xsi:schemaLocation="http://www.loc.gov/METS/ http://www.loc.gov/standards/mets/mets.xsd">
   <!-- METS header: creation timestamp of this METS document and the custodian agent. -->
   <!-- CREATEDATE is given in UTC. The previous value (09:14:45Z) was exactly two hours
        ahead of the enclosing OAI-PMH responseDate (07:14:45Z), i.e. a local wall-clock
        time carrying a "Z" designator it was not entitled to. -->
   <metsHdr CREATEDATE="2026-04-13T07:14:45Z">
      <agent ROLE="CUSTODIAN" TYPE="ORGANIZATION">
         <name>RECERCAT</name>
      </agent>
   </metsHdr>
   <!-- Descriptive metadata section: one MODS record wrapped for the item hdl:2117/22969. -->
   <dmdSec ID="DMD_2117_22969">
      <mdWrap MDTYPE="MODS">
         <!-- The schema location hint is carried once, on the MODS root element below. -->
         <xmlData xmlns:mods="http://www.loc.gov/mods/v3">
            <mods:mods xsi:schemaLocation="http://www.loc.gov/mods/v3 http://www.loc.gov/standards/mods/v3/mods-3-1.xsd">
               <mods:name>
                  <mods:role>
                     <mods:roleTerm type="text">author</mods:roleTerm>
                  </mods:role>
                  <mods:namePart>Nogueiras Rodríguez, Albino</mods:namePart>
               </mods:name>
               <mods:name>
                  <mods:role>
                     <mods:roleTerm type="text">author</mods:roleTerm>
                  </mods:role>
                  <mods:namePart>Moreno Bilbao, M. Asunción</mods:namePart>
               </mods:name>
               <mods:originInfo>
                  <mods:dateIssued encoding="iso8601">1998</mods:dateIssued>
               </mods:originInfo>
               <!-- Was an empty element with type="none"; populated with the item handle
                    that this record already uses in its section and object identifiers. -->
               <mods:identifier type="hdl">hdl:2117/22969</mods:identifier>
               <!-- Abstract text is kept verbatim; only the carriage-return hard wraps were
                    removed so the paragraph is delivered as continuous text. -->
               <mods:abstract>This paper describes NaniBD, a set of tools designed for transcribing and validating speech databases, developed at the Signal Processing Group (GPS) of the Department of Signal Theory and Communications of the Polytechnic University of Catalonia (TSC/UPC). The main purpose of its development was the need of a revision system in order to validate and annotate the Spanish corpus of SpeechDat (II) in the speech processing environment available at GPS. Despite of this, NaniBD is designed as a general-purpose system that might fit any other database, idiom or speech processing system. So far, the system has been used to revise some 200,000 speech files from three different corpora. In this paper we will focus our attention to the actual implementation used in the transcription of a SpeechDat (II) specifications compatible Catalonian corpus. 1000 speakers, each of them uttering 44 files, compose this corpus. In this application, we use speech-noise detection, automatic recognition of spontaneous prompts, digit and letter to text translation and access to an external database in order to minimise the amount of time spent by human operators in the revision procedure.</mods:abstract>
               <!-- These two statements were previously fused onto the end of the abstract
                    without any separator; they are separate descriptive notes. -->
               <mods:note type="peer review">Peer Reviewed</mods:note>
               <mods:note type="version identification">Postprint (published version)</mods:note>
               <!-- NOTE(review): the original languageTerm was empty. "en" is inferred from
                    the English title and abstract; confirm against the repository record. -->
               <mods:language>
                  <mods:languageTerm type="code" authority="rfc3066">en</mods:languageTerm>
               </mods:language>
               <mods:accessCondition type="useAndReproduction">http://creativecommons.org/licenses/by-nc-nd/3.0/es/ Open Access Attribution-NonCommercial-NoDerivs 3.0 Spain</mods:accessCondition>
               <mods:subject>
                  <mods:topic>Àrees temàtiques de la UPC::Enginyeria de la telecomunicació::Radiocomunicació i exploració electromagnètica::Teledetecció</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Àrees temàtiques de la UPC::Enginyeria de la telecomunicació::Processament del senyal::Processament de la parla i del senyal acústic</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Remote sensing</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Automatic speech recognition</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Teledetecció</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Reconeixement automàtic de la parla</mods:topic>
               </mods:subject>
               <mods:titleInfo>
                  <mods:title>NaniBD: a set of tools for transcribing and validating speech databases</mods:title>
               </mods:titleInfo>
               <mods:genre>Conference report</mods:genre>
            </mods:mods>
         </xmlData>
      </mdWrap>
   </dmdSec>
   <!-- Logical structure map: a single div standing for the item's contents. -->
   <structMap LABEL="DSpace Object" TYPE="LOGICAL">
      <!-- DMD_2117_22969 is the ID of a dmdSec, so it is referenced through DMDID;
           ADMID is reserved for administrative metadata sections (amdSec and children). -->
      <div TYPE="DSpace Object Contents" DMDID="DMD_2117_22969"/>
   </structMap>
</mets></metadata></record></GetRecord></OAI-PMH>