<?xml version="1.0" encoding="UTF-8"?><?xml-stylesheet type="text/xsl" href="static/style.xsl"?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd"><responseDate>2026-04-13T14:24:04Z</responseDate><request verb="GetRecord" identifier="oai:www.recercat.cat:2117/22969" metadataPrefix="didl">https://recercat.cat/oai/request</request><GetRecord><record><header><identifier>oai:recercat.cat:2117/22969</identifier><datestamp>2025-07-17T13:52:18Z</datestamp><setSpec>com_2072_1033</setSpec><setSpec>col_2072_452950</setSpec></header><metadata><d:DIDL xmlns:d="urn:mpeg:mpeg21:2002:02-DIDL-NS" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:doc="http://www.lyncode.com/xoai" xsi:schemaLocation="urn:mpeg:mpeg21:2002:02-DIDL-NS http://standards.iso.org/ittf/PubliclyAvailableStandards/MPEG-21_schema_files/did/didl.xsd">
   <!--
     OAI-PMH GetRecord response (metadataPrefix="didl") carrying one record whose
     metadata payload is this MPEG-21 DIDL document. The DIDL holds a single Item
     with two Descriptors: an identifier and a Dublin Core description.

     NOTE(review): the request's identifier attribute is
     "oai:www.recercat.cat:2117/22969" while the record header identifier is
     "oai:recercat.cat:2117/22969" (no "www."). Confirm that the repository
     treats both forms as the same item before matching on either string.

     NOTE(review): xmlns:xsi is declared on both OAI-PMH and d:DIDL with the same
     URI, and the "doc" prefix (http://www.lyncode.com/xoai) is declared on d:DIDL
     but no element or attribute in this record uses it.
   -->
   <d:Item id="hdl_2117_22969">
      <!-- Descriptor 1: the item's identifier as a DII Identifier (a urn:hdl value). -->
      <d:Descriptor>
         <d:Statement mimeType="application/xml; charset=utf-8">
            <dii:Identifier xmlns:dii="urn:mpeg:mpeg21:2002:01-DII-NS" xsi:schemaLocation="urn:mpeg:mpeg21:2002:01-DII-NS http://standards.iso.org/ittf/PubliclyAvailableStandards/MPEG-21_schema_files/dii/dii.xsd">urn:hdl:2117/22969</dii:Identifier>
         </d:Statement>
      </d:Descriptor>
      <!-- Descriptor 2: unqualified Dublin Core (oai_dc) description of the item. -->
      <d:Descriptor>
         <d:Statement mimeType="application/xml; charset=utf-8">
            <oai_dc:dc xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/" xmlns:dc="http://purl.org/dc/elements/1.1/" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">
               <dc:title>NaniBD: a set of tools for transcribing and validating speech databases</dc:title>
               <dc:creator>Nogueiras Rodríguez, Albino</dc:creator>
               <dc:creator>Moreno Bilbao, M. Asunción</dc:creator>
               <!--
                 Subjects: two hierarchical subject-area strings (levels separated
                 by "::"), followed by keyword terms given in English and Catalan.
                 NOTE(review): the remote-sensing subjects ("Teledetecció",
                 "Remote sensing") look unrelated to the speech-database abstract
                 below; confirm against the source repository.
               -->
               <dc:subject>Àrees temàtiques de la UPC::Enginyeria de la telecomunicació::Radiocomunicació i exploració electromagnètica::Teledetecció</dc:subject>
               <dc:subject>Àrees temàtiques de la UPC::Enginyeria de la telecomunicació::Processament del senyal::Processament de la parla i del senyal acústic</dc:subject>
               <dc:subject>Remote sensing</dc:subject>
               <dc:subject>Automatic speech recognition</dc:subject>
               <dc:subject>Teledetecció</dc:subject>
               <dc:subject>Reconeixement automàtic de la parla</dc:subject>
               <!--
                 Three dc:description elements follow: the abstract, then two short
                 status strings ("Peer Reviewed", "Postprint (published version)").
                 In the abstract every line ends with the character reference &#xd;
                 (carriage return) followed by a literal newline, so the text node
                 contains hard line breaks. That whitespace is part of the data:
                 do not re-indent or reflow the abstract when formatting this file.
               -->
               <dc:description>This paper describes NaniBD, a set of tools designed for&#xd;
transcribing and validating speech databases, developed at the&#xd;
Signal Processing Group (GPS) of the Department of Signal&#xd;
Theory and Communications of the Polytechnic University of&#xd;
Catalonia (TSC/UPC). The main purpose of its development&#xd;
was the need of a revision system in order to validate and&#xd;
annotate the Spanish corpus of SpeechDat (II) in the speech&#xd;
processing environment available at GPS. Despite of this,&#xd;
NaniBD is designed as a general-purpose system that might fit&#xd;
any other database, idiom or speech processing system. So far,&#xd;
the system has been used to revise some 200,000 speech files&#xd;
from three different corpora. In this paper we will focus our&#xd;
attention to the actual implementation used in the transcription&#xd;
of a SpeechDat (II) specifications compatible Catalonian corpus.&#xd;
1000 speakers, each of them uttering 44 files, compose this&#xd;
corpus. In this application, we use speech-noise detection,&#xd;
automatic recognition of spontaneous prompts, digit and letter&#xd;
to text translation and access to an external database in order to&#xd;
minimise the amount of time spent by human operators in the&#xd;
revision procedure.</dc:description>
               <dc:description>Peer Reviewed</dc:description>
               <dc:description>Postprint (published version)</dc:description>
               <!-- dc:date carries a year only (no month or day). -->
               <dc:date>1998</dc:date>
               <dc:type>Conference report</dc:type>
               <!-- dc:relation is a URL to a PDF hosted outside recercat.cat. -->
               <dc:relation>http://www.coli.uni-saarland.de/~regneri/courses/res4cl-07/papers/Nog98b.pdf</dc:relation>
               <!-- Three dc:rights values: a Creative Commons licence URL, an access-level label, and a licence name. -->
               <dc:rights>http://creativecommons.org/licenses/by-nc-nd/3.0/es/</dc:rights>
               <dc:rights>Open Access</dc:rights>
               <dc:rights>Attribution-NonCommercial-NoDerivs 3.0 Spain</dc:rights>
               <dc:publisher>European Language Resources Association (ELRA)</dc:publisher>
            </oai_dc:dc>
         </d:Statement>
      </d:Descriptor>
   </d:Item>
</d:DIDL></metadata></record></GetRecord></OAI-PMH>