<?xml version="1.0" encoding="UTF-8"?><?xml-stylesheet type="text/xsl" href="static/style.xsl"?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd"><responseDate>2026-04-19T22:14:49Z</responseDate><request verb="GetRecord" identifier="oai:www.recercat.cat:2117/460649" metadataPrefix="mets">https://recercat.cat/oai/request</request><GetRecord><record><header><identifier>oai:recercat.cat:2117/460649</identifier><datestamp>2026-04-17T04:01:50Z</datestamp><setSpec>com_2072_1033</setSpec><setSpec>col_2072_452951</setSpec></header><metadata><mets xmlns="http://www.loc.gov/METS/" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:doc="http://www.lyncode.com/xoai" ID="DSpace_ITEM_2117-460649" TYPE="DSpace ITEM" PROFILE="DSpace METS SIP Profile 1.0" xsi:schemaLocation="http://www.loc.gov/METS/ http://www.loc.gov/standards/mets/mets.xsd" OBJID="hdl:2117/460649">
   <metsHdr CREATEDATE="2026-04-19T22:14:49Z">
      <agent ROLE="CUSTODIAN" TYPE="ORGANIZATION">
         <name>RECERCAT</name>
      </agent>
   </metsHdr>
   <dmdSec ID="DMD_2117_460649">
      <mdWrap MDTYPE="MODS">
         <xmlData xmlns:mods="http://www.loc.gov/mods/v3" xsi:schemaLocation="http://www.loc.gov/mods/v3 http://www.loc.gov/standards/mods/v3/mods-3-1.xsd">
            <mods:mods xsi:schemaLocation="http://www.loc.gov/mods/v3 http://www.loc.gov/standards/mods/v3/mods-3-1.xsd">
               <mods:name>
                  <mods:role>
                     <mods:roleTerm type="text">author</mods:roleTerm>
                  </mods:role>
                  <mods:namePart>Fernández Coronado, Alba</mods:namePart>
               </mods:name>
               <mods:extension>
                  <mods:dateAccessioned encoding="iso8601">2026-04-17T04:01:50Z</mods:dateAccessioned>
               </mods:extension>
               <mods:extension>
                  <mods:dateAvailable encoding="iso8601">2026-04-17T04:01:50Z</mods:dateAvailable>
               </mods:extension>
               <mods:originInfo>
                  <mods:dateIssued encoding="iso8601">2026-01-27</mods:dateIssued>
               </mods:originInfo>
               <mods:identifier type="none"/>
               <mods:identifier type="uri">https://hdl.handle.net/2117/460649</mods:identifier>
               <mods:abstract>This thesis presents a series of improvements to the semantic search system deployed on the mango.com e-commerce platform, with the goal of enhancing retrieval accuracy, robustness, and relevance across multiple languages and query types. The work focuses on addressing key limitations of the existing semantic component within a hybrid lexical–semantic search architecture. The main contributions include the training of a multilingual BERT uncased model to improve robustness to capitalization and diacritics, as well as fine-tuning on fashion-specific data to enhance domain understanding. In addition, limitations in handling attribute-only queries are addressed through the use of intelligent image cropping and a weighted fusion strategy that combines image embeddings with short textual metadata. Furthermore, the CLIP image encoder is fine-tuned to generate semantically richer and more discriminative visual representations, leading to higher similarity scores and improved ranking stability. Experimental results, evaluated on a manually annotated multilingual dataset, demonstrate consistent improvements across locales, increased semantic similarity scores, and more stable ranking performance, without introducing catastrophic forgetting or degrading standard query retrieval. The integration of these enhancements into the full production search pipeline provides a robust foundation for future improvements, including tighter alignment between multilingual text embeddings and the fine-tuned image encoder.</mods:abstract>
               <mods:language>
                  <mods:languageTerm authority="rfc3066"/>
               </mods:language>
               <mods:accessCondition type="useAndReproduction">Restricted access - confidentiality agreement</mods:accessCondition>
               <mods:subject>
                  <mods:topic>Àrees temàtiques de la UPC::Informàtica::Intel·ligència artificial::Aprenentatge automàtic</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Àrees temàtiques de la UPC::Economia i organització d'empreses::Comerç electrònic</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Deep learning</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Semantics--Data processing</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Computer vision</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Electronic commerce</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Cerca semàntica</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Cerca en comerç electrònic</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Recuperació multilingüe</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Sistemes de cerca híbrids</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Cerca multimodal</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Models visió-llenguatge</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>CLIP</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>BERT</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Recuperació de moda</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Adaptació al domini</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Embeddings imatge-text</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Semantic search</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>E-commerce search</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Multilingual retrieval</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Hybrid search systems</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Multimodal search</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Vision-language models</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Fashion retrieval</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Domain adaptation</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Image-text embeddings</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Aprenentatge profund</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Semàntica--Informàtica</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Visió per ordinador</mods:topic>
               </mods:subject>
               <mods:subject>
                  <mods:topic>Comerç electrònic</mods:topic>
               </mods:subject>
               <mods:titleInfo>
                  <mods:title>Improvement and integration of a deep learning-based semantic model into a hybrid lexical-semantic search engine</mods:title>
               </mods:titleInfo>
               <mods:genre>Master thesis</mods:genre>
            </mods:mods>
         </xmlData>
      </mdWrap>
   </dmdSec>
   <structMap LABEL="DSpace Object" TYPE="LOGICAL">
      <div TYPE="DSpace Object Contents" DMDID="DMD_2117_460649"/>
   </structMap>
</mets></metadata></record></GetRecord></OAI-PMH>