<?xml version="1.0" encoding="UTF-8"?><?xml-stylesheet type="text/xsl" href="static/style.xsl"?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd"><responseDate>2026-04-14T02:57:13Z</responseDate><request verb="GetRecord" identifier="oai:www.recercat.cat:10256/28374" metadataPrefix="didl">https://recercat.cat/oai/request</request><GetRecord><record><header><identifier>oai:recercat.cat:10256/28374</identifier><datestamp>2026-03-07T19:50:53Z</datestamp><setSpec>com_2072_452966</setSpec><setSpec>com_2072_2054</setSpec><setSpec>col_2072_452969</setSpec></header><metadata><d:DIDL xmlns:d="urn:mpeg:mpeg21:2002:02-DIDL-NS" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:doc="http://www.lyncode.com/xoai" xsi:schemaLocation="urn:mpeg:mpeg21:2002:02-DIDL-NS http://standards.iso.org/ittf/PubliclyAvailableStandards/MPEG-21_schema_files/did/didl.xsd">
   <d:DIDLInfo>
      <dcterms:created xmlns:dcterms="http://purl.org/dc/terms/" xsi:schemaLocation="http://purl.org/dc/terms/ http://dublincore.org/schemas/xmls/qdc/dcterms.xsd">2026-03-07T19:50:53Z</dcterms:created>
   </d:DIDLInfo>
   <d:Item id="hdl_10256_28374">
      <d:Descriptor>
         <d:Statement mimeType="application/xml; charset=utf-8">
            <dii:Identifier xmlns:dii="urn:mpeg:mpeg21:2002:01-DII-NS" xsi:schemaLocation="urn:mpeg:mpeg21:2002:01-DII-NS http://standards.iso.org/ittf/PubliclyAvailableStandards/MPEG-21_schema_files/dii/dii.xsd">urn:hdl:10256/28374</dii:Identifier>
         </d:Statement>
      </d:Descriptor>
      <d:Descriptor>
         <d:Statement mimeType="application/xml; charset=utf-8">
            <oai_dc:dc xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/" xmlns:dc="http://purl.org/dc/elements/1.1/" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">
               <dc:title>Deep Reinforcement Learning for robot manipulation</dc:title>
               <dc:creator>Mulia, Vania Katherine</dc:creator>
               <dc:subject>DRL (Deep Reinforcement Learning)</dc:subject>
               <dc:subject>Deep learning (Machine learning)</dc:subject>
               <dc:subject>Aprenentatge profund (Aprenentatge automàtic)</dc:subject>
               <dc:subject>Robots -- Control systems</dc:subject>
               <dc:subject>Sim-to-real transfer</dc:subject>
               <dc:subject>Peg-in-hole task</dc:subject>
               <dc:subject>Robots -- Sistemes de control</dc:subject>
               <dc:description>Robotic manipulation continues to be an active area of research due to its&#xd;
broad range of real-world applications. Among its benchmark tasks, the peg-in hole problem remains particularly challenging, requiring high-precision control&#xd;
under environmental uncertainty. This thesis presents a framework based on Deep&#xd;
Reinforcement Learning (DRL) to train a robotic manipulator to autonomously&#xd;
solve the peg-in-hole task. The proposed approach uses curriculum learning&#xd;
to train a single policy capable of handling all phases of the task: approach,&#xd;
contact-based hole search, and insertion. The curriculum is further extended to&#xd;
incorporate observation noise and force penalization, encouraging the emergence of&#xd;
compliant behaviors during contact. Training is conducted in a custom-designed,&#xd;
physics-based simulation environment. Simulation results demonstrate that the&#xd;
learned policy can complete the peg-in-hole task, though it faces difficulties in&#xd;
balancing task success with compliant interaction. To evaluate the potential for&#xd;
real-world deployment, the trained policy is transferred to a physical robot. Tests&#xd;
reveal several sources of sim-to-real discrepancy, particularly in the modeling&#xd;
of contact dynamics. Nonetheless, partial success in real-world trials suggests&#xd;
the viability of sim-to-real transfer for DRL-trained policies. Overall, this work&#xd;
contributes to the understanding of DRL’s capabilities and limitations in solving&#xd;
complex robotic manipulation tasks such as peg-in-hole assembly.</dc:description>
               <dc:description>9</dc:description>
               <dc:date>2026-03-07T19:50:53Z</dc:date>
               <dc:date>2026-03-07T19:50:53Z</dc:date>
               <dc:date>2025-06</dc:date>
               <dc:type>info:eu-repo/semantics/masterThesis</dc:type>
               <dc:identifier>https://hdl.handle.net/10256/28374</dc:identifier>
               <dc:rights>Attribution-NonCommercial-NoDerivatives 4.0 International</dc:rights>
               <dc:rights>http://creativecommons.org/licenses/by-nc-nd/4.0/</dc:rights>
               <dc:rights>info:eu-repo/semantics/openAccess</dc:rights>
               <dc:publisher>Universitat de Girona. Institut de Recerca en Visió per Computador i Robòtica</dc:publisher>
               <dc:source>Erasmus Mundus Joint Master in Intelligent Field Robotic Systems (IFROS)</dc:source>
            </oai_dc:dc>
         </d:Statement>
      </d:Descriptor>
   </d:Item>
</d:DIDL></metadata></record></GetRecord></OAI-PMH>