<?xml version="1.0" encoding="UTF-8"?><?xml-stylesheet type="text/xsl" href="static/style.xsl"?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd"><responseDate>2026-04-17T04:12:21Z</responseDate><request verb="GetRecord" identifier="oai:www.recercat.cat:2117/101910" metadataPrefix="didl">https://recercat.cat/oai/request</request><GetRecord><record><header><identifier>oai:recercat.cat:2117/101910</identifier><datestamp>2025-07-22T17:35:57Z</datestamp><setSpec>com_2072_1033</setSpec><setSpec>col_2072_452951</setSpec></header><metadata><d:DIDL xmlns:d="urn:mpeg:mpeg21:2002:02-DIDL-NS" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:doc="http://www.lyncode.com/xoai" xsi:schemaLocation="urn:mpeg:mpeg21:2002:02-DIDL-NS http://standards.iso.org/ittf/PubliclyAvailableStandards/MPEG-21_schema_files/did/didl.xsd">
   <d:Item id="hdl_2117_101910">
      <d:Descriptor>
         <d:Statement mimeType="application/xml; charset=utf-8">
            <dii:Identifier xmlns:dii="urn:mpeg:mpeg21:2002:01-DII-NS" xsi:schemaLocation="urn:mpeg:mpeg21:2002:01-DII-NS http://standards.iso.org/ittf/PubliclyAvailableStandards/MPEG-21_schema_files/dii/dii.xsd">urn:hdl:2117/101910</dii:Identifier>
         </d:Statement>
      </d:Descriptor>
      <d:Descriptor>
         <d:Statement mimeType="application/xml; charset=utf-8">
            <oai_dc:dc xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/" xmlns:dc="http://purl.org/dc/elements/1.1/" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">
               <dc:title>Data mining in Breast Cancer</dc:title>
               <dc:creator>Carrio Viladrich, Laura</dc:creator>
               <dc:subject>Àrees temàtiques de la UPC::Informàtica</dc:subject>
               <dc:subject>Machine learning</dc:subject>
               <dc:subject>Databases</dc:subject>
               <dc:subject>Aprenentatge automàtic</dc:subject>
               <dc:subject>Bases de dades</dc:subject>
               <dc:description>Machine learning and data mining methods can be the future of the clinical decision&#xd;
process like pathological diagnosis. In this project we studied the Breast Cancer Wisconsin&#xd;
dataset and applied different algorithms, concretely classifiers, in order to predict the&#xd;
diagnosis and the prognosis of the cancer.&#xd;
In order to classify the different types of cancer we divided the classification in two steps&#xd;
and we tested different algorithms for each step. The first step is the diagnosis&#xd;
classification. Diagnosis consists in predicting whether the cancer is malignant or benign. And the&#xd;
second step is the prognostic classification. Prognosis consists in predicting whether the cancer is&#xd;
recurrent or non-recurrent.&#xd;
After applying different models for each step, the result is that the best model to predict&#xd;
the diagnosis is the Decision Forest model. And the best model to predict the prognosis&#xd;
is the Boosted Decision Tree model.&#xd;
So, we conclude that the two-step classifier with the Decision Forest model and the Boosted&#xd;
Decision Tree model is the best classifier.</dc:description>
               <dc:date>2016</dc:date>
               <dc:type>Bachelor thesis</dc:type>
               <dc:rights>Open Access</dc:rights>
               <dc:publisher>Universitat Politècnica de Catalunya</dc:publisher>
            </oai_dc:dc>
         </d:Statement>
      </d:Descriptor>
   </d:Item>
</d:DIDL></metadata></record></GetRecord></OAI-PMH>