<?xml version="1.0" encoding="UTF-8"?>
<!--
  Root of a METS document describing one DSpace item (LABEL "DSpace Item",
  ID hdl:11531/98725). All namespace prefixes used in the document
  (mets, xlink, xsi, dim) are declared once on this element.
  NOTE(review): the xlink prefix is bound to http://www.w3.org/TR/xlink/,
  whereas the W3C XLink recommendation defines http://www.w3.org/1999/xlink.
  Presumably downstream consumers match on the URI as written; confirm
  before changing it.
-->
<mets:METS xmlns:mets="http://www.loc.gov/METS/" xmlns:xlink="http://www.w3.org/TR/xlink/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:dim="http://www.dspace.org/xmlns/dspace/dim" OBJEDIT="/xmlui/admin/item?itemID=100257" OBJID="/xmlui/handle/11531/98725" PROFILE="DSPACE METS SIP Profile 1.0" LABEL="DSpace Item" ID="hdl:11531/98725">
<mets:dmdSec ID="dmd_1" GROUPID="group_dmd_0">
  <!--
    Descriptive metadata for the item, embedded as DIM fields
    (MDTYPE "OTHER", OTHERMDTYPE "DIM"). Each dim:field is one metadata
    value identified by mdschema / element / optional qualifier.
    NOTE(review): language tags in this record mix the spellings "es-ES"
    and "es_ES"; they are kept exactly as found. Confirm whether consumers
    expect a single form before normalising.
  -->
  <mets:mdWrap MDTYPE="OTHER" OTHERMDTYPE="DIM">
    <mets:xmlData>
      <dim:dim dspaceType="ITEM">
        <!-- Contributors: the first two carry an authority key and a confidence level. -->
        <dim:field mdschema="dc" element="contributor" qualifier="advisor" language="es-ES"
                   authority="2eb5ff1c-50ea-4d6f-a940-b0a0e5a1091c" confidence="UNCERTAIN">Pérez Barajas, Manuel</dim:field>
        <dim:field mdschema="dc" element="contributor" qualifier="author" language="es-ES"
                   authority="10444360-c9ab-4ec3-aaec-4dab351d0f3b" confidence="UNCERTAIN">Catalán Criado, Ángel</dim:field>
        <dim:field mdschema="dc" element="contributor" qualifier="other" language="es_ES">Universidad Pontificia Comillas, Escuela Técnica Superior de Ingeniería (ICAI)</dim:field>

        <!-- Dates and persistent identifier. -->
        <dim:field mdschema="dc" element="date" qualifier="accessioned">2025-05-09T17:35:52Z</dim:field>
        <dim:field mdschema="dc" element="date" qualifier="available">2025-05-09T17:35:52Z</dim:field>
        <dim:field mdschema="dc" element="date" qualifier="issued" language="es_ES">2025</dim:field>
        <dim:field mdschema="dc" element="identifier" qualifier="uri">http://hdl.handle.net/11531/98725</dim:field>

        <!--
          Descriptions and abstracts. Each abstract contains a literal line
          break; its continuation line is deliberately left unindented
          because whitespace inside a field is part of the value.
        -->
        <dim:field mdschema="dc" element="description" language="es_ES">Máster Universitario en Big Data</dim:field>
        <dim:field mdschema="dc" element="description" qualifier="abstract" language="es-ES">El objetivo de este proyecto es mostrar cómo con analítica de datos y conocimientos de ETL (Extract-Transform-Load) es posible no sólo automatizar tareas (y su consecuente ahorro) sino también poder acceder a la información/datos de una manera rápida y masiva, pudiendo así analizarla y explotarla.
En este proyecto se desarrollará el proceso de parseo de archivos PDF-XFA a un formato tabular, para su posterior uso y análisis.</dim:field>
        <dim:field mdschema="dc" element="description" qualifier="abstract" language="en-GB">The objective of this project is to demonstrate how, with data analytics and ETL (Extract-Transform-Load) knowledge, it is possible not only to automate tasks (and consequently save time) but also to access information/data quickly and extensively, enabling analysis and exploitation.
This project will develop the process of parsing PDF-XFA files into a tabular format for subsequent use and analysis.</dim:field>

        <!-- Format, language, licence, subject, title, type and access level. -->
        <dim:field mdschema="dc" element="format" qualifier="mimetype" language="es_ES">application/pdf</dim:field>
        <dim:field mdschema="dc" element="language" qualifier="iso" language="es_ES">es-ES</dim:field>
        <dim:field mdschema="dc" element="rights" language="es_ES">Attribution-NonCommercial-NoDerivs 3.0 United States</dim:field>
        <dim:field mdschema="dc" element="rights" qualifier="uri" language="es_ES">http://creativecommons.org/licenses/by-nc-nd/3.0/us/</dim:field>
        <dim:field mdschema="dc" element="subject" qualifier="other" language="es_ES">H0Z</dim:field>
        <dim:field mdschema="dc" element="title" language="es_ES">Automatización del parseo de documentos PDF-XFA (XML Forms Architecture) y la posterior explotación analítica de su información</dim:field>
        <dim:field mdschema="dc" element="type" language="es_ES">info:eu-repo/semantics/masterThesis</dim:field>
        <dim:field mdschema="dc" element="rights" qualifier="accessRights" language="es_ES">info:eu-repo/semantics/openAccess</dim:field>

        <!-- Keywords: one comma-separated value per language. -->
        <dim:field mdschema="dc" element="keywords" language="es-ES">ETL, XML, PDF, PDF-XFA, parsear, análisis, XFA</dim:field>
        <dim:field mdschema="dc" element="keywords" language="en-GB">ETL, XML, PDF, PDF-XFA, parser, analysis, XFA</dim:field>
      </dim:dim>
    </mets:xmlData>
  </mets:mdWrap>
</mets:dmdSec>
<mets:fileSec>
  <!--
    Bitstreams attached to the item, in the CONTENT file group. Each
    mets:file records MIME type, byte size and an MD5 checksum, and its
    FLocat gives the download URL relative to the repository root.
  -->
  <mets:fileGrp USE="CONTENT">
    <!-- Bitstream labelled "Trabajo Fin de Máster" (sequence=1, isAllowed=y). -->
    <mets:file ID="file_726843"
               GROUPID="group_file_726843"
               MIMETYPE="application/pdf"
               SIZE="1923428"
               CHECKSUMTYPE="MD5"
               CHECKSUM="bd6a4cc018ee9fa762d94f4fe5342a99">
      <mets:FLocat LOCTYPE="URL"
                   xlink:type="locator"
                   xlink:label="Trabajo Fin de Máster"
                   xlink:title="TFM - Catalan Criado, Angel.pdf"
                   xlink:href="/xmlui/bitstream/handle/11531/98725/TFM%20-%20Catalan%20Criado%2c%20Angel.pdf?sequence=1&amp;isAllowed=y"/>
    </mets:file>
    <!--
      Bitstream labelled "Autorización" (sequence=2, isAllowed=n).
      NOTE(review): the CHECKSUM below is identical to the one on
      file_726843 although SIZE differs (84826 vs 1923428). Two files of
      different length sharing an MD5 digest is implausible, so one of the
      two values is presumably wrong. Verify against the stored bitstreams
      before relying on it; the value is kept as found.
    -->
    <mets:file ID="file_726844"
               GROUPID="group_file_726844"
               MIMETYPE="application/pdf"
               SIZE="84826"
               CHECKSUMTYPE="MD5"
               CHECKSUM="bd6a4cc018ee9fa762d94f4fe5342a99">
      <mets:FLocat LOCTYPE="URL"
                   xlink:type="locator"
                   xlink:label="Autorización"
                   xlink:title="Anexo I - Catalan Criado, Angel.pdf"
                   xlink:href="/xmlui/bitstream/handle/11531/98725/Anexo%20I%20-%20Catalan%20Criado%2c%20Angel.pdf?sequence=2&amp;isAllowed=n"/>
    </mets:file>
  </mets:fileGrp>
</mets:fileSec>
<mets:structMap TYPE="LOGICAL" LABEL="DSpace">
  <!--
    Logical structure of the item: the outer div points at the descriptive
    metadata section through DMDID, and each inner div points at one
    bitstream through the FILEID of its fptr.
  -->
  <mets:div TYPE="DSpace Item" DMDID="dmd_1">
    <mets:div TYPE="DSpace Content Bitstream" ID="div_2">
      <mets:fptr FILEID="file_726843"/>
    </mets:div>
    <mets:div TYPE="DSpace Content Bitstream" ID="div_3">
      <mets:fptr FILEID="file_726844"/>
    </mets:div>
  </mets:div>
</mets:structMap>
</mets:METS>
