<?xml version="1.0" encoding="UTF-8"?>
<mets:METS xmlns:mets="http://www.loc.gov/METS/" xmlns:xlink="http://www.w3.org/TR/xlink/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:dim="http://www.dspace.org/xmlns/dspace/dim" OBJEDIT="/xmlui/admin/item?itemID=105607" OBJID="/xmlui/handle/11531/104035" PROFILE="DSPACE METS SIP Profile 1.0" LABEL="DSpace Item" ID="hdl:11531/104035">
<mets:dmdSec GROUPID="group_dmd_0" ID="dmd_1">
<mets:mdWrap MDTYPE="OTHER" OTHERMDTYPE="DIM">
<mets:xmlData>
<dim:dim dspaceType="ITEM">
<dim:field authority="9D5ECDB6-B42C-4752-947E-DBADED0E6230" element="contributor" qualifier="advisor" confidence="UNCERTAIN" language="es-ES" mdschema="dc">Pizarroso Gonzalo, Jaime</dim:field>
<dim:field authority="c8dfb6a8-28cb-4c70-86ac-de81a2d0608e" element="contributor" qualifier="advisor" confidence="UNCERTAIN" language="es-ES" mdschema="dc">Güitta López, Lucía</dim:field>
<dim:field authority="68e41e6e-5988-4da8-ba53-6357a3cab9f9" element="contributor" qualifier="author" confidence="UNCERTAIN" language="es-ES" mdschema="dc">Pérez Ibarz, Guzman Ignacio</dim:field>
<dim:field element="contributor" qualifier="other" language="es_ES" mdschema="dc">Universidad Pontificia Comillas, Escuela Técnica Superior de Ingeniería (ICAI)</dim:field>
<dim:field element="date" qualifier="accessioned" mdschema="dc">2025-09-15T08:01:36Z</dim:field>
<dim:field element="date" qualifier="available" mdschema="dc">2025-09-15T08:01:36Z</dim:field>
<dim:field element="date" qualifier="issued" language="es_ES" mdschema="dc">2026</dim:field>
<dim:field element="identifier" qualifier="uri" mdschema="dc">http://hdl.handle.net/11531/104035</dim:field>
<dim:field element="description" language="es_ES" mdschema="dc">Grado en Ingeniería Matemática e Inteligencia Artificial</dim:field>
<dim:field element="description" qualifier="abstract" language="es-ES" mdschema="dc">Este proyecto explora si un agente de aprendizaje por refuerzo puede aprender a operar
Bitcoin de forma rentable interactuando únicamente con datos históricos de mercado. Se
desarrollan agentes basados en Proximal Policy Optimization (PPO) para el par BTC/USDT
a frecuencia de 5 minutos, comparando espacios de acción de dos y tres acciones y empleando
Optuna para la optimización automática de hiperparámetros. Ante el fracaso de las políticas
únicas en periodos de mercado heterogéneos, se diseña un ensamble consciente del régimen:
un Modelo Oculto de Markov detecta el régimen vigente y activa un agente especialista
entrenado con datos aumentados de 2018–2020. El ensamble supera a Buy &amp; Hold en el
conjunto de prueba mixto (+52,6% ROI, Sortino 3,52 frente a 1,21), mientras que en el
periodo alcista el agente de dos acciones casi lo iguala (+9,9% ROI).</dim:field>
<dim:field element="description" qualifier="abstract" language="en-GB" mdschema="dc">This project investigates whether a reinforcement learning agent can learn to trade Bitcoin
profitably by interacting with historical market data alone. PPO-based agents are developed
for the BTC/USDT pair at 5-minute frequency, comparing two- and three-action spaces and
using Optuna for automated hyperparameter search. Motivated by the consistent failure
of single-policy agents across heterogeneous market regimes, a regime-aware ensemble is
designed: a Hidden Markov Model identifies the prevailing market regime and activates
a specialist agent trained on cross-period augmented data from 2018–2020. The ensemble
surpasses Buy &amp; Hold on the mixed-regime test set (+52.6% ROI, Sortino 3.52 vs 1.21), while
on the bullish dataset the two-action agent nearly matches it (+9.9% ROI, Sortino 1.62).</dim:field>
<dim:field element="format" qualifier="mimetype" language="es_ES" mdschema="dc">application/pdf</dim:field>
<dim:field element="language" qualifier="iso" language="es_ES" mdschema="dc">en-GB</dim:field>
<dim:field element="rights" language="es_ES" mdschema="dc">Attribution-NonCommercial-NoDerivs 3.0 United States</dim:field>
<dim:field element="rights" qualifier="uri" language="es_ES" mdschema="dc">http://creativecommons.org/licenses/by-nc-nd/3.0/us/</dim:field>
<dim:field element="subject" qualifier="other" language="es_ES" mdschema="dc">KMI</dim:field>
<dim:field element="title" language="es_ES" mdschema="dc">Reinforcement Learning for Automated Crypto Trading: An Experimental Study ofAlgorithmic Strategies</dim:field>
<dim:field element="type" language="es_ES" mdschema="dc">info:eu-repo/semantics/bachelorThesis</dim:field>
<dim:field element="rights" qualifier="accessRights" language="es_ES" mdschema="dc">info:eu-repo/semantics/restrictedAccess</dim:field>
<dim:field element="keywords" language="es-ES" mdschema="dc">Aprendizaje por refuerzo; Proximal Policy Optimization(PPO); Trading algorítmico; Criptomonedas; ensamble consciente del régimen; Modelo Oculto de Markov; Optuna</dim:field>
<dim:field element="keywords" language="en-GB" mdschema="dc">Reinforcement learning; Proximal Policy Optimization(PPO); Algorithmic trading; Cryptocurrency; Regime-aware ensemble; Hidden Markov Model; Optuna</dim:field>
</dim:dim>
</mets:xmlData>
</mets:mdWrap>
</mets:dmdSec>
<mets:fileSec>
<mets:fileGrp USE="CONTENT">
<mets:file CHECKSUMTYPE="MD5" GROUPID="group_file_851155" ID="file_851155" MIMETYPE="application/pdf" SIZE="1728535" CHECKSUM="6f3abab0e3003b9b8190698ccb7210fa">
<mets:FLocat LOCTYPE="URL" xlink:title="Pérez Ibarz, Guzmán Ignacio - TFG.pdf" xlink:label="Trabajo Fin de Grado" xlink:type="locator" xlink:href="/xmlui/bitstream/handle/11531/104035/P%c3%a9rez%20Ibarz%2c%20Guzm%c3%a1n%20Ignacio%20-%20TFG.pdf?sequence=1&amp;isAllowed=n"/>
</mets:file>
<mets:file CHECKSUMTYPE="MD5" GROUPID="group_file_851156" ID="file_851156" MIMETYPE="application/pdf" SIZE="253918" CHECKSUM="90334d36e5f00be52168d715cce9a632">
<mets:FLocat LOCTYPE="URL" xlink:title="Pérez Ibarz, Guzmán Ignacio - Anexo I.pdf" xlink:label="Autorización" xlink:type="locator" xlink:href="/xmlui/bitstream/handle/11531/104035/P%c3%a9rez%20Ibarz%2c%20Guzm%c3%a1n%20Ignacio%20-%20Anexo%20I.pdf?sequence=2&amp;isAllowed=n"/>
</mets:file>
</mets:fileGrp>
</mets:fileSec>
<mets:structMap LABEL="DSpace" TYPE="LOGICAL">
<mets:div DMDID="dmd_1" TYPE="DSpace Item">
<mets:div ID="div_2" TYPE="DSpace Content Bitstream">
<mets:fptr FILEID="file_851155"/>
</mets:div>
<mets:div ID="div_3" TYPE="DSpace Content Bitstream">
<mets:fptr FILEID="file_851156"/>
</mets:div>
</mets:div>
</mets:structMap>
</mets:METS>
