<?xml version="1.0" encoding="UTF-8"?>
<mets:METS xmlns:mets="http://www.loc.gov/METS/" xmlns:xlink="http://www.w3.org/TR/xlink/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:dim="http://www.dspace.org/xmlns/dspace/dim" OBJEDIT="/xmlui/admin/item?itemID=111802" OBJID="/xmlui/handle/11531/110122" PROFILE="DSPACE METS SIP Profile 1.0" LABEL="DSpace Item" ID="hdl:11531/110122">
<!-- Descriptive metadata section (ID dmd_1). It wraps a single DIM record, declared via
     MDTYPE="OTHER" / OTHERMDTYPE="DIM", and is referenced from the structMap through
     DMDID="dmd_1". -->
<mets:dmdSec GROUPID="group_dmd_0" ID="dmd_1">
<mets:mdWrap MDTYPE="OTHER" OTHERMDTYPE="DIM">
<mets:xmlData>
<!-- Each dim:field is one metadata value, addressed by mdschema + element + optional qualifier.
     NOTE(review): the language attribute is written both with a hyphen (es-ES, en-GB) and with
     an underscore (es_ES) in this record; confirm which form downstream consumers expect. -->
<dim:dim dspaceType="ITEM">
<!-- Authors: the authority attribute carries an identifier for each person. The first value has
     the 0000-0000-0000-0000 shape of an ORCID iD, the other two are UUID-shaped; presumably
     internal authority keys (TODO confirm). -->
<dim:field authority="0000-0003-0889-0450" element="contributor" qualifier="author" confidence="ACCEPTED" language="es-ES" mdschema="dc">Rodríguez Abella, Álvaro</dim:field>
<dim:field authority="FCF70144-A2AF-4EFD-910D-FB16B12C465E" element="contributor" qualifier="author" confidence="ACCEPTED" language="es-ES" mdschema="dc">Silvestre, Joao Pedro</dim:field>
<dim:field authority="8B0C798F-A2CF-4733-941E-2C1B1BD5012A" element="contributor" qualifier="author" confidence="ACCEPTED" language="es-ES" mdschema="dc">Tabuada, Paulo</dim:field>
<!-- Dates: accessioned/available are UTC timestamps (trailing Z); issued is a plain date. -->
<dim:field element="date" qualifier="accessioned" mdschema="dc">2026-05-18T13:34:55Z</dim:field>
<dim:field element="date" qualifier="available" mdschema="dc">2026-05-18T13:34:55Z</dim:field>
<dim:field element="date" qualifier="issued" language="es_ES" mdschema="dc">2025-05-01</dim:field>
<!-- Identifiers: ISSN of the publication and the handle URI, which matches the handle in the
     OBJID / ID attributes of the root element. -->
<dim:field element="identifier" qualifier="issn" language="es_ES" mdschema="dc">2640-3498</dim:field>
<dim:field element="identifier" qualifier="uri" mdschema="dc">http://hdl.handle.net/11531/110122</dim:field>
<dim:field element="description" language="es_ES" mdschema="dc">Artículos en revistas</dim:field>
<!-- NOTE(review): the es-ES abstract below contains only "."; it looks like a placeholder for a
     missing Spanish abstract. Confirm whether it should be filled in or the field omitted. -->
<dim:field element="description" qualifier="abstract" language="es-ES" mdschema="dc">.</dim:field>
<dim:field element="description" qualifier="abstract" language="en-GB" mdschema="dc">A key component of transformers is the attention mechanism orchestrating how each token influences the propagation of every other token along the layers of a transformer. In this paper we provide a rigorous, mathematical analysis of the asymptotic properties of attention in transformers. Although we present several results based on different assumptions, all of them point to the same conclusion, all tokens asymptotically converge to each other, a phenomenon that has been empirically reported in the literature. Our findings are carefully compared with existing theoretical results and illustrated by simulations and experimental studies using the GPT-2 model.</dim:field>
<dim:field element="format" qualifier="mimetype" language="es_ES" mdschema="dc">application/pdf</dim:field>
<dim:field element="language" qualifier="iso" language="es_ES" mdschema="dc">en-GB</dim:field>
<!-- Licence: human-readable name plus the matching Creative Commons BY-NC-ND 3.0 Spain URI. -->
<dim:field element="rights" language="es_ES" mdschema="dc">Creative Commons Reconocimiento-NoComercial-SinObraDerivada España</dim:field>
<dim:field element="rights" qualifier="uri" language="es_ES" mdschema="dc">http://creativecommons.org/licenses/by-nc-nd/3.0/es/</dim:field>
<!-- NOTE(review): "Volumen:" in the citation below has no value; confirm whether the volume is
     genuinely not applicable or was left blank at submission. -->
<dim:field element="source" language="es_ES" mdschema="dc">Revista: Proceedings of Machine Learning Research, Periodo: 1, Volumen: , Número: 267, Página inicial: 174, Página final: 184</dim:field>
<dim:field element="title" language="es_ES" mdschema="dc">Consensus is all you get: the role of attention in transformers</dim:field>
<!-- Publication type, version and access level are expressed with info:eu-repo/semantics terms. -->
<dim:field element="type" language="es_ES" mdschema="dc">info:eu-repo/semantics/article</dim:field>
<dim:field element="description" qualifier="version" language="es_ES" mdschema="dc">info:eu-repo/semantics/publishedVersion</dim:field>
<!-- NOTE(review): rights.holder is present but empty; an empty element and an absent element
     may be treated differently by consumers. Confirm which is intended. -->
<dim:field element="rights" qualifier="holder" language="es_ES" mdschema="dc"/>
<dim:field element="rights" qualifier="accessRights" language="es_ES" mdschema="dc">info:eu-repo/semantics/openAccess</dim:field>
<!-- NOTE(review): "keywords" is not one of the fifteen standard Dublin Core elements (dc.subject
     is the conventional home for keywords); presumably a local registry extension. The es-ES
     value is again a lone "." placeholder, and the en-GB value packs several keywords into one
     semicolon-separated string. -->
<dim:field element="keywords" language="es-ES" mdschema="dc">.</dim:field>
<dim:field element="keywords" language="en-GB" mdschema="dc">transformers; attention mechanism; token convergence; asymptotic analysis.</dim:field>
</dim:dim>
</mets:xmlData>
</mets:mdWrap>
</mets:dmdSec>
<!-- File section: a single file group with USE="CONTENT" holding one PDF bitstream
     (ID file_852248), which the structMap references through its fptr FILEID. -->
<mets:fileSec>
<mets:fileGrp USE="CONTENT">
<!-- CHECKSUM is declared as MD5 via CHECKSUMTYPE; SIZE is presumably in bytes (TODO confirm). -->
<mets:file CHECKSUMTYPE="MD5" GROUPID="group_file_852248" ID="file_852248" MIMETYPE="application/pdf" SIZE="986503" CHECKSUM="8d279542c98e29ce1266e4fa86aa2948">
<!-- The href is a site-relative path, so it must be resolved against the repository host.
     The "&amp;" is the XML-escaped ampersand separating the two query parameters.
     NOTE(review): the xlink prefix is bound on the root element to "http://www.w3.org/TR/xlink/",
     whereas the W3C XLink namespace is "http://www.w3.org/1999/xlink". Namespace-aware tools
     that match the W3C URI will not recognise these xlink attributes; check what existing
     consumers expect before changing the binding. -->
<mets:FLocat LOCTYPE="URL" xlink:title="abella25a.pdf" xlink:type="locator" xlink:href="/xmlui/bitstream/handle/11531/110122/abella25a.pdf?sequence=1&amp;isAllowed=y"/>
</mets:file>
</mets:fileGrp>
</mets:fileSec>
<!-- Logical structural map that ties the record together: the outer div stands for the item
     and links to its descriptive metadata via DMDID="dmd_1"; the nested div stands for the
     content bitstream and points at the file entry via FILEID="file_852248". -->
<mets:structMap LABEL="DSpace" TYPE="LOGICAL">
<mets:div DMDID="dmd_1" TYPE="DSpace Item">
<mets:div ID="div_2" TYPE="DSpace Content Bitstream">
<mets:fptr FILEID="file_852248"/>
</mets:div>
</mets:div>
</mets:structMap>
</mets:METS>
