<?xml version="1.0" encoding="UTF-8"?><?xml-stylesheet type="text/xsl" href="static/style.xsl"?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd"><responseDate>2026-06-01T15:20:55Z</responseDate><request verb="GetRecord" identifier="oai:riuma.uma.es:10630/45373" metadataPrefix="qdc">https://riuma.uma.es/rest/oai/request</request><GetRecord><record><header><identifier>oai:riuma.uma.es:10630/45373</identifier><datestamp>2026-02-12T00:46:14Z</datestamp><setSpec>com_10630_2254</setSpec><setSpec>col_10630_37959</setSpec></header><metadata><qdc:qualifieddc xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dcterms="http://purl.org/dc/terms/" xmlns:doc="http://www.lyncode.com/xoai" xmlns:qdc="http://dspace.org/qualifieddc/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://purl.org/dc/elements/1.1/ http://dublincore.org/schemas/xmls/qdc/2006/01/06/dc.xsd http://purl.org/dc/terms/ http://dublincore.org/schemas/xmls/qdc/2006/01/06/dcterms.xsd http://dspace.org/qualifieddc/ http://www.ukoln.ac.uk/metadata/dcmi/xmlschema/qualifieddc.xsd">
   <dc:title>Learning Decentralized Routing Policies via Graph Attention-based Multi-Agent Reinforcement Learning in Lunar Delay-Tolerant Networks</dc:title>
   <dc:creator>Lozano Cuadra, Federico</dc:creator>
   <dc:creator>Soret, Beatriz</dc:creator>
   <dc:creator>Sánchez Net, Marc</dc:creator>
   <dc:creator>Cauligi, Abhishek</dc:creator>
   <dc:creator>Rossi, Federico</dc:creator>
   <dc:subject>Aprendizaje automático</dc:subject>
   <dc:subject>Astronáutica - Sistemas de comunicaciones</dc:subject>
   <dcterms:abstract>We present a fully decentralized routing framework for multi-robot exploration missions operating under the constraints of a Lunar Delay-Tolerant Network (LDTN). In this setting, autonomous rovers must relay collected data to a lander under intermittent connectivity and unknown mobility patterns. We formulate the problem as a Partially Observable Markov Decision Problem (POMDP) and propose a Graph Attention-based Multi-Agent Reinforcement Learning (GAT-MARL) policy that performs Centralized Training, Decentralized Execution (CTDE). Our method relies only on local observations and does not require global topology updates or packet replication, unlike classical approaches such as shortest path and controlled flooding-based algorithms. Through Monte Carlo simulations in randomized exploration environments, GAT-MARL provides higher delivery rates, no duplications, and fewer packet losses, and is able to leverage short-term mobility forecasts; offering a scalable solution for future space robotic systems for planetary exploration, as demonstrated by successful generalization to larger rover teams.</dcterms:abstract>
   <dcterms:issued>2025-10-23</dcterms:issued>
   <dc:type>conference output</dc:type>
   <dc:identifier>https://arxiv.org/pdf/2510.20436</dc:identifier>
   <dc:identifier>https://hdl.handle.net/10630/45373</dc:identifier>
   <dc:language>eng</dc:language>
   <dc:relation>International Conference on Space Robotics 2025 (iSpaRo)</dc:relation>
   <dc:relation>Sendai, Japon</dc:relation>
   <dc:relation>1-4 Diciembre 2025</dc:relation>
   <dc:rights>http://creativecommons.org/licenses/by/4.0/</dc:rights>
   <dc:rights>open access</dc:rights>
   <dc:rights>Attribution 4.0 International</dc:rights>
</qdc:qualifieddc>
</metadata></record></GetRecord></OAI-PMH>