Citation

BibTex format

@article{Rizvi:2025:10.1109/tmlcn.2024.3521876,
author = {Rizvi, D and Boyle, D},
doi = {10.1109/tmlcn.2024.3521876},
journal = {IEEE Transactions on Machine Learning in Communications and Networking},
pages = {117--132},
title = {Multi-agent reinforcement learning with action masking for UAV-enabled mobile communications},
url = {http://dx.doi.org/10.1109/tmlcn.2024.3521876},
volume = {3},
year = {2025}
}

RIS format (EndNote, RefMan)

TY  - JOUR
AB - Unmanned Aerial Vehicles (UAVs) are increasingly used as aerial base stations to provide ad hoc communications infrastructure. Building upon prior research efforts which consider either static nodes, 2D trajectories or single UAV systems, this paper focuses on the use of multiple UAVs for providing wireless communication to mobile users in the absence of terrestrial communications infrastructure. In particular, we jointly optimize UAV 3D trajectory and NOMA power allocation to maximize system throughput. Firstly, a weighted K-means-based clustering algorithm establishes UAV-user associations at regular intervals. Then the efficacy of training a novel Shared Deep Q-Network (SDQN) with action masking is explored. Unlike training each UAV separately using DQN, the SDQN reduces training time by using the experiences of multiple UAVs instead of a single agent. We also show that SDQN can be used to train a multi-agent system with differing action spaces. Simulation results confirm that: 1) training a shared DQN outperforms a conventional DQN in terms of maximum system throughput (+20%) and training time (-10%); 2) it can converge for agents with different action spaces, yielding a 9% increase in throughput compared to Mutual DQN algorithm; and 3) combining NOMA with an SDQN architecture enables the network to achieve a better sum rate compared with existing baseline schemes.
AU - Rizvi,D
AU - Boyle,D
DO - 10.1109/tmlcn.2024.3521876
EP - 132
PY - 2025///
SN - 2831-316X
SP - 117
TI - Multi-agent reinforcement learning with action masking for UAV-enabled mobile communications
T2 - IEEE Transactions on Machine Learning in Communications and Networking
UR - http://dx.doi.org/10.1109/tmlcn.2024.3521876
UR - https://doi.org/10.1109/tmlcn.2024.3521876
VL - 3
ER -

Contact us

Dyson School of Design Engineering
Imperial College London
25 Exhibition Road
South Kensington
London
SW7 2DB

design.engineering@imperial.ac.uk
Tel: +44 (0) 20 7594 8888

Campus Map