
{"id":126,"date":"2024-12-28T21:40:34","date_gmt":"2024-12-29T02:40:34","guid":{"rendered":"https:\/\/aamas2025.org\/?page_id=126"},"modified":"2025-04-22T00:14:26","modified_gmt":"2025-04-22T04:14:26","slug":"accepted-extended-abstracts","status":"publish","type":"page","link":"https:\/\/aamas2025.org\/index.php\/conference\/program\/accepted-extended-abstracts\/","title":{"rendered":"Accepted Extended Abstracts (with video links)"},"content":{"rendered":"\n<h2 class=\"wp-block-heading\">Accepted Extended Abstracts (Main Technical Track)<\/h2>\n\n\n\n<p>Some extended abstracts have links to author-made short video presentations (typically about 5 minutes long) in the last column.<\/p>\n\n\n\n<figure class=\"wp-block-table is-style-stripes\"><table><thead><tr><th class=\"has-text-align-left\" data-align=\"left\"><strong>ID<\/strong><\/th><th class=\"has-text-align-left\" data-align=\"left\"><strong>Title<\/strong><\/th><th class=\"has-text-align-left\" data-align=\"left\"><strong>Authors<\/strong><\/th><th class=\"has-text-align-left\" data-align=\"left\"><strong>Video<\/strong><\/th><\/tr><\/thead><tbody><tr><td class=\"has-text-align-left\" data-align=\"left\"><\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">5<\/td><td class=\"has-text-align-left\" data-align=\"left\">PANDA: Priority-Based Collision Avoidance Framework for Heterogeneous UAVs Navigating in Dense Airspace<\/td><td class=\"has-text-align-left\" data-align=\"left\">Agamdeep Singh, Jaskirat Singh, Sujit Pb<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">7<\/td><td class=\"has-text-align-left\" data-align=\"left\">Nash Equilibrium and Learning Dynamics in Three-Player Matching m-Action Games<\/td><td 
class=\"has-text-align-left\" data-align=\"left\">Yuma Fujimoto, Kaito Ariu, Kenshi Abe<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">16<\/td><td class=\"has-text-align-left\" data-align=\"left\">Adapting Beyond the Depth Limit: Counter Strategies in Large Imperfect Information Games<\/td><td class=\"has-text-align-left\" data-align=\"left\">David Milec, Vojtech Kovarik, Viliam Lis\u00fd<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/drive.google.com\/file\/d\/12x7agN57KFOe_PG0N0GVFzX6_rn5cSjz\/view?usp=sharing\" target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">17<\/td><td class=\"has-text-align-left\" data-align=\"left\">Dynamic Option Creation in Option-Critic Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Mateus Begnini Melchiades, Gabriel De Oliveira Ramos, Bruno Castro Da Silva<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">26<\/td><td class=\"has-text-align-left\" data-align=\"left\">Offline Meta Reinforcement Learning with Weighted Policy Constraints and Proximal Context Collection<\/td><td class=\"has-text-align-left\" data-align=\"left\">Haorui Li, Jiaqi Liang, Linjing Li, Daniel Dajun Zeng<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">75<\/td><td class=\"has-text-align-left\" data-align=\"left\">Efficient Model Checking with Semantically-Equivalent Models for vGOAL<\/td><td class=\"has-text-align-left\" data-align=\"left\">Yi Yang, Tom Holvoet<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">88<\/td><td class=\"has-text-align-left\" data-align=\"left\">Empowering Generalization for Deep 
Reinforcement Learning via Symbolic Planning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Tianpei Yang, Srijita Das, Christabel Wayllace, Matthew E. Taylor<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">102<\/td><td class=\"has-text-align-left\" data-align=\"left\">ADAGE: A generic two-layer framework for adaptive agent based modelling<\/td><td class=\"has-text-align-left\" data-align=\"left\">Benjamin Patrick Evans, Sihan Zeng, Sumitra Ganesh, Leo Ardon<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">103<\/td><td class=\"has-text-align-left\" data-align=\"left\">Truman: A Large Language Model-based Multi-agent Simulator for Synthetic Money Laundering Data Generation<\/td><td class=\"has-text-align-left\" data-align=\"left\">Dattatray Vishnu Kute, Zihao Xu, Yuekang Li, Fethi A Rabhi<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">109<\/td><td class=\"has-text-align-left\" data-align=\"left\">Predicting Team Performance from Communications in Simulated Search-and-Rescue<\/td><td class=\"has-text-align-left\" data-align=\"left\">Ali Jalal-Kamali, Nikolos M Gurney, David V. 
Pynadath<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">113<\/td><td class=\"has-text-align-left\" data-align=\"left\">Local Anomaly Detection with Partial Observation in Multi-agent Systems as a Data Matching Game<\/td><td class=\"has-text-align-left\" data-align=\"left\">Zixin Ye, Christopher Leckie, Tansu Alpcan<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">117<\/td><td class=\"has-text-align-left\" data-align=\"left\">Resource Allocation under the Latin Square Constraint<\/td><td class=\"has-text-align-left\" data-align=\"left\">Yasushi Kawase, Bodhayan Roy, Mohammad Azharuddin Sanpui<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">123<\/td><td class=\"has-text-align-left\" data-align=\"left\">Group Fairness in Multi-period Mobile Facility Location Problems<\/td><td class=\"has-text-align-left\" data-align=\"left\">Haris Aziz, Hau Chan, Xingchen Sha, Toby Walsh, Lirong Xia<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">133<\/td><td class=\"has-text-align-left\" data-align=\"left\">Shapley Value-based Approach for Distributing Revenue of Matchmaking of Private Transactions in Blockchains<\/td><td class=\"has-text-align-left\" data-align=\"left\">Rasheed, Parth Desai, Yash Chaurasia, Sujit Gujar<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">134<\/td><td class=\"has-text-align-left\" data-align=\"left\">Neighborhood Stability in Assignments on Graphs<\/td><td class=\"has-text-align-left\" data-align=\"left\">Haris Aziz, Grzegorz Lisowski, Mashbat Suzuki, Jeremy Vollen<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td 
class=\"has-text-align-left\" data-align=\"left\">155<\/td><td class=\"has-text-align-left\" data-align=\"left\">Transformer Guided Coevolution: Improved Team Formation in Multiagent Adversarial Games<\/td><td class=\"has-text-align-left\" data-align=\"left\">Pranav Rajbhandari, Prithviraj Dasgupta, Donald Sofge<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">172<\/td><td class=\"has-text-align-left\" data-align=\"left\">Robust Strategies for Stochastic Multi-Agent Systems<\/td><td class=\"has-text-align-left\" data-align=\"left\">Rapha\u00ebl Berthon, Joost-Pieter Katoen, Munyque Mittelmann, Aniello Murano<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">173<\/td><td class=\"has-text-align-left\" data-align=\"left\">Shifting Power: Leveraging LLMs to Simulate Human Aversion in ABMs of Bilateral Financial Exchanges, A Bond Market Study<\/td><td class=\"has-text-align-left\" data-align=\"left\">Alicia Vidler, Toby Walsh<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">175<\/td><td class=\"has-text-align-left\" data-align=\"left\">Observer-Aware Probabilistic Planning under Partial Observability<\/td><td class=\"has-text-align-left\" data-align=\"left\">Salom\u00e9 Lepers, Vincent Thomas, Olivier Buffet<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">181<\/td><td class=\"has-text-align-left\" data-align=\"left\">Multi-Agent Systems for Bullying Intervention<\/td><td class=\"has-text-align-left\" data-align=\"left\">Luis Zhinin-Vera, Jos\u00e9 J Gonz\u00e1lez-Garc\u00eda, V\u00edctor L\u00f3pez-Jaquero, Elena Navarro, Pascual Gonz\u00e1lez<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" 
data-align=\"left\">188<\/td><td class=\"has-text-align-left\" data-align=\"left\">Heuristics-Assisted Experience Replay Strategy for Cooperative Multi-Agent Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Xie Yi, Ziqing Zhou, Chun Ouyang, Siao Liu, Linqiang Hu, Zhongxue Gan<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">190<\/td><td class=\"has-text-align-left\" data-align=\"left\">Fair Assignment on Multi-Stage Graphs<\/td><td class=\"has-text-align-left\" data-align=\"left\">Vibulan J, Swapnil Dhamal, Shweta Jain, Ojassvi Kumar, Aman Kumar, Harpreet Singh<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">192<\/td><td class=\"has-text-align-left\" data-align=\"left\">Prompt Tuning with Diffusion for Few-Shot Pre-trained Policy Generalization<\/td><td class=\"has-text-align-left\" data-align=\"left\">Shengchao Hu, Wanru Zhao, Weixiong Lin, Li Shen, Ya Zhang, Dacheng Tao<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">202<\/td><td class=\"has-text-align-left\" data-align=\"left\">Regret Guarantees for a UCB-based Algorithm for Volatile Combinatorial Bandits<\/td><td class=\"has-text-align-left\" data-align=\"left\">Andra Siva Sai Teja, Kumar Abhishek, Sujit Gujar, Yadati Narahari, Ganesh Ghalme<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">205<\/td><td class=\"has-text-align-left\" data-align=\"left\">Voter Participation Control in Online Polls<\/td><td class=\"has-text-align-left\" data-align=\"left\">Koustav De, Palash Dey, Swagato Sanyal<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/drive.google.com\/file\/d\/19n3em-nKIubGOcavYGfBc0VVXNkzK0ev\/view?usp=share_link\" 
target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">217<\/td><td class=\"has-text-align-left\" data-align=\"left\">Learning Heterogeneous Agent Collaboration in Decentralized Multi-Agent Systems via Intrinsic Motivation<\/td><td class=\"has-text-align-left\" data-align=\"left\">Jahir Sadik Monon, Deeparghya Dutta Barua, Md Mosaddek Khan<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">222<\/td><td class=\"has-text-align-left\" data-align=\"left\">Leveraging Fully-Observable Solutions for Improved Partially-Observable Offline Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Chulabhaya Wijesundara, Andrea Baisero, Gregory David Castanon, Alan Carlin, Robert Platt, Christopher Amato<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">223<\/td><td class=\"has-text-align-left\" data-align=\"left\">Fast Adaption by Policy Deviation Integral Meta-reinforcement Learning with Applications to High-speed Trains Operation<\/td><td class=\"has-text-align-left\" data-align=\"left\">Haotong Zhang, Wanyuan Wang<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">235<\/td><td class=\"has-text-align-left\" data-align=\"left\">RallyDiffuser: A Representation-Guided Diffusion Model Framework for Strategic Planning in Badminton<\/td><td class=\"has-text-align-left\" data-align=\"left\">Bing-Zhi Ke, Kuang-Da Wang, Wen-Chih Peng<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">253<\/td><td class=\"has-text-align-left\" data-align=\"left\">Negotiated Reasoning: On Provably Addressing Relative Over-Generalization<\/td><td class=\"has-text-align-left\" data-align=\"left\">Junjie 
Sheng, Wenhao Li, Bo Jin, Hongyuan Zha, Jun Wang, Xiangfeng Wang<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">260<\/td><td class=\"has-text-align-left\" data-align=\"left\">Dynamic Conservative Degree Allocation for Offline Multi-Agent Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Haosheng Chen, Yun Hua, Junjie Sheng, Wenhao Li, Bo Jin, Xiangfeng Wang<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">267<\/td><td class=\"has-text-align-left\" data-align=\"left\">Stochastic k-Submodular Bandits with Full Bandit Feedback<\/td><td class=\"has-text-align-left\" data-align=\"left\">Guanyu Nie, Vaneet Aggarwal, Christopher John Quinn<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">274<\/td><td class=\"has-text-align-left\" data-align=\"left\">Learning Fair and Preferable Allocations through Neural Network<\/td><td class=\"has-text-align-left\" data-align=\"left\">Ryota Maruo, Koh Takeuchi, Hisashi Kashima<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">275<\/td><td class=\"has-text-align-left\" data-align=\"left\">MORL4Water: A Modular Multi-Objective Reinforcement Learning Toolkit for Water Resource Management<\/td><td class=\"has-text-align-left\" data-align=\"left\">Zuzanna Osika, Roxana R\u0103dulescu, Jazmin Zatarain Salazar, Frans A Oliehoek, Pradeep K. 
Murukannaiah<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">278<\/td><td class=\"has-text-align-left\" data-align=\"left\">Towards Automating the Design of Value-Aligned Clinical Protocols<\/td><td class=\"has-text-align-left\" data-align=\"left\">Manel Rodriguez-Soto, Nardine Osman, Carles Sierra, Rocio Cintas-Garcia, Cristina Farriols-Danes, Montserrat Garcia-Retortillo, Silvia Minguez-Maso, Jordi Martinez-Roldan<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">296<\/td><td class=\"has-text-align-left\" data-align=\"left\">Adaptive Offline Data Replay in Offline-to-Online Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Xu Liu, Tong Yu, Shuai Li<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">304<\/td><td class=\"has-text-align-left\" data-align=\"left\">Enhancing Offline Safe Reinforcement Learning with Trajectory-Constrained Diffusion Planning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Hengrui Zhang, Youfang Lin, Shuo Shen, Hanfeng Lin, Peng Cheng, Sheng Han, Kai Lv<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">311<\/td><td class=\"has-text-align-left\" data-align=\"left\">IBGP: Imperfect Byzantine Generals Problem for Zero-Shot Robustness in Communicative Multi-Agent Systems<\/td><td class=\"has-text-align-left\" data-align=\"left\">Yihuan Mao, Yipeng Kang, Peilun Li, Ning Zhang, Wei Xu, Chongjie Zhang<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">317<\/td><td class=\"has-text-align-left\" data-align=\"left\">CADP: Towards Better Centralized Learning for Decentralized Execution in MARL<\/td><td 
class=\"has-text-align-left\" data-align=\"left\">Yihe Zhou, Shunyu Liu, Yunpeng Qing, Tongya Zheng, Kaixuan Chen, Jie Song, Mingli Song<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">347<\/td><td class=\"has-text-align-left\" data-align=\"left\">On the Distortion of Multi-Winner Elections on the Line Metric<\/td><td class=\"has-text-align-left\" data-align=\"left\">Negar Babashah, Hasti Karimi, Masoud Seddighin, Golnoosh Shahkarami<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">348<\/td><td class=\"has-text-align-left\" data-align=\"left\">Enhancing Lifelong Multi-Agent Path-finding by Using Artificial Potential Fields<\/td><td class=\"has-text-align-left\" data-align=\"left\">Arseniy Pertzovsky, Roni Stern, Roie Zivan, Ariel Felner<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/www.youtube.com\/watch?v=0VBcFXBY7Qg\" target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">350<\/td><td class=\"has-text-align-left\" data-align=\"left\">On-Policy Reinforcement Learning From Failure via Sparse Reward Densification<\/td><td class=\"has-text-align-left\" data-align=\"left\">Mingkang Wu, Yongcan Cao<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">362<\/td><td class=\"has-text-align-left\" data-align=\"left\">Enhancing Robot Navigation Policies with Task-Specific Uncertainty Management<\/td><td class=\"has-text-align-left\" data-align=\"left\">Gokul Puthumanaillam, Paulo Padrao, Jose Fuentes, Leonardo Bobadilla, Melkior Ornik<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">364<\/td><td class=\"has-text-align-left\" data-align=\"left\">DyLam: A Dynamic 
Reward Weighting Framework for Reinforcement Learning Algorithms<\/td><td class=\"has-text-align-left\" data-align=\"left\">Mateus Gon\u00e7alves Machado, Hansenclever Bassani<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/www.youtube.com\/watch?v=Y1tKJ5YFBZs\" target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">365<\/td><td class=\"has-text-align-left\" data-align=\"left\">Requirements-based Explainability for Multi Agent Systems<\/td><td class=\"has-text-align-left\" data-align=\"left\">Sebastian Rodriguez, John Thangarajah, Michael Winikoff<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">366<\/td><td class=\"has-text-align-left\" data-align=\"left\">The Effectiveness of Best-Response Dynamics in Reducing Price of Anarchy for Markov Potential Games<\/td><td class=\"has-text-align-left\" data-align=\"left\">Dingyang Chen, Xiaoling Zeng, Thinh T. Doan, Qi Zhang<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">380<\/td><td class=\"has-text-align-left\" data-align=\"left\">Learning Bayesian Game Families, with Application To Mechanism Design<\/td><td class=\"has-text-align-left\" data-align=\"left\">Madelyn Gatchel, Michael P. Wellman<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">386<\/td><td class=\"has-text-align-left\" data-align=\"left\">Policies with Sparse Inter-Agent Dependencies in Dynamic Games: A Dynamic Programming Approach<\/td><td class=\"has-text-align-left\" data-align=\"left\">Xinjie Liu, Jingqi Li, Filippos Fotiadis, Mustafa O. 
Karabag, Jesse Milzman, David Fridovich-Keil, Ufuk Topcu<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/www.youtube.com\/watch?v=un-0I8votLw\" target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">396<\/td><td class=\"has-text-align-left\" data-align=\"left\">Optimal Mechanism Design for Crowdfunding of Public Goods<\/td><td class=\"has-text-align-left\" data-align=\"left\">Yukun Cheng, Xiaotie Deng, Baqiao Quan<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/www.youtube.com\/watch?v=sxMymkgMl8Q\" target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">426<\/td><td class=\"has-text-align-left\" data-align=\"left\">Adaptive Budget Optimization for Multichannel Advertising Using Combinatorial Bandits<\/td><td class=\"has-text-align-left\" data-align=\"left\">Briti Gangopadhyay, Zhao Wang, Alberto Silvio Chiappa, Shingo Takamatsu<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/drive.google.com\/file\/d\/1MbvSHRQljuRi9Gel3OnRoTZ7RZowr_sJ\/view?usp=sharing\" target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">429<\/td><td class=\"has-text-align-left\" data-align=\"left\">Parameterized Complexity of Hedonic Games with Enemy-Oriented Preferences<\/td><td class=\"has-text-align-left\" data-align=\"left\">Martin Durand, Laurin Erlacher, Johanne M\u00fcller Vistisen, Sofia Simola<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">433<\/td><td class=\"has-text-align-left\" data-align=\"left\">Egalitarianism in Online Coalition Formation<\/td><td class=\"has-text-align-left\" data-align=\"left\">Saar Cohen, Noa Agmon<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td 
class=\"has-text-align-left\" data-align=\"left\">444<\/td><td class=\"has-text-align-left\" data-align=\"left\">Distributed Value Decomposition Networks with Networked Agents<\/td><td class=\"has-text-align-left\" data-align=\"left\">Guilherme S. Varela, Alberto Sardinha, Francisco S. Melo<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">448<\/td><td class=\"has-text-align-left\" data-align=\"left\">Interaction Protocols in an Imperative Agent-Oriented Programming Language: the case of BSPL and SARL<\/td><td class=\"has-text-align-left\" data-align=\"left\">Matteo Baldoni, Cristina Baroglio, St\u00e9phane Galland, Roberto Micalizio, Fatma Outay, Stefano Tedeschi<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">449<\/td><td class=\"has-text-align-left\" data-align=\"left\">Managing an Agent\u2019s Changing Intentions Using LTL\ud835\udc53 Synthesis<\/td><td class=\"has-text-align-left\" data-align=\"left\">Giuseppe De Giacomo, Yves Lesperance, Gianmarco Parretti, Fabio Patrizi, Renzo Schram<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">452<\/td><td class=\"has-text-align-left\" data-align=\"left\">Compensating latent nonlinear dynamics for practical consensus control<\/td><td class=\"has-text-align-left\" data-align=\"left\">Krzysztof Kowalczyk, Dominik Baumann, Cristian R. 
Rojas, Pawe\u0142 Wachel<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">463<\/td><td class=\"has-text-align-left\" data-align=\"left\">CDSA: Conservative Denoising Score-based Algorithm for Offline Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Zeyuan Liu, Yang Kai, Jiafei Lyu, Xiu Li<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">464<\/td><td class=\"has-text-align-left\" data-align=\"left\">Social Ranking for Feature Selection<\/td><td class=\"has-text-align-left\" data-align=\"left\">Laurent Gourv\u00e8s, Stefano Moretti, Satya Tamby<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">483<\/td><td class=\"has-text-align-left\" data-align=\"left\">Learning Pre-Trained Tacit Behavior for Efficient Multi-Agent Adversarial Coordination<\/td><td class=\"has-text-align-left\" data-align=\"left\">Shiqing Yao, Jiajun Chai, Haixin Yu, Yongzhe Chang, Yuanheng Zhu, Xueqian Wang<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">505<\/td><td class=\"has-text-align-left\" data-align=\"left\">Reducing Variance Caused by Communication in Decentralized Multi-agent Deep Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Changxi Zhu, Mehdi Dastani, Shihan Wang<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">507<\/td><td class=\"has-text-align-left\" data-align=\"left\">Making Universal Policies Universal<\/td><td class=\"has-text-align-left\" data-align=\"left\">Niklas Hoepner, David Kuric, Herke Van Hoof<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" 
data-align=\"left\">520<\/td><td class=\"has-text-align-left\" data-align=\"left\">Boosting Robustness in Preference-Based Reinforcement Learning with Dynamic Sparsity<\/td><td class=\"has-text-align-left\" data-align=\"left\">Calarina Muslimani, Bram Grooten, Deepak Ranganatha Sastry Mamillapalli, Mykola Pechenizkiy, Decebal Constantin Mocanu, Matthew E. Taylor<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">525<\/td><td class=\"has-text-align-left\" data-align=\"left\">LogiEx: Integrating Formal Logic and Large Language Model for Explainable Planning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Ziyan An, Xia Wang, Hendrik Baier, Zirong Chen, Abhishek Dubey, Taylor T Johnson, Jonathan Sprinkle, Ayan Mukhopadhyay, Meiyi Ma<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">541<\/td><td class=\"has-text-align-left\" data-align=\"left\">ChatBDI: Think BDI, Talk LLM<\/td><td class=\"has-text-align-left\" data-align=\"left\">Andrea Gatti, Viviana Mascardi, Angelo Ferrando<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">546<\/td><td class=\"has-text-align-left\" data-align=\"left\">Modeling the Collaborative Edge Data Caching Problem via a Dynamic DCOP<\/td><td class=\"has-text-align-left\" data-align=\"left\">Ziyang Song, Ziyu Chen, Jinhui Huang, Cheng Zhang, Jingyuan He<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">547<\/td><td class=\"has-text-align-left\" data-align=\"left\">Reasoning and Planning with Dynamic Social Norms<\/td><td class=\"has-text-align-left\" data-align=\"left\">Taylor Olson, Roberto Salas-Damian, Kenneth Forbus<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td 
class=\"has-text-align-left\" data-align=\"left\">557<\/td><td class=\"has-text-align-left\" data-align=\"left\">Predictive Improvement through Latent Space Optimisation<\/td><td class=\"has-text-align-left\" data-align=\"left\">Alexander McCaffrey, Eduardo Alonso, Esther Mondragon<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">565<\/td><td class=\"has-text-align-left\" data-align=\"left\">Knowledge Transfer in Model-Based Reinforcement Learning Agents for Efficient Multi-Task Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Dmytro Kuzmenko, Nadiya Shvai<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">584<\/td><td class=\"has-text-align-left\" data-align=\"left\">Hierarchical Multi-agent Reinforcement Learning for Cyber Network Defense<\/td><td class=\"has-text-align-left\" data-align=\"left\">Aditya Vikram Singh, Ethan Rathbun, Emma Graham, Lisa Oakley, Simona Boboila, Alina Oprea, Peter Chin<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">586<\/td><td class=\"has-text-align-left\" data-align=\"left\">Practical Comparisons of Reservoir Topology Performance and Input Distribution in Digital Reservoir Computers<\/td><td class=\"has-text-align-left\" data-align=\"left\">Lewis Thelen, Vikram Ravindra<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">588<\/td><td class=\"has-text-align-left\" data-align=\"left\">Dynamic Reward Sharing to Enhance Learning in the Context of Multiagent Teams<\/td><td class=\"has-text-align-left\" data-align=\"left\">Kyle Tilbury, David Radke<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">590<\/td><td 
class=\"has-text-align-left\" data-align=\"left\">AlphaZeroES: Direct Score Maximization Outperforms Planning Loss Minimization<\/td><td class=\"has-text-align-left\" data-align=\"left\">Carlos Martin, Tuomas Sandholm<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">626<\/td><td class=\"has-text-align-left\" data-align=\"left\">Rethinking Explainable AI: Explanations can be Deceiving<\/td><td class=\"has-text-align-left\" data-align=\"left\">Peta Masters, Daniel Gallagher, Luc Moreau, Mor Vered<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">644<\/td><td class=\"has-text-align-left\" data-align=\"left\">FedHPD: Heterogeneous Federated Reinforcement Learning via Policy Distillation<\/td><td class=\"has-text-align-left\" data-align=\"left\">Wenzheng Jiang, Ji Wang, Xiongtao Zhang, Weidong Bao, Cheston Tan, Flint Xiaofeng Fan<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">656<\/td><td class=\"has-text-align-left\" data-align=\"left\">Navigating Social Dilemmas with LLM-based Agents via Consideration of Future Consequences<\/td><td class=\"has-text-align-left\" data-align=\"left\">Dung Nguyen, Hung Le, Kien Do, Sunil Gupta, Svetha Venkatesh, Truyen Tran<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">673<\/td><td class=\"has-text-align-left\" data-align=\"left\">The Costly Bargain: Economic Impacts of Price-Seeking Behavior in Aging Populations<\/td><td class=\"has-text-align-left\" data-align=\"left\">Fuguang Chen, Alan Tsang<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">677<\/td><td class=\"has-text-align-left\" data-align=\"left\">Traffic Anomaly Detection through 
Generative Modeling of Multi-Agent Interactions in Traffic Flow<\/td><td class=\"has-text-align-left\" data-align=\"left\">Zhuojun Chen, Tacitus Hui, Xinghua Zhu, Dongzhe Su<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">682<\/td><td class=\"has-text-align-left\" data-align=\"left\">Satisfactory Budget Division<\/td><td class=\"has-text-align-left\" data-align=\"left\">Laurent Gourv\u00e8s, Michael Lampis, Nikolaos Melissinos, Aris Pagourtzis<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">689<\/td><td class=\"has-text-align-left\" data-align=\"left\">Decentralized Deep Reinforcement Learning for Cooperative Multi-Agent Flight Trajectory Planning in Adverse Weather<\/td><td class=\"has-text-align-left\" data-align=\"left\">Bizhao Pang, Mingcheng Zhang, Xinting Hu, Sameer Alam, Guglielmo Lulli<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">705<\/td><td class=\"has-text-align-left\" data-align=\"left\">Mitigating Non-Stationarity in Deep Reinforcement Learning with Clustering Orthogonal Weight Modification<\/td><td class=\"has-text-align-left\" data-align=\"left\">Guoqing Ma, Yuhan Zhang, Yuming Dai, Guangfu Hao, Yang Chen, Shan Yu<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">722<\/td><td class=\"has-text-align-left\" data-align=\"left\">SFedRec: A Federated Learning Framework for Dynamic Session-based Recommendation<\/td><td class=\"has-text-align-left\" data-align=\"left\">Hexiao Zhang, Yanni Tang, Jiamou Liu, Wu Chen<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">723<\/td><td class=\"has-text-align-left\" data-align=\"left\">Environmental Policies within 
Cournot Oligopoly<\/td><td class=\"has-text-align-left\" data-align=\"left\">Liang Shan, Zhengyang Liu, Haoqiang Huang, Zihe Wang<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">732<\/td><td class=\"has-text-align-left\" data-align=\"left\">Efficient Training of Generalizable Visuomotor Policies via Control-Aware Augmentation<\/td><td class=\"has-text-align-left\" data-align=\"left\">Yinuo Zhao, Kun Wu, Tianjiao Yi, Zhiyuan Xu, Zhengping Che, Chi Harold Liu, Jian Tang<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">735<\/td><td class=\"has-text-align-left\" data-align=\"left\">Multiplayer Games With Incomplete Information for Hyperproperty Verification<\/td><td class=\"has-text-align-left\" data-align=\"left\">Raven Beutner, Bernd Finkbeiner<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">736<\/td><td class=\"has-text-align-left\" data-align=\"left\">RainbowArena: A Multi-Agent Toolkit for Reinforcement Learning and Large Language Models in Competitive Tabletop Games<\/td><td class=\"has-text-align-left\" data-align=\"left\">Yingzhuo Liu, Shuodi Liu, Hongsong Tang, Yubing Ma, Zikang Li, Junge Zhang, Liuyu Xiang, Zhaofeng He<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">747<\/td><td class=\"has-text-align-left\" data-align=\"left\">Multi-Agent Pickup and Delivery with Batteries<\/td><td class=\"has-text-align-left\" data-align=\"left\">Marcello Bavaro, Francesco Amigoni<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">755<\/td><td class=\"has-text-align-left\" data-align=\"left\">Model of the influence of external signals on the trust of the agent in Multi Agent 
System<\/td><td class=\"has-text-align-left\" data-align=\"left\">Frederique Lalieu, Tomasz Zurek, Tom Van Engers<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">758<\/td><td class=\"has-text-align-left\" data-align=\"left\">What Is a Counterfactual Cause in Action Theories?<\/td><td class=\"has-text-align-left\" data-align=\"left\">Daxin Liu, Vaishak Belle<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">768<\/td><td class=\"has-text-align-left\" data-align=\"left\">Quantitative Operational Monitoring for BDI Agents<\/td><td class=\"has-text-align-left\" data-align=\"left\">Marie Farrell, Angelo Ferrando, Mengwei Xu<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">782<\/td><td class=\"has-text-align-left\" data-align=\"left\">Integrating Large Language Models with Reinforcement Learning for Generalization in Strategic Card Games<\/td><td class=\"has-text-align-left\" data-align=\"left\">Wannian Xia, Meng Fang, Zihao Guo, Yali Du, Bo Xu<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">814<\/td><td class=\"has-text-align-left\" data-align=\"left\">Lite-DIO Is Actually What You Need for Efficient Inertial Localization<\/td><td class=\"has-text-align-left\" data-align=\"left\">Yan Li, Meng Liu, Zhongchen Shi, Yanqing Hou, Liang Xie, Hongbo Chen, Erwei Yin<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">824<\/td><td class=\"has-text-align-left\" data-align=\"left\">Equilibrium selection via communication partition<\/td><td class=\"has-text-align-left\" data-align=\"left\">Wei-Chen Lee, Alessandro Abate, Michael J. 
Wooldridge<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">826<\/td><td class=\"has-text-align-left\" data-align=\"left\">Bidirectional Distillation: A Mixed-Play Framework for Multi-Agent Generalizable Behaviors<\/td><td class=\"has-text-align-left\" data-align=\"left\">Lang Feng, Jiahao Lin, Dong Xing, Li Zhang, De Ma, Gang Pan<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">842<\/td><td class=\"has-text-align-left\" data-align=\"left\">Experience-replay Innovative Dynamics<\/td><td class=\"has-text-align-left\" data-align=\"left\">Tuo Zhang, Leonardo Stella, Julian Barreiro-Gomez<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">844<\/td><td class=\"has-text-align-left\" data-align=\"left\">Multi-Agent Reinforcement Learning with Selective State-Space Models<\/td><td class=\"has-text-align-left\" data-align=\"left\">Jemma Daniel, Ruan John De Kock, Louay Ben Nessir, Sasha Abramowitz, Omayma Mahjoub, Wiem Khlifi, Juan Claude Formanek, Arnu Pretorius<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">860<\/td><td class=\"has-text-align-left\" data-align=\"left\">Entropic Exploration for Constrained Multiagent Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Ayhan Alp Aydeniz, Enrico Marchesini, Robert Loftin, Christopher Amato, Kagan Tumer<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">862<\/td><td class=\"has-text-align-left\" data-align=\"left\">Decision-Making in Evolving Environments: A Bayesian Multi-Agent Bandit Framework<\/td><td class=\"has-text-align-left\" data-align=\"left\">Mohammad Essa Alsomali, Leandro Soriano Marcolino, 
Barry Porter, Roberto Rodrigues-Filho<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">863<\/td><td class=\"has-text-align-left\" data-align=\"left\">CPE: A New Paradigm for Policy Extraction in Offline Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Zhaohui Yang, Xiaoxuan Wang, Linjing Li<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">869<\/td><td class=\"has-text-align-left\" data-align=\"left\">Agential AI for Integrated Continual Learning, Deliberative Behavior, and Comprehensible Models<\/td><td class=\"has-text-align-left\" data-align=\"left\">Zeki Doruk Erden, Boi Faltings<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/youtu.be\/xpA5Xgn26jo?si=opZx2pCt8h9iuTuS\" target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">876<\/td><td class=\"has-text-align-left\" data-align=\"left\">Runtime Verification with Rational Multi-Monitors<\/td><td class=\"has-text-align-left\" data-align=\"left\">Davide Catta, Angelo Ferrando, Vadim Malvone<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">877<\/td><td class=\"has-text-align-left\" data-align=\"left\">Where is the nearest EV charging station? 
Evolutionary optimization of the gas\/charging stations topology<\/td><td class=\"has-text-align-left\" data-align=\"left\">Enrique Mateos-Melero, Javier Moralejo-Pi\u00f1as, \u00c1ngela Dur\u00e1n-Pinto, Francisco Martinez-Gil, Mar\u00eda Soriano, Fernando Fern\u00e1ndez<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">890<\/td><td class=\"has-text-align-left\" data-align=\"left\">Improving the effectiveness of potential-based reward shaping in reinforcement learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Henrik M\u00fcller, Daniel Kudenko<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">897<\/td><td class=\"has-text-align-left\" data-align=\"left\">Can you see how I learn? Human observers\u2019 inferences about Reinforcement Learning agents\u2019 learning processes<\/td><td class=\"has-text-align-left\" data-align=\"left\">Bernhard Hilpert, Muhan Hou, Kim Baraka, Joost Broekens<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">906<\/td><td class=\"has-text-align-left\" data-align=\"left\">Distributed Adaptive Macroscopic Ensemble Task Allocation of Heterogeneous Robot Teams in Dynamic Environments<\/td><td class=\"has-text-align-left\" data-align=\"left\">Victoria Edwards, M. 
Ani Hsieh<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">949<\/td><td class=\"has-text-align-left\" data-align=\"left\">Trading-off Accuracy and Communication Cost in Federated Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Mattia Jacopo Villani, Emanuele Natale, Frederik Mallmann-Trenn<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">951<\/td><td class=\"has-text-align-left\" data-align=\"left\">When to Stop Getting Tested: The Theory of Diagnostic Tests<\/td><td class=\"has-text-align-left\" data-align=\"left\">Anson Kahng, Joseph Saber<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">952<\/td><td class=\"has-text-align-left\" data-align=\"left\">Cultural Evolution of Cooperation among LLM Agents<\/td><td class=\"has-text-align-left\" data-align=\"left\">Aron Vallinder, Edward Hughes<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">957<\/td><td class=\"has-text-align-left\" data-align=\"left\">Is an exponentially growing action space really that bad? Validating a Core Assumption for using Multi-Agent RL<\/td><td class=\"has-text-align-left\" data-align=\"left\">Ruan John De Kock, Arnu Pretorius, Jonathan P. 
Shock<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">962<\/td><td class=\"has-text-align-left\" data-align=\"left\">Adaptive Multi-Round Influence Maximization with Limited Information<\/td><td class=\"has-text-align-left\" data-align=\"left\">Diodato Ferraioli, Vincenzo Auletta, Cosimo Vinci, Francesco Carbone<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">970<\/td><td class=\"has-text-align-left\" data-align=\"left\">Weighted Envy Freeness With Bounded Subsidies<\/td><td class=\"has-text-align-left\" data-align=\"left\">Noga Klein Elmalem, Rica Gonen, Erel Segal-Halevi<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">971<\/td><td class=\"has-text-align-left\" data-align=\"left\">Combining Normative Ethics Principles to Learn Prosocial Behaviour<\/td><td class=\"has-text-align-left\" data-align=\"left\">Jessica Woodgate, Nirav Ajmeri<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/jessica-woodgate.github.io\/publications\/AAMAS25_combining_video.html\" target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">972<\/td><td class=\"has-text-align-left\" data-align=\"left\">Participatory Budgeting Project Strength via Candidate Control<\/td><td class=\"has-text-align-left\" data-align=\"left\">Piotr Faliszewski, \u0141ukasz Janeczko, Du\u0161an Knop, Jan Pokorn\u00fd, \u0160imon Schierreich, Mateusz S\u0142uszniak, Krzysztof Sornat<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">975<\/td><td class=\"has-text-align-left\" data-align=\"left\">Bridging the Gap between Partially Observable Stochastic Games and Sparse POMDP Methods<\/td><td 
class=\"has-text-align-left\" data-align=\"left\">Tyler Becker, Zachary N Sunberg<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">978<\/td><td class=\"has-text-align-left\" data-align=\"left\">Towards Fair and Efficient Policy Learning in Cooperative Multi-Agent Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Umer Siddique, Peilang Li, Yongcan Cao<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">991<\/td><td class=\"has-text-align-left\" data-align=\"left\">Diversity-seeking swap games in networks<\/td><td class=\"has-text-align-left\" data-align=\"left\">Yaqiao Li, Lata Narayanan, Jaroslav Opatrny<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">993<\/td><td class=\"has-text-align-left\" data-align=\"left\">(Submodular) Hedonic Games with Common Ranking Property<\/td><td class=\"has-text-align-left\" data-align=\"left\">Bugra Caskurlu, Ali Eser<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1002<\/td><td class=\"has-text-align-left\" data-align=\"left\">Action-Dependent Optimality-Preserving Reward Shaping<\/td><td class=\"has-text-align-left\" data-align=\"left\">Grant Collier Forbes, Jianxun Wang, Leonardo Villalobos-Arias, Arnav Jhala, David Roberts<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/drive.google.com\/file\/d\/1TtZwHAxOCcp-1QWBePWi3_AwTx_Xul5P\/view?usp=sharing\" target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1018<\/td><td class=\"has-text-align-left\" data-align=\"left\">Planning for Temporally Extended Goals based on alpha-CTL<\/td><td class=\"has-text-align-left\" 
data-align=\"left\">Viviane Bonadia Dos Santos, Leliane N. De Barros, Maria Viviane De Menezes, Silvio Do Lago Pereira<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1021<\/td><td class=\"has-text-align-left\" data-align=\"left\">Efficient Multi-Agent Delegated Search<\/td><td class=\"has-text-align-left\" data-align=\"left\">Curtis Bechtel, Shaddin Dughmi<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1025<\/td><td class=\"has-text-align-left\" data-align=\"left\">Fairness in Cooperative Multiagent Multiobjective Reinforcement Learning using the Expected Scalarized Reward Criterion<\/td><td class=\"has-text-align-left\" data-align=\"left\">Fares Chouaki, Aur\u00e9lie Beynier, Nicolas Maudet, Paolo Viappiani<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1040<\/td><td class=\"has-text-align-left\" data-align=\"left\">Formal Verification of Manipulation Dialogues<\/td><td class=\"has-text-align-left\" data-align=\"left\">Andreas Br\u00e4nnstr\u00f6m, Chiaki Sakama, Juan Carlos Nieves<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1042<\/td><td class=\"has-text-align-left\" data-align=\"left\">Learning to explore when mistakes are not allowed<\/td><td class=\"has-text-align-left\" data-align=\"left\">Charly Pecqueux-Gu\u00e9z\u00e9nec, Stephane Doncieux, Nicolas Perrin-Gilbert<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1053<\/td><td class=\"has-text-align-left\" data-align=\"left\">Tools in the Loop: Quantifying Uncertainty of LLM Question Answering Systems That Use Tools<\/td><td class=\"has-text-align-left\" data-align=\"left\">Panagiotis Lymperopoulos, 
Vasanth Sarathy<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1070<\/td><td class=\"has-text-align-left\" data-align=\"left\">DECAF: Learning to be Fair in Multi-agent Resource Allocation<\/td><td class=\"has-text-align-left\" data-align=\"left\">Ashwin Kumar, William Yeoh<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1073<\/td><td class=\"has-text-align-left\" data-align=\"left\">Online Competitive Information Gathering for Partially Observable Trajectory Games<\/td><td class=\"has-text-align-left\" data-align=\"left\">Mel Krusniak, Hang Xu, Parker Palermo, Forrest John Laine<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1090<\/td><td class=\"has-text-align-left\" data-align=\"left\">Diverse Heterogeneous Graph Conditioned Diffusion for Multi-Agent Teaming<\/td><td class=\"has-text-align-left\" data-align=\"left\">Luis Manuel Pimentel, Sean Charles Ye, James Ellis Grant Pagan, Matthew Gombolay<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1104<\/td><td class=\"has-text-align-left\" data-align=\"left\">Symplex: Learning social norm hierarchies by combining autonomous exploration and expert imitation<\/td><td class=\"has-text-align-left\" data-align=\"left\">Oliver Deane, Oliver Ray<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1138<\/td><td class=\"has-text-align-left\" data-align=\"left\">Weighted Envy-free Allocation with Subsidy<\/td><td class=\"has-text-align-left\" data-align=\"left\">Haris Aziz, Xin Huang, Kei Kimura, Indrajit Saha, Zhaohong Sun, Mashbat Suzuki, Makoto Yokoo<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td 
class=\"has-text-align-left\" data-align=\"left\">1141<\/td><td class=\"has-text-align-left\" data-align=\"left\">Learning Flexible Heterogeneous Coordination With Capability-Aware Shared Hypernetworks<\/td><td class=\"has-text-align-left\" data-align=\"left\">Kevin Fu, Pierce Howell, Shalin Jain, Harish Ravichandar<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1154<\/td><td class=\"has-text-align-left\" data-align=\"left\">Evaluating and Improving Graph-based Explanation Methods for Multi-Agent Coordination<\/td><td class=\"has-text-align-left\" data-align=\"left\">Siva Kailas, Shalin Jain, Harish Ravichandar<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1155<\/td><td class=\"has-text-align-left\" data-align=\"left\">Liquid Welfare and Revenue Monotonicity in Adaptive Clinching Auctions<\/td><td class=\"has-text-align-left\" data-align=\"left\">Ryosuke Sato<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1163<\/td><td class=\"has-text-align-left\" data-align=\"left\">Open-World Classification with Bayesian Gaussian Mixture Models<\/td><td class=\"has-text-align-left\" data-align=\"left\">Justin Clarke, Przemyslaw A. 
Grabowicz, David Jensen<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1194<\/td><td class=\"has-text-align-left\" data-align=\"left\">Asynchronous Cooperative Multi-Agent Reinforcement Learning with Limited Communication<\/td><td class=\"has-text-align-left\" data-align=\"left\">Sydney Dolan, Siddharth Nayak, Jasmine Jerry Aloor, Hamsa Balakrishnan<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1204<\/td><td class=\"has-text-align-left\" data-align=\"left\">Resolving Multiple-Dynamic Model Uncertainty in Hypothesis-Driven Belief-MDPs<\/td><td class=\"has-text-align-left\" data-align=\"left\">Ofer Dagan, Tyler Becker, Zachary N Sunberg<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1210<\/td><td class=\"has-text-align-left\" data-align=\"left\">Matching Markets with Chores<\/td><td class=\"has-text-align-left\" data-align=\"left\">Thorben Tr\u00f6bst, Jugal Garg, Vijay Vazirani<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1216<\/td><td class=\"has-text-align-left\" data-align=\"left\">EconTwo: A Two-Level Multi-Agent Framework for Dynamic Macroeconomic Modeling with Shock Resilience<\/td><td class=\"has-text-align-left\" data-align=\"left\">Zhixun Chen, Zijing Shi, Yaodong Yang, Meng Fang, Yali Du<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1237<\/td><td class=\"has-text-align-left\" data-align=\"left\">Group-fair Facility Location Games with Externalities<\/td><td class=\"has-text-align-left\" data-align=\"left\">Minming Li, Cheng Peng, Ying Wang, Houyu Zhou<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td 
class=\"has-text-align-left\" data-align=\"left\">1254<\/td><td class=\"has-text-align-left\" data-align=\"left\">Using Assistance Rewards Without Introducing Bias: Overcoming Sparse Rewards in Multi-Agent Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Yue Yang, Bernd Meyer, Frits De Nijs<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1262<\/td><td class=\"has-text-align-left\" data-align=\"left\">Pure Nash Equilibrium and Strong Nash Equilibrium Computation in Aggregate Games<\/td><td class=\"has-text-align-left\" data-align=\"left\">Jared Soundy, Mohammad T. Irfan, Hau Chan<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1263<\/td><td class=\"has-text-align-left\" data-align=\"left\">On the existence of EFX allocations in multigraphs<\/td><td class=\"has-text-align-left\" data-align=\"left\">Alkmini Sgouritsa, Minas Marios Sotiriou<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/drive.google.com\/file\/d\/1sgXU1MYGVzNOXpF90VYGTyqcf7jxdl1d\/view?usp=drive_link\" target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1291<\/td><td class=\"has-text-align-left\" data-align=\"left\">Decoding Negotiation Dynamics: The Impact of Opponent Identity and Privacy on Strategy, Deception, and Emotional Transparency in Human-Agent Interaction<\/td><td class=\"has-text-align-left\" data-align=\"left\">Nusrath Jahan, Johnathan Mell<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1297<\/td><td class=\"has-text-align-left\" data-align=\"left\">Tacit Learning with Adaptive Information Selection for Cooperative Multi-Agent Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Lunjun 
Liu, Weilai Jiang, Yaonan Wang<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1308<\/td><td class=\"has-text-align-left\" data-align=\"left\">Will Systems of LLM Agents Lead to Cooperation: An Investigation into a Social Dilemma<\/td><td class=\"has-text-align-left\" data-align=\"left\">Richard Willis, Yali Du, Joel Z Leibo<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/www.dropbox.com\/scl\/fi\/6m0csb0lmjbe6o8hnqo7g\/llm.mp4?rlkey=3rgrl8a6xjm9r3nnuryz5nc4k&amp;st=u7o1oram&amp;dl=0\" target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1335<\/td><td class=\"has-text-align-left\" data-align=\"left\">To Stand on the Shoulders of Giants: Should We Protect Initial Discoveries in Multi-Agent Exploration?<\/td><td class=\"has-text-align-left\" data-align=\"left\">Hodaya Lampert, Reshef Meir, Kinneret Teodorescu<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1348<\/td><td class=\"has-text-align-left\" data-align=\"left\">Coordinating Competing Electric Vehicle Fleets: An Agent-Based Charging Capacity Market<\/td><td class=\"has-text-align-left\" data-align=\"left\">Lennard Sund, Janik Muires, Ramin Ahadi, Konstantina Valogianni, Wolfgang Ketter<\/td><td class=\"has-text-align-left\" data-align=\"left\"><a href=\"https:\/\/vimeo.com\/1066575001\/2587eb2c60?share=copy\" target=\"_blank\" rel=\"noreferrer noopener\">Link<\/a><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1359<\/td><td class=\"has-text-align-left\" data-align=\"left\">Fusing Physical and Cognitive Stimuli: An Eye Movement Emotion Recognition Framework Based on Hierarchical Attention Mechanism<\/td><td class=\"has-text-align-left\" data-align=\"left\">Zhi Lin Li, Xiaomei Tao<\/td><td class=\"has-text-align-left\" 
data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1366<\/td><td class=\"has-text-align-left\" data-align=\"left\">Adaptive Microtolling in Competitive Online Congestion Games via Multiagent Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Behrad Koohy, Sebastian Stein, Enrico Gerding<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1384<\/td><td class=\"has-text-align-left\" data-align=\"left\">Context Adaptive Memory-Efficient LLM Inference for Edge Multi-Agent Systems<\/td><td class=\"has-text-align-left\" data-align=\"left\">Hamza Mohammed, Sai Chand Boyapati, Hang Yin<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><tr><td class=\"has-text-align-left\" data-align=\"left\">1395<\/td><td class=\"has-text-align-left\" data-align=\"left\">A Minimalist Approach to Augmentation-based Self-supervised Representation Learning for On-policy Reinforcement Learning<\/td><td class=\"has-text-align-left\" data-align=\"left\">Nasik Muhammad Nafi, William Hsu<\/td><td class=\"has-text-align-left\" data-align=\"left\"><\/td><\/tr><\/tbody><\/table><\/figure>\n","protected":false},"excerpt":{"rendered":"<p>Accepted Extended Abstracts (Main Technical Track) Some extended abstracts have links to author-made short video presentations (typically about 5 minutes long) in the last 
column.&hellip;<\/p>\n","protected":false},"author":1,"featured_media":0,"parent":116,"menu_order":0,"comment_status":"closed","ping_status":"closed","template":"","meta":{"footnotes":""},"_links":{"self":[{"href":"https:\/\/aamas2025.org\/index.php\/wp-json\/wp\/v2\/pages\/126"}],"collection":[{"href":"https:\/\/aamas2025.org\/index.php\/wp-json\/wp\/v2\/pages"}],"about":[{"href":"https:\/\/aamas2025.org\/index.php\/wp-json\/wp\/v2\/types\/page"}],"author":[{"embeddable":true,"href":"https:\/\/aamas2025.org\/index.php\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/aamas2025.org\/index.php\/wp-json\/wp\/v2\/comments?post=126"}],"version-history":[{"count":33,"href":"https:\/\/aamas2025.org\/index.php\/wp-json\/wp\/v2\/pages\/126\/revisions"}],"predecessor-version":[{"id":2461,"href":"https:\/\/aamas2025.org\/index.php\/wp-json\/wp\/v2\/pages\/126\/revisions\/2461"}],"up":[{"embeddable":true,"href":"https:\/\/aamas2025.org\/index.php\/wp-json\/wp\/v2\/pages\/116"}],"wp:attachment":[{"href":"https:\/\/aamas2025.org\/index.php\/wp-json\/wp\/v2\/media?parent=126"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}