% Journal article record (Journal of Beijing University of Posts and
% Telecommunications, vol. 42, no. 2, 2019).
% - Authors are separated with " and " as BibTeX requires; each name is
%   braced so it is kept as a single indivisible name.
% - doi holds the bare DOI; the journal landing page is kept in url.
% - The acronym in the title is braced to survive style re-casing.
% NOTE(review): publisher repeats the journal name, as in the original
% export; confirm the actual publisher or drop the field.
% NOTE(review): the citation key is non-ASCII and is kept for
% compatibility with existing citations; it needs a Unicode-aware
% backend such as Biber.
@article{孙松林:1,
  author    = {{孙松林} and {张昕然}},
  title     = {通信资源调度对称{MARL}问题策略估计误差分析},
  journal   = {北京邮电大学学报},
  publisher = {北京邮电大学学报},
  year      = {2019},
  volume    = {42},
  number    = {2},
  eid       = {1},
  pages     = {1--6},
  keywords  = {强化学习;对称多智能体强化学习;策略估计},
  doi       = {10.13190/j.jbupt.2018-121},
  url       = {https://journal.bupt.edu.cn/CN/10.13190/j.jbupt.2018-121},
}