# encoding:utf-8
% Bibliography database. Layout: one entry per block, one field per line.
% Text outside of entries (such as these lines) is ignored by BibTeX.
% Brace-protected words inside titles (proper nouns, acronyms, single-letter
% symbols) keep their capitalisation under styles that sentence-case titles.

@article{peters2019ergodicity,
  title     = {The ergodicity problem in economics},
  author    = {Peters, Ole},
  journal   = {Nature Physics},
  volume    = {15},
  number    = {12},
  pages     = {1216--1221},
  year      = {2019},
  publisher = {Nature Publishing Group}
}

@inproceedings{boyan1996learning,
  title     = {Learning evaluation functions for large acyclic domains},
  author    = {Boyan, Justin A and Moore, Andrew W},
  booktitle = {Proceedings of the Thirteenth International Conference on Machine Learning},
  pages     = {63--70},
  year      = {1996}
}

@article{boyan2002technical,
  title     = {Technical update: Least-squares temporal difference learning},
  author    = {Boyan, Justin A},
  journal   = {Machine Learning},
  volume    = {49},
  number    = {2--3},
  pages     = {233--246},
  year      = {2002},
  publisher = {Springer}
}

@article{pakes1969some,
  title     = {Some conditions for ergodicity and recurrence of {Markov} chains},
  author    = {Pakes, Anthony G},
  journal   = {Operations Research},
  volume    = {17},
  number    = {6},
  pages     = {1058--1061},
  year      = {1969},
  publisher = {INFORMS}
}

@article{kaplan1979sufficient,
  title     = {A sufficient condition of nonergodicity of a {Markov} chain (Corresp.)},
  author    = {Kaplan, Michael},
  journal   = {IEEE Transactions on Information Theory},
  volume    = {25},
  number    = {4},
  pages     = {470--471},
  year      = {1979},
  publisher = {IEEE}
}

@article{wiewiora2003potential,
  title   = {Potential-based shaping and {Q-value} initialization are equivalent},
  author  = {Wiewiora, Eric},
  journal = {Journal of Artificial Intelligence Research},
  volume  = {19},
  pages   = {205--208},
  year    = {2003}
}

@inproceedings{devlin2012dynamic,
  title        = {Dynamic potential-based reward shaping},
  author       = {Devlin, Sam Michael and Kudenko, Daniel},
  booktitle    = {11th International Conference on Autonomous Agents and Multiagent Systems (AAMAS 2012)},
  pages        = {433--440},
  year         = {2012},
  organization = {IFAAMAS}
}

@misc{abdelkader20152048,
  title  = {2048 is {NP-Complete}},
  author = {Abdelkader, Ahmed and Acharya, Aditya and Dasler, Philip},
  year   = {2015}
}

@incollection{bangole2023game,
  title     = {Game Playing (2048) Using Deep Neural Networks},
  author    = {Bangole, Narendra Kumar Rao and Moulya, R. B. and Pranthi, R and Reddy, Sreelekha and Namratha, R},
  booktitle = {The Software Principles of Design for Data Modeling},
  pages     = {133--144},
  year      = {2023},
  publisher = {IGI Global}
}

@inproceedings{matsuzaki2020further,
  title     = {A further investigation of neural network players for game 2048},
  author    = {Matsuzaki, Kiminori},
  booktitle = {Advances in Computer Games: 16th International Conference, ACG 2019, Macao, China, August 11--13, 2019, Revised Selected Papers},
  pages     = {53--65},
  year      = {2020},
  publisher = {Springer}
}

@inproceedings{majeed2018q,
  title     = {On {Q-learning} Convergence for {Non-Markov} Decision Processes},
  author    = {Majeed, Sultan Javed and Hutter, Marcus},
  booktitle = {{IJCAI}},
  volume    = {18},
  pages     = {2546--2552},
  year      = {2018}
}

@article{guei2021optimistic,
  title     = {Optimistic temporal difference learning for 2048},
  author    = {Guei, Hung and Chen, Lung-Pin and Wu, I-Chen},
  journal   = {IEEE Transactions on Games},
  volume    = {14},
  number    = {3},
  pages     = {478--487},
  year      = {2022},
  publisher = {IEEE}
}

@inproceedings{rodgers2014an,
  title        = {An investigation into 2048 {AI} strategies},
  author       = {Rodgers, Philip and Levine, John},
  booktitle    = {2014 IEEE Conference on Computational Intelligence and Games},
  pages        = {1--2},
  year         = {2014},
  organization = {IEEE}
}

@inproceedings{szubert2014temporal,
  title        = {Temporal difference learning of n-tuple networks for the game 2048},
  author       = {Szubert, Marcin and Ja{\'s}kowski, Wojciech},
  booktitle    = {2014 IEEE Conference on Computational Intelligence and Games},
  pages        = {1--8},
  year         = {2014},
  organization = {IEEE}
}

@article{jaskowski2017mastering,
  title     = {Mastering 2048 with delayed temporal coherence learning, multistage weight promotion, redundant encoding, and carousel shaping},
  author    = {Ja{\'s}kowski, Wojciech},
  journal   = {IEEE Transactions on Games},
  volume    = {10},
  number    = {1},
  pages     = {3--14},
  year      = {2017},
  publisher = {IEEE}
}

@article{yeh2016multistage,
  title     = {Multistage temporal difference learning for 2048-like games},
  author    = {Yeh, Kun-Hao and Wu, I-Chen and Hsueh, Chu-Hsuan and Chang, Chia-Chuan and Liang, Chao-Chin and Chiang, Han},
  journal   = {IEEE Transactions on Computational Intelligence and AI in Games},
  volume    = {9},
  number    = {4},
  pages     = {369--380},
  year      = {2016},
  publisher = {IEEE}
}

@inproceedings{wu2014multi,
  title     = {Multi-stage temporal difference learning for 2048},
  author    = {Wu, I-Chen and Yeh, Kun-Hao and Liang, Chao-Chin and Chang, Chia-Chuan and Chiang, Han},
  booktitle = {Technologies and Applications of Artificial Intelligence: 19th International Conference, TAAI 2014, Taipei, Taiwan, November 21--23, 2014. Proceedings},
  pages     = {366--378},
  year      = {2014},
  publisher = {Springer}
}

@article{kondo2019playing,
  title     = {Playing game 2048 with deep convolutional neural networks trained by supervised learning},
  author    = {Kondo, Naoki and Matsuzaki, Kiminori},
  journal   = {Journal of Information Processing},
  volume    = {27},
  pages     = {340--347},
  year      = {2019},
  publisher = {Information Processing Society of Japan}
}

@inproceedings{matsuzaki2017developing,
  title     = {Developing a 2048 player with backward temporal coherence learning and restart},
  author    = {Matsuzaki, Kiminori},
  booktitle = {Advances in Computer Games: 15th International Conferences, ACG 2017, Leiden, The Netherlands, July 3--5, 2017, Revised Selected Papers},
  pages     = {176--187},
  year      = {2017},
  publisher = {Springer}
}

@inproceedings{matsuzaki2016systematic,
  title        = {Systematic selection of {N-tuple} networks with consideration of interinfluence for game 2048},
  author       = {Matsuzaki, Kiminori},
  booktitle    = {2016 Conference on Technologies and Applications of Artificial Intelligence (TAAI)},
  pages        = {186--193},
  year         = {2016},
  organization = {IEEE}
}

@inproceedings{oka2016systematic,
  title     = {Systematic selection of {N-tuple} networks for 2048},
  author    = {Oka, Kazuto and Matsuzaki, Kiminori},
  booktitle = {International Conference on Computers and Games},
  pages     = {81--92},
  year      = {2016},
  publisher = {Springer}
}

@article{matsuzaki2021developing,
  title     = {Developing value networks for game 2048 with reinforcement learning},
  author    = {Matsuzaki, Kiminori},
  journal   = {Journal of Information Processing},
  volume    = {29},
  pages     = {336--346},
  year      = {2021},
  publisher = {Information Processing Society of Japan}
}

@book{Sutton2018book,
  author    = {Sutton, Richard S. and Barto, Andrew G.},
  edition   = {Second},
  publisher = {The MIT Press},
  title     = {Reinforcement Learning: An Introduction},
  year      = {2018}
}