From 8783cf0272ddbcda55095b9872ccf4f72ca0d3bc Mon Sep 17 00:00:00 2001 From: Lenovo Date: Mon, 3 Jun 2024 13:52:09 +0800 Subject: [PATCH] 再补一句 --- document.tex | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/document.tex b/document.tex index 171700a..7ac46a9 100644 --- a/document.tex +++ b/document.tex @@ -91,10 +91,13 @@ do not explicitly utilize exploration strategies We proved that the 2048 game is acyclic between non-absorbing states. This is the fundamental reason why explicit exploration cannot be employed in the 2048 game. + Compared to explicit exploration strategies, + backward learning, restart, and optimistic initialization + are more suitable for acyclic MDPs or MDPs with acyclic structures. \end{abstract} \begin{IEEEkeywords} -Acyclicity, 2048 game, ergodicity, backward learning. +Acyclicity, 2048 game, ergodicity, exploration, backward learning. \end{IEEEkeywords} -- libgit2 0.26.0