Update Experimental Framework.tex

3182787f · Ruizhi Chen · 3c299656 · 3182787f
Commit 3182787f authored Sep 10, 2020 by Ruizhi Chen
Hide whitespace changes
Inline Side-by-side

Showing with 1 additions and 1 deletions

AAAI2021/tex/Experimental Framework.tex
+1 -1

No files found.
--- a/AAAI2021/tex/Experimental Framework.tex
+++ b/AAAI2021/tex/Experimental Framework.tex
@@ -51,7 +51,7 @@ Unlike previous studies[][], the agents in this paper are totally independent. I
 		\STATE $P(\hat{t}|s) = \pi^L_{old}(\hat{t}|s)$ 
 		\STATE Sample $\hat{t}$ with $P(\hat{t}|s)$
 		\STATE Get reward $R(\hat{t},t)$
-		\STATE $J(\theta^S,\theta^L)=E_{\pi_{old}^S,\pi^L}[R(\hat{t},t)\cdot\frac{\pi^L(s|t)}{\pi^L_{old}(s|t)}]$
+		\STATE $J(\theta^S,\theta^L)=E_{\pi^S,\pi_{old}^L}[R(\hat{t},t)\cdot\frac{\pi^L(\hat{t}|s)}{\pi^L_{old}(\hat{t}|s)}]$
 		\STATE Update $\theta^L$ by $\nabla_{\theta^L}J$
 		\ENDFOR
 		\STATE $\pi_{old}^L\leftarrow \pi^L$