Merge branch 'master' of http://62.234.201.16/hao/AAAI21_Emergent_language

a39f832c · haoyifan · 442e08c8 · a1e0bd69 · a39f832c
Commit a39f832c authored Sep 10, 2020 by haoyifan
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 1 addition and 1 deletion

AAAI2021/tex/theory.tex
+1 -1

No files found.
--- a/AAAI2021/tex/theory.tex
+++ b/AAAI2021/tex/theory.tex
@@ -45,7 +45,7 @@
 		\STATE $P(\hat{t}|s) = \pi^L_{old}(\hat{t}|s)$ 
 		\STATE Sample $\hat{t}$ with $P(\hat{t}|s)$
 		\STATE Get reward $r(\hat{t},t)$
-		\STATE $J(\theta^S,\theta^L)=E_{\pi_{old}^S,\pi^L}[r(\hat{t},t)\cdot\frac{\pi^L(s|t)}{\pi^L_{old}(s|t)}]$
+		\STATE $J(\theta^S,\theta^L)=E_{\pi^S,\pi_{old}^L}[r(\hat{t},t)\cdot\frac{\pi^L(\hat{t}|s)}{\pi^L_{old}(\hat{t}|s)}]$
 		\STATE Update $\theta^L$ by $\bigtriangledown_{\theta^L}J$
 		\ENDFOR
 		\STATE $\pi_{old}^L\leftarrow \pi^L$