Fix Bellman equation <noupdate>

2026-02-04 07:41:43 +01:00 · 2024-06-10 11:10:56 +02:00
parent bd7c52ba15
commit 76ce62296c
1 changed files with 1 additions and 1 deletions
--- a/src/year1/cognition-and-neuroscience/module2/sections/_dopamine.tex
+++ b/src/year1/cognition-and-neuroscience/module2/sections/_dopamine.tex
@ -111,7 +111,7 @@
    \item[Bellman equation] \marginnote{Bellman equation}
        Given an action $a_t$ performed in the state $s_t$ following a policy $\pi$,
        the expected future reward is given by the following equation:
-        \[ Q_\pi(s_t, a_t) = r_t + \gamma \sum_{s_{t+1}} \prob{s_{t+1 | s_t, a_t}} Q_\pi(s_{t+1}, \pi(s_{t+1})) \]
+        \[ Q_\pi(s_t, a_t) = r_t + \gamma \sum_{s_{t+1}} \prob{s_{t+1} | s_t, a_t} Q_\pi(s_{t+1}, \pi(s_{t+1})) \]
        where $\gamma$ is a discount factor.
 \end{description}