mirror of
https://github.com/NotXia/unibo-ai-notes.git
synced 2025-12-14 18:51:52 +01:00
@ -39,7 +39,7 @@
\begin{description}
\item[Training]
Given the predicted distribution $\hat{\vec{y}}^{(t)}$ and ground-truth $\vec{y}^{(t)}$ at step $t$, the loss is computed as the cross-entropy:
\[ \mathcal{L}^{(t)}(\matr{\theta}) = - \sum_{v \in V} \vec{y}_v^{(t)} \log\left( \hat{\vec{y}}_v^{(t)} \right) \]
\begin{description}
\item[Teacher forcing] \marginnote{Teacher forcing}
@ -68,4 +68,4 @@
\item[Greedy] Select the token with the highest probability.
\item[Sampling] Randomly sample a token according to the probabilities of the output distribution.
\end{descriptionlist}
\end{description}
\end{description}
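As a minimal sketch of the ideas above, the following Python/NumPy snippet computes the per-step cross-entropy loss $\mathcal{L}^{(t)}$ and contrasts greedy and sampling decoding on a toy vocabulary. All concrete values (the vocabulary, the predicted distribution, the ground-truth token) are assumptions made up for illustration, not taken from the notes.

```python
import numpy as np

rng = np.random.default_rng(0)

# Hypothetical toy vocabulary V and softmax output y_hat^(t) at step t
# (assumed values, for illustration only).
vocab = ["the", "cat", "sat", "<eos>"]
y_hat = np.array([0.1, 0.6, 0.2, 0.1])

# One-hot ground truth y^(t): the correct token at this step is "cat".
# During training with teacher forcing, this ground-truth token (not the
# model's own prediction) would be fed as the next input.
y_true = np.array([0.0, 1.0, 0.0, 0.0])

# Cross-entropy at step t: L^(t) = -sum_{v in V} y_v * log(y_hat_v).
# With a one-hot target this reduces to -log of the true token's probability.
loss = -np.sum(y_true * np.log(y_hat))

# Greedy decoding: select the token with the highest probability.
greedy_token = vocab[int(np.argmax(y_hat))]

# Sampling decoding: draw a token according to the output distribution.
sampled_token = vocab[rng.choice(len(vocab), p=y_hat)]

print(f"loss={loss:.4f} greedy={greedy_token} sampled={sampled_token}")
```

Note that greedy decoding is deterministic given the distribution, while sampling can return any token with nonzero probability, which trades some per-step likelihood for output diversity.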