mirror of
https://github.com/NotXia/unibo-ai-notes.git
synced 2026-02-04 07:41:43 +01:00
@ -190,7 +190,7 @@
|
|||||||
This is equivalent to computing the probability of the whole sentence, which expanded using the chain rule becomes:
|
This is equivalent to computing the probability of the whole sentence, which expanded using the chain rule becomes:
|
||||||
\[
|
\[
|
||||||
\begin{split}
|
\begin{split}
|
||||||
\prob{w_1, \dots, w_{i-1} w_i} &= \prob{w_1} \prob{w_2 | w_1} \prob{w_3 | w_{1..2}} \dots \prob{w_n | w_{1..n-1}} \\
|
\prob{w_1, \dots, w_{n-1}, w_n} &= \prob{w_1} \prob{w_2 | w_1} \prob{w_3 | w_{1..2}} \dots \prob{w_n | w_{1..n-1}} \\
|
||||||
&= \prod_{i=1}^{n} \prob{w_i | w_{1..i-1}}
|
&= \prod_{i=1}^{n} \prob{w_i | w_{1..i-1}}
|
||||||
\end{split}
|
\end{split}
|
||||||
\]
|
\]
|
||||||
@ -224,7 +224,7 @@
|
|||||||
\begin{description}
|
\begin{description}
|
||||||
\item[Estimating $\mathbf{N}$-gram probabilities]
|
\item[Estimating $\mathbf{N}$-gram probabilities]
|
||||||
Consider the bigram case, the probability that a token $w_i$ follows $w_{i-1}$ can be determined through counting:
|
Consider the bigram case, the probability that a token $w_i$ follows $w_{i-1}$ can be determined through counting:
|
||||||
\[ \prob{w_i | w_{i-1}} = \frac{\texttt{count}(w_{i-1} w_i)}{\texttt{count}(w_{i-1})} \]
|
\[ \prob{w_i | w_{i-1}} = \frac{\texttt{count}(w_{i-1}, w_i)}{\texttt{count}(w_{i-1})} \]
|
||||||
\end{description}
|
\end{description}
|
||||||
|
|
||||||
\begin{remark}
|
\begin{remark}
|
||||||
@ -378,4 +378,4 @@ Only for $n$-grams that occur enough times a representative probability can be e
|
|||||||
c^* = \big( \texttt{count}(w_{i-1}w_i) + 1 \big) \frac{\texttt{count}(w_{i-1})}{\texttt{count}(w_{i-1}) + \vert V \vert}
|
c^* = \big( \texttt{count}(w_{i-1}w_i) + 1 \big) \frac{\texttt{count}(w_{i-1})}{\texttt{count}(w_{i-1}) + \vert V \vert}
|
||||||
\]
|
\]
|
||||||
\end{example}
|
\end{example}
|
||||||
\end{description}
|
\end{description}
|
||||||
|
|||||||
Reference in New Issue
Block a user