Add SMM finite numbers

2026-02-04 07:41:43 +01:00 · 2023-09-22 16:42:08 +02:00
parent f33ff9fa98
commit 0031937a19
7 changed files with 348 additions and 0 deletions
--- a/.gitignore
+++ b/.gitignore
@ -0,0 +1,8 @@
+*.synctex.gz
+*.log
+*.fls
+*.fdb_latexmk
+*.aux
+*.toc
+*.out
+[!_]*.pdf
--- a/statistical-and-mathematical-methods-for-ai/img/_inherent_error.pdf
+++ b/statistical-and-mathematical-methods-for-ai/img/_inherent_error.pdf
--- a/statistical-and-mathematical-methods-for-ai/img/floatingpoint_range.png
+++ b/statistical-and-mathematical-methods-for-ai/img/floatingpoint_range.png
--- a/statistical-and-mathematical-methods-for-ai/img/inherent_error.drawio
+++ b/statistical-and-mathematical-methods-for-ai/img/inherent_error.drawio
@ -0,0 +1,88 @@
+<mxfile host="app.diagrams.net" modified="2023-09-22T09:37:27.395Z" agent="Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:109.0) Gecko/20100101 Firefox/117.0" etag="3qzh6VvLSaXopiRghqnY" version="21.7.0" type="device">
+  <diagram name="Pagina-1" id="mETDQKEhh33VIil_YAIY">
+    <mxGraphModel dx="819" dy="401" grid="1" gridSize="10" guides="1" tooltips="1" connect="1" arrows="1" fold="1" page="1" pageScale="1" pageWidth="827" pageHeight="1169" math="0" shadow="0">
+      <root>
+        <mxCell id="0" />
+        <mxCell id="1" parent="0" />
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-1" value="" style="ellipse;whiteSpace=wrap;html=1;" parent="1" vertex="1">
+          <mxGeometry x="200" y="300" width="150" height="150" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-2" value="" style="ellipse;fillStyle=auto;fillColor=#99CCFF;" parent="1" vertex="1">
+          <mxGeometry x="280" y="340" width="10" height="10" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-3" value="" style="ellipse;fillColor=#99CCFF;" parent="1" vertex="1">
+          <mxGeometry x="280" y="400" width="10" height="10" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-4" value="U&amp;nbsp; " style="text;html=1;strokeColor=none;fillColor=none;align=right;verticalAlign=middle;whiteSpace=wrap;rounded=0;fontFamily=Times New Roman;fontSize=15;" parent="1" vertex="1">
+          <mxGeometry x="240" y="330" width="40" height="30" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-5" value="&lt;div align=&quot;right&quot;&gt;&lt;font style=&quot;font-size: 15px;&quot; face=&quot;Times New Roman&quot;&gt;&amp;nbsp;U&lt;/font&gt;&lt;font style=&quot;font-size: 15px;&quot; face=&quot;Times New Roman&quot;&gt;+ΔU&amp;nbsp; &lt;br&gt;&lt;/font&gt;&lt;/div&gt;" style="text;html=1;strokeColor=none;fillColor=none;align=right;verticalAlign=middle;whiteSpace=wrap;rounded=0;" parent="1" vertex="1">
+          <mxGeometry x="230" y="390" width="50" height="30" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-6" value="" style="ellipse;whiteSpace=wrap;html=1;" parent="1" vertex="1">
+          <mxGeometry x="420" y="300" width="150" height="150" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-7" value="" style="ellipse;fillStyle=auto;fillColor=#99CCFF;" parent="1" vertex="1">
+          <mxGeometry x="480" y="340" width="10" height="10" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-8" value="" style="ellipse;fillColor=#99CCFF;" parent="1" vertex="1">
+          <mxGeometry x="480" y="400" width="10" height="10" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-9" value="&amp;nbsp;V" style="text;html=1;strokeColor=none;fillColor=none;align=left;verticalAlign=middle;whiteSpace=wrap;rounded=0;fontFamily=Times New Roman;fontSize=15;" parent="1" vertex="1">
+          <mxGeometry x="490" y="330" width="50" height="30" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-10" value="&lt;div align=&quot;left&quot;&gt;&lt;font style=&quot;font-size: 15px;&quot; face=&quot;Times New Roman&quot;&gt;&amp;nbsp;V&lt;/font&gt;&lt;font style=&quot;font-size: 15px;&quot; face=&quot;Times New Roman&quot;&gt;+ΔV&amp;nbsp; &lt;br&gt;&lt;/font&gt;&lt;/div&gt;" style="text;html=1;strokeColor=none;fillColor=none;align=left;verticalAlign=middle;whiteSpace=wrap;rounded=0;" parent="1" vertex="1">
+          <mxGeometry x="490" y="390" width="50" height="30" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-11" value="" style="endArrow=classic;html=1;exitX=1;exitY=0.5;exitDx=0;exitDy=0;entryX=0;entryY=0.5;entryDx=0;entryDy=0;curved=1;" parent="1" source="AFoxFzemWGuV3oYDkwgm-2" target="AFoxFzemWGuV3oYDkwgm-7" edge="1">
+          <mxGeometry width="50" height="50" relative="1" as="geometry">
+            <mxPoint x="410" y="420" as="sourcePoint" />
+            <mxPoint x="460" y="370" as="targetPoint" />
+            <Array as="points">
+              <mxPoint x="390" y="310" />
+            </Array>
+          </mxGeometry>
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-12" value="" style="endArrow=classic;html=1;exitX=1;exitY=0.5;exitDx=0;exitDy=0;entryX=0;entryY=0.5;entryDx=0;entryDy=0;curved=1;" parent="1" source="AFoxFzemWGuV3oYDkwgm-3" target="AFoxFzemWGuV3oYDkwgm-8" edge="1">
+          <mxGeometry width="50" height="50" relative="1" as="geometry">
+            <mxPoint x="300" y="355" as="sourcePoint" />
+            <mxPoint x="530" y="355" as="targetPoint" />
+            <Array as="points">
+              <mxPoint x="390" y="360" />
+            </Array>
+          </mxGeometry>
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-13" value="&lt;font face=&quot;Times New Roman&quot; size=&quot;1&quot;&gt;&lt;i&gt;&lt;font style=&quot;font-size: 15px;&quot;&gt;f&lt;/font&gt;&lt;/i&gt;&lt;/font&gt;" style="text;html=1;strokeColor=none;fillColor=none;align=center;verticalAlign=middle;whiteSpace=wrap;rounded=0;" parent="1" vertex="1">
+          <mxGeometry x="330" y="290" width="110" height="30" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-15" value="" style="endArrow=none;dashed=1;html=1;dashPattern=1 3;strokeWidth=2;rounded=0;entryX=0.5;entryY=0;entryDx=0;entryDy=0;exitX=0.5;exitY=1;exitDx=0;exitDy=0;" parent="1" source="AFoxFzemWGuV3oYDkwgm-7" target="AFoxFzemWGuV3oYDkwgm-8" edge="1">
+          <mxGeometry width="50" height="50" relative="1" as="geometry">
+            <mxPoint x="450" y="380" as="sourcePoint" />
+            <mxPoint x="500" y="330" as="targetPoint" />
+          </mxGeometry>
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-16" value="" style="endArrow=none;dashed=1;html=1;dashPattern=1 3;strokeWidth=2;rounded=0;entryX=0.5;entryY=1;entryDx=0;entryDy=0;exitX=0.5;exitY=0;exitDx=0;exitDy=0;" parent="1" source="AFoxFzemWGuV3oYDkwgm-3" target="AFoxFzemWGuV3oYDkwgm-2" edge="1">
+          <mxGeometry width="50" height="50" relative="1" as="geometry">
+            <mxPoint x="270" y="410" as="sourcePoint" />
+            <mxPoint x="320" y="360" as="targetPoint" />
+          </mxGeometry>
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-17" value="&lt;font style=&quot;font-size: 15px;&quot; face=&quot;Times New Roman&quot;&gt;Δ&lt;/font&gt;U&amp;nbsp; " style="text;html=1;strokeColor=none;fillColor=none;align=right;verticalAlign=middle;whiteSpace=wrap;rounded=0;fontFamily=Times New Roman;fontSize=15;" parent="1" vertex="1">
+          <mxGeometry x="240" y="360" width="40" height="30" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-18" value="&lt;div align=&quot;left&quot;&gt;&lt;font style=&quot;font-size: 15px;&quot; face=&quot;Times New Roman&quot;&gt;&amp;nbsp;&lt;/font&gt;&lt;font style=&quot;font-size: 15px;&quot; face=&quot;Times New Roman&quot;&gt;ΔV&amp;nbsp; &lt;br&gt;&lt;/font&gt;&lt;/div&gt;" style="text;html=1;strokeColor=none;fillColor=none;align=left;verticalAlign=middle;whiteSpace=wrap;rounded=0;" parent="1" vertex="1">
+          <mxGeometry x="490" y="360" width="30" height="30" as="geometry" />
+        </mxCell>
+        <mxCell id="AFoxFzemWGuV3oYDkwgm-19" value="&lt;div align=&quot;left&quot;&gt;&lt;font style=&quot;font-size: 15px;&quot; face=&quot;Times New Roman&quot;&gt;Inherent error &lt;/font&gt;&lt;/div&gt;" style="text;html=1;strokeColor=none;fillColor=none;align=left;verticalAlign=middle;whiteSpace=wrap;rounded=0;" parent="1" vertex="1">
+          <mxGeometry x="580" y="355" width="90" height="40" as="geometry" />
+        </mxCell>
+        <mxCell id="x--qwbr77Wqyja1BnvlK-2" value="" style="endArrow=classic;html=1;rounded=0;entryX=1;entryY=0.5;entryDx=0;entryDy=0;exitX=0;exitY=0.5;exitDx=0;exitDy=0;strokeWidth=2;" edge="1" parent="1" source="AFoxFzemWGuV3oYDkwgm-19" target="AFoxFzemWGuV3oYDkwgm-18">
+          <mxGeometry width="50" height="50" relative="1" as="geometry">
+            <mxPoint x="600" y="375" as="sourcePoint" />
+            <mxPoint x="450" y="370" as="targetPoint" />
+          </mxGeometry>
+        </mxCell>
+      </root>
+    </mxGraphModel>
+  </diagram>
+</mxfile>
--- a/statistical-and-mathematical-methods-for-ai/img/machine_eps.png
+++ b/statistical-and-mathematical-methods-for-ai/img/machine_eps.png
--- a/statistical-and-mathematical-methods-for-ai/main.tex
+++ b/statistical-and-mathematical-methods-for-ai/main.tex
@ -0,0 +1,51 @@
+\documentclass[11pt]{article}
+\usepackage[margin=3cm]{geometry}
+\usepackage{graphicx}
+\usepackage{amsmath, amsfonts, amssymb, amsthm, mathtools}
+\usepackage{hyperref}
+\usepackage[nameinlink]{cleveref}
+\usepackage[all]{hypcap} % Links hyperref to object top and not caption
+\usepackage[inline]{enumitem}
+\usepackage{marginnote}
+
+\title{Statistical and Mathematical Methods for Artificial Intelligence}
+\date{2023 -- 2024}
+
+\hypersetup{
+    colorlinks,
+    citecolor=black,
+    filecolor=black,
+    linkcolor=black,
+    urlcolor=black,
+    linktoc=all
+}
+
+\setlist[description]{labelindent=\parindent}   % Indents `description`
+
+\newtheorem{example}{Example}[section]
+
+
+\begin{document}
+
+    \makeatletter
+    \begin{titlepage}
+        \centering
+        \vspace*{\fill}
+        \huge
+        \textbf{\@title}
+        \vspace*{\fill}
+
+        \Large
+        Academic Year \@date\\
+        Alma Mater Studiorum $\cdot$ University of Bologna
+        \vspace*{1cm}
+    \end{titlepage}
+    \makeatother
+    \pagenumbering{roman}
+    \tableofcontents
+    \newpage
+    \pagenumbering{arabic}
+
+    \input{sections/finite_numbers.tex}
+
+\end{document}
--- a/statistical-and-mathematical-methods-for-ai/sections/finite_numbers.tex
+++ b/statistical-and-mathematical-methods-for-ai/sections/finite_numbers.tex
@ -0,0 +1,201 @@
+\section{Finite numbers}
+
+
+
+\subsection{Sources of error}
+
+\begin{description}
+    \item[Measurement error] 
+        Precision of the measurement instrument.
+
+    \item[Arithmetic error] 
+        Propagation of rounding errors in each step of an algorithm.
+
+    \item[Truncation error] 
+        Approximating an infinite procedure with a finite number of iterations.
+
+    \item[Inherent error] 
+        Caused by the finite representation of the data (floating-point).
+        \begin{figure}[h]
+            \centering
+            \includegraphics[width=0.6\textwidth]{img/_inherent_error.pdf}
+            \caption{Inherent error visualization}
+        \end{figure}
+\end{description}
+
+
+
+\subsection{Error measurement}
+
+Let $x$ be a value and $\hat{x}$ its approximation. Then:
+\begin{description}
+    \item[Absolute error] 
+        \begin{equation}
+            E_{a} = \hat{x} - x
+        \end{equation}
+        Note that, out of context, the absolute error is meaningless.
+    \item[Relative error] 
+        \begin{equation}
+            E_{r} = \frac{\hat{x} - x}{x}
+        \end{equation}
+\end{description}
+
+
+
+\subsection{Representation in base \texorpdfstring{$\beta$}{B}}
+
+Let $\beta \in \mathbb{N}_{> 1}$ be the base.
+Each $x \in \mathbb{R} \smallsetminus \{0\}$ can be uniquely represented as:
+\begin{equation} \label{eq:finnum_b_representation}
+    x = \texttt{sign}(x) \cdot (d_1\beta^{-1} + d_2\beta^{-2} + \dots + d_n\beta^{-n} + \dots)\beta^p
+\end{equation}
+where:
+\begin{itemize}
+    \item $0 \leq d_i \leq \beta-1$
+    \item $d_1 \neq 0$
+    \item starting from an index $i$, not all $d_j$ ($j \geq i$) are equal to $\beta-1$
+\end{itemize}
+%
+\Cref{eq:finnum_b_representation} can be represented using the normalized scientific notation as:
+\begin{equation}
+    x = \pm (0.d_1d_2\dots) \beta^p
+\end{equation}
+where $0.d_1d_2\dots$ is the \textbf{mantissa} and $p$ the \textbf{exponent}.
+
+
+
+\subsection{Floating-point}
+
+A floating-point system $\mathcal{F}(\beta, t, L, U)$ is defined by the parameters:
+\begin{itemize}
+    \item $\beta$: base
+    \item $t$: precision (number of digits in the mantissa)
+    \item $[L, U]$: range of the exponent
+\end{itemize}
+%
+Each $x \in \mathcal{F}(\beta, t, L, U)$ can be represented in its normalized form:
+\begin{eqnarray}
+    x = \pm (0.d_1d_2 \dots d_t) \beta^p & L \leq p \leq U
+\end{eqnarray}
+\begin{example}
+    In $\mathcal{F}(10, 5, -3, 3)$, $x=12.\bar{3}$ is represented as:
+    \begin{equation*}
+        \texttt{fl}(x) = + 0.12333 \cdot 10^2
+    \end{equation*}
+\end{example}
+
+
+\subsubsection{Numbers distribution}
+Given a floating-point system $\mathcal{F}(\beta, t, L, U)$, the total amount of representable numbers is:
+\begin{equation*}
+    2(\beta-1) \beta^{t-1} (U-L+1)+1
+\end{equation*}
+%
+Representable numbers are more sparse towards the exponent upper bound and more dense towards the lower bound.
+It must be noted that there is an underflow area around 0.
+\begin{figure}[h]
+    \centering
+    \includegraphics[width=0.8\textwidth]{img/floatingpoint_range.png}
+    \caption{Floating-point numbers in $\mathcal{F}(2, 3, -1, 2)$}
+\end{figure}
+
+
+\subsubsection{Numbers representation}
+Given a floating-point system $\mathcal{F}(\beta, t, L, U)$, the representation of $x \in \mathbb{R}$ can result in:
+\begin{description}
+    \item[Exact representation] 
+        if $p \in [L, U]$ and $d_i=0$ for $i>t$.
+
+    \item[Approximation] 
+        if $p \in [L, U]$ but $d_i$ may not be 0 for $i>t$. 
+        In this case, the representation is obtained by truncating or rounding the value.
+
+    \item[Underflow] 
+        if $p < L$. In this case, the value is approximated as 0.
+
+    \item[Overflow] 
+        if $p > U$. In this case, an exception is usually raised.
+\end{description}
+
+
+\subsubsection{Machine precision}
+Machine precision $\varepsilon_{\text{mach}}$ determines the accuracy of a floating-point system.
+Depending on the approximation approach, machine precision can be computed as:
+\begin{description}
+    \item[Truncation] $\varepsilon_{\text{mach}} = \beta^{1-t}$
+    \item[Rounding] $\varepsilon_{\text{mach}} = \frac{1}{2}\beta^{1-t}$
+\end{description}
+Therefore, rounding results in more accurate representations.
+
+$\varepsilon_{\text{mach}}$ is the smallest distance among the representable numbers (\Cref{fig:finnum_eps}).
+\begin{figure}[h]
+    \centering
+    \includegraphics[width=0.2\textwidth]{img/machine_eps.png}
+    \caption{Visualization of $\varepsilon_{\text{mach}}$ in $\mathcal{F}(2, 3, -1, 2)$}
+    \label{fig:finnum_eps}
+\end{figure}\\
+%
+Alternatively, $\varepsilon_{\text{mach}}$ can be defined as the smallest representable number such that:
+\begin{equation*}
+    \texttt{fl}(1 + \varepsilon_{\text{mach}}) > 1.
+\end{equation*}
+
+
+\subsubsection{IEEE standard}
+IEEE 754 defines two floating-point formats:
+\begin{description}
+    \item[Single precision] Stored in 32 bits. Represents the system $\mathcal{F}(2, 24, -128, 127)$.
+        \begin{center}
+            \small
+            \begin{tabular}{|c|c|c|}
+                \hline
+                1 (sign) & 8 (exponent) & 23 (mantissa) \\
+                \hline
+            \end{tabular}
+        \end{center}
+
+    \item[Double precision] Stored in 64 bits. Represents the system $\mathcal{F}(2, 53, -1024, 1023)$.
+        \begin{center}
+            \small
+            \begin{tabular}{|c|c|c|}
+                \hline
+                1 (sign) & 11 (exponent) & 52 (mantissa) \\
+                \hline
+            \end{tabular}
+        \end{center}
+\end{description}
+As the first digit of the mantissa is always 1, it does not need to be stored.
+Moreover, special configurations are reserved to represent \texttt{Inf} and \texttt{NaN}.
+
+
+\subsubsection{Floating-point arithmetic}
+Let:
+\begin{itemize}
+    \item $+: \mathbb{R} \times \mathbb{R} \rightarrow \mathbb{R}$ be a real numbers operation.
+    \item $\oplus: \mathcal{F} \times \mathcal{F} \rightarrow \mathcal{F}$ be the corresponding operation in a floating-point system.
+\end{itemize}
+%
+To compute $x \oplus y$, a machine:
+\begin{enumerate}
+    \item Calculates $x + y$ in a high precision register (still approximated, but more precise than the storing system)
+    \item Stores the result as $\texttt{fl}(x + y)$
+\end{enumerate}
+
+A floating-point operation causes a small rounding error:
+\begin{equation}
+    \left\Vert \frac{(x \oplus y) - (x + y)}{x+y} \right\Vert < \varepsilon_{\text{mach}}
+\end{equation}
+%
+However, some operations may be subject to the \textbf{cancellation} problem, which causes information loss.
+\begin{example}
+    Given $x = 1$ and $y = 1 \cdot 10^{-16}$, we want to compute $x + y$ in $\mathcal{F}(10, 16, L, U)$.\\
+    \begin{equation*}
+        \begin{split}
+            z & = \texttt{fl}(x) + \texttt{fl}(y) \\
+              & = 0.1 \cdot 10^1 + 0.1 \cdot 10^{-15} \\
+              & = (0.1 + 0.\overbrace{0\dots0}^{\mathclap{16\text{ zeros}}}1) \cdot 10^1 \\
+              & = 0.1\overbrace{0\dots0}^{\mathclap{15\text{ zeros}}}1 \cdot 10^1
+        \end{split}
+    \end{equation*}
+    Then, we have that $\texttt{fl}(z) = 0.1\overbrace{0\dots0}^{\mathclap{15\text{ zeros}}} \cdot 10^1 = 1 = x$.
+\end{example}