mirror of
https://github.com/Andreaierardi/Master-DataScience-Notes.git
synced 2024-12-01 08:02:55 +01:00
130 lines
13 KiB
TeX
130 lines
13 KiB
TeX
\relax
|
||
\@nameuse{bbl@beforestart}
|
||
\babel@aux{english}{}
|
||
\@writefile{toc}{\contentsline {chapter}{\numberline {1}Lecture 1 - 09-03-2020}{5}\protected@file@percent }
|
||
\@writefile{lof}{\addvspace {10\p@ }}
|
||
\@writefile{lot}{\addvspace {10\p@ }}
|
||
\@writefile{toc}{\contentsline {section}{\numberline {1.1}Introduction of the course}{5}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {1.2}Examples}{5}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {1.2.1}Spam filtering}{8}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {chapter}{\numberline {2}Lecture 2 - 07-04-2020}{9}\protected@file@percent }
|
||
\@writefile{lof}{\addvspace {10\p@ }}
|
||
\@writefile{lot}{\addvspace {10\p@ }}
|
||
\@writefile{toc}{\contentsline {section}{\numberline {2.1}Argomento}{9}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {2.2}Loss}{9}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2.1}Absolute Loss}{9}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {2.1}{\ignorespaces Example of domain of $K_{NN}$}}{10}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2.2}Square Loss}{10}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {2.2}{\ignorespaces Example of domain of $K_{NN}$}}{10}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2.3}Example of information of square loss}{11}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2.4}labels and losses}{12}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2.5}Example TF(idf) documents encoding}{14}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {chapter}{\numberline {3}Lecture 3 - 07-04-2020}{16}\protected@file@percent }
|
||
\@writefile{lof}{\addvspace {10\p@ }}
|
||
\@writefile{lot}{\addvspace {10\p@ }}
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {3.1}{\ignorespaces Example of domain of $K_{NN}$}}{16}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {3.1}Overfitting}{18}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {3.1.1}Noise in the data}{18}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {3.2}Underfitting}{20}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {3.3}Nearest neighbour}{20}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {3.2}{\ignorespaces Example of domain of $K_{NN}$}}{21}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {3.3}{\ignorespaces Example of domain of $K_{NN}$}}{21}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {chapter}{\numberline {4}Lecture 4 - 07-04-2020}{23}\protected@file@percent }
|
||
\@writefile{lof}{\addvspace {10\p@ }}
|
||
\@writefile{lot}{\addvspace {10\p@ }}
|
||
\@writefile{toc}{\contentsline {section}{\numberline {4.1}Computing $h_{NN}$}{23}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {4.1}{\ignorespaces Example of domain of $K_{NN}$}}{24}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {4.2}Tree Predictor}{25}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {4.2}{\ignorespaces Example of domain of $K_{NN}$}}{25}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {4.3}{\ignorespaces Example of domain of $K_{NN}$}}{26}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {4.4}{\ignorespaces Example of domain of $K_{NN}$}}{27}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {4.5}{\ignorespaces Example of domain of $K_{NN}$}}{27}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {4.6}{\ignorespaces Example of domain of $K_{NN}$}}{27}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {4.7}{\ignorespaces Example of domain of $K_{NN}$}}{28}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {chapter}{\numberline {5}Lecture 5 - 07-04-2020}{29}\protected@file@percent }
|
||
\@writefile{lof}{\addvspace {10\p@ }}
|
||
\@writefile{lot}{\addvspace {10\p@ }}
|
||
\@writefile{toc}{\contentsline {section}{\numberline {5.1}Tree Classifier}{29}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {5.1}{\ignorespaces Example of domain of $K_{NN}$}}{29}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {5.2}{\ignorespaces Example of domain of $K_{NN}$}}{30}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {5.2}Jensen’s inequality}{31}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {5.3}{\ignorespaces Example of domain of $K_{NN}$}}{31}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {5.4}{\ignorespaces Example of domain of $K_{NN}$}}{31}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {5.5}{\ignorespaces Example of domain of $K_{NN}$}}{32}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {5.6}{\ignorespaces Example of domain of $K_{NN}$}}{33}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {5.7}{\ignorespaces Example of domain of $K_{NN}$}}{34}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {5.8}{\ignorespaces Example of domain of $K_{NN}$}}{34}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {5.9}{\ignorespaces Example of domain of $K_{NN}$}}{34}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {5.3}Tree Predictor}{35}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {5.10}{\ignorespaces Example of domain of $K_{NN}$}}{35}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {5.4}Statistical model for Machine Learning}{36}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {chapter}{\numberline {6}Lecture 6 - 07-04-2020}{38}\protected@file@percent }
|
||
\@writefile{lof}{\addvspace {10\p@ }}
|
||
\@writefile{lot}{\addvspace {10\p@ }}
|
||
\@writefile{toc}{\contentsline {section}{\numberline {6.1}Bayes Optimal Predictor}{38}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {6.1.1}Square Loss}{39}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {6.1}{\ignorespaces Example of domain of $K_{NN}$}}{39}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {6.1.2}Zero-one loss for binary classification}{40}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {6.2}{\ignorespaces Example of domain of $K_{NN}$}}{41}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {6.3}{\ignorespaces Example of domain of $K_{NN}$}}{41}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {6.4}{\ignorespaces Example of domain of $K_{NN}$}}{42}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {6.2}Bayes Risk}{43}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {6.5}{\ignorespaces Example of domain of $K_{NN}$}}{43}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {chapter}{\numberline {7}Lecture 7 - 07-04-2020}{45}\protected@file@percent }
|
||
\@writefile{lof}{\addvspace {10\p@ }}
|
||
\@writefile{lot}{\addvspace {10\p@ }}
|
||
\@writefile{toc}{\contentsline {section}{\numberline {7.1}Chernoff-Hoffding bound}{45}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {7.2}Union Bound}{46}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {7.1}{\ignorespaces Example}}{46}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {7.2}{\ignorespaces Example}}{47}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {7.3}{\ignorespaces Example}}{47}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {7.4}{\ignorespaces Example}}{48}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {7.5}{\ignorespaces Example}}{48}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {7.6}{\ignorespaces Draw of how $\hat {h}$, $h^*$ and $f^*$ are represented}}{49}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {7.3}Studying overfitting of a ERM}{50}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {chapter}{\numberline {8}Lecture 8 - 07-04-2020}{52}\protected@file@percent }
|
||
\@writefile{lof}{\addvspace {10\p@ }}
|
||
\@writefile{lot}{\addvspace {10\p@ }}
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {8.1}{\ignorespaces Representation of $\hat {h}$, $h^*$ and $f^*$ }}{52}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {8.2}{\ignorespaces Example}}{53}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {8.1}The problem of estimating risk in practise}{53}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {8.2}Cross-validation}{55}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {8.3}{\ignorespaces Splitting test and training set}}{55}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {8.4}{\ignorespaces K-folds}}{56}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {8.3}Nested cross validation}{57}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {8.5}{\ignorespaces Nested Cross Validation}}{57}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {chapter}{\numberline {9}Lecture 9 - 07-04-2020}{58}\protected@file@percent }
|
||
\@writefile{lof}{\addvspace {10\p@ }}
|
||
\@writefile{lot}{\addvspace {10\p@ }}
|
||
\@writefile{toc}{\contentsline {section}{\numberline {9.1}Tree predictors}{58}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {9.1}{\ignorespaces Tree building}}{58}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {9.2}{\ignorespaces Tree with at most N node}}{59}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {9.1.1}Catalan Number}{60}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {9.3}{\ignorespaces Algorithm for tree predictors}}{62}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {chapter}{\numberline {10}Lecture 10 - 07-04-2020}{64}\protected@file@percent }
|
||
\@writefile{lof}{\addvspace {10\p@ }}
|
||
\@writefile{lot}{\addvspace {10\p@ }}
|
||
\@writefile{toc}{\contentsline {section}{\numberline {10.1}TO BE DEFINE}{64}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {10.2}MANCANO 20 MINUTI DI LEZIONE}{64}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {10.1}{\ignorespaces Point (2) - where \hskip 1em\relax $y = cx +q$ \hskip 2em\relax $y = -cx +q $}}{66}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {10.3}Compare risk for zero-one loss}{66}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {10.2}{\ignorespaces Point}}{67}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {chapter}{\numberline {11}Lecture 11 - 20-04-2020}{68}\protected@file@percent }
|
||
\@writefile{lof}{\addvspace {10\p@ }}
|
||
\@writefile{lot}{\addvspace {10\p@ }}
|
||
\@writefile{toc}{\contentsline {section}{\numberline {11.1}Analysis of $K_{NN}$}{68}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {11.1}{\ignorespaces Example of domain of $K_{NN}$}}{68}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {11.2}{\ignorespaces Diagonal length}}{69}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {11.3}{\ignorespaces Shape of the function}}{70}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {11.1.1}Study of $K_{NN}$}{71}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {11.1.2}study of trees}{72}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {section}{\numberline {11.2}Non-parametric Algorithms}{73}\protected@file@percent }
|
||
\@writefile{lof}{\contentsline {figure}{\numberline {11.4}{\ignorespaces Parametric and non parametric growing as training set getting larger}}{74}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {subsection}{\numberline {11.2.1}Example of parametric algorithms}{74}\protected@file@percent }
|
||
\@writefile{toc}{\contentsline {chapter}{\numberline {12}Lecture 12 - 21-04-2020}{75}\protected@file@percent }
|
||
\@writefile{lof}{\addvspace {10\p@ }}
|
||
\@writefile{lot}{\addvspace {10\p@ }}
|
||
\@writefile{toc}{\contentsline {section}{\numberline {12.1}Non parametrics algorithms}{75}\protected@file@percent }
|
||
\bibstyle{abbrv}
|
||
\bibdata{main}
|