Skip to content

Commit 9183ee8

Browse files
committed
updated classes 0 1 and 2
1 parent 7fceda1 commit 9183ee8

11 files changed

+249
-73
lines changed

0 - Introduction/pres.pdf

166 Bytes
Binary file not shown.

0 - Introduction/pres.tex

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -335,7 +335,7 @@
335335
\makecell[{{p{0.27\textwidth}}}]{\centering $\{(x,y)\}$} & \makecell[{{p{0.27\textwidth}}}]{\centering $\{x\}$} & \makecell[{{p{0.27\textwidth}}}]{\centering $\{(x,u,r,x')\}$}\\
336336
\hline
337337
\makecell[{{p{0.07\textwidth}}}]{\textbf{Sub-task}} &
338-
\makecell[{{p{0.27\textwidth}}}]{\centering Classification, Regression} & \makecell[{{p{0.27\textwidth}}}]{\centering Clustering, Density estimation, Dimensionnality reduction} & \makecell[{{p{0.27\textwidth}}}]{\centering Value estimation, Policy optimization}\\
338+
\makecell[{{p{0.27\textwidth}}}]{\centering Classification, Regression} & \makecell[{{p{0.27\textwidth}}}]{\centering Clustering, Density estimation, Dimensionality reduction} & \makecell[{{p{0.27\textwidth}}}]{\centering Value estimation, Policy optimization}\\
339339
\hline
340340
\makecell[{{p{0.07\textwidth}}}]{\textbf{Algo ex.}} &
341341
\makecell[{{p{0.27\textwidth}}}]{\centering Neural Networks, SVM, Random Forests} & \makecell[{{p{0.27\textwidth}}}]{\centering k-means, PCA, HCA} & \makecell[{{p{0.27\textwidth}}}]{\centering Q-learning}\\
@@ -364,7 +364,7 @@
364364
~\\
365365
\underline{Ability to fit the training data (regression):}
366366
\begin{itemize}
367-
\item Mean Square Error, \href{https://en.wikipedia.org/wiki/Coefficient_of_determination}{coeffient of determination}.
367+
\item Mean Square Error, \href{https://en.wikipedia.org/wiki/Coefficient_of_determination}{coefficient of determination}.
368368
$$MSE = \frac{1}{N}\sum_i \left(y_i - f(x_i)\right)^2$$
369369
$$R^2 = 1-\frac{\sum_i \left(y_i - f(x_i)\right)^2}{\sum_i \left(y_i - \bar{y}\right)^2}$$
370370
\end{itemize}
@@ -407,7 +407,7 @@
407407
\item ML Notions:
408408
\begin{itemize}
409409
\item maximize margin
410-
\item minimize difference btw class distributions (cross-entropy)
410+
\item minimize difference between class distributions (cross-entropy \href{https://en.wikipedia.org/wiki/Cross_entropy}{[link]})
411411
\end{itemize}
412412
\end{itemize}
413413
$$H(p,\hat{p}) = -\sum_i p(x_i) \log (\hat{p}(x_i)) = -\mathbb{E}_p \left(\log(\hat{p})\right)$$
@@ -472,7 +472,7 @@
472472
Back to the example of Predictive Maintenance tasks.
473473
\begin{itemize}
474474
\item Visualizing system state\\
475-
\hspace{1cm} $\rightarrow$ Dimensionnality reduction (Unsupervized learning)
475+
\hspace{1cm} $\rightarrow$ Dimensionality reduction (Unsupervised learning)
476476
\item Detecting anomalies\\
477477
\hspace{1cm} $\rightarrow$ Density estimation (Unsupervised learning)
478478
\item Predicting RUL or TTF\\
708 KB
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
293 KB
Binary file not shown.
Binary file not shown.

1 - Unsupervized Learning/Unsupervized Learning.ipynb

Lines changed: 135 additions & 47 deletions
Large diffs are not rendered by default.

2 - Text data preprocessing/Text data preprocessing.ipynb

Lines changed: 95 additions & 19 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,15 @@
11
{
22
"cells": [
3+
{
4+
"cell_type": "markdown",
5+
"metadata": {
6+
"toc": true
7+
},
8+
"source": [
9+
"<h1>Table of Contents<span class=\"tocSkip\"></span></h1>\n",
10+
"<div class=\"toc\"><ul class=\"toc-item\"><li><span><a href=\"#1.-Load-the-data\" data-toc-modified-id=\"1.-Load-the-data-1\"><span class=\"toc-item-num\">1&nbsp;&nbsp;</span>1. Load the data</a></span></li><li><span><a href=\"#2.-Filtering-out-the-noise\" data-toc-modified-id=\"2.-Filtering-out-the-noise-2\"><span class=\"toc-item-num\">2&nbsp;&nbsp;</span>2. Filtering out the noise</a></span></li><li><span><a href=\"#3.-Even-better-filtering\" data-toc-modified-id=\"3.-Even-better-filtering-3\"><span class=\"toc-item-num\">3&nbsp;&nbsp;</span>3. Even better filtering</a></span></li><li><span><a href=\"#4.-Term-frequency-times-inverse-document-frequency\" data-toc-modified-id=\"4.-Term-frequency-times-inverse-document-frequency-4\"><span class=\"toc-item-num\">4&nbsp;&nbsp;</span>4. Term frequency times inverse document frequency</a></span></li><li><span><a href=\"#5.-Utility-function\" data-toc-modified-id=\"5.-Utility-function-5\"><span class=\"toc-item-num\">5&nbsp;&nbsp;</span>5. Utility function</a></span></li></ul></div>"
11+
]
12+
},
313
{
414
"cell_type": "markdown",
515
"metadata": {},
@@ -40,8 +50,13 @@
4050
},
4151
{
4252
"cell_type": "code",
43-
"execution_count": 2,
44-
"metadata": {},
53+
"execution_count": 1,
54+
"metadata": {
55+
"ExecuteTime": {
56+
"end_time": "2018-10-08T13:52:39.328796Z",
57+
"start_time": "2018-10-08T13:52:39.172635Z"
58+
}
59+
},
4560
"outputs": [
4661
{
4762
"name": "stdout",
@@ -93,8 +108,13 @@
93108
},
94109
{
95110
"cell_type": "code",
96-
"execution_count": 3,
97-
"metadata": {},
111+
"execution_count": 2,
112+
"metadata": {
113+
"ExecuteTime": {
114+
"end_time": "2018-10-08T13:52:47.404302Z",
115+
"start_time": "2018-10-08T13:52:42.691109Z"
116+
}
117+
},
98118
"outputs": [],
99119
"source": [
100120
"from sklearn.feature_extraction.text import CountVectorizer\n",
@@ -104,8 +124,13 @@
104124
},
105125
{
106126
"cell_type": "code",
107-
"execution_count": 4,
108-
"metadata": {},
127+
"execution_count": 3,
128+
"metadata": {
129+
"ExecuteTime": {
130+
"end_time": "2018-10-08T13:52:49.004851Z",
131+
"start_time": "2018-10-08T13:52:48.926879Z"
132+
}
133+
},
109134
"outputs": [
110135
{
111136
"name": "stdout",
@@ -145,8 +170,13 @@
145170
},
146171
{
147172
"cell_type": "code",
148-
"execution_count": 5,
149-
"metadata": {},
173+
"execution_count": 4,
174+
"metadata": {
175+
"ExecuteTime": {
176+
"end_time": "2018-10-08T13:52:58.115382Z",
177+
"start_time": "2018-10-08T13:52:51.966698Z"
178+
}
179+
},
150180
"outputs": [],
151181
"source": [
152182
"from nltk import wordpunct_tokenize \n",
@@ -181,8 +211,12 @@
181211
},
182212
{
183213
"cell_type": "code",
184-
"execution_count": 6,
214+
"execution_count": 5,
185215
"metadata": {
216+
"ExecuteTime": {
217+
"end_time": "2018-10-08T13:52:58.148578Z",
218+
"start_time": "2018-10-08T13:52:58.117096Z"
219+
},
186220
"scrolled": true
187221
},
188222
"outputs": [
@@ -216,8 +250,12 @@
216250
},
217251
{
218252
"cell_type": "code",
219-
"execution_count": 7,
253+
"execution_count": 6,
220254
"metadata": {
255+
"ExecuteTime": {
256+
"end_time": "2018-10-08T13:53:01.283024Z",
257+
"start_time": "2018-10-08T13:53:01.261090Z"
258+
},
221259
"scrolled": false
222260
},
223261
"outputs": [
@@ -320,16 +358,21 @@
320358
},
321359
{
322360
"cell_type": "code",
323-
"execution_count": 8,
324-
"metadata": {},
361+
"execution_count": 7,
362+
"metadata": {
363+
"ExecuteTime": {
364+
"end_time": "2018-10-08T13:53:06.126250Z",
365+
"start_time": "2018-10-08T13:53:06.102174Z"
366+
}
367+
},
325368
"outputs": [
326369
{
327370
"data": {
328371
"text/plain": [
329372
"(2893, 14279)"
330373
]
331374
},
332-
"execution_count": 8,
375+
"execution_count": 7,
333376
"metadata": {},
334377
"output_type": "execute_result"
335378
}
@@ -349,8 +392,13 @@
349392
},
350393
{
351394
"cell_type": "code",
352-
"execution_count": 9,
353-
"metadata": {},
395+
"execution_count": 8,
396+
"metadata": {
397+
"ExecuteTime": {
398+
"end_time": "2018-10-08T13:53:08.606440Z",
399+
"start_time": "2018-10-08T13:53:08.601960Z"
400+
}
401+
},
354402
"outputs": [
355403
{
356404
"name": "stdout",
@@ -427,8 +475,13 @@
427475
},
428476
{
429477
"cell_type": "code",
430-
"execution_count": 10,
431-
"metadata": {},
478+
"execution_count": 9,
479+
"metadata": {
480+
"ExecuteTime": {
481+
"end_time": "2018-10-08T13:53:15.239967Z",
482+
"start_time": "2018-10-08T13:53:11.837369Z"
483+
}
484+
},
432485
"outputs": [],
433486
"source": [
434487
"import load_spam\n",
@@ -438,8 +491,13 @@
438491
},
439492
{
440493
"cell_type": "code",
441-
"execution_count": 11,
442-
"metadata": {},
494+
"execution_count": 10,
495+
"metadata": {
496+
"ExecuteTime": {
497+
"end_time": "2018-10-08T13:53:16.164299Z",
498+
"start_time": "2018-10-08T13:53:16.156978Z"
499+
}
500+
},
443501
"outputs": [
444502
{
445503
"name": "stdout",
@@ -485,6 +543,24 @@
485543
"nbconvert_exporter": "python",
486544
"pygments_lexer": "ipython3",
487545
"version": "3.6.4"
546+
},
547+
"toc": {
548+
"base_numbering": 1,
549+
"nav_menu": {},
550+
"number_sections": true,
551+
"sideBar": true,
552+
"skip_h1_title": false,
553+
"title_cell": "Table of Contents",
554+
"title_sidebar": "Contents",
555+
"toc_cell": true,
556+
"toc_position": {
557+
"height": "calc(100% - 180px)",
558+
"left": "10px",
559+
"top": "150px",
560+
"width": "384px"
561+
},
562+
"toc_section_display": true,
563+
"toc_window_display": true
488564
}
489565
},
490566
"nbformat": 4,

0 commit comments

Comments
 (0)