{"payload":{"allShortcutsEnabled":false,"fileTree":{"2017-fall/seminars":{"items":[{"name":"data","path":"2017-fall/seminars/data","contentType":"directory"},{"name":"images","path":"2017-fall/seminars/images","contentType":"directory"},{"name":"sem01-intro.ipynb","path":"2017-fall/seminars/sem01-intro.ipynb","contentType":"file"},{"name":"sem01-tools.ipynb","path":"2017-fall/seminars/sem01-tools.ipynb","contentType":"file"},{"name":"sem02-linregr-part1.pdf","path":"2017-fall/seminars/sem02-linregr-part1.pdf","contentType":"file"},{"name":"sem02-linregr-part2.ipynb","path":"2017-fall/seminars/sem02-linregr-part2.ipynb","contentType":"file"},{"name":"sem03-linregr.ipynb","path":"2017-fall/seminars/sem03-linregr.ipynb","contentType":"file"},{"name":"sem04-linclass-metrics.pdf","path":"2017-fall/seminars/sem04-linclass-metrics.pdf","contentType":"file"},{"name":"sem05-linclass.ipynb","path":"2017-fall/seminars/sem05-linclass.ipynb","contentType":"file"},{"name":"sem05-linclass.pdf","path":"2017-fall/seminars/sem05-linclass.pdf","contentType":"file"},{"name":"sem06-knn.pdf","path":"2017-fall/seminars/sem06-knn.pdf","contentType":"file"},{"name":"sem07-trees.ipynb","path":"2017-fall/seminars/sem07-trees.ipynb","contentType":"file"},{"name":"sem08_bvd.pdf","path":"2017-fall/seminars/sem08_bvd.pdf","contentType":"file"},{"name":"sem09-gbm-part1.pdf","path":"2017-fall/seminars/sem09-gbm-part1.pdf","contentType":"file"},{"name":"sem09-gbm-part2.ipynb","path":"2017-fall/seminars/sem09-gbm-part2.ipynb","contentType":"file"},{"name":"sem10-nn-part1.pdf","path":"2017-fall/seminars/sem10-nn-part1.pdf","contentType":"file"},{"name":"sem10-nn-part2.ipynb","path":"2017-fall/seminars/sem10-nn-part2.ipynb","contentType":"file"},{"name":"sem11-visualization.ipynb","path":"2017-fall/seminars/sem11-visualization.ipynb","contentType":"file"}],"totalCount":18},"2017-fall":{"items":[{"name":"homeworks-practice","path":"2017-fall/homeworks-practice","contentType":"directory"},{"name":"homeworks-theory","path":"2017-fall/homeworks-theory","contentType":"directory"},{"name":"lecture-notes","path":"2017-fall/lecture-notes","contentType":"directory"},{"name":"seminars","path":"2017-fall/seminars","contentType":"directory"}],"totalCount":4},"":{"items":[{"name":"2016-fall","path":"2016-fall","contentType":"directory"},{"name":"2016-spring","path":"2016-spring","contentType":"directory"},{"name":"2017-fall","path":"2017-fall","contentType":"directory"},{"name":"2017-spring","path":"2017-spring","contentType":"directory"},{"name":"2018-fall","path":"2018-fall","contentType":"directory"},{"name":"2018-spring","path":"2018-spring","contentType":"directory"},{"name":"2019-fall","path":"2019-fall","contentType":"directory"},{"name":"2019-spring","path":"2019-spring","contentType":"directory"},{"name":"2020-fall","path":"2020-fall","contentType":"directory"},{"name":"2020-spring","path":"2020-spring","contentType":"directory"},{"name":"2021-fall","path":"2021-fall","contentType":"directory"},{"name":"2021-spring","path":"2021-spring","contentType":"directory"},{"name":"2022-fall","path":"2022-fall","contentType":"directory"},{"name":"2022-spring","path":"2022-spring","contentType":"directory"},{"name":"2023-fall","path":"2023-fall","contentType":"directory"},{"name":"2023-spring","path":"2023-spring","contentType":"directory"},{"name":".gitignore","path":".gitignore","contentType":"file"},{"name":"README.md","path":"README.md","contentType":"file"}],"totalCount":18}},"fileTreeProcessingTime":10.628796,"foldersToFetch":[],"repo":{"id":67353330,"defaultBranch":"master","name":"ml-course-hse","ownerLogin":"esokolov","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2016-09-04T15:36:26.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/1822514?v=4","public":true,"private":false,"isOrgOwned":false},"symbolsExpanded":false,"treeExpanded":true,"refInfo":{"name":"master","listCacheKey":"v0:1709110718.0","canEdit":false,"refType":"branch","currentOid":"fb465e4cb6ed5fb2c2741009743dbd1e11fb9783"},"path":"2017-fall/seminars/sem03-linregr.ipynb","currentUser":null,"blob":{"rawLines":["{"," \"cells\": ["," {"," \"cell_type\": \"markdown\","," \"metadata\": {},"," \"source\": ["," \"# Предобработка данных и функции потерь в линейной регрессии\""," ]"," },"," {"," \"cell_type\": \"markdown\","," \"metadata\": {},"," \"source\": ["," \"## Данные\\n\","," \"Для демонстраций загрузим набор данных [Automobile Data Set](https://archive.ics.uci.edu/ml/datasets/Automobile). В данных присутствуют категориальные, целочисленные и вещественнозначные признаки.\""," ]"," },"," {"," \"cell_type\": \"code\","," \"execution_count\": 1,"," \"metadata\": {"," \"collapsed\": true"," },"," \"outputs\": [],"," \"source\": ["," \"import pandas as pd\\n\","," \"X_raw = pd.read_csv(\\\"https://archive.ics.uci.edu/ml/machine-learning-databases/autos/imports-85.data\\\", \\\\\\n\","," \" header=None, na_values=[\\\"?\\\"])\""," ]"," },"," {"," \"cell_type\": \"code\","," \"execution_count\": 68,"," \"metadata\": {},"," \"outputs\": ["," {"," \"data\": {"," \"text/html\": ["," \"
\\n\","," \" | 0 | \\n\","," \"1 | \\n\","," \"2 | \\n\","," \"3 | \\n\","," \"4 | \\n\","," \"5 | \\n\","," \"6 | \\n\","," \"7 | \\n\","," \"8 | \\n\","," \"9 | \\n\","," \"... | \\n\","," \"16 | \\n\","," \"17 | \\n\","," \"18 | \\n\","," \"19 | \\n\","," \"20 | \\n\","," \"21 | \\n\","," \"22 | \\n\","," \"23 | \\n\","," \"24 | \\n\","," \"25 | \\n\","," \"
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \\n\","," \"3 | \\n\","," \"NaN | \\n\","," \"alfa-romero | \\n\","," \"gas | \\n\","," \"std | \\n\","," \"two | \\n\","," \"convertible | \\n\","," \"rwd | \\n\","," \"front | \\n\","," \"88.6 | \\n\","," \"... | \\n\","," \"130 | \\n\","," \"mpfi | \\n\","," \"3.47 | \\n\","," \"2.68 | \\n\","," \"9.0 | \\n\","," \"111.0 | \\n\","," \"5000.0 | \\n\","," \"21 | \\n\","," \"27 | \\n\","," \"13495.1 | \\n\","," \"
1 | \\n\","," \"3 | \\n\","," \"NaN | \\n\","," \"alfa-romero | \\n\","," \"gas | \\n\","," \"std | \\n\","," \"two | \\n\","," \"convertible | \\n\","," \"rwd | \\n\","," \"front | \\n\","," \"88.6 | \\n\","," \"... | \\n\","," \"130 | \\n\","," \"mpfi | \\n\","," \"3.47 | \\n\","," \"2.68 | \\n\","," \"9.0 | \\n\","," \"111.0 | \\n\","," \"5000.0 | \\n\","," \"21 | \\n\","," \"27 | \\n\","," \"16500.0 | \\n\","," \"
2 | \\n\","," \"1 | \\n\","," \"NaN | \\n\","," \"alfa-romero | \\n\","," \"gas | \\n\","," \"std | \\n\","," \"two | \\n\","," \"hatchback | \\n\","," \"rwd | \\n\","," \"front | \\n\","," \"94.5 | \\n\","," \"... | \\n\","," \"152 | \\n\","," \"mpfi | \\n\","," \"2.68 | \\n\","," \"3.47 | \\n\","," \"9.0 | \\n\","," \"154.0 | \\n\","," \"5000.0 | \\n\","," \"19 | \\n\","," \"26 | \\n\","," \"16500.0 | \\n\","," \"
3 | \\n\","," \"2 | \\n\","," \"164.0 | \\n\","," \"audi | \\n\","," \"gas | \\n\","," \"std | \\n\","," \"four | \\n\","," \"sedan | \\n\","," \"fwd | \\n\","," \"front | \\n\","," \"99.8 | \\n\","," \"... | \\n\","," \"109 | \\n\","," \"mpfi | \\n\","," \"3.19 | \\n\","," \"3.40 | \\n\","," \"10.0 | \\n\","," \"102.0 | \\n\","," \"5500.0 | \\n\","," \"24 | \\n\","," \"30 | \\n\","," \"13950.0 | \\n\","," \"
4 | \\n\","," \"2 | \\n\","," \"164.0 | \\n\","," \"audi | \\n\","," \"gas | \\n\","," \"std | \\n\","," \"four | \\n\","," \"sedan | \\n\","," \"4wd | \\n\","," \"front | \\n\","," \"99.4 | \\n\","," \"... | \\n\","," \"136 | \\n\","," \"mpfi | \\n\","," \"3.19 | \\n\","," \"3.40 | \\n\","," \"8.0 | \\n\","," \"115.0 | \\n\","," \"5500.0 | \\n\","," \"18 | \\n\","," \"22 | \\n\","," \"17450.0 | \\n\","," \"
5 rows × 26 columns
\\n\","," \"\\n\","," \" | 0 | \\n\","," \"1 | \\n\","," \"9 | \\n\","," \"10 | \\n\","," \"11 | \\n\","," \"12 | \\n\","," \"13 | \\n\","," \"16 | \\n\","," \"18 | \\n\","," \"19 | \\n\","," \"... | \\n\","," \"2 | \\n\","," \"3 | \\n\","," \"4 | \\n\","," \"5 | \\n\","," \"6 | \\n\","," \"7 | \\n\","," \"8 | \\n\","," \"14 | \\n\","," \"15 | \\n\","," \"17 | \\n\","," \"
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \\n\","," \"3.0 | \\n\","," \"122.0 | \\n\","," \"88.6 | \\n\","," \"168.8 | \\n\","," \"64.1 | \\n\","," \"48.8 | \\n\","," \"2548.0 | \\n\","," \"130.0 | \\n\","," \"3.47 | \\n\","," \"2.68 | \\n\","," \"... | \\n\","," \"alfa-romero | \\n\","," \"gas | \\n\","," \"std | \\n\","," \"two | \\n\","," \"convertible | \\n\","," \"rwd | \\n\","," \"front | \\n\","," \"dohc | \\n\","," \"four | \\n\","," \"mpfi | \\n\","," \"
1 | \\n\","," \"3.0 | \\n\","," \"122.0 | \\n\","," \"88.6 | \\n\","," \"168.8 | \\n\","," \"64.1 | \\n\","," \"48.8 | \\n\","," \"2548.0 | \\n\","," \"130.0 | \\n\","," \"3.47 | \\n\","," \"2.68 | \\n\","," \"... | \\n\","," \"alfa-romero | \\n\","," \"gas | \\n\","," \"std | \\n\","," \"two | \\n\","," \"convertible | \\n\","," \"rwd | \\n\","," \"front | \\n\","," \"dohc | \\n\","," \"four | \\n\","," \"mpfi | \\n\","," \"
2 | \\n\","," \"1.0 | \\n\","," \"122.0 | \\n\","," \"94.5 | \\n\","," \"171.2 | \\n\","," \"65.5 | \\n\","," \"52.4 | \\n\","," \"2823.0 | \\n\","," \"152.0 | \\n\","," \"2.68 | \\n\","," \"3.47 | \\n\","," \"... | \\n\","," \"alfa-romero | \\n\","," \"gas | \\n\","," \"std | \\n\","," \"two | \\n\","," \"hatchback | \\n\","," \"rwd | \\n\","," \"front | \\n\","," \"ohcv | \\n\","," \"six | \\n\","," \"mpfi | \\n\","," \"
3 | \\n\","," \"2.0 | \\n\","," \"164.0 | \\n\","," \"99.8 | \\n\","," \"176.6 | \\n\","," \"66.2 | \\n\","," \"54.3 | \\n\","," \"2337.0 | \\n\","," \"109.0 | \\n\","," \"3.19 | \\n\","," \"3.40 | \\n\","," \"... | \\n\","," \"audi | \\n\","," \"gas | \\n\","," \"std | \\n\","," \"four | \\n\","," \"sedan | \\n\","," \"fwd | \\n\","," \"front | \\n\","," \"ohc | \\n\","," \"four | \\n\","," \"mpfi | \\n\","," \"
4 | \\n\","," \"2.0 | \\n\","," \"164.0 | \\n\","," \"99.4 | \\n\","," \"176.6 | \\n\","," \"66.4 | \\n\","," \"54.3 | \\n\","," \"2824.0 | \\n\","," \"136.0 | \\n\","," \"3.19 | \\n\","," \"3.40 | \\n\","," \"... | \\n\","," \"audi | \\n\","," \"gas | \\n\","," \"std | \\n\","," \"four | \\n\","," \"sedan | \\n\","," \"4wd | \\n\","," \"front | \\n\","," \"ohc | \\n\","," \"five | \\n\","," \"mpfi | \\n\","," \"
5 rows × 25 columns
\\n\","," \"\\n\","," \" | 0 | \\n\","," \"1 | \\n\","," \"9 | \\n\","," \"10 | \\n\","," \"11 | \\n\","," \"12 | \\n\","," \"13 | \\n\","," \"16 | \\n\","," \"18 | \\n\","," \"19 | \\n\","," \"... | \\n\","," \"15_three | \\n\","," \"15_twelve | \\n\","," \"15_two | \\n\","," \"17_2bbl | \\n\","," \"17_4bbl | \\n\","," \"17_idi | \\n\","," \"17_mfi | \\n\","," \"17_mpfi | \\n\","," \"17_spdi | \\n\","," \"17_spfi | \\n\","," \"
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \\n\","," \"3.0 | \\n\","," \"122.0 | \\n\","," \"88.6 | \\n\","," \"168.8 | \\n\","," \"64.1 | \\n\","," \"48.8 | \\n\","," \"2548.0 | \\n\","," \"130.0 | \\n\","," \"3.47 | \\n\","," \"2.68 | \\n\","," \"... | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"1 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"
1 | \\n\","," \"3.0 | \\n\","," \"122.0 | \\n\","," \"88.6 | \\n\","," \"168.8 | \\n\","," \"64.1 | \\n\","," \"48.8 | \\n\","," \"2548.0 | \\n\","," \"130.0 | \\n\","," \"3.47 | \\n\","," \"2.68 | \\n\","," \"... | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"1 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"
2 | \\n\","," \"1.0 | \\n\","," \"122.0 | \\n\","," \"94.5 | \\n\","," \"171.2 | \\n\","," \"65.5 | \\n\","," \"52.4 | \\n\","," \"2823.0 | \\n\","," \"152.0 | \\n\","," \"2.68 | \\n\","," \"3.47 | \\n\","," \"... | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"1 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"
3 | \\n\","," \"2.0 | \\n\","," \"164.0 | \\n\","," \"99.8 | \\n\","," \"176.6 | \\n\","," \"66.2 | \\n\","," \"54.3 | \\n\","," \"2337.0 | \\n\","," \"109.0 | \\n\","," \"3.19 | \\n\","," \"3.40 | \\n\","," \"... | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"1 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"
4 | \\n\","," \"2.0 | \\n\","," \"164.0 | \\n\","," \"99.4 | \\n\","," \"176.6 | \\n\","," \"66.4 | \\n\","," \"54.3 | \\n\","," \"2824.0 | \\n\","," \"136.0 | \\n\","," \"3.19 | \\n\","," \"3.40 | \\n\","," \"... | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"1 | \\n\","," \"0 | \\n\","," \"0 | \\n\","," \"
5 rows × 65 columns
\\n\","," \"\\n\","," \" | 0 | \\n\","," \"1 | \\n\","," \"2 | \\n\","," \"3 | \\n\","," \"4 | \\n\","," \"5 | \\n\","," \"6 | \\n\","," \"7 | \\n\","," \"8 | \\n\","," \"9 | \\n\","," \"... | \\n\","," \"55 | \\n\","," \"56 | \\n\","," \"57 | \\n\","," \"58 | \\n\","," \"59 | \\n\","," \"60 | \\n\","," \"61 | \\n\","," \"62 | \\n\","," \"63 | \\n\","," \"64 | \\n\","," \"
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \\n\","," \"1.0 | \\n\","," \"0.298429 | \\n\","," \"0.058309 | \\n\","," \"0.413433 | \\n\","," \"0.324786 | \\n\","," \"0.083333 | \\n\","," \"0.411171 | \\n\","," \"0.260377 | \\n\","," \"0.664286 | \\n\","," \"0.290476 | \\n\","," \"... | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"1.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"
1 | \\n\","," \"1.0 | \\n\","," \"0.298429 | \\n\","," \"0.058309 | \\n\","," \"0.413433 | \\n\","," \"0.324786 | \\n\","," \"0.083333 | \\n\","," \"0.411171 | \\n\","," \"0.260377 | \\n\","," \"0.664286 | \\n\","," \"0.290476 | \\n\","," \"... | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"1.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"
2 | \\n\","," \"0.6 | \\n\","," \"0.298429 | \\n\","," \"0.230321 | \\n\","," \"0.449254 | \\n\","," \"0.444444 | \\n\","," \"0.383333 | \\n\","," \"0.517843 | \\n\","," \"0.343396 | \\n\","," \"0.100000 | \\n\","," \"0.666667 | \\n\","," \"... | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"1.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"
3 | \\n\","," \"0.8 | \\n\","," \"0.518325 | \\n\","," \"0.384840 | \\n\","," \"0.529851 | \\n\","," \"0.504274 | \\n\","," \"0.541667 | \\n\","," \"0.329325 | \\n\","," \"0.181132 | \\n\","," \"0.464286 | \\n\","," \"0.633333 | \\n\","," \"... | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"1.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"
4 | \\n\","," \"0.8 | \\n\","," \"0.518325 | \\n\","," \"0.373178 | \\n\","," \"0.529851 | \\n\","," \"0.521368 | \\n\","," \"0.541667 | \\n\","," \"0.518231 | \\n\","," \"0.283019 | \\n\","," \"0.464286 | \\n\","," \"0.633333 | \\n\","," \"... | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"1.0 | \\n\","," \"0.0 | \\n\","," \"0.0 | \\n\","," \"
5 rows × 65 columns
\\n\","," \"