diff --git a/machine_learning_notes.ipynb b/machine_learning_notes.ipynb index e68f269..c1b8ca6 100644 --- a/machine_learning_notes.ipynb +++ b/machine_learning_notes.ipynb @@ -74,14 +74,14 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ "import warnings\n", "warnings.filterwarnings('ignore')\n", "\n", - "import os\n", + "import os, io\n", "import pandas as pd\n", "import numpy as np\n", "import matplotlib.pyplot as plt\n", @@ -112,11 +112,7 @@ "# training evaluation\n", "from sklearn.metrics import mean_squared_log_error\n", "from sklearn.metrics import mean_squared_error\n", - "\n", - "# file browser\n", - "from selectfile import FileBrowser\n", - "train_file_picker = FileBrowser()\n", - "test_file_picker = FileBrowser()\n" + "\n" ] }, { @@ -128,242 +124,28 @@ }, { "cell_type": "code", - "execution_count": 20, - "metadata": {}, - "outputs": [ - { - "data": { - "application/vnd.jupyter.widget-view+json": { - "model_id": "794945c894fd4d79a29a68d38431fdcd", - "version_major": 2, - "version_minor": 0 - }, - "text/plain": [ - "VBox(children=(HTML(value='

/home/rodolfo/Desktop/machine_learning_notes/data/train.csv

'),))" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "train_file_picker.widget()" - ] - }, - { - "cell_type": "code", - "execution_count": 16, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ - "df = pd.read_csv(train_file_picker.path)" + "try:\n", + " from google.colab import files\n", + " files.upload()\n", + " uploaded_files = [f for f in uploaded.keys()]\n", + " df = pd.read_csv(io.StringIO(uploaded[uploaded_files[0]].decode('utf-8')))\n", + "except:\n", + " from selectfile import FileBrowser\n", + " train_file_picker = FileBrowser()\n", + " train_file_picker.widget()\n", + " \n", + "#df = pd.read_csv(train_file_picker.path)\n" ] }, { "cell_type": "code", - "execution_count": 28, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
IdMSSubClassMSZoningLotFrontageLotAreaStreetAlleyLotShapeLandContourUtilities...PoolAreaPoolQCFenceMiscFeatureMiscValMoSoldYrSoldSaleTypeSaleConditionSalePrice
0160RL65.08450PaveNaNRegLvlAllPub...0NaNNaNNaN022008WDNormal208500
1220RL80.09600PaveNaNRegLvlAllPub...0NaNNaNNaN052007WDNormal181500
2360RL68.011250PaveNaNIR1LvlAllPub...0NaNNaNNaN092008WDNormal223500
3470RL60.09550PaveNaNIR1LvlAllPub...0NaNNaNNaN022006WDAbnorml140000
4560RL84.014260PaveNaNIR1LvlAllPub...0NaNNaNNaN0122008WDNormal250000
\n", - "

5 rows × 81 columns

\n", - "
" - ], - "text/plain": [ - " Id MSSubClass MSZoning LotFrontage LotArea Street Alley LotShape \\\n", - "0 1 60 RL 65.0 8450 Pave NaN Reg \n", - "1 2 20 RL 80.0 9600 Pave NaN Reg \n", - "2 3 60 RL 68.0 11250 Pave NaN IR1 \n", - "3 4 70 RL 60.0 9550 Pave NaN IR1 \n", - "4 5 60 RL 84.0 14260 Pave NaN IR1 \n", - "\n", - " LandContour Utilities ... PoolArea PoolQC Fence MiscFeature MiscVal \\\n", - "0 Lvl AllPub ... 0 NaN NaN NaN 0 \n", - "1 Lvl AllPub ... 0 NaN NaN NaN 0 \n", - "2 Lvl AllPub ... 0 NaN NaN NaN 0 \n", - "3 Lvl AllPub ... 0 NaN NaN NaN 0 \n", - "4 Lvl AllPub ... 0 NaN NaN NaN 0 \n", - "\n", - " MoSold YrSold SaleType SaleCondition SalePrice \n", - "0 2 2008 WD Normal 208500 \n", - "1 5 2007 WD Normal 181500 \n", - "2 9 2008 WD Normal 223500 \n", - "3 2 2006 WD Abnorml 140000 \n", - "4 12 2008 WD Normal 250000 \n", - "\n", - "[5 rows x 81 columns]" - ] - }, - "execution_count": 28, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "df.head()" ] @@ -377,31 +159,16 @@ }, { "cell_type": "code", - "execution_count": 23, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "application/vnd.jupyter.widget-view+json": { - "model_id": "dbd1464bceba427ca79eefabe718b61a", - "version_major": 2, - "version_minor": 0 - }, - "text/plain": [ - "VBox(children=(HTML(value='

/home/rodolfo/Desktop/machine_learning_notes/data/train.csv

'),))" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "test_file_picker.widget()" ] }, { "cell_type": "code", - "execution_count": 24, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -410,209 +177,9 @@ }, { "cell_type": "code", - "execution_count": 27, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
IdMSSubClassMSZoningLotFrontageLotAreaStreetAlleyLotShapeLandContourUtilities...PoolAreaPoolQCFenceMiscFeatureMiscValMoSoldYrSoldSaleTypeSaleConditionSalePrice
0160RL65.08450PaveNaNRegLvlAllPub...0NaNNaNNaN022008WDNormal208500
1220RL80.09600PaveNaNRegLvlAllPub...0NaNNaNNaN052007WDNormal181500
2360RL68.011250PaveNaNIR1LvlAllPub...0NaNNaNNaN092008WDNormal223500
3470RL60.09550PaveNaNIR1LvlAllPub...0NaNNaNNaN022006WDAbnorml140000
4560RL84.014260PaveNaNIR1LvlAllPub...0NaNNaNNaN0122008WDNormal250000
\n", - "

5 rows × 81 columns

\n", - "
" - ], - "text/plain": [ - " Id MSSubClass MSZoning LotFrontage LotArea Street Alley LotShape \\\n", - "0 1 60 RL 65.0 8450 Pave NaN Reg \n", - "1 2 20 RL 80.0 9600 Pave NaN Reg \n", - "2 3 60 RL 68.0 11250 Pave NaN IR1 \n", - "3 4 70 RL 60.0 9550 Pave NaN IR1 \n", - "4 5 60 RL 84.0 14260 Pave NaN IR1 \n", - "\n", - " LandContour Utilities ... PoolArea PoolQC Fence MiscFeature MiscVal \\\n", - "0 Lvl AllPub ... 0 NaN NaN NaN 0 \n", - "1 Lvl AllPub ... 0 NaN NaN NaN 0 \n", - "2 Lvl AllPub ... 0 NaN NaN NaN 0 \n", - "3 Lvl AllPub ... 0 NaN NaN NaN 0 \n", - "4 Lvl AllPub ... 0 NaN NaN NaN 0 \n", - "\n", - " MoSold YrSold SaleType SaleCondition SalePrice \n", - "0 2 2008 WD Normal 208500 \n", - "1 5 2007 WD Normal 181500 \n", - "2 9 2008 WD Normal 223500 \n", - "3 2 2006 WD Abnorml 140000 \n", - "4 12 2008 WD Normal 250000 \n", - "\n", - "[5 rows x 81 columns]" - ] - }, - "execution_count": 27, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "df_test.head()" ] @@ -1283,7 +850,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.6.5" + "version": "3.6.3" } }, "nbformat": 4,