diff --git a/Python-Basic-Data-Cleaning.ipynb b/Python-Basic-Data-Cleaning.ipynb index 81b7df3..6efe415 100644 --- a/Python-Basic-Data-Cleaning.ipynb +++ b/Python-Basic-Data-Cleaning.ipynb @@ -11,7 +11,7 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 4, "id": "dd24ccc0", "metadata": {}, "outputs": [], @@ -22,7 +22,7 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 5, "id": "e75c7c42", "metadata": {}, "outputs": [ @@ -221,7 +221,7 @@ "[5 rows x 82 columns]" ] }, - "execution_count": 3, + "execution_count": 5, "metadata": {}, "output_type": "execute_result" } @@ -236,7 +236,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 6, "id": "89727911", "metadata": {}, "outputs": [], @@ -251,7 +251,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 7, "id": "122bfa3b", "metadata": {}, "outputs": [], @@ -271,7 +271,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 8, "id": "b962446e", "metadata": {}, "outputs": [ @@ -477,7 +477,7 @@ "[5 rows x 32 columns]" ] }, - "execution_count": 6, + "execution_count": 8, "metadata": {}, "output_type": "execute_result" } @@ -489,7 +489,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 9, "id": "5f2a4bac", "metadata": {}, "outputs": [], @@ -501,7 +501,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 10, "id": "19f80a57", "metadata": {}, "outputs": [ @@ -735,7 +735,7 @@ "[5 rows x 31 columns]" ] }, - "execution_count": 8, + "execution_count": 10, "metadata": {}, "output_type": "execute_result" } @@ -746,7 +746,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 11, "id": "5dba9a9c", "metadata": {}, "outputs": [ @@ -787,7 +787,7 @@ "Name: 526301100, dtype: object" ] }, - "execution_count": 9, + "execution_count": 11, "metadata": {}, "output_type": "execute_result" } @@ -799,7 +799,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 12, "id": "791a379b", "metadata": {}, "outputs": [], @@ -810,7 +810,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 13, "id": "dd76c23f", "metadata": {}, "outputs": [ @@ -1212,7 +1212,7 @@ "[370 rows x 31 columns]" ] }, - "execution_count": 11, + "execution_count": 13, "metadata": {}, "output_type": "execute_result" } @@ -1223,7 +1223,7 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 14, "id": "d0ab5134", "metadata": {}, "outputs": [ @@ -1264,7 +1264,7 @@ "dtype: object" ] }, - "execution_count": 12, + "execution_count": 14, "metadata": {}, "output_type": "execute_result" } @@ -1332,7 +1332,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 15, "id": "52ff9cea", "metadata": {}, "outputs": [ @@ -1383,7 +1383,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 16, "id": "a7531b07", "metadata": {}, "outputs": [], @@ -1394,7 +1394,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 17, "id": "23aac6d1", "metadata": {}, "outputs": [ @@ -1445,7 +1445,7 @@ }, { "cell_type": "code", - "execution_count": 24, + "execution_count": 18, "id": "4443cdeb", "metadata": {}, "outputs": [ @@ -1672,7 +1672,7 @@ "
\n", + " | order | \n", + "ms-subclass | \n", + "ms-zoning | \n", + "lot-frontage | \n", + "lot-area | \n", + "utilities | \n", + "lot-config | \n", + "land-slope | \n", + "neighborhood | \n", + "bldg-type | \n", + "... | \n", + "gr-liv-area | \n", + "bedroom-abvgr | \n", + "totrms-abvgrd | \n", + "paved-drive | \n", + "wood-deck-sf | \n", + "fence | \n", + "mo-sold | \n", + "yr-sold | \n", + "sale-type | \n", + "saleprice | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PID | \n", + "\n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " | \n", + " |
527302110 | \n", + "20 | \n", + "20 | \n", + "RL | \n", + "85.0 | \n", + "13175 | \n", + "AllPub | \n", + "Inside | \n", + "Gtl | \n", + "NWAmes | \n", + "1Fam | \n", + "... | \n", + "2073 | \n", + "3 | \n", + "7 | \n", + "Y | \n", + "349 | \n", + "MnPrv | \n", + "2 | \n", + "2010 | \n", + "WD | \n", + "210000 | \n", + "
527358140 | \n", + "21 | \n", + "20 | \n", + "RL | \n", + "105.0 | \n", + "11751 | \n", + "AllPub | \n", + "Inside | \n", + "Gtl | \n", + "NWAmes | \n", + "1Fam | \n", + "... | \n", + "1844 | \n", + "3 | \n", + "7 | \n", + "Y | \n", + "0 | \n", + "MnPrv | \n", + "1 | \n", + "2010 | \n", + "COD | \n", + "190000 | \n", + "
527358200 | \n", + "22 | \n", + "85 | \n", + "RL | \n", + "85.0 | \n", + "10625 | \n", + "AllPub | \n", + "Inside | \n", + "Gtl | \n", + "NWAmes | \n", + "1Fam | \n", + "... | \n", + "1173 | \n", + "3 | \n", + "6 | \n", + "Y | \n", + "0 | \n", + "MnPrv | \n", + "1 | \n", + "2010 | \n", + "WD | \n", + "170000 | \n", + "
534152100 | \n", + "115 | \n", + "60 | \n", + "RL | \n", + "80.0 | \n", + "10421 | \n", + "AllPub | \n", + "Inside | \n", + "Gtl | \n", + "NWAmes | \n", + "1Fam | \n", + "... | \n", + "1714 | \n", + "3 | \n", + "7 | \n", + "Y | \n", + "228 | \n", + "MnPrv | \n", + "3 | \n", + "2010 | \n", + "WD | \n", + "196500 | \n", + "
534176230 | \n", + "117 | \n", + "60 | \n", + "RL | \n", + "80.0 | \n", + "9600 | \n", + "AllPub | \n", + "Inside | \n", + "Gtl | \n", + "NWAmes | \n", + "1Fam | \n", + "... | \n", + "1645 | \n", + "4 | \n", + "7 | \n", + "Y | \n", + "0 | \n", + "GdWo | \n", + "6 | \n", + "2010 | \n", + "WD | \n", + "171000 | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
902204120 | \n", + "2653 | \n", + "50 | \n", + "RM | \n", + "50.0 | \n", + "6000 | \n", + "AllPub | \n", + "Inside | \n", + "Gtl | \n", + "OldTown | \n", + "1Fam | \n", + "... | \n", + "1566 | \n", + "5 | \n", + "7 | \n", + "Y | \n", + "24 | \n", + "MnPrv | \n", + "8 | \n", + "2006 | \n", + "WD | \n", + "139000 | \n", + "
902206090 | \n", + "2655 | \n", + "50 | \n", + "RM | \n", + "56.0 | \n", + "9576 | \n", + "AllPub | \n", + "Inside | \n", + "Gtl | \n", + "OldTown | \n", + "1Fam | \n", + "... | \n", + "1182 | \n", + "3 | \n", + "5 | \n", + "Y | \n", + "0 | \n", + "GdWo | \n", + "5 | \n", + "2006 | \n", + "WD | \n", + "120000 | \n", + "
902400110 | \n", + "2667 | \n", + "75 | \n", + "RM | \n", + "90.0 | \n", + "22950 | \n", + "AllPub | \n", + "Inside | \n", + "Gtl | \n", + "OldTown | \n", + "1Fam | \n", + "... | \n", + "3608 | \n", + "4 | \n", + "12 | \n", + "Y | \n", + "0 | \n", + "GdPrv | \n", + "6 | \n", + "2006 | \n", + "WD | \n", + "475000 | \n", + "
903229040 | \n", + "2675 | \n", + "190 | \n", + "RM | \n", + "65.0 | \n", + "7800 | \n", + "AllPub | \n", + "Inside | \n", + "Gtl | \n", + "OldTown | \n", + "2fmCon | \n", + "... | \n", + "1118 | \n", + "3 | \n", + "5 | \n", + "Y | \n", + "0 | \n", + "MnPrv | \n", + "5 | \n", + "2006 | \n", + "WD | \n", + "119900 | \n", + "
903234030 | \n", + "2683 | \n", + "30 | \n", + "RM | \n", + "50.0 | \n", + "6000 | \n", + "AllPub | \n", + "Inside | \n", + "Gtl | \n", + "OldTown | \n", + "1Fam | \n", + "... | \n", + "1103 | \n", + "2 | \n", + "5 | \n", + "Y | \n", + "166 | \n", + "MnPrv | \n", + "7 | \n", + "2006 | \n", + "WD | \n", + "110500 | \n", + "
87 rows × 31 columns
\n", + "