diff --git a/practice.ipynb b/practice.ipynb new file mode 100644 index 0000000..ca0b747 --- /dev/null +++ b/practice.ipynb @@ -0,0 +1,1664 @@ +{ + "nbformat": 4, + "nbformat_minor": 0, + "metadata": { + "colab": { + "provenance": [], + "authorship_tag": "ABX9TyPfqMnDc7BAvcI0UR60Fi0h", + "include_colab_link": true + }, + "kernelspec": { + "name": "python3", + "display_name": "Python 3" + }, + "language_info": { + "name": "python" + } + }, + "cells": [ + { + "cell_type": "markdown", + "metadata": { + "id": "view-in-github", + "colab_type": "text" + }, + "source": [ + "\"Open" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 226 + }, + "id": "NqS5tBSdxgRS", + "outputId": "83279482-9637-4da2-8179-c84b37b69e47" + }, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + " price area bedrooms bathrooms stories mainroad guestroom \\\n", + "540 1820000.0 3000 2 1.0 1 yes no \n", + "541 1767150.0 2400 3 1.0 1 no no \n", + "542 1750000.0 3620 2 1.0 1 yes no \n", + "543 1750000.0 2910 3 1.0 1 no no \n", + "544 1750000.0 3850 3 1.0 2 yes no \n", + "\n", + " basement hotwaterheating airconditioning parking prefarea \\\n", + "540 yes no no 2 no \n", + "541 no no no 0 no \n", + "542 no no no 0 no \n", + "543 no no no 0 no \n", + "544 no no no 0 no \n", + "\n", + " furnishingstatus \n", + "540 unfurnished \n", + "541 semi-furnished \n", + "542 unfurnished \n", + "543 furnished \n", + "544 unfurnished " + ], + "text/html": [ + "\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
priceareabedroomsbathroomsstoriesmainroadguestroombasementhotwaterheatingairconditioningparkingprefareafurnishingstatus
5401820000.0300021.01yesnoyesnono2nounfurnished
5411767150.0240031.01nonononono0nosemi-furnished
5421750000.0362021.01yesnononono0nounfurnished
5431750000.0291031.01nonononono0nofurnished
5441750000.0385031.02yesnononono0nounfurnished
\n", + "
\n", + "
\n", + "\n", + "
\n", + " \n", + "\n", + " \n", + "\n", + " \n", + "
\n", + "\n", + "\n", + "
\n", + " \n", + "\n", + "\n", + "\n", + " \n", + "
\n", + "\n", + "
\n", + "
\n" + ], + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "dataframe", + "summary": "{\n \"name\": \"df\",\n \"rows\": 5,\n \"fields\": [\n {\n \"column\": \"price\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 30311.29327494952,\n \"min\": 1750000.0,\n \"max\": 1820000.0,\n \"num_unique_values\": 3,\n \"samples\": [\n 1820000.0,\n 1767150.0,\n 1750000.0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"area\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 581,\n \"min\": 2400,\n \"max\": 3850,\n \"num_unique_values\": 5,\n \"samples\": [\n 2400,\n 3850,\n 3620\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"bedrooms\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0,\n \"min\": 2,\n \"max\": 3,\n \"num_unique_values\": 2,\n \"samples\": [\n 3,\n 2\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"bathrooms\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0.0,\n \"min\": 1.0,\n \"max\": 1.0,\n \"num_unique_values\": 1,\n \"samples\": [\n 1.0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"stories\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0,\n \"min\": 1,\n \"max\": 2,\n \"num_unique_values\": 2,\n \"samples\": [\n 2\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"mainroad\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"no\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"guestroom\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 1,\n \"samples\": [\n \"no\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"basement\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"no\"\n ],\n \"semantic_type\": \"\",\n 
\"description\": \"\"\n }\n },\n {\n \"column\": \"hotwaterheating\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 1,\n \"samples\": [\n \"no\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"airconditioning\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 1,\n \"samples\": [\n \"no\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"parking\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n \"max\": 2,\n \"num_unique_values\": 2,\n \"samples\": [\n 0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"prefarea\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 1,\n \"samples\": [\n \"no\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"furnishingstatus\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 3,\n \"samples\": [\n \"unfurnished\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}" + } + }, + "metadata": {}, + "execution_count": 3 + } + ], + "source": [ + "import pandas as pd\n", + "import seaborn as sns\n", + "import matplotlib.pyplot as plt\n", + "\n", + "# Load the dataset; the CSV path is relative to the notebook's working directory\n", + "data = 'Housing.csv'\n", + "df = pd.read_csv(data)\n", + "\n", + "# Only the last expression of a cell is rendered automatically, so the head is\n", + "# shown with an explicit display() call; the tail is rendered as the cell result.\n", + "display(df.head(5))\n", + "df.tail(5)" + ] + }, + { + "cell_type": "code", + "source": [ + "df.describe()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 300 + }, + "id": "b5c0atj-0onX", + "outputId": "f46f425a-06c6-4a6c-c984-51ec47085709" + }, + "execution_count": 4, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + " price area bedrooms bathrooms stories \\\n", + "count 5.440000e+02 545.000000 545.000000 543.000000 545.000000 \n", + "mean 4.760855e+06 5150.541284 2.965138 1.285451 1.805505 \n", + "std 1.867122e+06 2170.141023 0.738064 0.502310 0.867492 \n", + "min 
1.750000e+06 1650.000000 1.000000 1.000000 1.000000 \n", + "25% 3.430000e+06 3600.000000 2.000000 1.000000 1.000000 \n", + "50% 4.340000e+06 4600.000000 3.000000 1.000000 2.000000 \n", + "75% 5.740000e+06 6360.000000 3.000000 2.000000 2.000000 \n", + "max 1.330000e+07 16200.000000 6.000000 4.000000 4.000000 \n", + "\n", + " parking \n", + "count 545.000000 \n", + "mean 0.693578 \n", + "std 0.861586 \n", + "min 0.000000 \n", + "25% 0.000000 \n", + "50% 0.000000 \n", + "75% 1.000000 \n", + "max 3.000000 " + ], + "text/html": [ + "\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
priceareabedroomsbathroomsstoriesparking
count5.440000e+02545.000000545.000000543.000000545.000000545.000000
mean4.760855e+065150.5412842.9651381.2854511.8055050.693578
std1.867122e+062170.1410230.7380640.5023100.8674920.861586
min1.750000e+061650.0000001.0000001.0000001.0000000.000000
25%3.430000e+063600.0000002.0000001.0000001.0000000.000000
50%4.340000e+064600.0000003.0000001.0000002.0000000.000000
75%5.740000e+066360.0000003.0000002.0000002.0000001.000000
max1.330000e+0716200.0000006.0000004.0000004.0000003.000000
\n", + "
\n", + "
\n", + "\n", + "
\n", + " \n", + "\n", + " \n", + "\n", + " \n", + "
\n", + "\n", + "\n", + "
\n", + " \n", + "\n", + "\n", + "\n", + " \n", + "
\n", + "\n", + "
\n", + "
\n" + ], + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "dataframe", + "summary": "{\n \"name\": \"df\",\n \"rows\": 8,\n \"fields\": [\n {\n \"column\": \"price\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 4050987.2502240124,\n \"min\": 544.0,\n \"max\": 13300000.0,\n \"num_unique_values\": 8,\n \"samples\": [\n 4760854.669117647,\n 4340000.0,\n 544.0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"area\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 4906.2698868605785,\n \"min\": 545.0,\n \"max\": 16200.0,\n \"num_unique_values\": 8,\n \"samples\": [\n 5150.54128440367,\n 4600.0,\n 545.0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"bedrooms\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 191.74878444768592,\n \"min\": 0.7380638605685743,\n \"max\": 545.0,\n \"num_unique_values\": 7,\n \"samples\": [\n 545.0,\n 2.9651376146788992,\n 3.0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"bathrooms\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 191.43771613213667,\n \"min\": 0.5023102796865925,\n \"max\": 543.0,\n \"num_unique_values\": 6,\n \"samples\": [\n 543.0,\n 1.285451197053407,\n 4.0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"stories\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 192.04914398408363,\n \"min\": 0.8674924629255264,\n \"max\": 545.0,\n \"num_unique_values\": 6,\n \"samples\": [\n 545.0,\n 1.8055045871559634,\n 4.0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"parking\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 192.40854964721385,\n \"min\": 0.0,\n \"max\": 545.0,\n \"num_unique_values\": 6,\n \"samples\": [\n 545.0,\n 0.6935779816513762,\n 3.0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}" + } + }, + "metadata": {}, + "execution_count": 
4 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# (rows, columns) of the loaded frame\n", + "df.shape" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "0o-UJKN10sFI", + "outputId": "02aeea22-3ace-41b5-b009-bd2fdf7bc3f5" + }, + "execution_count": 6, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "(545, 13)" + ] + }, + "metadata": {}, + "execution_count": 6 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Column dtypes and non-null counts\n", + "df.info()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "sQRsz4tP0tez", + "outputId": "0f6c5765-9d34-4985-9fb3-44132df64831" + }, + "execution_count": 7, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "\n", + "RangeIndex: 545 entries, 0 to 544\n", + "Data columns (total 13 columns):\n", + " # Column Non-Null Count Dtype \n", + "--- ------ -------------- ----- \n", + " 0 price 544 non-null float64\n", + " 1 area 545 non-null int64 \n", + " 2 bedrooms 545 non-null int64 \n", + " 3 bathrooms 543 non-null float64\n", + " 4 stories 545 non-null int64 \n", + " 5 mainroad 545 non-null object \n", + " 6 guestroom 544 non-null object \n", + " 7 basement 544 non-null object \n", + " 8 hotwaterheating 545 non-null object \n", + " 9 airconditioning 544 non-null object \n", + " 10 parking 545 non-null int64 \n", + " 11 prefarea 545 non-null object \n", + " 12 furnishingstatus 544 non-null object \n", + "dtypes: float64(2), int64(4), object(7)\n", + "memory usage: 55.5+ KB\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Frequency of each basement value (missing entries are not counted)\n", + "basement_counts = df['basement'].value_counts()\n", + "basement_counts" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "C6H2NAxm1OtP", + "outputId": "d95704fe-c0d4-4ceb-c7ed-13b76ed3e766" + }, + "execution_count": 8, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "basement\n", + "no 354\n", + "yes 190\n", + "Name: count, dtype: int64" + ] + }, + "metadata": {}, + "execution_count": 8 + 
} + ] + }, + { + "cell_type": "code", + "source": [ + "# 'basement' is a yes/no category, so plot bar counts per value;\n", + "# a kernel density estimate over category positions has no meaning.\n", + "sns.countplot(x='basement', data=df)\n", + "plt.title('Number of houses by basement value')\n", + "plt.show()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 449 + }, + "id": "kIkFbI791WIJ", + "outputId": "ee5da8d2-549e-4bdd-d0c4-cabad00b6d96" + }, + "execution_count": 9, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/plain": [ + "
" + ], + "image/png": "\n" + }, + "metadata": {} + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Box plot of price to spot outliers\n", + "sns.boxplot(x='price', data=df)\n", + "plt.title('Distribution of price')\n", + "plt.show()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 449 + }, + "id": "rt4xv9Ws1nYp", + "outputId": "d2156ed1-60eb-49aa-c37a-ff61f7065978" + }, + "execution_count": 10, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/plain": [ + "
" + ], + "image/png": "\n" + }, + "metadata": {} + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Select only the numeric columns\n", + "numeric_df = df.select_dtypes(include=['number'])\n", + "\n", + "# Count the negative entries in each numeric column\n", + "(numeric_df < 0).sum()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "yYLHDjuf2PAS", + "outputId": "c25e9389-3b0e-4aa6-f8ae-15b577f7baec" + }, + "execution_count": 14, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "price 0\n", + "area 0\n", + "bedrooms 0\n", + "bathrooms 0\n", + "stories 0\n", + "parking 0\n", + "dtype: int64" + ] + }, + "metadata": {}, + "execution_count": 14 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Number of missing values per column\n", + "df.isnull().sum()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "-WJVBOOr2tsq", + "outputId": "e7e9baa4-2880-4004-9013-b99e01c260d0" + }, + "execution_count": 15, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "price 1\n", + "area 0\n", + "bedrooms 0\n", + "bathrooms 2\n", + "stories 0\n", + "mainroad 0\n", + "guestroom 1\n", + "basement 1\n", + "hotwaterheating 0\n", + "airconditioning 1\n", + "parking 0\n", + "prefarea 0\n", + "furnishingstatus 1\n", + "dtype: int64" + ] + }, + "metadata": {}, + "execution_count": 15 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# NOTE: isna() is an alias of isnull(), so this repeats the previous cell's result\n", + "df.isna().sum()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "cdSFVfxC3aMt", + "outputId": "598d99df-b8ea-4a8c-d593-2d0640a47d7a" + }, + "execution_count": 16, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "price 1\n", + "area 0\n", + "bedrooms 0\n", + "bathrooms 2\n", + "stories 0\n", + "mainroad 0\n", + "guestroom 1\n", + "basement 1\n", + "hotwaterheating 0\n", + "airconditioning 1\n", + "parking 0\n", + "prefarea 0\n", + "furnishingstatus 1\n", + "dtype: int64" + ] + 
}, + "metadata": {}, + "execution_count": 16 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# sns and plt are imported once in the first cell, so they are not re-imported here\n", + "plt.figure(figsize=(10,6))\n", + "# Plot the boolean missing-value mask; the colour bar is hidden\n", + "sns.heatmap(df.isnull(),cbar=False,cmap='viridis')\n", + "plt.title('Missing values in Housing Prices Dataset')\n", + "plt.show()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 524 + }, + "id": "dbxCGHJi3e8j", + "outputId": "f3af5f1f-2e19-4367-a040-eb7839cd0692" + }, + "execution_count": 18, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/plain": [ + "
" + ], + "image/png": "\n" + }, + "metadata": {} + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Text columns to replace with integer category codes.\n", + "# NOTE(review): 'hotwaterheating' is not in this list and stays a text column - confirm that is intended.\n", + "categorical_cols = ['mainroad','guestroom','basement','airconditioning','prefarea','furnishingstatus']\n", + "\n", + "for col in categorical_cols:\n", + "    # Encode only columns that are not numeric yet. Re-encoding integer codes when the\n", + "    # cell is run again would shift every code by one and turn the -1 missing-value\n", + "    # marker into an ordinary category.\n", + "    if not pd.api.types.is_numeric_dtype(df[col]):\n", + "        # cat.codes numbers the sorted categories from 0 and maps missing values to -1\n", + "        df[col] = df[col].astype('category').cat.codes\n", + "\n", + "# Report the resulting dtypes once, after all columns have been processed\n", + "df.info()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "cUKB_QI-48yJ", + "outputId": "4dae7b9e-fd76-4ca7-c40f-4d8b964cc3b1" + }, + "execution_count": 21, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "\n", + "RangeIndex: 545 entries, 0 to 544\n", + "Data columns (total 13 columns):\n", + " # Column Non-Null Count Dtype \n", + "--- ------ -------------- ----- \n", + " 0 price 544 non-null float64\n", + " 1 area 545 non-null int64 \n", + " 2 bedrooms 545 non-null int64 \n", + " 3 bathrooms 543 non-null float64\n", + " 4 stories 545 non-null int64 \n", + " 5 mainroad 545 non-null int8 \n", + " 6 guestroom 545 non-null int8 \n", + " 7 basement 545 non-null int8 \n", + " 8 hotwaterheating 545 non-null object \n", + " 9 airconditioning 545 non-null int8 \n", + " 10 parking 545 non-null int64 \n", + " 11 prefarea 545 non-null object \n", + " 12 furnishingstatus 544 non-null object \n", + "dtypes: float64(2), int64(4), int8(4), object(3)\n", + "memory usage: 40.6+ KB\n", + "\n", + "RangeIndex: 545 entries, 0 to 544\n", + "Data columns (total 13 columns):\n", + " # Column Non-Null Count Dtype \n", + "--- ------ -------------- ----- \n", + " 0 price 544 non-null float64\n", + " 1 area 545 non-null int64 \n", + " 2 bedrooms 545 non-null int64 \n", + " 3 bathrooms 543 non-null float64\n", + " 4 stories 545 non-null int64 \n", + " 5 mainroad 545 non-null int8 \n", + " 6 guestroom 545 non-null int8 \n", + " 7 basement 545 non-null int8 \n", + " 8 hotwaterheating 545 non-null object \n", + " 9 airconditioning 545 non-null int8 \n", + " 10 parking 545 non-null int64 \n", + " 11 prefarea 545 
non-null object \n", + " 12 furnishingstatus 544 non-null object \n", + "dtypes: float64(2), int64(4), int8(4), object(3)\n", + "memory usage: 40.6+ KB\n", + "\n", + "RangeIndex: 545 entries, 0 to 544\n", + "Data columns (total 13 columns):\n", + " # Column Non-Null Count Dtype \n", + "--- ------ -------------- ----- \n", + " 0 price 544 non-null float64\n", + " 1 area 545 non-null int64 \n", + " 2 bedrooms 545 non-null int64 \n", + " 3 bathrooms 543 non-null float64\n", + " 4 stories 545 non-null int64 \n", + " 5 mainroad 545 non-null int8 \n", + " 6 guestroom 545 non-null int8 \n", + " 7 basement 545 non-null int8 \n", + " 8 hotwaterheating 545 non-null object \n", + " 9 airconditioning 545 non-null int8 \n", + " 10 parking 545 non-null int64 \n", + " 11 prefarea 545 non-null object \n", + " 12 furnishingstatus 544 non-null object \n", + "dtypes: float64(2), int64(4), int8(4), object(3)\n", + "memory usage: 40.6+ KB\n", + "\n", + "RangeIndex: 545 entries, 0 to 544\n", + "Data columns (total 13 columns):\n", + " # Column Non-Null Count Dtype \n", + "--- ------ -------------- ----- \n", + " 0 price 544 non-null float64\n", + " 1 area 545 non-null int64 \n", + " 2 bedrooms 545 non-null int64 \n", + " 3 bathrooms 543 non-null float64\n", + " 4 stories 545 non-null int64 \n", + " 5 mainroad 545 non-null int8 \n", + " 6 guestroom 545 non-null int8 \n", + " 7 basement 545 non-null int8 \n", + " 8 hotwaterheating 545 non-null object \n", + " 9 airconditioning 545 non-null int8 \n", + " 10 parking 545 non-null int64 \n", + " 11 prefarea 545 non-null object \n", + " 12 furnishingstatus 544 non-null object \n", + "dtypes: float64(2), int64(4), int8(4), object(3)\n", + "memory usage: 40.6+ KB\n", + "\n", + "RangeIndex: 545 entries, 0 to 544\n", + "Data columns (total 13 columns):\n", + " # Column Non-Null Count Dtype \n", + "--- ------ -------------- ----- \n", + " 0 price 544 non-null float64\n", + " 1 area 545 non-null int64 \n", + " 2 bedrooms 545 non-null int64 \n", + " 
3 bathrooms 543 non-null float64\n", + " 4 stories 545 non-null int64 \n", + " 5 mainroad 545 non-null int8 \n", + " 6 guestroom 545 non-null int8 \n", + " 7 basement 545 non-null int8 \n", + " 8 hotwaterheating 545 non-null object \n", + " 9 airconditioning 545 non-null int8 \n", + " 10 parking 545 non-null int64 \n", + " 11 prefarea 545 non-null int8 \n", + " 12 furnishingstatus 544 non-null object \n", + "dtypes: float64(2), int64(4), int8(5), object(2)\n", + "memory usage: 36.8+ KB\n", + "\n", + "RangeIndex: 545 entries, 0 to 544\n", + "Data columns (total 13 columns):\n", + " # Column Non-Null Count Dtype \n", + "--- ------ -------------- ----- \n", + " 0 price 544 non-null float64\n", + " 1 area 545 non-null int64 \n", + " 2 bedrooms 545 non-null int64 \n", + " 3 bathrooms 543 non-null float64\n", + " 4 stories 545 non-null int64 \n", + " 5 mainroad 545 non-null int8 \n", + " 6 guestroom 545 non-null int8 \n", + " 7 basement 545 non-null int8 \n", + " 8 hotwaterheating 545 non-null object \n", + " 9 airconditioning 545 non-null int8 \n", + " 10 parking 545 non-null int64 \n", + " 11 prefarea 545 non-null int8 \n", + " 12 furnishingstatus 545 non-null int8 \n", + "dtypes: float64(2), int64(4), int8(6), object(1)\n", + "memory usage: 33.1+ KB\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "# True for every column that holds exactly one distinct non-missing value\n", + "single_value_columns = df.nunique() == 1\n", + "\n", + "# Check if any column has a single unique value\n", + "if single_value_columns.any():\n", + "    print(\"Yes, the dataset contains columns with unique single value\")\n", + "    print(\"Columns with a unique single value:\",df.columns[single_value_columns].tolist())\n", + "\n", + "else:\n", + "    print(\"No, the dataset does not contain any columns with a unique single value\")" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "1i0MLxF-5vD6", + "outputId": "0a949617-a651-45e5-b59c-a011390bbc4f" + }, + "execution_count": 22, + "outputs": [ + { + "output_type": "stream", + 
"name": "stdout", + "text": [ + "No, the dataset does not contain any columns with a unique single value\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Drop the 'stories' column. errors='ignore' keeps the cell re-runnable:\n", + "# without it a second run raises KeyError because the column is already gone.\n", + "df = df.drop(columns=['stories'], errors='ignore')\n", + "df.head(5)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 226 + }, + "id": "NIM1X2fz7gEU", + "outputId": "73cbf7a2-6fc9-44f9-c6fd-446ed005057d" + }, + "execution_count": 23, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + " price area bedrooms bathrooms mainroad guestroom basement \\\n", + "0 13300000.0 7420 4 2.0 1 1 1 \n", + "1 12250000.0 8960 4 4.0 1 1 1 \n", + "2 12250000.0 9960 3 2.0 1 1 2 \n", + "3 12215000.0 7500 4 2.0 1 1 2 \n", + "4 11410000.0 7420 4 1.0 1 2 2 \n", + "\n", + " hotwaterheating airconditioning parking prefarea furnishingstatus \n", + "0 no 2 2 1 0 \n", + "1 no 2 3 0 0 \n", + "2 no 1 2 1 1 \n", + "3 no 2 3 1 0 \n", + "4 no 2 2 0 0 " + ], + "text/html": [ + "\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
priceareabedroomsbathroomsmainroadguestroombasementhotwaterheatingairconditioningparkingprefareafurnishingstatus
013300000.0742042.0111no2210
112250000.0896044.0111no2300
212250000.0996032.0112no1211
312215000.0750042.0112no2310
411410000.0742041.0122no2200
\n", + "
\n", + "
\n", + "\n", + "
\n", + " \n", + "\n", + " \n", + "\n", + " \n", + "
\n", + "\n", + "\n", + "
\n", + " \n", + "\n", + "\n", + "\n", + " \n", + "
\n", + "\n", + "
\n", + "
\n" + ], + "application/vnd.google.colaboratory.intrinsic+json": { + "type": "dataframe", + "variable_name": "df", + "summary": "{\n \"name\": \"df\",\n \"rows\": 545,\n \"fields\": [\n {\n \"column\": \"price\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 1867121.9543386477,\n \"min\": 1750000.0,\n \"max\": 13300000.0,\n \"num_unique_values\": 218,\n \"samples\": [\n 5040000.0,\n 1820000.0,\n 4130000.0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"area\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 2170,\n \"min\": 1650,\n \"max\": 16200,\n \"num_unique_values\": 284,\n \"samples\": [\n 6000,\n 2684,\n 5360\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"bedrooms\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0,\n \"min\": 1,\n \"max\": 6,\n \"num_unique_values\": 6,\n \"samples\": [\n 4,\n 3,\n 1\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"bathrooms\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0.5023102796865925,\n \"min\": 1.0,\n \"max\": 4.0,\n \"num_unique_values\": 4,\n \"samples\": [\n 4.0,\n 3.0,\n 2.0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"mainroad\",\n \"properties\": {\n \"dtype\": \"int8\",\n \"num_unique_values\": 2,\n \"samples\": [\n 0,\n 1\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"guestroom\",\n \"properties\": {\n \"dtype\": \"int8\",\n \"num_unique_values\": 3,\n \"samples\": [\n 1,\n 2\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"basement\",\n \"properties\": {\n \"dtype\": \"int8\",\n \"num_unique_values\": 3,\n \"samples\": [\n 1,\n 2\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"hotwaterheating\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"yes\",\n \"no\"\n ],\n 
\"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"airconditioning\",\n \"properties\": {\n \"dtype\": \"int8\",\n \"num_unique_values\": 3,\n \"samples\": [\n 2,\n 1\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"parking\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n \"max\": 3,\n \"num_unique_values\": 4,\n \"samples\": [\n 3,\n 1\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"prefarea\",\n \"properties\": {\n \"dtype\": \"int8\",\n \"num_unique_values\": 2,\n \"samples\": [\n 0,\n 1\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"furnishingstatus\",\n \"properties\": {\n \"dtype\": \"int8\",\n \"num_unique_values\": 4,\n \"samples\": [\n 1,\n -1\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}" + } + }, + "metadata": {}, + "execution_count": 23 + } + ] + }, + { + "cell_type": "code", + "source": [ + "import matplotlib.pyplot as plt\n", + "\n", + "# Yearly values of two items over the same six years\n", + "year = [2000, 2001, 2002, 2003, 2004, 2005]\n", + "itemA = [400, 80, 120, 300, 150, 90]\n", + "itemB = [120, 100, 80, 120, 260, 90]\n", + "\n", + "# First panel of a 2x2 grid: item A shaded between its minimum and its values\n", + "left_ax = plt.subplot(2, 2, 1)\n", + "left_ax.fill_between(year, min(itemA), itemA, alpha=0.5)\n", + "\n", + "# Second panel: both items overlaid, each shaded from its own minimum\n", + "right_ax = plt.subplot(2, 2, 2)\n", + "for series in (itemA, itemB):\n", + "    right_ax.fill_between(year, min(series), series, alpha=0.5)\n", + "plt.show()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 228 + }, + "id": "1hSF4toF8Am7", + "outputId": "3d3a8cf9-c2c6-4420-cd85-532d8188f69f" + }, + "execution_count": 32, + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/plain": [ + "
" + ], + "image/png": "\n" + }, + "metadata": {} + } + ] + } + ] +} \ No newline at end of file