{ "cells": [ { "cell_type": "markdown", "id": "9048b835", "metadata": {}, "source": [ "# Use AI-powered tools to recommend optimal water usage based on crop types, soil, and weather data." ] }, { "cell_type": "markdown", "id": "7ed72255", "metadata": {}, "source": [ "### Project Topic:\n", "# EDA on Agricultural Data and prediction of optimal water usage based on crop types, soil, and weather data." ] }, { "cell_type": "markdown", "id": "bd6d582c", "metadata": {}, "source": [ "### Data Description:\n", "
| \n", " | count | \n", "mean | \n", "std | \n", "min | \n", "25% | \n", "50% | \n", "75% | \n", "max | \n", "
|---|---|---|---|---|---|---|---|---|
| temperature | \n", "10000.0 | \n", "27.353989 | \n", "7.190753 | \n", "15.000291 | \n", "21.158222 | \n", "27.313215 | \n", "33.500159 | \n", "39.992942 | \n", "
| humidity | \n", "10000.0 | \n", "60.362390 | \n", "23.143564 | \n", "20.012620 | \n", "40.315664 | \n", "60.471742 | \n", "80.518338 | \n", "99.993986 | \n", "
| wind_speed | \n", "10000.0 | \n", "7.750731 | \n", "4.158219 | \n", "0.500698 | \n", "4.179345 | \n", "7.779987 | \n", "11.297771 | \n", "14.998564 | \n", "
| evapotranspiration | \n", "10000.0 | \n", "5.488420 | \n", "2.600951 | \n", "1.000050 | \n", "3.221715 | \n", "5.500272 | \n", "7.724046 | \n", "9.998104 | \n", "
| rainfall_pattern | \n", "10000.0 | \n", "99.372761 | \n", "57.856836 | \n", "0.003347 | \n", "48.854444 | \n", "98.743438 | \n", "150.095407 | \n", "199.994429 | \n", "
| soil_moisture_levels | \n", "10000.0 | \n", "22.471766 | \n", "10.074207 | \n", "5.001640 | \n", "13.860081 | \n", "22.477858 | \n", "31.265796 | \n", "39.997889 | \n", "
| water_retention_capacity | \n", "10000.0 | \n", "30.074961 | \n", "11.471362 | \n", "10.005200 | \n", "20.098278 | \n", "30.110084 | \n", "40.026922 | \n", "49.995004 | \n", "
| drainage_properties | \n", "10000.0 | \n", "3.022900 | \n", "1.412577 | \n", "1.000000 | \n", "2.000000 | \n", "3.000000 | \n", "4.000000 | \n", "5.000000 | \n", "
| crop_water_requirement | \n", "10000.0 | \n", "7.002511 | \n", "2.889619 | \n", "2.002289 | \n", "4.475812 | \n", "7.046044 | \n", "9.467741 | \n", "11.999170 | \n", "
| water_requirement | \n", "10000.0 | \n", "11.619264 | \n", "4.059433 | \n", "1.280000 | \n", "8.650000 | \n", "11.560000 | \n", "14.500000 | \n", "23.580000 | \n", "
| \n", " | count | \n", "mean | \n", "std | \n", "min | \n", "25% | \n", "50% | \n", "75% | \n", "max | \n", "
|---|---|---|---|---|---|---|---|---|
| temperature | \n", "10000.0 | \n", "27.353989 | \n", "7.190753 | \n", "15.000291 | \n", "21.158222 | \n", "27.313215 | \n", "33.500159 | \n", "39.992942 | \n", "
| humidity | \n", "10000.0 | \n", "60.271793 | \n", "17.357673 | \n", "30.009465 | \n", "45.236748 | \n", "60.353807 | \n", "75.388753 | \n", "89.995490 | \n", "
| wind_speed | \n", "10000.0 | \n", "10.001008 | \n", "5.735475 | \n", "0.000962 | \n", "5.074958 | \n", "10.041362 | \n", "14.893477 | \n", "19.998020 | \n", "
| evapotranspiration | \n", "10000.0 | \n", "5.989707 | \n", "2.311957 | \n", "2.000044 | \n", "3.974858 | \n", "6.000242 | \n", "7.976930 | \n", "9.998315 | \n", "
| soil_moisture_levels | \n", "10000.0 | \n", "27.580465 | \n", "12.944606 | \n", "5.012156 | \n", "16.424813 | \n", "27.689425 | \n", "38.861113 | \n", "49.986044 | \n", "
| water_retention_capacity | \n", "10000.0 | \n", "34.961224 | \n", "14.298403 | \n", "10.006501 | \n", "22.599920 | \n", "34.961572 | \n", "47.391100 | \n", "59.993755 | \n", "
| crop_water_requirement | \n", "10000.0 | \n", "11.504598 | \n", "4.900640 | \n", "3.001664 | \n", "7.192825 | \n", "11.552267 | \n", "15.749134 | \n", "19.996182 | \n", "
| water_requirement | \n", "10000.0 | \n", "14.416114 | \n", "5.394774 | \n", "0.000000 | \n", "10.174467 | \n", "14.516146 | \n", "18.683850 | \n", "25.000000 | \n", "
| \n", " | temperature | \n", "humidity | \n", "wind_speed | \n", "evapotranspiration | \n", "rainfall_pattern | \n", "soil_type | \n", "soil_moisture_levels | \n", "water_retention_capacity | \n", "drainage_properties | \n", "crop_type | \n", "crop_water_requirement | \n", "growth_stage | \n", "water_requirement | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "24.363503 | \n", "49.891265 | \n", "11.084976 | \n", "6.743301 | \n", "Moderate | \n", "Sandy | \n", "19.897240 | \n", "35.673364 | \n", "4 | \n", "Wheat | \n", "11.656577 | \n", "Vegetative | \n", "17.80 | \n", "
| 1 | \n", "38.767858 | \n", "46.632968 | \n", "3.175424 | \n", "5.133632 | \n", "Low | \n", "Silty | \n", "19.440264 | \n", "46.812501 | \n", "2 | \n", "Rice | \n", "5.141654 | \n", "Fruiting | \n", "10.58 | \n", "
| 2 | \n", "33.299849 | \n", "34.092313 | \n", "5.526276 | \n", "9.680487 | \n", "Low | \n", "Clay | \n", "30.805983 | \n", "43.495237 | \n", "5 | \n", "Rice | \n", "5.427771 | \n", "Flowering | \n", "16.74 | \n", "
| 3 | \n", "29.966462 | \n", "68.581334 | \n", "10.117569 | \n", "2.970806 | \n", "Low | \n", "Clay | \n", "5.105964 | \n", "44.601767 | \n", "4 | \n", "Rice | \n", "2.668952 | \n", "Seedling | \n", "4.76 | \n", "
| 4 | \n", "18.900466 | \n", "58.129933 | \n", "7.490295 | \n", "6.290708 | \n", "Low | \n", "Sandy | \n", "38.141026 | \n", "10.108229 | \n", "4 | \n", "Soybean | \n", "3.652293 | \n", "Vegetative | \n", "9.54 | \n", "
| \n", " | temperature | \n", "humidity | \n", "wind_speed | \n", "evapotranspiration | \n", "rainfall_pattern | \n", "soil_type | \n", "soil_moisture_levels | \n", "water_retention_capacity | \n", "drainage_properties | \n", "crop_type | \n", "crop_water_requirement | \n", "growth_stage | \n", "water_requirement | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 9995 | \n", "36.441400 | \n", "82.622318 | \n", "19.045509 | \n", "8.032271 | \n", "moderate | \n", "loamy | \n", "31.747844 | \n", "26.106453 | \n", "good | \n", "maize | \n", "15.084630 | \n", "seedling | \n", "15.641018 | \n", "
| 9996 | \n", "37.437721 | \n", "32.808837 | \n", "14.956484 | \n", "8.116215 | \n", "low | \n", "clay | \n", "47.597710 | \n", "28.731312 | \n", "poor | \n", "maize | \n", "4.992290 | \n", "vegetative | \n", "10.341907 | \n", "
| 9997 | \n", "38.667698 | \n", "48.221908 | \n", "0.389117 | \n", "4.156555 | \n", "moderate | \n", "clay | \n", "46.441333 | \n", "29.085087 | \n", "poor | \n", "wheat | \n", "13.740037 | \n", "vegetative | \n", "18.723048 | \n", "
| 9998 | \n", "24.937200 | \n", "56.599200 | \n", "8.020097 | \n", "5.474558 | \n", "moderate | \n", "clay | \n", "14.020896 | \n", "16.481613 | \n", "moderate | \n", "wheat | \n", "3.225509 | \n", "seedling | \n", "6.158259 | \n", "
| 9999 | \n", "20.428510 | \n", "40.335889 | \n", "5.147960 | \n", "5.899390 | \n", "high | \n", "clay | \n", "9.463352 | \n", "57.364348 | \n", "good | \n", "rice | \n", "3.960593 | \n", "vegetative | \n", "3.657213 | \n", "
| \n", " | temperature | \n", "humidity | \n", "wind_speed | \n", "evapotranspiration | \n", "rainfall_pattern | \n", "soil_type | \n", "soil_moisture_levels | \n", "water_retention_capacity | \n", "drainage_properties | \n", "crop_type | \n", "crop_water_requirement | \n", "growth_stage | \n", "water_requirement | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "24.363503 | \n", "49.891265 | \n", "11.084976 | \n", "6.743301 | \n", "moderate | \n", "sandy | \n", "19.897240 | \n", "35.673364 | \n", "good | \n", "wheat | \n", "11.656577 | \n", "vegetative | \n", "17.800000 | \n", "
| 1 | \n", "38.767858 | \n", "46.632968 | \n", "3.175424 | \n", "5.133632 | \n", "low | \n", "silty | \n", "19.440264 | \n", "46.812501 | \n", "poor | \n", "rice | \n", "5.141654 | \n", "fruiting | \n", "10.580000 | \n", "
| 2 | \n", "33.299849 | \n", "34.092313 | \n", "5.526276 | \n", "9.680487 | \n", "low | \n", "clay | \n", "30.805983 | \n", "43.495237 | \n", "good | \n", "rice | \n", "5.427771 | \n", "flowering | \n", "16.740000 | \n", "
| 3 | \n", "29.966462 | \n", "68.581334 | \n", "10.117569 | \n", "2.970806 | \n", "low | \n", "clay | \n", "5.105964 | \n", "44.601767 | \n", "good | \n", "rice | \n", "2.668952 | \n", "seedling | \n", "4.760000 | \n", "
| 4 | \n", "18.900466 | \n", "58.129933 | \n", "7.490295 | \n", "6.290708 | \n", "low | \n", "sandy | \n", "38.141026 | \n", "10.108229 | \n", "good | \n", "soybean | \n", "3.652293 | \n", "vegetative | \n", "9.540000 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 9995 | \n", "36.441400 | \n", "82.622318 | \n", "19.045509 | \n", "8.032271 | \n", "moderate | \n", "loamy | \n", "31.747844 | \n", "26.106453 | \n", "good | \n", "maize | \n", "15.084630 | \n", "seedling | \n", "15.641018 | \n", "
| 9996 | \n", "37.437721 | \n", "32.808837 | \n", "14.956484 | \n", "8.116215 | \n", "low | \n", "clay | \n", "47.597710 | \n", "28.731312 | \n", "poor | \n", "maize | \n", "4.992290 | \n", "vegetative | \n", "10.341907 | \n", "
| 9997 | \n", "38.667698 | \n", "48.221908 | \n", "0.389117 | \n", "4.156555 | \n", "moderate | \n", "clay | \n", "46.441333 | \n", "29.085087 | \n", "poor | \n", "wheat | \n", "13.740037 | \n", "vegetative | \n", "18.723048 | \n", "
| 9998 | \n", "24.937200 | \n", "56.599200 | \n", "8.020097 | \n", "5.474558 | \n", "moderate | \n", "clay | \n", "14.020896 | \n", "16.481613 | \n", "moderate | \n", "wheat | \n", "3.225509 | \n", "seedling | \n", "6.158259 | \n", "
| 9999 | \n", "20.428510 | \n", "40.335889 | \n", "5.147960 | \n", "5.899390 | \n", "high | \n", "clay | \n", "9.463352 | \n", "57.364348 | \n", "good | \n", "rice | \n", "3.960593 | \n", "vegetative | \n", "3.657213 | \n", "
20000 rows × 13 columns
\n", "| crop_type | \n", "cotton | \n", "maize | \n", "rice | \n", "soybean | \n", "wheat | \n", "
|---|---|---|---|---|---|
| soil_type | \n", "\n", " | \n", " | \n", " | \n", " | \n", " |
| clay | \n", "408 | \n", "1233 | \n", "1638 | \n", "418 | \n", "1293 | \n", "
| loamy | \n", "389 | \n", "1546 | \n", "2085 | \n", "388 | \n", "1619 | \n", "
| peaty | \n", "381 | \n", "410 | \n", "381 | \n", "401 | \n", "397 | \n", "
| sandy | \n", "396 | \n", "1289 | \n", "1512 | \n", "445 | \n", "1327 | \n", "
| silty | \n", "445 | \n", "416 | \n", "372 | \n", "409 | \n", "402 | \n", "
| \n", " | temperature | \n", "humidity | \n", "wind_speed | \n", "evapotranspiration | \n", "rainfall_pattern | \n", "soil_type | \n", "soil_moisture_levels | \n", "water_retention_capacity | \n", "drainage_properties | \n", "crop_type | \n", "crop_water_requirement | \n", "growth_stage | \n", "water_requirement | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "24.363503 | \n", "49.891265 | \n", "11.084976 | \n", "6.743301 | \n", "moderate | \n", "sandy | \n", "19.897240 | \n", "35.673364 | \n", "good | \n", "wheat | \n", "11.656577 | \n", "vegetative | \n", "17.800000 | \n", "
| 1 | \n", "38.767858 | \n", "46.632968 | \n", "3.175424 | \n", "5.133632 | \n", "low | \n", "silty | \n", "19.440264 | \n", "46.812501 | \n", "poor | \n", "rice | \n", "5.141654 | \n", "fruiting | \n", "10.580000 | \n", "
| 2 | \n", "33.299849 | \n", "34.092313 | \n", "5.526276 | \n", "9.680487 | \n", "low | \n", "clay | \n", "30.805983 | \n", "43.495237 | \n", "good | \n", "rice | \n", "5.427771 | \n", "flowering | \n", "16.740000 | \n", "
| 3 | \n", "29.966462 | \n", "68.581334 | \n", "10.117569 | \n", "2.970806 | \n", "low | \n", "clay | \n", "5.105964 | \n", "44.601767 | \n", "good | \n", "rice | \n", "2.668952 | \n", "seedling | \n", "4.760000 | \n", "
| 4 | \n", "18.900466 | \n", "58.129933 | \n", "7.490295 | \n", "6.290708 | \n", "low | \n", "sandy | \n", "38.141026 | \n", "10.108229 | \n", "good | \n", "soybean | \n", "3.652293 | \n", "vegetative | \n", "9.540000 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 9945 | \n", "21.337525 | \n", "62.197254 | \n", "2.344412 | \n", "4.631634 | \n", "low | \n", "sandy | \n", "17.896590 | \n", "44.737860 | \n", "moderate | \n", "rice | \n", "9.162647 | \n", "seedling | \n", "13.950691 | \n", "
| 9946 | \n", "23.272177 | \n", "46.771673 | \n", "2.904303 | \n", "3.088485 | \n", "moderate | \n", "sandy | \n", "37.309088 | \n", "20.675634 | \n", "moderate | \n", "rice | \n", "19.589935 | \n", "reproductive | \n", "24.287477 | \n", "
| 9947 | \n", "21.744901 | \n", "39.783952 | \n", "1.656181 | \n", "8.191589 | \n", "low | \n", "loamy | \n", "37.343293 | \n", "27.072254 | \n", "moderate | \n", "wheat | \n", "8.793199 | \n", "reproductive | \n", "10.117127 | \n", "
| 9948 | \n", "27.785910 | \n", "58.924869 | \n", "18.705377 | \n", "9.882006 | \n", "moderate | \n", "loamy | \n", "7.039639 | \n", "22.525524 | \n", "poor | \n", "rice | \n", "10.566823 | \n", "reproductive | \n", "12.651426 | \n", "
| 9949 | \n", "26.003711 | \n", "57.810094 | \n", "9.503248 | \n", "6.371027 | \n", "high | \n", "sandy | \n", "31.465744 | \n", "58.007976 | \n", "moderate | \n", "maize | \n", "6.606401 | \n", "vegetative | \n", "11.557175 | \n", "
19950 rows × 13 columns
\n", "| \n", " | temperature | \n", "humidity | \n", "wind_speed | \n", "evapotranspiration | \n", "rainfall_pattern | \n", "soil_type | \n", "soil_moisture_levels | \n", "water_retention_capacity | \n", "drainage_properties | \n", "crop_type | \n", "crop_water_requirement | \n", "growth_stage | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "24.363503 | \n", "49.891265 | \n", "11.084976 | \n", "6.743301 | \n", "2 | \n", "3 | \n", "19.897240 | \n", "35.673364 | \n", "0 | \n", "4 | \n", "11.656577 | \n", "5 | \n", "
| 1 | \n", "38.767858 | \n", "46.632968 | \n", "3.175424 | \n", "5.133632 | \n", "1 | \n", "4 | \n", "19.440264 | \n", "46.812501 | \n", "2 | \n", "2 | \n", "5.141654 | \n", "1 | \n", "
| 2 | \n", "33.299849 | \n", "34.092313 | \n", "5.526276 | \n", "9.680487 | \n", "1 | \n", "0 | \n", "30.805983 | \n", "43.495237 | \n", "0 | \n", "2 | \n", "5.427771 | \n", "0 | \n", "
| 3 | \n", "29.966462 | \n", "68.581334 | \n", "10.117569 | \n", "2.970806 | \n", "1 | \n", "0 | \n", "5.105964 | \n", "44.601767 | \n", "0 | \n", "2 | \n", "2.668952 | \n", "4 | \n", "
| 4 | \n", "18.900466 | \n", "58.129933 | \n", "7.490295 | \n", "6.290708 | \n", "1 | \n", "3 | \n", "38.141026 | \n", "10.108229 | \n", "0 | \n", "3 | \n", "3.652293 | \n", "5 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 9945 | \n", "21.337525 | \n", "62.197254 | \n", "2.344412 | \n", "4.631634 | \n", "1 | \n", "3 | \n", "17.896590 | \n", "44.737860 | \n", "1 | \n", "2 | \n", "9.162647 | \n", "4 | \n", "
| 9946 | \n", "23.272177 | \n", "46.771673 | \n", "2.904303 | \n", "3.088485 | \n", "2 | \n", "3 | \n", "37.309088 | \n", "20.675634 | \n", "1 | \n", "2 | \n", "19.589935 | \n", "3 | \n", "
| 9947 | \n", "21.744901 | \n", "39.783952 | \n", "1.656181 | \n", "8.191589 | \n", "1 | \n", "1 | \n", "37.343293 | \n", "27.072254 | \n", "1 | \n", "4 | \n", "8.793199 | \n", "3 | \n", "
| 9948 | \n", "27.785910 | \n", "58.924869 | \n", "18.705377 | \n", "9.882006 | \n", "2 | \n", "1 | \n", "7.039639 | \n", "22.525524 | \n", "2 | \n", "2 | \n", "10.566823 | \n", "3 | \n", "
| 9949 | \n", "26.003711 | \n", "57.810094 | \n", "9.503248 | \n", "6.371027 | \n", "0 | \n", "3 | \n", "31.465744 | \n", "58.007976 | \n", "1 | \n", "1 | \n", "6.606401 | \n", "5 | \n", "
19950 rows × 12 columns
\n", "| \n", " | temperature | \n", "humidity | \n", "wind_speed | \n", "evapotranspiration | \n", "rainfall_pattern | \n", "soil_type | \n", "soil_moisture_levels | \n", "water_retention_capacity | \n", "drainage_properties | \n", "crop_type | \n", "crop_water_requirement | \n", "growth_stage | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 5894 | \n", "26.598407 | \n", "42.149641 | \n", "0.695710 | \n", "5.608873 | \n", "0 | \n", "2 | \n", "15.138744 | \n", "25.487128 | \n", "1 | \n", "1 | \n", "2.691879 | \n", "0 | \n", "
| 3728 | \n", "19.069775 | \n", "35.054734 | \n", "5.761526 | \n", "7.116713 | \n", "2 | \n", "4 | \n", "26.096311 | \n", "24.745144 | \n", "0 | \n", "0 | \n", "3.429500 | \n", "0 | \n", "
| 8958 | \n", "30.229885 | \n", "51.106921 | \n", "2.499416 | \n", "6.382200 | \n", "2 | \n", "1 | \n", "32.859179 | \n", "49.931009 | \n", "0 | \n", "4 | \n", "11.339668 | \n", "4 | \n", "
| 7671 | \n", "29.033896 | \n", "76.898183 | \n", "12.474345 | \n", "1.979009 | \n", "1 | \n", "0 | \n", "31.801616 | \n", "43.191603 | \n", "0 | \n", "4 | \n", "9.009872 | \n", "5 | \n", "
| 5999 | \n", "18.734541 | \n", "92.398151 | \n", "11.483827 | \n", "6.459768 | \n", "2 | \n", "1 | \n", "37.455377 | \n", "24.536591 | \n", "2 | \n", "0 | \n", "8.775372 | \n", "0 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 1284 | \n", "23.161533 | \n", "82.783232 | \n", "5.913171 | \n", "7.638741 | \n", "0 | \n", "1 | \n", "22.048223 | \n", "37.835740 | \n", "0 | \n", "2 | \n", "12.828733 | \n", "3 | \n", "
| 1964 | \n", "29.296807 | \n", "62.887204 | \n", "16.136234 | \n", "8.060363 | \n", "0 | \n", "3 | \n", "31.350929 | \n", "28.752004 | \n", "0 | \n", "2 | \n", "5.458406 | \n", "3 | \n", "
| 5390 | \n", "18.486256 | \n", "31.967812 | \n", "3.335577 | \n", "9.486479 | \n", "2 | \n", "4 | \n", "5.619945 | \n", "44.365977 | \n", "1 | \n", "4 | \n", "7.783862 | \n", "0 | \n", "
| 860 | \n", "34.388190 | \n", "95.962995 | \n", "4.532613 | \n", "2.478128 | \n", "1 | \n", "1 | \n", "18.492764 | \n", "14.965406 | \n", "1 | \n", "1 | \n", "10.760131 | \n", "1 | \n", "
| 5795 | \n", "34.877757 | \n", "42.627733 | \n", "6.945767 | \n", "7.173486 | \n", "2 | \n", "0 | \n", "10.330274 | \n", "55.375904 | \n", "0 | \n", "2 | \n", "15.078790 | \n", "5 | \n", "
16000 rows × 12 columns
\n", "GridSearchCV(cv=5, estimator=LinearRegression(),\n",
" param_grid={'copy_X': [True, False],\n",
" 'fit_intercept': [True, False]},\n",
" scoring='neg_mean_squared_error', verbose=1)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. GridSearchCV(cv=5, estimator=LinearRegression(),\n",
" param_grid={'copy_X': [True, False],\n",
" 'fit_intercept': [True, False]},\n",
" scoring='neg_mean_squared_error', verbose=1)LinearRegression()
LinearRegression()