{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "564dfa7f-55ae-423a-ae59-22ac4f00364f", "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "from sklearn.model_selection import StratifiedShuffleSplit, cross_val_score, train_test_split\n", "from sklearn.ensemble import RandomForestClassifier\n", "from sklearn.preprocessing import LabelEncoder, MinMaxScaler\n", "from sklearn.metrics import classification_report, confusion_matrix\n", "import numpy as np\n", "import seaborn as sns\n", "import matplotlib.pyplot as plt\n", "import pickle\n", "import os\n", "import subprocess\n", "np.random.seed(42)" ] }, { "cell_type": "code", "execution_count": 2, "id": "b0867074-62b1-4bff-9188-0c6e73f814d0", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "CSV Loaded, Dataset shape: (154, 6)\n" ] } ], "source": [ "# Load the data\n", "df = pd.read_csv(\"csv/ems_data.csv\")\n", "print(\"CSV Loaded, Dataset shape:\", df.shape)" ] }, { "cell_type": "code", "execution_count": 3, "id": "0e2ebde8-90f1-483a-a3cb-4119878459d2", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | species | \n", "emsConcentration | \n", "soakDuration | \n", "lowestTemp | \n", "highestTemp | \n", "result | \n", "
---|---|---|---|---|---|---|
0 | \n", "Cotton - TM-1 | \n", "1.50 | \n", "180 | \n", "20.0 | \n", "32.0 | \n", "1 | \n", "
1 | \n", "Hemp - Lembang A | \n", "0.25 | \n", "360 | \n", "25.0 | \n", "30.0 | \n", "0 | \n", "
2 | \n", "Cotton - TM-1 | \n", "3.50 | \n", "360 | \n", "20.0 | \n", "32.0 | \n", "0 | \n", "
3 | \n", "Hyoscyamus niger - Black Henbane | \n", "0.02 | \n", "60 | \n", "25.0 | \n", "28.0 | \n", "1 | \n", "
4 | \n", "Sunflower - Helianthus annuus (BBS-1) | \n", "1.00 | \n", "480 | \n", "22.0 | \n", "25.0 | \n", "0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
149 | \n", "Maize - Zea mays (B73) | \n", "1.20 | \n", "720 | \n", "25.0 | \n", "30.0 | \n", "0 | \n", "
150 | \n", "Hyoscyamus niger - Black Henbane | \n", "0.09 | \n", "60 | \n", "25.0 | \n", "28.0 | \n", "0 | \n", "
151 | \n", "Hemp - Kumamoto | \n", "0.25 | \n", "360 | \n", "25.0 | \n", "30.0 | \n", "0 | \n", "
152 | \n", "Chinese cabbage - Brassica rapa ssp. pekinensis | \n", "0.30 | \n", "480 | \n", "4.0 | \n", "20.0 | \n", "0 | \n", "
153 | \n", "Marigold - Tagetes erecta | \n", "0.08 | \n", "360 | \n", "25.0 | \n", "30.0 | \n", "0 | \n", "
154 rows × 6 columns
\n", "\n", " | species | \n", "sum | \n", "
---|---|---|
0 | \n", "Chinese cabbage - Brassica rapa ssp. pekinensis | \n", "5 | \n", "
1 | \n", "Cotton - Luyanmian21 | \n", "8 | \n", "
2 | \n", "Cotton - TM-1 | \n", "8 | \n", "
3 | \n", "Fenugreek - Trigonella foenum-graecum | \n", "4 | \n", "
4 | \n", "Fodder Barley - Hordeum vulgare | \n", "25 | \n", "
5 | \n", "Hemp - Bandung A | \n", "8 | \n", "
6 | \n", "Hemp - Indochina | \n", "8 | \n", "
7 | \n", "Hemp - Kumamoto | \n", "8 | \n", "
8 | \n", "Hemp - Lembang A | \n", "8 | \n", "
9 | \n", "Hemp - Seiki Selskin | \n", "8 | \n", "
10 | \n", "Hyoscyamus niger - Black Henbane | \n", "10 | \n", "
11 | \n", "Jasmine - Jasminum grandiflorum | \n", "4 | \n", "
12 | \n", "Maize - Zea mays (B73) | \n", "4 | \n", "
13 | \n", "Marigold - Tagetes erecta | \n", "9 | \n", "
14 | \n", "Marigold - Tagetes patula | \n", "13 | \n", "
15 | \n", "Sesame - Tilottama | \n", "9 | \n", "
16 | \n", "Sunflower - Helianthus annuus (BBS-1) | \n", "6 | \n", "
17 | \n", "Watermelon - G42 | \n", "9 | \n", "
\n", " | soakDuration | \n", "lowestTemp | \n", "highestTemp | \n", "
---|---|---|---|
0 | \n", "180 | \n", "20.0 | \n", "32.0 | \n", "
1 | \n", "360 | \n", "25.0 | \n", "30.0 | \n", "
2 | \n", "360 | \n", "20.0 | \n", "32.0 | \n", "
3 | \n", "60 | \n", "25.0 | \n", "28.0 | \n", "
4 | \n", "480 | \n", "22.0 | \n", "25.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "
149 | \n", "720 | \n", "25.0 | \n", "30.0 | \n", "
150 | \n", "60 | \n", "25.0 | \n", "28.0 | \n", "
151 | \n", "360 | \n", "25.0 | \n", "30.0 | \n", "
152 | \n", "480 | \n", "4.0 | \n", "20.0 | \n", "
153 | \n", "360 | \n", "25.0 | \n", "30.0 | \n", "
154 rows × 3 columns
\n", "\n", " | soakDuration | \n", "lowestTemp | \n", "highestTemp | \n", "
---|---|---|---|
0 | \n", "0.060543 | \n", "0.68 | \n", "1.000000 | \n", "
1 | \n", "0.123173 | \n", "0.88 | \n", "0.857143 | \n", "
2 | \n", "0.123173 | \n", "0.68 | \n", "1.000000 | \n", "
3 | \n", "0.018789 | \n", "0.88 | \n", "0.714286 | \n", "
4 | \n", "0.164927 | \n", "0.76 | \n", "0.500000 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "
149 | \n", "0.248434 | \n", "0.88 | \n", "0.857143 | \n", "
150 | \n", "0.018789 | \n", "0.88 | \n", "0.714286 | \n", "
151 | \n", "0.123173 | \n", "0.88 | \n", "0.857143 | \n", "
152 | \n", "0.164927 | \n", "0.04 | \n", "0.142857 | \n", "
153 | \n", "0.123173 | \n", "0.88 | \n", "0.857143 | \n", "
154 rows × 3 columns
\n", "\n", " | species | \n", "emsConcentration | \n", "soakDuration | \n", "lowestTemp | \n", "highestTemp | \n", "result | \n", "
---|---|---|---|---|---|---|
0 | \n", "2 | \n", "1.50 | \n", "0.060543 | \n", "0.68 | \n", "1.000000 | \n", "1 | \n", "
1 | \n", "8 | \n", "0.25 | \n", "0.123173 | \n", "0.88 | \n", "0.857143 | \n", "0 | \n", "
2 | \n", "2 | \n", "3.50 | \n", "0.123173 | \n", "0.68 | \n", "1.000000 | \n", "0 | \n", "
3 | \n", "10 | \n", "0.02 | \n", "0.018789 | \n", "0.88 | \n", "0.714286 | \n", "1 | \n", "
4 | \n", "16 | \n", "1.00 | \n", "0.164927 | \n", "0.76 | \n", "0.500000 | \n", "0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
149 | \n", "12 | \n", "1.20 | \n", "0.248434 | \n", "0.88 | \n", "0.857143 | \n", "0 | \n", "
150 | \n", "10 | \n", "0.09 | \n", "0.018789 | \n", "0.88 | \n", "0.714286 | \n", "0 | \n", "
151 | \n", "7 | \n", "0.25 | \n", "0.123173 | \n", "0.88 | \n", "0.857143 | \n", "0 | \n", "
152 | \n", "0 | \n", "0.30 | \n", "0.164927 | \n", "0.04 | \n", "0.142857 | \n", "0 | \n", "
153 | \n", "13 | \n", "0.08 | \n", "0.123173 | \n", "0.88 | \n", "0.857143 | \n", "0 | \n", "
154 rows × 6 columns
\n", "RandomForestClassifier(random_state=42)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
RandomForestClassifier(random_state=42)