{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Pesticide: Summary of the data\n", "\n", "> Summary plots and tables \n", "\n" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Imports\n", "\n", "This section imports the libraries used in the rest of the notebook, including those from `Pesticide` that handle the data.\n", "\n", "The first cell imports general libraries and sets the folder path so that `Pesticide` can be imported, which is done in the second cell." ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "tags": [ "hide-cell" ] }, "outputs": [], "source": [ "import pandas as pd\n", "from pandasql import sqldf\n", "import numpy as np\n", "\n", "import seaborn as sns\n", "import matplotlib.pyplot as plt\n", "\n", "import os\n", "from pathlib import Path\n", "import sys\n", "\n", "# this sets the path for Pesticide so we can import the functions\n", "# N.B. PesticideDocs and Pesticide need to be in the same folder\n", "# tried to load from github using https://pypi.org/project/httpimport/ but \n", "# couldn't get it to work due to modular structure i.e. 
how to access src/plotfuncts/plot1.py greatplot\n", "\n", "# Build the sibling 'Pesticide' folder path with pathlib so the separator is\n", "# correct on every OS (a hard-coded backslash separator only works on Windows).\n", "# Kept as a str because sys.path entries and os.path.join below expect strings.\n", "module_path = str(Path.cwd().parent / 'Pesticide')\n", "\n", "# Guard the insert so re-running this cell does not stack duplicate entries.\n", "if module_path not in sys.path:\n", "    sys.path.insert(0, module_path)" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "tags": [ "hide-cell" ] }, "outputs": [], "source": [ "# NOTE(review): wildcard imports hide where names such as getAllFilesThenSave\n", "# come from; switch to explicit imports once the required names are confirmed.\n", "from src.data_loading.loads_from_url import *\n", "from src.data_cleaning.modify_dfs import *\n", "from src.data_visualisation.plot_funcs import *\n", "from src.utils.utils import *\n", "\n", "# The data folder lives inside the Pesticide checkout located above.\n", "cwd = module_path\n", "\n", "folder_path = os.path.join(cwd, 'data')\n", "\n", "# Flip to True to run getAllFilesThenSave on folder_path (presumably fetches the\n", "# source files and saves them as CSVs -- confirm against the Pesticide package).\n", "create_csvs = False\n", "if create_csvs:\n", "    getAllFilesThenSave(folder_path)\n" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Summaries of the data\n", "\n", "The data is loaded then rows near the beginning and end are shown below\n", "\n", "After this `df.describe()` and `df.info()` are used to get more info on the dataframe." ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | sample_id | \n", "date_of_sampling | \n", "description | \n", "country_of_origin | \n", "retail_outlet | \n", "address | \n", "brand_name | \n", "packer_/_manufacturer_/_importer | \n", "pesticide_residues_found_in_mg/kg_(mrl) | \n", "product | \n", "address_postcode | \n", "packer__postcode | \n", "chem_name | \n", "amount_detected | \n", "mrl | \n", "amount_pc | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1958/2016 | \n", "2016-08-08 | \n", "Bramley Apples | \n", "UK | \n", "Asda | \n", "Creechbarrow Road, Taunton TA1 2AN | \n", "Asda | \n", "Asda Stores Ltd Leeds, UK LS11 5AD | \n", "boscalid 0.03 (MRL = 2) | \n", "Apple | \n", "TA1 2AN | \n", "LS11 5AD | \n", "boscalid | \n", "0.03 | \n", "2.0 | \n", "0.015000 | \n", "
1 | \n", "1958/2016 | \n", "2016-08-08 | \n", "Bramley Apples | \n", "UK | \n", "Asda | \n", "Creechbarrow Road, Taunton TA1 2AN | \n", "Asda | \n", "Asda Stores Ltd Leeds, UK LS11 5AD | \n", "pyraclostrobin 0.01 (MRL = 0.5) | \n", "Apple | \n", "TA1 2AN | \n", "LS11 5AD | \n", "pyraclostrobin | \n", "0.01 | \n", "0.5 | \n", "0.020000 | \n", "
2 | \n", "0230/2016 | \n", "2016-08-08 | \n", "Bramley Apples | \n", "UK | \n", "Co-op | \n", "Northgate, Louth LN11 0LT | \n", "Co-op | \n", "Co-operative Group Ltd Manchester M60 0AG | \n", "boscalid 0.05 (MRL = 2) | \n", "Apple | \n", "LN11 0LT | \n", "M60 0AG | \n", "boscalid | \n", "0.05 | \n", "2.0 | \n", "0.025000 | \n", "
3 | \n", "0230/2016 | \n", "2016-08-08 | \n", "Bramley Apples | \n", "UK | \n", "Co-op | \n", "Northgate, Louth LN11 0LT | \n", "Co-op | \n", "Co-operative Group Ltd Manchester M60 0AG | \n", "flonicamid (sum) 0.02 (MRL = 0.2) | \n", "Apple | \n", "LN11 0LT | \n", "M60 0AG | \n", "flonicamid (sum) | \n", "0.02 | \n", "0.2 | \n", "0.100000 | \n", "
4 | \n", "0230/2016 | \n", "2016-08-08 | \n", "Bramley Apples | \n", "UK | \n", "Co-op | \n", "Northgate, Louth LN11 0LT | \n", "Co-op | \n", "Co-operative Group Ltd Manchester M60 0AG | \n", "pyraclostrobin 0.03 (MRL = 0.5) | \n", "Apple | \n", "LN11 0LT | \n", "M60 0AG | \n", "pyraclostrobin | \n", "0.03 | \n", "0.5 | \n", "0.060000 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
23947 | \n", "0792/2022 | \n", "2022-09-08 | \n", "Marfona Unwashed Potatoes | \n", "UK | \n", "Stoke Fruit Farm | \n", "77 Havant Road, Hayling Island, Hampshire PO11... | \n", "None stated | \n", "Stoke Fruit Farm 77 Havant Road, Hayling Islan... | \n", "maleic hydrazide 7.7 (MRL = 60) | \n", "Potatoes_(GB) | \n", "PO11 0PT | \n", "PO11 0PT | \n", "maleic hydrazide | \n", "7.70 | \n", "60.0 | \n", "0.128333 | \n", "
23948 | \n", "0765/2022 | \n", "2022-09-14 | \n", "Sagitta Potatoes | \n", "UK | \n", "Total Produce Ltd. | \n", "Callywith Gate Industrial Estate, Launceston R... | \n", "None stated | \n", "CS Duston & Son Colwith Farm, Par, Cornwall | \n", "maleic hydrazide 17 (MRL = 60) | \n", "Potatoes_(GB) | \n", "PL31 2RQ | \n", "0 | \n", "maleic hydrazide | \n", "17.00 | \n", "60.0 | \n", "0.283333 | \n", "
23949 | \n", "0938/2022 | \n", "2022-09-01 | \n", "Marfona Ware Potatoes | \n", "UK | \n", "Tulipland Potatoes Ltd | \n", "Fengate, Moulton Chapel PE12 0XL | \n", "None stated | \n", "Garden of Elveden | \n", "NaN | \n", "Potatoes_(GB) | \n", "PE12 0XL | \n", "0 | \n", "0 | \n", "0.00 | \n", "0.0 | \n", "0.000000 | \n", "
23950 | \n", "0833/2022 | \n", "2022-08-31 | \n", "Lady Rosetta | \n", "England (UK) | \n", "Tyrrells Crisps | \n", "Tyrrells Court, Stretford Bridge, Leominster H... | \n", "None stated | \n", "KP Crisps | \n", "NaN | \n", "Potatoes_(GB) | \n", "HR6 9DQ | \n", "0 | \n", "0 | \n", "0.00 | \n", "0.0 | \n", "0.000000 | \n", "
23951 | \n", "0833/2022 | \n", "2022-08-31 | \n", "Lady Rosetta | \n", "England (UK) | \n", "Tyrrells Crisps | \n", "Tyrrells Court, Stretford Bridge, Leominster H... | \n", "None stated | \n", "KP Crisps | \n", "NaN | \n", "Potatoes_(GB) | \n", "HR6 9DQ | \n", "0 | \n", "0 | \n", "0.00 | \n", "0.0 | \n", "0.000000 | \n", "
23952 rows × 16 columns
\n", "\n", " | sample_id | \n", "date_of_sampling | \n", "description | \n", "country_of_origin | \n", "retail_outlet | \n", "address | \n", "brand_name | \n", "packer_/_manufacturer_/_importer | \n", "pesticide_residues_found_in_mg/kg_(mrl) | \n", "product | \n", "address_postcode | \n", "packer__postcode | \n", "chem_name | \n", "amount_detected | \n", "mrl | \n", "amount_pc | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
count | \n", "23952 | \n", "23952 | \n", "23952 | \n", "23952 | \n", "23898 | \n", "23898 | \n", "23898 | \n", "23896 | \n", "16576 | \n", "23952 | \n", "23952 | \n", "23952 | \n", "23952 | \n", "23952.000000 | \n", "23952.000000 | \n", "23952.000000 | \n", "
unique | \n", "10732 | \n", "NaN | \n", "4254 | \n", "121 | \n", "1140 | \n", "4380 | \n", "831 | \n", "3341 | \n", "4260 | \n", "131 | \n", "1638 | \n", "821 | \n", "186 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
top | \n", "2430/2018 | \n", "NaN | \n", "Conference Pears | \n", "UK | \n", "Tesco | \n", "Albert Row, Oystermouth Road, Swansea SA1 3RA | \n", "None stated | \n", "Tesco Stores Ltd Welwyn Garden City AL7 1GA | \n", "chlormequat 0.03 (MRL = 0.6) | \n", "Grapes | \n", "UB2 5XJ | \n", "0 | \n", "0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
freq | \n", "42 | \n", "NaN | \n", "614 | \n", "8006 | \n", "3549 | \n", "140 | \n", "6617 | \n", "2086 | \n", "88 | \n", "1667 | \n", "343 | \n", "9546 | \n", "8831 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
mean | \n", "NaN | \n", "2017-10-15 21:31:26.573146112 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.231456 | \n", "2.694487 | \n", "0.213602 | \n", "
min | \n", "NaN | \n", "2016-01-18 00:00:00 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "
25% | \n", "NaN | \n", "2016-11-30 00:00:00 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "
50% | \n", "NaN | \n", "2017-11-28 00:00:00 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.020000 | \n", "0.500000 | \n", "0.012000 | \n", "
75% | \n", "NaN | \n", "2018-07-16 00:00:00 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.080000 | \n", "3.000000 | \n", "0.066667 | \n", "
max | \n", "NaN | \n", "2022-09-21 00:00:00 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "48.000000 | \n", "182.000000 | \n", "240.000000 | \n", "
std | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "1.118951 | \n", "6.792256 | \n", "2.942220 | \n", "
\n", " | country_of_origin | \n", "amount_detected | \n", "mrl | \n", "amount_pc | \n", "number_of_tests | \n", "
---|---|---|---|---|---|
0 | \n", "UK | \n", "0.195679 | \n", "1.548986 | \n", "0.155359 | \n", "4698 | \n", "
1 | \n", "Spain | \n", "0.146144 | \n", "3.146354 | \n", "0.293926 | \n", "988 | \n", "
2 | \n", "England (UK) | \n", "0.405924 | \n", "3.488212 | \n", "0.048455 | \n", "397 | \n", "
3 | \n", "South Africa | \n", "0.324500 | \n", "3.499751 | \n", "0.098734 | \n", "376 | \n", "
4 | \n", "Italy | \n", "0.124684 | \n", "1.740408 | \n", "0.625776 | \n", "364 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
116 | \n", "St Lucia | \n", "1.500000 | \n", "2.000000 | \n", "0.750000 | \n", "1 | \n", "
117 | \n", "Macedonia | \n", "0.132857 | \n", "2.571429 | \n", "0.051429 | \n", "1 | \n", "
118 | \n", "South West Atlantic | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "1 | \n", "
119 | \n", "Russia | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "1 | \n", "
120 | \n", "Aegean Sea | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "1 | \n", "
121 rows × 5 columns
\n", "\n", " | sample_id | \n", "date_of_sampling | \n", "description | \n", "country_of_origin | \n", "retail_outlet | \n", "address | \n", "brand_name | \n", "packer_/_manufacturer_/_importer | \n", "pesticide_residues_found_in_mg/kg_(mrl) | \n", "product | \n", "address_postcode | \n", "packer__postcode | \n", "chem_name | \n", "amount_detected | \n", "mrl | \n", "amount_pc | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1958/2016 | \n", "2016-08-08 | \n", "Bramley Apples | \n", "UK | \n", "Asda | \n", "Creechbarrow Road, Taunton TA1 2AN | \n", "Asda | \n", "Asda Stores Ltd Leeds, UK LS11 5AD | \n", "boscalid 0.03 (MRL = 2) | \n", "Apple | \n", "TA1 2AN | \n", "LS11 5AD | \n", "boscalid | \n", "0.03 | \n", "2.0 | \n", "0.015000 | \n", "
1 | \n", "1958/2016 | \n", "2016-08-08 | \n", "Bramley Apples | \n", "UK | \n", "Asda | \n", "Creechbarrow Road, Taunton TA1 2AN | \n", "Asda | \n", "Asda Stores Ltd Leeds, UK LS11 5AD | \n", "pyraclostrobin 0.01 (MRL = 0.5) | \n", "Apple | \n", "TA1 2AN | \n", "LS11 5AD | \n", "pyraclostrobin | \n", "0.01 | \n", "0.5 | \n", "0.020000 | \n", "
2 | \n", "0230/2016 | \n", "2016-08-08 | \n", "Bramley Apples | \n", "UK | \n", "Co-op | \n", "Northgate, Louth LN11 0LT | \n", "Co-op | \n", "Co-operative Group Ltd Manchester M60 0AG | \n", "boscalid 0.05 (MRL = 2) | \n", "Apple | \n", "LN11 0LT | \n", "M60 0AG | \n", "boscalid | \n", "0.05 | \n", "2.0 | \n", "0.025000 | \n", "
3 | \n", "0230/2016 | \n", "2016-08-08 | \n", "Bramley Apples | \n", "UK | \n", "Co-op | \n", "Northgate, Louth LN11 0LT | \n", "Co-op | \n", "Co-operative Group Ltd Manchester M60 0AG | \n", "flonicamid (sum) 0.02 (MRL = 0.2) | \n", "Apple | \n", "LN11 0LT | \n", "M60 0AG | \n", "flonicamid (sum) | \n", "0.02 | \n", "0.2 | \n", "0.100000 | \n", "
4 | \n", "0230/2016 | \n", "2016-08-08 | \n", "Bramley Apples | \n", "UK | \n", "Co-op | \n", "Northgate, Louth LN11 0LT | \n", "Co-op | \n", "Co-operative Group Ltd Manchester M60 0AG | \n", "pyraclostrobin 0.03 (MRL = 0.5) | \n", "Apple | \n", "LN11 0LT | \n", "M60 0AG | \n", "pyraclostrobin | \n", "0.03 | \n", "0.5 | \n", "0.060000 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
23947 | \n", "0792/2022 | \n", "2022-09-08 | \n", "Marfona Unwashed Potatoes | \n", "UK | \n", "Stoke Fruit Farm | \n", "77 Havant Road, Hayling Island, Hampshire PO11... | \n", "None stated | \n", "Stoke Fruit Farm 77 Havant Road, Hayling Islan... | \n", "maleic hydrazide 7.7 (MRL = 60) | \n", "Potatoes_(GB) | \n", "PO11 0PT | \n", "PO11 0PT | \n", "maleic hydrazide | \n", "7.70 | \n", "60.0 | \n", "0.128333 | \n", "
23948 | \n", "0765/2022 | \n", "2022-09-14 | \n", "Sagitta Potatoes | \n", "UK | \n", "Total Produce Ltd. | \n", "Callywith Gate Industrial Estate, Launceston R... | \n", "None stated | \n", "CS Duston & Son Colwith Farm, Par, Cornwall | \n", "maleic hydrazide 17 (MRL = 60) | \n", "Potatoes_(GB) | \n", "PL31 2RQ | \n", "0 | \n", "maleic hydrazide | \n", "17.00 | \n", "60.0 | \n", "0.283333 | \n", "
23949 | \n", "0938/2022 | \n", "2022-09-01 | \n", "Marfona Ware Potatoes | \n", "UK | \n", "Tulipland Potatoes Ltd | \n", "Fengate, Moulton Chapel PE12 0XL | \n", "None stated | \n", "Garden of Elveden | \n", "NaN | \n", "Potatoes_(GB) | \n", "PE12 0XL | \n", "0 | \n", "0 | \n", "0.00 | \n", "0.0 | \n", "0.000000 | \n", "
23950 | \n", "0833/2022 | \n", "2022-08-31 | \n", "Lady Rosetta | \n", "England (UK) | \n", "Tyrrells Crisps | \n", "Tyrrells Court, Stretford Bridge, Leominster H... | \n", "None stated | \n", "KP Crisps | \n", "NaN | \n", "Potatoes_(GB) | \n", "HR6 9DQ | \n", "0 | \n", "0 | \n", "0.00 | \n", "0.0 | \n", "0.000000 | \n", "
23951 | \n", "0833/2022 | \n", "2022-08-31 | \n", "Lady Rosetta | \n", "England (UK) | \n", "Tyrrells Crisps | \n", "Tyrrells Court, Stretford Bridge, Leominster H... | \n", "None stated | \n", "KP Crisps | \n", "NaN | \n", "Potatoes_(GB) | \n", "HR6 9DQ | \n", "0 | \n", "0 | \n", "0.00 | \n", "0.0 | \n", "0.000000 | \n", "
23952 rows × 16 columns
\n", "