diff --git a/solution.ipynb b/solution.ipynb new file mode 100644 index 0000000..50d2569 --- /dev/null +++ b/solution.ipynb @@ -0,0 +1,354 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 2, + "id": "743289bd", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
countryfood_categoryconsumptionco2_emission
1Argentinapork10.5137.20
2Argentinapoultry38.6641.53
3Argentinabeef55.481712.00
4Argentinalamb_goat1.5654.63
5Argentinafish4.366.96
\n", + "
" + ], + "text/plain": [ + " country food_category consumption co2_emission\n", + "1 Argentina pork 10.51 37.20\n", + "2 Argentina poultry 38.66 41.53\n", + "3 Argentina beef 55.48 1712.00\n", + "4 Argentina lamb_goat 1.56 54.63\n", + "5 Argentina fish 4.36 6.96" + ] + }, + "execution_count": 2, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Imports, plot defaults and data loading for the food-consumption exercises.\n", + "import numpy as np\n", + "import pandas as pd\n", + "import matplotlib.pyplot as plt\n", + "\n", + "# Default size for every figure drawn in this notebook.\n", + "plt.rcParams['figure.figsize'] = (10, 8)\n", + "\n", + "# index_col=0: the first CSV column becomes the row index.\n", + "food_consumption = pd.read_csv('./food_consumption.csv', index_col=0)\n", + "food_consumption.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "7859490a", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + " country food_category consumption co2_emission\n", + "397 Belgium pork 38.65 136.80\n", + "398 Belgium poultry 12.20 13.11\n", + "399 Belgium beef 15.63 482.31\n", + "400 Belgium lamb_goat 1.32 46.23\n", + "401 Belgium fish 18.97 30.29\n", + " country food_category consumption co2_emission\n", + "56 USA pork 27.64 97.83\n", + "57 USA poultry 50.01 53.72\n", + "58 USA beef 36.24 1118.29\n", + "59 USA lamb_goat 0.43 15.06\n", + "60 USA fish 12.35 19.72\n" + ] + } + ], + "source": [ + "# Filter for Belgium\n", + "# (print() is used because two previews are shown from this one cell;\n", + "# a bare expression is only displayed when it is the cell's last statement.)\n", + "be_consumption = food_consumption[food_consumption['country'] == 'Belgium']\n", + "print(be_consumption.head())\n", + "# Filter for USA\n", + "usa_consumption = food_consumption[food_consumption['country'] == 'USA']\n", + "print(usa_consumption.head())\n" + ] + }, + { + "cell_type": "code", + "execution_count": 42, + "id": "bc426426", + "metadata": {}, + "outputs": [], + "source": [ + "# be_consumption / usa_consumption are already DataFrames; these wrappers only\n", + "# provide the df_* names that the following cell reads.\n", + "df_be_consumption = pd.DataFrame(be_consumption)\n", + "df_usa_consumption = pd.DataFrame(usa_consumption)" + ] + }, + { + "cell_type": "code", + "execution_count": 103, + "id": "620d99bb", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + 
"output_type": "stream", + "text": [ + "42.13272727272727\n", + "12.59\n", + "44.650000000000006\n", + "14.58\n" + ] + } + ], + "source": [ + "# Q-1 / Q-2) Mean and median consumption, first for Belgium, then for the USA.\n", + "# Each country prints two lines: its mean followed by its median.\n", + "for country_frame in (df_be_consumption, df_usa_consumption):\n", + "    print(country_frame['consumption'].mean())\n", + "    print(country_frame['consumption'].median())\n" + ] + }, + { + "cell_type": "code", + "execution_count": 104, + "id": "10604251", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
meanmedian
country
Belgium42.13272712.59
USA44.65000014.58
\n", + "
" + ], + "text/plain": [ + " mean median\n", + "country \n", + "Belgium 42.132727 12.59\n", + "USA 44.650000 14.58" + ] + }, + "execution_count": 104, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Q-3) Mean and median consumption per country, restricted to Belgium and the USA\n", + "\n", + "# Boolean mask: True for rows whose country is one of the two of interest.\n", + "is_be_or_usa = food_consumption['country'].isin(['Belgium', 'USA'])\n", + "be_and_usa = food_consumption[is_be_or_usa]\n", + "df_be_and_usa = pd.DataFrame(be_and_usa)\n", + "df_groupby_country = df_be_and_usa.groupby('country')\n", + "# Last expression of the cell, so the summary table is displayed.\n", + "df_groupby_country['consumption'].agg(['mean', 'median'])\n" + ] + }, + { + "cell_type": "code", + "execution_count": 114, + "id": "094384b4", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 114, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Q-4) Plot the histogram of co2_emission for rice\n", + "\n", + "rice_consumption = food_consumption[food_consumption['food_category'] == 'rice']\n", + "rice_consumption['co2_emission'].plot(kind='hist')\n" + ] + }, + { + "cell_type": "code", + "execution_count": 115, + "id": "8a1b5e41", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "mean 37.591615\n", + "median 15.200000\n", + "Name: co2_emission, dtype: float64" + ] + }, + "execution_count": 115, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Q-5) Calculate mean and median of co2_emission with .agg()\n", + "# Uses rice_consumption as filtered in the Q-4 cell (food_category == 'rice').\n", + "rice_consumption['co2_emission'].agg(['mean', 'median'])\n" + ] + }, + { + "cell_type": "code", + "execution_count": 134, + "id": "1ac143be", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[ 0. 3.54 11.026 25.59 99.978 1712. ]\n" + ] + } + ], + "source": [ + "# Q-6) Calculate the quintiles of co2_emission\n", + "co2_emission = food_consumption['co2_emission']\n", + "# Six evenly spaced probabilities from 0 to 1: the five-way split boundaries.\n", + "quintile_probs = np.linspace(0, 1, 6)\n", + "print(np.quantile(co2_emission, quintile_probs))\n" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.7" + }, + "vscode": { + "interpreter": { + "hash": "25806a9c2e3dc763ae4258cd2f35b673ccac1f110c3a8dc1fe65620c13ebb849" + } + } + }, + "nbformat": 4, + "nbformat_minor": 5 +}