From 902b136695dfa42c3f63ebdddab96a045ae72db5 Mon Sep 17 00:00:00 2001
From: Corentin Vande Kerckhove <corentinvdk@gmail.com>
Date: Tue, 1 Nov 2022 10:13:36 +0100
Subject: [PATCH] add first exercise

---
 data-collection/exercise1.ipynb | 711 ++++++++++++++++++++++++++++++++
 1 file changed, 711 insertions(+)
 create mode 100644 data-collection/exercise1.ipynb

diff --git a/data-collection/exercise1.ipynb b/data-collection/exercise1.ipynb
new file mode 100644
index 0000000..3bcf0da
--- /dev/null
+++ b/data-collection/exercise1.ipynb
@@ -0,0 +1,711 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import requests\n",
+    "import urllib.request\n",
+    "import time\n",
+    "from bs4 import BeautifulSoup\n",
+    "import numpy as np\n",
+    "import pandas as pd\n",
+    "from urllib.request import urlopen"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "url = 'https://en.wikipedia.org/wiki/Epidemiology_of_depression'"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "html = urlopen(url)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "soup = BeautifulSoup(html, 'html.parser')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "tables = soup.find_all('table')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import re\n",
+    "def process_num(num):\n",
+    "    \"\"\"Convert formatted number text such as '1,156.30' or '1 156.30' to a float.\n",
+    "    Every character other than word characters and '.' is deleted first (so a sign is dropped too); raises ValueError if the rest is not a number.\"\"\"\n",
+    "    return float(re.sub(r'[^\\w.]', '', num))\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'1156.30'"
+      ]
+     },
+     "execution_count": 7,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "num1 = re.sub(r'[^\\w\\s.]','','1,156.30')\n",
+    "num1"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>Rank</th>\n",
+       "      <th>DALY rate</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <td>United States</td>\n",
+       "      <td>1</td>\n",
+       "      <td>1454.74</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>Nepal</td>\n",
+       "      <td>2</td>\n",
+       "      <td>1424.48</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>East Timor</td>\n",
+       "      <td>3</td>\n",
+       "      <td>1404.10</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>Bangladesh</td>\n",
+       "      <td>4</td>\n",
+       "      <td>1401.53</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>India</td>\n",
+       "      <td>5</td>\n",
+       "      <td>1400.84</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>Pakistan</td>\n",
+       "      <td>6</td>\n",
+       "      <td>1400.42</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>Brazil</td>\n",
+       "      <td>7</td>\n",
+       "      <td>1396.10</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>Maldives</td>\n",
+       "      <td>8</td>\n",
+       "      <td>1391.61</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>Bhutan</td>\n",
+       "      <td>9</td>\n",
+       "      <td>1385.53</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>Afghanistan</td>\n",
+       "      <td>10</td>\n",
+       "      <td>1385.14</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "               Rank  DALY rate\n",
+       "United States     1    1454.74\n",
+       "Nepal             2    1424.48\n",
+       "East Timor        3    1404.10\n",
+       "Bangladesh        4    1401.53\n",
+       "India             5    1400.84\n",
+       "Pakistan          6    1400.42\n",
+       "Brazil            7    1396.10\n",
+       "Maldives          8    1391.61\n",
+       "Bhutan            9    1385.53\n",
+       "Afghanistan      10    1385.14"
+      ]
+     },
+     "execution_count": 9,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Collect rank, country and DALY rate from every data row of the depression tables.\n",
+    "ranks = []\n",
+    "rates = []\n",
+    "countries = []\n",
+    "links = []\n",
+    "\n",
+    "for table in tables:\n",
+    "    for row in table.find_all('tr'):\n",
+    "        cells = row.find_all('td')\n",
+    "\n",
+    "        # All three columns are read below, so skip rows with fewer <td> cells (presumably header rows).\n",
+    "        if len(cells) < 3:\n",
+    "            continue\n",
+    "\n",
+    "        rank_cell, country_cell, rate_cell = cells[:3]\n",
+    "        anchor = country_cell.find('a')\n",
+    "        href = anchor.get('href') if anchor is not None else None\n",
+    "\n",
+    "        ranks.append(int(rank_cell.text))\n",
+    "        countries.append(country_cell.text.strip())\n",
+    "        rates.append(process_num(rate_cell.text.strip()))\n",
+    "        # Strip the leading '/' of the href so the URL has no '//'; None keeps links aligned with countries.\n",
+    "        links.append('https://en.wikipedia.org/' + href.lstrip('/') if href else None)\n",
+    "\n",
+    "df1 = pd.DataFrame(ranks, index=countries, columns=['Rank'])\n",
+    "df1['DALY rate'] = rates\n",
+    "\n",
+    "df1.head(10)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "789.14 3\n",
+      "Country: Benin, Sunshine Hours: 263.05\n",
+      "515.99 2\n",
+      "Country: Togo, Sunshine Hours: 258.0\n",
+      "710.25 3\n",
+      "Country: Ghana, Sunshine Hours: 236.75\n",
+      "866.0500000000001 4\n",
+      "Country: Cameroon, Sunshine Hours: 216.51\n",
+      "344.03999999999996 2\n",
+      "Country: Gabon, Sunshine Hours: 172.02\n",
+      "1334.54 5\n",
+      "Country: Nigeria, Sunshine Hours: 266.91\n",
+      "711.91 2\n",
+      "Country: Sudan, Sunshine Hours: 355.95\n",
+      "336.1 1\n",
+      "Country: Eritrea, Sunshine Hours: 336.1\n",
+      "641.8 2\n",
+      "Country: Burkina Faso, Sunshine Hours: 320.9\n",
+      "320.32 1\n",
+      "Country: Niger, Sunshine Hours: 320.32\n",
+      "670.6400000000001 2\n",
+      "Country: Chad, Sunshine Hours: 335.32\n",
+      "307.0 1\n",
+      "Country: Gambia, Sunshine Hours: 307.0\n",
+      "629.2 2\n",
+      "Country: Senegal, Sunshine Hours: 314.6\n",
+      "620.5999999999999 2\n",
+      "Country: Somalia, Sunshine Hours: 310.3\n",
+      "327.9 1\n",
+      "Country: Djibouti, Sunshine Hours: 327.9\n",
+      "964.0099999999999 3\n",
+      "Country: Mali, Sunshine Hours: 321.34\n",
+      "653.3 2\n",
+      "Country: Algeria, Sunshine Hours: 326.65\n",
+      "609.99 2\n",
+      "Country: Tunisia, Sunshine Hours: 305.0\n",
+      "946.64 3\n",
+      "Country: Morocco, Sunshine Hours: 315.55\n",
+      "2253.8500000000004 6\n",
+      "Country: Egypt, Sunshine Hours: 375.64\n",
+      "635.6199999999999 2\n",
+      "Country: Libya, Sunshine Hours: 317.81\n",
+      "1212.01 4\n",
+      "Country: Kenya, Sunshine Hours: 303.0\n",
+      "234.1 1\n",
+      "Country: Angola, Sunshine Hours: 234.1\n",
+      "1213.1399999999999 4\n",
+      "Country: Tanzania, Sunshine Hours: 303.28\n",
+      "556.97 2\n",
+      "Country: Ethiopia, Sunshine Hours: 278.49\n",
+      "666.5 2\n",
+      "Country: Mauritania, Sunshine Hours: 333.25\n",
+      "1884.79 6\n",
+      "Country: South Africa, Sunshine Hours: 314.13\n",
+      "1028.0 3\n",
+      "Country: Botswana, Sunshine Hours: 342.67\n",
+      "889.6400000000001 3\n",
+      "Country: Zambia, Sunshine Hours: 296.55\n",
+      "613.08 2\n",
+      "Country: Zimbabwe, Sunshine Hours: 306.54\n",
+      "838.76 3\n",
+      "Country: Malawi, Sunshine Hours: 279.59\n",
+      "1718.66 6\n",
+      "Country: Madagascar, Sunshine Hours: 286.44\n",
+      "283.8 1\n",
+      "Country: Mozambique, Sunshine Hours: 283.8\n",
+      "681.8 3\n",
+      "Country: Uganda, Sunshine Hours: 227.27\n",
+      "237.34 1\n",
+      "Country: Burundi, Sunshine Hours: 237.34\n",
+      "488.0 2\n",
+      "Country: Guinea, Sunshine Hours: 244.0\n",
+      "270.7 1\n",
+      "Country: Guinea-Bissau, Sunshine Hours: 270.7\n",
+      "309.79 2\n",
+      "Country: Equatorial Guinea, Sunshine Hours: 154.9\n",
+      "747.5 2\n",
+      "Country: Namibia, Sunshine Hours: 373.75\n",
+      "317.51 1\n",
+      "Country: Afghanistan, Sunshine Hours: 317.51\n",
+      "220.74 1\n",
+      "Country: Azerbaijan, Sunshine Hours: 220.74\n",
+      "206.6 1\n",
+      "Country: Bangladesh, Sunshine Hours: 206.6\n",
+      "1091.49 5\n",
+      "Country: China, Sunshine Hours: 218.3\n",
+      "973.66 4\n",
+      "Country: India, Sunshine Hours: 243.41\n",
+      "298.33000000000004 1\n",
+      "Country: Indonesia, Sunshine Hours: 298.33\n",
+      "282.61 1\n",
+      "Country: Iran, Sunshine Hours: 282.61\n",
+      "324.08000000000004 1\n",
+      "Country: Iraq, Sunshine Hours: 324.08\n",
+      "331.1 1\n",
+      "Country: Israel, Sunshine Hours: 331.1\n",
+      "361.71000000000004 2\n",
+      "Country: Japan, Sunshine Hours: 180.86\n",
+      "486.29999999999995 2\n",
+      "Country: Kazakhstan, Sunshine Hours: 243.15\n",
+      "279.15 1\n",
+      "Country: Mongolia, Sunshine Hours: 279.15\n",
+      "249.2 1\n",
+      "Country: North Korea, Sunshine Hours: 249.2\n",
+      "349.33000000000004 1\n",
+      "Country: Oman, Sunshine Hours: 349.33\n",
+      "598.4300000000001 2\n",
+      "Country: Pakistan, Sunshine Hours: 299.22\n",
+      "210.31 1\n",
+      "Country: Philippines, Sunshine Hours: 210.31\n",
+      "1578.2299999999998 8\n",
+      "Country: Russia, Sunshine Hours: 197.28\n",
+      "647.3 2\n",
+      "Country: Saudi Arabia, Sunshine Hours: 323.65\n",
+      "202.24 1\n",
+      "Country: Singapore, Sunshine Hours: 202.24\n",
+      "439.33000000000004 2\n",
+      "Country: South Korea, Sunshine Hours: 219.67\n",
+      "870.0099999999999 4\n",
+      "Country: Thailand, Sunshine Hours: 217.5\n",
+      "466.76 2\n",
+      "Country: Turkey, Sunshine Hours: 233.38\n",
+      "282.39 1\n",
+      "Country: Uzbekistan, Sunshine Hours: 282.39\n",
+      "849.4 4\n",
+      "Country: Vietnam, Sunshine Hours: 212.35\n",
+      "254.4 1\n",
+      "Country: Albania, Sunshine Hours: 254.4\n",
+      "247.4 1\n",
+      "Country: Armenia, Sunshine Hours: 247.4\n",
+      "188.4 1\n",
+      "Country: Austria, Sunshine Hours: 188.4\n",
+      "180.7 1\n",
+      "Country: Belarus, Sunshine Hours: 180.7\n",
+      "154.6 1\n",
+      "Country: Belgium, Sunshine Hours: 154.6\n",
+      "176.9 1\n",
+      "Country: Bosnia and Herzegovina, Sunshine Hours: 176.9\n",
+      "217.7 1\n",
+      "Country: Bulgaria, Sunshine Hours: 217.7\n",
+      "191.3 1\n",
+      "Country: Croatia, Sunshine Hours: 191.3\n",
+      "166.8 1\n",
+      "Country: Czech Republic, Sunshine Hours: 166.8\n",
+      "331.40999999999997 1\n",
+      "Country: Cyprus, Sunshine Hours: 331.41\n",
+      "173.9 1\n",
+      "Country: Denmark, Sunshine Hours: 173.9\n",
+      "182.6 1\n",
+      "Country: Estonia, Sunshine Hours: 182.6\n",
+      "185.8 1\n",
+      "Country: Finland, Sunshine Hours: 185.8\n",
+      "449.8 2\n",
+      "Country: France, Sunshine Hours: 224.9\n",
+      "204.6 1\n",
+      "Country: Georgia, Sunshine Hours: 204.6\n",
+      "328.79999999999995 2\n",
+      "Country: Germany, Sunshine Hours: 164.4\n",
+      "595.0 2\n",
+      "Country: Greece, Sunshine Hours: 297.5\n",
+      "198.8 1\n",
+      "Country: Hungary, Sunshine Hours: 198.8\n",
+      "132.6 1\n",
+      "Country: Iceland, Sunshine Hours: 132.6\n",
+      "145.3 1\n",
+      "Country: Ireland, Sunshine Hours: 145.3\n",
+      "438.8 2\n",
+      "Country: Italy, Sunshine Hours: 219.4\n",
+      "175.4 1\n",
+      "Country: Latvia, Sunshine Hours: 175.4\n",
+      "169.1 1\n",
+      "Country: Lithuania, Sunshine Hours: 169.1\n",
+      "305.4 1\n",
+      "Country: Malta, Sunshine Hours: 305.4\n",
+      "212.6 1\n",
+      "Country: Moldova, Sunshine Hours: 212.6\n",
+      "166.2 1\n",
+      "Country: Netherlands, Sunshine Hours: 166.2\n",
+      "166.8 1\n",
+      "Country: Norway, Sunshine Hours: 166.8\n",
+      "157.1 1\n",
+      "Country: Poland, Sunshine Hours: 157.1\n",
+      "280.6 1\n",
+      "Country: Portugal, Sunshine Hours: 280.6\n",
+      "211.5 1\n",
+      "Country: Romania, Sunshine Hours: 211.5\n",
+      "203.8 1\n",
+      "Country: Slovakia, Sunshine Hours: 203.8\n",
+      "197.4 1\n",
+      "Country: Slovenia, Sunshine Hours: 197.4\n",
+      "826.6 3\n",
+      "Country: Spain, Sunshine Hours: 275.53\n",
+      "374.29999999999995 2\n",
+      "Country: Sweden, Sunshine Hours: 187.15\n",
+      "156.6 1\n",
+      "Country: Switzerland, Sunshine Hours: 156.6\n",
+      "195.5 1\n",
+      "Country: Ukraine, Sunshine Hours: 195.5\n",
+      "306.0 2\n",
+      "Country: United Kingdom, Sunshine Hours: 153.0\n",
+      "1825.24 9\n",
+      "Country: Canada, Sunshine Hours: 202.8\n",
+      "225.98000000000002 1\n",
+      "Country: Honduras, Sunshine Hours: 225.98\n",
+      "1038.5 4\n",
+      "Country: Mexico, Sunshine Hours: 259.62\n",
+      "275.99 1\n",
+      "Country: Nicaragua, Sunshine Hours: 275.99\n",
+      "174.35 1\n",
+      "Country: Panama, Sunshine Hours: 174.35\n",
+      "295.7 1\n",
+      "Country: El Salvador, Sunshine Hours: 295.7\n",
+      "15218.579999999998 54\n",
+      "Country: United States, Sunshine Hours: 281.83\n",
+      "1149.52 5\n",
+      "Country: Argentina, Sunshine Hours: 229.9\n",
+      "228.89000000000001 1\n",
+      "Country: Bolivia, Sunshine Hours: 228.89\n",
+      "1322.58 6\n",
+      "Country: Brazil, Sunshine Hours: 220.43\n",
+      "953.81 6\n",
+      "Country: Colombia, Sunshine Hours: 158.97\n",
+      "1324.27 5\n",
+      "Country: Chile, Sunshine Hours: 264.85\n",
+      "381.90999999999997 2\n",
+      "Country: Ecuador, Sunshine Hours: 190.95\n",
+      "280.3 1\n",
+      "Country: Paraguay, Sunshine Hours: 280.3\n",
+      "604.0 3\n",
+      "Country: Peru, Sunshine Hours: 201.33\n",
+      "248.14000000000001 1\n",
+      "Country: Uruguay, Sunshine Hours: 248.14\n",
+      "579.0899999999999 2\n",
+      "Country: Venezuela, Sunshine Hours: 289.54\n",
+      "2553.15 9\n",
+      "Country: Australia, Sunshine Hours: 283.68\n",
+      "192.2 1\n",
+      "Country: Fiji, Sunshine Hours: 192.2\n",
+      "613.1999999999999 3\n",
+      "Country: New Zealand, Sunshine Hours: 204.4\n",
+      "246.3 1\n",
+      "Country: Papua New Guinea, Sunshine Hours: 246.3\n",
+      "233.0 1\n",
+      "Country: Solomon Islands, Sunshine Hours: 233.0\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Average the yearly sunshine value of each country over all of its listed cities.\n",
+    "SUN_URL = 'https://en.wikipedia.org/wiki/List_of_cities_by_sunshine_duration'\n",
+    "with urlopen(SUN_URL) as sun_response:\n",
+    "    sun_soup = BeautifulSoup(sun_response, 'html.parser')\n",
+    "sun_tables = sun_soup.find_all('table')\n",
+    "\n",
+    "# Set of countries scraped from the depression page, for fast membership tests\n",
+    "known_countries = set(countries)\n",
+    "\n",
+    "# country -> running total of sunshine values (replaced by the mean at the end)\n",
+    "country_suns = {}\n",
+    "\n",
+    "# country -> number of rows that contributed to the running total\n",
+    "count = {}\n",
+    "\n",
+    "for table in sun_tables:\n",
+    "    if len(table) > 1:\n",
+    "        # Skip the first row, which holds the column names\n",
+    "        for row in table.find_all('tr')[1:]:\n",
+    "            cells = row.find_all('td')\n",
+    "\n",
+    "            # Both cells[0] and cells[-2] are read below, so ignore rows with fewer than two <td> cells\n",
+    "            if len(cells) < 2:\n",
+    "                continue\n",
+    "\n",
+    "            country = cells[0].text.strip()\n",
+    "            # Only keep countries that also appear in the depression data\n",
+    "            if country not in known_countries:\n",
+    "                continue\n",
+    "\n",
+    "            # NOTE(review): the second-to-last column is divided by 10 although the result is later labelled hours/year - confirm the intended unit.\n",
+    "            sun_hours = process_num(cells[-2].text.strip()) / 10\n",
+    "\n",
+    "            # Accumulate total and row count so the mean can be computed afterwards\n",
+    "            count[country] = count.get(country, 0) + 1\n",
+    "            country_suns[country] = country_suns.get(country, 0) + sun_hours\n",
+    "\n",
+    "# Replace each running total with the country's mean, printing total, count and mean\n",
+    "for country in country_suns:\n",
+    "    print(country_suns[country],count[country])\n",
+    "    country_suns[country] = round(country_suns[country]/count[country],2)\n",
+    "    print('Country: {}, Sunshine Hours: {}'.format(country,country_suns[country]))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 20,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "<class 'pandas.core.frame.DataFrame'>\n",
+      "Index: 192 entries, United States to Japan\n",
+      "Data columns (total 3 columns):\n",
+      "Rank                   192 non-null int64\n",
+      "DALY rate              192 non-null float64\n",
+      "Sunshine Hours/Year    122 non-null float64\n",
+      "dtypes: float64(2), int64(1)\n",
+      "memory usage: 11.0+ KB\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Attach each country's mean sunshine value to the depression table; join() keeps every row of df1.\n",
+    "sunshine_by_country = pd.Series(country_suns, name='Sunshine Hours/Year')\n",
+    "df2 = sunshine_by_country.to_frame()\n",
+    "df = df1.join(df2)\n",
+    "df.info()\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 21,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "df = df.dropna()  # rebind instead of inplace=True; removes every row that contains a NaN"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 38,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "<class 'pandas.core.frame.DataFrame'>\n",
+      "Index: 122 entries, United States to Japan\n",
+      "Data columns (total 3 columns):\n",
+      "Rank                   122 non-null int64\n",
+      "DALY rate              122 non-null float64\n",
+      "Sunshine Hours/Year    122 non-null float64\n",
+      "dtypes: float64(2), int64(1)\n",
+      "memory usage: 8.8+ KB\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "<matplotlib.axes._subplots.AxesSubplot at 0x1a1a728410>"
+      ]
+     },
+     "execution_count": 38,
+     "metadata": {},
+     "output_type": "execute_result"
+    },
+    {
+     "data": {
+      "image/png": "\n",
+      "text/plain": [
+       "<Figure size 432x288 with 1 Axes>"
+      ]
+     },
+     "metadata": {
+      "needs_background": "light"
+     },
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "df.info()\n",
+    "\n",
+    "import matplotlib.pyplot as plt\n",
+    "import seaborn as sns\n",
+    "# x/y are passed by keyword: seaborn >= 0.12 rejects positional data variables.\n",
+    "sns.scatterplot(x='Rank', y='Sunshine Hours/Year', data=df)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 36,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>Rank</th>\n",
+       "      <th>DALY rate</th>\n",
+       "      <th>Sunshine Hours/Year</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <td>Rank</td>\n",
+       "      <td>1.000000</td>\n",
+       "      <td>-0.963597</td>\n",
+       "      <td>0.346623</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>DALY rate</td>\n",
+       "      <td>-0.963597</td>\n",
+       "      <td>1.000000</td>\n",
+       "      <td>-0.285906</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>Sunshine Hours/Year</td>\n",
+       "      <td>0.346623</td>\n",
+       "      <td>-0.285906</td>\n",
+       "      <td>1.000000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                         Rank  DALY rate  Sunshine Hours/Year\n",
+       "Rank                 1.000000  -0.963597             0.346623\n",
+       "DALY rate           -0.963597   1.000000            -0.285906\n",
+       "Sunshine Hours/Year  0.346623  -0.285906             1.000000"
+      ]
+     },
+     "execution_count": 36,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df.corr()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.7.4"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
\ No newline at end of file
-- 
GitLab