Copy and Paste Your Assignment Here: Dear Top Assignment Expert Team, I am struggling to finalize my Python assignment, using Jupyter Notebook. There are no detailed requirements; it can be done based...

1 answer below »
Copy and Paste Your Assignment Here: Dear Top Assignment Expert Team, I am struggling to finalize my Python assignment, using Jupyter Notebook. There are no detailed requirements; it can be done based on some ideas. The important thing is to show some visualization, as I have started to do, but since the data structure is obviously not correct, I cannot really continue with this task. It would be great to get feedback from you, and maybe we can talk via Skype or WhatsApp to discuss the price and the details that can be provided by Tuesday midnight. Thanks & kind regards, Tanja. My email is: [email protected]
Answered Same Day Sep 29, 2021

Answer To: Copy and Paste Your Assignment Here: Dear Top Assignment Expert Team, I am struggling to finalize my...

Kshitij answered on Oct 01 2021
132 Votes
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
"import pandas as pd\n",
"import numpy as np\n",
"import matplotlib.pyplot as plt\n",
"from pandas import Series"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Index(['LocID', 'Location', 'VarID', 'Variant', 'Time', 'MidPeriod', 'PopMale',\n",
" 'PopFemale', 'PopTotal'],\n",
" dtype='object')\n"
]
}
],
"source": [
"df = pd.read_csv ('WPP2019_TotalPopulationBySex(1)', encoding=\"cp1252\")\n",
"df_wbv = pd.DataFrame(df)\n",
"print(df_wbv.columns)"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"
\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"
LocIDLocationVarIDVariantTimeMidPeriodPopMalePopFemalePopTotal
04Afghanistan2Medium19501950.54099.2433652.8747752.117
14Afghanistan2Medium19511951.54134.7563705.3957840.151
24Afghanistan2Medium19521952.54174.4503761.5467935.996
34Afghanistan2Medium19531953.54218.3363821.3488039.684
44Afghanistan2Medium19541954.54266.4843884.8328151.316
\n",
"
"
],
"text/plain": [
" LocID Location VarID Variant Time MidPeriod PopMale PopFemale \\\n",
"0
4 Afghanistan 2 Medium 1950 1950.5 4099.243 3652.874 \n",
"1 4 Afghanistan 2 Medium 1951 1951.5 4134.756 3705.395 \n",
"2 4 Afghanistan 2 Medium 1952 1952.5 4174.450 3761.546 \n",
"3 4 Afghanistan 2 Medium 1953 1953.5 4218.336 3821.348 \n",
"4 4 Afghanistan 2 Medium 1954 1954.5 4266.484 3884.832 \n",
"\n",
" PopTotal \n",
"0 7752.117 \n",
"1 7840.151 \n",
"2 7935.996 \n",
"3 8039.684 \n",
"4 8151.316 "
]
},
"execution_count": 3,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# View our data\n",
"df_wbv.head()"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"\n",
"RangeIndex: 422655 entries, 0 to 422654\n",
"Data columns (total 9 columns):\n",
"LocID 422655 non-null int64\n",
"Location 422655 non-null object\n",
"VarID 422655 non-null int64\n",
"Variant 422655 non-null object\n",
"Time 422655 non-null int64\n",
"MidPeriod 422655 non-null float64\n",
"PopMale 422655 non-null float64\n",
"PopFemale 422655 non-null float64\n",
"PopTotal 422655 non-null float64\n",
"dtypes: float64(4), int64(3), object(2)\n",
"memory usage: 29.0+ MB\n"
]
}
],
"source": [
"# Viewing the details of the table\n",
"df_wbv.info()"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [],
"source": [
"df_wbv.to_excel(\"output.xlsx\")"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Medium 43035\n",
"Constant mortality 43035\n",
"Momentum 43035\n",
"No change 43035\n",
"Zero migration 43035\n",
"Constant fertility 43035\n",
"Low 43035\n",
"Instant replacement 43035\n",
"High 43035\n",
"Median PI 8835\n",
"Lower 95 PI 8835\n",
"Upper 95 PI 8835\n",
"Lower 80 PI 8835\n",
"Name: Variant, dtype: int64"
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Exploring the data\n",
"df_wbv.Variant.value_counts()"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Northern America 2966\n",
"Latin America and the Caribbean 2966\n",
"Europe 2966\n",
"Republic of Korea 1483\n",
"Saint Barthélemy 1483\n",
"British Virgin Islands 1483\n",
"Cameroon 1483\n",
"Sierra Leone 1483\n",
"Hungary 1483\n",
"Paraguay 1483\n",
"India 1483\n",
"Turkmenistan 1483\n",
"United Republic of Tanzania 1483\n",
"Tajikistan 1483\n",
"Asia 1483\n",
"Micronesia 1483\n",
"Saudi Arabia 1483\n",
"Ecuador 1483\n",
"Slovakia 1483\n",
"Algeria 1483\n",
"Bermuda 1483\n",
"Timor-Leste 1483\n",
"Seychelles 1483\n",
"Russian Federation 1483\n",
"Turks and Caicos Islands 1483\n",
"Burkina Faso 1483\n",
"Eastern Asia 1483\n",
"Nicaragua 1483\n",
"Indonesia 1483\n",
"Martinique 1483\n",
" ... \n",
"Ireland 1483\n",
"Central and Southern Asia 1483\n",
"Burundi 1483\n",
"Senegal 1483\n",
"Central Asia 1483\n",
"Finland 1483\n",
"More developed regions 1483\n",
"Guatemala 1483\n",
"Australia 1483\n",
"Jordan 1483\n",
"Côte d'Ivoire 1483\n",
"French Guiana 1483\n",
"Holy See 1483\n",
"Malawi 1483\n",
"Lesotho 1483\n",
"Cyprus 1483\n",
"Mali 1483\n",
"Maldives 1483\n",
"Angola 1483\n",
"Dominica 1483\n",
"Western Europe 1483\n",
"Oman 1483\n",
"Ukraine 1483\n",
"Somalia 1483\n",
"Tunisia 1483\n",
"Southern Asia 1483\n",
"Serbia 1483\n",
"Low-income countries 1483\n",
"Canada 1483\n",
"Bolivia (Plurinational State of) 1483\n",
"Name: Location, Length: 282, dtype: int64"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df.Location.value_counts()"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"
\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"
LocIDLocationVarIDVariantTimeMidPeriodPopMalePopFemalePopTotal
14496276Germany2Medium19501950.532283.90537682.34769966.252
14497276Germany2Medium19511951.532476.98837823.02370300.011
14498276Germany2Medium19521952.532662.84537957.43070620.275
14499276Germany2Medium19531953.532838.82038091.01970929.839
14500276Germany2Medium19541954.533005.14038228.25371233.393
\n",
"
"
],
"text/plain": [
" LocID Location VarID Variant Time MidPeriod PopMale PopFemale \\\n",
"14496 276 Germany 2 Medium 1950 1950.5 32283.905 37682.347 \n",
"14497 276 Germany 2 Medium 1951 1951.5 32476.988 37823.023 \n",
"14498 276 Germany 2 Medium 1952 1952.5 32662.845 37957.430 \n",
"14499 276 Germany 2 Medium 1953 1953.5 32838.820 38091.019 \n",
"14500 276 Germany 2 Medium 1954 1954.5 33005.140 38228.253 \n",
"\n",
" PopTotal \n",
"14496 69966.252 \n",
"14497 70300.011 \n",
"14498 70620.275 \n",
"14499 70929.839 \n",
"14500 71233.393 "
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df_wbv[df_wbv.Location == 'Germany'].head()"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {},
"outputs": [],
"source": [
"df = df_wbv[df_wbv.Variant == 'Medium']\n",
"years = df['Time'].unique()\n",
"germany_pop = list(df[df.Location == 'Germany']['PopTotal'])\n",
"afghanistan_pop = list(df[df.Location == 'Afghanistan']['PopTotal'])\n",
"netherlands_pop = list(df[df.Location == 'Netherlands']['PopTotal'])\n",
"hungary_pop = list(df[df.Location == 'Hungary']['PopTotal'])\n",
"new_zealand_pop = list(df[df.Location == 'New Zealand']['PopTotal'])"
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"
"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
],
"source": [
"# Population comparison of some random Countries\n",
"\n",
"plt.plot(years, germany_pop, color='b', label='Germany')\n",
"plt.plot(years, afghanistan_pop, color='r', label='Afghanistan')\n",
"plt.plot(years, netherlands_pop, color='g', label='Netherlands')\n",
"plt.plot(years, hungary_pop, color='y', label='Hungary')\n",
"plt.plot(years, new_zealand_pop, color='c', label='New Zealand')\n",
"axes = plt.gca()\n",
"plt.legend(loc=\"center right\")\n",
"plt.show()"
]
},
{
"cell_type": "code",
"execution_count": 11,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"
\n",
"