import pandas

# Load the Gapminder dataset straight from the course repository on GitHub.
world = pandas.read_csv(
    'https://raw.githubusercontent.com/jenfly/datajam-python/master/data/gapminder.csv'
)

# Express population in millions so the plotted values are easier to read.
world['pop_millions'] = world['population'].div(1e6)

# Rows for the year 2015 only; most of the plots below use this snapshot.
world_2015 = world.loc[world['year'].eq(2015)]


# Total 2015 population (in millions) per region, as a two-column DataFrame.
region_pop = (
    world_2015
    .groupby('region')['pop_millions']
    .sum()
    .reset_index()
)
region_pop


# Bar chart of the regional totals. Without a trailing semicolon the notebook
# also echoes the returned Axes object.
region_pop.plot.bar(x='region', y='pop_millions')

# Output: <AxesSubplot:xlabel='region'>


# Same bar chart again; the trailing semicolon suppresses the echoed Axes repr.
region_pop.plot.bar(x='region', y='pop_millions');


# Scatter plot of life expectancy against GDP per capita for 2015.
world_2015.plot.scatter(x='gdp_per_capita', y='life_expectancy');


import seaborn as sns


# Apply seaborn's default theme to the plots that follow.
sns.set_theme()


# Relational plot of life expectancy against GDP per capita for the 2015 data.
sns.relplot(data=world_2015, x='gdp_per_capita', y='life_expectancy');


# Semantic mapping: color each point by its region.
sns.relplot(data=world_2015, x='gdp_per_capita', y='life_expectancy', hue='region');


# Keep the returned grid in `g` so the axes can be customized afterwards:
# log-scaled x axis plus a title.
g = sns.relplot(data=world_2015, x='gdp_per_capita', y='life_expectancy', hue='region')
g.set(xscale='log', title='Life Expectancy vs. GDP per Capita in 2015');


# Save the current seaborn figure as a PNG under figures/.
# savefig does not create missing directories, so make sure the output
# folder exists first (no-op when it is already there).
import os

os.makedirs('figures', exist_ok=True)
g.savefig('figures/life_exp_vs_gdp_percap.png')


# Add another semantic mapping: marker size follows population (in millions),
# with marker sizes spanning (40, 400) and alpha=0.8 for partial transparency.
g = sns.relplot(data=world_2015, x='gdp_per_capita', y='life_expectancy', hue='region',
                size='pop_millions', sizes=(40, 400), alpha=0.8)
g.set(xscale='log', title='Life Expectancy vs. GDP per Capita in 2015');


# Starting point for the facet examples: colored by region, log x axis, no title.
g = sns.relplot(data=world_2015, x='gdp_per_capita', y='life_expectancy', hue='region')
g.set(xscale='log');


# Facets: map region to grid columns (col=) instead of to color.
g = sns.relplot(data=world_2015, x='gdp_per_capita', y='life_expectancy', col='region')
g.set(xscale='log');


# Wrap the facet columns after 3 panels and set each panel's height to 3.
g = sns.relplot(data=world_2015, x='gdp_per_capita', y='life_expectancy', col='region',
                col_wrap=3, height=3)
g.set(xscale='log');


# Within each regional facet, color the points by income group.
g = sns.relplot(data=world_2015, x='gdp_per_capita', y='life_expectancy', col='region',
                col_wrap=3, height=3, hue='income_group')
g.set(xscale='log');


# Pin the hue order so income groups run from lowest to highest.
# `income_order` is reused by later seaborn and plotly cells.
income_order= ['Low', 'Lower middle', 'Upper middle', 'High']
g = sns.relplot(data=world_2015, x='gdp_per_capita', y='life_expectancy', col='region',
                col_wrap=3, height=3, hue='income_group', hue_order=income_order)
g.set(xscale='log');


# Total population (in millions) for each year, computed with pandas.
world.groupby('year', as_index=False)['pop_millions'].sum()


# Statistical transformation: let seaborn aggregate while plotting, summing
# pop_millions over all rows that share a year (estimator='sum').
# ci=None turns off the confidence interval.
# NOTE(review): seaborn 0.12+ deprecates `ci` in favor of `errorbar=None` —
# confirm the installed version before switching.
sns.relplot(data=world, x='year', y='pop_millions', kind='line', 
            estimator='sum', ci=None);


# Same yearly sum, split into one line per income group (both color and line
# style follow income_group, ordered by income_order).
sns.relplot(data=world, x='year', y='pop_millions', hue='income_group', hue_order=income_order,
            style='income_group', kind='line', estimator='sum', ci=None);


# Same again, additionally faceted by region (3 panels per row, height 3).
sns.relplot(data=world, x='year', y='pop_millions', hue='income_group', hue_order=income_order,
            style='income_group', kind='line', estimator='sum', ci=None, col='region',
            col_wrap=3, height=3);


# Long format: one row per (country, year) observation.
pop_long = world.loc[:, ['country', 'year', 'population']]
pop_long.head(5)


# Wide format: years become the index and every country gets its own column.
pop_wide = pop_long.pivot(
    index='year',
    columns='country',
    values='population',
)
pop_wide.head(5)


# Categorical plot: bar chart of 2015 life expectancy per region (the title
# labels the bars as means). aspect=1.5 sets the panel's width-to-height ratio.
g = sns.catplot(data=world_2015, x='region', y='life_expectancy', kind='bar', aspect=1.5)
g.set(title='Mean Life Expectancy by Region in 2015');


import plotly.express as px


# Interactive plotly version of the 2015 bubble chart: color by region, marker
# size by population (capped via size_max=30), log-scaled x axis, and the
# country name added to the hover tooltip.
px.scatter(data_frame=world_2015, x='gdp_per_capita', y='life_expectancy', color='region',
           size='pop_millions', size_max=30, log_x=True, hover_data=['country'],
           title='Life Expectancy vs. GDP per Capita in 2015')


import os

# Keep the figure in a variable so it can be both displayed and exported.
fig = px.scatter(data_frame=world_2015, x='gdp_per_capita', y='life_expectancy', color='region',
                 size='pop_millions', size_max=30, log_x=True, hover_data=['country'],
                 title='Life Expectancy vs. GDP per Capita in 2015')
fig.show()

# The export calls do not create missing directories, so make sure the output
# folder exists first (no-op when it is already there).
os.makedirs('figures', exist_ok=True)

# Interactive HTML export.
fig.write_html('figures/plotly_life_exp_vs_gdp_percap.html')


# Static PNG export.
# NOTE(review): plotly's static image export needs an extra rendering engine
# (e.g. kaleido) — confirm it is installed.
os.makedirs('figures', exist_ok=True)
fig.write_image('figures/plotly_life_exp_vs_gdp_percap.png')


# Facets in plotly: one panel per region (3 per row), points colored by income
# group in the order given by income_order.
px.scatter(data_frame=world_2015, x='gdp_per_capita', y='life_expectancy', 
           facet_col='region', facet_col_wrap=3,
           color='income_group', category_orders={'income_group' : income_order},
           log_x=True, hover_data=['country'],
           title='Life Expectancy vs. GDP per Capita in 2015')


# Animation: use the full dataset with one frame per year. range_y fixes the
# y axis to (20, 90) for every frame.
px.scatter(data_frame=world, x='gdp_per_capita', y='life_expectancy', color='region',
           size='pop_millions', size_max=30, log_x=True, range_y=(20, 90),
           title='Life Expectancy vs. GDP per Capita (1950-2015)',
           animation_frame='year')

	region	pop_millions
0	Africa	1191.9177
1	Americas	982.6889
2	Asia	4391.6350
3	Europe	740.4830
4	Oceania	38.4860

	year	pop_millions
0	1950	2521.5914
1	1955	2755.4391
2	1960	3014.5238
3	1965	3317.6620
4	1970	3676.8109
5	1975	4052.1130
6	1980	4428.6840
7	1985	4841.1945
8	1990	5294.2122
9	1995	5714.3521
10	2000	6101.9393
11	2005	6495.9793
12	2010	6918.4071
13	2015	7345.2106

	country	year	population
0	Afghanistan	1950	7750000
1	Afghanistan	1955	8270000
2	Afghanistan	1960	9000000
3	Afghanistan	1965	9940000
4	Afghanistan	1970	11100000

country	Afghanistan	Albania	Algeria	Angola	Antigua and Barbuda	Argentina	Armenia	Australia	Austria	Azerbaijan	...	United Kingdom	United States	Uruguay	Uzbekistan	Vanuatu	Venezuela	Vietnam	Yemen	Zambia	Zimbabwe
year
1950	7750000	1260000	8870000	4550000	46300	17200000	1350000	8180000	6940000	2930000	...	50600000	159000000	2240000	6260000	47700	5480000	24800000	4400000	2310000	2750000
1955	8270000	1420000	9830000	5120000	52900	18900000	1560000	9210000	6950000	3330000	...	51100000	172000000	2370000	7300000	54900	6760000	28100000	4770000	2630000	3200000
1960	9000000	1640000	11100000	5640000	55300	20600000	1870000	10300000	7070000	3900000	...	52400000	187000000	2540000	8550000	63700	8150000	32700000	5170000	3040000	3750000
1965	9940000	1900000	12600000	6200000	60800	22300000	2210000	11400000	7310000	4590000	...	54300000	200000000	2690000	10100000	74300	9820000	37900000	5640000	3560000	4410000
1970	11100000	2150000	14600000	6780000	67100	24000000	2530000	12800000	7520000	5180000	...	55600000	210000000	2810000	12100000	85400	11600000	43400000	6190000	4170000	5180000

Lesson 2: Intro to Data Visualization

Lesson Overview

Setup

Data Visualization Libraries

The Broader Landscape

matplotlib & seaborn

plotly

Simple Plots with Pandas

Statistical Plots with Seaborn

Types of Plots

Relational Plots

Distribution Plots

Categorical Plots

Getting Started

Semantic Mapping

Exercise 2.1

Customize Axes

Saving a Figure

Note: Viewing Documentation

Note: Saving Pandas Plots

Add Another Semantic Mapping

Facets

Statistical Transformations

Exercise 2.2

Bonus: Figure-Level vs. Axes-Level Functions

Bonus: Long vs. Wide Data

Categorical Plot

Interactive Plots with Plotly

Saving a Figure

Facets

Animations

Getting Help

Thank You!