import pandas as pd

# Remote CSV (hosted on raw.githubusercontent.com) holding the GDP series
# that every plot below is drawn from.
url = (
    "https://raw.githubusercontent.com/shoukewei/data/main/data-pydm/gdp_top_six_economies.csv"
)
df = pd.read_csv(filepath_or_buffer=url)

# Preview the first five rows (shown as the cell output in a notebook).
df.head(n=5)


import hvplot.pandas


# Single line: the "United States" column plotted against "Year".
df.hvplot(
    x="Year",
    y="United States",
    ylabel="GDP of United States(current US$)",
    width=700,
    height=400,
    title="GDP of the United States",
)


# Multiple lines: one line per country column, all sharing the "Year" x-axis.
df.hvplot(
    x="Year",
    y=[
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ],
    ylabel="GDP (current US$)",
    width=700,
    height=400,
    title="GDP of World top 6 Economies",
)


# Same multi-line chart, additionally passing `group_label` (legend title)
# and `legend` (legend position).
df.hvplot(
    x="Year",
    y=[
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ],
    ylabel="GDP (current US$)",
    width=700,
    height=400,
    title="GDP of World top 6 Economies",
    group_label="GDP",
    legend="top_left",
)


# Column-wise mean of every column, then discard the "Year" entry so that
# only the per-country averages remain.
gdp_mean = df.agg("mean").drop("Year")

# Display the resulting Series.
gdp_mean

China             5.070277e+12
Germany           2.941571e+12
India             1.199736e+12
Japan             4.864806e+12
United Kingdom    2.206106e+12
United States     1.320973e+13
dtype: float64


# Bar chart of the per-country mean GDP computed in `gdp_mean`.
gdp_mean.hvplot.bar(
    width=700,
    height=400,
    xlabel="World top 6 economies",
    ylabel="Average GDP (current US$)",
)


# Same mean-GDP bar chart, with a custom bar colour.
# The bars show `gdp_mean` (averages), so the y-axis is labelled
# "Average GDP" rather than plain "GDP".
gdp_mean.hvplot.bar(
    width=700,
    height=400,
    xlabel="World top 6 economies",
    ylabel="Average GDP (current US$)",
    color="tomato",
)


# Time-series bar chart: one bar per year for the "China" column.
# `rot=90` is passed to rotate the tick labels.
df.hvplot.bar(
    x="Year",
    y="China",
    width=700,
    height=400,
    ylabel="GDP (current US$)",
    rot=90,
)


# Stacked bars: the six country columns stacked on top of each other per year.
df.hvplot.bar(
    x="Year",
    y=[
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ],
    stacked=True,
    width=700,
    height=400,
    ylabel="GDP (current US$)",
    rot=90,
)


# Horizontal variant of the stacked bar chart, legend placed bottom-right.
df.hvplot.barh(
    x="Year",
    y=[
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ],
    stacked=True,
    width=700,
    height=400,
    ylabel="GDP (current US$)",
    legend="bottom_right",
)


# Scatter of the "United States" column against the "China" column,
# drawn with fixed-size, semi-transparent red markers.
df.hvplot.scatter(
    x="China",
    y="United States",
    size=50,
    alpha=0.7,
    xlabel="GDP of China",
    ylabel="GDP of the United States",
    color="red",
    title="GDP of United States Vs. China",
)


# Same scatter, but the marker colour is driven by the "Year" column
# (`c="Year"`) instead of a fixed colour.
df.hvplot.scatter(
    x="China",
    y="United States",
    size=50,
    alpha=0.7,
    xlabel="GDP of China",
    ylabel="GDP of the United States",
    title="GDP of United States Vs. China",
    c="Year",
)


# Histogram of the "Japan" column using 20 bins.
df.hvplot.hist(
    y="Japan",
    width=700,
    height=400,
    bins=20,
    alpha=0.9,
    xlabel="GDP of Japan (current US$)",
    ylabel="Frequency",
    title="GDP Distribution of Japan",
)


# Histograms of three country columns on one chart (30 bins); alpha < 1 is
# passed so the distributions remain visible where they cover each other.
df.hvplot.hist(
    y=["United States", "China", "Japan"],
    width=700,
    height=400,
    alpha=0.7,
    bins=30,
    xlabel="GDP of United States, China and Japan (current US$)",
    ylabel="Frequency",
)


# Box plot with one box per country column (wide-format data).
df.hvplot.box(
    y=[
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ],
    height=400,
    box_width=0.6,
    xlabel="World top 6 economies",
    ylabel="GDP (current US$)",
)


# Same box plot with `invert=True`, which swaps the axes.
df.hvplot.box(
    y=[
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ],
    height=400,
    box_width=0.6,
    invert=True,
    xlabel="World top 6 economies",
    ylabel="GDP (current US$)",
)


# Reshape from wide (one column per country) to long format:
# one row per (Year, Country) pair with the value stored in "GDP".
df_melt = df.melt(
    id_vars=["Year"],
    value_vars=[
        "China",
        "Germany",
        "India",
        "Japan",
        "United Kingdom",
        "United States",
    ],
    var_name="Country",
    value_name="GDP",
)

# Display the long-format frame.
df_melt


# Box plot from the long-format frame: "GDP" values grouped by "Country".
df_melt.hvplot.box(
    y="GDP",
    by="Country",
    height=400,
    box_width=0.6,
    xlabel="World top 6 economies",
    ylabel="GDP (current US$)",
)


# Violin plot with one violin per country column; the y-range is pinned
# explicitly via `ylim`.
df.hvplot.violin(
    y=[
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ],
    height=400,
    xlabel="World top 6 economies",
    ylabel="GDP (current US$)",
    ylim=(-3.5e13, 5.0e13),
)


# Violin plot from the long-format frame: "GDP" grouped by "Country",
# using the same fixed y-range as the wide-format version.
df_melt.hvplot.violin(
    y="GDP",
    by="Country",
    height=400,
    xlabel="World top 6 economies",
    ylabel="GDP (current US$)",
    ylim=(-3.5e13, 5.0e13),
)


# Area chart of the "Germany" column over "Year".
# The x-axis carries the "Year" column, so it is labelled "Year"; the country
# name is shown in the title instead of being used as the x-axis label.
df.hvplot.area(
    x="Year",
    y="Germany",
    height=400,
    alpha=0.4,
    xlabel="Year",
    ylabel="GDP (current US$)",
    title="GDP of Germany",
)


# Area chart of all six country columns. No `stacked` argument is given,
# so hvplot's default stacking behaviour applies.
df.hvplot.area(
    x="Year",
    y=[
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ],
    xlabel="Year",
    ylabel="GDP (current US$)",
    width=700,
    height=400,
    alpha=0.4,
)


# Area chart of all six country columns with stacking explicitly disabled
# (`stacked=False`); alpha < 1 is passed so covered areas stay visible.
df.hvplot.area(
    x="Year",
    y=[
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ],
    xlabel="Year",
    ylabel="GDP (current US$)",
    width=700,
    height=400,
    stacked=False,
    alpha=0.4,
)


# Kernel density estimate of the "United States" column.
df.hvplot.kde(
    y="United States",
    width=700,
    height=400,
    alpha=0.9,
    color="orangered",
    xlabel="The United States GDP (current US$)",
    ylabel="Density",
    title="The United States GDP Distribution",
)


# Kernel density estimates of all six country columns on one chart.
df.hvplot.kde(
    y=[
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ],
    width=700,
    height=400,
    alpha=0.9,
    ylabel="Density",
)


# Step chart of all six country columns over "Year"; `value_label` names
# the shared value axis and the legend is placed at the top.
df.hvplot.step(
    x="Year",
    y=[
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ],
    value_label="GDP (current US$)",
    legend="top",
    height=500,
    width=700,
)


# Heatmap from the long-format frame: "Year" on x, "Country" on y,
# cell colour taken from "GDP"; the colour bar is switched off.
df_melt.hvplot.heatmap(
    x="Year",
    y="Country",
    C="GDP",
    height=500,
    width=700,
    colorbar=False,
)


# Use "Year" as the row index so that only the country columns remain as data.
df_new = df.set_index(keys="Year")

# Preview the first five rows of the re-indexed frame.
df_new.head(n=5)


# Heatmap built directly from the wide, Year-indexed frame: the frame's
# columns go on x and its index on y, with a custom colour list.
htmap = df_new.hvplot.heatmap(
    x="columns",
    y="index",
    title="GDP of World Top 6 Economies 1991—2020",
    cmap=[
        "#75968f",
        "#a5bab7",
        "#c9d9d3",
        "#e2e2e2",
        "#dfccce",
        "#ddb7b1",
        "#cc7878",
        "#933b41",
        "#550b1d",
    ],
    xaxis="top",
    rot=70,
    width=700,
    height=400,
)

# Hide the toolbar and shrink the title/tick fonts; as the last expression
# of the cell, the result is what gets displayed.
htmap.opts(
    toolbar=None,
    fontsize={"title": 10, "xticks": 5, "yticks": 5},
)


# Swap rows and columns so that years become columns and countries the index.
df_trans = df_new.transpose()

# Same heatmap recipe applied to the transposed frame, x-axis at the bottom.
htmap = df_trans.hvplot.heatmap(
    x="columns",
    y="index",
    title="GDP of World Top 6 Economies 1991—2020",
    cmap=[
        "#75968f",
        "#a5bab7",
        "#c9d9d3",
        "#e2e2e2",
        "#dfccce",
        "#ddb7b1",
        "#cc7878",
        "#933b41",
        "#550b1d",
    ],
    xaxis="bottom",
    rot=70,
    width=700,
    height=400,
)

# Hide the toolbar and shrink the title/tick fonts before display.
htmap.opts(
    toolbar=None,
    fontsize={"title": 10, "xticks": 5, "yticks": 5},
)


# Bivariate plot of the "United States" column (x) against "China" (y).
df.hvplot.bivariate(
    x="United States",
    y="China",
)


# Hexagonal binning of "United States" (x) against "China" (y);
# the colour bar is labelled "Count".
df.hvplot.hexbin(
    x="United States",
    y="China",
    clabel="Count",
    gridsize=20,
    height=400,
    width=700,
)


from hvplot.plotting import scatter_matrix


# Scatter matrix over every column of `df` (the full frame is passed, so
# "Year" is included), with box-select and hover tools enabled.
scatter_matrix(
    df,
    alpha=0.5,
    width=600,
    height=600,
    tools=["box_select", "hover"],
    xrotation=90,
)


# Keep only the six country columns (drops "Year") for the matrix below.
df_sub = df[
    [
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ]
]

# Scatter matrix with bivariate off-diagonal panels and KDEs on the diagonal.
scatter_matrix(
    df_sub,
    chart="bivariate",
    width=600,
    height=600,
    tools=["box_select", "hover"],
    diagonal="kde",
    xrotation=90,
)


# Keep only the six country columns (drops "Year") for the matrix below.
df_sub = df[
    [
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ]
]

# Scatter matrix with hexbin off-diagonal panels and KDEs on the diagonal.
scatter_matrix(
    df_sub,
    chart="hexbin",
    width=600,
    height=600,
    gridsize=20,
    tools=["box_select", "hover"],
    diagonal="kde",
    xrotation=90,
)


# Render the frame as a table widget with sorting and row selection
# switched on, listing "Year" first followed by the country columns.
df.hvplot.table(
    columns=[
        "Year",
        "United States",
        "China",
        "Japan",
        "Germany",
        "United Kingdom",
        "India",
    ],
    sortable=True,
    selectable=True,
    width=900,
    height=200,
)

	Year	China	Germany	India	Japan	United Kingdom	United States
0	1991	3.833733e+11	1.868945e+12	2.701053e+11	3.584420e+12	1.142797e+12	6.158129e+12
1	1992	4.269157e+11	2.131572e+12	2.882084e+11	3.908809e+12	1.179660e+12	6.520327e+12
2	1993	4.447313e+11	2.071324e+12	2.792960e+11	4.454144e+12	1.061389e+12	6.858559e+12
3	1994	5.643247e+11	2.205074e+12	3.272756e+11	4.998798e+12	1.140490e+12	7.287236e+12
4	1995	7.345479e+11	2.585792e+12	3.602820e+11	5.545564e+12	1.346423e+12	7.639749e+12

	Year	Country	GDP
0	1991	China	3.833733e+11
1	1992	China	4.269157e+11
2	1993	China	4.447313e+11
3	1994	China	5.643247e+11
4	1995	China	7.345479e+11
...	...	...	...
175	2016	United States	1.869511e+13
176	2017	United States	1.947962e+13
177	2018	United States	2.052716e+13
178	2019	United States	2.137257e+13
179	2020	United States	2.089374e+13

	China	Germany	India	Japan	United Kingdom	United States
Year
1991	3.833733e+11	1.868945e+12	2.701053e+11	3.584420e+12	1.142797e+12	6.158129e+12
1992	4.269157e+11	2.131572e+12	2.882084e+11	3.908809e+12	1.179660e+12	6.520327e+12
1993	4.447313e+11	2.071324e+12	2.792960e+11	4.454144e+12	1.061389e+12	6.858559e+12
1994	5.643247e+11	2.205074e+12	3.272756e+11	4.998798e+12	1.140490e+12	7.287236e+12
1995	7.345479e+11	2.585792e+12	3.602820e+11	5.545564e+12	1.346423e+12	7.639749e+12

Table of Contents

1. Read the Dataset¶

2. Basic Plot Methods¶

3. Line Plot¶

3.1 Single line¶

3.2 Multiple lines¶

3.3 Change legend title and position¶

4. Bar Plot¶

4.1 Bar plot of multiple variables¶

4.2 Change bar color¶

4.3 Time series bar plot¶

4.4 Stacked bar plot¶

4.5 Horizontal bar plot¶

5. Scatter Plot¶

5.1 Scatter plot¶

5.2 Add color bar¶

6. Histogram¶

6.1 Single histogram¶

6.2 Overlapping histograms¶

7. Box Plot¶

7.1 Simple box plot¶

7.2 Horizontal box plot¶

7.3 Box plot for data with a categorical column¶

8. Violin Plot¶

8.1 Simple violin plot¶

8.2 Violin plot for data with a categorical column¶

9. Area Plot¶

9.1 Single area plot¶

9.2 Stacked area plot¶

9.3 Overlapping (unstacked) area plot¶

10. KDE Plot¶

10.1 Simple KDE plot¶

10.2 Overlapping KDEs¶

11. Step Plot¶

12. Heatmap¶

12.1 Create a heatmap for the dataset with a categorical column¶

12.2 Create a heatmap for the dataset without a categorical column¶

12.3 Transpose heatmap¶

13. Bivariate¶

14. Hexbin¶

15. Scatter Matrix¶

15.1 Default scatter matrix¶

15.2 Change entry and diagonal plots¶

16. Table Plot¶

Summary¶