import pandas as pd
import hvplot.pandas


# Preparation: fetch the GDP CSV from GitHub into a DataFrame and
# preview the first rows.
url = "https://raw.githubusercontent.com/shoukewei/data/main/data-pydm/gdp_top_six_economies.csv"
df = pd.read_csv(filepath_or_buffer=url)
df.head()


# Plot the six country columns against Year in a single figure,
# with the legend placed in the top-left corner.
df.hvplot(
    x="Year",
    y=["United States", "China", "Japan", "Germany", "United Kingdom", "India"],
    title="GDP of World top 6 Economies",
    ylabel="GDP (current US$)",
    group_label="GDP",
    legend="top_left",
    width=700,
    height=400,
)


# 1.1 Subplots with linked and normalized axes: request subplots for the
# six country columns and arrange the result in three columns.
df.hvplot(
    x="Year",
    y=["United States", "China", "Japan", "Germany", "United Kingdom", "India"],
    subplots=True,
    ylabel="GDP (current US$)",
    group_label="GDP",
    width=300,
    height=250,
).cols(3)


# 1.2 Subplots with different ranges: same subplot request as the linked
# version, but with shared_axes switched off, arranged in three columns.
df.hvplot(
    x="Year",
    y=["United States", "China", "Japan", "Germany", "United Kingdom", "India"],
    subplots=True,
    shared_axes=False,
    ylabel="GDP (current US$)",
    group_label="GDP",
    width=300,
    height=300,
).cols(3)


# Reshape the wide table (one column per country) into long form:
# one row per (Year, Country) pair with the value stored under "GDP".
df_melt = df.melt(
    id_vars=["Year"],
    value_vars=[
        "China",
        "Germany",
        "India",
        "Japan",
        "United Kingdom",
        "United States",
    ],
    var_name="Country",
    value_name="GDP",
)
df_melt


# 1.3 Scatter subplots of the long-form data split by the Country column,
# with unshared axes, laid out in two columns.
df_melt.hvplot.scatter(
    x="Year",
    y="GDP",
    by="Country",
    subplots=True,
    shared_axes=False,
    alpha=0.5,
    width=400,
    height=250,
).cols(2)


# 1.4 Grid subplots: sort the long-form data by GDP, then facet the
# scatter into a grid with Country on the rows and Year on the columns.
df_melt.sort_values("GDP").hvplot.scatter(
    x="Year",
    y="GDP",
    row="Country",
    col="Year",
    alpha=0.9,
    rot=90,
    width=400,
    height=250,
)


# 2.1 Line plot and bar plot: build each element separately, then
# overlay them with the `*` operator.

# United States GDP over the years, drawn with the default hvplot kind.
line_usa = df.hvplot(
    x="Year",
    y="United States",
    ylabel="GDP (current US$)",
    rot=90,
    width=700,
    height=400,
)

# China GDP over the years as tomato-coloured bars.
bar_china = df.hvplot.bar(
    x="Year",
    y="China",
    ylabel="GDP (current US$)",
    color="tomato",
    rot=90,
    width=700,
    height=400,
)

line_usa * bar_china


# 2.2 Bivariate and scatter plot: overlay the raw (China, United States)
# points in red on top of the bivariate plot of the same two columns.
(
    df.hvplot.bivariate(x="China", y="United States", legend=False)
    * df.hvplot.scatter(
        x="China",
        y="United States",
        xlabel="GDP of China",
        ylabel="GDP of the United States",
        color="red",
        size=30,
        alpha=0.7,
    )
)


# 2.3 Scatter plot and box plot.

# (1) Box plot of GDP grouped by country, from the long-form data.
boxplot = df_melt.hvplot.box(
    y="GDP",
    by="Country",
    legend=False,
    width=700,
    height=400,
)
boxplot


# (2) Orange scatter of GDP per country with the jitter option set to 0.5.
scatterplot = df_melt.hvplot.scatter(
    x="Country",
    y="GDP",
    c="orange",
).opts(jitter=0.5)
scatterplot


# (3) Overlay the scatter on the box plot.
boxplot * scatterplot


# 3.1 One row: build a multi-line plot and a stacked bar chart of the same
# six columns, then place them side by side with the `+` operator.

multiline = df.hvplot(
    x="Year",
    y=["United States", "China", "Japan", "Germany", "United Kingdom", "India"],
    title="GDP of World top 6 Economies",
    ylabel="GDP (current US$)",
    group_label="GDP",
    legend="top_left",
    width=450,
    height=400,
)

stackedbar = df.hvplot.bar(
    x="Year",
    y=["United States", "China", "Japan", "Germany", "United Kingdom", "India"],
    stacked=True,
    ylabel="GDP (current US$)",
    legend="top_left",
    rot=90,
    width=450,
    height=400,
)

multiline + stackedbar


# 3.2 More rows: add a box plot and an area plot, then lay all four
# panels out in two columns.

# NOTE: this rebinds `boxplot`, which earlier held the box plot built
# from the long-form data; here it is built from the wide table.
boxplot = df.hvplot.box(
    y=["United States", "China", "Japan", "Germany", "United Kingdom", "India"],
    xlabel="World top 6 economies",
    ylabel="GDP (current US$)",
    box_width=0.6,
    width=450,
    height=400,
)

areaplot = df.hvplot.area(
    x="Year",
    y=["United States", "China", "Japan", "Germany", "United Kingdom", "India"],
    xlabel="Year",
    ylabel="GDP (current US$)",
    legend="top_left",
    alpha=0.4,
    width=450,
    height=400,
)


(multiline + stackedbar + boxplot + areaplot).cols(2)


# 4. Combine the overlay and layout plots: the bivariate/scatter overlay
# sits next to a table of the two underlying columns.

bivariate = df.hvplot.bivariate(
    x="China",
    y="United States",
    legend=False,
    width=550,
    height=400,
)

scatter = df.hvplot.scatter(
    x="China",
    y="United States",
    xlabel="GDP of China",
    ylabel="GDP of the United States",
    color="red",
    size=30,
    alpha=0.7,
)

table = df.hvplot.table(["China", "United States"], width=350, height=350)

# `*` binds tighter than `+`, so this is (bivariate * scatter) + table.
bivariate * scatter + table

	Year	China	Germany	India	Japan	United Kingdom	United States
0	1991	3.833733e+11	1.868945e+12	2.701053e+11	3.584420e+12	1.142797e+12	6.158129e+12
1	1992	4.269157e+11	2.131572e+12	2.882084e+11	3.908809e+12	1.179660e+12	6.520327e+12
2	1993	4.447313e+11	2.071324e+12	2.792960e+11	4.454144e+12	1.061389e+12	6.858559e+12
3	1994	5.643247e+11	2.205074e+12	3.272756e+11	4.998798e+12	1.140490e+12	7.287236e+12
4	1995	7.345479e+11	2.585792e+12	3.602820e+11	5.545564e+12	1.346423e+12	7.639749e+12

	Year	Country	GDP
0	1991	China	3.833733e+11
1	1992	China	4.269157e+11
2	1993	China	4.447313e+11
3	1994	China	5.643247e+11
4	1995	China	7.345479e+11
...	...	...	...
175	2016	United States	1.869511e+13
176	2017	United States	1.947962e+13
177	2018	United States	2.052716e+13
178	2019	United States	2.137257e+13
179	2020	United States	2.089374e+13

Table of Contents

Preparation

1. Subplots

1.1 Subplots with linked and normalized axes

1.2 Subplots with different ranges

1.3 Subplots for a dataset with a categorical variable

1.4 Grid subplots

2. Overlay Plots

2.1 Line plot and bar plot

2.2 Bivariate and scatter plot

2.3 Scatter plot and box plot

(1) Create a box plot

(2) Create a jitter scatter plot

(3) Overlay the plots

3. Layout Plots

3.1 One row

3.2 More rows

4. Combine the Overlay and Layout Plots

Summary