import pandas as pd

# Location of the outlier-treated GDP dataset (CSV hosted on GitHub).
url = 'https://raw.githubusercontent.com/shoukewei/data/main/data-pydm/gdp_china_outlier_treated.csv'

# Read the CSV into a DataFrame and preview its first rows.
df = pd.read_csv(url)
df.head()


# Swap the short column headers for descriptive names (nine columns, in
# file order), then preview the result.
df.columns = [
    'Province',
    'GDP Rank',
    'Year',
    'GDP',
    'Population',
    'Fix Investment',
    'Trade',
    'Fiscal Expenditure',
    'Urban Income',
]
df.head()


import hvplot.pandas


# Box plot of the six indicator columns; `groupby` adds a widget that
# selects which province is displayed.
df.hvplot.box(
    y=['GDP', 'Population', 'Fix Investment', 'Trade', 'Fiscal Expenditure', 'Urban Income'],
    groupby='Province',
    width=600,
    height=400,
)


# Bivariate plot of Trade against GDP per province, with the province
# widget moved to the top-left of the plot.
df.hvplot.bivariate(
    x='Trade',
    y='GDP',
    width=500,
    groupby='Province',
    widget_location='left_top',
)


# Panel must be installed before the code below can run. These are shell
# commands, not Python, so run ONE of them in a terminal:
#
#   conda install -c pyviz panel
#
#   pip install panel


import panel as pn

# Bivariate plot of Trade against GDP, grouped by province, using Panel's
# DiscreteSlider as the widget for the 'Province' dimension.
df.hvplot.bivariate(
    x='Trade',
    y='GDP',
    width=600,
    groupby='Province',
    widgets={'Province': pn.widgets.DiscreteSlider},
)


# Drop-down selectors for the columns plotted on the x and y axes.
x = pn.widgets.Select(
    name='x',
    options=['Year', 'Population', 'Fix Investment', 'Trade', 'Fiscal Expenditure', 'Urban Income'],
)
y = pn.widgets.Select(
    name='y',
    options=['GDP', 'Population', 'Fix Investment', 'Trade', 'Fiscal Expenditure', 'Urban Income'],
)

# Drop-down selector for the plot type; 'scatter' is the initial choice.
kind = pn.widgets.Select(
    name='kind',
    value='scatter',
    options=['bivariate', 'scatter'],
)

# The widgets themselves are passed as the plot arguments, then the widget
# box and the plot are placed together in one row.
plot = df.hvplot(
    x=x,
    y=y,
    kind=kind,
    colorbar=False,
    width=600,
)
pn.Row(pn.WidgetBox(x, y, kind), plot)


# Drop-down selectors for the columns plotted on the x and y axes.
x = pn.widgets.Select(
    name='x',
    options=['Year', 'Population', 'Fix Investment', 'Trade', 'Fiscal Expenditure', 'Urban Income'],
)
y = pn.widgets.Select(
    name='y',
    options=['GDP', 'Population', 'Fix Investment', 'Trade', 'Fiscal Expenditure', 'Urban Income'],
)

# Drop-down selector for the plot type; 'scatter' is the initial choice.
kind = pn.widgets.Select(
    name='kind',
    value='scatter',
    options=['line', 'bivariate', 'scatter'],
)

# Checkbox labelled 'Province' and a color picker that starts on red.
by_province = pn.widgets.Checkbox(name='Province')
color = pn.widgets.ColorPicker(value='#ff0000')

@pn.depends(by_province, color)
def by_province_name(by_province, color):
    """Pick the value used to color the plot.

    Declared with ``pn.depends`` on the ``by_province`` checkbox and the
    ``color`` picker widgets.

    Args:
        by_province: Truthy when coloring by province is requested.
        color: Fallback color to use otherwise.

    Returns:
        The column name ``'Province'`` if ``by_province`` is truthy,
        otherwise ``color`` unchanged.
    """
    if by_province:
        return 'Province'
    return color

# Build the plot from the widgets; the color argument `c` comes from the
# by_province_name function rather than from a widget directly.
plot = df.hvplot(
    x=x,
    y=y,
    kind=kind,
    c=by_province_name,
    colorbar=False,
    width=600,
)

# Place the widget box and the plot together in one row.
pn.Row(pn.WidgetBox(x, y, kind, color, by_province), plot)


# Slider for the minimum GDP to keep. It runs from 0 up to the largest GDP
# in the data, rounded to the nearest integer.
# Series.max() is used instead of the builtin max(): it is vectorized and
# skips missing values, whereas max() over a Series containing NaN can
# yield NaN, which round() rejects.
gdp_slider = pn.widgets.FloatSlider(
    name='Minimum GDP',
    start=0,
    end=round(df['GDP'].max()),
    value=0,
)
gdp_slider


import numpy as np

# Wrap the DataFrame in hvPlot's interactive API (created with width=700) so
# that widgets can be used inside ordinary pandas expressions.
dfi = df.interactive(width=700)

# Keep only the rows whose GDP is greater than the slider's value.
dfi[dfi['GDP'] > gdp_slider]


import numpy as np

# Histogram of GDP for the rows above the slider threshold; the bins are
# given as 30 evenly spaced values between 0 and 10.
dfi[dfi['GDP'] > gdp_slider].hvplot.hist(
    y='GDP',
    bins=np.linspace(0, 10, 30),
)


# Bivariate plot of Trade against GDP for the same filtered rows.
dfi[dfi['GDP'] > gdp_slider].hvplot.bivariate(
    x='Trade',
    y='GDP',
    width=700,
)


# Create the hvPlot explorer for the whole DataFrame.
hvexplorer = hvplot.explorer(df)
hvexplorer


# Ask the explorer for the code that corresponds to its current plot.
hvexplorer.plot_code()

# Result recorded alongside the call (presumably its output in the
# original notebook); kept as a comment so it is not a stray expression:
#   "df.hvplot(by=['Province'], kind='scatter', x='Trade', y=['GDP'])"


# The same call written out by hand, with a title added.
df.hvplot(by=['Province'], kind='scatter', title='GDP Scatter', x='Trade', y=['GDP'])


# Configure the explorer from code instead of through its GUI.
# `param.update` is used because `param.set_param` is deprecated since
# Param 2.0; it takes the same keyword arguments.
hvexplorer.param.update(kind='scatter', x='Population', y_multi=['GDP'], by=['Province'])
hvexplorer.labels.title = 'GDP Scatter'


# Export the explorer's customized settings as a dict of hvplot keyword
# arguments.
settings = hvexplorer.settings()
settings

# Value recorded alongside `settings` (presumably its output in the
# original notebook); kept as a comment so it is not a stray expression:
#   {'by': ['Province'],
#    'kind': 'scatter',
#    'title': 'GDP Scatter',
#    'x': 'Population',
#    'y': ['GDP']}


# Recreate the explorer's plot by unpacking the settings into hvplot.
df.hvplot(**settings)


# Create the output directory first (a no-op if it already exists), since
# saving into a missing directory would presumably fail.
from pathlib import Path

Path('./results').mkdir(parents=True, exist_ok=True)

# Write the explorer's current plot to an HTML file.
hvexplorer.save('./results/plot.html')

	prov	gdpr	year	gdp	pop	finv	trade	fexpen	uinc
0	Guangdong	First	2000	1.074125	8.650000	0.314513	1.408147	0.108032	0.976157
1	Guangdong	First	2001	1.203925	8.733000	0.348443	1.501391	0.132133	1.041519
2	Guangdong	First	2002	1.350242	8.842000	0.385078	1.830169	0.152108	1.113720
3	Guangdong	First	2003	1.584464	8.963000	0.481320	2.346735	0.169563	1.238043
4	Guangdong	First	2004	1.886462	9.052298	0.587002	2.955899	0.185295	1.362765

	Province	GDP Rank	Year	GDP	Population	Fix Investment	Trade	Fiscal Expenditure	Urban Income
0	Guangdong	First	2000	1.074125	8.650000	0.314513	1.408147	0.108032	0.976157
1	Guangdong	First	2001	1.203925	8.733000	0.348443	1.501391	0.132133	1.041519
2	Guangdong	First	2002	1.350242	8.842000	0.385078	1.830169	0.152108	1.113720
3	Guangdong	First	2003	1.584464	8.963000	0.481320	2.346735	0.169563	1.238043
4	Guangdong	First	2004	1.886462	9.052298	0.587002	2.955899	0.185295	1.362765

Table of Contents

1. Data Preparation

1.1 Read the Dataset

1.2 Change variable names

2. Groupby Method

2.1 Pandas-like API

2.2 Simple box plot

2.3 Change the widget location

2.4 Refine the widgets with Panel

3. Using Widgets as Arguments

4. Using functions

5. Interactive

5.1 Create a float slider

5.2 Filter data

5.3 Create a histogram

5.4 Create bivariate

6. Explorer

6.1 For the whole dataset

6.2 Plot code

6.3 Customized settings

6.4 Save the plot

Summary