import pandas as pd
import altair as alt


from vega_datasets import data


# Load the Seattle weather sample dataset shipped with vega_datasets.
df = data.seattle_weather()
# Print a summary of the frame: column names, non-null counts and dtypes.
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 1461 entries, 0 to 1460
Data columns (total 6 columns):
 #   Column         Non-Null Count  Dtype         
---  ------         --------------  -----         
 0   date           1461 non-null   datetime64[ns]
 1   precipitation  1461 non-null   float64       
 2   temp_max       1461 non-null   float64       
 3   temp_min       1461 non-null   float64       
 4   wind           1461 non-null   float64       
 5   weather        1461 non-null   object        
dtypes: datetime64[ns](1), float64(4), object(1)
memory usage: 68.6+ KB


# Derive string-valued calendar columns from the datetime `date` column so the
# charts below can use them as categories. The vectorised `.dt.strftime`
# accessor formats the whole column in one call instead of invoking a Python
# lambda once per row.
df['year'] = df['date'].dt.strftime('%Y')       # four-digit year, e.g. '2012'
df['month'] = df['date'].dt.strftime('%m')      # zero-padded month number
df['day'] = df['date'].dt.strftime('%a')        # abbreviated weekday name
df['dayOfYear'] = df['date'].dt.strftime('%j')  # zero-padded day of the year


# Preview the first rows, including the newly added columns.
df.head()


# Bar chart: `count` aggregate of precipitation for each year.
c = (
    alt.Chart(df)
    .mark_bar()
    .encode(
        x=alt.X('year'),
        y=alt.Y('count(precipitation)'),
        tooltip=['year', 'count(precipitation)'],
    )
)
c


# Bar chart: total precipitation for each year.
c = (
    alt.Chart(df)
    .mark_bar()
    .encode(
        x=alt.X('year'),
        y=alt.Y('sum(precipitation)'),
        tooltip=['year', 'sum(precipitation)'],
    )
)

c


# Bar chart: smallest precipitation value recorded in each year.
c = (
    alt.Chart(df)
    .mark_bar()
    .encode(
        x=alt.X('year'),
        y=alt.Y('min(precipitation)'),
        tooltip=['year', 'min(precipitation)'],
    )
)

c


# Bar chart: largest precipitation value recorded in each year.
c = (
    alt.Chart(df)
    .mark_bar()
    .encode(
        x=alt.X('year'),
        y=alt.Y('max(precipitation)'),
        tooltip=['year', 'max(precipitation)'],
    )
)

c


# Bar chart: average precipitation value for each year.
c = (
    alt.Chart(df)
    .mark_bar()
    .encode(
        x=alt.X('year'),
        y=alt.Y('mean(precipitation)'),
        tooltip=['year', 'mean(precipitation)'],
    )
)

c


# Horizontal bar chart: total precipitation per year, with each bar coloured
# by month so the monthly contributions are visible.
c = (
    alt.Chart(df)
    .mark_bar()
    .encode(
        y=alt.Y('year'),
        x=alt.X('sum(precipitation)'),
        color=alt.Color('month'),
        tooltip=['year', 'month', 'sum(precipitation)'],
    )
)

c


# Line chart: precipitation against date over the whole dataset.
# `.interactive()` turns on pan and zoom.
c = (
    alt.Chart(df)
    .mark_line()
    .encode(
        x=alt.X('date'),
        y=alt.Y('precipitation'),
        tooltip=['date', 'precipitation'],
    )
    .interactive()
)
c


# Line chart restricted to rows dated strictly after 2011-12-31 and strictly
# before 2012-02-01, so the individual daily values are easier to read.
c = (
    alt.Chart(df[(df['date'] > '2011-12-31') & (df['date'] < '2012-02-01')])
    .mark_line()
    .encode(
        x=alt.X('date'),
        y=alt.Y('precipitation'),
        tooltip=['date', 'precipitation'],
    )
    .interactive()
)
c


# Line chart: precipitation against day of the year, one coloured line per
# year, so the years are overlaid on a shared axis.
c = (
    alt.Chart(df)
    .mark_line()
    .encode(
        x=alt.X('dayOfYear'),
        y=alt.Y('precipitation'),
        color=alt.Color('year'),
        tooltip=['date', 'precipitation'],
    )
    .interactive()
)
c


# Line chart: total precipitation per month, one coloured line per year.
#
# The tooltip lists only the grouping fields (`month`, `year`) and the
# aggregate itself. Vega-Lite treats every non-aggregated field that appears
# in an encoding as a group-by key, so putting the raw `date` and
# `precipitation` fields in the tooltip would split the data into per-day
# groups and the chart would no longer show monthly sums.
c = (
    alt.Chart(df)
    .mark_line()
    .encode(
        x='month',
        y='sum(precipitation)',
        color='year',
        tooltip=['month', 'year', 'sum(precipitation)'],
    )
    .interactive()
)
c


# Area chart: total precipitation per month, with one coloured area per year.
c = (
    alt.Chart(df)
    .mark_area()
    .encode(
        x=alt.X('month'),
        y=alt.Y('sum(precipitation)'),
        color=alt.Color('year'),
        tooltip=['month', 'year', 'sum(precipitation)'],
    )
    .interactive()
)
c

	date	precipitation	temp_max	temp_min	wind	weather	year	month	day	dayOfYear
0	2012-01-01	0.0	12.8	5.0	4.7	drizzle	2012	01	Sun	001
1	2012-01-02	10.9	10.6	2.8	4.5	rain	2012	01	Mon	002
2	2012-01-03	0.8	11.7	7.2	2.3	rain	2012	01	Tue	003
3	2012-01-04	20.3	12.2	5.6	4.7	rain	2012	01	Wed	004
4	2012-01-05	1.3	8.9	2.8	6.1	rain	2012	01	Thu	005

Bar, Line and Area Plots with Altair and Python

Standard Imports

Seattle Weather Data

Adding Some Categorical Values

Bar Charts

Altair Aggregation

1. Count

2. Sum

3. Min

4. Max

5. Mean

Improving the charts

Line Charts

Line Charts and Aggregation

Area Chart!

The Original Video