New Variables `..sumprop..` and `..sumpct..` in the `bin` Statistic

In [1]:
import pandas as pd

from lets_plot import *
In [2]:
# Initialize lets-plot for HTML output so plots render inline in the notebook.
LetsPlot.setup_html()
In [3]:
# Load the mpg dataset from the lets-plot docs repository, then show its
# dimensions and the first few rows.
df = pd.read_csv(
    "https://raw.githubusercontent.com/JetBrains/lets-plot-docs/master/data/mpg.csv"
)
print(df.shape)
df.head()
(234, 12)
Out[3]:
Unnamed: 0 manufacturer model displ year cyl trans drv cty hwy fl class
0 1 audi a4 1.8 1999 4 auto(l5) f 18 29 p compact
1 2 audi a4 1.8 1999 4 manual(m5) f 21 29 p compact
2 3 audi a4 2.0 2008 4 manual(m6) f 20 31 p compact
3 4 audi a4 2.0 2008 4 auto(av) f 21 30 p compact
4 5 audi a4 2.8 1999 6 auto(l5) f 16 26 p compact
In [4]:
# Base plot reused by every histogram below: `cty` on the x axis,
# one facet column per distinct `cyl` value.
g = (
    ggplot(df, aes(x="cty"))
    + facet_grid(x="cyl")
)
In [5]:
# Baseline: no y mapping, so the histogram uses the bin stat's default y
# (per-bin counts). Bins are 5 units wide and aligned so one is centered at 5.
g + geom_histogram(
    binwidth=5,
    center=5,
)
Out[5]:
In [6]:
# Map y to the computed `..sumprop..` variable: bar heights become proportions,
# so the sum of values in each group is equal to 1.
g + geom_histogram(
    aes(y="..sumprop.."),
    binwidth=5,
    center=5,
)
Out[6]:
In [7]:
# Map y to the computed `..sumpct..` variable: bar heights become percentages,
# so the sum of values in each group is equal to 100.
g + geom_histogram(
    aes(y="..sumpct.."),
    binwidth=5,
    center=5,
)
Out[7]: