Data Science Desktop Survival Guide
by Graham Williams |
|||||
Analysis of Variance (ANOVA)
# One-way ANOVA worked out step by step with dplyr verbs.
# Reads columns `x` (grouping variable) and `y` (response) from `ds` and
# yields a single-row summary with the F statistic and its p-value.
ds %>%
  group_by(x) %>%
  # Stage 1: reduce each level of x to its size, mean and within-group
  # sum of squared deviations.
  summarise(
    size = n(),
    centre = mean(y),
    within = sum((y - centre)^2)
  ) %>%
  # Stage 2: collapse the per-group rows into the ANOVA table entries.
  # Later arguments reuse the values defined by earlier ones.
  summarise(
    # Overall mean, recovered as the size-weighted mean of the group means.
    om = sum(size * centre) / sum(size),
    # Between-group sum of squares.
    ssq = sum(size * (centre - om)^2),
    # Residual (within-group) sum of squares, pooled over the groups.
    rssq = sum(within),
    # Numerator degrees of freedom: number of groups minus one.
    df1 = n_distinct(x) - 1,
    mse = ssq / df1,
    # Denominator degrees of freedom: observations minus number of groups.
    df2 = sum(size) - n_distinct(x),
    rmse = rssq / df2,
    # Ratio of between-group to within-group mean squares.
    F = mse / rmse,
    # Upper-tail probability of the F distribution at the observed ratio.
    P = pf(F, df1, df2, lower.tail = FALSE)
  )
|