# Derive the decade each house was built in, plus a text label that folds
# the earliest and latest decades into open-ended categories.
duke_forest <- duke_forest |>
  mutate(
    # Integer division drops the last digit of the year (e.g. 1987 -> 1980).
    decade_built = 10 * (year_built %/% 10),
    # The two conditions are mutually exclusive, so their order is irrelevant.
    # Note: decade 1940 covers years 1940-1949, so "1940 or before" includes
    # houses built through 1949.
    decade_built_cat = case_when(
      decade_built >= 1990 ~ "1990 or after",
      decade_built <= 1940 ~ "1940 or before",
      .default = as.character(decade_built)
    )
  )
# Average house area within each decade category (one row per category).
mean_area_decade <- duke_forest |>
  group_by(decade_built_cat) |>
  summarize(
    mean_area = mean(area),
    # Single grouping variable, so the result is ungrouped either way;
    # stated explicitly for clarity.
    .groups = "drop"
  )
# Lollipop chart: a dot at each decade category's mean area, with a stem
# drawn from zero out to the dot.
ggplot(
  mean_area_decade,
  aes(x = mean_area, y = decade_built_cat)
) +
  geom_point(size = 4) +
  # x = 0 is mapped inside aes() (not set as a fixed parameter) so the stem
  # start takes part in the x scale; y is inherited from the plot mapping.
  geom_segment(
    aes(x = 0, xend = mean_area, yend = decade_built_cat)
  ) +
  labs(
    title = "Mean area of houses in Duke Forest, by decade built",
    x = "Mean area (square feet)",
    y = "Decade built"
  )