-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathregressionsgerade_ausreisser.R
31 lines (28 loc) · 1.37 KB
/
regressionsgerade_ausreisser.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
library(ggplot2)
library(dplyr)
# Load the survey data frame from the remote RDS file.
qm <- "https://data.tadaa-data.de/qm_survey_ss2017.rds" %>%
  url() %>%
  readRDS()

# Subset used for the "without outliers" figures: rows with alter <= 28.
qm_bis_28 <- qm %>% filter(alter <= 28)

# Correlation between alter and beziehungen on all rows, rounded to two
# decimals; inserted into the plot subtitle as the "dunkel" value.
dunkel <- cor(qm$alter, qm$beziehungen) %>% round(2)

# Same correlation on the restricted subset; inserted into the plot subtitle
# as the "hell" value.
hell <- cor(qm_bis_28$alter, qm_bis_28$beziehungen) %>% round(2)
# Scatter plot of alter vs. beziehungen with two linear regression lines:
# one fitted on all rows of `qm`, one fitted only on rows with alter <= 28.
# Relies on `qm`, `dunkel` and `hell` being defined earlier in the script.
qm %>%
  mutate(
    # presumably a z-standardisation of alter (helper from tadaatoolbox)
    alter_z = tadaatoolbox::z(alter),
    # Rows with alter_z >= 2 are labelled as outliers ("Ausreißer").
    # NOTE(review): points are flagged via alter_z, whereas the second fit
    # and `hell` use the fixed cutoff alter <= 28 -- confirm both agree.
    Modellierbarkeit = ifelse(alter_z < 2, "fitted", "Ausreißer")
  ) %>%
  ggplot(aes(
    x = alter, y = beziehungen, alpha = Modellierbarkeit,
    shape = Modellierbarkeit, color = Modellierbarkeit
  )) +
  # Fit on the full data; inherit.aes = FALSE keeps the grouping aesthetics
  # above from being applied to this layer.
  geom_smooth(
    data = qm, aes(x = alter, y = beziehungen),
    inherit.aes = FALSE, method = "lm", color = "cadetblue", se = FALSE
  ) +
  geom_jitter(width = .2, height = .3, size = 2) +
  # Fit on the restricted data (alter <= 28), drawn in the lighter colour.
  geom_smooth(
    data = filter(qm, alter <= 28), aes(x = alter, y = beziehungen),
    inherit.aes = FALSE, method = "lm", color = "#4dccff", se = FALSE
  ) +
  scale_x_continuous(breaks = scales::pretty_breaks()) +
  scale_y_continuous(breaks = scales::pretty_breaks()) +
  # Named values pin each style to its level, so the mapping does not depend
  # on level ordering or on which levels are present in the data.
  scale_alpha_manual(values = c("Ausreißer" = .8, "fitted" = .3)) +
  scale_shape_manual(values = c("Ausreißer" = 13, "fitted" = 19)) +
  scale_color_manual(
    values = c("Ausreißer" = "dark red", "fitted" = "dark gray")
  ) +
  labs(
    title = "Modellierbarkeit des Zusammenhangs zw. Alter und Beziehungsanzahl",
    subtitle = paste0(
      "Regressionsgerade mit Ausreißern (dunkel; r = ", dunkel,
      ") und ohne Ausreißer (hell; r = ", hell, ")"
    ),
    x = "Alter", y = "Beziehungen"
  )