# Recode the categorical columns of `birthwt` as labelled factors.
# factor() attaches labels in the sorted order of the codes present, so this
# presumes race holds exactly three codes (White < Black < Other) and smoke
# exactly two (non-smoker < smoker) -- TODO confirm against the data source.
df <- mutate(
  birthwt,
  race = factor(race, labels = c("White", "Black", "Other")),
  smoke = factor(smoke, labels = c("Non-smoker", "Smoker"))
)
# Scatter plot: mother's age (age) vs. birth weight (bwt) with a linear fit.
p1 <- ggplot(df, aes(x = age, y = bwt)) +
  geom_point() +
  # State the formula explicitly; otherwise ggplot2 prints a
  # "`geom_smooth()` using formula = 'y ~ x'" message on every render.
  geom_smooth(method = "lm", formula = y ~ x) +
  labs(
    title = "年齢と出生時体重の関係",
    x = "母親の年齢",
    y = "出生時体重 (g)"
  )
# Scatter plot: mother's weight (lwt) vs. birth weight (bwt) with a linear fit.
p2 <- ggplot(df, aes(x = lwt, y = bwt)) +
  geom_point() +
  # State the formula explicitly; otherwise ggplot2 prints a
  # "`geom_smooth()` using formula = 'y ~ x'" message on every render.
  geom_smooth(method = "lm", formula = y ~ x) +
  labs(
    title = "母体重と出生時体重の関係",
    x = "母体重 (lbs)",
    y = "出生時体重 (g)"
  )
# Box plot: birth weight (bwt) by race, one filled box per race level.
# NOTE(review): the fill legend repeats what the x axis already shows;
# consider hiding it if the combined figure gets crowded.
p3 <- ggplot(data = df, mapping = aes(x = race, y = bwt, fill = race)) +
  geom_boxplot() +
  ggtitle("人種と出生時体重の関係") +
  xlab("人種") +
  ylab("出生時体重 (g)")
# Box plot: birth weight (bwt) by smoking status, one filled box per group.
# NOTE(review): the fill legend repeats what the x axis already shows;
# consider hiding it if the combined figure gets crowded.
p4 <- ggplot(data = df, mapping = aes(x = smoke, y = bwt, fill = smoke)) +
  geom_boxplot() +
  ggtitle("喫煙状態と出生時体重の関係") +
  xlab("喫煙状態") +
  ylab("出生時体重 (g)")
# Box plot: birth weight (bwt) by number of previous premature labours (ptl).
# ptl is converted to a factor so each distinct count gets its own box.
p5 <- ggplot(data = df, mapping = aes(x = factor(ptl), y = bwt)) +
  geom_boxplot() +
  ggtitle("早産歴と出生時体重の関係") +
  xlab("早産回数") +
  ylab("出生時体重 (g)")
# Box plot: birth weight (bwt) by hypertension indicator (ht).
# ht is converted to a factor so each distinct value gets its own box.
p6 <- ggplot(data = df, mapping = aes(x = factor(ht), y = bwt)) +
  geom_boxplot() +
  ggtitle("高血圧と出生時体重の関係") +
  xlab("高血圧") +
  ylab("出生時体重 (g)")
# Arrange the six panels in a 3 x 2 grid with patchwork:
# `|` puts two plots side by side, `/` stacks the resulting rows.
(p1 | p2) / (p3 | p4) / (p5 | p6)
# Linear model of birth weight on race, age, and their interaction
# (`race * age` expands to race + age + race:age), so the age slope
# is allowed to differ between race groups.
model <- lm(formula = bwt ~ race * age, data = df)
| Characteristic | Beta | 95% CI¹ | p-value |
|---|---|---|---|
| race | | | |
| White | — | — | |
| Black | 1,023 | -347, 2,392 | 0.14 |
| Other | 326 | -750, 1,402 | 0.6 |
| age | 21 | -4.1, 47 | 0.10 |
| race * age | | | |
| Black * age | -63 | -123, -2.0 | 0.043 |
| Other * age | -26 | -72, 20 | 0.3 |

¹ CI = Confidence Interval
# Scatter plot of mother's age vs. birth weight, coloured by race.
# The colour mapping is set at the plot level, so geom_smooth() inherits it
# and fits a separate linear trend line for each race group.
ggplot(df, aes(x = age, y = bwt, color = race)) +
  geom_point() +
  # State the formula explicitly; otherwise ggplot2 prints a
  # "`geom_smooth()` using formula = 'y ~ x'" message on every render.
  geom_smooth(method = "lm", formula = y ~ x) +
  labs(
    title = "人種別の年齢と出生時体重の関係",
    x = "母親の年齢",
    y = "出生時体重 (g)"
  )
