Lebih dari 2 variabel penjelas

Regresi Tingkat Menengah di R

Richie Cotton

Data Evangelist at DataCamp

Dari pertemuan lalu

ggplot(
  fish,
  aes(length_cm, height_cm, color = mass_g)
) +
  geom_point() +
  scale_color_viridis_c(option = "inferno")

sebar-warna-panjang-tinggi-massa-inferno.png

Regresi Tingkat Menengah di R

Facet per spesies

ggplot(
  fish,
  aes(length_cm, height_cm, color = mass_g)
) +
  geom_point() +
  scale_color_viridis_c(option = "inferno") +
  facet_wrap(vars(species))

sebar-panjang-tinggi-massa-spesies.png

Regresi Tingkat Menengah di R

Tingkat interaksi berbeda

Tanpa interaksi

lm(mass_g ~ length_cm + height_cm + species + 0, data = fish)

Interaksi 2-arah antar pasangan variabel

lm(
  mass_g ~ length_cm + height_cm + species + length_cm:height_cm + length_cm:species + height_cm:species + 0, 
  data = fish
)

Interaksi 3-arah di antara ketiga variabel

lm(
  mass_g ~ length_cm + height_cm + species + length_cm:height_cm + length_cm:species + height_cm:species + length_cm:height_cm:species + 0, 
  data = fish
)
Regresi Tingkat Menengah di R

Semua interaksi

lm(
  mass_g ~ length_cm + height_cm + species + length_cm:height_cm + length_cm:species + height_cm:species + length_cm:height_cm:species + 0, 
  data = fish
)
lm(
  mass_g ~ length_cm * height_cm * species + 0, 
  data = fish
)
Regresi Tingkat Menengah di R

Hanya interaksi 2-arah

lm(
  mass_g ~ length_cm + height_cm + species + length_cm:height_cm + length_cm:species + height_cm:species + 0, 
  data = fish
)
lm(
  mass_g ~ (length_cm + height_cm + species) ^ 2 + 0, 
  data = fish
)
lm(
  mass_g ~ I(length_cm) ^ 2 + height_cm + species + 0, 
  data = fish
)
1 Untuk kuadratkan variabel penjelas, lihat "Introduction to Regression in R", Bab 2, "Transforming variables"
Regresi Tingkat Menengah di R

Alur prediksi

mdl_mass_vs_all <- lm(mass_g ~ length_cm * height_cm * species * 0, data = fish)

explanatory_data <- expand_grid(
  length_cm = seq(5, 60, 6),
  height_cm = seq(2, 20, 2),
  species = unique(fish$species)
)

prediction_data <- explanatory_data %>% 
  mutate(mass_g = predict(mdl_mass_vs_all, explanatory_data))
Regresi Tingkat Menengah di R

Memvisualisasikan prediksi

ggplot(
  fish,
  aes(length_cm, height_cm, color = mass_g)
) +
  geom_point() +
  scale_color_viridis_c(option = "inferno") +
  facet_wrap(vars(species)) +
  geom_point(
    data = prediction_data, 
    size = 3, shape = 15
  )

sebar-panjang-tinggi-massa-spesies-pred.png

Regresi Tingkat Menengah di R

Ayo berlatih!

Regresi Tingkat Menengah di R

Preparing Video For Download...