Slide 9
Slide 9 text
食材の準備 =
欠損値
messy
データ準備・前処理
# Packages ----
library(nycflights13)
library(skimr)
library(tidyverse)

# First, look at the raw data before changing anything ----
skim(flights)     # per-column summary
glimpse(flights)  # column names, types and leading values
# Strip out what is not needed and build the cleaned data set ----
flight_data <-
  flights %>%
  mutate(
    # Two-level outcome: an arr_delay of 30 or more is "late", anything else
    # "on_time". A missing arr_delay stays NA here and is dropped further down.
    arr_delay = factor(if_else(arr_delay >= 30, "late", "on_time")),
    # Calendar date of time_hour. Base as.Date() on a POSIXct defaults to
    # tz = "UTC", which shifts late-evening local departures onto the next
    # day; lubridate::as_date() uses the time zone stored on the column.
    date = lubridate::as_date(time_hour)
  ) %>%
  # Keep only flights that have a weather record for the same origin and hour.
  # NOTE(review): none of the columns selected below appear to come from
  # `weather`, so this join acts purely as a row filter - confirm intended.
  inner_join(weather, by = c("origin", "time_hour")) %>%
  # Retain only the columns used downstream.
  select(
    dep_time, flight, origin, dest, air_time, distance,
    carrier, date, arr_delay, time_hour
  ) %>%
  # Drop every row that still has a missing value in any retained column.
  drop_na() %>%
  # Encode the remaining character columns as factors.
  mutate(across(where(is.character), as.factor))