library(fable)
library(tsibble)
library(lubridate)
+library(ggplot2)
-logfile <- file("data/photos.vanrenterghem.biz.access.kvp.log")
+logfile <- file("data/photos.vanrenterghem.biz.access.kvp.log.1")
apachelog <- stream_in(logfile)
#apachelog$time <- gsub("\\[|\\]", "", apachelog$time)
apachelog %>%
mutate(time = gsub("\\[|\\]", "", time),
- time = dmy_hms(time)) %>%
- group_by(time) %>%
+ time = dmy_hms(time),
+ datehour = floor_date(time, unit = "hour")
+ ) %>%
+ filter(time > ymd_h("2018-08-22 12")) %>%
+ group_by(datehour) %>%
summarise(hits = n()) ->
- apachelog
+ apachelog_tidy
+
+apachelog_tsbl <- as.tsibble(apachelog_tidy, index = datehour)
+apachelog_tsbl %>%
+ ARIMA(log(hits)) %>%
+ forecast(h=5) %>%
+ autoplot +
+ ggtitle("Forecasting website hits using apache log only") +
+ xlab("Date time")
-as.tsibble(apachelog, index = time)