Adjusted some things after getting complete set of log files
This commit is contained in:
parent
fdb6c94b25
commit
45bf0d9af9
@ -14,6 +14,8 @@
|
||||
|
||||
# setwd("C:/Users/nwickelmaier/Nextcloud/Documents/MDS/2023ss/60100_master_thesis/code")
|
||||
|
||||
#+ setup, include = FALSE
|
||||
knitr::opts_chunk$set(warning = FALSE, message = FALSE)
|
||||
|
||||
#' # Preprocessing raw log files into data frame
|
||||
|
||||
@ -34,17 +36,11 @@
|
||||
|
||||
#' Choose which folders with raw log files should be included:
|
||||
|
||||
folders <- c(
|
||||
"_2016"
|
||||
, "_2017a"
|
||||
, "_2017b"
|
||||
, "_2018"
|
||||
)
|
||||
folders <- "all"
|
||||
|
||||
dirpaths <- paste0("../data/HAUM Logs/", folders)
|
||||
dirpaths <- paste0("../data/haum_logs_2016-2023/", folders)
|
||||
|
||||
fnames <- dir(dirpaths, pattern = "*.log", full.names = TRUE)
|
||||
# TODO: Enter all data
|
||||
length(fnames)
|
||||
head(fnames)
|
||||
|
||||
@ -59,6 +55,7 @@ head(dat$logs)
|
||||
# incomplete final line found on '_2016/2016_11_18-11_31_0.log'
|
||||
# incomplete final line found on '_2016/2016_11_18-11_38_30.log'
|
||||
# incomplete final line found on '_2016/2016_11_18-11_40_36.log'
|
||||
# ...
|
||||
|
||||
## --> files have a last line that looks like a binary entry??
|
||||
|
||||
@ -74,6 +71,7 @@ d2 <- dim(dat)[1]
|
||||
|
||||
#' The files contain `r d1-d2` corrupt lines that were remooved from the data.
|
||||
|
||||
|
||||
#' ### Extract relevant infos
|
||||
|
||||
date <- sapply(dat$logs, gsub,
|
||||
@ -124,9 +122,12 @@ dat$y <- moves[,2]
|
||||
dat$scale <- moves[,3]
|
||||
dat$rotation <- moves[,4]
|
||||
|
||||
dat$logs <- NULL
|
||||
# remove original log files from data so file becomes smaller
|
||||
|
||||
str(dat)
|
||||
|
||||
head(dat[, 3:ncol(dat)], 20)
|
||||
head(dat[, 2:ncol(dat)], 20)
|
||||
|
||||
## TODO: Replace artwork and popup numbers with informative strings
|
||||
|
||||
|
@ -14,8 +14,10 @@ dat <- read.table("../data/rawdata_logfiles.csv", header = TRUE, sep = ";")
|
||||
# "ShowPopup", "HidePopup"))
|
||||
#
|
||||
|
||||
#dat$logs <- NULL # do not need original log files
|
||||
dat$date <- as.POSIXct(dat$date) # create date object
|
||||
dat <- dat[order(dat$date), ]
|
||||
|
||||
rownames(dat) <- NULL
|
||||
|
||||
str(dat)
|
||||
head(dat)
|
||||
@ -31,16 +33,16 @@ table(year(dat$date))
|
||||
#' Number of events total and per year
|
||||
|
||||
table(dat$event)
|
||||
# Start Application Show Application
|
||||
# 1679 1656
|
||||
# Transform start Transform stop
|
||||
# 2119815 1944618
|
||||
# Show Info Show Front
|
||||
# 71955 71043
|
||||
# Artwork/OpenCard Artwork/CloseCard
|
||||
# 64990 56750
|
||||
# ShowPopup HidePopup
|
||||
# 44070 43813
|
||||
# Artwork/CloseCard Artwork/OpenCard
|
||||
# 80026 92588
|
||||
# HidePopup Show Application
|
||||
# 59932 3179
|
||||
# Show Front Show Info
|
||||
# 106945 108113
|
||||
# ShowPopup Start Application
|
||||
# 60350 3210
|
||||
# Transform start Transform stop
|
||||
# 3219109 2966724
|
||||
# --> more "openups" than "closes" (not surprisingly)
|
||||
|
||||
table(dat$event, year(dat$date))
|
||||
@ -58,7 +60,9 @@ length(unique(as.Date(dat$date)))
|
||||
table(dat$artwork)
|
||||
lattice::barchart(table(dat$artwork))
|
||||
|
||||
|
||||
#' ## Corona Gaps
|
||||
table(diff(as.Date(dat$date)))
|
||||
dat[diff(as.Date(dat$date)) > 50, ]
|
||||
|
||||
#' ## Plots from Visualization Tool
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user