diff --git a/code/00_current-analysis.R b/code/00_current-analysis.R index 80e5ada..d66cbfc 100644 --- a/code/00_current-analysis.R +++ b/code/00_current-analysis.R @@ -9,7 +9,7 @@ # (3.4) Artwork sequences # (3.5) Topics # -# input: ../data/haum/event_logfiles_glossar_2023-10-29_10-26-42.csv +# input: results/haum/event_logfiles_glossar_2023-11-03_17-46-28.csv # output: # # last mod: 2023-11-15, NW @@ -27,7 +27,7 @@ library(bupaverse) #--------------- (1) Read data --------------- -dat <- read.table("../data/haum/event_logfiles_glossar_2023-11-03_17-46-28.csv", +dat <- read.table("results/haum/event_logfiles_glossar_2023-11-03_17-46-28.csv", sep = ";", header = TRUE) dat$date <- as.POSIXct(dat$date) dat$date.start <- as.POSIXct(dat$date.start) diff --git a/code/00_pm.py b/code/00_pm.py index 7324041..7e07a36 100644 --- a/code/00_pm.py +++ b/code/00_pm.py @@ -12,7 +12,7 @@ from sklearn.cluster import KMeans ###### Load data and create event logs ###### -dat = pd.read_csv("../data/haum/event_logfiles_glossar_2023-11-03_17-46-28.csv", sep = ";") +dat = pd.read_csv("results/haum/event_logfiles_glossar_2023-11-03_17-46-28.csv", sep = ";") dat = dat[dat.date < "2020-03-13"] # --> only pre corona (before artworks were updated) diff --git a/code/01_clustering.R b/code/01_clustering.R index ff3ec2a..8648934 100644 --- a/code/01_clustering.R +++ b/code/01_clustering.R @@ -9,7 +9,7 @@ # # input: results/eval_heuristics_artworks.csv # results/eval_all-miners_complete.csv -# ../data/haum/event_logfiles_glossar_2023-11-03_17-46-28.csv +# results/haum/event_logfiles_glossar_2023-11-03_17-46-28.csv # output: ../figures/clustering_heuristics.pdf # ../figures/clustering_heuristics.png # ../figures/processmaps/dfg_complete_R.pdf @@ -143,7 +143,7 @@ for (art in as.numeric(rownames(eval_inductive))) { #--------------- (4) Read event logs --------------- -dat <- read.table("../data/haum/event_logfiles_glossar_2023-11-03_17-46-28.csv", +dat <- 
read.table("results/haum/event_logfiles_glossar_2023-11-03_17-46-28.csv", sep = ";", header = TRUE) dat$date <- as.POSIXct(dat$date) dat$date.start <- as.POSIXct(dat$date.start) diff --git a/code/01_preprocessing_8o8m.R b/code/01_preprocessing_8o8m.R index e9690b9..b34f021 100644 --- a/code/01_preprocessing_8o8m.R +++ b/code/01_preprocessing_8o8m.R @@ -13,7 +13,7 @@ datraw <- parse_logfiles(folders, path = "../data/8o8m/LogFiles/") #artworks <- unique(na.omit(datraw$artwork)) # export data -write.table(datraw, paste0("../data/8o8m/raw_logfiles_", now, ".csv"), +write.table(datraw, paste0("results/8o8m/raw_logfiles_", now, ".csv"), sep = ";", row.names = FALSE) #datraw[is.na(datraw$artwork), ] @@ -32,6 +32,6 @@ topics <- extract_topics(artworks, xmlfiles = paste0(artworks, "_en.xml"), # extracted like this? (It works fine for the English versions...) # export data -write.table(datlogs, paste0("../data/8o8m/event_logfiles_", now, ".csv"), +write.table(datlogs, paste0("results/8o8m/event_logfiles_", now, ".csv"), sep = ";", row.names = FALSE) diff --git a/code/01_preprocessing_haum.R b/code/01_preprocessing_haum.R index 4df1f24..8aabb9f 100644 --- a/code/01_preprocessing_haum.R +++ b/code/01_preprocessing_haum.R @@ -30,12 +30,12 @@ now <- format(Sys.time(), "%Y-%m-%d_%H-%M-%S") #datraw <- parse_logfiles(folders, path) -datraw <- read.table("../data/haum/raw_logfiles_2023-10-25_16-20-45.csv", +datraw <- read.table("results/haum/raw_logfiles_2023-10-25_16-20-45.csv", sep = ";", header = TRUE) ## Export data -#write.table(datraw, paste0("../data/haum/raw_logfiles_small_", now, ".csv"), +#write.table(datraw, paste0("results/haum/raw_logfiles_small_", now, ".csv"), # sep = ";", row.names = FALSE) #--------------- (2) Create event logs --------------- @@ -107,7 +107,7 @@ dat2 <- merge(dat1, sfdat, by.x = "date", by.y = "date", all.x = TRUE) ## Export data -write.table(dat2, paste0("../data/haum/event_logfiles_glossar_", now, ".csv"), +write.table(dat2, 
paste0("results/haum/event_logfiles_glossar_", now, ".csv"), sep = ";", row.names = FALSE) # TODO: Maybe add infos about artworks? diff --git a/code/03_plots_8o8m.R b/code/03_plots_8o8m.R index 4ad9350..0a84d4f 100644 --- a/code/03_plots_8o8m.R +++ b/code/03_plots_8o8m.R @@ -5,7 +5,7 @@ devtools::load_all("../../../../software/mtt") library(ggplot2) # Read data -datlogs <- read.table("../data/8o8m/event_logfiles_2023-09-22_18-54-49.csv", +datlogs <- read.table("results/8o8m/event_logfiles_2023-09-22_18-54-49.csv", sep = ";", header = TRUE) datlogs$date <- as.Date(datlogs$date.start) datlogs$date.start <- as.POSIXct(datlogs$date.start) diff --git a/code/03_plots_haum.R b/code/03_plots_haum.R index 34bbaac..58fa3c1 100644 --- a/code/03_plots_haum.R +++ b/code/03_plots_haum.R @@ -7,7 +7,7 @@ library(lattice) #plot(1:10, col = cc, pch = 16, cex = 2) # Read data -datlogs <- read.table("../data/haum/event_logfiles_metadata_2023-09-23_01-31-30.csv", +datlogs <- read.table("results/haum/event_logfiles_metadata_2023-09-23_01-31-30.csv", sep = ";", header = TRUE) datlogs$date <- as.Date(datlogs$date) datlogs$date.start <- as.POSIXct(datlogs$date.start) diff --git a/code/04_modeling_haum.R b/code/04_modeling_haum.R index 6cd676d..5124f4f 100644 --- a/code/04_modeling_haum.R +++ b/code/04_modeling_haum.R @@ -2,7 +2,7 @@ # Read data -dat0 <- read.table("../data/haum/event_logfiles_2023-10-25_17-29-52.csv", +dat0 <- read.table("results/haum/event_logfiles_2023-10-25_17-29-52.csv", sep = ";", header = TRUE) dat0$date.start <- as.POSIXct(dat0$date.start) dat0$date.stop <- as.POSIXct(dat0$date.stop) diff --git a/code/check_traces.R b/code/check_traces.R index cf26e79..72c2364 100644 --- a/code/check_traces.R +++ b/code/check_traces.R @@ -2,9 +2,9 @@ # Read data -# dat <- read.table("../data/haum/event_logfiles_metadata_2023-09-23_01-31-30.csv", +# dat <- read.table("results/haum/event_logfiles_metadata_2023-09-23_01-31-30.csv", # sep = ";", header = TRUE) -dat <- 
read.table("../data/haum/event_logfiles_small_metadata_2023-10-15_10-08-43.csv", +dat <- read.table("results/haum/event_logfiles_small_metadata_2023-10-15_10-08-43.csv", sep = ";", header = TRUE) dat$date <- as.Date(dat$date) dat$date.start <- as.POSIXct(dat$date.start) diff --git a/code/read_trans_matrix.R b/code/read_trans_matrix.R index aa67370..5ac83ac 100644 --- a/code/read_trans_matrix.R +++ b/code/read_trans_matrix.R @@ -1,6 +1,6 @@ # setwd("C:/Users/nwickelmaier/Nextcloud/Documents/MDS/2023ss/60100_master_thesis/code") -dat <- as.data.frame(do.call(rbind, XML::xmlToList("../data/haum/trans.xml"))) +dat <- as.data.frame(do.call(rbind, XML::xmlToList("../museums/haum/trans.xml"))) dat$a <- as.numeric(dat$a) dat$b <- as.numeric(dat$b) @@ -16,7 +16,7 @@ plot(ty ~ tx, dat, xlim = c(0, 3840), ylim = c(0, 2160)) # read log data -datlogs <- read.table("../data/haum/event_logfiles_metadata_2023-09-23_01-31-30.csv", +datlogs <- read.table("results/haum/event_logfiles_metadata_2023-09-23_01-31-30.csv", sep = ";", header = TRUE) datlogs$date <- as.Date(datlogs$date) datlogs$date.start <- as.POSIXct(datlogs$date.start)