rapids/src/features/messages_features.R

27 lines
1.4 KiB
R

# If you want to implement extra features, source(..) a new file and duplicate the line "features <- merge(...)", then
# swap base_sms_features(...) for your own function
source("renv/activate.R")
source("src/features/messages/messages_base.R")
library("dplyr", warn.conflicts = FALSE)
messages <- read.csv(snakemake@input[[1]])
day_segments_labels <- read.csv(snakemake@input[["day_segments_labels"]])
requested_features <- snakemake@params[["features"]]
messages_type <- snakemake@params[["messages_type"]]
features <- data.frame(local_segment = character(), stringsAsFactors = FALSE)
day_segments <- day_segments_labels %>% pull(label)
for (day_segment in day_segments)
features <- merge(features, base_messages_features(messages, messages_type, day_segment, requested_features), all = TRUE)
if(ncol(features) != length(requested_features) + 1)
stop(paste0("The number of features in the output dataframe (=", ncol(features),") does not match the expected value (=", length(requested_features)," + 1). Verify your Messages (SMS) feature extraction functions"))
features <- features %>% separate(col = local_segment,
into = c("local_segment_label", "local_start_date", "local_start_time", "local_end_date", "local_end_time"),
sep = "#",
remove = FALSE)
write.csv(features, snakemake@output[[1]], row.names = FALSE)