Clean up categories.
parent
d092e17e33
commit
0b16aa6fe4
|
@ -2,8 +2,10 @@ library(conflicted)
|
|||
library(yaml)
|
||||
library(RPostgreSQL)
|
||||
library(tidyverse)
|
||||
conflicts_prefer(dplyr::filter,
|
||||
dplyr::lag)
|
||||
conflicts_prefer(
|
||||
dplyr::filter,
|
||||
dplyr::lag
|
||||
)
|
||||
library(magrittr)
|
||||
|
||||
# read the password from file
|
||||
|
@ -15,9 +17,11 @@ drv <- RPostgres::Postgres()
|
|||
|
||||
# creates a connection to the postgres database
|
||||
# note that "con" will be used later in each connection to the database
|
||||
con <- RPostgres::dbConnect(drv, dbname = "staw",
|
||||
con <- RPostgres::dbConnect(drv,
|
||||
dbname = "staw",
|
||||
host = "eol.ijs.si", port = 5432,
|
||||
user = "staw_db", password = pw)
|
||||
user = "staw_db", password = pw
|
||||
)
|
||||
|
||||
rm(pw, credentials) # removes the password
|
||||
|
||||
|
@ -30,4 +34,18 @@ df_app_categories <- tbl(con, "app_categories") %>%
|
|||
head(df_app_categories)
|
||||
table(df_app_categories$play_store_genre)
|
||||
|
||||
# Correct some mistakes
|
||||
# Normalise known-bad genre labels in place: both duplicated "Education"
# spellings collapse to "Education", "not_found" is relabelled as "System",
# and every other value is passed through unchanged via `.default`.
df_app_categories %<>% mutate(
  play_store_genre = case_when(
    play_store_genre %in% c("Education,Education", "EducationEducation") ~
      "Education",
    play_store_genre == "not_found" ~ "System",
    .default = play_store_genre
  )
)
|
||||
|
||||
dbDisconnect(con)
|
||||
|
|
Loading…
Reference in New Issue