From 0e66a5a963b8453e9f3025c163e2795069f291c3 Mon Sep 17 00:00:00 2001 From: junos Date: Wed, 19 Apr 2023 09:29:40 +0200 Subject: [PATCH] Completely remove PACKAGE_NAMES_HASHED and instead provide a differently structured file. --- presentation/ApplicationCategories.R | 13 +++++++++++-- .../play_store_application_genre_catalogue.csv | 2 +- 2 files changed, 12 insertions(+), 3 deletions(-) diff --git a/presentation/ApplicationCategories.R b/presentation/ApplicationCategories.R index f9916fb..4a696b5 100644 --- a/presentation/ApplicationCategories.R +++ b/presentation/ApplicationCategories.R @@ -48,12 +48,21 @@ df_app_categories %<>% } }(play_store_genre) ) %>% - rename(genre = play_store_genre) + select(-package_name) %>% + rename( + genre = play_store_genre, + package_name = package_hash) table(df_app_categories$genre) +df_app_categories %>% + group_by(genre) %>% + count() %>% + arrange(desc(n)) %>% + write_csv("play_store_categories_count.csv") + write_csv( - x = select(df_app_categories, c(package_hash, genre)), + x = select(df_app_categories, c(package_name, genre)), file = "play_store_application_genre_catalogue.csv" ) diff --git a/presentation/play_store_application_genre_catalogue.csv b/presentation/play_store_application_genre_catalogue.csv index 42783cc..5e04779 100644 --- a/presentation/play_store_application_genre_catalogue.csv +++ b/presentation/play_store_application_genre_catalogue.csv @@ -1,4 +1,4 @@ -package_hash,genre +package_name,genre 98a5c1a9c7717f791cb4083199ff5c91a958df844a47dc89c7319b2bb824ac94,Personalization c9112978f6b1c96c767496a15a6dbb9c8dccabe847c31ecc9e5f706de24342a6,Communication 650ab12d7007ee573df2291f3a9207442e3897a9a5b2f5068ad685c0d04751ea,Tools