2020-04-21 00:05:54 +02:00
|
|
|
def optional_ar_input(wildcards):
    """Return the activity-recognition inputs that match a participant's platform.

    The platform is taken from the second line of ``data/external/<pid>``
    (read as ISO-8859-1) and selects the ANDROID or IOS entry of
    ``config["ACTIVITY_RECOGNITION"]["DB_TABLE"]``.

    Args:
        wildcards: Snakemake wildcards object; only ``pid`` is read.

    Returns:
        A two-element list (raw ``_with_datetime_unified.csv`` and processed
        ``_deltas.csv`` path patterns, both keeping the literal ``{pid}``
        placeholder) for "android" or "ios", or an empty list for any other
        platform value.
    """
    participant_path = "data/external/" + wildcards.pid
    with open(participant_path, encoding="ISO-8859-1") as participant_file:
        platform = participant_file.readlines()[1].strip()

    # Map the platform string found in the file to its config key.
    db_table_key = {"android": "ANDROID", "ios": "IOS"}.get(platform)
    if db_table_key is None:
        return []

    table = config["ACTIVITY_RECOGNITION"]["DB_TABLE"][db_table_key]
    return [
        "data/raw/{pid}/" + table + "_with_datetime_unified.csv",
        "data/processed/{pid}/" + table + "_deltas.csv",
    ]
|
2020-04-21 00:05:54 +02:00
|
|
|
|
2020-06-19 07:27:28 +02:00
|
|
|
def optional_conversation_input(wildcards):
    """Return the raw conversation CSV pattern for a participant's platform.

    The platform is taken from the second line of ``data/external/<pid>``
    (read as ISO-8859-1) and selects which table configured under
    ``config["CONVERSATION"]["DB_TABLE"]`` is used.

    Args:
        wildcards: Snakemake wildcards object; only ``pid`` is read.

    Returns:
        A one-element list with the ``_with_datetime.csv`` path pattern of the
        selected table; the literal ``{pid}`` placeholder is kept in the string.

    Raises:
        IndexError: if the participant file has fewer than two lines.
    """
    with open("data/external/" + wildcards.pid, encoding="ISO-8859-1") as external_file:
        external_file_content = external_file.readlines()
    platform = external_file_content[1].strip()

    tables = config["CONVERSATION"]["DB_TABLE"]
    if platform == "ios":
        # Both branches used to return the ANDROID table, so iOS participants
        # were pointed at the wrong file. Fall back to ANDROID only when no IOS
        # table is configured, which reproduces the previous result.
        table = tables.get("IOS", tables["ANDROID"])
    else:
        # "android" and any unrecognised platform keep the original behaviour.
        table = tables["ANDROID"]
    return ["data/raw/{pid}/" + table + "_with_datetime.csv"]
|
2020-06-19 07:27:28 +02:00
|
|
|
|
2020-06-11 18:25:49 +02:00
|
|
|
def optional_location_input(wildcards):
    """Return the location input pattern selected by the BARNETT_LOCATION config.

    When ``config["BARNETT_LOCATION"]["LOCATIONS_TO_USE"]`` equals
    "RESAMPLE_FUSED" the ``_resampled.csv`` file of the configured table is
    used; otherwise its ``_with_datetime.csv`` file is used.

    Args:
        wildcards: Snakemake wildcards object; not read by this function.

    Returns:
        The result of ``expand`` over ``config["BARNETT_LOCATION"]["DB_TABLE"]``.
    """
    location_config = config["BARNETT_LOCATION"]
    pattern = (
        "data/raw/{{pid}}/{sensor}_resampled.csv"
        if location_config["LOCATIONS_TO_USE"] == "RESAMPLE_FUSED"
        else "data/raw/{{pid}}/{sensor}_with_datetime.csv"
    )
    return expand(pattern, sensor=config["BARNETT_LOCATION"]["DB_TABLE"])
|
2020-06-11 18:25:49 +02:00
|
|
|
|
2020-06-23 17:33:34 +02:00
|
|
|
# Runs messages_features.R on a participant's raw messages table.
# One output file is produced per {messages_type} and {day_segment}; the
# feature list is looked up in config["MESSAGES"]["FEATURES"] by messages_type.
rule messages_features:
    input:
        expand("data/raw/{{pid}}/{sensor}_with_datetime.csv", sensor=config["MESSAGES"]["DB_TABLE"]),
    params:
        messages_type="{messages_type}",
        day_segment="{day_segment}",
        features=lambda wildcards: config["MESSAGES"]["FEATURES"][wildcards.messages_type],
    output:
        "data/processed/{pid}/messages_{messages_type}_{day_segment}.csv"
    script:
        "../src/features/messages_features.R"
|
2019-10-25 16:21:09 +02:00
|
|
|
|
2020-04-08 17:51:18 +02:00
|
|
|
# Runs call_features.R on a participant's unified raw calls table.
# One output file is produced per {call_type} and {day_segment}; the feature
# list is looked up in config["CALLS"]["FEATURES"] by call_type.
rule call_features:
    input:
        expand("data/raw/{{pid}}/{sensor}_with_datetime_unified.csv", sensor=config["CALLS"]["DB_TABLE"]),
    params:
        call_type="{call_type}",
        day_segment="{day_segment}",
        features=lambda wildcards: config["CALLS"]["FEATURES"][wildcards.call_type],
    output:
        "data/processed/{pid}/calls_{call_type}_{day_segment}.csv"
    script:
        "../src/features/call_features.R"
|
2019-11-05 16:47:55 +01:00
|
|
|
|
|
|
|
# Runs battery_deltas.R on a participant's unified raw battery table and
# writes data/processed/{pid}/battery_deltas.csv.
rule battery_deltas:
    input:
        expand("data/raw/{{pid}}/{sensor}_with_datetime_unified.csv", sensor=config["BATTERY"]["DB_TABLE"]),
    output:
        "data/processed/{pid}/battery_deltas.csv"
    script:
        "../src/features/battery_deltas.R"
|
|
|
|
|
2019-11-27 21:27:48 +01:00
|
|
|
# Runs screen_deltas.R on a participant's raw screen table together with the
# participant file in data/external, and writes screen_deltas.csv.
rule screen_deltas:
    input:
        screen=expand("data/raw/{{pid}}/{sensor}_with_datetime.csv", sensor=config["SCREEN"]["DB_TABLE"]),
        participant_info="data/external/{pid}",
    output:
        "data/processed/{pid}/screen_deltas.csv"
    script:
        "../src/features/screen_deltas.R"
|
|
|
|
|
2019-11-27 21:53:37 +01:00
|
|
|
# Runs activity_recognition_deltas.R on the ANDROID activity-recognition table
# configured under config["ACTIVITY_RECOGNITION"]["DB_TABLE"].
rule google_activity_recognition_deltas:
    input:
        expand("data/raw/{{pid}}/{sensor}_with_datetime_unified.csv", sensor=config["ACTIVITY_RECOGNITION"]["DB_TABLE"]["ANDROID"]),
    output:
        expand("data/processed/{{pid}}/{sensor}_deltas.csv", sensor=config["ACTIVITY_RECOGNITION"]["DB_TABLE"]["ANDROID"]),
    script:
        "../src/features/activity_recognition_deltas.R"
|
|
|
|
|
|
|
|
# Runs activity_recognition_deltas.R on the IOS activity-recognition table
# configured under config["ACTIVITY_RECOGNITION"]["DB_TABLE"].
rule ios_activity_recognition_deltas:
    input:
        expand("data/raw/{{pid}}/{sensor}_with_datetime_unified.csv", sensor=config["ACTIVITY_RECOGNITION"]["DB_TABLE"]["IOS"]),
    output:
        expand("data/processed/{{pid}}/{sensor}_deltas.csv", sensor=config["ACTIVITY_RECOGNITION"]["DB_TABLE"]["IOS"]),
    script:
        "../src/features/activity_recognition_deltas.R"
|
2019-11-27 21:53:37 +01:00
|
|
|
|
2020-04-09 19:20:39 +02:00
|
|
|
# Runs location_barnett_features.R for one participant and day segment.
# The input file is chosen by the optional_location_input function; all other
# settings are passed straight through from config["BARNETT_LOCATION"].
rule location_barnett_features:
    input:
        locations=optional_location_input,
    params:
        features=config["BARNETT_LOCATION"]["FEATURES"],
        locations_to_use=config["BARNETT_LOCATION"]["LOCATIONS_TO_USE"],
        accuracy_limit=config["BARNETT_LOCATION"]["ACCURACY_LIMIT"],
        timezone=config["BARNETT_LOCATION"]["TIMEZONE"],
        minutes_data_used=config["BARNETT_LOCATION"]["MINUTES_DATA_USED"],
        day_segment="{day_segment}",
    output:
        "data/processed/{pid}/location_barnett_{day_segment}.csv"
    script:
        "../src/features/location_barnett_features.R"
|
2019-11-06 18:19:30 +01:00
|
|
|
|
2020-04-03 19:07:09 +02:00
|
|
|
# Runs bluetooth_features.R on a participant's raw bluetooth table, producing
# one output file per {day_segment}.
rule bluetooth_features:
    input:
        expand("data/raw/{{pid}}/{sensor}_with_datetime.csv", sensor=config["BLUETOOTH"]["DB_TABLE"]),
    params:
        day_segment="{day_segment}",
        features=config["BLUETOOTH"]["FEATURES"],
    output:
        "data/processed/{pid}/bluetooth_{day_segment}.csv"
    script:
        "../src/features/bluetooth_features.R"
|
2020-04-21 00:05:54 +02:00
|
|
|
|
2020-04-08 20:36:36 +02:00
|
|
|
# Runs activity_recognition.py for one participant and day segment.
# Inputs come from the optional_ar_input function. Note the day segment is
# passed to the script under the param name "segment", not "day_segment".
rule activity_features:
    input:
        optional_ar_input,
    params:
        segment="{day_segment}",
        features=config["ACTIVITY_RECOGNITION"]["FEATURES"],
    output:
        "data/processed/{pid}/activity_recognition_{day_segment}.csv"
    script:
        "../src/features/activity_recognition.py"
|
2019-11-08 18:18:21 +01:00
|
|
|
|
2020-04-09 22:06:25 +02:00
|
|
|
# Runs battery_features.py on a participant's battery_deltas.csv, producing
# one output file per {day_segment}.
rule battery_features:
    input:
        "data/processed/{pid}/battery_deltas.csv",
    params:
        day_segment="{day_segment}",
        features=config["BATTERY"]["FEATURES"],
    output:
        "data/processed/{pid}/battery_{day_segment}.csv"
    script:
        "../src/features/battery_features.py"
|
2019-11-27 20:25:17 +01:00
|
|
|
|
2020-04-08 17:05:16 +02:00
|
|
|
# Runs screen_features.py on a participant's screen_deltas.csv and
# phone_sensed_bins.csv, producing one output file per {day_segment}.
# bin_size is read from config["PHONE_VALID_SENSED_DAYS"], not from SCREEN.
rule screen_features:
    input:
        screen_deltas="data/processed/{pid}/screen_deltas.csv",
        phone_sensed_bins="data/interim/{pid}/phone_sensed_bins.csv",
    params:
        day_segment="{day_segment}",
        reference_hour_first_use=config["SCREEN"]["REFERENCE_HOUR_FIRST_USE"],
        features_deltas=config["SCREEN"]["FEATURES_DELTAS"],
        episode_types=config["SCREEN"]["EPISODE_TYPES"],
        bin_size=config["PHONE_VALID_SENSED_DAYS"]["BIN_SIZE"],
    output:
        "data/processed/{pid}/screen_{day_segment}.csv"
    script:
        "../src/features/screen_features.py"
|
2020-01-14 15:51:39 +01:00
|
|
|
|
2020-04-08 20:02:53 +02:00
|
|
|
# Runs light_features.py on a participant's raw light table, producing one
# output file per {day_segment}.
rule light_features:
    input:
        expand("data/raw/{{pid}}/{sensor}_with_datetime.csv", sensor=config["LIGHT"]["DB_TABLE"]),
    params:
        day_segment="{day_segment}",
        features=config["LIGHT"]["FEATURES"],
    output:
        "data/processed/{pid}/light_{day_segment}.csv"
    script:
        "../src/features/light_features.py"
|
2020-01-15 20:15:24 +01:00
|
|
|
|
2020-06-19 07:27:28 +02:00
|
|
|
# Runs conversation_features.py for one participant and day segment.
# The input file is chosen by the optional_conversation_input function.
# The camelCase param names are kept as-is because they are the names the
# script sees.
rule conversation_features:
    input:
        optional_conversation_input,
    params:
        day_segment="{day_segment}",
        features=config["CONVERSATION"]["FEATURES"],
        recordingMinutes=config["CONVERSATION"]["RECORDINGMINUTES"],
        pausedMinutes=config["CONVERSATION"]["PAUSEDMINUTES"],
    output:
        "data/processed/{pid}/conversation_{day_segment}.csv"
    script:
        "../src/features/conversation_features.py"
|
|
|
|
|
2020-04-02 23:36:28 +02:00
|
|
|
# Runs accelerometer_features.py on a participant's raw accelerometer table,
# producing one output file per {day_segment}. Each feature group under
# config["ACCELEROMETER"]["FEATURES"] is passed as its own param.
rule accelerometer_features:
    input:
        expand("data/raw/{{pid}}/{sensor}_with_datetime.csv", sensor=config["ACCELEROMETER"]["DB_TABLE"]),
    params:
        day_segment="{day_segment}",
        magnitude=config["ACCELEROMETER"]["FEATURES"]["MAGNITUDE"],
        exertional_activity_episode=config["ACCELEROMETER"]["FEATURES"]["EXERTIONAL_ACTIVITY_EPISODE"],
        nonexertional_activity_episode=config["ACCELEROMETER"]["FEATURES"]["NONEXERTIONAL_ACTIVITY_EPISODE"],
        valid_sensed_minutes=config["ACCELEROMETER"]["FEATURES"]["VALID_SENSED_MINUTES"],
    output:
        "data/processed/{pid}/accelerometer_{day_segment}.csv"
    script:
        "../src/features/accelerometer_features.py"
|
2020-01-29 22:22:53 +01:00
|
|
|
|
2020-04-08 19:31:43 +02:00
|
|
|
# Runs applications_foreground_features.py on the genre-annotated
# applications table in data/interim, producing one output file per
# {day_segment}. Category/app selections and exclusions all come from
# config["APPLICATIONS_FOREGROUND"].
rule applications_foreground_features:
    input:
        expand("data/interim/{{pid}}/{sensor}_with_datetime_with_genre.csv", sensor=config["APPLICATIONS_FOREGROUND"]["DB_TABLE"]),
    params:
        day_segment="{day_segment}",
        single_categories=config["APPLICATIONS_FOREGROUND"]["SINGLE_CATEGORIES"],
        multiple_categories=config["APPLICATIONS_FOREGROUND"]["MULTIPLE_CATEGORIES"],
        single_apps=config["APPLICATIONS_FOREGROUND"]["SINGLE_APPS"],
        excluded_categories=config["APPLICATIONS_FOREGROUND"]["EXCLUDED_CATEGORIES"],
        excluded_apps=config["APPLICATIONS_FOREGROUND"]["EXCLUDED_APPS"],
        features=config["APPLICATIONS_FOREGROUND"]["FEATURES"],
    output:
        "data/processed/{pid}/applications_foreground_{day_segment}.csv"
    script:
        "../src/features/applications_foreground_features.py"
|
2020-02-07 17:52:55 +01:00
|
|
|
|
2020-05-15 23:51:00 +02:00
|
|
|
# Runs wifi_features.R on a participant's raw wifi table, producing one
# output file per {day_segment}.
rule wifi_features:
    input:
        expand("data/raw/{{pid}}/{sensor}_with_datetime.csv", sensor=config["WIFI"]["DB_TABLE"]),
    params:
        day_segment="{day_segment}",
        features=config["WIFI"]["FEATURES"],
    output:
        "data/processed/{pid}/wifi_{day_segment}.csv"
    script:
        "../src/features/wifi_features.R"
|
|
|
|
|
2020-04-08 21:31:43 +02:00
|
|
|
# Runs fitbit_heartrate_features.py on a participant's Fitbit heart-rate
# summary and intraday files, producing one output file per {day_segment}.
rule fitbit_heartrate_features:
    input:
        heartrate_summary_data="data/raw/{pid}/fitbit_heartrate_summary_with_datetime.csv",
        heartrate_intraday_data="data/raw/{pid}/fitbit_heartrate_intraday_with_datetime.csv",
    params:
        day_segment="{day_segment}",
        summary_features=config["HEARTRATE"]["SUMMARY_FEATURES"],
        intraday_features=config["HEARTRATE"]["INTRADAY_FEATURES"],
    output:
        "data/processed/{pid}/fitbit_heartrate_{day_segment}.csv"
    script:
        "../src/features/fitbit_heartrate_features.py"
|
2020-02-07 17:35:15 +01:00
|
|
|
|
2020-04-03 23:03:45 +02:00
|
|
|
# Runs fitbit_step_features.py on a participant's Fitbit intraday step file,
# producing one output file per {day_segment}. Feature lists and bout
# settings are passed through from config["STEP"].
rule fitbit_step_features:
    input:
        step_data="data/raw/{pid}/fitbit_step_intraday_with_datetime.csv",
    params:
        day_segment="{day_segment}",
        features_all_steps=config["STEP"]["FEATURES"]["ALL_STEPS"],
        features_sedentary_bout=config["STEP"]["FEATURES"]["SEDENTARY_BOUT"],
        features_active_bout=config["STEP"]["FEATURES"]["ACTIVE_BOUT"],
        threshold_active_bout=config["STEP"]["THRESHOLD_ACTIVE_BOUT"],
        include_zero_step_rows=config["STEP"]["INCLUDE_ZERO_STEP_ROWS"],
    output:
        "data/processed/{pid}/fitbit_step_{day_segment}.csv"
    script:
        "../src/features/fitbit_step_features.py"
|
2020-04-13 19:24:52 +02:00
|
|
|
|
2020-05-15 23:51:00 +02:00
|
|
|
# Runs fitbit_sleep_features.py on a participant's Fitbit sleep summary and
# intraday files, producing one output file per {day_segment}.
rule fitbit_sleep_features:
    input:
        sleep_summary_data="data/raw/{pid}/fitbit_sleep_summary_with_datetime.csv",
        sleep_intraday_data="data/raw/{pid}/fitbit_sleep_intraday_with_datetime.csv",
    params:
        day_segment="{day_segment}",
        summary_features=config["SLEEP"]["SUMMARY_FEATURES"],
        sleep_types=config["SLEEP"]["SLEEP_TYPES"],
    output:
        "data/processed/{pid}/fitbit_sleep_{day_segment}.csv"
    script:
        "../src/features/fitbit_sleep_features.py"
|