import datetime import pandas as pd from pyprojroot import here import participants.query_db participants_inactive_usernames = participants.query_db.get_usernames( tester=False, # True participants are wanted. active=False, # They have all finished their participation. collection_start=datetime.date.fromisoformat( "2020-08-01" ), # This is the timeframe of the main study. last_upload=datetime.date.fromisoformat("2021-09-01"), ) participants_overview_si = pd.read_csv( "E:/STRAWbaseline/Participants_overview_Slovenia.csv", sep=";" ) participants_overview_be = pd.read_csv( "E:/STRAWbaseline/Participants_overview_Belgium.csv", sep=";" ) participants_true_si = participants_overview_si[ participants_overview_si["Wristband_SerialNo"] != "DECLINED" ] participants_true_be = participants_overview_be[ participants_overview_be["SmartphoneBrand+Generation"].str.slice(0, 3) != "Not" ] # Concatenate participants from both countries. participants_usernames_empatica = pd.concat( [participants_true_be, participants_true_si] ) # Filter only the participants from the main study (queried from the database). participants_usernames_empatica = participants_usernames_empatica[ participants_usernames_empatica["Username"].isin(participants_inactive_usernames) ] # Rename and select columns. participants_usernames_empatica = participants_usernames_empatica.rename( columns={"Username": "label", "Wristband_SerialNo": "empatica_id"} )[["label", "empatica_id"]] # Adapt for csv export. participants_usernames_empatica["empatica_id"] = participants_usernames_empatica[ "empatica_id" ].str.replace(",", ";") participants_usernames_empatica.to_csv( here("rapids/data/external/main_study_participants.csv"), header=True, index=False, line_terminator="\n", )