From 8acac501251105332d1d3d4863e88744b9528844 Mon Sep 17 00:00:00 2001 From: Primoz Date: Tue, 25 Oct 2022 15:26:43 +0000 Subject: [PATCH] Add safety net for when the features dataframe is empty. --- src/features/all_cleaning_overall/straw/main.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/src/features/all_cleaning_overall/straw/main.py b/src/features/all_cleaning_overall/straw/main.py index 9474a514..1963808a 100644 --- a/src/features/all_cleaning_overall/straw/main.py +++ b/src/features/all_cleaning_overall/straw/main.py @@ -14,7 +14,7 @@ def straw_cleaning(sensor_data_files, provider, target): features = pd.read_csv(sensor_data_files["sensor_data"][0]) - features = features[features['local_segment_label'] == 'working_day'] # Filtriranje ustreznih časovnih segmentov + # features = features[features['local_segment_label'] == 'working_day'] # Filtriranje ustreznih časovnih segmentov # print(features) # sys.exit() @@ -36,7 +36,6 @@ def straw_cleaning(sensor_data_files, provider, target): return pd.DataFrame(columns=excluded_columns) graph_bf_af(features, "2target_rows_after") - print("HERE1", target, features["pid"]) # (2) QUALITY CHECK (DATA YIELD COLUMN) drops the rows where E4 or phone data is low quality phone_data_yield_unit = provider["PHONE_DATA_YIELD_FEATURE"].split("_")[3].lower() @@ -66,6 +65,8 @@ def straw_cleaning(sensor_data_files, provider, target): # print(features["empatica_data_yield"].sort_values()) features = features[features["empatica_data_yield"] >= provider["EMPATICA_DATA_YIELD_RATIO_THRESHOLD"]].reset_index(drop=True) + if features.empty: + return pd.DataFrame(columns=excluded_columns) graph_bf_af(features, "3data_yield_drop_rows")