Update heatmaps of overall data yield

2021-06-04 22:58:27 -04:00 · 2021-06-04 22:58:27 -04:00 · 4d37696158
parent 654f6f3c3d
commit 4d37696158
5 changed files with 905 additions and 69 deletions
--- a/2
+++ b/2
@ -381,6 +381,8 @@ if config["HEATMAP_SENSOR_ROW_COUNT_PER_TIME_SEGMENT"]["PLOT"]:
    files_to_compute.append("reports/data_exploration/heatmap_sensor_row_count_per_time_segment.html")

 if config["HEATMAP_PHONE_DATA_YIELD_PER_PARTICIPANT_PER_TIME_SEGMENT"]["PLOT"]:
+    if not config["PHONE_DATA_YIELD"]["PROVIDERS"]["RAPIDS"]["COMPUTE"]:
+        raise ValueError("Error: [PHONE_DATA_YIELD][PROVIDERS][RAPIDS][COMPUTE] must be True in config.yaml to get heatmaps of overall data yield.")
    files_to_compute.append("reports/data_exploration/heatmap_phone_data_yield_per_participant_per_time_segment.html")

 if config["HEATMAP_FEATURE_CORRELATION_MATRIX"]["PLOT"]:
--- a/rules/reports.smk
+++ b/rules/reports.smk
@ -49,11 +49,13 @@ rule merge_heatmap_sensor_row_count_per_time_segment:

 rule heatmap_phone_data_yield_per_participant_per_time_segment:
    input:
-        phone_data_yield = expand("data/processed/features/{pid}/phone_data_yield.csv", pid=config["PIDS"]),
-        participant_file = expand("data/external/participant_files/{pid}.yaml", pid=config["PIDS"]),
-        time_segments_labels = expand("data/interim/time_segments/{pid}_time_segments_labels.csv", pid=config["PIDS"])
+        participant_files = expand("data/external/participant_files/{pid}.yaml", pid=config["PIDS"]),
+        time_segments_file = config["TIME_SEGMENTS"]["FILE"],
+        phone_data_yield = "data/processed/features/all_participants/all_sensor_features.csv",
    params:
-        time = config["HEATMAP_PHONE_DATA_YIELD_PER_PARTICIPANT_PER_TIME_SEGMENT"]["TIME"]
+        pids = config["PIDS"],
+        time = config["HEATMAP_PHONE_DATA_YIELD_PER_PARTICIPANT_PER_TIME_SEGMENT"]["TIME"],
+        time_segments_type = config["TIME_SEGMENTS"]["TYPE"]
    output:
        "reports/data_exploration/heatmap_phone_data_yield_per_participant_per_time_segment.html"
    script:
--- a/src/visualization/heatmap_phone_data_yield_per_participant_per_time_segment.py
+++ b/src/visualization/heatmap_phone_data_yield_per_participant_per_time_segment.py
@ -1,93 +1,87 @@
+from plotly_color_utils import sample_colorscale
 import pandas as pd
-import numpy as np
-import plotly.graph_objects as go
+import plotly.express as px
 import yaml



+def getPidAndLabel(participant_file_paths, pids):
+    pid2label, y_axis_labels = {}, []
+    for participant_file_path, pid in zip(participant_file_paths, pids):

+        with open(participant_file_path, "r", encoding="utf-8") as f:
+            participant_file = yaml.safe_load(f)
+        label = str(participant_file["PHONE"]["LABEL"])

-def getPhoneDataYieldHeatmap(data_for_plot, y_axis_labels, time_segment, type, time, html_file):
+        pid2label[pid] = label
+        y_axis_labels.append(pid + "." + label)
+    return pid2label, y_axis_labels

-    fig = go.Figure(data=go.Heatmap(z=data_for_plot.values.tolist(),
-                                       x=data_for_plot.columns.tolist(),
-                                       y=y_axis_labels,
-                                       hovertext=data_for_plot.values.tolist(),
-                                       hovertemplate="Time since first segment: %{x}<br>Participant: %{y}<br>Ratiovalidyielded" + type + ": %{z}<extra></extra>" if time == "RELATIVE_TIME" else "Time: %{x}<br>Participant: %{y}<br>Ratiovalidyielded" + type + ": %{z}<extra></extra>",
-                                       zmin=0, zmax=1,
-                                       colorscale="Viridis"))
+def getPhoneDataYieldHeatmap(phone_data_yield, time, time_segment, html_file):

    if time == "RELATIVE_TIME":
-        fig.update_layout(title="Heatmap of valid yielded " + type + " ratio for " + time_segment + " segments.<br>y-axis shows participant information (format: pid.label).<br>x-axis shows the time since their first segment.<br>z-axis (color) shows valid yielded " + type + " ratio during a segment instance.")
-    else:
-        fig.update_layout(title="Heatmap of valid yielded " + type + " ratio for " + time_segment + " segments.<br>y-axis shows participant information (format: pid.label).<br>x-axis shows the time.<br>z-axis (color) shows valid yielded " + type + " ratio during a segment instance.")
+        # Number of minutes after the first start date time of local segments
+        phone_data_yield["local_segment_end_datetime"] = (phone_data_yield["local_segment_end_datetime"] - phone_data_yield["local_segment_start_datetime"].min()) + pd.Timestamp(2000,1,1)
+        phone_data_yield["local_segment_start_datetime"] = (phone_data_yield["local_segment_start_datetime"] - phone_data_yield["local_segment_start_datetime"].min()) + pd.Timestamp(2000,1,1)

-    fig["layout"]["xaxis"].update(side="bottom")
-    fig["layout"].update(xaxis_title="Time Since First Segment" if time == "RELATIVE_TIME" else "Time")
-    fig["layout"].update(margin=dict(t=160))
-    
-    html_file.write(fig.to_html(full_html=False, include_plotlyjs="cdn"))
+    for type in ["minutes", "hours"]:
+
+        column_name = "phone_data_yield_rapids_ratiovalidyielded" + type
+
+        fig = px.timeline(phone_data_yield,
+                          x_start="local_segment_start_datetime",
+                          x_end="local_segment_end_datetime",
+                          y="y_axis_label",
+                          color=column_name,
+                          color_continuous_scale="Viridis",
+                          opacity=0.7,
+                          hover_data={'local_segment_start_datetime':False, 'local_segment_end_datetime':False, 'local_segment':True})
+
+        fig.update_layout(title="Heatmap of valid yielded " + type + " ratio for " + time_segment + " segments and " + time.lower().replace("_", " ") + ".<br>y-axis shows participant information (format: pid.label).<br>x-axis shows the time" + (" since their first segment" if time == "RELATIVE_TIME" else "") + ".<br>z-axis (color) shows valid yielded " + type + " ratio during a segment instance.",
+                    xaxis=dict(side="bottom", title="Time Since First Segment" if time == "RELATIVE_TIME" else "Time"),
+                    yaxis=dict(side="left", title="Participant information"),
+                    margin=dict(t=160))
+
+        if time == "RELATIVE_TIME":
+            fig.update_layout(xaxis_tickformat="%y years %j days<br>%X")
+
+        html_file.write(fig.to_html(full_html=False, include_plotlyjs="cdn"))
+
+    return html_file




+pid2label, y_axis_labels = getPidAndLabel(snakemake.input["participant_files"], snakemake.params["pids"])
+time_segments_type = snakemake.params["time_segments_type"] # FREQUENCY or PERIODIC or EVENT
+time = snakemake.params["time"] # ABSOLUTE_TIME or RELATIVE_TIME
+time_segments = pd.read_csv(snakemake.input["time_segments_file"])["label"].unique()

+phone_data_yield = pd.read_csv(snakemake.input["phone_data_yield"], parse_dates=["local_segment_start_datetime", "local_segment_end_datetime"]).sort_values(by=["pid", "local_segment_start_datetime"])
+if time_segments_type == "FREQUENCY":
+    phone_data_yield["local_segment_label"] = phone_data_yield["local_segment_label"].str.split("\d+", expand=True, n=1)[0]

-time = snakemake.params["time"]
-y_axis_labels, phone_data_yield_minutes, phone_data_yield_hours = [], {}, {}
-for phone_data_yield_path, participant_file_path, time_segments_path in zip(snakemake.input["phone_data_yield"], snakemake.input["participant_file"], snakemake.input["time_segments_labels"]):
-    
-    # set pid.label as y_axis_label
-    pid = phone_data_yield_path.split("/")[3]
-    time_segments = pd.read_csv(time_segments_path, header=0)["label"]
-
-    with open(participant_file_path, "r", encoding="utf-8") as f:
-        participant_file = yaml.safe_load(f)
-    label = participant_file["PHONE"]["LABEL"]
-
-    y_axis_label = pid + "." + label
-    y_axis_labels.append(y_axis_label)
-
-    
-    phone_data_yield = pd.read_csv(phone_data_yield_path, index_col=["local_segment_start_datetime"], parse_dates=["local_segment_start_datetime"])
-    # make sure the phone_data_yield file contains "phone_data_yield_rapids_ratiovalidyieldedminutes" and "phone_data_yield_rapids_ratiovalidyieldedhours" columns
+html_file = open(snakemake.output[0], "w", encoding="utf-8")
+if phone_data_yield.empty:
+    html_file.write("There is no sensor data for the sensors in [PHONE_DATA_YIELD][SENSORS].")
+else:
+    # Make sure the phone_data_yield file contains both "phone_data_yield_rapids_ratiovalidyieldedminutes" and "phone_data_yield_rapids_ratiovalidyieldedhours" columns
    if ("phone_data_yield_rapids_ratiovalidyieldedminutes" not in phone_data_yield.columns) or ("phone_data_yield_rapids_ratiovalidyieldedhours" not in phone_data_yield.columns):
        raise ValueError("Please make sure [PHONE_DATA_YIELD][RAPIDS][COMPUTE] is True AND [PHONE_DATA_YIELD][RAPIDS][FEATURES] contains [ratiovalidyieldedminutes, ratiovalidyieldedhours].")

-    if not phone_data_yield.empty:
+    phone_data_yield[["phone_data_yield_rapids_ratiovalidyieldedminutes", "phone_data_yield_rapids_ratiovalidyieldedhours"]] = phone_data_yield[["phone_data_yield_rapids_ratiovalidyieldedminutes", "phone_data_yield_rapids_ratiovalidyieldedhours"]].round(3).clip(upper=1)
+    phone_data_yield["y_axis_label"] = phone_data_yield["pid"].apply(lambda pid: pid + "." + str(pid2label[pid]))

+    if time_segments_type == "EVENT":
+        html_file = getPhoneDataYieldHeatmap(phone_data_yield, time, "event", html_file)
+    else: # FREQUENCY or PERIODIC
        for time_segment in time_segments:
+                        
            phone_data_yield_per_segment = phone_data_yield[phone_data_yield["local_segment_label"] == time_segment]

            if not phone_data_yield_per_segment.empty:

-                if time == "RELATIVE_TIME":
-                    # set number of minutes after the first start date time of local segments as x_axis_label
-                    phone_data_yield_per_segment.index = phone_data_yield_per_segment.index - phone_data_yield_per_segment.index.min()
-                elif time == "ABSOLUTE_TIME":
-                    pass
-                else:
-                    raise ValueError("[HEATMAP_PHONE_DATA_YIELD_PER_PARTICIPANT_PER_TIME_SEGMENT][TIME] can only be RELATIVE_TIME or ABSOLUTE_TIME")
+                html_file = getPhoneDataYieldHeatmap(phone_data_yield_per_segment, time, time_segment, html_file)

-                phone_data_yield_minutes_per_segment = phone_data_yield_per_segment[["phone_data_yield_rapids_ratiovalidyieldedminutes"]].rename(columns={"phone_data_yield_rapids_ratiovalidyieldedminutes": y_axis_label})
-                phone_data_yield_hours_per_segment = phone_data_yield_per_segment[["phone_data_yield_rapids_ratiovalidyieldedhours"]].rename(columns={"phone_data_yield_rapids_ratiovalidyieldedhours": y_axis_label})
-
-                if time_segment not in phone_data_yield_minutes.keys():
-                    phone_data_yield_minutes[time_segment] = phone_data_yield_minutes_per_segment
-                    phone_data_yield_hours[time_segment] = phone_data_yield_hours_per_segment
-                else:
-                    phone_data_yield_minutes[time_segment] = pd.concat([phone_data_yield_minutes[time_segment], phone_data_yield_minutes_per_segment], axis=1, sort=True)
-                    phone_data_yield_hours[time_segment] = pd.concat([phone_data_yield_hours[time_segment], phone_data_yield_hours_per_segment], axis=1, sort=True)
-
-
-html_file = open(snakemake.output[0], "a", encoding="utf-8")
-if len(phone_data_yield_minutes.keys()) == 0:
-    html_file.write("There is no sensor data for the sensors in [PHONE_DATA_YIELD][SENSORS].")
-for time_segment in phone_data_yield_minutes.keys():
-    minutes_data_for_plot = phone_data_yield_minutes[time_segment].transpose().reindex(pd.Index(y_axis_labels)).round(3)
-    hours_data_for_plot = phone_data_yield_hours[time_segment].transpose().reindex(pd.Index(y_axis_labels)).round(3)
-
-    getPhoneDataYieldHeatmap(minutes_data_for_plot, y_axis_labels, time_segment, "minutes", time, html_file)
-    getPhoneDataYieldHeatmap(hours_data_for_plot, y_axis_labels, time_segment, "hours", time, html_file)

 html_file.close()
--- a/src/visualization/plotly_color_utils.py
+++ b/src/visualization/plotly_color_utils.py
@ -0,0 +1,835 @@
+"""
+Source: https://github.com/plotly/plotly.py/pull/3136
+=====
+colors
+=====
+Functions that manipulate colors and arrays of colors.
+-----
+There are three basic types of color types: rgb, hex and tuple:
+rgb - An rgb color is a string of the form 'rgb(a,b,c)' where a, b and c are
+integers between 0 and 255 inclusive.
+hex - A hex color is a string of the form '#xxxxxx' where each x is a
+character that belongs to the set [0,1,2,3,4,5,6,7,8,9,a,b,c,d,e,f]. This is
+just the set of characters used in the hexadecimal numeric system.
+tuple - A tuple color is a 3-tuple of the form (a,b,c) where a, b and c are
+floats between 0 and 1 inclusive.
+-----
+Colormaps and Colorscales:
+A colormap or a colorscale is a correspondence between values - Pythonic
+objects such as strings and floats - to colors.
+There are typically two main types of colormaps that exist: numerical and
+categorical colormaps.
+Numerical:
+----------
+Numerical colormaps are used when the coloring column being used takes a
+spectrum of values or numbers.
+A classic example from the Plotly library:
+```
+rainbow_colorscale =  [
+    [0, 'rgb(150,0,90)'], [0.125, 'rgb(0,0,200)'],
+    [0.25, 'rgb(0,25,255)'], [0.375, 'rgb(0,152,255)'],
+    [0.5, 'rgb(44,255,150)'], [0.625, 'rgb(151,255,0)'],
+    [0.75, 'rgb(255,234,0)'], [0.875, 'rgb(255,111,0)'],
+    [1, 'rgb(255,0,0)']
+]
+```
+Notice that this colorscale is a list of lists with each inner list containing
+a number and a color. These left hand numbers in the nested lists go from 0 to
+1, and they are like pointers tell you when a number is mapped to a specific
+color.
+If you have a column of numbers `col_num` that you want to plot, and you know
+```
+min(col_num) = 0
+max(col_num) = 100
+```
+then if you pull out the number `12.5` in the list and want to figure out what
+color the corresponding chart element (bar, scatter plot, etc) is going to be,
+you'll figure out that proportionally 12.5 to 100 is the same as 0.125 to 1.
+So, the point will be mapped to 'rgb(0,0,200)'.
+All other colors between the pinned values in a colorscale are linearly
+interpolated.
+Categorical:
+------------
+Alternatively, a categorical colormap is used to assign a specific value in a
+color column to a specific color everytime it appears in the dataset.
+A column of strings in a panadas.dataframe that is chosen to serve as the
+color index would naturally use a categorical colormap. However, you can
+choose to use a categorical colormap with a column of numbers.
+Be careful! If you have a lot of unique numbers in your color column you will
+end up with a colormap that is massive and may slow down graphing performance.
+"""
+from __future__ import absolute_import
+
+import decimal
+from numbers import Number
+import six
+
+from _plotly_utils import exceptions
+
+
+# Built-in qualitative color sequences and sequential,
+# diverging and cyclical color scales.
+
+DEFAULT_PLOTLY_COLORS = [
+    "rgb(31, 119, 180)",
+    "rgb(255, 127, 14)",
+    "rgb(44, 160, 44)",
+    "rgb(214, 39, 40)",
+    "rgb(148, 103, 189)",
+    "rgb(140, 86, 75)",
+    "rgb(227, 119, 194)",
+    "rgb(127, 127, 127)",
+    "rgb(188, 189, 34)",
+    "rgb(23, 190, 207)",
+]
+
+PLOTLY_SCALES = {
+    "Greys": [[0, "rgb(0,0,0)"], [1, "rgb(255,255,255)"]],
+    "YlGnBu": [
+        [0, "rgb(8,29,88)"],
+        [0.125, "rgb(37,52,148)"],
+        [0.25, "rgb(34,94,168)"],
+        [0.375, "rgb(29,145,192)"],
+        [0.5, "rgb(65,182,196)"],
+        [0.625, "rgb(127,205,187)"],
+        [0.75, "rgb(199,233,180)"],
+        [0.875, "rgb(237,248,217)"],
+        [1, "rgb(255,255,217)"],
+    ],
+    "Greens": [
+        [0, "rgb(0,68,27)"],
+        [0.125, "rgb(0,109,44)"],
+        [0.25, "rgb(35,139,69)"],
+        [0.375, "rgb(65,171,93)"],
+        [0.5, "rgb(116,196,118)"],
+        [0.625, "rgb(161,217,155)"],
+        [0.75, "rgb(199,233,192)"],
+        [0.875, "rgb(229,245,224)"],
+        [1, "rgb(247,252,245)"],
+    ],
+    "YlOrRd": [
+        [0, "rgb(128,0,38)"],
+        [0.125, "rgb(189,0,38)"],
+        [0.25, "rgb(227,26,28)"],
+        [0.375, "rgb(252,78,42)"],
+        [0.5, "rgb(253,141,60)"],
+        [0.625, "rgb(254,178,76)"],
+        [0.75, "rgb(254,217,118)"],
+        [0.875, "rgb(255,237,160)"],
+        [1, "rgb(255,255,204)"],
+    ],
+    "Bluered": [[0, "rgb(0,0,255)"], [1, "rgb(255,0,0)"]],
+    # modified RdBu based on
+    # www.sandia.gov/~kmorel/documents/ColorMaps/ColorMapsExpanded.pdf
+    "RdBu": [
+        [0, "rgb(5,10,172)"],
+        [0.35, "rgb(106,137,247)"],
+        [0.5, "rgb(190,190,190)"],
+        [0.6, "rgb(220,170,132)"],
+        [0.7, "rgb(230,145,90)"],
+        [1, "rgb(178,10,28)"],
+    ],
+    # Scale for non-negative numeric values
+    "Reds": [
+        [0, "rgb(220,220,220)"],
+        [0.2, "rgb(245,195,157)"],
+        [0.4, "rgb(245,160,105)"],
+        [1, "rgb(178,10,28)"],
+    ],
+    # Scale for non-positive numeric values
+    "Blues": [
+        [0, "rgb(5,10,172)"],
+        [0.35, "rgb(40,60,190)"],
+        [0.5, "rgb(70,100,245)"],
+        [0.6, "rgb(90,120,245)"],
+        [0.7, "rgb(106,137,247)"],
+        [1, "rgb(220,220,220)"],
+    ],
+    "Picnic": [
+        [0, "rgb(0,0,255)"],
+        [0.1, "rgb(51,153,255)"],
+        [0.2, "rgb(102,204,255)"],
+        [0.3, "rgb(153,204,255)"],
+        [0.4, "rgb(204,204,255)"],
+        [0.5, "rgb(255,255,255)"],
+        [0.6, "rgb(255,204,255)"],
+        [0.7, "rgb(255,153,255)"],
+        [0.8, "rgb(255,102,204)"],
+        [0.9, "rgb(255,102,102)"],
+        [1, "rgb(255,0,0)"],
+    ],
+    "Rainbow": [
+        [0, "rgb(150,0,90)"],
+        [0.125, "rgb(0,0,200)"],
+        [0.25, "rgb(0,25,255)"],
+        [0.375, "rgb(0,152,255)"],
+        [0.5, "rgb(44,255,150)"],
+        [0.625, "rgb(151,255,0)"],
+        [0.75, "rgb(255,234,0)"],
+        [0.875, "rgb(255,111,0)"],
+        [1, "rgb(255,0,0)"],
+    ],
+    "Portland": [
+        [0, "rgb(12,51,131)"],
+        [0.25, "rgb(10,136,186)"],
+        [0.5, "rgb(242,211,56)"],
+        [0.75, "rgb(242,143,56)"],
+        [1, "rgb(217,30,30)"],
+    ],
+    "Jet": [
+        [0, "rgb(0,0,131)"],
+        [0.125, "rgb(0,60,170)"],
+        [0.375, "rgb(5,255,255)"],
+        [0.625, "rgb(255,255,0)"],
+        [0.875, "rgb(250,0,0)"],
+        [1, "rgb(128,0,0)"],
+    ],
+    "Hot": [
+        [0, "rgb(0,0,0)"],
+        [0.3, "rgb(230,0,0)"],
+        [0.6, "rgb(255,210,0)"],
+        [1, "rgb(255,255,255)"],
+    ],
+    "Blackbody": [
+        [0, "rgb(0,0,0)"],
+        [0.2, "rgb(230,0,0)"],
+        [0.4, "rgb(230,210,0)"],
+        [0.7, "rgb(255,255,255)"],
+        [1, "rgb(160,200,255)"],
+    ],
+    "Earth": [
+        [0, "rgb(0,0,130)"],
+        [0.1, "rgb(0,180,180)"],
+        [0.2, "rgb(40,210,40)"],
+        [0.4, "rgb(230,230,50)"],
+        [0.6, "rgb(120,70,20)"],
+        [1, "rgb(255,255,255)"],
+    ],
+    "Electric": [
+        [0, "rgb(0,0,0)"],
+        [0.15, "rgb(30,0,100)"],
+        [0.4, "rgb(120,0,100)"],
+        [0.6, "rgb(160,90,0)"],
+        [0.8, "rgb(230,200,0)"],
+        [1, "rgb(255,250,220)"],
+    ],
+    "Viridis": [
+        [0, "#440154"],
+        [0.06274509803921569, "#48186a"],
+        [0.12549019607843137, "#472d7b"],
+        [0.18823529411764706, "#424086"],
+        [0.25098039215686274, "#3b528b"],
+        [0.3137254901960784, "#33638d"],
+        [0.3764705882352941, "#2c728e"],
+        [0.4392156862745098, "#26828e"],
+        [0.5019607843137255, "#21918c"],
+        [0.5647058823529412, "#1fa088"],
+        [0.6274509803921569, "#28ae80"],
+        [0.6901960784313725, "#3fbc73"],
+        [0.7529411764705882, "#5ec962"],
+        [0.8156862745098039, "#84d44b"],
+        [0.8784313725490196, "#addc30"],
+        [0.9411764705882353, "#d8e219"],
+        [1, "#fde725"],
+    ],
+    "Cividis": [
+        [0.000000, "rgb(0,32,76)"],
+        [0.058824, "rgb(0,42,102)"],
+        [0.117647, "rgb(0,52,110)"],
+        [0.176471, "rgb(39,63,108)"],
+        [0.235294, "rgb(60,74,107)"],
+        [0.294118, "rgb(76,85,107)"],
+        [0.352941, "rgb(91,95,109)"],
+        [0.411765, "rgb(104,106,112)"],
+        [0.470588, "rgb(117,117,117)"],
+        [0.529412, "rgb(131,129,120)"],
+        [0.588235, "rgb(146,140,120)"],
+        [0.647059, "rgb(161,152,118)"],
+        [0.705882, "rgb(176,165,114)"],
+        [0.764706, "rgb(192,177,109)"],
+        [0.823529, "rgb(209,191,102)"],
+        [0.882353, "rgb(225,204,92)"],
+        [0.941176, "rgb(243,219,79)"],
+        [1.000000, "rgb(255,233,69)"],
+    ],
+}
+
+
+def color_parser(colors, function):
+    """
+    Takes color(s) and a function and applies the function on the color(s)
+    In particular, this function identifies whether the given color object
+    is an iterable or not and applies the given color-parsing function to
+    the color or iterable of colors. If given an iterable, it will only be
+    able to work with it if all items in the iterable are of the same type
+    - rgb string, hex string or tuple
+    """
+    if isinstance(colors, str):
+        return function(colors)
+
+    if isinstance(colors, tuple) and isinstance(colors[0], Number):
+        return function(colors)
+
+    if hasattr(colors, "__iter__"):
+        if isinstance(colors, tuple):
+            new_color_tuple = tuple(function(item) for item in colors)
+            return new_color_tuple
+
+        else:
+            new_color_list = [function(item) for item in colors]
+            return new_color_list
+
+
+def validate_colors(colors, colortype="tuple"):
+    """
+    Validates color(s) and returns a list of color(s) of a specified type
+    """
+    from numbers import Number
+
+    if colors is None:
+        colors = DEFAULT_PLOTLY_COLORS
+
+    if isinstance(colors, str):
+        if colors in PLOTLY_SCALES:
+            colors_list = colorscale_to_colors(PLOTLY_SCALES[colors])
+            # TODO: fix _gantt.py/_scatter.py so that they can accept the
+            # actual colorscale and not just a list of the first and last
+            # color in the plotly colorscale. In resolving this issue we
+            # will be removing the immediate line below
+            colors = [colors_list[0]] + [colors_list[-1]]
+        elif "rgb" in colors or "#" in colors:
+            colors = [colors]
+        else:
+            raise exceptions.PlotlyError(
+                "If your colors variable is a string, it must be a "
+                "Plotly scale, an rgb color or a hex color."
+            )
+
+    elif isinstance(colors, tuple):
+        if isinstance(colors[0], Number):
+            colors = [colors]
+        else:
+            colors = list(colors)
+
+    # convert color elements in list to tuple color
+    for j, each_color in enumerate(colors):
+        if "rgb" in each_color:
+            each_color = color_parser(each_color, unlabel_rgb)
+            for value in each_color:
+                if value > 255.0:
+                    raise exceptions.PlotlyError(
+                        "Whoops! The elements in your rgb colors "
+                        "tuples cannot exceed 255.0."
+                    )
+            each_color = color_parser(each_color, unconvert_from_RGB_255)
+            colors[j] = each_color
+
+        if "#" in each_color:
+            each_color = color_parser(each_color, hex_to_rgb)
+            each_color = color_parser(each_color, unconvert_from_RGB_255)
+
+            colors[j] = each_color
+
+        if isinstance(each_color, tuple):
+            for value in each_color:
+                if value > 1.0:
+                    raise exceptions.PlotlyError(
+                        "Whoops! The elements in your colors tuples "
+                        "cannot exceed 1.0."
+                    )
+            colors[j] = each_color
+
+    if colortype == "rgb" and not isinstance(colors, six.string_types):
+        for j, each_color in enumerate(colors):
+            rgb_color = color_parser(each_color, convert_to_RGB_255)
+            colors[j] = color_parser(rgb_color, label_rgb)
+
+    return colors
+
+
+def validate_colors_dict(colors, colortype="tuple"):
+    """
+    Validates dictionary of color(s)
+    """
+    # validate each color element in the dictionary
+    for key in colors:
+        if "rgb" in colors[key]:
+            colors[key] = color_parser(colors[key], unlabel_rgb)
+            for value in colors[key]:
+                if value > 255.0:
+                    raise exceptions.PlotlyError(
+                        "Whoops! The elements in your rgb colors "
+                        "tuples cannot exceed 255.0."
+                    )
+            colors[key] = color_parser(colors[key], unconvert_from_RGB_255)
+
+        if "#" in colors[key]:
+            colors[key] = color_parser(colors[key], hex_to_rgb)
+            colors[key] = color_parser(colors[key], unconvert_from_RGB_255)
+
+        if isinstance(colors[key], tuple):
+            for value in colors[key]:
+                if value > 1.0:
+                    raise exceptions.PlotlyError(
+                        "Whoops! The elements in your colors tuples "
+                        "cannot exceed 1.0."
+                    )
+
+    if colortype == "rgb":
+        for key in colors:
+            colors[key] = color_parser(colors[key], convert_to_RGB_255)
+            colors[key] = color_parser(colors[key], label_rgb)
+
+    return colors
+
+
+def convert_colors_to_same_type(
+    colors,
+    colortype="rgb",
+    scale=None,
+    return_default_colors=False,
+    num_of_defualt_colors=2,
+):
+    """
+    Converts color(s) to the specified color type
+    Takes a single color or an iterable of colors, as well as a list of scale
+    values, and outputs a 2-pair of the list of color(s) converted all to an
+    rgb or tuple color type, aswell as the scale as the second element. If
+    colors is a Plotly Scale name, then 'scale' will be forced to the scale
+    from the respective colorscale and the colors in that colorscale will also
+    be coverted to the selected colortype. If colors is None, then there is an
+    option to return portion of the DEFAULT_PLOTLY_COLORS
+    :param (str|tuple|list) colors: either a plotly scale name, an rgb or hex
+        color, a color tuple or a list/tuple of colors
+    :param (list) scale: see docs for validate_scale_values()
+    :rtype (tuple) (colors_list, scale) if scale is None in the function call,
+        then scale will remain None in the returned tuple
+    """
+    colors_list = []
+
+    if colors is None and return_default_colors is True:
+        colors_list = DEFAULT_PLOTLY_COLORS[0:num_of_defualt_colors]
+
+    if isinstance(colors, str):
+        if colors in PLOTLY_SCALES:
+            colors_list = colorscale_to_colors(PLOTLY_SCALES[colors])
+            if scale is None:
+                scale = colorscale_to_scale(PLOTLY_SCALES[colors])
+
+        elif "rgb" in colors or "#" in colors:
+            colors_list = [colors]
+
+    elif isinstance(colors, tuple):
+        if isinstance(colors[0], Number):
+            colors_list = [colors]
+        else:
+            colors_list = list(colors)
+
+    elif isinstance(colors, list):
+        colors_list = colors
+
+    # validate scale
+    if scale is not None:
+        validate_scale_values(scale)
+
+        if len(colors_list) != len(scale):
+            raise exceptions.PlotlyError(
+                "Make sure that the length of your scale matches the length "
+                "of your list of colors which is {}.".format(len(colors_list))
+            )
+
+    # convert all colors to rgb
+    for j, each_color in enumerate(colors_list):
+        if "#" in each_color:
+            each_color = color_parser(each_color, hex_to_rgb)
+            each_color = color_parser(each_color, label_rgb)
+            colors_list[j] = each_color
+
+        elif isinstance(each_color, tuple):
+            each_color = color_parser(each_color, convert_to_RGB_255)
+            each_color = color_parser(each_color, label_rgb)
+            colors_list[j] = each_color
+
+    if colortype == "rgb":
+        return (colors_list, scale)
+    elif colortype == "tuple":
+        for j, each_color in enumerate(colors_list):
+            each_color = color_parser(each_color, unlabel_rgb)
+            each_color = color_parser(each_color, unconvert_from_RGB_255)
+            colors_list[j] = each_color
+        return (colors_list, scale)
+    else:
+        raise exceptions.PlotlyError(
+            "You must select either rgb or tuple for your colortype variable."
+        )
+
+
+def convert_dict_colors_to_same_type(colors_dict, colortype="rgb"):
+    """
+    Converts a colors in a dictionary of colors to the specified color type
+    :param (dict) colors_dict: a dictionary whose values are single colors
+    """
+    for key in colors_dict:
+        if "#" in colors_dict[key]:
+            colors_dict[key] = color_parser(colors_dict[key], hex_to_rgb)
+            colors_dict[key] = color_parser(colors_dict[key], label_rgb)
+
+        elif isinstance(colors_dict[key], tuple):
+            colors_dict[key] = color_parser(colors_dict[key], convert_to_RGB_255)
+            colors_dict[key] = color_parser(colors_dict[key], label_rgb)
+
+    if colortype == "rgb":
+        return colors_dict
+    elif colortype == "tuple":
+        for key in colors_dict:
+            colors_dict[key] = color_parser(colors_dict[key], unlabel_rgb)
+            colors_dict[key] = color_parser(colors_dict[key], unconvert_from_RGB_255)
+        return colors_dict
+    else:
+        raise exceptions.PlotlyError(
+            "You must select either rgb or tuple for your colortype variable."
+        )
+
+
+def validate_scale_values(scale):
+    """
+    Validates scale values from a colorscale
+    :param (list) scale: a strictly increasing list of floats that begins
+        with 0 and ends with 1. Its usage derives from a colorscale which is
+        a list of two-lists (a list with two elements) of the form
+        [value, color] which are used to determine how interpolation weighting
+        works between the colors in the colorscale. Therefore scale is just
+        the extraction of these values from the two-lists in order
+    """
+    if len(scale) < 2:
+        raise exceptions.PlotlyError(
+            "You must input a list of scale values that has at least two values."
+        )
+
+    if (scale[0] != 0) or (scale[-1] != 1):
+        raise exceptions.PlotlyError(
+            "The first and last number in your scale must be 0.0 and 1.0 "
+            "respectively."
+        )
+
+    if not all(x < y for x, y in zip(scale, scale[1:])):
+        raise exceptions.PlotlyError(
+            "'scale' must be a list that contains a strictly increasing "
+            "sequence of numbers."
+        )
+
+
+def validate_colorscale(colorscale):
+    """Validate the structure, scale values and colors of colorscale."""
+    if not isinstance(colorscale, list):
+        # TODO Write tests for these exceptions
+        raise exceptions.PlotlyError("A valid colorscale must be a list.")
+    if not all(isinstance(innerlist, list) for innerlist in colorscale):
+        raise exceptions.PlotlyError("A valid colorscale must be a list of lists.")
+    colorscale_colors = colorscale_to_colors(colorscale)
+    scale_values = colorscale_to_scale(colorscale)
+
+    validate_scale_values(scale_values)
+    validate_colors(colorscale_colors)
+
+
+def make_colorscale(colors, scale=None):
+    """
+    Makes a colorscale from a list of colors and a scale
+    Takes a list of colors and scales and constructs a colorscale based
+    on the colors in sequential order. If 'scale' is left empty, a linear-
+    interpolated colorscale will be generated. If 'scale' is a specificed
+    list, it must be the same legnth as colors and must contain all floats
+    For documentation regarding to the form of the output, see
+    https://plot.ly/python/reference/#mesh3d-colorscale
+    :param (list) colors: a list of single colors
+    """
+    colorscale = []
+
+    # validate minimum colors length of 2
+    if len(colors) < 2:
+        raise exceptions.PlotlyError(
+            "You must input a list of colors that has at least two colors."
+        )
+
+    if scale is None:
+        scale_incr = 1.0 / (len(colors) - 1)
+        return [[i * scale_incr, color] for i, color in enumerate(colors)]
+
+    else:
+        if len(colors) != len(scale):
+            raise exceptions.PlotlyError(
+                "The length of colors and scale must be the same."
+            )
+
+        validate_scale_values(scale)
+
+        colorscale = [list(tup) for tup in zip(scale, colors)]
+        return colorscale
+
+
+def find_intermediate_color(lowcolor, highcolor, intermed, colortype="tuple"):
+    """
+    Returns the color at a given distance between two colors
+    This function takes two color tuples, where each element is between 0
+    and 1, along with a value 0 < intermed < 1 and returns a color that is
+    intermed-percent from lowcolor to highcolor. If colortype is set to 'rgb',
+    the function will automatically convert the rgb type to a tuple, find the
+    intermediate color and return it as an rgb color.
+    """
+    if colortype == "rgb":
+        # convert to tuple color, eg. (1, 0.45, 0.7)
+        lowcolor = unlabel_rgb(lowcolor)
+        highcolor = unlabel_rgb(highcolor)
+
+    diff_0 = float(highcolor[0] - lowcolor[0])
+    diff_1 = float(highcolor[1] - lowcolor[1])
+    diff_2 = float(highcolor[2] - lowcolor[2])
+
+    inter_med_tuple = (
+        lowcolor[0] + intermed * diff_0,
+        lowcolor[1] + intermed * diff_1,
+        lowcolor[2] + intermed * diff_2,
+    )
+
+    if colortype == "rgb":
+        # back to an rgb string, e.g. rgb(30, 20, 10)
+        inter_med_rgb = label_rgb(inter_med_tuple)
+        return inter_med_rgb
+
+    return inter_med_tuple
+
+
+def unconvert_from_RGB_255(colors):
+    """
+    Return a tuple where each element gets divided by 255
+    Takes a (list of) color tuple(s) where each element is between 0 and
+    255. Returns the same tuples where each tuple element is normalized to
+    a value between 0 and 1
+    """
+    return (colors[0] / (255.0), colors[1] / (255.0), colors[2] / (255.0))
+
+
+def convert_to_RGB_255(colors):
+    """
+    Multiplies each element of a triplet by 255
+    Each coordinate of the color tuple is rounded to the nearest float and
+    then is turned into an integer. If a number is of the form x.5, then
+    if x is odd, the number rounds up to (x+1). Otherwise, it rounds down
+    to just x. This is the way rounding works in Python 3 and in current
+    statistical analysis to avoid rounding bias
+    :param (list) rgb_components: grabs the three R, G and B values to be
+        returned as computed in the function
+    """
+    rgb_components = []
+
+    for component in colors:
+        rounded_num = decimal.Decimal(str(component * 255.0)).quantize(
+            decimal.Decimal("1"), rounding=decimal.ROUND_HALF_EVEN
+        )
+        # convert rounded number to an integer from 'Decimal' form
+        rounded_num = int(rounded_num)
+        rgb_components.append(rounded_num)
+
+    return (rgb_components[0], rgb_components[1], rgb_components[2])
+
+
+def n_colors(lowcolor, highcolor, n_colors, colortype="tuple"):
+    """
+    Splits a low and high color into a list of n_colors colors in it
+    Accepts two color tuples and returns a list of n_colors colors
+    which form the intermediate colors between lowcolor and highcolor
+    from linearly interpolating through RGB space. If colortype is 'rgb'
+    the function will return a list of colors in the same form.
+    """
+    if colortype == "rgb":
+        # convert to tuple
+        lowcolor = unlabel_rgb(lowcolor)
+        highcolor = unlabel_rgb(highcolor)
+
+    diff_0 = float(highcolor[0] - lowcolor[0])
+    incr_0 = diff_0 / (n_colors - 1)
+    diff_1 = float(highcolor[1] - lowcolor[1])
+    incr_1 = diff_1 / (n_colors - 1)
+    diff_2 = float(highcolor[2] - lowcolor[2])
+    incr_2 = diff_2 / (n_colors - 1)
+    list_of_colors = []
+
+    for index in range(n_colors):
+        new_tuple = (
+            lowcolor[0] + (index * incr_0),
+            lowcolor[1] + (index * incr_1),
+            lowcolor[2] + (index * incr_2),
+        )
+        list_of_colors.append(new_tuple)
+
+    if colortype == "rgb":
+        # back to an rgb string
+        list_of_colors = color_parser(list_of_colors, label_rgb)
+
+    return list_of_colors
+
+
+def label_rgb(colors):
+    """
+    Takes tuple (a, b, c) and returns an rgb color 'rgb(a, b, c)'
+    """
+    return "rgb(%s, %s, %s)" % (colors[0], colors[1], colors[2])
+
+
+def unlabel_rgb(colors):
+    """
+    Takes rgb color(s) 'rgb(a, b, c)' and returns tuple(s) (a, b, c)
+    This function takes either an 'rgb(a, b, c)' color or a list of
+    such colors and returns the color tuples in tuple(s) (a, b, c)
+    """
+    str_vals = ""
+    for index in range(len(colors)):
+        try:
+            float(colors[index])
+            str_vals = str_vals + colors[index]
+        except ValueError:
+            if colors[index] == "," or colors[index] == ".":
+                str_vals = str_vals + colors[index]
+
+    str_vals = str_vals + ","
+    numbers = []
+    str_num = ""
+    for char in str_vals:
+        if char != ",":
+            str_num = str_num + char
+        else:
+            numbers.append(float(str_num))
+            str_num = ""
+    return (numbers[0], numbers[1], numbers[2])
+
+
+def hex_to_rgb(value):
+    """
+    Calculates rgb values from a hex color code.
+    :param (string) value: Hex color string
+    :rtype (tuple) (r_value, g_value, b_value): tuple of rgb values
+    """
+    value = value.lstrip("#")
+    hex_total_length = len(value)
+    rgb_section_length = hex_total_length // 3
+    return tuple(
+        int(value[i : i + rgb_section_length], 16)
+        for i in range(0, hex_total_length, rgb_section_length)
+    )
+
+
+def colorscale_to_colors(colorscale):
+    """
+    Extracts the colors from colorscale as a list
+    """
+    color_list = []
+    for item in colorscale:
+        color_list.append(item[1])
+    return color_list
+
+
+def colorscale_to_scale(colorscale):
+    """
+    Extracts the interpolation scale values from colorscale as a list
+    """
+    scale_list = []
+    for item in colorscale:
+        scale_list.append(item[0])
+    return scale_list
+
+
+def convert_colorscale_to_rgb(colorscale):
+    """
+    Converts the colors in a colorscale to rgb colors
+    A colorscale is an array of arrays, each with a numeric value as the
+    first item and a color as the second. This function specifically is
+    converting a colorscale with tuple colors (each coordinate between 0
+    and 1) into a colorscale with the colors transformed into rgb colors
+    """
+    for color in colorscale:
+        color[1] = convert_to_RGB_255(color[1])
+
+    for color in colorscale:
+        color[1] = label_rgb(color[1])
+    return colorscale
+
+
+def named_colorscales():
+    """
+    Returns lowercased names of built-in continuous colorscales.
+    """
+    from _plotly_utils.basevalidators import ColorscaleValidator
+
+    return [c for c in ColorscaleValidator("", "").named_colorscales]
+
+
+def get_colorscale(name):
+    """
+    Returns the colorscale for a given name. See `named_colorscales` for the
+    built-in colorscales.
+    """
+    from _plotly_utils.basevalidators import ColorscaleValidator
+
+    if not isinstance(name, str):
+        raise exceptions.PlotlyError("Name argument have to be a string.")
+
+    name = name.lower()
+    if name[-2:] == "_r":
+        should_reverse = True
+        name = name[:-2]
+    else:
+        should_reverse = False
+
+    if name in ColorscaleValidator("", "").named_colorscales:
+        colorscale = ColorscaleValidator("", "").named_colorscales[name]
+    else:
+        raise exceptions.PlotlyError(f"Colorscale {name} is not a built-in scale.")
+
+    if should_reverse:
+        colorscale = colorscale[::-1]
+    return make_colorscale(colorscale)
+
+
+def sample_colorscale(colorscale, samplepoints, low=0.0, high=1.0, colortype="rgb"):
+    """
+    Samples a colorscale at specific points.
+    Interpolates between colors in a colorscale to find the specific colors
+    corresponding to the specified sample values. The colorscale can be specified
+    as a list of `[scale, color]` pairs, as a list of colors, or as a named
+    plotly colorscale. The samplepoints can be specefied as an iterable of specific
+    points in the range [0.0, 1.0], or as an integer number of points which will
+    be spaced equally between the low value (default 0.0) and the high value
+    (default 1.0). The output is a list of colors, formatted according to the
+    specified colortype.
+    """
+    from bisect import bisect_left
+
+    try:
+        validate_colorscale(colorscale)
+    except exceptions.PlotlyError:
+        if isinstance(colorscale, str):
+            colorscale = get_colorscale(colorscale)
+        else:
+            colorscale = make_colorscale(colorscale)
+
+    scale = colorscale_to_scale(colorscale)
+    validate_scale_values(scale)
+    colors = colorscale_to_colors(colorscale)
+    colors = validate_colors(colors, colortype="tuple")
+
+    if isinstance(samplepoints, int):
+        samplepoints = [
+            low + idx / (samplepoints - 1) * (high - low) for idx in range(samplepoints)
+        ]
+    elif isinstance(samplepoints, float):
+        samplepoints = [samplepoints]
+
+    sampled_colors = []
+    for point in samplepoints:
+        high = bisect_left(scale, point)
+        low = high - 1
+        interpolant = (point - scale[low]) / (scale[high] - scale[low])
+        sampled_color = find_intermediate_color(colors[low], colors[high], interpolant)
+        sampled_colors.append(sampled_color)
+    return validate_colors(sampled_colors, colortype=colortype)
--- a/tools/config.schema.yaml
+++ b/tools/config.schema.yaml
@ -1187,10 +1187,13 @@ properties:
  
  HEATMAP_PHONE_DATA_YIELD_PER_PARTICIPANT_PER_TIME_SEGMENT:
    type: object
-    required: [PLOT]
+    required: [PLOT, TIME]
    properties:
      PLOT:
        type: boolean
+      TIME:
+        type: string
+        enum: [ABSOLUTE_TIME, RELATIVE_TIME]
  
  HEATMAP_SENSORS_PER_MINUTE_PER_TIME_SEGMENT:
    type: object