stress_at_work_analysis/Untitled.ipynb

316 lines
11 KiB
Plaintext
Raw Blame History

This file contains ambiguous Unicode characters!

This file contains ambiguous Unicode characters that may be confused with others in your current locale. If your use case is intentional and legitimate, you can safely ignore this warning. Use the Escape button to highlight these characters.

{
"cells": [
{
"cell_type": "code",
"execution_count": 2,
"metadata": {},
"outputs": [],
"source": [
"import os\n",
"import sys\n",
"import matplotlib.pyplot as plt\n",
"import seaborn as sns\n",
"\n",
"nb_dir = os.path.split(os.getcwd())[0]\n",
"if nb_dir not in sys.path:\n",
" sys.path.append(nb_dir)\n",
" \n",
"from features.communication import *\n",
"import participants.query_db\n",
"\n",
"participants_inactive_usernames = participants.query_db.get_usernames()\n",
"df_sms = get_sms_data(participants_inactive_usernames)\n",
"df_calls = get_call_data(participants_inactive_usernames)"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"df_calls"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>id</th>\n",
" <th>_id</th>\n",
" <th>timestamp</th>\n",
" <th>device_id</th>\n",
" <th>call_type</th>\n",
" <th>call_duration</th>\n",
" <th>trace</th>\n",
" <th>participant_id</th>\n",
" <th>username</th>\n",
" <th>freq</th>\n",
" <th>contact_id</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>118</td>\n",
" <td>1</td>\n",
" <td>1581936081010</td>\n",
" <td>78082f9f-98c2-468d-b4a2-7c835bd812bd</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b</td>\n",
" <td>13</td>\n",
" <td>uploader_20449</td>\n",
" <td>21</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>176</td>\n",
" <td>3</td>\n",
" <td>1582295247982</td>\n",
" <td>78082f9f-98c2-468d-b4a2-7c835bd812bd</td>\n",
" <td>1</td>\n",
" <td>196</td>\n",
" <td>87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b</td>\n",
" <td>13</td>\n",
" <td>uploader_20449</td>\n",
" <td>21</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>209</td>\n",
" <td>4</td>\n",
" <td>1582305634014</td>\n",
" <td>78082f9f-98c2-468d-b4a2-7c835bd812bd</td>\n",
" <td>2</td>\n",
" <td>237</td>\n",
" <td>87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b</td>\n",
" <td>13</td>\n",
" <td>uploader_20449</td>\n",
" <td>21</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>210</td>\n",
" <td>5</td>\n",
" <td>1582561530334</td>\n",
" <td>78082f9f-98c2-468d-b4a2-7c835bd812bd</td>\n",
" <td>2</td>\n",
" <td>126</td>\n",
" <td>87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b</td>\n",
" <td>13</td>\n",
" <td>uploader_20449</td>\n",
" <td>21</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>253</td>\n",
" <td>6</td>\n",
" <td>1582627576077</td>\n",
" <td>78082f9f-98c2-468d-b4a2-7c835bd812bd</td>\n",
" <td>2</td>\n",
" <td>255</td>\n",
" <td>87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b</td>\n",
" <td>13</td>\n",
" <td>uploader_20449</td>\n",
" <td>21</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4645</th>\n",
" <td>5874</td>\n",
" <td>131</td>\n",
" <td>1625602519843</td>\n",
" <td>4b62a655-cbf0-4ac0-a448-06726f45b56a</td>\n",
" <td>2</td>\n",
" <td>2270</td>\n",
" <td>f4ebca8dc7305fe424d6bf7fbcd2e5086f98b453</td>\n",
" <td>90</td>\n",
" <td>uploader_53573</td>\n",
" <td>6</td>\n",
" <td>9</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4646</th>\n",
" <td>5882</td>\n",
" <td>139</td>\n",
" <td>1625753023456</td>\n",
" <td>4b62a655-cbf0-4ac0-a448-06726f45b56a</td>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" <td>2e5d63f6fddca2b66be810b5946c42eda24f2dbe</td>\n",
" <td>90</td>\n",
" <td>uploader_53573</td>\n",
" <td>2</td>\n",
" <td>13</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4647</th>\n",
" <td>5883</td>\n",
" <td>140</td>\n",
" <td>1625754998767</td>\n",
" <td>4b62a655-cbf0-4ac0-a448-06726f45b56a</td>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" <td>2e5d63f6fddca2b66be810b5946c42eda24f2dbe</td>\n",
" <td>90</td>\n",
" <td>uploader_53573</td>\n",
" <td>2</td>\n",
" <td>13</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4648</th>\n",
" <td>5884</td>\n",
" <td>141</td>\n",
" <td>1625823008392</td>\n",
" <td>4b62a655-cbf0-4ac0-a448-06726f45b56a</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>7316d58b7bb7de097a2421c56010ac024a489451</td>\n",
" <td>90</td>\n",
" <td>uploader_53573</td>\n",
" <td>1</td>\n",
" <td>21</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4649</th>\n",
" <td>5903</td>\n",
" <td>158</td>\n",
" <td>1626110930233</td>\n",
" <td>4b62a655-cbf0-4ac0-a448-06726f45b56a</td>\n",
" <td>2</td>\n",
" <td>53</td>\n",
" <td>7db4e9acf7c73837ddecdae5da523a28c774ba94</td>\n",
" <td>90</td>\n",
" <td>uploader_53573</td>\n",
" <td>1</td>\n",
" <td>24</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>4650 rows × 11 columns</p>\n",
"</div>"
],
"text/plain": [
" id _id timestamp device_id \\\n",
"0 118 1 1581936081010 78082f9f-98c2-468d-b4a2-7c835bd812bd \n",
"1 176 3 1582295247982 78082f9f-98c2-468d-b4a2-7c835bd812bd \n",
"2 209 4 1582305634014 78082f9f-98c2-468d-b4a2-7c835bd812bd \n",
"3 210 5 1582561530334 78082f9f-98c2-468d-b4a2-7c835bd812bd \n",
"4 253 6 1582627576077 78082f9f-98c2-468d-b4a2-7c835bd812bd \n",
"... ... ... ... ... \n",
"4645 5874 131 1625602519843 4b62a655-cbf0-4ac0-a448-06726f45b56a \n",
"4646 5882 139 1625753023456 4b62a655-cbf0-4ac0-a448-06726f45b56a \n",
"4647 5883 140 1625754998767 4b62a655-cbf0-4ac0-a448-06726f45b56a \n",
"4648 5884 141 1625823008392 4b62a655-cbf0-4ac0-a448-06726f45b56a \n",
"4649 5903 158 1626110930233 4b62a655-cbf0-4ac0-a448-06726f45b56a \n",
"\n",
" call_type call_duration trace \\\n",
"0 2 0 87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b \n",
"1 1 196 87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b \n",
"2 2 237 87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b \n",
"3 2 126 87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b \n",
"4 2 255 87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b \n",
"... ... ... ... \n",
"4645 2 2270 f4ebca8dc7305fe424d6bf7fbcd2e5086f98b453 \n",
"4646 3 0 2e5d63f6fddca2b66be810b5946c42eda24f2dbe \n",
"4647 3 0 2e5d63f6fddca2b66be810b5946c42eda24f2dbe \n",
"4648 2 0 7316d58b7bb7de097a2421c56010ac024a489451 \n",
"4649 2 53 7db4e9acf7c73837ddecdae5da523a28c774ba94 \n",
"\n",
" participant_id username freq contact_id \n",
"0 13 uploader_20449 21 0 \n",
"1 13 uploader_20449 21 0 \n",
"2 13 uploader_20449 21 0 \n",
"3 13 uploader_20449 21 0 \n",
"4 13 uploader_20449 21 0 \n",
"... ... ... ... ... \n",
"4645 90 uploader_53573 6 9 \n",
"4646 90 uploader_53573 2 13 \n",
"4647 90 uploader_53573 2 13 \n",
"4648 90 uploader_53573 1 21 \n",
"4649 90 uploader_53573 1 24 \n",
"\n",
"[4650 rows x 11 columns]"
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"contact_features(enumerate_contacts(df_calls))"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "straw2analysis",
"language": "python",
"name": "straw2analysis"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.6"
}
},
"nbformat": 4,
"nbformat_minor": 2
}