{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import sys\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "\n",
    "# Put the parent of the current working directory on sys.path so that the\n",
    "# project packages imported below (`features`, `participants`) can be found.\n",
    "# NOTE(review): presumably the parent directory is the repository root - confirm.\n",
    "nb_dir = os.path.split(os.getcwd())[0]\n",
    "if nb_dir not in sys.path:\n",
    "    sys.path.append(nb_dir)\n",
    "\n",
    "# Project-local imports; they must stay below the sys.path tweak above.\n",
    "# The helpers are imported by name (instead of `import *`) so that every\n",
    "# function called in this notebook can be traced back to its module.\n",
    "from features.communication import (\n",
    "    calls_sms_features,\n",
    "    contact_features,\n",
    "    enumerate_contacts,\n",
    "    get_call_data,\n",
    "    get_sms_data,\n",
    ")\n",
    "import participants.query_db\n",
    "\n",
    "# Load the SMS and call records for the usernames returned by\n",
    "# participants.query_db.get_usernames(); both frames are reused by the cells below.\n",
    "participants_inactive_usernames = participants.query_db.get_usernames()\n",
    "df_sms = get_sms_data(participants_inactive_usernames)\n",
    "df_calls = get_call_data(participants_inactive_usernames)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
id_idtimestampdevice_idcall_typecall_durationtraceparticipant_idusernamefreqcontact_idtotal_call_durationno_contacts
01181158193608101078082f9f-98c2-468d-b4a2-7c835bd812bd2087ae5eb2c5b7fe30bea2821e2ec052453d89ea6b13uploader_2044921028445
11763158229524798278082f9f-98c2-468d-b4a2-7c835bd812bd119687ae5eb2c5b7fe30bea2821e2ec052453d89ea6b13uploader_2044921028445
22094158230563401478082f9f-98c2-468d-b4a2-7c835bd812bd223787ae5eb2c5b7fe30bea2821e2ec052453d89ea6b13uploader_2044921028445
32105158256153033478082f9f-98c2-468d-b4a2-7c835bd812bd212687ae5eb2c5b7fe30bea2821e2ec052453d89ea6b13uploader_2044921028445
42536158262757607778082f9f-98c2-468d-b4a2-7c835bd812bd225587ae5eb2c5b7fe30bea2821e2ec052453d89ea6b13uploader_2044921028445
..........................................
435255605916212756895899f54e35c-d7cb-4f4c-8dc1-17dc86f2635e205eb72fe829c2af4a654007220119bdcf47499555107uploader_89606117022
433654432916207461426369f54e35c-d7cb-4f4c-8dc1-17dc86f2635e21896dd761532337dfe596eb2e34f4c91216b38e28e2107uploader_8960611818922
431652371016201401099089f54e35c-d7cb-4f4c-8dc1-17dc86f2635e2859c4eab1dfc0114aecd64a7f594977acc9ab7936c107uploader_896061198522
434755244416209716791229f54e35c-d7cb-4f4c-8dc1-17dc86f2635e1120a9fa73b6137d09288429de20172095978730e4b8107uploader_8960612012022
433153642616206303286359f54e35c-d7cb-4f4c-8dc1-17dc86f2635e2184cfe98eee4a27b377f4cde1ea5c39d24d0475b533107uploader_8960612118422
\n", "

4650 rows × 13 columns

\n", "
" ], "text/plain": [ " id _id timestamp device_id \\\n", "0 118 1 1581936081010 78082f9f-98c2-468d-b4a2-7c835bd812bd \n", "1 176 3 1582295247982 78082f9f-98c2-468d-b4a2-7c835bd812bd \n", "2 209 4 1582305634014 78082f9f-98c2-468d-b4a2-7c835bd812bd \n", "3 210 5 1582561530334 78082f9f-98c2-468d-b4a2-7c835bd812bd \n", "4 253 6 1582627576077 78082f9f-98c2-468d-b4a2-7c835bd812bd \n", "... ... ... ... ... \n", "4352 5560 59 1621275689589 9f54e35c-d7cb-4f4c-8dc1-17dc86f2635e \n", "4336 5443 29 1620746142636 9f54e35c-d7cb-4f4c-8dc1-17dc86f2635e \n", "4316 5237 10 1620140109908 9f54e35c-d7cb-4f4c-8dc1-17dc86f2635e \n", "4347 5524 44 1620971679122 9f54e35c-d7cb-4f4c-8dc1-17dc86f2635e \n", "4331 5364 26 1620630328635 9f54e35c-d7cb-4f4c-8dc1-17dc86f2635e \n", "\n", " call_type call_duration trace \\\n", "0 2 0 87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b \n", "1 1 196 87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b \n", "2 2 237 87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b \n", "3 2 126 87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b \n", "4 2 255 87ae5eb2c5b7fe30bea2821e2ec052453d89ea6b \n", "... ... ... ... \n", "4352 2 0 5eb72fe829c2af4a654007220119bdcf47499555 \n", "4336 2 189 6dd761532337dfe596eb2e34f4c91216b38e28e2 \n", "4316 2 85 9c4eab1dfc0114aecd64a7f594977acc9ab7936c \n", "4347 1 120 a9fa73b6137d09288429de20172095978730e4b8 \n", "4331 2 184 cfe98eee4a27b377f4cde1ea5c39d24d0475b533 \n", "\n", " participant_id username freq contact_id total_call_duration \\\n", "0 13 uploader_20449 21 0 2844 \n", "1 13 uploader_20449 21 0 2844 \n", "2 13 uploader_20449 21 0 2844 \n", "3 13 uploader_20449 21 0 2844 \n", "4 13 uploader_20449 21 0 2844 \n", "... ... ... ... ... ... \n", "4352 107 uploader_89606 1 17 0 \n", "4336 107 uploader_89606 1 18 189 \n", "4316 107 uploader_89606 1 19 85 \n", "4347 107 uploader_89606 1 20 120 \n", "4331 107 uploader_89606 1 21 184 \n", "\n", " no_contacts \n", "0 5 \n", "1 5 \n", "2 5 \n", "3 5 \n", "4 5 \n", "... ... 
\n", "4352 22 \n", "4336 22 \n", "4316 22 \n", "4347 22 \n", "4331 22 \n", "\n", "[4650 rows x 13 columns]" ] }, "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ "contact_features(enumerate_contacts(df_calls))" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
id_idtimestampdevice_idmessage_typetraceparticipant_idusernamefreqcontact_idno_contacts
1953797158296443459778082f9f-98c2-468d-b4a2-7c835bd812bd2417b9c87f5b573530bcffba8577777b3a964d67113uploader_20449506
1963808158296443497478082f9f-98c2-468d-b4a2-7c835bd812bd2417b9c87f5b573530bcffba8577777b3a964d67113uploader_20449506
19738210158296598860978082f9f-98c2-468d-b4a2-7c835bd812bd2417b9c87f5b573530bcffba8577777b3a964d67113uploader_20449506
19838311158296598887378082f9f-98c2-468d-b4a2-7c835bd812bd2417b9c87f5b573530bcffba8577777b3a964d67113uploader_20449506
19939612158296598887378082f9f-98c2-468d-b4a2-7c835bd812bd2417b9c87f5b573530bcffba8577777b3a964d67113uploader_20449506
....................................
51936137416197893606659f54e35c-d7cb-4f4c-8dc1-17dc86f2635e22340c1d2b9e5d550373423a599014468a4dc3678107uploader_8960631216
51946135216197872738299f54e35c-d7cb-4f4c-8dc1-17dc86f2635e12340c1d2b9e5d550373423a599014468a4dc3678107uploader_8960631216
5417669021016209804371989f54e35c-d7cb-4f4c-8dc1-17dc86f2635e1198d7e63a2b4d8a7ca9bb92f74e6974ca17edc56107uploader_8960611316
5447677025616214076680199f54e35c-d7cb-4f4c-8dc1-17dc86f2635e1d4a67b53e704247de47064850efd3647e8dcaffb107uploader_8960611416
5440674224816212533135449f54e35c-d7cb-4f4c-8dc1-17dc86f2635e1ffbc6a5f0f601cf2d9cdad9d3a588633e1a1967c107uploader_8960611516
\n", "

5864 rows × 11 columns

\n", "
" ], "text/plain": [ " id _id timestamp device_id \\\n", "195 379 7 1582964434597 78082f9f-98c2-468d-b4a2-7c835bd812bd \n", "196 380 8 1582964434974 78082f9f-98c2-468d-b4a2-7c835bd812bd \n", "197 382 10 1582965988609 78082f9f-98c2-468d-b4a2-7c835bd812bd \n", "198 383 11 1582965988873 78082f9f-98c2-468d-b4a2-7c835bd812bd \n", "199 396 12 1582965988873 78082f9f-98c2-468d-b4a2-7c835bd812bd \n", "... ... ... ... ... \n", "5193 6137 4 1619789360665 9f54e35c-d7cb-4f4c-8dc1-17dc86f2635e \n", "5194 6135 2 1619787273829 9f54e35c-d7cb-4f4c-8dc1-17dc86f2635e \n", "5417 6690 210 1620980437198 9f54e35c-d7cb-4f4c-8dc1-17dc86f2635e \n", "5447 6770 256 1621407668019 9f54e35c-d7cb-4f4c-8dc1-17dc86f2635e \n", "5440 6742 248 1621253313544 9f54e35c-d7cb-4f4c-8dc1-17dc86f2635e \n", "\n", " message_type trace participant_id \\\n", "195 2 417b9c87f5b573530bcffba8577777b3a964d671 13 \n", "196 2 417b9c87f5b573530bcffba8577777b3a964d671 13 \n", "197 2 417b9c87f5b573530bcffba8577777b3a964d671 13 \n", "198 2 417b9c87f5b573530bcffba8577777b3a964d671 13 \n", "199 2 417b9c87f5b573530bcffba8577777b3a964d671 13 \n", "... ... ... ... \n", "5193 2 2340c1d2b9e5d550373423a599014468a4dc3678 107 \n", "5194 1 2340c1d2b9e5d550373423a599014468a4dc3678 107 \n", "5417 1 198d7e63a2b4d8a7ca9bb92f74e6974ca17edc56 107 \n", "5447 1 d4a67b53e704247de47064850efd3647e8dcaffb 107 \n", "5440 1 ffbc6a5f0f601cf2d9cdad9d3a588633e1a1967c 107 \n", "\n", " username freq contact_id no_contacts \n", "195 uploader_20449 5 0 6 \n", "196 uploader_20449 5 0 6 \n", "197 uploader_20449 5 0 6 \n", "198 uploader_20449 5 0 6 \n", "199 uploader_20449 5 0 6 \n", "... ... ... ... ... 
\n", "5193 uploader_89606 3 12 16 \n", "5194 uploader_89606 3 12 16 \n", "5417 uploader_89606 1 13 16 \n", "5447 uploader_89606 1 14 16 \n", "5440 uploader_89606 1 15 16 \n", "\n", "[5864 rows x 11 columns]" ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "contact_features(enumerate_contacts(df_sms))" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "scrolled": true }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
participant_idno_calls_no_sms_rationo_incoming_calls_no_recieved_sms_rationo_outgoing_calls_no_sent_sms_rationo_calls_contacts_no_sms_contacts_ratio
0130.6500000.7000000.7500000.454545
1140.5903610.5555560.6111110.714286
2150.0331130.9605260.0266670.173913
3160.5652170.6666670.7500000.666667
4170.9166670.2592590.9836070.857143
..................
56910.1962030.8469390.2280700.666667
57920.4444440.5714290.4000000.600000
58930.4322030.6857140.5128210.428571
591060.7058820.4545450.7500000.769231
601070.2049690.8791210.1926610.578947
\n", "

61 rows × 5 columns

\n", "
" ], "text/plain": [ " participant_id no_calls_no_sms_ratio \\\n", "0 13 0.650000 \n", "1 14 0.590361 \n", "2 15 0.033113 \n", "3 16 0.565217 \n", "4 17 0.916667 \n", ".. ... ... \n", "56 91 0.196203 \n", "57 92 0.444444 \n", "58 93 0.432203 \n", "59 106 0.705882 \n", "60 107 0.204969 \n", "\n", " no_incoming_calls_no_recieved_sms_ratio \\\n", "0 0.700000 \n", "1 0.555556 \n", "2 0.960526 \n", "3 0.666667 \n", "4 0.259259 \n", ".. ... \n", "56 0.846939 \n", "57 0.571429 \n", "58 0.685714 \n", "59 0.454545 \n", "60 0.879121 \n", "\n", " no_outgoing_calls_no_sent_sms_ratio \\\n", "0 0.750000 \n", "1 0.611111 \n", "2 0.026667 \n", "3 0.750000 \n", "4 0.983607 \n", ".. ... \n", "56 0.228070 \n", "57 0.400000 \n", "58 0.512821 \n", "59 0.750000 \n", "60 0.192661 \n", "\n", " no_calls_contacts_no_sms_contacts_ratio \n", "0 0.454545 \n", "1 0.714286 \n", "2 0.173913 \n", "3 0.666667 \n", "4 0.857143 \n", ".. ... \n", "56 0.666667 \n", "57 0.600000 \n", "58 0.428571 \n", "59 0.769231 \n", "60 0.578947 \n", "\n", "[61 rows x 5 columns]" ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "calls_sms_features(df_calls, df_sms)" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "straw2analysis", "language": "python", "name": "straw2analysis" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.6" } }, "nbformat": 4, "nbformat_minor": 2 }