From 08780c35cb72ae22ab33667e59f7973b02ef20b2 Mon Sep 17 00:00:00 2001 From: katya96 Date: Mon, 14 Sep 2020 13:43:18 +0200 Subject: [PATCH 1/2] added new file for participants who did not do most of sessions --- ...ants_who_did_not_do_most_of_sessions.ipynb | 41 +++++++++++++++++++ 1 file changed, 41 insertions(+) create mode 100644 scripts/cov_participants_who_did_not_do_most_of_sessions.ipynb diff --git a/scripts/cov_participants_who_did_not_do_most_of_sessions.ipynb b/scripts/cov_participants_who_did_not_do_most_of_sessions.ipynb new file mode 100644 index 0000000..e33a08f --- /dev/null +++ b/scripts/cov_participants_who_did_not_do_most_of_sessions.ipynb @@ -0,0 +1,41 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.4" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} -- GitLab From d82330b44e0fa7c5dec70f8d9402cb4fdf95bc73 Mon Sep 17 00:00:00 2001 From: katya96 Date: Wed, 16 Sep 2020 08:40:58 +0200 Subject: [PATCH 2/2] changes to cov_participants_who_did_not_do_most_of_sessions --- ...d_not_do_most_of_sessions-checkpoint.ipynb | 1078 +++++++++++++++++ .../__pycache__/cov_functions.cpython-37.pyc | Bin 9791 -> 9804 bytes ...ants_who_did_not_do_most_of_sessions.ipynb | 1041 +++++++++++++++- scripts/cov_preprocess.ipynb | 6 +- 4 files changed, 2120 insertions(+), 5 deletions(-) create mode 100644 scripts/.ipynb_checkpoints/cov_participants_who_did_not_do_most_of_sessions-checkpoint.ipynb diff --git 
a/scripts/.ipynb_checkpoints/cov_participants_who_did_not_do_most_of_sessions-checkpoint.ipynb b/scripts/.ipynb_checkpoints/cov_participants_who_did_not_do_most_of_sessions-checkpoint.ipynb new file mode 100644 index 0000000..33bf102 --- /dev/null +++ b/scripts/.ipynb_checkpoints/cov_participants_who_did_not_do_most_of_sessions-checkpoint.ipynb @@ -0,0 +1,1078 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Description: \n", + "\n", + "1. loading participants' data from sessions 8 to 11\n", + "2. filtering them for only APPROVED\n", + "3. if their participation was approved, setting it to 1 \n", + "4. merging data frames for different sessions, setting 0 for cases when participation was not approved" + ] + }, + { + "cell_type": "code", + "execution_count": 53, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd\n", + "import numpy as np\n", + "from cov_functions import *\n", + "import logging as lg\n", + "import logging.handlers\n", + "import os \n", + "from functools import reduce" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Loading session 8 " + ] + }, + { + "cell_type": "code", + "execution_count": 54, + "metadata": {}, + "outputs": [], + "source": [ + "conf = {\"session\": 8,\n", + " \"session_type\": \"long\"\n", + " }" + ] + }, + { + "cell_type": "code", + "execution_count": 55, + "metadata": {}, + "outputs": [], + "source": [ + "data_path = os.path.join(\"../../data/session\"+str(conf[\"session\"])+\"/\")\n", + "# Set up a specific logger with our desired output level\n", + "lg.basicConfig(filename=data_path+'log.txt',level=logging.INFO)\n", + "lg.info(\"\")\n", + "lg.info(\" LOG START\")\n", + "prolific_uk_d = pd.read_csv(data_path+\"prolific_data_uk.csv\")\n", + "prolific_be_d = pd.read_csv(data_path+\"prolific_data_be.csv\")\n", + "frames = [prolific_uk_d, prolific_be_d]\n", + "\n", + "prolific_d = pd.concat(frames)\n", + "\n", + "# 1. 
Clean prolific data\n", + "prolific_d = prolific_d.set_index(\"participant_id\", drop= True)\n", + "\n", + "# change index label to PROLIFICID\n", + "new_index = prolific_d.index.rename('PROLIFICID')\n", + "prolific_d.index = new_index\n", + "\n", + "session8 = prolific_d\n", + "session8 = session8[session8.status ==\"APPROVED\"]\n", + "session8 = session8['status']\n", + "session8 = session8.to_frame()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Function that changes values of approved rows to 1" + ] + }, + { + "cell_type": "code", + "execution_count": 56, + "metadata": {}, + "outputs": [], + "source": [ + "def ids(status):\n", + " if status == 'APPROVED':\n", + " return 1.0\n", + " else: \n", + " return 0.0" + ] + }, + { + "cell_type": "code", + "execution_count": 57, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
PROLIFICIDsession8
05cae6a77b38ea60016e548891.0
156ca0400b30699000bd9d94f1.0
25dd59fe0a6438056ac3973821.0
35caccbc4976d010014b9cd9d1.0
45e3deeeb387fb9000abb714c1.0
.........
3295ea8049b3698931ef59db2271.0
3305ea68597086c7251f22a528e1.0
3315ea6c3016666f50351c718761.0
3325ea93292936cd300093792151.0
3335ea87b7a3de5172c19d4c8a01.0
\n", + "

334 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " PROLIFICID session8\n", + "0 5cae6a77b38ea60016e54889 1.0\n", + "1 56ca0400b30699000bd9d94f 1.0\n", + "2 5dd59fe0a6438056ac397382 1.0\n", + "3 5caccbc4976d010014b9cd9d 1.0\n", + "4 5e3deeeb387fb9000abb714c 1.0\n", + ".. ... ...\n", + "329 5ea8049b3698931ef59db227 1.0\n", + "330 5ea68597086c7251f22a528e 1.0\n", + "331 5ea6c3016666f50351c71876 1.0\n", + "332 5ea93292936cd30009379215 1.0\n", + "333 5ea87b7a3de5172c19d4c8a0 1.0\n", + "\n", + "[334 rows x 2 columns]" + ] + }, + "execution_count": 57, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "session8 = session8['status'].apply(lambda status: ids(status))\n", + "session8 = session8.to_frame()\n", + "session8.reset_index(inplace = True)\n", + "session8.rename(columns={'status':'session8'}, inplace=True)\n", + "session8" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Loading session 9" + ] + }, + { + "cell_type": "code", + "execution_count": 58, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
PROLIFICIDsession9
05c584e854e32ef00014af6851.0
15dc3224ff3795b23e5ec7c651.0
25d7c060606189b0017ba79c91.0
35e87376eb4921a37c33affb41.0
45e932b48bb285314d5ed56ba1.0
.........
3295ea56ecd5d022354cb1c061e1.0
3305ea93292936cd300093792151.0
3315ea1e8daeebbed0dabdaee6d1.0
3325ea30b6232a8c709ed3c645e1.0
3335ea8049b3698931ef59db2271.0
\n", + "

334 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " PROLIFICID session9\n", + "0 5c584e854e32ef00014af685 1.0\n", + "1 5dc3224ff3795b23e5ec7c65 1.0\n", + "2 5d7c060606189b0017ba79c9 1.0\n", + "3 5e87376eb4921a37c33affb4 1.0\n", + "4 5e932b48bb285314d5ed56ba 1.0\n", + ".. ... ...\n", + "329 5ea56ecd5d022354cb1c061e 1.0\n", + "330 5ea93292936cd30009379215 1.0\n", + "331 5ea1e8daeebbed0dabdaee6d 1.0\n", + "332 5ea30b6232a8c709ed3c645e 1.0\n", + "333 5ea8049b3698931ef59db227 1.0\n", + "\n", + "[334 rows x 2 columns]" + ] + }, + "execution_count": 58, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "conf = {\"session\": 9,\n", + " \"session_type\": \"short\"\n", + " }\n", + "data_path = os.path.join(\"../../data/session\"+str(conf[\"session\"])+\"/\")\n", + "# Set up a specific logger with our desired output level\n", + "lg.basicConfig(filename=data_path+'log.txt',level=logging.INFO)\n", + "lg.info(\"\")\n", + "lg.info(\" LOG START\")\n", + "prolific_uk_d = pd.read_csv(data_path+\"prolific_data_uk.csv\")\n", + "prolific_be_d = pd.read_csv(data_path+\"prolific_data_be.csv\")\n", + "frames = [prolific_uk_d, prolific_be_d]\n", + "\n", + "prolific_d = pd.concat(frames)\n", + "\n", + "# 1. 
Clean prolific data\n", + "prolific_d = prolific_d.set_index(\"participant_id\", drop= True)\n", + "\n", + "# change index label to PROLIFICID\n", + "new_index = prolific_d.index.rename('PROLIFICID')\n", + "prolific_d.index = new_index\n", + "\n", + "session9 = prolific_d\n", + "session9 = session9[session9.status ==\"APPROVED\"]\n", + "session9 = session9['status']\n", + "session9 = session9.to_frame()\n", + "session9 = session9['status'].apply(lambda status: ids(status))\n", + "session9 = session9.to_frame()\n", + "session9.reset_index(inplace = True)\n", + "session9.rename(columns={'status':'session9'}, inplace=True)\n", + "session9" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Loading session 10" + ] + }, + { + "cell_type": "code", + "execution_count": 59, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
PROLIFICIDsession10
05d9b55b519e9b6001550cf9f1.0
15c58a9908f34eb00015748671.0
25ddf87d7952798000c74a4781.0
35d920df12b679a00182bbc731.0
45e1b2b3e4a955b350b1e0a631.0
.........
3285ea72a2e0120e60efc328d9d1.0
3295ea68597086c7251f22a528e1.0
3305ea160b5485d2e00092fd2e21.0
3315ea6c3016666f50351c718761.0
3325ea84aca3297e825a9d92aa51.0
\n", + "

333 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " PROLIFICID session10\n", + "0 5d9b55b519e9b6001550cf9f 1.0\n", + "1 5c58a9908f34eb0001574867 1.0\n", + "2 5ddf87d7952798000c74a478 1.0\n", + "3 5d920df12b679a00182bbc73 1.0\n", + "4 5e1b2b3e4a955b350b1e0a63 1.0\n", + ".. ... ...\n", + "328 5ea72a2e0120e60efc328d9d 1.0\n", + "329 5ea68597086c7251f22a528e 1.0\n", + "330 5ea160b5485d2e00092fd2e2 1.0\n", + "331 5ea6c3016666f50351c71876 1.0\n", + "332 5ea84aca3297e825a9d92aa5 1.0\n", + "\n", + "[333 rows x 2 columns]" + ] + }, + "execution_count": 59, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "conf = {\"session\": 10,\n", + " \"session_type\": \"short\"\n", + " }\n", + "data_path = os.path.join(\"../../data/session\"+str(conf[\"session\"])+\"/\")\n", + "# Set up a specific logger with our desired output level\n", + "lg.basicConfig(filename=data_path+'log.txt',level=logging.INFO)\n", + "lg.info(\"\")\n", + "lg.info(\" LOG START\")\n", + "prolific_uk_d = pd.read_csv(data_path+\"prolific_data_uk.csv\")\n", + "prolific_be_d = pd.read_csv(data_path+\"prolific_data_be.csv\")\n", + "frames = [prolific_uk_d, prolific_be_d]\n", + "\n", + "prolific_d = pd.concat(frames)\n", + "\n", + "# 1. 
Clean prolific data\n", + "prolific_d = prolific_d.set_index(\"participant_id\", drop= True)\n", + "\n", + "# change index label to PROLIFICID\n", + "new_index = prolific_d.index.rename('PROLIFICID')\n", + "prolific_d.index = new_index\n", + "\n", + "session10 = prolific_d\n", + "session10 = session10[session10.status ==\"APPROVED\"]\n", + "session10 = session10['status']\n", + "session10 = session10.to_frame()\n", + "session10 = session10['status'].apply(lambda status: ids(status))\n", + "session10 = session10.to_frame()\n", + "session10.reset_index(inplace = True)\n", + "session10.rename(columns={'status':'session10'}, inplace=True)\n", + "session10" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Loading session 11" + ] + }, + { + "cell_type": "code", + "execution_count": 60, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
PROLIFICIDsession11
05e5ad8d315b8d42db10b84ce1.0
15d9b55b519e9b6001550cf9f1.0
25d7c060606189b0017ba79c91.0
35e81c1359984aa89fe6b8c131.0
45e4875f3110b3730eefa32a11.0
.........
3185ea17128cc936f013db64e701.0
3195ea04e98271c1b03ee09cbac1.0
3205ea8049b3698931ef59db2271.0
3215eaafa4b9f58200867cb6cc81.0
3225ea84aca3297e825a9d92aa51.0
\n", + "

323 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " PROLIFICID session11\n", + "0 5e5ad8d315b8d42db10b84ce 1.0\n", + "1 5d9b55b519e9b6001550cf9f 1.0\n", + "2 5d7c060606189b0017ba79c9 1.0\n", + "3 5e81c1359984aa89fe6b8c13 1.0\n", + "4 5e4875f3110b3730eefa32a1 1.0\n", + ".. ... ...\n", + "318 5ea17128cc936f013db64e70 1.0\n", + "319 5ea04e98271c1b03ee09cbac 1.0\n", + "320 5ea8049b3698931ef59db227 1.0\n", + "321 5eaafa4b9f58200867cb6cc8 1.0\n", + "322 5ea84aca3297e825a9d92aa5 1.0\n", + "\n", + "[323 rows x 2 columns]" + ] + }, + "execution_count": 60, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "conf = {\"session\": 11,\n", + " \"session_type\": \"short\"\n", + " }\n", + "data_path = os.path.join(\"../../data/session\"+str(conf[\"session\"])+\"/\")\n", + "# Set up a specific logger with our desired output level\n", + "lg.basicConfig(filename=data_path+'log.txt',level=logging.INFO)\n", + "lg.info(\"\")\n", + "lg.info(\" LOG START\")\n", + "prolific_uk_d = pd.read_csv(data_path+\"prolific_data_uk.csv\")\n", + "prolific_be_d = pd.read_csv(data_path+\"prolific_data_be.csv\")\n", + "frames = [prolific_uk_d, prolific_be_d]\n", + "\n", + "prolific_d = pd.concat(frames)\n", + "\n", + "# 1. 
Clean prolific data\n", + "prolific_d = prolific_d.set_index(\"participant_id\", drop= True)\n", + "\n", + "# change index label to PROLIFICID\n", + "new_index = prolific_d.index.rename('PROLIFICID')\n", + "prolific_d.index = new_index\n", + "\n", + "session11 = prolific_d\n", + "session11 = session11[session11.status ==\"APPROVED\"]\n", + "session11 = session11['status']\n", + "session11 = session11.to_frame()\n", + "session11 = session11['status'].apply(lambda status: ids(status))\n", + "session11 = session11.to_frame()\n", + "session11.reset_index(inplace = True)\n", + "session11.rename(columns={'status':'session11'}, inplace=True)\n", + "session11" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Making one data frame, where for each ID for each session 1 corresponds to approved and 0 - not approved " + ] + }, + { + "cell_type": "code", + "execution_count": 61, + "metadata": {}, + "outputs": [], + "source": [ + "sessions = [session8, session9, session10, session11]" + ] + }, + { + "cell_type": "code", + "execution_count": 62, + "metadata": {}, + "outputs": [], + "source": [ + "sessions = reduce(lambda left,right: pd.merge(left,right,on=['PROLIFICID'], how='left'), sessions).fillna(0)" + ] + }, + { + "cell_type": "code", + "execution_count": 63, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
PROLIFICIDsession8session9session10session11
05cae6a77b38ea60016e548891.01.01.01.0
156ca0400b30699000bd9d94f1.01.01.01.0
25dd59fe0a6438056ac3973821.01.01.01.0
35caccbc4976d010014b9cd9d1.01.01.01.0
45e3deeeb387fb9000abb714c1.01.01.01.0
..................
3435ea8049b3698931ef59db2271.01.01.01.0
3445ea68597086c7251f22a528e1.01.01.01.0
3455ea6c3016666f50351c718761.01.01.01.0
3465ea93292936cd300093792151.01.01.00.0
3475ea87b7a3de5172c19d4c8a01.01.01.01.0
\n", + "

348 rows × 5 columns

\n", + "
" + ], + "text/plain": [ + " PROLIFICID session8 session9 session10 session11\n", + "0 5cae6a77b38ea60016e54889 1.0 1.0 1.0 1.0\n", + "1 56ca0400b30699000bd9d94f 1.0 1.0 1.0 1.0\n", + "2 5dd59fe0a6438056ac397382 1.0 1.0 1.0 1.0\n", + "3 5caccbc4976d010014b9cd9d 1.0 1.0 1.0 1.0\n", + "4 5e3deeeb387fb9000abb714c 1.0 1.0 1.0 1.0\n", + ".. ... ... ... ... ...\n", + "343 5ea8049b3698931ef59db227 1.0 1.0 1.0 1.0\n", + "344 5ea68597086c7251f22a528e 1.0 1.0 1.0 1.0\n", + "345 5ea6c3016666f50351c71876 1.0 1.0 1.0 1.0\n", + "346 5ea93292936cd30009379215 1.0 1.0 1.0 0.0\n", + "347 5ea87b7a3de5172c19d4c8a0 1.0 1.0 1.0 1.0\n", + "\n", + "[348 rows x 5 columns]" + ] + }, + "execution_count": 63, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "sessions" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Example: who did not complete session 11? And did they complete everything before?" + ] + }, + { + "cell_type": "code", + "execution_count": 74, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
PROLIFICIDsession8session9session10session11
475d9452e023002d001c67bab11.01.01.00.0
495e55385c54a6e7538c5bb5201.01.01.00.0
915c4b85a1dccaa800016b48211.01.01.00.0
2105e6783d865bd0b02409232991.00.00.00.0
2255dcc0649569be3899fe354f41.00.00.00.0
2275e7526bb07e4020883985d8b1.01.01.00.0
2295e33505e22d9f63318bec9881.01.00.00.0
2515e8f9fa62bc9102ab65190c31.01.01.00.0
2535e6d492f9d747603af5bb8681.01.01.00.0
2575e39ff812eb93d21c8cc140e1.01.01.00.0
3225ea039657736ed000b52576f1.01.01.00.0
3235eaa98e194138d012d5119591.00.00.00.0
3315ea31a3159f5e90eef5bab2c1.01.01.00.0
3375ea81268503624028c06218c1.01.01.00.0
3465ea93292936cd300093792151.01.01.00.0
\n", + "
" + ], + "text/plain": [ + " PROLIFICID session8 session9 session10 session11\n", + "47 5d9452e023002d001c67bab1 1.0 1.0 1.0 0.0\n", + "49 5e55385c54a6e7538c5bb520 1.0 1.0 1.0 0.0\n", + "91 5c4b85a1dccaa800016b4821 1.0 1.0 1.0 0.0\n", + "210 5e6783d865bd0b0240923299 1.0 0.0 0.0 0.0\n", + "225 5dcc0649569be3899fe354f4 1.0 0.0 0.0 0.0\n", + "227 5e7526bb07e4020883985d8b 1.0 1.0 1.0 0.0\n", + "229 5e33505e22d9f63318bec988 1.0 1.0 0.0 0.0\n", + "251 5e8f9fa62bc9102ab65190c3 1.0 1.0 1.0 0.0\n", + "253 5e6d492f9d747603af5bb868 1.0 1.0 1.0 0.0\n", + "257 5e39ff812eb93d21c8cc140e 1.0 1.0 1.0 0.0\n", + "322 5ea039657736ed000b52576f 1.0 1.0 1.0 0.0\n", + "323 5eaa98e194138d012d511959 1.0 0.0 0.0 0.0\n", + "331 5ea31a3159f5e90eef5bab2c 1.0 1.0 1.0 0.0\n", + "337 5ea81268503624028c06218c 1.0 1.0 1.0 0.0\n", + "346 5ea93292936cd30009379215 1.0 1.0 1.0 0.0" + ] + }, + "execution_count": 74, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "sessions[sessions['session11'] == 0]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.4" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/scripts/__pycache__/cov_functions.cpython-37.pyc b/scripts/__pycache__/cov_functions.cpython-37.pyc index a73c4394cea55822ce152d4ba4edea5eccd5365d..c6c62a092176c653bc4b5724e9cd43f3141751f1 100755 GIT binary patch delta 397 zcmWm8%Sr-K7y#h@8E;7nA%v)*qZvqPxe%gUWswWJnier(C+AE}UdGNGyU;RPwGqxH ze1(vRd4QHd1hqa7(F@d~Isf8=|H}VX`K$z20|Eb-6HE0*BeC)te3aL!rDe5dVPdH* zL~oILZIV`k;5MRIOIWn8>uSfO=a@8fv#nvGHq9$T%jy^r)oK!>M=h0o%kRM1lPezP 
z@>vscAL@2Z>YU&n-6S1EIs0-|K(S-)!30F@(PYdE3-(8N7ocdzBI^>&+o!RL40-z{ z9+pB!&Xe5J?;4kVOvasrq#0Kf$gw}AFr5`$Nu%6nQKD0$gSnUBUK=$rS!7$u1mu~S zEWswTlN)fvev@T)PVBI9s^Hlc=l0lrDg!%glnQ66qOdQh3F?9a!Jz|p8QP7-C4-V< v_LGXjiS3_x02s1CIs$j>IX#!162r2rcMRe4H_A@=_Lgi74juQ0VUQef1ZT%+X7 z=r#F(k~`zA$sEcatlB{3QIkWJP1$@v8vQ3vP}X$v1sTYanNneNiz&q@ilewBzPL0A z=z#!`nm`Z{1R{b#LPx# diff --git a/scripts/cov_participants_who_did_not_do_most_of_sessions.ipynb b/scripts/cov_participants_who_did_not_do_most_of_sessions.ipynb index e33a08f..33bf102 100644 --- a/scripts/cov_participants_who_did_not_do_most_of_sessions.ipynb +++ b/scripts/cov_participants_who_did_not_do_most_of_sessions.ipynb @@ -1,12 +1,1049 @@ { "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Description: \n", + "\n", + "1. loading participants' data from sessions 8 to 11\n", + "2. filtering them for only APPROVED\n", + "3. if their participation was approved, setting it to 1 \n", + "4. merging data frames for different sessions, setting 0 for cases when participation was not approved" + ] + }, + { + "cell_type": "code", + "execution_count": 53, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd\n", + "import numpy as np\n", + "from cov_functions import *\n", + "import logging as lg\n", + "import logging.handlers\n", + "import os \n", + "from functools import reduce" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Loading session 8 " + ] + }, + { + "cell_type": "code", + "execution_count": 54, + "metadata": {}, + "outputs": [], + "source": [ + "conf = {\"session\": 8,\n", + " \"session_type\": \"long\"\n", + " }" + ] + }, + { + "cell_type": "code", + "execution_count": 55, + "metadata": {}, + "outputs": [], + "source": [ + "data_path = os.path.join(\"../../data/session\"+str(conf[\"session\"])+\"/\")\n", + "# Set up a specific logger with our desired output level\n", + "lg.basicConfig(filename=data_path+'log.txt',level=logging.INFO)\n", + 
"lg.info(\"\")\n", + "lg.info(\" LOG START\")\n", + "prolific_uk_d = pd.read_csv(data_path+\"prolific_data_uk.csv\")\n", + "prolific_be_d = pd.read_csv(data_path+\"prolific_data_be.csv\")\n", + "frames = [prolific_uk_d, prolific_be_d]\n", + "\n", + "prolific_d = pd.concat(frames)\n", + "\n", + "# 1. Clean prolific data\n", + "prolific_d = prolific_d.set_index(\"participant_id\", drop= True)\n", + "\n", + "# change index label to PROLIFICID\n", + "new_index = prolific_d.index.rename('PROLIFICID')\n", + "prolific_d.index = new_index\n", + "\n", + "session8 = prolific_d\n", + "session8 = session8[session8.status ==\"APPROVED\"]\n", + "session8 = session8['status']\n", + "session8 = session8.to_frame()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Function that changes values of approved rows to 1" + ] + }, { "cell_type": "code", - "execution_count": 1, + "execution_count": 56, "metadata": {}, "outputs": [], "source": [ - "import pandas as pd" + "def ids(status):\n", + " if status == 'APPROVED':\n", + " return 1.0\n", + " else: \n", + " return 0.0" + ] + }, + { + "cell_type": "code", + "execution_count": 57, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
PROLIFICIDsession8
05cae6a77b38ea60016e548891.0
156ca0400b30699000bd9d94f1.0
25dd59fe0a6438056ac3973821.0
35caccbc4976d010014b9cd9d1.0
45e3deeeb387fb9000abb714c1.0
.........
3295ea8049b3698931ef59db2271.0
3305ea68597086c7251f22a528e1.0
3315ea6c3016666f50351c718761.0
3325ea93292936cd300093792151.0
3335ea87b7a3de5172c19d4c8a01.0
\n", + "

334 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " PROLIFICID session8\n", + "0 5cae6a77b38ea60016e54889 1.0\n", + "1 56ca0400b30699000bd9d94f 1.0\n", + "2 5dd59fe0a6438056ac397382 1.0\n", + "3 5caccbc4976d010014b9cd9d 1.0\n", + "4 5e3deeeb387fb9000abb714c 1.0\n", + ".. ... ...\n", + "329 5ea8049b3698931ef59db227 1.0\n", + "330 5ea68597086c7251f22a528e 1.0\n", + "331 5ea6c3016666f50351c71876 1.0\n", + "332 5ea93292936cd30009379215 1.0\n", + "333 5ea87b7a3de5172c19d4c8a0 1.0\n", + "\n", + "[334 rows x 2 columns]" + ] + }, + "execution_count": 57, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "session8 = session8['status'].apply(lambda status: ids(status))\n", + "session8 = session8.to_frame()\n", + "session8.reset_index(inplace = True)\n", + "session8.rename(columns={'status':'session8'}, inplace=True)\n", + "session8" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Loading session 9" + ] + }, + { + "cell_type": "code", + "execution_count": 58, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
PROLIFICIDsession9
05c584e854e32ef00014af6851.0
15dc3224ff3795b23e5ec7c651.0
25d7c060606189b0017ba79c91.0
35e87376eb4921a37c33affb41.0
45e932b48bb285314d5ed56ba1.0
.........
3295ea56ecd5d022354cb1c061e1.0
3305ea93292936cd300093792151.0
3315ea1e8daeebbed0dabdaee6d1.0
3325ea30b6232a8c709ed3c645e1.0
3335ea8049b3698931ef59db2271.0
\n", + "

334 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " PROLIFICID session9\n", + "0 5c584e854e32ef00014af685 1.0\n", + "1 5dc3224ff3795b23e5ec7c65 1.0\n", + "2 5d7c060606189b0017ba79c9 1.0\n", + "3 5e87376eb4921a37c33affb4 1.0\n", + "4 5e932b48bb285314d5ed56ba 1.0\n", + ".. ... ...\n", + "329 5ea56ecd5d022354cb1c061e 1.0\n", + "330 5ea93292936cd30009379215 1.0\n", + "331 5ea1e8daeebbed0dabdaee6d 1.0\n", + "332 5ea30b6232a8c709ed3c645e 1.0\n", + "333 5ea8049b3698931ef59db227 1.0\n", + "\n", + "[334 rows x 2 columns]" + ] + }, + "execution_count": 58, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "conf = {\"session\": 9,\n", + " \"session_type\": \"short\"\n", + " }\n", + "data_path = os.path.join(\"../../data/session\"+str(conf[\"session\"])+\"/\")\n", + "# Set up a specific logger with our desired output level\n", + "lg.basicConfig(filename=data_path+'log.txt',level=logging.INFO)\n", + "lg.info(\"\")\n", + "lg.info(\" LOG START\")\n", + "prolific_uk_d = pd.read_csv(data_path+\"prolific_data_uk.csv\")\n", + "prolific_be_d = pd.read_csv(data_path+\"prolific_data_be.csv\")\n", + "frames = [prolific_uk_d, prolific_be_d]\n", + "\n", + "prolific_d = pd.concat(frames)\n", + "\n", + "# 1. 
Clean prolific data\n", + "prolific_d = prolific_d.set_index(\"participant_id\", drop= True)\n", + "\n", + "# change index label to PROLIFICID\n", + "new_index = prolific_d.index.rename('PROLIFICID')\n", + "prolific_d.index = new_index\n", + "\n", + "session9 = prolific_d\n", + "session9 = session9[session9.status ==\"APPROVED\"]\n", + "session9 = session9['status']\n", + "session9 = session9.to_frame()\n", + "session9 = session9['status'].apply(lambda status: ids(status))\n", + "session9 = session9.to_frame()\n", + "session9.reset_index(inplace = True)\n", + "session9.rename(columns={'status':'session9'}, inplace=True)\n", + "session9" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Loading session 10" + ] + }, + { + "cell_type": "code", + "execution_count": 59, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
PROLIFICIDsession10
05d9b55b519e9b6001550cf9f1.0
15c58a9908f34eb00015748671.0
25ddf87d7952798000c74a4781.0
35d920df12b679a00182bbc731.0
45e1b2b3e4a955b350b1e0a631.0
.........
3285ea72a2e0120e60efc328d9d1.0
3295ea68597086c7251f22a528e1.0
3305ea160b5485d2e00092fd2e21.0
3315ea6c3016666f50351c718761.0
3325ea84aca3297e825a9d92aa51.0
\n", + "

333 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " PROLIFICID session10\n", + "0 5d9b55b519e9b6001550cf9f 1.0\n", + "1 5c58a9908f34eb0001574867 1.0\n", + "2 5ddf87d7952798000c74a478 1.0\n", + "3 5d920df12b679a00182bbc73 1.0\n", + "4 5e1b2b3e4a955b350b1e0a63 1.0\n", + ".. ... ...\n", + "328 5ea72a2e0120e60efc328d9d 1.0\n", + "329 5ea68597086c7251f22a528e 1.0\n", + "330 5ea160b5485d2e00092fd2e2 1.0\n", + "331 5ea6c3016666f50351c71876 1.0\n", + "332 5ea84aca3297e825a9d92aa5 1.0\n", + "\n", + "[333 rows x 2 columns]" + ] + }, + "execution_count": 59, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "conf = {\"session\": 10,\n", + " \"session_type\": \"short\"\n", + " }\n", + "data_path = os.path.join(\"../../data/session\"+str(conf[\"session\"])+\"/\")\n", + "# Set up a specific logger with our desired output level\n", + "lg.basicConfig(filename=data_path+'log.txt',level=logging.INFO)\n", + "lg.info(\"\")\n", + "lg.info(\" LOG START\")\n", + "prolific_uk_d = pd.read_csv(data_path+\"prolific_data_uk.csv\")\n", + "prolific_be_d = pd.read_csv(data_path+\"prolific_data_be.csv\")\n", + "frames = [prolific_uk_d, prolific_be_d]\n", + "\n", + "prolific_d = pd.concat(frames)\n", + "\n", + "# 1. 
Clean prolific data\n", + "prolific_d = prolific_d.set_index(\"participant_id\", drop= True)\n", + "\n", + "# change index label to PROLIFICID\n", + "new_index = prolific_d.index.rename('PROLIFICID')\n", + "prolific_d.index = new_index\n", + "\n", + "session10 = prolific_d\n", + "session10 = session10[session10.status ==\"APPROVED\"]\n", + "session10 = session10['status']\n", + "session10 = session10.to_frame()\n", + "session10 = session10['status'].apply(lambda status: ids(status))\n", + "session10 = session10.to_frame()\n", + "session10.reset_index(inplace = True)\n", + "session10.rename(columns={'status':'session10'}, inplace=True)\n", + "session10" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Loading session 11" + ] + }, + { + "cell_type": "code", + "execution_count": 60, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
PROLIFICIDsession11
05e5ad8d315b8d42db10b84ce1.0
15d9b55b519e9b6001550cf9f1.0
25d7c060606189b0017ba79c91.0
35e81c1359984aa89fe6b8c131.0
45e4875f3110b3730eefa32a11.0
.........
3185ea17128cc936f013db64e701.0
3195ea04e98271c1b03ee09cbac1.0
3205ea8049b3698931ef59db2271.0
3215eaafa4b9f58200867cb6cc81.0
3225ea84aca3297e825a9d92aa51.0
\n", + "

323 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " PROLIFICID session11\n", + "0 5e5ad8d315b8d42db10b84ce 1.0\n", + "1 5d9b55b519e9b6001550cf9f 1.0\n", + "2 5d7c060606189b0017ba79c9 1.0\n", + "3 5e81c1359984aa89fe6b8c13 1.0\n", + "4 5e4875f3110b3730eefa32a1 1.0\n", + ".. ... ...\n", + "318 5ea17128cc936f013db64e70 1.0\n", + "319 5ea04e98271c1b03ee09cbac 1.0\n", + "320 5ea8049b3698931ef59db227 1.0\n", + "321 5eaafa4b9f58200867cb6cc8 1.0\n", + "322 5ea84aca3297e825a9d92aa5 1.0\n", + "\n", + "[323 rows x 2 columns]" + ] + }, + "execution_count": 60, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "conf = {\"session\": 11,\n", + " \"session_type\": \"short\"\n", + " }\n", + "data_path = os.path.join(\"../../data/session\"+str(conf[\"session\"])+\"/\")\n", + "# Set up a specific logger with our desired output level\n", + "lg.basicConfig(filename=data_path+'log.txt',level=logging.INFO)\n", + "lg.info(\"\")\n", + "lg.info(\" LOG START\")\n", + "prolific_uk_d = pd.read_csv(data_path+\"prolific_data_uk.csv\")\n", + "prolific_be_d = pd.read_csv(data_path+\"prolific_data_be.csv\")\n", + "frames = [prolific_uk_d, prolific_be_d]\n", + "\n", + "prolific_d = pd.concat(frames)\n", + "\n", + "# 1. 
Clean prolific data\n", + "prolific_d = prolific_d.set_index(\"participant_id\", drop= True)\n", + "\n", + "# change index label to PROLIFICID\n", + "new_index = prolific_d.index.rename('PROLIFICID')\n", + "prolific_d.index = new_index\n", + "\n", + "session11 = prolific_d\n", + "session11 = session11[session11.status ==\"APPROVED\"]\n", + "session11 = session11['status']\n", + "session11 = session11.to_frame()\n", + "session11 = session11['status'].apply(lambda status: ids(status))\n", + "session11 = session11.to_frame()\n", + "session11.reset_index(inplace = True)\n", + "session11.rename(columns={'status':'session11'}, inplace=True)\n", + "session11" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Building one data frame with one row per participant ID in `session8` (later sessions are left-merged onto it): for each session, 1 means approved and 0 means not approved" + ] + }, + { + "cell_type": "code", + "execution_count": 61, + "metadata": {}, + "outputs": [], + "source": [ + "sessions = [session8, session9, session10, session11]" + ] + }, + { + "cell_type": "code", + "execution_count": 62, + "metadata": {}, + "outputs": [], + "source": [ + "sessions = reduce(lambda left,right: pd.merge(left,right,on=['PROLIFICID'], how='left'), sessions).fillna(0)" + ] + }, + { + "cell_type": "code", + "execution_count": 63, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
PROLIFICIDsession8session9session10session11
05cae6a77b38ea60016e548891.01.01.01.0
156ca0400b30699000bd9d94f1.01.01.01.0
25dd59fe0a6438056ac3973821.01.01.01.0
35caccbc4976d010014b9cd9d1.01.01.01.0
45e3deeeb387fb9000abb714c1.01.01.01.0
..................
3435ea8049b3698931ef59db2271.01.01.01.0
3445ea68597086c7251f22a528e1.01.01.01.0
3455ea6c3016666f50351c718761.01.01.01.0
3465ea93292936cd300093792151.01.01.00.0
3475ea87b7a3de5172c19d4c8a01.01.01.01.0
\n", + "

348 rows × 5 columns

\n", + "
" + ], + "text/plain": [ + " PROLIFICID session8 session9 session10 session11\n", + "0 5cae6a77b38ea60016e54889 1.0 1.0 1.0 1.0\n", + "1 56ca0400b30699000bd9d94f 1.0 1.0 1.0 1.0\n", + "2 5dd59fe0a6438056ac397382 1.0 1.0 1.0 1.0\n", + "3 5caccbc4976d010014b9cd9d 1.0 1.0 1.0 1.0\n", + "4 5e3deeeb387fb9000abb714c 1.0 1.0 1.0 1.0\n", + ".. ... ... ... ... ...\n", + "343 5ea8049b3698931ef59db227 1.0 1.0 1.0 1.0\n", + "344 5ea68597086c7251f22a528e 1.0 1.0 1.0 1.0\n", + "345 5ea6c3016666f50351c71876 1.0 1.0 1.0 1.0\n", + "346 5ea93292936cd30009379215 1.0 1.0 1.0 0.0\n", + "347 5ea87b7a3de5172c19d4c8a0 1.0 1.0 1.0 1.0\n", + "\n", + "[348 rows x 5 columns]" + ] + }, + "execution_count": 63, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "sessions" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Example: who did not complete session 11? And did they complete everything before?" + ] + }, + { + "cell_type": "code", + "execution_count": 74, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
PROLIFICIDsession8session9session10session11
475d9452e023002d001c67bab11.01.01.00.0
495e55385c54a6e7538c5bb5201.01.01.00.0
915c4b85a1dccaa800016b48211.01.01.00.0
2105e6783d865bd0b02409232991.00.00.00.0
2255dcc0649569be3899fe354f41.00.00.00.0
2275e7526bb07e4020883985d8b1.01.01.00.0
2295e33505e22d9f63318bec9881.01.00.00.0
2515e8f9fa62bc9102ab65190c31.01.01.00.0
2535e6d492f9d747603af5bb8681.01.01.00.0
2575e39ff812eb93d21c8cc140e1.01.01.00.0
3225ea039657736ed000b52576f1.01.01.00.0
3235eaa98e194138d012d5119591.00.00.00.0
3315ea31a3159f5e90eef5bab2c1.01.01.00.0
3375ea81268503624028c06218c1.01.01.00.0
3465ea93292936cd300093792151.01.01.00.0
\n", + "
" + ], + "text/plain": [ + " PROLIFICID session8 session9 session10 session11\n", + "47 5d9452e023002d001c67bab1 1.0 1.0 1.0 0.0\n", + "49 5e55385c54a6e7538c5bb520 1.0 1.0 1.0 0.0\n", + "91 5c4b85a1dccaa800016b4821 1.0 1.0 1.0 0.0\n", + "210 5e6783d865bd0b0240923299 1.0 0.0 0.0 0.0\n", + "225 5dcc0649569be3899fe354f4 1.0 0.0 0.0 0.0\n", + "227 5e7526bb07e4020883985d8b 1.0 1.0 1.0 0.0\n", + "229 5e33505e22d9f63318bec988 1.0 1.0 0.0 0.0\n", + "251 5e8f9fa62bc9102ab65190c3 1.0 1.0 1.0 0.0\n", + "253 5e6d492f9d747603af5bb868 1.0 1.0 1.0 0.0\n", + "257 5e39ff812eb93d21c8cc140e 1.0 1.0 1.0 0.0\n", + "322 5ea039657736ed000b52576f 1.0 1.0 1.0 0.0\n", + "323 5eaa98e194138d012d511959 1.0 0.0 0.0 0.0\n", + "331 5ea31a3159f5e90eef5bab2c 1.0 1.0 1.0 0.0\n", + "337 5ea81268503624028c06218c 1.0 1.0 1.0 0.0\n", + "346 5ea93292936cd30009379215 1.0 1.0 1.0 0.0" + ] + }, + "execution_count": 74, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "sessions[sessions['session11'] == 0]" ] }, { diff --git a/scripts/cov_preprocess.ipynb b/scripts/cov_preprocess.ipynb index 328c67b..7abba30 100755 --- a/scripts/cov_preprocess.ipynb +++ b/scripts/cov_preprocess.ipynb @@ -253,9 +253,9 @@ ], "metadata": { "kernelspec": { - "display_name": "IPy3.7kernel", + "display_name": "Python 3", "language": "python", - "name": "python3.7" + "name": "python3" }, "language_info": { "codemirror_mode": { @@ -267,7 +267,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.7.3" + "version": "3.7.4" }, "toc": { "base_numbering": 1, -- GitLab