{ "cells": [ { "cell_type": "code", "execution_count": 54, "id": "daa13044", "metadata": { "ExecuteTime": { "end_time": "2024-02-23T01:01:41.396867Z", "start_time": "2024-02-23T01:01:40.758392Z" }, "colab": { "base_uri": "https://localhost:8080/", "height": 614 }, "id": "daa13044", "outputId": "4d440aaa-1ee7-4771-c526-f55e9458ca8a" }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
TimestampWhat is your current class standing?Who do you live with?Do you currently live in a house, apartnment, or dorm?How many people live in your household?Do you currently work?How many hours do you work per week on average?Do you work on or off campus?Do you work in a department related to your major?Do you have roommates that are part of your major?
02/9/2024 20:12:14SeniorNeitherHouse6Yes5 - 10Off-campusNoNo
12/9/2024 20:16:34JuniorBothApartment4NoNaNNaNNaNYes
22/9/2024 20:18:55JuniorFriendsHouse4NoNaNNaNNaNNo
32/9/2024 20:24:00SeniorNeitherApartment1NoNaNNaNNoNo
42/9/2024 20:26:16GraduateNeitherApartment1Yes10 - 20Off-campusYesNo
.................................
2552/14/2024 19:46:28JuniorFriendsHouse5Yes10 - 20On-campusNoNo
2562/15/2024 0:28:38NaNFamilyApartmentNorth District 4 bed 2 bathNoNaNNaNNaNNo
2572/15/2024 8:33:45SeniorFamilyHouse9No1 - 5Off-campusNoNo
2582/15/2024 16:10:40SophomoreFamilyApartment4Yes5 - 10On-campusNoNo
2592/15/2024 16:14:11SophomoreFriendsDorm3 (room), 8 (hall), ~70 (building)NoNaNNaNNaNYes
\n", "

260 rows × 10 columns

\n", "
" ], "text/plain": [ " Timestamp What is your current class standing? \\\n", "0 2/9/2024 20:12:14 Senior \n", "1 2/9/2024 20:16:34 Junior \n", "2 2/9/2024 20:18:55 Junior \n", "3 2/9/2024 20:24:00 Senior \n", "4 2/9/2024 20:26:16 Graduate \n", ".. ... ... \n", "255 2/14/2024 19:46:28 Junior \n", "256 2/15/2024 0:28:38 NaN \n", "257 2/15/2024 8:33:45 Senior \n", "258 2/15/2024 16:10:40 Sophomore \n", "259 2/15/2024 16:14:11 Sophomore \n", "\n", " Who do you live with? \\\n", "0 Neither \n", "1 Both \n", "2 Friends \n", "3 Neither \n", "4 Neither \n", ".. ... \n", "255 Friends \n", "256 Family \n", "257 Family \n", "258 Family \n", "259 Friends \n", "\n", " Do you currently live in a house, apartnment, or dorm? \\\n", "0 House \n", "1 Apartment \n", "2 House \n", "3 Apartment \n", "4 Apartment \n", ".. ... \n", "255 House \n", "256 Apartment \n", "257 House \n", "258 Apartment \n", "259 Dorm \n", "\n", " How many people live in your household? Do you currently work? \\\n", "0 6 Yes \n", "1 4 No \n", "2 4 No \n", "3 1 No \n", "4 1 Yes \n", ".. ... ... \n", "255 5 Yes \n", "256 North District 4 bed 2 bath No \n", "257 9 No \n", "258 4 Yes \n", "259 3 (room), 8 (hall), ~70 (building) No \n", "\n", " How many hours do you work per week on average? \\\n", "0 5 - 10 \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 10 - 20 \n", ".. ... \n", "255 10 - 20 \n", "256 NaN \n", "257 1 - 5 \n", "258 5 - 10 \n", "259 NaN \n", "\n", " Do you work on or off campus? \\\n", "0 Off-campus \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 Off-campus \n", ".. ... \n", "255 On-campus \n", "256 NaN \n", "257 Off-campus \n", "258 On-campus \n", "259 NaN \n", "\n", " Do you work in a department related to your major? \\\n", "0 No \n", "1 NaN \n", "2 NaN \n", "3 No \n", "4 Yes \n", ".. ... \n", "255 No \n", "256 NaN \n", "257 No \n", "258 No \n", "259 NaN \n", "\n", " Do you have roommates that are part of your major? \n", "0 No \n", "1 Yes \n", "2 No \n", "3 No \n", "4 No \n", ".. ... 
\n", "255 No \n", "256 No \n", "257 No \n", "258 No \n", "259 Yes \n", "\n", "[260 rows x 10 columns]" ] }, "execution_count": 54, "metadata": {}, "output_type": "execute_result" } ], "source": [ "%matplotlib inline\n", "import numpy as np\n", "import pandas as pd\n", "\n", "# Positions in the raw CSV of the questions kept for this analysis.\n", "# In order they yield: Timestamp, class standing, who the student lives with,\n", "# housing type, household size, currently working?, weekly work hours,\n", "# on/off campus job, job related to major?, roommates in the same major?\n", "SURVEY_COLUMN_POSITIONS = [0, 2, 7, 8, 9, 58, 59, 60, 61, 26]\n", "\n", "# Load data.csv and keep only those columns, in the order listed above.\n", "df = pd.read_csv(\"data.csv\").iloc[:, SURVEY_COLUMN_POSITIONS]\n", "df" ] }, { "cell_type": "code", "execution_count": 55, "id": "29889175", "metadata": { "ExecuteTime": { "end_time": "2024-02-23T01:01:41.409516Z", "start_time": "2024-02-23T01:01:41.398267Z" }, "id": "29889175" }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
TimestampWhat is your current class standing?Who do you live with?Do you currently live in a house, apartnment, or dorm?How many people live in your household?Do you currently work?How many hours do you work per week on average?Do you work on or off campus?Do you work in a department related to your major?Do you have roommates that are part of your major?
02/9/2024 20:12:14SeniorNeitherHouse6Yes5 - 10Off-campusNoNo
12/9/2024 20:16:34JuniorBothApartment4No0NaNNaNYes
22/9/2024 20:18:55JuniorFriendsHouse4No0NaNNaNNo
32/9/2024 20:24:00SeniorNeitherApartment1No0NaNNaNNo
42/9/2024 20:26:16GraduateNeitherApartment1Yes10 - 20Off-campusYesNo
.................................
2552/14/2024 19:46:28JuniorFriendsHouse5Yes10 - 20On-campusNoNo
2562/15/2024 0:28:38NaNFamilyApartment4No0NaNNaNNo
2572/15/2024 8:33:45SeniorFamilyHouse9No0Off-campusNaNNo
2582/15/2024 16:10:40SophomoreFamilyApartment4Yes5 - 10On-campusNoNo
2592/15/2024 16:14:11SophomoreFriendsDorm3No0NaNNaNYes
\n", "

260 rows × 10 columns

\n", "
" ], "text/plain": [ " Timestamp What is your current class standing? \\\n", "0 2/9/2024 20:12:14 Senior \n", "1 2/9/2024 20:16:34 Junior \n", "2 2/9/2024 20:18:55 Junior \n", "3 2/9/2024 20:24:00 Senior \n", "4 2/9/2024 20:26:16 Graduate \n", ".. ... ... \n", "255 2/14/2024 19:46:28 Junior \n", "256 2/15/2024 0:28:38 NaN \n", "257 2/15/2024 8:33:45 Senior \n", "258 2/15/2024 16:10:40 Sophomore \n", "259 2/15/2024 16:14:11 Sophomore \n", "\n", " Who do you live with? \\\n", "0 Neither \n", "1 Both \n", "2 Friends \n", "3 Neither \n", "4 Neither \n", ".. ... \n", "255 Friends \n", "256 Family \n", "257 Family \n", "258 Family \n", "259 Friends \n", "\n", " Do you currently live in a house, apartnment, or dorm? \\\n", "0 House \n", "1 Apartment \n", "2 House \n", "3 Apartment \n", "4 Apartment \n", ".. ... \n", "255 House \n", "256 Apartment \n", "257 House \n", "258 Apartment \n", "259 Dorm \n", "\n", " How many people live in your household? Do you currently work? \\\n", "0 6 Yes \n", "1 4 No \n", "2 4 No \n", "3 1 No \n", "4 1 Yes \n", ".. ... ... \n", "255 5 Yes \n", "256 4 No \n", "257 9 No \n", "258 4 Yes \n", "259 3 No \n", "\n", " How many hours do you work per week on average? \\\n", "0 5 - 10 \n", "1 0 \n", "2 0 \n", "3 0 \n", "4 10 - 20 \n", ".. ... \n", "255 10 - 20 \n", "256 0 \n", "257 0 \n", "258 5 - 10 \n", "259 0 \n", "\n", " Do you work on or off campus? \\\n", "0 Off-campus \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 Off-campus \n", ".. ... \n", "255 On-campus \n", "256 NaN \n", "257 Off-campus \n", "258 On-campus \n", "259 NaN \n", "\n", " Do you work in a department related to your major? \\\n", "0 No \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 Yes \n", ".. ... \n", "255 No \n", "256 NaN \n", "257 NaN \n", "258 No \n", "259 NaN \n", "\n", " Do you have roommates that are part of your major? \n", "0 No \n", "1 Yes \n", "2 No \n", "3 No \n", "4 No \n", ".. ... 
\n", "255 No \n", "256 No \n", "257 No \n", "258 No \n", "259 Yes \n", "\n", "[260 rows x 10 columns]" ] }, "execution_count": 55, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Free-text household answers mapped to the head-count they are read as.\n", "household_col = 'How many people live in your household?'\n", "household_fixes = {\n", "    '4 in total': '4',\n", "    '4 (Including me)': '4',\n", "    'at school 4 including me ': '4',\n", "    '3 excluding me': '4',\n", "    '5 including me': '5',\n", "    'North District 4 bed 2 bath': '4',\n", "    '3 (room), 8 (hall), ~70 (building)': '3',\n", "}\n", "# Missing answers become 0 so the whole column can be cast to int.\n", "df[household_col] = df[household_col].fillna(0).replace(household_fixes).astype(int)\n", "\n", "# Collapse the multi-select spellings of living with family and friends into 'Both'.\n", "living_col = 'Who do you live with? '\n", "df[living_col] = df[living_col].replace({'Family, Friends': 'Both', 'Family, Friends, Both': 'Both'})\n", "\n", "# Respondents who answered 'No' to working: zero weekly hours and no job/major relation.\n", "not_working = df['Do you currently work?'] == 'No'\n", "df.loc[not_working, 'How many hours do you work per week on average?'] = 0\n", "df.loc[not_working, 'Do you work in a department related to your major?'] = np.nan\n", "# NOTE(review): 'Do you work on or off campus?' is not cleared for these rows, so a\n", "# non-working respondent can keep a value there (see row 257 in the output) - confirm intended.\n", "df" ] }, { "cell_type": "code", "execution_count": 56, "id": "de4448fd64205d85", "metadata": { "ExecuteTime": { "end_time": "2024-02-23T01:01:41.418974Z", "start_time": "2024-02-23T01:01:41.410787Z" }, "collapsed": false }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
TimestampWhat is your current class standing?Who do you live with?Do you currently live in a house, apartnment, or dorm?How many people live in your household?Do you currently work?How many hours do you work per week on average?Do you work on or off campus?Do you work in a department related to your major?Do you have roommates that are part of your major?
02/9/2024 20:12:14SeniorNeitherHouse6Yes5 - 10Off-campusNoNo
42/9/2024 20:26:16GraduateNeitherApartment1Yes10 - 20Off-campusYesNo
82/9/2024 22:02:49JuniorFriendsHouse6Yes10 - 20On-campusNoNo
92/9/2024 22:08:43SeniorFamilyHouse5Yes1 - 5On-campusNoNo
132/9/2024 22:15:13JuniorFamilyApartment4Yes10 - 20Off-campusNoNo
.................................
2462/13/2024 19:37:02GraduateFamilyHouse2Yes10 - 20On-campusYesNo
2472/13/2024 21:39:14SeniorFriendsApartment3Yes20 - 40Off-campusNoYes
2522/14/2024 9:48:12JuniorFamilyHouse5Yes20 - 40Off-campusNoNo
2552/14/2024 19:46:28JuniorFriendsHouse5Yes10 - 20On-campusNoNo
2582/15/2024 16:10:40SophomoreFamilyApartment4Yes5 - 10On-campusNoNo
\n", "

77 rows × 10 columns

\n", "
" ], "text/plain": [ " Timestamp What is your current class standing? \\\n", "0 2/9/2024 20:12:14 Senior \n", "4 2/9/2024 20:26:16 Graduate \n", "8 2/9/2024 22:02:49 Junior \n", "9 2/9/2024 22:08:43 Senior \n", "13 2/9/2024 22:15:13 Junior \n", ".. ... ... \n", "246 2/13/2024 19:37:02 Graduate \n", "247 2/13/2024 21:39:14 Senior \n", "252 2/14/2024 9:48:12 Junior \n", "255 2/14/2024 19:46:28 Junior \n", "258 2/15/2024 16:10:40 Sophomore \n", "\n", " Who do you live with? \\\n", "0 Neither \n", "4 Neither \n", "8 Friends \n", "9 Family \n", "13 Family \n", ".. ... \n", "246 Family \n", "247 Friends \n", "252 Family \n", "255 Friends \n", "258 Family \n", "\n", " Do you currently live in a house, apartnment, or dorm? \\\n", "0 House \n", "4 Apartment \n", "8 House \n", "9 House \n", "13 Apartment \n", ".. ... \n", "246 House \n", "247 Apartment \n", "252 House \n", "255 House \n", "258 Apartment \n", "\n", " How many people live in your household? Do you currently work? \\\n", "0 6 Yes \n", "4 1 Yes \n", "8 6 Yes \n", "9 5 Yes \n", "13 4 Yes \n", ".. ... ... \n", "246 2 Yes \n", "247 3 Yes \n", "252 5 Yes \n", "255 5 Yes \n", "258 4 Yes \n", "\n", " How many hours do you work per week on average? \\\n", "0 5 - 10 \n", "4 10 - 20 \n", "8 10 - 20 \n", "9 1 - 5 \n", "13 10 - 20 \n", ".. ... \n", "246 10 - 20 \n", "247 20 - 40 \n", "252 20 - 40 \n", "255 10 - 20 \n", "258 5 - 10 \n", "\n", " Do you work on or off campus? \\\n", "0 Off-campus \n", "4 Off-campus \n", "8 On-campus \n", "9 On-campus \n", "13 Off-campus \n", ".. ... \n", "246 On-campus \n", "247 Off-campus \n", "252 Off-campus \n", "255 On-campus \n", "258 On-campus \n", "\n", " Do you work in a department related to your major? \\\n", "0 No \n", "4 Yes \n", "8 No \n", "9 No \n", "13 No \n", ".. ... \n", "246 Yes \n", "247 No \n", "252 No \n", "255 No \n", "258 No \n", "\n", " Do you have roommates that are part of your major? \n", "0 No \n", "4 No \n", "8 No \n", "9 No \n", "13 No \n", ".. ... 
\n", "246 No \n", "247 Yes \n", "252 No \n", "255 No \n", "258 No \n", "\n", "[77 rows x 10 columns]" ] }, "execution_count": 56, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Split respondents by their answer to the employment question.\n", "employment = df['Do you currently work?']\n", "w_df = df[employment.eq('Yes')]   # working DataFrame\n", "nw_df = df[employment.eq('No')]   # not working DataFrame\n", "# NOTE(review): the stored outputs show 77 working + 176 not working out of 260 rows,\n", "# so a few rows match neither answer and land in neither frame - confirm intended.\n", "w_df" ] }, { "cell_type": "code", "execution_count": 57, "id": "5fe8ec7f22878e60", "metadata": { "ExecuteTime": { "end_time": "2024-02-23T01:01:41.427847Z", "start_time": "2024-02-23T01:01:41.419852Z" }, "collapsed": false }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
TimestampWhat is your current class standing?Who do you live with?Do you currently live in a house, apartnment, or dorm?How many people live in your household?Do you currently work?How many hours do you work per week on average?Do you work on or off campus?Do you work in a department related to your major?Do you have roommates that are part of your major?
12/9/2024 20:16:34JuniorBothApartment4No0NaNNaNYes
22/9/2024 20:18:55JuniorFriendsHouse4No0NaNNaNNo
32/9/2024 20:24:00SeniorNeitherApartment1No0NaNNaNNo
52/9/2024 20:45:09JuniorBothApartment4No0NaNNaNNo
62/9/2024 21:55:59SophomoreFriendsApartment4No0NaNNaNNo
.................................
2532/14/2024 13:45:45SeniorFamilyHouse6No0NaNNaNNo
2542/14/2024 16:26:06JuniorFamilyHouse5No0NaNNaNYes
2562/15/2024 0:28:38NaNFamilyApartment4No0NaNNaNNo
2572/15/2024 8:33:45SeniorFamilyHouse9No0Off-campusNaNNo
2592/15/2024 16:14:11SophomoreFriendsDorm3No0NaNNaNYes
\n", "

176 rows × 10 columns

\n", "
" ], "text/plain": [ " Timestamp What is your current class standing? \\\n", "1 2/9/2024 20:16:34 Junior \n", "2 2/9/2024 20:18:55 Junior \n", "3 2/9/2024 20:24:00 Senior \n", "5 2/9/2024 20:45:09 Junior \n", "6 2/9/2024 21:55:59 Sophomore \n", ".. ... ... \n", "253 2/14/2024 13:45:45 Senior \n", "254 2/14/2024 16:26:06 Junior \n", "256 2/15/2024 0:28:38 NaN \n", "257 2/15/2024 8:33:45 Senior \n", "259 2/15/2024 16:14:11 Sophomore \n", "\n", " Who do you live with? \\\n", "1 Both \n", "2 Friends \n", "3 Neither \n", "5 Both \n", "6 Friends \n", ".. ... \n", "253 Family \n", "254 Family \n", "256 Family \n", "257 Family \n", "259 Friends \n", "\n", " Do you currently live in a house, apartnment, or dorm? \\\n", "1 Apartment \n", "2 House \n", "3 Apartment \n", "5 Apartment \n", "6 Apartment \n", ".. ... \n", "253 House \n", "254 House \n", "256 Apartment \n", "257 House \n", "259 Dorm \n", "\n", " How many people live in your household? Do you currently work? \\\n", "1 4 No \n", "2 4 No \n", "3 1 No \n", "5 4 No \n", "6 4 No \n", ".. ... ... \n", "253 6 No \n", "254 5 No \n", "256 4 No \n", "257 9 No \n", "259 3 No \n", "\n", " How many hours do you work per week on average? \\\n", "1 0 \n", "2 0 \n", "3 0 \n", "5 0 \n", "6 0 \n", ".. ... \n", "253 0 \n", "254 0 \n", "256 0 \n", "257 0 \n", "259 0 \n", "\n", " Do you work on or off campus? \\\n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "5 NaN \n", "6 NaN \n", ".. ... \n", "253 NaN \n", "254 NaN \n", "256 NaN \n", "257 Off-campus \n", "259 NaN \n", "\n", " Do you work in a department related to your major? \\\n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "5 NaN \n", "6 NaN \n", ".. ... \n", "253 NaN \n", "254 NaN \n", "256 NaN \n", "257 NaN \n", "259 NaN \n", "\n", " Do you have roommates that are part of your major? \n", "1 Yes \n", "2 No \n", "3 No \n", "5 No \n", "6 No \n", ".. ... 
\n", "253 No \n", "254 Yes \n", "256 No \n", "257 No \n", "259 Yes \n", "\n", "[176 rows x 10 columns]" ] }, "execution_count": 57, "metadata": {}, "output_type": "execute_result" } ], "source": [ "nw_df" ] }, { "cell_type": "markdown", "id": "899d85626b77db20", "metadata": { "collapsed": false }, "source": [ "
\n", "

CS105 Project

\n", "

Ali Naqvi, ...

\n", "

Topic: Does who a student is living with affect whether and how they work jobs?

\n", "
\n" ] }, { "cell_type": "code", "execution_count": 58, "id": "bfa40c9e9693481d", "metadata": { "ExecuteTime": { "end_time": "2024-02-23T01:01:41.526696Z", "start_time": "2024-02-23T01:01:41.430135Z" }, "collapsed": false }, "outputs": [ { "data": { "image/png": "", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "import matplotlib.pyplot as plt\n", "\n", "# Count how many respondents answered each option of the employment question\n", "# (value_counts() leaves out missing answers).\n", "work_counts = df['Do you currently work?'].value_counts()\n", "\n", "# Pie chart of the share of respondents per answer\n", "plt.figure(figsize=(8, 8))\n", "plt.pie(work_counts, labels=work_counts.index, autopct='%1.1f%%', startangle=90, colors=['lightblue', 'lightcoral'])\n", "plt.title('Distribution of People Who Work and Don\\'t Work')\n", "plt.show()\n" ] }, { "cell_type": "code", "execution_count": 65, "id": "9c830283e9b26466", "metadata": { "ExecuteTime": { "end_time": "2024-02-23T01:01:41.532148Z", "start_time": "2024-02-23T01:01:41.528825Z" }, "collapsed": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Do you have roommates that are part of your major? No Yes Total\n", "Do you currently live in a house, apartnment, o... \n", "Apartment 83 44 127\n", "Dorm 17 11 28\n", "House 77 21 98\n", "Room 1 0 1\n", "house (renting) 1 0 1\n", "Total 179 76 255\n" ] } ], "source": [ "# Contingency table: housing type (column position 3) by roommates in the same\n", "# major (column position 9), with a 'Total' margin row and column appended.\n", "roommates_major_table = pd.crosstab(df.iloc[:, 3], df.iloc[:, 9], margins=True, margins_name='Total')\n", "\n", "# Print the table\n", "print(roommates_major_table)\n" ] }, { "cell_type": "code", "execution_count": 66, "id": "aef1e802", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Chi-squared Value: 6.761293513057266\n", "Degrees of Freedom: 4\n" ] } ], "source": [ "# Pearson chi-squared statistic for independence between housing type and\n", "# having roommates in the same major, computed from the crosstab above.\n", "\n", "# Observed counts: drop the 'Total' margin row and column\n", "observed_values = roommates_major_table.iloc[:-1, :-1].values\n", "\n", "# Expected counts under independence: (row total * column total) / grand total\n", "row_totals = roommates_major_table.iloc[:-1, -1].values\n", "col_totals = roommates_major_table.iloc[-1, :-1].values\n", "total = np.sum(row_totals)\n", "\n", "expected_values = np.outer(row_totals, col_totals) / total\n", "\n", "# Chi-squared statistic: sum over all cells of (observed - expected)^2 / expected\n", "chi2_statistic = np.sum((observed_values - expected_values)**2 / expected_values)\n", "\n", "# Degrees of freedom = (rows - 1) * (columns - 1) of the observed table.\n", "# Take the shape from observed_values, not roommates_major_table: the latter still\n", "# carries the 'Total' margin row and column, which would inflate the result.\n", "n_rows, n_cols = observed_values.shape\n", "degrees_of_freedom = (n_rows - 1) * (n_cols - 1)\n", "\n", "# NOTE(review): the 'Room' and 'house (renting)' rows hold a single response each, so their\n", "# expected counts are well below 5 - consider merging them into other categories before relying on this test.\n", "\n", "# Print results\n", "print(f\"Chi-squared Value: {chi2_statistic}\\nDegrees of Freedom: {degrees_of_freedom}\")\n" ] } ], "metadata": { "colab": { "provenance": [] }, "kernelspec": { "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.11.5" } }, "nbformat": 4, "nbformat_minor": 5 }