diff options
Diffstat (limited to '')
-rw-r--r-- | CS105MiniProject.ipynb | 51 |
1 files changed, 39 insertions, 12 deletions
diff --git a/CS105MiniProject.ipynb b/CS105MiniProject.ipynb index c141cf1..2e6ac77 100644 --- a/CS105MiniProject.ipynb +++ b/CS105MiniProject.ipynb @@ -12,8 +12,8 @@ "id": "daa13044", "outputId": "4d440aaa-1ee7-4771-c526-f55e9458ca8a", "ExecuteTime": { - "end_time": "2024-02-16T01:21:49.702719Z", - "start_time": "2024-02-16T01:21:48.928305Z" + "end_time": "2024-02-16T01:29:14.937392Z", + "start_time": "2024-02-16T01:29:14.276865Z" } }, "outputs": [ @@ -44,15 +44,15 @@ "metadata": { "id": "29889175", "ExecuteTime": { - "end_time": "2024-02-16T01:21:49.714653Z", - "start_time": "2024-02-16T01:21:49.704177Z" + "end_time": "2024-02-16T01:29:14.950257Z", + "start_time": "2024-02-16T01:29:14.938720Z" } }, "outputs": [ { "data": { - "text/plain": " Timestamp What is your current class standing? \\\n0 2/9/2024 20:12:14 Senior \n1 2/9/2024 20:16:34 Junior \n2 2/9/2024 20:18:55 Junior \n3 2/9/2024 20:24:00 Senior \n4 2/9/2024 20:26:16 Graduate \n.. ... ... \n255 2/14/2024 19:46:28 Junior \n256 2/15/2024 0:28:38 NaN \n257 2/15/2024 8:33:45 Senior \n258 2/15/2024 16:10:40 Sophomore \n259 2/15/2024 16:14:11 Sophomore \n\n What gender do you identify as? Who do you live with? \\\n0 Male Neither \n1 Female Both \n2 Female Friends \n3 Male Neither \n4 Male Neither \n.. ... ... \n255 Male Friends \n256 Male Family \n257 Male Family \n258 Female Family \n259 Female Friends \n\n Do you currently live in a house, apartnment, or dorm? \\\n0 House \n1 Apartment \n2 House \n3 Apartment \n4 Apartment \n.. ... \n255 House \n256 Apartment \n257 House \n258 Apartment \n259 Dorm \n\n How many people live in your household? Do you currently work? \\\n0 6 Yes \n1 4 No \n2 4 No \n3 1 No \n4 1 Yes \n.. ... ... \n255 5 Yes \n256 4 No \n257 9 No \n258 4 Yes \n259 3 No \n\n How many hours do you work per week on average? \\\n0 5 - 10 \n1 0 \n2 0 \n3 0 \n4 10 - 20 \n.. ... \n255 10 - 20 \n256 0 \n257 0 \n258 5 - 10 \n259 0 \n\n Do you work on or off campus? \\\n0 Off-campus \n1 NaN \n2 NaN \n3 NaN \n4 Off-campus \n.. ... \n255 On-campus \n256 NaN \n257 Off-campus \n258 On-campus \n259 NaN \n\n Do you work in a department related to your major? \\\n0 No \n1 NaN \n2 NaN \n3 No \n4 Yes \n.. ... \n255 No \n256 NaN \n257 No \n258 No \n259 NaN \n\n Do you have roommates that are part of your major? \n0 No \n1 Yes \n2 No \n3 No \n4 No \n.. ... \n255 No \n256 No \n257 No \n258 No \n259 Yes \n\n[260 rows x 11 columns]", - "text/html": "<div>\n<style scoped>\n .dataframe tbody tr th:only-of-type {\n vertical-align: middle;\n }\n\n .dataframe tbody tr th {\n vertical-align: top;\n }\n\n .dataframe thead th {\n text-align: right;\n }\n</style>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>Timestamp</th>\n <th>What is your current class standing?</th>\n <th>What gender do you identify as?</th>\n <th>Who do you live with?</th>\n <th>Do you currently live in a house, apartnment, or dorm?</th>\n <th>How many people live in your household?</th>\n <th>Do you currently work?</th>\n <th>How many hours do you work per week on average?</th>\n <th>Do you work on or off campus?</th>\n <th>Do you work in a department related to your major?</th>\n <th>Do you have roommates that are part of your major?</th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>0</th>\n <td>2/9/2024 20:12:14</td>\n <td>Senior</td>\n <td>Male</td>\n <td>Neither</td>\n <td>House</td>\n <td>6</td>\n <td>Yes</td>\n <td>5 - 10</td>\n <td>Off-campus</td>\n <td>No</td>\n <td>No</td>\n </tr>\n <tr>\n <th>1</th>\n <td>2/9/2024 20:16:34</td>\n <td>Junior</td>\n <td>Female</td>\n <td>Both</td>\n <td>Apartment</td>\n <td>4</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>Yes</td>\n </tr>\n <tr>\n <th>2</th>\n <td>2/9/2024 20:18:55</td>\n <td>Junior</td>\n <td>Female</td>\n <td>Friends</td>\n <td>House</td>\n <td>4</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>3</th>\n <td>2/9/2024 20:24:00</td>\n <td>Senior</td>\n <td>Male</td>\n <td>Neither</td>\n <td>Apartment</td>\n <td>1</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>No</td>\n <td>No</td>\n </tr>\n <tr>\n <th>4</th>\n <td>2/9/2024 20:26:16</td>\n <td>Graduate</td>\n <td>Male</td>\n <td>Neither</td>\n <td>Apartment</td>\n <td>1</td>\n <td>Yes</td>\n <td>10 - 20</td>\n <td>Off-campus</td>\n <td>Yes</td>\n <td>No</td>\n </tr>\n <tr>\n <th>...</th>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n </tr>\n <tr>\n <th>255</th>\n <td>2/14/2024 19:46:28</td>\n <td>Junior</td>\n <td>Male</td>\n <td>Friends</td>\n <td>House</td>\n <td>5</td>\n <td>Yes</td>\n <td>10 - 20</td>\n <td>On-campus</td>\n <td>No</td>\n <td>No</td>\n </tr>\n <tr>\n <th>256</th>\n <td>2/15/2024 0:28:38</td>\n <td>NaN</td>\n <td>Male</td>\n <td>Family</td>\n <td>Apartment</td>\n <td>4</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>257</th>\n <td>2/15/2024 8:33:45</td>\n <td>Senior</td>\n <td>Male</td>\n <td>Family</td>\n <td>House</td>\n <td>9</td>\n <td>No</td>\n <td>0</td>\n <td>Off-campus</td>\n <td>No</td>\n <td>No</td>\n </tr>\n <tr>\n <th>258</th>\n <td>2/15/2024 16:10:40</td>\n <td>Sophomore</td>\n <td>Female</td>\n <td>Family</td>\n <td>Apartment</td>\n <td>4</td>\n <td>Yes</td>\n <td>5 - 10</td>\n <td>On-campus</td>\n <td>No</td>\n <td>No</td>\n </tr>\n <tr>\n <th>259</th>\n <td>2/15/2024 16:14:11</td>\n <td>Sophomore</td>\n <td>Female</td>\n <td>Friends</td>\n <td>Dorm</td>\n <td>3</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>Yes</td>\n </tr>\n </tbody>\n</table>\n<p>260 rows × 11 columns</p>\n</div>" + "text/plain": " Timestamp What is your current class standing? \\\n0 2/9/2024 20:12:14 Senior \n1 2/9/2024 20:16:34 Junior \n2 2/9/2024 20:18:55 Junior \n3 2/9/2024 20:24:00 Senior \n4 2/9/2024 20:26:16 Graduate \n.. ... ... \n255 2/14/2024 19:46:28 Junior \n256 2/15/2024 0:28:38 NaN \n257 2/15/2024 8:33:45 Senior \n258 2/15/2024 16:10:40 Sophomore \n259 2/15/2024 16:14:11 Sophomore \n\n What gender do you identify as? Who do you live with? \\\n0 Male Neither \n1 Female Both \n2 Female Friends \n3 Male Neither \n4 Male Neither \n.. ... ... \n255 Male Friends \n256 Male Family \n257 Male Family \n258 Female Family \n259 Female Friends \n\n Do you currently live in a house, apartnment, or dorm? \\\n0 House \n1 Apartment \n2 House \n3 Apartment \n4 Apartment \n.. ... \n255 House \n256 Apartment \n257 House \n258 Apartment \n259 Dorm \n\n How many people live in your household? Do you currently work? \\\n0 6 Yes \n1 4 No \n2 4 No \n3 1 No \n4 1 Yes \n.. ... ... \n255 5 Yes \n256 4 No \n257 9 No \n258 4 Yes \n259 3 No \n\n How many hours do you work per week on average? \\\n0 5 - 10 \n1 0 \n2 0 \n3 0 \n4 10 - 20 \n.. ... \n255 10 - 20 \n256 0 \n257 0 \n258 5 - 10 \n259 0 \n\n Do you work on or off campus? \\\n0 Off-campus \n1 NaN \n2 NaN \n3 NaN \n4 Off-campus \n.. ... \n255 On-campus \n256 NaN \n257 Off-campus \n258 On-campus \n259 NaN \n\n Do you work in a department related to your major? \\\n0 No \n1 NaN \n2 NaN \n3 NaN \n4 Yes \n.. ... \n255 No \n256 NaN \n257 NaN \n258 No \n259 NaN \n\n Do you have roommates that are part of your major? \n0 No \n1 Yes \n2 No \n3 No \n4 No \n.. ... \n255 No \n256 No \n257 No \n258 No \n259 Yes \n\n[260 rows x 11 columns]", + "text/html": "<div>\n<style scoped>\n .dataframe tbody tr th:only-of-type {\n vertical-align: middle;\n }\n\n .dataframe tbody tr th {\n vertical-align: top;\n }\n\n .dataframe thead th {\n text-align: right;\n }\n</style>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>Timestamp</th>\n <th>What is your current class standing?</th>\n <th>What gender do you identify as?</th>\n <th>Who do you live with?</th>\n <th>Do you currently live in a house, apartnment, or dorm?</th>\n <th>How many people live in your household?</th>\n <th>Do you currently work?</th>\n <th>How many hours do you work per week on average?</th>\n <th>Do you work on or off campus?</th>\n <th>Do you work in a department related to your major?</th>\n <th>Do you have roommates that are part of your major?</th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>0</th>\n <td>2/9/2024 20:12:14</td>\n <td>Senior</td>\n <td>Male</td>\n <td>Neither</td>\n <td>House</td>\n <td>6</td>\n <td>Yes</td>\n <td>5 - 10</td>\n <td>Off-campus</td>\n <td>No</td>\n <td>No</td>\n </tr>\n <tr>\n <th>1</th>\n <td>2/9/2024 20:16:34</td>\n <td>Junior</td>\n <td>Female</td>\n <td>Both</td>\n <td>Apartment</td>\n <td>4</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>Yes</td>\n </tr>\n <tr>\n <th>2</th>\n <td>2/9/2024 20:18:55</td>\n <td>Junior</td>\n <td>Female</td>\n <td>Friends</td>\n <td>House</td>\n <td>4</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>3</th>\n <td>2/9/2024 20:24:00</td>\n <td>Senior</td>\n <td>Male</td>\n <td>Neither</td>\n <td>Apartment</td>\n <td>1</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>4</th>\n <td>2/9/2024 20:26:16</td>\n <td>Graduate</td>\n <td>Male</td>\n <td>Neither</td>\n <td>Apartment</td>\n <td>1</td>\n <td>Yes</td>\n <td>10 - 20</td>\n <td>Off-campus</td>\n <td>Yes</td>\n <td>No</td>\n </tr>\n <tr>\n <th>...</th>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n </tr>\n <tr>\n <th>255</th>\n <td>2/14/2024 19:46:28</td>\n <td>Junior</td>\n <td>Male</td>\n <td>Friends</td>\n <td>House</td>\n <td>5</td>\n <td>Yes</td>\n <td>10 - 20</td>\n <td>On-campus</td>\n <td>No</td>\n <td>No</td>\n </tr>\n <tr>\n <th>256</th>\n <td>2/15/2024 0:28:38</td>\n <td>NaN</td>\n <td>Male</td>\n <td>Family</td>\n <td>Apartment</td>\n <td>4</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>257</th>\n <td>2/15/2024 8:33:45</td>\n <td>Senior</td>\n <td>Male</td>\n <td>Family</td>\n <td>House</td>\n <td>9</td>\n <td>No</td>\n <td>0</td>\n <td>Off-campus</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>258</th>\n <td>2/15/2024 16:10:40</td>\n <td>Sophomore</td>\n <td>Female</td>\n <td>Family</td>\n <td>Apartment</td>\n <td>4</td>\n <td>Yes</td>\n <td>5 - 10</td>\n <td>On-campus</td>\n <td>No</td>\n <td>No</td>\n </tr>\n <tr>\n <th>259</th>\n <td>2/15/2024 16:14:11</td>\n <td>Sophomore</td>\n <td>Female</td>\n <td>Friends</td>\n <td>Dorm</td>\n <td>3</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>Yes</td>\n </tr>\n </tbody>\n</table>\n<p>260 rows × 11 columns</p>\n</div>" }, "execution_count": 2, "metadata": {}, @@ -72,6 +72,7 @@ " .astype(int))\n", "df.loc[df['Do you currently work?'] == 'No', 'How many hours do you work per week on average?'] = 0\n", "df['Who do you live with? '] = df['Who do you live with? '].replace('Family, Friends', 'Both').replace('Family, Friends, Both', 'Both')\n", + "df.loc[df['Do you currently work?'] == 'No', 'Do you work in a department related to your major?'] = np.nan\n", "df" ] }, @@ -82,8 +83,8 @@ "metadata": { "collapsed": false, "ExecuteTime": { - "end_time": "2024-02-16T01:21:49.723810Z", - "start_time": "2024-02-16T01:21:49.715485Z" + "end_time": "2024-02-16T01:29:14.960720Z", + "start_time": "2024-02-16T01:29:14.951Z" } }, "outputs": [ @@ -107,17 +108,43 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 4, "id": "a9df972e44277de7", "metadata": { "collapsed": false, "ExecuteTime": { - "end_time": "2024-02-16T01:21:49.726718Z", - "start_time": "2024-02-16T01:21:49.724916Z" + "end_time": "2024-02-16T01:29:14.970741Z", + "start_time": "2024-02-16T01:29:14.962311Z" } }, + "outputs": [ + { + "data": { + "text/plain": " Timestamp What is your current class standing? \\\n1 2/9/2024 20:16:34 Junior \n2 2/9/2024 20:18:55 Junior \n3 2/9/2024 20:24:00 Senior \n5 2/9/2024 20:45:09 Junior \n6 2/9/2024 21:55:59 Sophomore \n.. ... ... \n253 2/14/2024 13:45:45 Senior \n254 2/14/2024 16:26:06 Junior \n256 2/15/2024 0:28:38 NaN \n257 2/15/2024 8:33:45 Senior \n259 2/15/2024 16:14:11 Sophomore \n\n What gender do you identify as? Who do you live with? \\\n1 Female Both \n2 Female Friends \n3 Male Neither \n5 Prefer not to say Both \n6 Female Friends \n.. ... ... \n253 Female Family \n254 Male Family \n256 Male Family \n257 Male Family \n259 Female Friends \n\n Do you currently live in a house, apartnment, or dorm? \\\n1 Apartment \n2 House \n3 Apartment \n5 Apartment \n6 Apartment \n.. ... \n253 House \n254 House \n256 Apartment \n257 House \n259 Dorm \n\n How many people live in your household? Do you currently work? \\\n1 4 No \n2 4 No \n3 1 No \n5 4 No \n6 4 No \n.. ... ... \n253 6 No \n254 5 No \n256 4 No \n257 9 No \n259 3 No \n\n How many hours do you work per week on average? \\\n1 0 \n2 0 \n3 0 \n5 0 \n6 0 \n.. ... \n253 0 \n254 0 \n256 0 \n257 0 \n259 0 \n\n Do you work on or off campus? \\\n1 NaN \n2 NaN \n3 NaN \n5 NaN \n6 NaN \n.. ... \n253 NaN \n254 NaN \n256 NaN \n257 Off-campus \n259 NaN \n\n Do you work in a department related to your major? \\\n1 NaN \n2 NaN \n3 NaN \n5 NaN \n6 NaN \n.. ... \n253 NaN \n254 NaN \n256 NaN \n257 NaN \n259 NaN \n\n Do you have roommates that are part of your major? \n1 Yes \n2 No \n3 No \n5 No \n6 No \n.. ... \n253 No \n254 Yes \n256 No \n257 No \n259 Yes \n\n[176 rows x 11 columns]", + "text/html": "<div>\n<style scoped>\n .dataframe tbody tr th:only-of-type {\n vertical-align: middle;\n }\n\n .dataframe tbody tr th {\n vertical-align: top;\n }\n\n .dataframe thead th {\n text-align: right;\n }\n</style>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>Timestamp</th>\n <th>What is your current class standing?</th>\n <th>What gender do you identify as?</th>\n <th>Who do you live with?</th>\n <th>Do you currently live in a house, apartnment, or dorm?</th>\n <th>How many people live in your household?</th>\n <th>Do you currently work?</th>\n <th>How many hours do you work per week on average?</th>\n <th>Do you work on or off campus?</th>\n <th>Do you work in a department related to your major?</th>\n <th>Do you have roommates that are part of your major?</th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>1</th>\n <td>2/9/2024 20:16:34</td>\n <td>Junior</td>\n <td>Female</td>\n <td>Both</td>\n <td>Apartment</td>\n <td>4</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>Yes</td>\n </tr>\n <tr>\n <th>2</th>\n <td>2/9/2024 20:18:55</td>\n <td>Junior</td>\n <td>Female</td>\n <td>Friends</td>\n <td>House</td>\n <td>4</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>3</th>\n <td>2/9/2024 20:24:00</td>\n <td>Senior</td>\n <td>Male</td>\n <td>Neither</td>\n <td>Apartment</td>\n <td>1</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>5</th>\n <td>2/9/2024 20:45:09</td>\n <td>Junior</td>\n <td>Prefer not to say</td>\n <td>Both</td>\n <td>Apartment</td>\n <td>4</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>6</th>\n <td>2/9/2024 21:55:59</td>\n <td>Sophomore</td>\n <td>Female</td>\n <td>Friends</td>\n <td>Apartment</td>\n <td>4</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>...</th>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n <td>...</td>\n </tr>\n <tr>\n <th>253</th>\n <td>2/14/2024 13:45:45</td>\n <td>Senior</td>\n <td>Female</td>\n <td>Family</td>\n <td>House</td>\n <td>6</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>254</th>\n <td>2/14/2024 16:26:06</td>\n <td>Junior</td>\n <td>Male</td>\n <td>Family</td>\n <td>House</td>\n <td>5</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>Yes</td>\n </tr>\n <tr>\n <th>256</th>\n <td>2/15/2024 0:28:38</td>\n <td>NaN</td>\n <td>Male</td>\n <td>Family</td>\n <td>Apartment</td>\n <td>4</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>257</th>\n <td>2/15/2024 8:33:45</td>\n <td>Senior</td>\n <td>Male</td>\n <td>Family</td>\n <td>House</td>\n <td>9</td>\n <td>No</td>\n <td>0</td>\n <td>Off-campus</td>\n <td>NaN</td>\n <td>No</td>\n </tr>\n <tr>\n <th>259</th>\n <td>2/15/2024 16:14:11</td>\n <td>Sophomore</td>\n <td>Female</td>\n <td>Friends</td>\n <td>Dorm</td>\n <td>3</td>\n <td>No</td>\n <td>0</td>\n <td>NaN</td>\n <td>NaN</td>\n <td>Yes</td>\n </tr>\n </tbody>\n</table>\n<p>176 rows × 11 columns</p>\n</div>" + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "nw_df" + ] + }, + { + "cell_type": "code", "outputs": [], - "source": [] + "source": [], + "metadata": { + "collapsed": false, + "ExecuteTime": { + "end_time": "2024-02-16T01:29:14.974486Z", + "start_time": "2024-02-16T01:29:14.972680Z" + } + }, + "id": "bfa40c9e9693481d", + "execution_count": 4 } ], "metadata": { |