aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorGravatar ENathanLe <Nath.wessix@gmail.com> 2024-02-23 23:49:33 -0800
committerGravatar ENathanLe <Nath.wessix@gmail.com> 2024-02-23 23:49:33 -0800
commitf0ea11e112c327feca46b4d698a0b705cc80b7d6 (patch)
tree1a7bea412ca76388064103552879eead3f36f42f
parent8fb7d6e9d440808c221cab1008941693916a4fa2 (diff)
parent3433f80cc0fa340630fe5df03befa3df8494a9b2 (diff)
downloadCS105MiniProject-f0ea11e112c327feca46b4d698a0b705cc80b7d6.tar.gz
CS105MiniProject-f0ea11e112c327feca46b4d698a0b705cc80b7d6.tar.zst
CS105MiniProject-f0ea11e112c327feca46b4d698a0b705cc80b7d6.zip
Merge branch 'main' into nlee097_minorfix
# Conflicts: # CS105MiniProject.ipynb
-rw-r--r--CS105MiniProject.ipynb97
1 files changed, 69 insertions, 28 deletions
diff --git a/CS105MiniProject.ipynb b/CS105MiniProject.ipynb
index fca6629..6fb14c0 100644
--- a/CS105MiniProject.ipynb
+++ b/CS105MiniProject.ipynb
@@ -579,38 +579,16 @@
},
{
"cell_type": "code",
- "outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "mean internships: 31.161538461538463\n",
- "median internships: 2.0\n"
- ]
- },
- {
- "data": {
- "text/plain": "<Figure size 640x480 with 1 Axes>",
- "image/png": ""
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
+ "outputs": [],
"source": [
"print(\"mean internships: \", df[\"How many internship/job applications have you sent out so far?\"].mean())\n",
"print(\"median internships: \", df[\"How many internship/job applications have you sent out so far?\"].median())\n",
"_ = sns.violinplot(x=df[\"How many internship/job applications have you sent out so far?\"])"
],
"metadata": {
- "collapsed": false,
- "ExecuteTime": {
- "end_time": "2024-02-24T07:45:31.407456Z",
- "start_time": "2024-02-24T07:45:30.996717Z"
- }
+ "collapsed": false
},
- "id": "350d4fef50f55e38",
- "execution_count": 110
+ "id": "8b82459b823370cd"
},
{
"cell_type": "markdown",
@@ -621,7 +599,7 @@
"metadata": {
"collapsed": false
},
- "id": "a3f2976fd30ca299"
+ "id": "c16acfb6f409d15e"
},
{
"cell_type": "markdown",
@@ -636,6 +614,69 @@
{
"cell_type": "markdown",
"source": [
+ "### Hypothesis 1: There is a relationship between whether people live with family, friends, or neither and whether or not they work.\n",
+ "\n",
+ "Null Hypothesis: There is no relationship between whether people live with family, friends, or neither and whether or not they work.\n",
+ "\n",
+ "Significance level: 0.1\n",
+ "\n",
+ "Degrees of freedom: 3"
+ ],
+ "metadata": {
+ "collapsed": false
+ },
+ "id": "b3b8550f7d931f4f"
+ },
+ {
+ "cell_type": "code",
+ "outputs": [],
+ "source": [
+ "hyp3_major_table = pd.crosstab(df.iloc[:, 3], df.iloc[:, 8], margins=True, margins_name='Total')\n",
+ "hyp3_major_table"
+ ],
+ "metadata": {
+ "collapsed": false
+ },
+ "id": "e1de39044138b742"
+ },
+ {
+ "cell_type": "code",
+ "outputs": [],
+ "source": [
+ "num_rows, num_cols = hyp3_major_table.shape\n",
+ "# Initialize expected frequencies\n",
+ "expected_frequencies = []\n",
+ "chi_squared = 0\n",
+ "for i in range(num_rows - 1):\n",
+ " row_totals = hyp3_major_table.iloc[i, -1]\n",
+ " for j in range(num_cols - 1):\n",
+ " col_totals = hyp3_major_table.iloc[-1, j]\n",
+ " expected_frequency = (row_totals * col_totals) / hyp3_major_table.iloc[-1, -1]\n",
+ " expected_frequencies.append(expected_frequency)\n",
+ " chi_squared += ((hyp3_major_table.iloc[i, j] - expected_frequency) ** 2) / expected_frequency\n",
+ "\n",
+ "print(\"Chi-squared value:\", chi_squared)"
+ ],
+ "metadata": {
+ "collapsed": false
+ },
+ "id": "a113621af30160ab"
+ },
+ {
+ "cell_type": "markdown",
+ "source": [
+ "With a significance level of 0.1 and 3 degrees of freedom, chi-squared must be greater than the critical value of 6.25 for us to reject the null hypothesis.\n",
+ "Since our chi-squared value of 4.61 is below that threshold (`4.61 < 6.25`), we fail to reject the null hypothesis:\n",
+ "\n",
+ "We do not have sufficient evidence of a relationship between whether people live with family, friends, or neither and whether or not they work."
+ ],
+ "metadata": {
+ "collapsed": false
+ },
+ "id": "d8fe5f03e8d634a7"
+ },
+ {
+ "cell_type": "markdown",
+ "source": [
"### Hypothesis 2: Students who live on-campus are more likely to have roommates of the same major.\n",
"\n",
"Null Hypothesis: There is no relationship between students who live on-campus and students who have roommates of the same major.\n",
@@ -646,7 +687,7 @@
"metadata": {
"collapsed": false
},
- "id": "dcc6d91b3e660c2e"
+ "id": "5c95a7d0932aef71"
},
{
"cell_type": "code",
@@ -662,7 +703,7 @@
}
],
"source": [
- "roommates_major_table = pd.crosstab(df.iloc[:, 3], df.iloc[:, 9], margins=True, margins_name='Total')\n",
+ "roommates_major_table = pd.crosstab(df.iloc[:, 4], df.iloc[:, 11], margins=True, margins_name='Total')\n",
"roommates_major_table"
],
"metadata": {