diff --git a/your-code/1.-Data-Cleaning.ipynb b/your-code/1.-Data-Cleaning.ipynb
index d1c8eea..44879bf 100644
--- a/your-code/1.-Data-Cleaning.ipynb
+++ b/your-code/1.-Data-Cleaning.ipynb
@@ -28,7 +28,7 @@
},
{
"cell_type": "code",
- "execution_count": 2,
+ "execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
@@ -47,11 +47,282 @@
},
{
"cell_type": "code",
- "execution_count": 3,
+ "execution_count": 2,
"metadata": {},
- "outputs": [],
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "
\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Name | \n",
+ " Team | \n",
+ " Pos | \n",
+ " Height | \n",
+ " Weight | \n",
+ " BMI | \n",
+ " Birth_Place | \n",
+ " Birthdate | \n",
+ " Age | \n",
+ " College | \n",
+ " Experience | \n",
+ " Games Played | \n",
+ " MIN | \n",
+ " FGM | \n",
+ " FGA | \n",
+ " FG% | \n",
+ " 3PM | \n",
+ " 3PA | \n",
+ " 3P% | \n",
+ " FTM | \n",
+ " FTA | \n",
+ " FT% | \n",
+ " OREB | \n",
+ " DREB | \n",
+ " REB | \n",
+ " AST | \n",
+ " STL | \n",
+ " BLK | \n",
+ " TO | \n",
+ " PTS | \n",
+ " DD2 | \n",
+ " TD3 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | 0 | \n",
+ " Aerial Powers | \n",
+ " DAL | \n",
+ " F | \n",
+ " 183 | \n",
+ " 71.0 | \n",
+ " 21.200991 | \n",
+ " US | \n",
+ " January 17, 1994 | \n",
+ " 23 | \n",
+ " Michigan State | \n",
+ " 2 | \n",
+ " 8 | \n",
+ " 173 | \n",
+ " 30 | \n",
+ " 85 | \n",
+ " 35.3 | \n",
+ " 12 | \n",
+ " 32 | \n",
+ " 37.5 | \n",
+ " 21 | \n",
+ " 26 | \n",
+ " 80.8 | \n",
+ " 6 | \n",
+ " 22 | \n",
+ " 28 | \n",
+ " 12 | \n",
+ " 3 | \n",
+ " 6 | \n",
+ " 12 | \n",
+ " 93 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ "
\n",
+ " \n",
+ " | 1 | \n",
+ " Alana Beard | \n",
+ " LA | \n",
+ " G/F | \n",
+ " 185 | \n",
+ " 73.0 | \n",
+ " 21.329438 | \n",
+ " US | \n",
+ " May 14, 1982 | \n",
+ " 35 | \n",
+ " Duke | \n",
+ " 12 | \n",
+ " 30 | \n",
+ " 947 | \n",
+ " 90 | \n",
+ " 177 | \n",
+ " 50.8 | \n",
+ " 5 | \n",
+ " 18 | \n",
+ " 27.8 | \n",
+ " 32 | \n",
+ " 41 | \n",
+ " 78.0 | \n",
+ " 19 | \n",
+ " 82 | \n",
+ " 101 | \n",
+ " 72 | \n",
+ " 63 | \n",
+ " 13 | \n",
+ " 40 | \n",
+ " 217 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ "
\n",
+ " \n",
+ " | 2 | \n",
+ " Alex Bentley | \n",
+ " CON | \n",
+ " G | \n",
+ " 170 | \n",
+ " 69.0 | \n",
+ " 23.875433 | \n",
+ " US | \n",
+ " October 27, 1990 | \n",
+ " 26 | \n",
+ " Penn State | \n",
+ " 4 | \n",
+ " 26 | \n",
+ " 617 | \n",
+ " 82 | \n",
+ " 218 | \n",
+ " 37.6 | \n",
+ " 19 | \n",
+ " 64 | \n",
+ " 29.7 | \n",
+ " 35 | \n",
+ " 42 | \n",
+ " 83.3 | \n",
+ " 4 | \n",
+ " 36 | \n",
+ " 40 | \n",
+ " 78 | \n",
+ " 22 | \n",
+ " 3 | \n",
+ " 24 | \n",
+ " 218 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ "
\n",
+ " \n",
+ " | 3 | \n",
+ " Alex Montgomery | \n",
+ " SAN | \n",
+ " G/F | \n",
+ " 185 | \n",
+ " 84.0 | \n",
+ " 24.543462 | \n",
+ " US | \n",
+ " December 11, 1988 | \n",
+ " 28 | \n",
+ " Georgia Tech | \n",
+ " 6 | \n",
+ " 31 | \n",
+ " 721 | \n",
+ " 75 | \n",
+ " 195 | \n",
+ " 38.5 | \n",
+ " 21 | \n",
+ " 68 | \n",
+ " 30.9 | \n",
+ " 17 | \n",
+ " 21 | \n",
+ " 81.0 | \n",
+ " 35 | \n",
+ " 134 | \n",
+ " 169 | \n",
+ " 65 | \n",
+ " 20 | \n",
+ " 10 | \n",
+ " 38 | \n",
+ " 188 | \n",
+ " 2 | \n",
+ " 0 | \n",
+ "
\n",
+ " \n",
+ " | 4 | \n",
+ " Alexis Jones | \n",
+ " MIN | \n",
+ " G | \n",
+ " 175 | \n",
+ " 78.0 | \n",
+ " 25.469388 | \n",
+ " US | \n",
+ " August 5, 1994 | \n",
+ " 23 | \n",
+ " Baylor | \n",
+ " R | \n",
+ " 24 | \n",
+ " 137 | \n",
+ " 16 | \n",
+ " 50 | \n",
+ " 32.0 | \n",
+ " 7 | \n",
+ " 20 | \n",
+ " 35.0 | \n",
+ " 11 | \n",
+ " 12 | \n",
+ " 91.7 | \n",
+ " 3 | \n",
+ " 9 | \n",
+ " 12 | \n",
+ " 12 | \n",
+ " 7 | \n",
+ " 0 | \n",
+ " 14 | \n",
+ " 50 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Name Team Pos Height Weight BMI Birth_Place \\\n",
+ "0 Aerial Powers DAL F 183 71.0 21.200991 US \n",
+ "1 Alana Beard LA G/F 185 73.0 21.329438 US \n",
+ "2 Alex Bentley CON G 170 69.0 23.875433 US \n",
+ "3 Alex Montgomery SAN G/F 185 84.0 24.543462 US \n",
+ "4 Alexis Jones MIN G 175 78.0 25.469388 US \n",
+ "\n",
+ " Birthdate Age College Experience Games Played MIN FGM \\\n",
+ "0 January 17, 1994 23 Michigan State 2 8 173 30 \n",
+ "1 May 14, 1982 35 Duke 12 30 947 90 \n",
+ "2 October 27, 1990 26 Penn State 4 26 617 82 \n",
+ "3 December 11, 1988 28 Georgia Tech 6 31 721 75 \n",
+ "4 August 5, 1994 23 Baylor R 24 137 16 \n",
+ "\n",
+ " FGA FG% 3PM 3PA 3P% FTM FTA FT% OREB DREB REB AST STL BLK \\\n",
+ "0 85 35.3 12 32 37.5 21 26 80.8 6 22 28 12 3 6 \n",
+ "1 177 50.8 5 18 27.8 32 41 78.0 19 82 101 72 63 13 \n",
+ "2 218 37.6 19 64 29.7 35 42 83.3 4 36 40 78 22 3 \n",
+ "3 195 38.5 21 68 30.9 17 21 81.0 35 134 169 65 20 10 \n",
+ "4 50 32.0 7 20 35.0 11 12 91.7 3 9 12 12 7 0 \n",
+ "\n",
+ " TO PTS DD2 TD3 \n",
+ "0 12 93 0 0 \n",
+ "1 40 217 0 0 \n",
+ "2 24 218 0 0 \n",
+ "3 38 188 2 0 \n",
+ "4 14 50 0 0 "
+ ]
+ },
+ "execution_count": 2,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
"source": [
- "#your code here"
+ "wnba = pd.read_csv(\"wnba.csv\")\n",
+ "wnba.head()"
]
},
{
@@ -64,11 +335,54 @@
},
{
"cell_type": "code",
- "execution_count": 5,
+ "execution_count": 3,
"metadata": {},
- "outputs": [],
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "Name 0\n",
+ "Team 0\n",
+ "Pos 0\n",
+ "Height 0\n",
+ "Weight 1\n",
+ "BMI 1\n",
+ "Birth_Place 0\n",
+ "Birthdate 0\n",
+ "Age 0\n",
+ "College 0\n",
+ "Experience 0\n",
+ "Games Played 0\n",
+ "MIN 0\n",
+ "FGM 0\n",
+ "FGA 0\n",
+ "FG% 0\n",
+ "3PM 0\n",
+ "3PA 0\n",
+ "3P% 0\n",
+ "FTM 0\n",
+ "FTA 0\n",
+ "FT% 0\n",
+ "OREB 0\n",
+ "DREB 0\n",
+ "REB 0\n",
+ "AST 0\n",
+ "STL 0\n",
+ "BLK 0\n",
+ "TO 0\n",
+ "PTS 0\n",
+ "DD2 0\n",
+ "TD3 0\n",
+ "dtype: int64"
+ ]
+ },
+ "execution_count": 3,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
"source": [
- "#your code here"
+ "wnba.isnull().sum()"
]
},
{
@@ -80,11 +394,122 @@
},
{
"cell_type": "code",
- "execution_count": 7,
+ "execution_count": 4,
"metadata": {},
- "outputs": [],
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Name | \n",
+ " Team | \n",
+ " Pos | \n",
+ " Height | \n",
+ " Weight | \n",
+ " BMI | \n",
+ " Birth_Place | \n",
+ " Birthdate | \n",
+ " Age | \n",
+ " College | \n",
+ " Experience | \n",
+ " Games Played | \n",
+ " MIN | \n",
+ " FGM | \n",
+ " FGA | \n",
+ " FG% | \n",
+ " 3PM | \n",
+ " 3PA | \n",
+ " 3P% | \n",
+ " FTM | \n",
+ " FTA | \n",
+ " FT% | \n",
+ " OREB | \n",
+ " DREB | \n",
+ " REB | \n",
+ " AST | \n",
+ " STL | \n",
+ " BLK | \n",
+ " TO | \n",
+ " PTS | \n",
+ " DD2 | \n",
+ " TD3 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | 91 | \n",
+ " Makayla Epps | \n",
+ " CHI | \n",
+ " G | \n",
+ " 178 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " US | \n",
+ " June 6, 1995 | \n",
+ " 22 | \n",
+ " Kentucky | \n",
+ " R | \n",
+ " 14 | \n",
+ " 52 | \n",
+ " 2 | \n",
+ " 14 | \n",
+ " 14.3 | \n",
+ " 0 | \n",
+ " 5 | \n",
+ " 0.0 | \n",
+ " 2 | \n",
+ " 5 | \n",
+ " 40.0 | \n",
+ " 2 | \n",
+ " 0 | \n",
+ " 2 | \n",
+ " 4 | \n",
+ " 1 | \n",
+ " 0 | \n",
+ " 4 | \n",
+ " 6 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Name Team Pos Height Weight BMI Birth_Place Birthdate Age \\\n",
+ "91 Makayla Epps CHI G 178 NaN NaN US June 6, 1995 22 \n",
+ "\n",
+ " College Experience Games Played MIN FGM FGA FG% 3PM 3PA 3P% \\\n",
+ "91 Kentucky R 14 52 2 14 14.3 0 5 0.0 \n",
+ "\n",
+ " FTM FTA FT% OREB DREB REB AST STL BLK TO PTS DD2 TD3 \n",
+ "91 2 5 40.0 2 0 2 4 1 0 4 6 0 0 "
+ ]
+ },
+ "execution_count": 4,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
"source": [
- "#your code here"
+ "wnba[wnba.isnull().any(axis = 1)]"
]
},
{
@@ -96,11 +521,22 @@
},
{
"cell_type": "code",
- "execution_count": 9,
+ "execution_count": 5,
"metadata": {},
- "outputs": [],
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "the percentage of data we would remove is: 0.006993006993006993\n"
+ ]
+ }
+ ],
"source": [
- "#your code here"
+ "total_rows = wnba.shape[0]\n",
+ "p = 1/total_rows\n",
+ "\n",
+ "print(\"the percentage of data we would remove is: \", p)"
]
},
{
@@ -114,11 +550,11 @@
},
{
"cell_type": "code",
- "execution_count": 11,
+ "execution_count": 6,
"metadata": {},
"outputs": [],
"source": [
- "#your code here"
+ "wnba.dropna(inplace = True)"
]
},
{
@@ -130,11 +566,13 @@
},
{
"cell_type": "code",
- "execution_count": 13,
+ "execution_count": 7,
"metadata": {},
"outputs": [],
"source": [
- "#your answer here"
+ "# this was for sure a good decision\n",
+ "# a case i would not drop the NaN values, are if the number of rows affected have such a high percentage, that it would effect the data too much.\n",
+ "# another case is if we have sensitive data points where we can not afford loosing any datapoints"
]
},
{
@@ -147,11 +585,54 @@
},
{
"cell_type": "code",
- "execution_count": 14,
+ "execution_count": 8,
"metadata": {},
- "outputs": [],
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "Name object\n",
+ "Team object\n",
+ "Pos object\n",
+ "Height int64\n",
+ "Weight float64\n",
+ "BMI float64\n",
+ "Birth_Place object\n",
+ "Birthdate object\n",
+ "Age int64\n",
+ "College object\n",
+ "Experience object\n",
+ "Games Played int64\n",
+ "MIN int64\n",
+ "FGM int64\n",
+ "FGA int64\n",
+ "FG% float64\n",
+ "3PM int64\n",
+ "3PA int64\n",
+ "3P% float64\n",
+ "FTM int64\n",
+ "FTA int64\n",
+ "FT% float64\n",
+ "OREB int64\n",
+ "DREB int64\n",
+ "REB int64\n",
+ "AST int64\n",
+ "STL int64\n",
+ "BLK int64\n",
+ "TO int64\n",
+ "PTS int64\n",
+ "DD2 int64\n",
+ "TD3 int64\n",
+ "dtype: object"
+ ]
+ },
+ "execution_count": 8,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
"source": [
- "#your code here"
+ "wnba.dtypes"
]
},
{
@@ -170,11 +651,65 @@
},
{
"cell_type": "code",
- "execution_count": 16,
+ "execution_count": 9,
"metadata": {},
"outputs": [],
"source": [
- "#your code here"
+ "wnba['Weight'] = wnba['Weight'].astype(int)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 10,
+ "metadata": {
+ "scrolled": false
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "Name object\n",
+ "Team object\n",
+ "Pos object\n",
+ "Height int64\n",
+ "Weight int64\n",
+ "BMI float64\n",
+ "Birth_Place object\n",
+ "Birthdate object\n",
+ "Age int64\n",
+ "College object\n",
+ "Experience object\n",
+ "Games Played int64\n",
+ "MIN int64\n",
+ "FGM int64\n",
+ "FGA int64\n",
+ "FG% float64\n",
+ "3PM int64\n",
+ "3PA int64\n",
+ "3P% float64\n",
+ "FTM int64\n",
+ "FTA int64\n",
+ "FT% float64\n",
+ "OREB int64\n",
+ "DREB int64\n",
+ "REB int64\n",
+ "AST int64\n",
+ "STL int64\n",
+ "BLK int64\n",
+ "TO int64\n",
+ "PTS int64\n",
+ "DD2 int64\n",
+ "TD3 int64\n",
+ "dtype: object"
+ ]
+ },
+ "execution_count": 10,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "wnba.dtypes"
]
},
{
@@ -186,11 +721,345 @@
},
{
"cell_type": "code",
- "execution_count": 18,
+ "execution_count": 11,
"metadata": {},
- "outputs": [],
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Height | \n",
+ " Weight | \n",
+ " BMI | \n",
+ " Age | \n",
+ " Games Played | \n",
+ " MIN | \n",
+ " FGM | \n",
+ " FGA | \n",
+ " FG% | \n",
+ " 3PM | \n",
+ " 3PA | \n",
+ " 3P% | \n",
+ " FTM | \n",
+ " FTA | \n",
+ " FT% | \n",
+ " OREB | \n",
+ " DREB | \n",
+ " REB | \n",
+ " AST | \n",
+ " STL | \n",
+ " BLK | \n",
+ " TO | \n",
+ " PTS | \n",
+ " DD2 | \n",
+ " TD3 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | count | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ " 142.000000 | \n",
+ "
\n",
+ " \n",
+ " | mean | \n",
+ " 184.612676 | \n",
+ " 78.978873 | \n",
+ " 23.091214 | \n",
+ " 27.112676 | \n",
+ " 24.429577 | \n",
+ " 500.105634 | \n",
+ " 74.401408 | \n",
+ " 168.704225 | \n",
+ " 43.102817 | \n",
+ " 14.830986 | \n",
+ " 43.697183 | \n",
+ " 24.978169 | \n",
+ " 39.535211 | \n",
+ " 49.422535 | \n",
+ " 75.828873 | \n",
+ " 22.063380 | \n",
+ " 61.591549 | \n",
+ " 83.654930 | \n",
+ " 44.514085 | \n",
+ " 17.725352 | \n",
+ " 9.781690 | \n",
+ " 32.288732 | \n",
+ " 203.169014 | \n",
+ " 1.140845 | \n",
+ " 0.007042 | \n",
+ "
\n",
+ " \n",
+ " | std | \n",
+ " 8.698128 | \n",
+ " 10.996110 | \n",
+ " 2.073691 | \n",
+ " 3.667180 | \n",
+ " 7.075477 | \n",
+ " 289.373393 | \n",
+ " 55.980754 | \n",
+ " 117.165809 | \n",
+ " 9.855199 | \n",
+ " 17.372829 | \n",
+ " 46.155302 | \n",
+ " 18.459075 | \n",
+ " 36.743053 | \n",
+ " 44.244697 | \n",
+ " 18.536151 | \n",
+ " 21.519648 | \n",
+ " 49.669854 | \n",
+ " 68.200585 | \n",
+ " 41.490790 | \n",
+ " 13.413312 | \n",
+ " 12.537669 | \n",
+ " 21.447141 | \n",
+ " 153.032559 | \n",
+ " 2.909002 | \n",
+ " 0.083918 | \n",
+ "
\n",
+ " \n",
+ " | min | \n",
+ " 165.000000 | \n",
+ " 55.000000 | \n",
+ " 18.390675 | \n",
+ " 21.000000 | \n",
+ " 2.000000 | \n",
+ " 12.000000 | \n",
+ " 1.000000 | \n",
+ " 3.000000 | \n",
+ " 16.700000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ " 2.000000 | \n",
+ " 2.000000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ " 2.000000 | \n",
+ " 2.000000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ "
\n",
+ " \n",
+ " | 25% | \n",
+ " 175.750000 | \n",
+ " 71.500000 | \n",
+ " 21.785876 | \n",
+ " 24.000000 | \n",
+ " 22.000000 | \n",
+ " 242.250000 | \n",
+ " 27.000000 | \n",
+ " 69.000000 | \n",
+ " 37.125000 | \n",
+ " 0.000000 | \n",
+ " 3.000000 | \n",
+ " 0.000000 | \n",
+ " 13.000000 | \n",
+ " 17.250000 | \n",
+ " 71.575000 | \n",
+ " 7.000000 | \n",
+ " 26.000000 | \n",
+ " 34.250000 | \n",
+ " 11.250000 | \n",
+ " 7.000000 | \n",
+ " 2.000000 | \n",
+ " 14.000000 | \n",
+ " 77.250000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ "
\n",
+ " \n",
+ " | 50% | \n",
+ " 185.000000 | \n",
+ " 79.000000 | \n",
+ " 22.873314 | \n",
+ " 27.000000 | \n",
+ " 27.500000 | \n",
+ " 506.000000 | \n",
+ " 69.000000 | \n",
+ " 152.500000 | \n",
+ " 42.050000 | \n",
+ " 10.500000 | \n",
+ " 32.000000 | \n",
+ " 30.550000 | \n",
+ " 29.000000 | \n",
+ " 35.500000 | \n",
+ " 80.000000 | \n",
+ " 13.000000 | \n",
+ " 50.000000 | \n",
+ " 62.500000 | \n",
+ " 34.000000 | \n",
+ " 15.000000 | \n",
+ " 5.000000 | \n",
+ " 28.000000 | \n",
+ " 181.000000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ "
\n",
+ " \n",
+ " | 75% | \n",
+ " 191.000000 | \n",
+ " 86.000000 | \n",
+ " 24.180715 | \n",
+ " 30.000000 | \n",
+ " 29.000000 | \n",
+ " 752.500000 | \n",
+ " 105.000000 | \n",
+ " 244.750000 | \n",
+ " 48.625000 | \n",
+ " 22.000000 | \n",
+ " 65.500000 | \n",
+ " 36.175000 | \n",
+ " 53.250000 | \n",
+ " 66.500000 | \n",
+ " 85.925000 | \n",
+ " 31.000000 | \n",
+ " 84.000000 | \n",
+ " 116.500000 | \n",
+ " 66.750000 | \n",
+ " 27.500000 | \n",
+ " 12.000000 | \n",
+ " 48.000000 | \n",
+ " 277.750000 | \n",
+ " 1.000000 | \n",
+ " 0.000000 | \n",
+ "
\n",
+ " \n",
+ " | max | \n",
+ " 206.000000 | \n",
+ " 113.000000 | \n",
+ " 31.555880 | \n",
+ " 36.000000 | \n",
+ " 32.000000 | \n",
+ " 1018.000000 | \n",
+ " 227.000000 | \n",
+ " 509.000000 | \n",
+ " 100.000000 | \n",
+ " 88.000000 | \n",
+ " 225.000000 | \n",
+ " 100.000000 | \n",
+ " 168.000000 | \n",
+ " 186.000000 | \n",
+ " 100.000000 | \n",
+ " 113.000000 | \n",
+ " 226.000000 | \n",
+ " 334.000000 | \n",
+ " 206.000000 | \n",
+ " 63.000000 | \n",
+ " 64.000000 | \n",
+ " 87.000000 | \n",
+ " 584.000000 | \n",
+ " 17.000000 | \n",
+ " 1.000000 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Height Weight BMI Age Games Played \\\n",
+ "count 142.000000 142.000000 142.000000 142.000000 142.000000 \n",
+ "mean 184.612676 78.978873 23.091214 27.112676 24.429577 \n",
+ "std 8.698128 10.996110 2.073691 3.667180 7.075477 \n",
+ "min 165.000000 55.000000 18.390675 21.000000 2.000000 \n",
+ "25% 175.750000 71.500000 21.785876 24.000000 22.000000 \n",
+ "50% 185.000000 79.000000 22.873314 27.000000 27.500000 \n",
+ "75% 191.000000 86.000000 24.180715 30.000000 29.000000 \n",
+ "max 206.000000 113.000000 31.555880 36.000000 32.000000 \n",
+ "\n",
+ " MIN FGM FGA FG% 3PM \\\n",
+ "count 142.000000 142.000000 142.000000 142.000000 142.000000 \n",
+ "mean 500.105634 74.401408 168.704225 43.102817 14.830986 \n",
+ "std 289.373393 55.980754 117.165809 9.855199 17.372829 \n",
+ "min 12.000000 1.000000 3.000000 16.700000 0.000000 \n",
+ "25% 242.250000 27.000000 69.000000 37.125000 0.000000 \n",
+ "50% 506.000000 69.000000 152.500000 42.050000 10.500000 \n",
+ "75% 752.500000 105.000000 244.750000 48.625000 22.000000 \n",
+ "max 1018.000000 227.000000 509.000000 100.000000 88.000000 \n",
+ "\n",
+ " 3PA 3P% FTM FTA FT% OREB \\\n",
+ "count 142.000000 142.000000 142.000000 142.000000 142.000000 142.000000 \n",
+ "mean 43.697183 24.978169 39.535211 49.422535 75.828873 22.063380 \n",
+ "std 46.155302 18.459075 36.743053 44.244697 18.536151 21.519648 \n",
+ "min 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 \n",
+ "25% 3.000000 0.000000 13.000000 17.250000 71.575000 7.000000 \n",
+ "50% 32.000000 30.550000 29.000000 35.500000 80.000000 13.000000 \n",
+ "75% 65.500000 36.175000 53.250000 66.500000 85.925000 31.000000 \n",
+ "max 225.000000 100.000000 168.000000 186.000000 100.000000 113.000000 \n",
+ "\n",
+ " DREB REB AST STL BLK TO \\\n",
+ "count 142.000000 142.000000 142.000000 142.000000 142.000000 142.000000 \n",
+ "mean 61.591549 83.654930 44.514085 17.725352 9.781690 32.288732 \n",
+ "std 49.669854 68.200585 41.490790 13.413312 12.537669 21.447141 \n",
+ "min 2.000000 2.000000 0.000000 0.000000 0.000000 2.000000 \n",
+ "25% 26.000000 34.250000 11.250000 7.000000 2.000000 14.000000 \n",
+ "50% 50.000000 62.500000 34.000000 15.000000 5.000000 28.000000 \n",
+ "75% 84.000000 116.500000 66.750000 27.500000 12.000000 48.000000 \n",
+ "max 226.000000 334.000000 206.000000 63.000000 64.000000 87.000000 \n",
+ "\n",
+ " PTS DD2 TD3 \n",
+ "count 142.000000 142.000000 142.000000 \n",
+ "mean 203.169014 1.140845 0.007042 \n",
+ "std 153.032559 2.909002 0.083918 \n",
+ "min 2.000000 0.000000 0.000000 \n",
+ "25% 77.250000 0.000000 0.000000 \n",
+ "50% 181.000000 0.000000 0.000000 \n",
+ "75% 277.750000 1.000000 0.000000 \n",
+ "max 584.000000 17.000000 1.000000 "
+ ]
+ },
+ "execution_count": 11,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
"source": [
- "#your code here"
+ "wnba.describe()"
]
},
{
@@ -202,11 +1071,13 @@
},
{
"cell_type": "code",
- "execution_count": 20,
+ "execution_count": 12,
"metadata": {},
"outputs": [],
"source": [
- "#your answer here"
+ "# an indicator for an outlier would be either be a large standartdeviation \n",
+ "# or a difference between the steps of the quarters and the maximum\n",
+ "# for example in the FG% column, between 25% and 75% is only 11, but the maximum is 52 higher than the 75% value.\n"
]
},
{
@@ -218,17 +1089,17 @@
},
{
"cell_type": "code",
- "execution_count": 21,
+ "execution_count": 13,
"metadata": {},
"outputs": [],
"source": [
- "#your code here"
+ "wnba.to_csv(\"wnba_clean.csv\", index = False)"
]
}
],
"metadata": {
"kernelspec": {
- "display_name": "Python 3",
+ "display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
@@ -242,7 +1113,7 @@
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
- "version": "3.6.8"
+ "version": "3.11.4"
}
},
"nbformat": 4,
diff --git a/data/wnba.csv b/your-code/wnba.csv
similarity index 100%
rename from data/wnba.csv
rename to your-code/wnba.csv
diff --git a/data/wnba_clean.csv b/your-code/wnba_clean.csv
similarity index 97%
rename from data/wnba_clean.csv
rename to your-code/wnba_clean.csv
index 3d702f3..3bf5421 100644
--- a/data/wnba_clean.csv
+++ b/your-code/wnba_clean.csv
@@ -40,7 +40,7 @@ Courtney Vandersloot,CHI,G,173,66,22.05219018,US,"August 2, 1989",28,Gonzaga,6,2
Courtney Williams,CON,G,173,62,20.71569381,US,"November 5, 1994",22,South Florida,1,29,755,168,338,49.7,8,30,26.7,31,36,86.1,38,84,122,60,15,6,39,375,1,0
Crystal Langhorne,SEA,F/C,188,84,23.76641014,US,"October 27, 1986",30,Maryland,10,30,848,160,240,66.7,1,2,50.0,49,68,72.1,35,140,175,46,16,11,50,370,2,0
Damiris Dantas,ATL,C,191,89,24.39626107,BR,"November 17, 1992",24,Brazil,4,30,569,98,243,40.3,25,91,27.5,33,43,76.7,29,84,113,19,17,18,26,254,0,0
-Danielle Adams,CON,F/C,185,108,31.555880199999997,US,"February 19, 1989",28,Texas A&M,5,18,81,16,43,37.2,12,30,40.0,5,5,100.0,6,4,10,4,4,4,7,49,0,0
+Danielle Adams,CON,F/C,185,108,31.5558802,US,"February 19, 1989",28,Texas A&M,5,18,81,16,43,37.2,12,30,40.0,5,5,100.0,6,4,10,4,4,4,7,49,0,0
Danielle Robinson,PHO,G,175,57,18.6122449,US,"October 5, 1989",27,Oklahoma,7,28,680,79,178,44.4,0,5,0.0,51,61,83.6,13,73,86,106,33,4,58,209,0,0
Dearica Hamby,SAN,F,191,86,23.57391519,US,"June 11, 1993",24,Wake Forest,2,31,650,96,207,46.4,3,8,37.5,58,95,61.1,48,91,139,32,29,8,43,253,1,0
Devereaux Peters,IND,F,188,79,22.35174287,US,"August 10, 1989",28,Notre Dame,6,28,796,154,380,40.5,88,225,39.1,118,130,90.8,8,69,77,76,16,9,56,514,0,0
@@ -73,7 +73,7 @@ Kaela Davis,DAL,G,188,77,21.78587596,US,"March 15, 1995",22,South Carolina,R,23,
Kahleah Copper,CHI,G/F,185,70,20.45288532,US,"August 28, 1994",22,Rutgers,1,29,475,62,163,38.0,12,32,37.5,49,65,75.4,10,33,43,32,13,3,48,185,0,0
Kaleena Mosqueda-Lewis,SEA,F,180,82,25.30864198,US,"March 11, 1993",24,Connecticut,3,29,369,60,140,42.9,5,23,21.7,36,45,80.0,11,43,54,11,9,2,22,161,0,0
Karima Christmas-Kelly,DAL,G/F,183,82,24.48565201,US,"November 9, 1989",27,Duke,6,14,142,23,43,53.5,9,21,42.9,10,10,100.0,4,10,14,6,1,1,13,65,0,0
-Kayla Alexander,SAN,C,193,88,23.624795300000002,CA,"May 1, 1991",26,Arizona State,4,30,889,91,239,38.1,25,83,30.1,111,129,86.0,45,75,120,65,39,5,50,318,0,0
+Kayla Alexander,SAN,C,193,88,23.6247953,CA,"May 1, 1991",26,Arizona State,4,30,889,91,239,38.1,25,83,30.1,111,129,86.0,45,75,120,65,39,5,50,318,0,0
Kayla McBride,SAN,G/F,180,79,24.38271605,US,"June 25, 1992",25,Notre Dame,3,31,433,78,141,55.3,0,0,0.0,15,16,93.8,40,47,87,17,13,15,30,171,0,0
Kayla Pedersen,CON,F,193,86,23.08786813,US,"April 14, 1989",28,Stanford,5,27,882,128,337,38.0,47,147,32.0,108,118,91.5,12,93,105,59,32,5,54,411,0,0
Kayla Thornton,DAL,F,185,86,25.12783053,US,"October 20, 1992",24,Texas–El Paso,2,21,224,11,30,36.7,0,1,0.0,10,14,71.4,19,26,45,13,6,2,9,32,0,0
@@ -107,7 +107,7 @@ Odyssey Sims,LA,G,173,73,24.39105884,US,"July 13, 1992",25,Baylor,4,27,626,86,19
Plenette Pierson,MIN,F/C,188,88,24.89814396,US,"August 31, 1981",35,Texas Tech,15,29,402,54,142,38.0,17,51,33.3,15,20,75.0,13,49,62,48,12,4,33,140,0,0
Rachel Banham,CON,G,175,76,24.81632653,US,"July 15, 1993",24,Minnesota,2,26,238,32,87,36.8,16,48,33.3,16,20,80.0,2,27,29,20,4,0,12,96,0,0
Ramu Tokashiki,SEA,F,193,80,21.47708663,JP,"November 6, 1991",25,Japan,1,29,378,42,92,45.7,0,3,0.0,22,27,81.5,19,29,48,16,8,8,25,106,0,0
-Rebecca Allen,NY,G/F,188,74,20.937075600000004,AU,"June 11, 1992",25,Australia,3,28,254,31,86,36.0,14,40,35.0,2,6,33.3,13,51,64,15,9,12,17,78,0,0
+Rebecca Allen,NY,G/F,188,74,20.9370756,AU,"June 11, 1992",25,Australia,3,28,254,31,86,36.0,14,40,35.0,2,6,33.3,13,51,64,15,9,12,17,78,0,0
Rebekkah Brunson,MIN,F,188,84,23.76641014,US,"November 12, 1981",35,Georgetown,14,26,719,97,218,44.5,22,60,36.7,62,83,74.7,46,135,181,40,31,9,42,278,2,0
Renee Montgomery,MIN,G,170,63,21.79930796,US,"February 12, 1986",31,Connecticut,9,29,614,71,181,39.2,30,89,33.7,44,51,86.3,12,34,46,96,24,1,43,216,0,0
Riquna Williams,LA,G,170,75,25.95155709,US,"May 28, 1990",27,Miami (FL),5,23,408,45,140,32.1,20,74,27.0,38,44,86.4,6,26,32,16,19,3,26,148,0,0