From 30becc644ca6fe82c84603ed602d422fa8ef9955 Mon Sep 17 00:00:00 2001 From: Alejandro Arroyo Yamin Date: Thu, 11 Jul 2019 11:46:21 -0500 Subject: [PATCH] Terminamos lab import-export, Rodrigo y Alejandro --- .../.ipynb_checkpoints/main-checkpoint.ipynb | 2237 +++++++++++++++++ your-code/fertility_Diagnosis.txt | 100 + your-code/main.ipynb | 1992 ++++++++++++++- 3 files changed, 4295 insertions(+), 34 deletions(-) create mode 100644 your-code/.ipynb_checkpoints/main-checkpoint.ipynb create mode 100644 your-code/fertility_Diagnosis.txt diff --git a/your-code/.ipynb_checkpoints/main-checkpoint.ipynb b/your-code/.ipynb_checkpoints/main-checkpoint.ipynb new file mode 100644 index 0000000..eb9194a --- /dev/null +++ b/your-code/.ipynb_checkpoints/main-checkpoint.ipynb @@ -0,0 +1,2237 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Before you start:\n", + "- Read the README.md file\n", + "- Comment as much as you can and use the resources in the README.md file\n", + "- Happy learning!" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Challenge 1 - Working with JSON files\n", + "\n", + "Import the pandas library" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "# Your import here:\n", + "import pandas as pd" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### After importing pandas, let's find a dataset. In this lesson we will be working with a NASA dataset.\n", + "\n", + "Run the code in the cell below to load the dataset containing information about asteroids that have landed on earth. This piece of code helps us open the URL for the dataset and decode the data using UTF-8." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "# Run this code\n", + "\n", + "from urllib.request import urlopen\n", + "import json\n", + "\n", + "response = urlopen(\"https://data.nasa.gov/resource/y77d-th95.json\")\n", + "json_data = response.read().decode('utf-8', 'replace')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "In the next cell, load the data in `json_data` and load it into a pandas dataframe. Name the dataframe `nasa`." + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
:@computed_region_cbhk_fwbd:@computed_region_nnqa_25f4fallgeolocationidmassnamenametyperecclassreclatreclongyear
0NaNNaNFell{'type': 'Point', 'coordinates': [6.08333, 50....121.0AachenValidL550.775006.083331880-01-01T00:00:00.000
1NaNNaNFell{'type': 'Point', 'coordinates': [10.23333, 56...2720.0AarhusValidH656.1833310.233331951-01-01T00:00:00.000
2NaNNaNFell{'type': 'Point', 'coordinates': [-113, 54.216...6107000.0AbeeValidEH454.21667-113.000001952-01-01T00:00:00.000
3NaNNaNFell{'type': 'Point', 'coordinates': [-99.9, 16.88...101914.0AcapulcoValidAcapulcoite16.88333-99.900001976-01-01T00:00:00.000
4NaNNaNFell{'type': 'Point', 'coordinates': [-64.95, -33....370780.0AchirasValidL6-33.16667-64.950001902-01-01T00:00:00.000
5NaNNaNFell{'type': 'Point', 'coordinates': [71.8, 32.1]}3794239.0Adhi KotValidEH432.1000071.800001919-01-01T00:00:00.000
6NaNNaNFell{'type': 'Point', 'coordinates': [95.16667, 44...390910.0Adzhi-Bogdo (stone)ValidLL3-644.8333395.166671949-01-01T00:00:00.000
7NaNNaNFell{'type': 'Point', 'coordinates': [0.61667, 44....39230000.0AgenValidH544.216670.616671814-01-01T00:00:00.000
8NaNNaNFell{'type': 'Point', 'coordinates': [-65.23333, -...3981620.0AguadaValidL6-31.60000-65.233331930-01-01T00:00:00.000
9NaNNaNFell{'type': 'Point', 'coordinates': [-64.55, -30....4171440.0Aguila BlancaValidL-30.86667-64.550001920-01-01T00:00:00.000
10NaNNaNFell{'type': 'Point', 'coordinates': [-9.57028, 16...4231000.0Aioun el AtroussValidDiogenite-pm16.39806-9.570281974-01-01T00:00:00.000
11NaNNaNFell{'type': 'Point', 'coordinates': [8.38333, 19....42424000.0AïrValidL619.083338.383331925-01-01T00:00:00.000
12NaNNaNFell{'type': 'Point', 'coordinates': [2.33333, 50....425NaNAire-sur-la-LysValidUnknown50.666672.333331769-01-01T00:00:00.000
13NaNNaNFell{'type': 'Point', 'coordinates': [35.05, 29.51...426779.0AkabaValidL629.5166735.050001949-01-01T00:00:00.000
14NaNNaNFell{'type': 'Point', 'coordinates': [77.95, 29.71...4271800.0AkbarpurValidH429.7166777.950001838-01-01T00:00:00.000
15NaNNaNFell{'type': 'Point', 'coordinates': [8.43333, 8.9...4323000.0AkwangaValidH8.916678.433331959-01-01T00:00:00.000
16NaNNaNFell{'type': 'Point', 'coordinates': [42.81667, 39...43350000.0AkyumakValidIron, IVA39.9166742.816671981-01-01T00:00:00.000
17NaNNaNFell{'type': 'Point', 'coordinates': [39.51667, 24...446160.0Al RaisValidCR2-an24.4166739.516671957-01-01T00:00:00.000
18NaNNaNFell{'type': 'Point', 'coordinates': [28.96, 13.66...447700.0Al ZarnkhValidLL513.6603328.960002001-01-01T00:00:00.000
19NaNNaNFell{'type': 'Point', 'coordinates': [4.08333, 44....4486000.0AlaisValidCI144.116674.083331806-01-01T00:00:00.000
20NaNNaNFell{'type': 'Point', 'coordinates': [11.01667, 44...4532000.0AlbaretoValidL/LL444.6500011.016671766-01-01T00:00:00.000
21NaNNaNFell{'type': 'Point', 'coordinates': [22.66667, 2]}454625.0AlbertaValidL2.0000022.666671949-01-01T00:00:00.000
22NaNNaNFell{'type': 'Point', 'coordinates': [6.01533, 45....458252.0Alby sur ChéranValidEucrite-mmict45.821336.015332002-01-01T00:00:00.000
23NaNNaNFell{'type': 'Point', 'coordinates': [-1.78333, 51...461700.0AldsworthValidLL551.78333-1.783331835-01-01T00:00:00.000
24NaNNaNFell{'type': 'Point', 'coordinates': [37.13333, 36...4623200.0AleppoValidL636.2333337.133331873-01-01T00:00:00.000
25NaNNaNFell{'type': 'Point', 'coordinates': [8.75, 44.883...463908.0AlessandriaValidH544.883338.750001860-01-01T00:00:00.000
26NaNNaNFell{'type': 'Point', 'coordinates': [31.81667, 50...4659251.0AlexandrovskyValidH450.9500031.816671900-01-01T00:00:00.000
27NaNNaNFell{'type': 'Point', 'coordinates': [10.15, 45.26...466228000.0AlfianelloValidL645.2666710.150001883-01-01T00:00:00.000
2850.0429.0Fell{'type': 'Point', 'coordinates': [-85.88333, 4...227632000.0AlleganValidH542.53333-85.883331899-01-01T00:00:00.000
29NaNNaNFell{'type': 'Point', 'coordinates': [-105.31667, ...22782000000.0AllendeValidCV326.96667-105.316671969-01-01T00:00:00.000
.......................................
97029.01637.0Fell{'type': 'Point', 'coordinates': [-86.2945, 33...237735560.0SylacaugaValidH433.18836-86.294501954-01-01T00:00:00.000
971NaNNaNFell{'type': 'Point', 'coordinates': [14.65, 49.4]}237767540.0TaborValidH549.4000014.650001753-01-01T00:00:00.000
972NaNNaNFell{'type': 'Point', 'coordinates': [5.41667, 36....237789000.0TadjeraValidL536.183335.416671867-01-01T00:00:00.000
973NaNNaNFell{'type': 'Point', 'coordinates': [-134.20139, ...2378210000.0Tagish LakeValidC2-ung59.70444-134.201392000-01-01T00:00:00.000
974NaNNaNFell{'type': 'Point', 'coordinates': [137.305, 34....237841000.0TaharaValidH4/534.72000137.305001991-01-01T00:00:00.000
975NaNNaNFell{'type': 'Point', 'coordinates': [134.9, 35.38...23789720.0TakenouchiValidH535.38333134.900001880-01-01T00:00:00.000
976NaNNaNFellNaN237911421.0TalampayaValidEucrite-cmNaNNaN1995-01-01T00:00:00.000
977NaNNaNFell{'type': 'Point', 'coordinates': [112.76667, -...2379510500.0TambakwatuValidL6-7.75000112.766671975-01-01T00:00:00.000
978NaNNaNFell{'type': 'Point', 'coordinates': [-7.015, 31.1...48691100000.0TamdakhtValidH531.16333-7.015002008-01-01T00:00:00.000
979NaNNaNFell{'type': 'Point', 'coordinates': [136.23333, 3...23801905.0TanéValidL535.43333136.233331918-01-01T00:00:00.000
980NaNNaNFell{'type': 'Point', 'coordinates': [122.9, 45.4]}238733850.0TaonanValidL545.40000122.900001965-01-01T00:00:00.000
981NaNNaNFell{'type': 'Point', 'coordinates': [10.41667, 32...2388412000.0TatahouineValidDiogenite32.9500010.416671931-01-01T00:00:00.000
982NaNNaNFell{'type': 'Point', 'coordinates': [43.73333, 19...238852500.0TathlithValidL619.3833343.733331967-01-01T00:00:00.000
983NaNNaNFell{'type': 'Point', 'coordinates': [44.45, 35.13...238876000.0TaukValidL635.1333344.450001929-01-01T00:00:00.000
984NaNNaNFell{'type': 'Point', 'coordinates': [23.5, 46.716...2388821000.0TautiValidL646.7166723.500001937-01-01T00:00:00.000
985NaNNaNFell{'type': 'Point', 'coordinates': [142.95, -25....23897160000.0TenhamValidL6-25.73333142.950001879-01-01T00:00:00.000
986NaNNaNFell{'type': 'Point', 'coordinates': [26.95, 58.03...2389828500.0TennasilmValidL458.0333326.950001872-01-01T00:00:00.000
987NaNNaNFell{'type': 'Point', 'coordinates': [70.6, 33.4]}23908342.0ThalValidH633.4000070.600001950-01-01T00:00:00.000
988NaNNaNFell{'type': 'Point', 'coordinates': [37.15028, -1...5449314200.0ThikaValidL6-1.0027837.150282011-01-01T00:00:00.000
989NaNNaNFell{'type': 'Point', 'coordinates': [27.58333, -2...2397645300.0ThuatheValidH4/5-29.3333327.583332002-01-01T00:00:00.000
990NaNNaNFell{'type': 'Point', 'coordinates': [118.99, 32.9...239842232.0TianzhangValidH532.94667118.990001986-01-01T00:00:00.000
991NaNNaNFell{'type': 'Point', 'coordinates': [17.11667, 49...2398928000.0TieschitzValidH/L3.649.6000017.116671878-01-01T00:00:00.000
99234.01762.0Fell{'type': 'Point', 'coordinates': [-89.68333, 3...2399874800.0TildenValidL638.20000-89.683331927-01-01T00:00:00.000
993NaNNaNFell{'type': 'Point', 'coordinates': [1.53333, 14....239993000.0TillaberiValidL614.250001.533331970-01-01T00:00:00.000
994NaNNaNFell{'type': 'Point', 'coordinates': [35.2, 54.5]}2400465500.0TimochinValidH554.5000035.200001807-01-01T00:00:00.000
995NaNNaNFell{'type': 'Point', 'coordinates': [79.41667, 13...24009230.0TirupatiValidH613.6333379.416671934-01-01T00:00:00.000
996NaNNaNFell{'type': 'Point', 'coordinates': [-7.61123, 29...548237000.0TissintValidMartian (shergottite)29.48195-7.611232011-01-01T00:00:00.000
997NaNNaNFell{'type': 'Point', 'coordinates': [111.53333, -...2401120000.0TjabeValidH6-7.08333111.533331869-01-01T00:00:00.000
998NaNNaNFell{'type': 'Point', 'coordinates': [106.58333, -...2401216500.0TjerebonValidL5-6.66667106.583331922-01-01T00:00:00.000
999NaNNaNFell{'type': 'Point', 'coordinates': [34.76667, 47...24019600.0TomakovkaValidLL647.8500034.766671905-01-01T00:00:00.000
\n", + "

1000 rows × 12 columns

\n", + "
" + ], + "text/plain": [ + " :@computed_region_cbhk_fwbd :@computed_region_nnqa_25f4 fall \\\n", + "0 NaN NaN Fell \n", + "1 NaN NaN Fell \n", + "2 NaN NaN Fell \n", + "3 NaN NaN Fell \n", + "4 NaN NaN Fell \n", + "5 NaN NaN Fell \n", + "6 NaN NaN Fell \n", + "7 NaN NaN Fell \n", + "8 NaN NaN Fell \n", + "9 NaN NaN Fell \n", + "10 NaN NaN Fell \n", + "11 NaN NaN Fell \n", + "12 NaN NaN Fell \n", + "13 NaN NaN Fell \n", + "14 NaN NaN Fell \n", + "15 NaN NaN Fell \n", + "16 NaN NaN Fell \n", + "17 NaN NaN Fell \n", + "18 NaN NaN Fell \n", + "19 NaN NaN Fell \n", + "20 NaN NaN Fell \n", + "21 NaN NaN Fell \n", + "22 NaN NaN Fell \n", + "23 NaN NaN Fell \n", + "24 NaN NaN Fell \n", + "25 NaN NaN Fell \n", + "26 NaN NaN Fell \n", + "27 NaN NaN Fell \n", + "28 50.0 429.0 Fell \n", + "29 NaN NaN Fell \n", + ".. ... ... ... \n", + "970 29.0 1637.0 Fell \n", + "971 NaN NaN Fell \n", + "972 NaN NaN Fell \n", + "973 NaN NaN Fell \n", + "974 NaN NaN Fell \n", + "975 NaN NaN Fell \n", + "976 NaN NaN Fell \n", + "977 NaN NaN Fell \n", + "978 NaN NaN Fell \n", + "979 NaN NaN Fell \n", + "980 NaN NaN Fell \n", + "981 NaN NaN Fell \n", + "982 NaN NaN Fell \n", + "983 NaN NaN Fell \n", + "984 NaN NaN Fell \n", + "985 NaN NaN Fell \n", + "986 NaN NaN Fell \n", + "987 NaN NaN Fell \n", + "988 NaN NaN Fell \n", + "989 NaN NaN Fell \n", + "990 NaN NaN Fell \n", + "991 NaN NaN Fell \n", + "992 34.0 1762.0 Fell \n", + "993 NaN NaN Fell \n", + "994 NaN NaN Fell \n", + "995 NaN NaN Fell \n", + "996 NaN NaN Fell \n", + "997 NaN NaN Fell \n", + "998 NaN NaN Fell \n", + "999 NaN NaN Fell \n", + "\n", + " geolocation id mass \\\n", + "0 {'type': 'Point', 'coordinates': [6.08333, 50.... 1 21.0 \n", + "1 {'type': 'Point', 'coordinates': [10.23333, 56... 2 720.0 \n", + "2 {'type': 'Point', 'coordinates': [-113, 54.216... 6 107000.0 \n", + "3 {'type': 'Point', 'coordinates': [-99.9, 16.88... 10 1914.0 \n", + "4 {'type': 'Point', 'coordinates': [-64.95, -33.... 
370 780.0 \n", + "5 {'type': 'Point', 'coordinates': [71.8, 32.1]} 379 4239.0 \n", + "6 {'type': 'Point', 'coordinates': [95.16667, 44... 390 910.0 \n", + "7 {'type': 'Point', 'coordinates': [0.61667, 44.... 392 30000.0 \n", + "8 {'type': 'Point', 'coordinates': [-65.23333, -... 398 1620.0 \n", + "9 {'type': 'Point', 'coordinates': [-64.55, -30.... 417 1440.0 \n", + "10 {'type': 'Point', 'coordinates': [-9.57028, 16... 423 1000.0 \n", + "11 {'type': 'Point', 'coordinates': [8.38333, 19.... 424 24000.0 \n", + "12 {'type': 'Point', 'coordinates': [2.33333, 50.... 425 NaN \n", + "13 {'type': 'Point', 'coordinates': [35.05, 29.51... 426 779.0 \n", + "14 {'type': 'Point', 'coordinates': [77.95, 29.71... 427 1800.0 \n", + "15 {'type': 'Point', 'coordinates': [8.43333, 8.9... 432 3000.0 \n", + "16 {'type': 'Point', 'coordinates': [42.81667, 39... 433 50000.0 \n", + "17 {'type': 'Point', 'coordinates': [39.51667, 24... 446 160.0 \n", + "18 {'type': 'Point', 'coordinates': [28.96, 13.66... 447 700.0 \n", + "19 {'type': 'Point', 'coordinates': [4.08333, 44.... 448 6000.0 \n", + "20 {'type': 'Point', 'coordinates': [11.01667, 44... 453 2000.0 \n", + "21 {'type': 'Point', 'coordinates': [22.66667, 2]} 454 625.0 \n", + "22 {'type': 'Point', 'coordinates': [6.01533, 45.... 458 252.0 \n", + "23 {'type': 'Point', 'coordinates': [-1.78333, 51... 461 700.0 \n", + "24 {'type': 'Point', 'coordinates': [37.13333, 36... 462 3200.0 \n", + "25 {'type': 'Point', 'coordinates': [8.75, 44.883... 463 908.0 \n", + "26 {'type': 'Point', 'coordinates': [31.81667, 50... 465 9251.0 \n", + "27 {'type': 'Point', 'coordinates': [10.15, 45.26... 466 228000.0 \n", + "28 {'type': 'Point', 'coordinates': [-85.88333, 4... 2276 32000.0 \n", + "29 {'type': 'Point', 'coordinates': [-105.31667, ... 2278 2000000.0 \n", + ".. ... ... ... \n", + "970 {'type': 'Point', 'coordinates': [-86.2945, 33... 
23773 5560.0 \n", + "971 {'type': 'Point', 'coordinates': [14.65, 49.4]} 23776 7540.0 \n", + "972 {'type': 'Point', 'coordinates': [5.41667, 36.... 23778 9000.0 \n", + "973 {'type': 'Point', 'coordinates': [-134.20139, ... 23782 10000.0 \n", + "974 {'type': 'Point', 'coordinates': [137.305, 34.... 23784 1000.0 \n", + "975 {'type': 'Point', 'coordinates': [134.9, 35.38... 23789 720.0 \n", + "976 NaN 23791 1421.0 \n", + "977 {'type': 'Point', 'coordinates': [112.76667, -... 23795 10500.0 \n", + "978 {'type': 'Point', 'coordinates': [-7.015, 31.1... 48691 100000.0 \n", + "979 {'type': 'Point', 'coordinates': [136.23333, 3... 23801 905.0 \n", + "980 {'type': 'Point', 'coordinates': [122.9, 45.4]} 23873 3850.0 \n", + "981 {'type': 'Point', 'coordinates': [10.41667, 32... 23884 12000.0 \n", + "982 {'type': 'Point', 'coordinates': [43.73333, 19... 23885 2500.0 \n", + "983 {'type': 'Point', 'coordinates': [44.45, 35.13... 23887 6000.0 \n", + "984 {'type': 'Point', 'coordinates': [23.5, 46.716... 23888 21000.0 \n", + "985 {'type': 'Point', 'coordinates': [142.95, -25.... 23897 160000.0 \n", + "986 {'type': 'Point', 'coordinates': [26.95, 58.03... 23898 28500.0 \n", + "987 {'type': 'Point', 'coordinates': [70.6, 33.4]} 23908 342.0 \n", + "988 {'type': 'Point', 'coordinates': [37.15028, -1... 54493 14200.0 \n", + "989 {'type': 'Point', 'coordinates': [27.58333, -2... 23976 45300.0 \n", + "990 {'type': 'Point', 'coordinates': [118.99, 32.9... 23984 2232.0 \n", + "991 {'type': 'Point', 'coordinates': [17.11667, 49... 23989 28000.0 \n", + "992 {'type': 'Point', 'coordinates': [-89.68333, 3... 23998 74800.0 \n", + "993 {'type': 'Point', 'coordinates': [1.53333, 14.... 23999 3000.0 \n", + "994 {'type': 'Point', 'coordinates': [35.2, 54.5]} 24004 65500.0 \n", + "995 {'type': 'Point', 'coordinates': [79.41667, 13... 24009 230.0 \n", + "996 {'type': 'Point', 'coordinates': [-7.61123, 29... 54823 7000.0 \n", + "997 {'type': 'Point', 'coordinates': [111.53333, -... 
24011 20000.0 \n", + "998 {'type': 'Point', 'coordinates': [106.58333, -... 24012 16500.0 \n", + "999 {'type': 'Point', 'coordinates': [34.76667, 47... 24019 600.0 \n", + "\n", + " name nametype recclass reclat reclong \\\n", + "0 Aachen Valid L5 50.77500 6.08333 \n", + "1 Aarhus Valid H6 56.18333 10.23333 \n", + "2 Abee Valid EH4 54.21667 -113.00000 \n", + "3 Acapulco Valid Acapulcoite 16.88333 -99.90000 \n", + "4 Achiras Valid L6 -33.16667 -64.95000 \n", + "5 Adhi Kot Valid EH4 32.10000 71.80000 \n", + "6 Adzhi-Bogdo (stone) Valid LL3-6 44.83333 95.16667 \n", + "7 Agen Valid H5 44.21667 0.61667 \n", + "8 Aguada Valid L6 -31.60000 -65.23333 \n", + "9 Aguila Blanca Valid L -30.86667 -64.55000 \n", + "10 Aioun el Atrouss Valid Diogenite-pm 16.39806 -9.57028 \n", + "11 Aïr Valid L6 19.08333 8.38333 \n", + "12 Aire-sur-la-Lys Valid Unknown 50.66667 2.33333 \n", + "13 Akaba Valid L6 29.51667 35.05000 \n", + "14 Akbarpur Valid H4 29.71667 77.95000 \n", + "15 Akwanga Valid H 8.91667 8.43333 \n", + "16 Akyumak Valid Iron, IVA 39.91667 42.81667 \n", + "17 Al Rais Valid CR2-an 24.41667 39.51667 \n", + "18 Al Zarnkh Valid LL5 13.66033 28.96000 \n", + "19 Alais Valid CI1 44.11667 4.08333 \n", + "20 Albareto Valid L/LL4 44.65000 11.01667 \n", + "21 Alberta Valid L 2.00000 22.66667 \n", + "22 Alby sur Chéran Valid Eucrite-mmict 45.82133 6.01533 \n", + "23 Aldsworth Valid LL5 51.78333 -1.78333 \n", + "24 Aleppo Valid L6 36.23333 37.13333 \n", + "25 Alessandria Valid H5 44.88333 8.75000 \n", + "26 Alexandrovsky Valid H4 50.95000 31.81667 \n", + "27 Alfianello Valid L6 45.26667 10.15000 \n", + "28 Allegan Valid H5 42.53333 -85.88333 \n", + "29 Allende Valid CV3 26.96667 -105.31667 \n", + ".. ... ... ... ... ... 
\n", + "970 Sylacauga Valid H4 33.18836 -86.29450 \n", + "971 Tabor Valid H5 49.40000 14.65000 \n", + "972 Tadjera Valid L5 36.18333 5.41667 \n", + "973 Tagish Lake Valid C2-ung 59.70444 -134.20139 \n", + "974 Tahara Valid H4/5 34.72000 137.30500 \n", + "975 Takenouchi Valid H5 35.38333 134.90000 \n", + "976 Talampaya Valid Eucrite-cm NaN NaN \n", + "977 Tambakwatu Valid L6 -7.75000 112.76667 \n", + "978 Tamdakht Valid H5 31.16333 -7.01500 \n", + "979 Tané Valid L5 35.43333 136.23333 \n", + "980 Taonan Valid L5 45.40000 122.90000 \n", + "981 Tatahouine Valid Diogenite 32.95000 10.41667 \n", + "982 Tathlith Valid L6 19.38333 43.73333 \n", + "983 Tauk Valid L6 35.13333 44.45000 \n", + "984 Tauti Valid L6 46.71667 23.50000 \n", + "985 Tenham Valid L6 -25.73333 142.95000 \n", + "986 Tennasilm Valid L4 58.03333 26.95000 \n", + "987 Thal Valid H6 33.40000 70.60000 \n", + "988 Thika Valid L6 -1.00278 37.15028 \n", + "989 Thuathe Valid H4/5 -29.33333 27.58333 \n", + "990 Tianzhang Valid H5 32.94667 118.99000 \n", + "991 Tieschitz Valid H/L3.6 49.60000 17.11667 \n", + "992 Tilden Valid L6 38.20000 -89.68333 \n", + "993 Tillaberi Valid L6 14.25000 1.53333 \n", + "994 Timochin Valid H5 54.50000 35.20000 \n", + "995 Tirupati Valid H6 13.63333 79.41667 \n", + "996 Tissint Valid Martian (shergottite) 29.48195 -7.61123 \n", + "997 Tjabe Valid H6 -7.08333 111.53333 \n", + "998 Tjerebon Valid L5 -6.66667 106.58333 \n", + "999 Tomakovka Valid LL6 47.85000 34.76667 \n", + "\n", + " year \n", + "0 1880-01-01T00:00:00.000 \n", + "1 1951-01-01T00:00:00.000 \n", + "2 1952-01-01T00:00:00.000 \n", + "3 1976-01-01T00:00:00.000 \n", + "4 1902-01-01T00:00:00.000 \n", + "5 1919-01-01T00:00:00.000 \n", + "6 1949-01-01T00:00:00.000 \n", + "7 1814-01-01T00:00:00.000 \n", + "8 1930-01-01T00:00:00.000 \n", + "9 1920-01-01T00:00:00.000 \n", + "10 1974-01-01T00:00:00.000 \n", + "11 1925-01-01T00:00:00.000 \n", + "12 1769-01-01T00:00:00.000 \n", + "13 1949-01-01T00:00:00.000 \n", + "14 
1838-01-01T00:00:00.000 \n", + "15 1959-01-01T00:00:00.000 \n", + "16 1981-01-01T00:00:00.000 \n", + "17 1957-01-01T00:00:00.000 \n", + "18 2001-01-01T00:00:00.000 \n", + "19 1806-01-01T00:00:00.000 \n", + "20 1766-01-01T00:00:00.000 \n", + "21 1949-01-01T00:00:00.000 \n", + "22 2002-01-01T00:00:00.000 \n", + "23 1835-01-01T00:00:00.000 \n", + "24 1873-01-01T00:00:00.000 \n", + "25 1860-01-01T00:00:00.000 \n", + "26 1900-01-01T00:00:00.000 \n", + "27 1883-01-01T00:00:00.000 \n", + "28 1899-01-01T00:00:00.000 \n", + "29 1969-01-01T00:00:00.000 \n", + ".. ... \n", + "970 1954-01-01T00:00:00.000 \n", + "971 1753-01-01T00:00:00.000 \n", + "972 1867-01-01T00:00:00.000 \n", + "973 2000-01-01T00:00:00.000 \n", + "974 1991-01-01T00:00:00.000 \n", + "975 1880-01-01T00:00:00.000 \n", + "976 1995-01-01T00:00:00.000 \n", + "977 1975-01-01T00:00:00.000 \n", + "978 2008-01-01T00:00:00.000 \n", + "979 1918-01-01T00:00:00.000 \n", + "980 1965-01-01T00:00:00.000 \n", + "981 1931-01-01T00:00:00.000 \n", + "982 1967-01-01T00:00:00.000 \n", + "983 1929-01-01T00:00:00.000 \n", + "984 1937-01-01T00:00:00.000 \n", + "985 1879-01-01T00:00:00.000 \n", + "986 1872-01-01T00:00:00.000 \n", + "987 1950-01-01T00:00:00.000 \n", + "988 2011-01-01T00:00:00.000 \n", + "989 2002-01-01T00:00:00.000 \n", + "990 1986-01-01T00:00:00.000 \n", + "991 1878-01-01T00:00:00.000 \n", + "992 1927-01-01T00:00:00.000 \n", + "993 1970-01-01T00:00:00.000 \n", + "994 1807-01-01T00:00:00.000 \n", + "995 1934-01-01T00:00:00.000 \n", + "996 2011-01-01T00:00:00.000 \n", + "997 1869-01-01T00:00:00.000 \n", + "998 1922-01-01T00:00:00.000 \n", + "999 1905-01-01T00:00:00.000 \n", + "\n", + "[1000 rows x 12 columns]" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Your code here:\n", + "nasa = pd.read_json(json_data, orient='records')\n", + "nasa" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Now that we have loaded the data, let's 
examine it using the `head()` function." + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
:@computed_region_cbhk_fwbd:@computed_region_nnqa_25f4fallgeolocationidmassnamenametyperecclassreclatreclongyear
0NaNNaNFell{'type': 'Point', 'coordinates': [6.08333, 50....121.0AachenValidL550.775006.083331880-01-01T00:00:00.000
1NaNNaNFell{'type': 'Point', 'coordinates': [10.23333, 56...2720.0AarhusValidH656.1833310.233331951-01-01T00:00:00.000
2NaNNaNFell{'type': 'Point', 'coordinates': [-113, 54.216...6107000.0AbeeValidEH454.21667-113.000001952-01-01T00:00:00.000
3NaNNaNFell{'type': 'Point', 'coordinates': [-99.9, 16.88...101914.0AcapulcoValidAcapulcoite16.88333-99.900001976-01-01T00:00:00.000
4NaNNaNFell{'type': 'Point', 'coordinates': [-64.95, -33....370780.0AchirasValidL6-33.16667-64.950001902-01-01T00:00:00.000
\n", + "
" + ], + "text/plain": [ + " :@computed_region_cbhk_fwbd :@computed_region_nnqa_25f4 fall \\\n", + "0 NaN NaN Fell \n", + "1 NaN NaN Fell \n", + "2 NaN NaN Fell \n", + "3 NaN NaN Fell \n", + "4 NaN NaN Fell \n", + "\n", + " geolocation id mass name \\\n", + "0 {'type': 'Point', 'coordinates': [6.08333, 50.... 1 21.0 Aachen \n", + "1 {'type': 'Point', 'coordinates': [10.23333, 56... 2 720.0 Aarhus \n", + "2 {'type': 'Point', 'coordinates': [-113, 54.216... 6 107000.0 Abee \n", + "3 {'type': 'Point', 'coordinates': [-99.9, 16.88... 10 1914.0 Acapulco \n", + "4 {'type': 'Point', 'coordinates': [-64.95, -33.... 370 780.0 Achiras \n", + "\n", + " nametype recclass reclat reclong year \n", + "0 Valid L5 50.77500 6.08333 1880-01-01T00:00:00.000 \n", + "1 Valid H6 56.18333 10.23333 1951-01-01T00:00:00.000 \n", + "2 Valid EH4 54.21667 -113.00000 1952-01-01T00:00:00.000 \n", + "3 Valid Acapulcoite 16.88333 -99.90000 1976-01-01T00:00:00.000 \n", + "4 Valid L6 -33.16667 -64.95000 1902-01-01T00:00:00.000 " + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Your code here:\n", + "#.head() shows the first 5 rows by default.\n", + "nasa.head()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### The `value_counts()` function is commonly used in pandas to find the frequency of every value in a column.\n", + "\n", + "In the cell below, use the `value_counts()` function to determine the frequency of all types of asteroid landings by applying the function to the `fall` column." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Fell 996\n", + "Found 4\n", + "Name: fall, dtype: int64" + ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Your code here:\n", + "fall_count = nasa['fall']\n", + "fall_count.value_counts()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Finally, let's save the dataframe as a json file again. Since we downloaded the file from an online source, the goal of saving the dataframe is to have a local copy. Save the dataframe using the `orient=records` argument and name the file `nasa.json`." + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [], + "source": [ + "# Your code here:\n", + "nasa.to_json('nasa.json', orient='records')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Challenge 2 - Working with CSV and Other Separated Files\n", + "\n", + "csv files are more commonly used as dataframes. In the cell below, load the file from the URL provided using the `read_csv()` function in pandas. Starting with version 0.19 of pandas, you can load a csv file into a dataframe directly from a URL without having to load the file first like we did with the JSON URL. The dataset we will be using contains information about NASA shuttles. \n", + "\n", + "In the cell below, we define the column names and the URL of the data. Following this cell, read the tst file to a variable called `shuttle`. Since the file does not contain the column names, you must add them yourself using the column names declared in `cols` using the `names` argument. Additionally, a tst file is space separated, make sure you pass ` sep=' '` to the function." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": {}, + "outputs": [], + "source": [ + "# Run this code:\n", + "cols = ['time', 'rad_flow', 'fpv_close', 'fpv_open', 'high', 'bypass', 'bpv_close', 'bpv_open', 'class']\n", + "tst_url = 'https://archive.ics.uci.edu/ml/machine-learning-databases/statlog/shuttle/shuttle.tst'" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "metadata": {}, + "outputs": [], + "source": [ + "# Your code here:\n", + "shuttle = pd.read_csv(tst_url, sep=' ', names=cols)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Let's verify that this worked by looking at the `head()` function." + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
timerad_flowfpv_closefpv_openhighbypassbpv_closebpv_openclass
550810-6112588644
56096052-4404444
50-189-7500394021
53979042-22537124
55282054-6262821
\n", + "
" + ], + "text/plain": [ + " time rad_flow fpv_close fpv_open high bypass bpv_close bpv_open \\\n", + "55 0 81 0 -6 11 25 88 64 \n", + "56 0 96 0 52 -4 40 44 4 \n", + "50 -1 89 -7 50 0 39 40 2 \n", + "53 9 79 0 42 -2 25 37 12 \n", + "55 2 82 0 54 -6 26 28 2 \n", + "\n", + " class \n", + "55 4 \n", + "56 4 \n", + "50 1 \n", + "53 4 \n", + "55 1 " + ] + }, + "execution_count": 21, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Your code here:\n", + "shuttle.head()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "To make life easier for us, let's turn this dataframe into a comma separated file by saving it using the `to_csv()` function. Save `shuttle` into the file `shuttle.csv` and ensure the file is comma separated and that we are not saving the index column." + ] + }, + { + "cell_type": "code", + "execution_count": 22, + "metadata": {}, + "outputs": [], + "source": [ + "# Your code here:\n", + "shuttle.to_csv('shuttle.csv', index=False)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Challenge 3 - Working with Excel Files\n", + "\n", + "We can also use pandas to convert excel spreadsheets to dataframes. Let's use the `read_excel()` function. In this case, `astronauts.xls` is in the same folder that contains this notebook. Read this file into a variable called `astronaut`. \n", + "\n", + "Note: Make sure to install the `xlrd` library if it is not yet installed." + ] + }, + { + "cell_type": "code", + "execution_count": 24, + "metadata": {}, + "outputs": [], + "source": [ + "# Your code here:\n", + "astronaut = pd.read_excel('astronauts.xls')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Use the `head()` function to inspect the dataframe." + ] + }, + { + "cell_type": "code", + "execution_count": 25, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NameYearGroupStatusBirth DateBirth PlaceGenderAlma MaterUndergraduate MajorGraduate MajorMilitary RankMilitary BranchSpace FlightsSpace Flight (hr)Space WalksSpace Walks (hr)MissionsDeath DateDeath Mission
0Joseph M. Acaba2004.019.0Active1967-05-17Inglewood, CAMaleUniversity of California-Santa Barbara; Univer...GeologyGeologyNaNNaN23307213.0STS-119 (Discovery), ISS-31/32 (Soyuz)NaTNaN
1Loren W. ActonNaNNaNRetired1936-03-07Lewiston, MTMaleMontana State University; University of ColoradoEngineering PhysicsSolar PhysicsNaNNaN119000.0STS 51-F (Challenger)NaTNaN
2James C. Adamson1984.010.0Retired1946-03-03Warsaw, NYMaleUS Military Academy; Princeton UniversityEngineeringAerospace EngineeringColonelUS Army (Retired)233400.0STS-28 (Columbia), STS-43 (Atlantis)NaTNaN
3Thomas D. Akers1987.012.0Retired1951-05-20St. Louis, MOMaleUniversity of Missouri-RollaApplied MathematicsApplied MathematicsColonelUS Air Force (Retired)4814429.0STS-41 (Discovery), STS-49 (Endeavor), STS-61 ...NaTNaN
4Buzz Aldrin1963.03.0Retired1930-01-20Montclair, NJMaleUS Military Academy; MITMechanical EngineeringAstronauticsColonelUS Air Force (Retired)228928.0Gemini 12, Apollo 11NaTNaN
\n", + "
" + ], + "text/plain": [ + " Name Year Group Status Birth Date Birth Place Gender \\\n", + "0 Joseph M. Acaba 2004.0 19.0 Active 1967-05-17 Inglewood, CA Male \n", + "1 Loren W. Acton NaN NaN Retired 1936-03-07 Lewiston, MT Male \n", + "2 James C. Adamson 1984.0 10.0 Retired 1946-03-03 Warsaw, NY Male \n", + "3 Thomas D. Akers 1987.0 12.0 Retired 1951-05-20 St. Louis, MO Male \n", + "4 Buzz Aldrin 1963.0 3.0 Retired 1930-01-20 Montclair, NJ Male \n", + "\n", + " Alma Mater Undergraduate Major \\\n", + "0 University of California-Santa Barbara; Univer... Geology \n", + "1 Montana State University; University of Colorado Engineering Physics \n", + "2 US Military Academy; Princeton University Engineering \n", + "3 University of Missouri-Rolla Applied Mathematics \n", + "4 US Military Academy; MIT Mechanical Engineering \n", + "\n", + " Graduate Major Military Rank Military Branch Space Flights \\\n", + "0 Geology NaN NaN 2 \n", + "1 Solar Physics NaN NaN 1 \n", + "2 Aerospace Engineering Colonel US Army (Retired) 2 \n", + "3 Applied Mathematics Colonel US Air Force (Retired) 4 \n", + "4 Astronautics Colonel US Air Force (Retired) 2 \n", + "\n", + " Space Flight (hr) Space Walks Space Walks (hr) \\\n", + "0 3307 2 13.0 \n", + "1 190 0 0.0 \n", + "2 334 0 0.0 \n", + "3 814 4 29.0 \n", + "4 289 2 8.0 \n", + "\n", + " Missions Death Date Death Mission \n", + "0 STS-119 (Discovery), ISS-31/32 (Soyuz) NaT NaN \n", + "1 STS 51-F (Challenger) NaT NaN \n", + "2 STS-28 (Columbia), STS-43 (Atlantis) NaT NaN \n", + "3 STS-41 (Discovery), STS-49 (Endeavor), STS-61 ... NaT NaN \n", + "4 Gemini 12, Apollo 11 NaT NaN " + ] + }, + "execution_count": 25, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Your code here:\n", + "astronaut.head()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Use the `value_counts()` function to find the most popular undergraduate major among all astronauts." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 30, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Physics 35\n", + "Aerospace Engineering 33\n", + "Mechanical Engineering 30\n", + "Aeronautical Engineering 28\n", + "Electrical Engineering 23\n", + "Engineering Science 13\n", + "Engineering 12\n", + "Mathematics 11\n", + "Chemistry 10\n", + "Naval Sciences 9\n", + "Chemical Engineering 9\n", + "Astronautical Engineering 8\n", + "Aeronautical & Astronautical Engineering 6\n", + "Biology 5\n", + "Mathematics & Physics 5\n", + "Geology 5\n", + "Civil Engineering 5\n", + "Physics & Astronomy 4\n", + "Applied Science & Engineering 4\n", + "Engineering Physics 3\n", + "Computer Science 3\n", + "Aeronautics & Astronautics 3\n", + "Applied Mathematics 3\n", + "Chemistry & Biology 2\n", + "Engineering Mechanics 2\n", + "Engineering Management 2\n", + "Education 2\n", + "Physics & Mathematics 2\n", + "Biological Science 2\n", + "Zoology 2\n", + " ..\n", + "Nuclear Engineering 1\n", + "Earth Sciences 1\n", + "Mathematical & Electrical Science 1\n", + "Chemistry; Physiological Optics 1\n", + "Systems Engineering 1\n", + "Mathematics & Statistics; Chemistry 1\n", + "Business Finance 1\n", + "Biochemistry 1\n", + "Physiology 1\n", + "Military Science 1\n", + "Economics 1\n", + "Molecular Biology 1\n", + "Animal Science 1\n", + "Aerospace Engineering & Mechanics 1\n", + "Electrical Science 1\n", + "Mathematics & Economics 1\n", + "Computer & Systems Engineering 1\n", + "Solid Earth Sciences 1\n", + "Psychology 1\n", + "Physics & Astronautical Engineering 1\n", + "Business Economics 1\n", + "Ecological Science 1\n", + "Military Engineering 1\n", + "Mathematics; Russian 1\n", + "Applied Biology; Mechanical Engineering 1\n", + "Aeronautics & Astronautics; Earth, Atmospheric & Planetary Sciences 1\n", + "Ceramic Engineering 1\n", + "Animal Nutrition 1\n", + "Bioscience 1\n", + "Electrical Engineering; Computer Science 1\n", + "Name: Undergraduate 
Major, Length: 83, dtype: int64" + ] + }, + "execution_count": 30, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Your code here:\n", + "undergrad_count = astronaut['Undergraduate Major']\n", + "undergrad_count.value_counts()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Due to all the commas present in the cells of this file, let's save it as a tab separated csv file. In the cell below, save `astronaut` as a tab separated file using the `to_csv` function. Call the file `astronaut.csv` and remember to remove the index column." + ] + }, + { + "cell_type": "code", + "execution_count": 31, + "metadata": {}, + "outputs": [], + "source": [ + "# Your code here:\n", + "astronaut.to_csv('astronaut.csv', sep=\"\\t\", index=False)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Bonus Challenge - Fertility Dataset\n", + "\n", + "Visit the following [URL](https://archive.ics.uci.edu/ml/datasets/Fertility) and retrieve the dataset as well as the column headers. Determine the correct separator and read the file into a variable called `fertility`. Examine the dataframe using the `head()` function." + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "metadata": {}, + "outputs": [], + "source": [ + "# Your code here:\n", + "column = [\n", + " 'Season in which the analysis was performed.',\n", + " 'Age at the time of analysis.',\n", + " 'Childish diseases',\n", + " 'Accident or serious trauma',\n", + " 'Surgical intervention',\n", + " 'High fevers in the last year',\n", + " 'Frequency of alcohol consumption',\n", + " 'Smoking habit',\n", + " 'Number of hours spent sitting per day',\n", + " 'Output: Diagnosis',\n", + "]\n", + "fertility = pd.read_csv('fertility_Diagnosis.txt', sep=',', names=column)" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Season in which the analysis was performed.Age at the time of analysis.Childish diseasesAccident or serious traumaSurgical interventionHigh fevers in the last yearFrequency of alcohol consumptionSmoking habitNumber of hours spent sitting per dayOutput: Diagnosis
0-0.330.6901100.800.88N
1-0.330.9410100.810.31O
2-0.330.5010001.0-10.50N
3-0.330.7501101.0-10.38N
4-0.330.6711000.8-10.50O
\n", + "
" + ], + "text/plain": [ + " Season in which the analysis was performed. Age at the time of analysis. \\\n", + "0 -0.33 0.69 \n", + "1 -0.33 0.94 \n", + "2 -0.33 0.50 \n", + "3 -0.33 0.75 \n", + "4 -0.33 0.67 \n", + "\n", + " Childish diseases Accident or serious trauma Surgical intervention \\\n", + "0 0 1 1 \n", + "1 1 0 1 \n", + "2 1 0 0 \n", + "3 0 1 1 \n", + "4 1 1 0 \n", + "\n", + " High fevers in the last year Frequency of alcohol consumption \\\n", + "0 0 0.8 \n", + "1 0 0.8 \n", + "2 0 1.0 \n", + "3 0 1.0 \n", + "4 0 0.8 \n", + "\n", + " Smoking habit Number of hours spent sitting per day Output: Diagnosis \n", + "0 0 0.88 N \n", + "1 1 0.31 O \n", + "2 -1 0.50 N \n", + "3 -1 0.38 N \n", + "4 -1 0.50 O " + ] + }, + "execution_count": 33, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "fertility.head()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.3" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/your-code/fertility_Diagnosis.txt b/your-code/fertility_Diagnosis.txt new file mode 100644 index 0000000..e3a341d --- /dev/null +++ b/your-code/fertility_Diagnosis.txt @@ -0,0 +1,100 @@ +-0.33,0.69,0,1,1,0,0.8,0,0.88,N +-0.33,0.94,1,0,1,0,0.8,1,0.31,O +-0.33,0.5,1,0,0,0,1,-1,0.5,N +-0.33,0.75,0,1,1,0,1,-1,0.38,N +-0.33,0.67,1,1,0,0,0.8,-1,0.5,O +-0.33,0.67,1,0,1,0,0.8,0,0.5,N +-0.33,0.67,0,0,0,-1,0.8,-1,0.44,N +-0.33,1,1,1,1,0,0.6,-1,0.38,N +1,0.64,0,0,1,0,0.8,-1,0.25,N +1,0.61,1,0,0,0,1,-1,0.25,N +1,0.67,1,1,0,-1,0.8,0,0.31,N +1,0.78,1,1,1,0,0.6,0,0.13,N +1,0.75,1,1,1,0,0.8,1,0.25,N 
+1,0.81,1,0,0,0,1,-1,0.38,N +1,0.94,1,1,1,0,0.2,-1,0.25,N +1,0.81,1,1,0,0,1,1,0.5,N +1,0.64,1,0,1,0,1,-1,0.38,N +1,0.69,1,0,1,0,0.8,-1,0.25,O +1,0.75,1,1,1,0,1,1,0.25,N +1,0.67,1,0,0,0,0.8,1,0.38,O +1,0.67,0,0,1,0,0.8,-1,0.25,N +1,0.75,1,0,0,0,0.6,0,0.25,N +1,0.67,1,1,0,0,0.8,-1,0.25,N +1,0.69,1,0,1,-1,1,-1,0.44,O +1,0.56,1,0,1,0,1,-1,0.63,N +1,0.67,1,0,0,0,1,-1,0.25,N +1,0.67,1,0,1,0,0.6,-1,0.38,O +1,0.78,1,1,0,1,0.6,-1,0.38,O +1,0.58,0,0,1,0,1,-1,0.19,N +1,0.67,0,0,1,0,0.6,0,0.5,O +1,0.61,1,0,1,0,1,-1,0.63,N +1,0.56,1,0,0,0,1,-1,0.44,N +1,0.64,0,0,0,0,1,-1,0.63,N +1,0.58,1,1,1,0,0.8,0,0.44,N +1,0.56,1,1,1,0,1,-1,0.63,N +-1,0.78,1,1,0,1,0.6,-1,0.38,N +-1,0.78,1,0,1,0,1,-1,0.25,N +-1,0.56,1,0,1,0,1,-1,0.63,N +-1,0.67,0,0,1,0,0.6,0,0.5,O +-1,0.69,1,0,0,0,1,-1,0.31,N +-1,0.53,1,1,1,0,0.8,1,0.5,N +-1,0.56,1,1,0,0,0.8,1,0.5,N +-1,0.58,1,0,1,-1,0.8,1,0.5,N +-1,0.56,1,0,0,0,1,-1,0.44,N +-1,0.53,1,1,0,1,1,0,0.31,N +-1,0.53,1,0,0,1,1,0,0.44,N +-0.33,0.56,1,0,0,0,1,-1,0.63,N +-0.33,0.72,1,1,0,0,0.6,1,0.19,N +-0.33,0.64,1,1,1,0,0.8,-1,0.31,N +-0.33,0.75,1,1,1,0,0.6,-1,0.19,N +-0.33,0.67,1,0,1,0,0.8,-1,0.19,N +-0.33,0.53,1,1,0,1,1,-1,0.75,N +-0.33,0.53,1,1,0,0,0.8,0,0.5,N +-0.33,0.58,1,1,1,-1,0.8,0,0.19,N +-0.33,0.61,1,0,1,0,1,-1,0.63,N +-0.33,0.58,1,0,1,0,0.8,1,0.19,N +-0.33,0.53,1,1,0,0,0.8,0,0.75,N +-0.33,0.69,1,1,1,-1,1,-1,0.75,N +-0.33,0.56,1,1,0,0,0.4,1,0.63,N +1,0.58,0,0,0,1,0.8,1,0.44,N +1,0.56,0,0,0,1,0.8,0,1,N +-1,0.64,1,0,0,1,1,1,0.25,N +-1,0.61,1,1,1,0,0.6,-1,0.38,N +-1,0.56,1,0,0,1,1,-1,0.5,N +-1,0.53,1,0,0,1,0.8,-1,0.31,N +-0.33,0.56,0,0,1,0,1,-1,0.56,N +-0.33,0.5,1,1,0,-1,0.8,0,0.88,N +-0.33,0.5,1,0,0,1,1,-1,0.47,N +-0.33,0.5,1,0,0,1,0.8,0,0.31,N +-0.33,0.5,1,0,1,-1,0.8,-1,0.5,N +-0.33,0.5,1,1,0,-1,0.8,0,0.88,O +0.33,0.69,1,0,0,1,1,-1,0.31,N +1,0.56,1,0,0,1,0.6,0,0.5,N +-1,0.5,1,0,0,1,0.8,-1,0.44,N +-1,0.53,1,0,0,1,0.8,-1,0.63,N +-1,0.78,1,0,1,1,1,1,0.25,N +-1,0.75,1,0,1,1,0.6,0,0.56,N +-1,0.72,1,1,1,1,0.8,-1,0.19,N +-1,0.53,1,1,0,1,0.8,-1,0.38,N 
+-1,1,1,0,1,1,0.6,0,0.25,N +-0.33,0.92,1,1,0,1,1,-1,0.63,N +-1,0.81,1,1,1,1,0.8,0,0.19,N +-0.33,0.92,1,0,0,1,0.6,-1,0.19,N +-0.33,0.86,1,1,1,1,1,-1,0.25,N +-0.33,0.78,1,0,0,1,1,1,0.06,O +-0.33,0.89,1,1,0,0,0.6,1,0.31,N +-0.33,0.75,1,1,1,0,0.6,1,0.25,N +-0.33,0.75,1,1,1,1,0.8,1,0.25,N +-0.33,0.83,1,1,1,0,1,-1,0.31,N +-0.33,0.81,1,1,1,0,1,1,0.38,N +-0.33,0.81,1,1,1,1,0.8,-1,0.38,N +0.33,0.78,1,0,0,0,1,1,0.06,N +0.33,0.75,1,1,0,0,0.8,-1,0.38,N +0.33,0.75,1,0,1,0,0.8,-1,0.44,O +1,0.58,1,0,0,0,0.6,1,0.5,N +-1,0.67,1,0,0,0,1,-1,0.5,N +-1,0.61,1,0,0,0,0.8,0,0.5,N +-1,0.67,1,1,1,0,1,-1,0.31,N +-1,0.64,1,0,1,0,1,0,0.19,N +-1,0.69,0,1,1,0,0.6,-1,0.19,N diff --git a/your-code/main.ipynb b/your-code/main.ipynb index 8dcaafa..eb9194a 100644 --- a/your-code/main.ipynb +++ b/your-code/main.ipynb @@ -26,7 +26,7 @@ "outputs": [], "source": [ "# Your import here:\n", - "\n" + "import pandas as pd" ] }, { @@ -62,12 +62,1230 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 4, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
:@computed_region_cbhk_fwbd:@computed_region_nnqa_25f4fallgeolocationidmassnamenametyperecclassreclatreclongyear
0NaNNaNFell{'type': 'Point', 'coordinates': [6.08333, 50....121.0AachenValidL550.775006.083331880-01-01T00:00:00.000
1NaNNaNFell{'type': 'Point', 'coordinates': [10.23333, 56...2720.0AarhusValidH656.1833310.233331951-01-01T00:00:00.000
2NaNNaNFell{'type': 'Point', 'coordinates': [-113, 54.216...6107000.0AbeeValidEH454.21667-113.000001952-01-01T00:00:00.000
3NaNNaNFell{'type': 'Point', 'coordinates': [-99.9, 16.88...101914.0AcapulcoValidAcapulcoite16.88333-99.900001976-01-01T00:00:00.000
4NaNNaNFell{'type': 'Point', 'coordinates': [-64.95, -33....370780.0AchirasValidL6-33.16667-64.950001902-01-01T00:00:00.000
5NaNNaNFell{'type': 'Point', 'coordinates': [71.8, 32.1]}3794239.0Adhi KotValidEH432.1000071.800001919-01-01T00:00:00.000
6NaNNaNFell{'type': 'Point', 'coordinates': [95.16667, 44...390910.0Adzhi-Bogdo (stone)ValidLL3-644.8333395.166671949-01-01T00:00:00.000
7NaNNaNFell{'type': 'Point', 'coordinates': [0.61667, 44....39230000.0AgenValidH544.216670.616671814-01-01T00:00:00.000
8NaNNaNFell{'type': 'Point', 'coordinates': [-65.23333, -...3981620.0AguadaValidL6-31.60000-65.233331930-01-01T00:00:00.000
9NaNNaNFell{'type': 'Point', 'coordinates': [-64.55, -30....4171440.0Aguila BlancaValidL-30.86667-64.550001920-01-01T00:00:00.000
10NaNNaNFell{'type': 'Point', 'coordinates': [-9.57028, 16...4231000.0Aioun el AtroussValidDiogenite-pm16.39806-9.570281974-01-01T00:00:00.000
11NaNNaNFell{'type': 'Point', 'coordinates': [8.38333, 19....42424000.0AïrValidL619.083338.383331925-01-01T00:00:00.000
12NaNNaNFell{'type': 'Point', 'coordinates': [2.33333, 50....425NaNAire-sur-la-LysValidUnknown50.666672.333331769-01-01T00:00:00.000
13NaNNaNFell{'type': 'Point', 'coordinates': [35.05, 29.51...426779.0AkabaValidL629.5166735.050001949-01-01T00:00:00.000
14NaNNaNFell{'type': 'Point', 'coordinates': [77.95, 29.71...4271800.0AkbarpurValidH429.7166777.950001838-01-01T00:00:00.000
15NaNNaNFell{'type': 'Point', 'coordinates': [8.43333, 8.9...4323000.0AkwangaValidH8.916678.433331959-01-01T00:00:00.000
16NaNNaNFell{'type': 'Point', 'coordinates': [42.81667, 39...43350000.0AkyumakValidIron, IVA39.9166742.816671981-01-01T00:00:00.000
17NaNNaNFell{'type': 'Point', 'coordinates': [39.51667, 24...446160.0Al RaisValidCR2-an24.4166739.516671957-01-01T00:00:00.000
18NaNNaNFell{'type': 'Point', 'coordinates': [28.96, 13.66...447700.0Al ZarnkhValidLL513.6603328.960002001-01-01T00:00:00.000
19NaNNaNFell{'type': 'Point', 'coordinates': [4.08333, 44....4486000.0AlaisValidCI144.116674.083331806-01-01T00:00:00.000
20NaNNaNFell{'type': 'Point', 'coordinates': [11.01667, 44...4532000.0AlbaretoValidL/LL444.6500011.016671766-01-01T00:00:00.000
21NaNNaNFell{'type': 'Point', 'coordinates': [22.66667, 2]}454625.0AlbertaValidL2.0000022.666671949-01-01T00:00:00.000
22NaNNaNFell{'type': 'Point', 'coordinates': [6.01533, 45....458252.0Alby sur ChéranValidEucrite-mmict45.821336.015332002-01-01T00:00:00.000
23NaNNaNFell{'type': 'Point', 'coordinates': [-1.78333, 51...461700.0AldsworthValidLL551.78333-1.783331835-01-01T00:00:00.000
24NaNNaNFell{'type': 'Point', 'coordinates': [37.13333, 36...4623200.0AleppoValidL636.2333337.133331873-01-01T00:00:00.000
25NaNNaNFell{'type': 'Point', 'coordinates': [8.75, 44.883...463908.0AlessandriaValidH544.883338.750001860-01-01T00:00:00.000
26NaNNaNFell{'type': 'Point', 'coordinates': [31.81667, 50...4659251.0AlexandrovskyValidH450.9500031.816671900-01-01T00:00:00.000
27NaNNaNFell{'type': 'Point', 'coordinates': [10.15, 45.26...466228000.0AlfianelloValidL645.2666710.150001883-01-01T00:00:00.000
2850.0429.0Fell{'type': 'Point', 'coordinates': [-85.88333, 4...227632000.0AlleganValidH542.53333-85.883331899-01-01T00:00:00.000
29NaNNaNFell{'type': 'Point', 'coordinates': [-105.31667, ...22782000000.0AllendeValidCV326.96667-105.316671969-01-01T00:00:00.000
.......................................
97029.01637.0Fell{'type': 'Point', 'coordinates': [-86.2945, 33...237735560.0SylacaugaValidH433.18836-86.294501954-01-01T00:00:00.000
971NaNNaNFell{'type': 'Point', 'coordinates': [14.65, 49.4]}237767540.0TaborValidH549.4000014.650001753-01-01T00:00:00.000
972NaNNaNFell{'type': 'Point', 'coordinates': [5.41667, 36....237789000.0TadjeraValidL536.183335.416671867-01-01T00:00:00.000
973NaNNaNFell{'type': 'Point', 'coordinates': [-134.20139, ...2378210000.0Tagish LakeValidC2-ung59.70444-134.201392000-01-01T00:00:00.000
974NaNNaNFell{'type': 'Point', 'coordinates': [137.305, 34....237841000.0TaharaValidH4/534.72000137.305001991-01-01T00:00:00.000
975NaNNaNFell{'type': 'Point', 'coordinates': [134.9, 35.38...23789720.0TakenouchiValidH535.38333134.900001880-01-01T00:00:00.000
976NaNNaNFellNaN237911421.0TalampayaValidEucrite-cmNaNNaN1995-01-01T00:00:00.000
977NaNNaNFell{'type': 'Point', 'coordinates': [112.76667, -...2379510500.0TambakwatuValidL6-7.75000112.766671975-01-01T00:00:00.000
978NaNNaNFell{'type': 'Point', 'coordinates': [-7.015, 31.1...48691100000.0TamdakhtValidH531.16333-7.015002008-01-01T00:00:00.000
979NaNNaNFell{'type': 'Point', 'coordinates': [136.23333, 3...23801905.0TanéValidL535.43333136.233331918-01-01T00:00:00.000
980NaNNaNFell{'type': 'Point', 'coordinates': [122.9, 45.4]}238733850.0TaonanValidL545.40000122.900001965-01-01T00:00:00.000
981NaNNaNFell{'type': 'Point', 'coordinates': [10.41667, 32...2388412000.0TatahouineValidDiogenite32.9500010.416671931-01-01T00:00:00.000
982NaNNaNFell{'type': 'Point', 'coordinates': [43.73333, 19...238852500.0TathlithValidL619.3833343.733331967-01-01T00:00:00.000
983NaNNaNFell{'type': 'Point', 'coordinates': [44.45, 35.13...238876000.0TaukValidL635.1333344.450001929-01-01T00:00:00.000
984NaNNaNFell{'type': 'Point', 'coordinates': [23.5, 46.716...2388821000.0TautiValidL646.7166723.500001937-01-01T00:00:00.000
985NaNNaNFell{'type': 'Point', 'coordinates': [142.95, -25....23897160000.0TenhamValidL6-25.73333142.950001879-01-01T00:00:00.000
986NaNNaNFell{'type': 'Point', 'coordinates': [26.95, 58.03...2389828500.0TennasilmValidL458.0333326.950001872-01-01T00:00:00.000
987NaNNaNFell{'type': 'Point', 'coordinates': [70.6, 33.4]}23908342.0ThalValidH633.4000070.600001950-01-01T00:00:00.000
988NaNNaNFell{'type': 'Point', 'coordinates': [37.15028, -1...5449314200.0ThikaValidL6-1.0027837.150282011-01-01T00:00:00.000
989NaNNaNFell{'type': 'Point', 'coordinates': [27.58333, -2...2397645300.0ThuatheValidH4/5-29.3333327.583332002-01-01T00:00:00.000
990NaNNaNFell{'type': 'Point', 'coordinates': [118.99, 32.9...239842232.0TianzhangValidH532.94667118.990001986-01-01T00:00:00.000
991NaNNaNFell{'type': 'Point', 'coordinates': [17.11667, 49...2398928000.0TieschitzValidH/L3.649.6000017.116671878-01-01T00:00:00.000
99234.01762.0Fell{'type': 'Point', 'coordinates': [-89.68333, 3...2399874800.0TildenValidL638.20000-89.683331927-01-01T00:00:00.000
993NaNNaNFell{'type': 'Point', 'coordinates': [1.53333, 14....239993000.0TillaberiValidL614.250001.533331970-01-01T00:00:00.000
994NaNNaNFell{'type': 'Point', 'coordinates': [35.2, 54.5]}2400465500.0TimochinValidH554.5000035.200001807-01-01T00:00:00.000
995NaNNaNFell{'type': 'Point', 'coordinates': [79.41667, 13...24009230.0TirupatiValidH613.6333379.416671934-01-01T00:00:00.000
996NaNNaNFell{'type': 'Point', 'coordinates': [-7.61123, 29...548237000.0TissintValidMartian (shergottite)29.48195-7.611232011-01-01T00:00:00.000
997NaNNaNFell{'type': 'Point', 'coordinates': [111.53333, -...2401120000.0TjabeValidH6-7.08333111.533331869-01-01T00:00:00.000
998NaNNaNFell{'type': 'Point', 'coordinates': [106.58333, -...2401216500.0TjerebonValidL5-6.66667106.583331922-01-01T00:00:00.000
999NaNNaNFell{'type': 'Point', 'coordinates': [34.76667, 47...24019600.0TomakovkaValidLL647.8500034.766671905-01-01T00:00:00.000
\n", + "

1000 rows × 12 columns

\n", + "
" + ], + "text/plain": [ + " :@computed_region_cbhk_fwbd :@computed_region_nnqa_25f4 fall \\\n", + "0 NaN NaN Fell \n", + "1 NaN NaN Fell \n", + "2 NaN NaN Fell \n", + "3 NaN NaN Fell \n", + "4 NaN NaN Fell \n", + "5 NaN NaN Fell \n", + "6 NaN NaN Fell \n", + "7 NaN NaN Fell \n", + "8 NaN NaN Fell \n", + "9 NaN NaN Fell \n", + "10 NaN NaN Fell \n", + "11 NaN NaN Fell \n", + "12 NaN NaN Fell \n", + "13 NaN NaN Fell \n", + "14 NaN NaN Fell \n", + "15 NaN NaN Fell \n", + "16 NaN NaN Fell \n", + "17 NaN NaN Fell \n", + "18 NaN NaN Fell \n", + "19 NaN NaN Fell \n", + "20 NaN NaN Fell \n", + "21 NaN NaN Fell \n", + "22 NaN NaN Fell \n", + "23 NaN NaN Fell \n", + "24 NaN NaN Fell \n", + "25 NaN NaN Fell \n", + "26 NaN NaN Fell \n", + "27 NaN NaN Fell \n", + "28 50.0 429.0 Fell \n", + "29 NaN NaN Fell \n", + ".. ... ... ... \n", + "970 29.0 1637.0 Fell \n", + "971 NaN NaN Fell \n", + "972 NaN NaN Fell \n", + "973 NaN NaN Fell \n", + "974 NaN NaN Fell \n", + "975 NaN NaN Fell \n", + "976 NaN NaN Fell \n", + "977 NaN NaN Fell \n", + "978 NaN NaN Fell \n", + "979 NaN NaN Fell \n", + "980 NaN NaN Fell \n", + "981 NaN NaN Fell \n", + "982 NaN NaN Fell \n", + "983 NaN NaN Fell \n", + "984 NaN NaN Fell \n", + "985 NaN NaN Fell \n", + "986 NaN NaN Fell \n", + "987 NaN NaN Fell \n", + "988 NaN NaN Fell \n", + "989 NaN NaN Fell \n", + "990 NaN NaN Fell \n", + "991 NaN NaN Fell \n", + "992 34.0 1762.0 Fell \n", + "993 NaN NaN Fell \n", + "994 NaN NaN Fell \n", + "995 NaN NaN Fell \n", + "996 NaN NaN Fell \n", + "997 NaN NaN Fell \n", + "998 NaN NaN Fell \n", + "999 NaN NaN Fell \n", + "\n", + " geolocation id mass \\\n", + "0 {'type': 'Point', 'coordinates': [6.08333, 50.... 1 21.0 \n", + "1 {'type': 'Point', 'coordinates': [10.23333, 56... 2 720.0 \n", + "2 {'type': 'Point', 'coordinates': [-113, 54.216... 6 107000.0 \n", + "3 {'type': 'Point', 'coordinates': [-99.9, 16.88... 10 1914.0 \n", + "4 {'type': 'Point', 'coordinates': [-64.95, -33.... 
370 780.0 \n", + "5 {'type': 'Point', 'coordinates': [71.8, 32.1]} 379 4239.0 \n", + "6 {'type': 'Point', 'coordinates': [95.16667, 44... 390 910.0 \n", + "7 {'type': 'Point', 'coordinates': [0.61667, 44.... 392 30000.0 \n", + "8 {'type': 'Point', 'coordinates': [-65.23333, -... 398 1620.0 \n", + "9 {'type': 'Point', 'coordinates': [-64.55, -30.... 417 1440.0 \n", + "10 {'type': 'Point', 'coordinates': [-9.57028, 16... 423 1000.0 \n", + "11 {'type': 'Point', 'coordinates': [8.38333, 19.... 424 24000.0 \n", + "12 {'type': 'Point', 'coordinates': [2.33333, 50.... 425 NaN \n", + "13 {'type': 'Point', 'coordinates': [35.05, 29.51... 426 779.0 \n", + "14 {'type': 'Point', 'coordinates': [77.95, 29.71... 427 1800.0 \n", + "15 {'type': 'Point', 'coordinates': [8.43333, 8.9... 432 3000.0 \n", + "16 {'type': 'Point', 'coordinates': [42.81667, 39... 433 50000.0 \n", + "17 {'type': 'Point', 'coordinates': [39.51667, 24... 446 160.0 \n", + "18 {'type': 'Point', 'coordinates': [28.96, 13.66... 447 700.0 \n", + "19 {'type': 'Point', 'coordinates': [4.08333, 44.... 448 6000.0 \n", + "20 {'type': 'Point', 'coordinates': [11.01667, 44... 453 2000.0 \n", + "21 {'type': 'Point', 'coordinates': [22.66667, 2]} 454 625.0 \n", + "22 {'type': 'Point', 'coordinates': [6.01533, 45.... 458 252.0 \n", + "23 {'type': 'Point', 'coordinates': [-1.78333, 51... 461 700.0 \n", + "24 {'type': 'Point', 'coordinates': [37.13333, 36... 462 3200.0 \n", + "25 {'type': 'Point', 'coordinates': [8.75, 44.883... 463 908.0 \n", + "26 {'type': 'Point', 'coordinates': [31.81667, 50... 465 9251.0 \n", + "27 {'type': 'Point', 'coordinates': [10.15, 45.26... 466 228000.0 \n", + "28 {'type': 'Point', 'coordinates': [-85.88333, 4... 2276 32000.0 \n", + "29 {'type': 'Point', 'coordinates': [-105.31667, ... 2278 2000000.0 \n", + ".. ... ... ... \n", + "970 {'type': 'Point', 'coordinates': [-86.2945, 33... 
23773 5560.0 \n", + "971 {'type': 'Point', 'coordinates': [14.65, 49.4]} 23776 7540.0 \n", + "972 {'type': 'Point', 'coordinates': [5.41667, 36.... 23778 9000.0 \n", + "973 {'type': 'Point', 'coordinates': [-134.20139, ... 23782 10000.0 \n", + "974 {'type': 'Point', 'coordinates': [137.305, 34.... 23784 1000.0 \n", + "975 {'type': 'Point', 'coordinates': [134.9, 35.38... 23789 720.0 \n", + "976 NaN 23791 1421.0 \n", + "977 {'type': 'Point', 'coordinates': [112.76667, -... 23795 10500.0 \n", + "978 {'type': 'Point', 'coordinates': [-7.015, 31.1... 48691 100000.0 \n", + "979 {'type': 'Point', 'coordinates': [136.23333, 3... 23801 905.0 \n", + "980 {'type': 'Point', 'coordinates': [122.9, 45.4]} 23873 3850.0 \n", + "981 {'type': 'Point', 'coordinates': [10.41667, 32... 23884 12000.0 \n", + "982 {'type': 'Point', 'coordinates': [43.73333, 19... 23885 2500.0 \n", + "983 {'type': 'Point', 'coordinates': [44.45, 35.13... 23887 6000.0 \n", + "984 {'type': 'Point', 'coordinates': [23.5, 46.716... 23888 21000.0 \n", + "985 {'type': 'Point', 'coordinates': [142.95, -25.... 23897 160000.0 \n", + "986 {'type': 'Point', 'coordinates': [26.95, 58.03... 23898 28500.0 \n", + "987 {'type': 'Point', 'coordinates': [70.6, 33.4]} 23908 342.0 \n", + "988 {'type': 'Point', 'coordinates': [37.15028, -1... 54493 14200.0 \n", + "989 {'type': 'Point', 'coordinates': [27.58333, -2... 23976 45300.0 \n", + "990 {'type': 'Point', 'coordinates': [118.99, 32.9... 23984 2232.0 \n", + "991 {'type': 'Point', 'coordinates': [17.11667, 49... 23989 28000.0 \n", + "992 {'type': 'Point', 'coordinates': [-89.68333, 3... 23998 74800.0 \n", + "993 {'type': 'Point', 'coordinates': [1.53333, 14.... 23999 3000.0 \n", + "994 {'type': 'Point', 'coordinates': [35.2, 54.5]} 24004 65500.0 \n", + "995 {'type': 'Point', 'coordinates': [79.41667, 13... 24009 230.0 \n", + "996 {'type': 'Point', 'coordinates': [-7.61123, 29... 54823 7000.0 \n", + "997 {'type': 'Point', 'coordinates': [111.53333, -... 
24011 20000.0 \n", + "998 {'type': 'Point', 'coordinates': [106.58333, -... 24012 16500.0 \n", + "999 {'type': 'Point', 'coordinates': [34.76667, 47... 24019 600.0 \n", + "\n", + " name nametype recclass reclat reclong \\\n", + "0 Aachen Valid L5 50.77500 6.08333 \n", + "1 Aarhus Valid H6 56.18333 10.23333 \n", + "2 Abee Valid EH4 54.21667 -113.00000 \n", + "3 Acapulco Valid Acapulcoite 16.88333 -99.90000 \n", + "4 Achiras Valid L6 -33.16667 -64.95000 \n", + "5 Adhi Kot Valid EH4 32.10000 71.80000 \n", + "6 Adzhi-Bogdo (stone) Valid LL3-6 44.83333 95.16667 \n", + "7 Agen Valid H5 44.21667 0.61667 \n", + "8 Aguada Valid L6 -31.60000 -65.23333 \n", + "9 Aguila Blanca Valid L -30.86667 -64.55000 \n", + "10 Aioun el Atrouss Valid Diogenite-pm 16.39806 -9.57028 \n", + "11 Aïr Valid L6 19.08333 8.38333 \n", + "12 Aire-sur-la-Lys Valid Unknown 50.66667 2.33333 \n", + "13 Akaba Valid L6 29.51667 35.05000 \n", + "14 Akbarpur Valid H4 29.71667 77.95000 \n", + "15 Akwanga Valid H 8.91667 8.43333 \n", + "16 Akyumak Valid Iron, IVA 39.91667 42.81667 \n", + "17 Al Rais Valid CR2-an 24.41667 39.51667 \n", + "18 Al Zarnkh Valid LL5 13.66033 28.96000 \n", + "19 Alais Valid CI1 44.11667 4.08333 \n", + "20 Albareto Valid L/LL4 44.65000 11.01667 \n", + "21 Alberta Valid L 2.00000 22.66667 \n", + "22 Alby sur Chéran Valid Eucrite-mmict 45.82133 6.01533 \n", + "23 Aldsworth Valid LL5 51.78333 -1.78333 \n", + "24 Aleppo Valid L6 36.23333 37.13333 \n", + "25 Alessandria Valid H5 44.88333 8.75000 \n", + "26 Alexandrovsky Valid H4 50.95000 31.81667 \n", + "27 Alfianello Valid L6 45.26667 10.15000 \n", + "28 Allegan Valid H5 42.53333 -85.88333 \n", + "29 Allende Valid CV3 26.96667 -105.31667 \n", + ".. ... ... ... ... ... 
\n", + "970 Sylacauga Valid H4 33.18836 -86.29450 \n", + "971 Tabor Valid H5 49.40000 14.65000 \n", + "972 Tadjera Valid L5 36.18333 5.41667 \n", + "973 Tagish Lake Valid C2-ung 59.70444 -134.20139 \n", + "974 Tahara Valid H4/5 34.72000 137.30500 \n", + "975 Takenouchi Valid H5 35.38333 134.90000 \n", + "976 Talampaya Valid Eucrite-cm NaN NaN \n", + "977 Tambakwatu Valid L6 -7.75000 112.76667 \n", + "978 Tamdakht Valid H5 31.16333 -7.01500 \n", + "979 Tané Valid L5 35.43333 136.23333 \n", + "980 Taonan Valid L5 45.40000 122.90000 \n", + "981 Tatahouine Valid Diogenite 32.95000 10.41667 \n", + "982 Tathlith Valid L6 19.38333 43.73333 \n", + "983 Tauk Valid L6 35.13333 44.45000 \n", + "984 Tauti Valid L6 46.71667 23.50000 \n", + "985 Tenham Valid L6 -25.73333 142.95000 \n", + "986 Tennasilm Valid L4 58.03333 26.95000 \n", + "987 Thal Valid H6 33.40000 70.60000 \n", + "988 Thika Valid L6 -1.00278 37.15028 \n", + "989 Thuathe Valid H4/5 -29.33333 27.58333 \n", + "990 Tianzhang Valid H5 32.94667 118.99000 \n", + "991 Tieschitz Valid H/L3.6 49.60000 17.11667 \n", + "992 Tilden Valid L6 38.20000 -89.68333 \n", + "993 Tillaberi Valid L6 14.25000 1.53333 \n", + "994 Timochin Valid H5 54.50000 35.20000 \n", + "995 Tirupati Valid H6 13.63333 79.41667 \n", + "996 Tissint Valid Martian (shergottite) 29.48195 -7.61123 \n", + "997 Tjabe Valid H6 -7.08333 111.53333 \n", + "998 Tjerebon Valid L5 -6.66667 106.58333 \n", + "999 Tomakovka Valid LL6 47.85000 34.76667 \n", + "\n", + " year \n", + "0 1880-01-01T00:00:00.000 \n", + "1 1951-01-01T00:00:00.000 \n", + "2 1952-01-01T00:00:00.000 \n", + "3 1976-01-01T00:00:00.000 \n", + "4 1902-01-01T00:00:00.000 \n", + "5 1919-01-01T00:00:00.000 \n", + "6 1949-01-01T00:00:00.000 \n", + "7 1814-01-01T00:00:00.000 \n", + "8 1930-01-01T00:00:00.000 \n", + "9 1920-01-01T00:00:00.000 \n", + "10 1974-01-01T00:00:00.000 \n", + "11 1925-01-01T00:00:00.000 \n", + "12 1769-01-01T00:00:00.000 \n", + "13 1949-01-01T00:00:00.000 \n", + "14 
1838-01-01T00:00:00.000 \n", + "15 1959-01-01T00:00:00.000 \n", + "16 1981-01-01T00:00:00.000 \n", + "17 1957-01-01T00:00:00.000 \n", + "18 2001-01-01T00:00:00.000 \n", + "19 1806-01-01T00:00:00.000 \n", + "20 1766-01-01T00:00:00.000 \n", + "21 1949-01-01T00:00:00.000 \n", + "22 2002-01-01T00:00:00.000 \n", + "23 1835-01-01T00:00:00.000 \n", + "24 1873-01-01T00:00:00.000 \n", + "25 1860-01-01T00:00:00.000 \n", + "26 1900-01-01T00:00:00.000 \n", + "27 1883-01-01T00:00:00.000 \n", + "28 1899-01-01T00:00:00.000 \n", + "29 1969-01-01T00:00:00.000 \n", + ".. ... \n", + "970 1954-01-01T00:00:00.000 \n", + "971 1753-01-01T00:00:00.000 \n", + "972 1867-01-01T00:00:00.000 \n", + "973 2000-01-01T00:00:00.000 \n", + "974 1991-01-01T00:00:00.000 \n", + "975 1880-01-01T00:00:00.000 \n", + "976 1995-01-01T00:00:00.000 \n", + "977 1975-01-01T00:00:00.000 \n", + "978 2008-01-01T00:00:00.000 \n", + "979 1918-01-01T00:00:00.000 \n", + "980 1965-01-01T00:00:00.000 \n", + "981 1931-01-01T00:00:00.000 \n", + "982 1967-01-01T00:00:00.000 \n", + "983 1929-01-01T00:00:00.000 \n", + "984 1937-01-01T00:00:00.000 \n", + "985 1879-01-01T00:00:00.000 \n", + "986 1872-01-01T00:00:00.000 \n", + "987 1950-01-01T00:00:00.000 \n", + "988 2011-01-01T00:00:00.000 \n", + "989 2002-01-01T00:00:00.000 \n", + "990 1986-01-01T00:00:00.000 \n", + "991 1878-01-01T00:00:00.000 \n", + "992 1927-01-01T00:00:00.000 \n", + "993 1970-01-01T00:00:00.000 \n", + "994 1807-01-01T00:00:00.000 \n", + "995 1934-01-01T00:00:00.000 \n", + "996 2011-01-01T00:00:00.000 \n", + "997 1869-01-01T00:00:00.000 \n", + "998 1922-01-01T00:00:00.000 \n", + "999 1905-01-01T00:00:00.000 \n", + "\n", + "[1000 rows x 12 columns]" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# Your code here:\n", - "\n" + "nasa = pd.read_json(json_data, orient='records')\n", + "nasa" ] }, { @@ -79,12 +1297,156 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 5, 
"metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
:@computed_region_cbhk_fwbd:@computed_region_nnqa_25f4fallgeolocationidmassnamenametyperecclassreclatreclongyear
0NaNNaNFell{'type': 'Point', 'coordinates': [6.08333, 50....121.0AachenValidL550.775006.083331880-01-01T00:00:00.000
1NaNNaNFell{'type': 'Point', 'coordinates': [10.23333, 56...2720.0AarhusValidH656.1833310.233331951-01-01T00:00:00.000
2NaNNaNFell{'type': 'Point', 'coordinates': [-113, 54.216...6107000.0AbeeValidEH454.21667-113.000001952-01-01T00:00:00.000
3NaNNaNFell{'type': 'Point', 'coordinates': [-99.9, 16.88...101914.0AcapulcoValidAcapulcoite16.88333-99.900001976-01-01T00:00:00.000
4NaNNaNFell{'type': 'Point', 'coordinates': [-64.95, -33....370780.0AchirasValidL6-33.16667-64.950001902-01-01T00:00:00.000
\n", + "
" + ], + "text/plain": [ + " :@computed_region_cbhk_fwbd :@computed_region_nnqa_25f4 fall \\\n", + "0 NaN NaN Fell \n", + "1 NaN NaN Fell \n", + "2 NaN NaN Fell \n", + "3 NaN NaN Fell \n", + "4 NaN NaN Fell \n", + "\n", + " geolocation id mass name \\\n", + "0 {'type': 'Point', 'coordinates': [6.08333, 50.... 1 21.0 Aachen \n", + "1 {'type': 'Point', 'coordinates': [10.23333, 56... 2 720.0 Aarhus \n", + "2 {'type': 'Point', 'coordinates': [-113, 54.216... 6 107000.0 Abee \n", + "3 {'type': 'Point', 'coordinates': [-99.9, 16.88... 10 1914.0 Acapulco \n", + "4 {'type': 'Point', 'coordinates': [-64.95, -33.... 370 780.0 Achiras \n", + "\n", + " nametype recclass reclat reclong year \n", + "0 Valid L5 50.77500 6.08333 1880-01-01T00:00:00.000 \n", + "1 Valid H6 56.18333 10.23333 1951-01-01T00:00:00.000 \n", + "2 Valid EH4 54.21667 -113.00000 1952-01-01T00:00:00.000 \n", + "3 Valid Acapulcoite 16.88333 -99.90000 1976-01-01T00:00:00.000 \n", + "4 Valid L6 -33.16667 -64.95000 1902-01-01T00:00:00.000 " + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# Your code here:\n", - "\n" + "#.head() shows the first 5 rows by default.\n", + "nasa.head()" ] }, { @@ -98,12 +1460,26 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 11, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "Fell 996\n", + "Found 4\n", + "Name: fall, dtype: int64" + ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# Your code here:\n", - "\n" + "fall_count = nasa['fall']\n", + "fall_count.value_counts()" ] }, { @@ -115,12 +1491,12 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 12, "metadata": {}, "outputs": [], "source": [ "# Your code here:\n", - "\n" + "nasa.to_json('nasa.json', orient='records')" ] }, { @@ -136,24 +1512,23 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 13, 
"metadata": {}, "outputs": [], "source": [ "# Run this code:\n", - "\n", "cols = ['time', 'rad_flow', 'fpv_close', 'fpv_open', 'high', 'bypass', 'bpv_close', 'bpv_open', 'class']\n", "tst_url = 'https://archive.ics.uci.edu/ml/machine-learning-databases/statlog/shuttle/shuttle.tst'" ] }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 20, "metadata": {}, "outputs": [], "source": [ "# Your code here:\n", - "\n" + "shuttle = pd.read_csv(tst_url, sep=' ', names=cols)" ] }, { @@ -165,12 +1540,130 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 21, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
timerad_flowfpv_closefpv_openhighbypassbpv_closebpv_openclass
550810-6112588644
56096052-4404444
50-189-7500394021
53979042-22537124
55282054-6262821
\n", + "
" + ], + "text/plain": [ + " time rad_flow fpv_close fpv_open high bypass bpv_close bpv_open \\\n", + "55 0 81 0 -6 11 25 88 64 \n", + "56 0 96 0 52 -4 40 44 4 \n", + "50 -1 89 -7 50 0 39 40 2 \n", + "53 9 79 0 42 -2 25 37 12 \n", + "55 2 82 0 54 -6 26 28 2 \n", + "\n", + " class \n", + "55 4 \n", + "56 4 \n", + "50 1 \n", + "53 4 \n", + "55 1 " + ] + }, + "execution_count": 21, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# Your code here:\n", - "\n" + "shuttle.head()" ] }, { @@ -182,12 +1675,12 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 22, "metadata": {}, "outputs": [], "source": [ "# Your code here:\n", - "\n" + "shuttle.to_csv('shuttle.csv', index=False)" ] }, { @@ -203,12 +1696,12 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 24, "metadata": {}, "outputs": [], "source": [ "# Your code here:\n", - "\n" + "astronaut = pd.read_excel('astronauts.xls')" ] }, { @@ -220,12 +1713,211 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 25, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NameYearGroupStatusBirth DateBirth PlaceGenderAlma MaterUndergraduate MajorGraduate MajorMilitary RankMilitary BranchSpace FlightsSpace Flight (hr)Space WalksSpace Walks (hr)MissionsDeath DateDeath Mission
0Joseph M. Acaba2004.019.0Active1967-05-17Inglewood, CAMaleUniversity of California-Santa Barbara; Univer...GeologyGeologyNaNNaN23307213.0STS-119 (Discovery), ISS-31/32 (Soyuz)NaTNaN
1Loren W. ActonNaNNaNRetired1936-03-07Lewiston, MTMaleMontana State University; University of ColoradoEngineering PhysicsSolar PhysicsNaNNaN119000.0STS 51-F (Challenger)NaTNaN
2James C. Adamson1984.010.0Retired1946-03-03Warsaw, NYMaleUS Military Academy; Princeton UniversityEngineeringAerospace EngineeringColonelUS Army (Retired)233400.0STS-28 (Columbia), STS-43 (Atlantis)NaTNaN
3Thomas D. Akers1987.012.0Retired1951-05-20St. Louis, MOMaleUniversity of Missouri-RollaApplied MathematicsApplied MathematicsColonelUS Air Force (Retired)4814429.0STS-41 (Discovery), STS-49 (Endeavor), STS-61 ...NaTNaN
4Buzz Aldrin1963.03.0Retired1930-01-20Montclair, NJMaleUS Military Academy; MITMechanical EngineeringAstronauticsColonelUS Air Force (Retired)228928.0Gemini 12, Apollo 11NaTNaN
\n", + "
" + ], + "text/plain": [ + " Name Year Group Status Birth Date Birth Place Gender \\\n", + "0 Joseph M. Acaba 2004.0 19.0 Active 1967-05-17 Inglewood, CA Male \n", + "1 Loren W. Acton NaN NaN Retired 1936-03-07 Lewiston, MT Male \n", + "2 James C. Adamson 1984.0 10.0 Retired 1946-03-03 Warsaw, NY Male \n", + "3 Thomas D. Akers 1987.0 12.0 Retired 1951-05-20 St. Louis, MO Male \n", + "4 Buzz Aldrin 1963.0 3.0 Retired 1930-01-20 Montclair, NJ Male \n", + "\n", + " Alma Mater Undergraduate Major \\\n", + "0 University of California-Santa Barbara; Univer... Geology \n", + "1 Montana State University; University of Colorado Engineering Physics \n", + "2 US Military Academy; Princeton University Engineering \n", + "3 University of Missouri-Rolla Applied Mathematics \n", + "4 US Military Academy; MIT Mechanical Engineering \n", + "\n", + " Graduate Major Military Rank Military Branch Space Flights \\\n", + "0 Geology NaN NaN 2 \n", + "1 Solar Physics NaN NaN 1 \n", + "2 Aerospace Engineering Colonel US Army (Retired) 2 \n", + "3 Applied Mathematics Colonel US Air Force (Retired) 4 \n", + "4 Astronautics Colonel US Air Force (Retired) 2 \n", + "\n", + " Space Flight (hr) Space Walks Space Walks (hr) \\\n", + "0 3307 2 13.0 \n", + "1 190 0 0.0 \n", + "2 334 0 0.0 \n", + "3 814 4 29.0 \n", + "4 289 2 8.0 \n", + "\n", + " Missions Death Date Death Mission \n", + "0 STS-119 (Discovery), ISS-31/32 (Soyuz) NaT NaN \n", + "1 STS 51-F (Challenger) NaT NaN \n", + "2 STS-28 (Columbia), STS-43 (Atlantis) NaT NaN \n", + "3 STS-41 (Discovery), STS-49 (Endeavor), STS-61 ... 
NaT NaN \n", + "4 Gemini 12, Apollo 11 NaT NaN " + ] + }, + "execution_count": 25, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# Your code here:\n", - "\n" + "astronaut.head()" ] }, { @@ -237,12 +1929,85 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 30, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "Physics 35\n", + "Aerospace Engineering 33\n", + "Mechanical Engineering 30\n", + "Aeronautical Engineering 28\n", + "Electrical Engineering 23\n", + "Engineering Science 13\n", + "Engineering 12\n", + "Mathematics 11\n", + "Chemistry 10\n", + "Naval Sciences 9\n", + "Chemical Engineering 9\n", + "Astronautical Engineering 8\n", + "Aeronautical & Astronautical Engineering 6\n", + "Biology 5\n", + "Mathematics & Physics 5\n", + "Geology 5\n", + "Civil Engineering 5\n", + "Physics & Astronomy 4\n", + "Applied Science & Engineering 4\n", + "Engineering Physics 3\n", + "Computer Science 3\n", + "Aeronautics & Astronautics 3\n", + "Applied Mathematics 3\n", + "Chemistry & Biology 2\n", + "Engineering Mechanics 2\n", + "Engineering Management 2\n", + "Education 2\n", + "Physics & Mathematics 2\n", + "Biological Science 2\n", + "Zoology 2\n", + " ..\n", + "Nuclear Engineering 1\n", + "Earth Sciences 1\n", + "Mathematical & Electrical Science 1\n", + "Chemistry; Physiological Optics 1\n", + "Systems Engineering 1\n", + "Mathematics & Statistics; Chemistry 1\n", + "Business Finance 1\n", + "Biochemistry 1\n", + "Physiology 1\n", + "Military Science 1\n", + "Economics 1\n", + "Molecular Biology 1\n", + "Animal Science 1\n", + "Aerospace Engineering & Mechanics 1\n", + "Electrical Science 1\n", + "Mathematics & Economics 1\n", + "Computer & Systems Engineering 1\n", + "Solid Earth Sciences 1\n", + "Psychology 1\n", + "Physics & Astronautical Engineering 1\n", + "Business Economics 1\n", + "Ecological Science 1\n", + "Military Engineering 1\n", + "Mathematics; Russian 1\n", + "Applied 
Biology; Mechanical Engineering 1\n", + "Aeronautics & Astronautics; Earth, Atmospheric & Planetary Sciences 1\n", + "Ceramic Engineering 1\n", + "Animal Nutrition 1\n", + "Bioscience 1\n", + "Electrical Engineering; Computer Science 1\n", + "Name: Undergraduate Major, Length: 83, dtype: int64" + ] + }, + "execution_count": 30, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# Your code here:\n", - "\n" + "undergrad_count = astronaut['Undergraduate Major']\n", + "undergrad_count.value_counts()" ] }, { @@ -254,12 +2019,12 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 31, "metadata": {}, "outputs": [], "source": [ "# Your code here:\n", - "\n" + "astronaut.to_csv('astronaut.csv', sep=\"\\t\", index=False)" ] }, { @@ -273,12 +2038,171 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 32, "metadata": {}, "outputs": [], "source": [ "# Your code here:\n", - "\n" + "column = [\n", + " 'Season in which the analysis was performed.',\n", + " 'Age at the time of analysis.',\n", + " 'Childish diseases',\n", + " 'Accident or serious trauma',\n", + " 'Surgical intervention',\n", + " 'High fevers in the last year',\n", + " 'Frequency of alcohol consumption',\n", + " 'Smoking habit',\n", + " 'Number of hours spent sitting per day',\n", + " 'Output: Diagnosis',\n", + "]\n", + "fertility = pd.read_csv('fertility_Diagnosis.txt', sep=',', names=column)" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Season in which the analysis was performed.Age at the time of analysis.Childish diseasesAccident or serious traumaSurgical interventionHigh fevers in the last yearFrequency of alcohol consumptionSmoking habitNumber of hours spent sitting per dayOutput: Diagnosis
0-0.330.6901100.800.88N
1-0.330.9410100.810.31O
2-0.330.5010001.0-10.50N
3-0.330.7501101.0-10.38N
4-0.330.6711000.8-10.50O
\n", + "
" + ], + "text/plain": [ + " Season in which the analysis was performed. Age at the time of analysis. \\\n", + "0 -0.33 0.69 \n", + "1 -0.33 0.94 \n", + "2 -0.33 0.50 \n", + "3 -0.33 0.75 \n", + "4 -0.33 0.67 \n", + "\n", + " Childish diseases Accident or serious trauma Surgical intervention \\\n", + "0 0 1 1 \n", + "1 1 0 1 \n", + "2 1 0 0 \n", + "3 0 1 1 \n", + "4 1 1 0 \n", + "\n", + " High fevers in the last year Frequency of alcohol consumption \\\n", + "0 0 0.8 \n", + "1 0 0.8 \n", + "2 0 1.0 \n", + "3 0 1.0 \n", + "4 0 0.8 \n", + "\n", + " Smoking habit Number of hours spent sitting per day Output: Diagnosis \n", + "0 0 0.88 N \n", + "1 1 0.31 O \n", + "2 -1 0.50 N \n", + "3 -1 0.38 N \n", + "4 -1 0.50 O " + ] + }, + "execution_count": 33, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "fertility.head()" ] }, { @@ -305,7 +2229,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.6.6" + "version": "3.7.3" } }, "nbformat": 4,