From 0c159c10264f285ff92368b045faddafb5bda8ae Mon Sep 17 00:00:00 2001 From: GildaRIA <114354041+GildaRIA@users.noreply.github.com> Date: Sat, 3 Dec 2022 08:38:56 -0600 Subject: [PATCH 1/5] Add files via upload --- Proyecto2_GildaRIA_Try.ipynb | 210 +++++++++++++++++++++++++++++++++++ 1 file changed, 210 insertions(+) create mode 100644 Proyecto2_GildaRIA_Try.ipynb diff --git a/Proyecto2_GildaRIA_Try.ipynb b/Proyecto2_GildaRIA_Try.ipynb new file mode 100644 index 0000000..d9379a7 --- /dev/null +++ b/Proyecto2_GildaRIA_Try.ipynb @@ -0,0 +1,210 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "c483e8a0-576e-4f21-a19f-6fb8fa42fa14", + "metadata": {}, + "outputs": [], + "source": [ + "from bs4 import BeautifulSoup\n", + "import requests\n", + "import selenium\n", + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "a114183e-9356-4213-91fb-60a782bce915", + "metadata": {}, + "outputs": [], + "source": [ + "from selenium import webdriver\n", + "browser = webdriver.Chrome()" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "5f60973b-6658-4ec5-baa2-862eab88fd7b", + "metadata": {}, + "outputs": [], + "source": [ + "driver = webdriver.Chrome()" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "9e25c2fa-d714-4d5f-875d-644a534caf37", + "metadata": {}, + "outputs": [], + "source": [ + "url = 'https://www.eleconomista.com.mx/tags/elecciones_en_Mexico'" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "909356bb-33df-42c7-b010-84f460b81b4e", + "metadata": {}, + "outputs": [], + "source": [ + "driver.get(url)" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "f637afb6-9ff0-4116-af43-554ebd65084b", + "metadata": {}, + "outputs": [], + "source": [ + "sopa = BeautifulSoup(driver.page_source)" + ] + }, + { + "cell_type": "code", + "execution_count": 23, + "id": "af6cae88-e924-4d40-9a0c-3e2efe2e1803", + "metadata": {}, + "outputs": [], + "source": [ + "datos_tabla1 = sopa.select('h3.jsx-578919967.title')" + ] + }, + { + "cell_type": "code", + "execution_count": 24, + "id": "e09fd631-90d9-4db7-8482-8d999c4bc4e0", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[

\n", + " PRI propondrá una ley para reglamentar a los gobiernos de coalición\n", + "

,\n", + "

\n", + " PAN, PRI y PRD anuncian su alianza “Va por México” en Edomex para 2023\n", + "

,\n", + "

\n", + " La coalición PRI-PAN-PRD sí da para ganar la CDMX\n", + "

,\n", + "

\n", + " Ruptura morenist\n", + "

,\n", + "

\n", + " Recortes al INE han reducido alcance de proyectos estratégicos\n", + "

,\n", + "

\n", + " Votarían por una alianza opositora 36.7% en 2024\n", + "

,\n", + "

\n", + " Si no tienes un plan para hacer crecer la economía al doble, no deberías aspirar a la presidencia: Marcelo Ebrard\n", + "

,\n", + "

\n", + " Recorte al INE impactaría a comicios del 2023 y 2024\n", + "

,\n", + "

\n", + " Gobiernos municipales, factor para el 2023 y 2024\n", + "

,\n", + "

¿Qué ciudades en México se perfilan para ser 'smart cities'?

,\n", + "

México recomprará bono al 2025 para bajar amortizaciones de la deuda externa

,\n", + "

Blackstone suspende los retiros de su fondo de inversión inmobiliaria de 69,000 millones de dólares

,\n", + "

¿Cuáles fueron los artistas más escuchados en Spotify 2022?

,\n", + "

Negociaciones contractuales \"presionadas\" por incremento de doble dígito al salario mínimo

,\n", + "

\n", + " Morena arranca con ventaja en Coahuila\n", + "

,\n", + "

\n", + " Sheinbaum, con ligera ventaja en la carrera presidencial\n", + "

,\n", + "

\n", + " Propone PRD a PRI y PAN una encuesta para elegir candidato aliancista en Edomex\n", + "

,\n", + "

\n", + " Morena: si ganan el 24 ¿por qué trampear?\n", + "

,\n", + "

\n", + " Morena abrirá registro para candidato en Coahuila el 31 de octubre\n", + "

,\n", + "

\n", + " ¿Corcholatismo acotado?\n", + "

,\n", + "

\n", + " ¿Cuáles son los escenarios de la reforma electoral en marcha?\n", + "

,\n", + "

\n", + " PRI perfila a Del Moral como candidata al Edomex\n", + "

,\n", + "

\n", + " Concluye en el PRI pasarela de presidenciables\n", + "

]" + ] + }, + "execution_count": 24, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "datos_tabla1" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "2a1f5079-cc0b-401e-90f5-a811fba87bcc", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "cfaf6513-1dfa-416c-a614-dce7217648ec", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0c4a8bbb-7a16-477d-b860-201834ae2216", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "78cb7ee7-8825-443b-8394-eec9f680a1aa", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} From 21da38253be4365cf194cc55191ef23bdb2b6757 Mon Sep 17 00:00:00 2001 From: GildaRIA <114354041+GildaRIA@users.noreply.github.com> Date: Sun, 4 Dec 2022 15:11:07 -0600 Subject: [PATCH 2/5] Delete Proyecto2_GildaRIA_Try.ipynb --- Proyecto2_GildaRIA_Try.ipynb | 210 ----------------------------------- 1 file changed, 210 deletions(-) delete mode 100644 Proyecto2_GildaRIA_Try.ipynb diff --git a/Proyecto2_GildaRIA_Try.ipynb b/Proyecto2_GildaRIA_Try.ipynb deleted file mode 100644 index d9379a7..0000000 --- a/Proyecto2_GildaRIA_Try.ipynb +++ /dev/null @@ -1,210 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": 1, - "id": "c483e8a0-576e-4f21-a19f-6fb8fa42fa14", - "metadata": {}, - "outputs": [], - "source": [ - "from bs4 import BeautifulSoup\n", - "import requests\n", - "import selenium\n", - "import pandas as pd" - ] - }, - { - "cell_type": "code", - "execution_count": 2, - "id": "a114183e-9356-4213-91fb-60a782bce915", - "metadata": {}, - "outputs": [], - "source": [ - "from selenium import webdriver\n", - "browser = webdriver.Chrome()" - ] - }, - { - "cell_type": "code", - "execution_count": 3, - "id": "5f60973b-6658-4ec5-baa2-862eab88fd7b", - "metadata": {}, - "outputs": [], - "source": [ - "driver = webdriver.Chrome()" - ] - }, - { - "cell_type": "code", - "execution_count": 4, - "id": "9e25c2fa-d714-4d5f-875d-644a534caf37", - "metadata": {}, - "outputs": [], - "source": [ - "url = 'https://www.eleconomista.com.mx/tags/elecciones_en_Mexico'" - ] - }, - { - "cell_type": "code", - "execution_count": 5, - "id": "909356bb-33df-42c7-b010-84f460b81b4e", - "metadata": {}, - "outputs": [], - "source": [ - "driver.get(url)" - ] - }, - { - "cell_type": "code", - "execution_count": 6, - "id": "f637afb6-9ff0-4116-af43-554ebd65084b", - "metadata": {}, - "outputs": [], - "source": [ - "sopa = BeautifulSoup(driver.page_source)" - ] - }, - { - "cell_type": "code", - "execution_count": 23, - "id": "af6cae88-e924-4d40-9a0c-3e2efe2e1803", - "metadata": {}, - "outputs": [], - "source": [ - "datos_tabla1 = sopa.select('h3.jsx-578919967.title')" - ] - }, - { - "cell_type": "code", - "execution_count": 24, - "id": "e09fd631-90d9-4db7-8482-8d999c4bc4e0", - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "[

\n", - " PRI propondrá una ley para reglamentar a los gobiernos de coalición\n", - "

,\n", - "

\n", - " PAN, PRI y PRD anuncian su alianza “Va por México” en Edomex para 2023\n", - "

,\n", - "

\n", - " La coalición PRI-PAN-PRD sí da para ganar la CDMX\n", - "

,\n", - "

\n", - " Ruptura morenist\n", - "

,\n", - "

\n", - " Recortes al INE han reducido alcance de proyectos estratégicos\n", - "

,\n", - "

\n", - " Votarían por una alianza opositora 36.7% en 2024\n", - "

,\n", - "

\n", - " Si no tienes un plan para hacer crecer la economía al doble, no deberías aspirar a la presidencia: Marcelo Ebrard\n", - "

,\n", - "

\n", - " Recorte al INE impactaría a comicios del 2023 y 2024\n", - "

,\n", - "

\n", - " Gobiernos municipales, factor para el 2023 y 2024\n", - "

,\n", - "

¿Qué ciudades en México se perfilan para ser 'smart cities'?

,\n", - "

México recomprará bono al 2025 para bajar amortizaciones de la deuda externa

,\n", - "

Blackstone suspende los retiros de su fondo de inversión inmobiliaria de 69,000 millones de dólares

,\n", - "

¿Cuáles fueron los artistas más escuchados en Spotify 2022?

,\n", - "

Negociaciones contractuales \"presionadas\" por incremento de doble dígito al salario mínimo

,\n", - "

\n", - " Morena arranca con ventaja en Coahuila\n", - "

,\n", - "

\n", - " Sheinbaum, con ligera ventaja en la carrera presidencial\n", - "

,\n", - "

\n", - " Propone PRD a PRI y PAN una encuesta para elegir candidato aliancista en Edomex\n", - "

,\n", - "

\n", - " Morena: si ganan el 24 ¿por qué trampear?\n", - "

,\n", - "

\n", - " Morena abrirá registro para candidato en Coahuila el 31 de octubre\n", - "

,\n", - "

\n", - " ¿Corcholatismo acotado?\n", - "

,\n", - "

\n", - " ¿Cuáles son los escenarios de la reforma electoral en marcha?\n", - "

,\n", - "

\n", - " PRI perfila a Del Moral como candidata al Edomex\n", - "

,\n", - "

\n", - " Concluye en el PRI pasarela de presidenciables\n", - "

]" - ] - }, - "execution_count": 24, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "datos_tabla1" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "2a1f5079-cc0b-401e-90f5-a811fba87bcc", - "metadata": {}, - "outputs": [], - "source": [] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "cfaf6513-1dfa-416c-a614-dce7217648ec", - "metadata": {}, - "outputs": [], - "source": [] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "0c4a8bbb-7a16-477d-b860-201834ae2216", - "metadata": {}, - "outputs": [], - "source": [] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "78cb7ee7-8825-443b-8394-eec9f680a1aa", - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.9.12" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} From e994a0603d1d65a4d22a6056ca5288cd2320957f Mon Sep 17 00:00:00 2001 From: GildaRIA <114354041+GildaRIA@users.noreply.github.com> Date: Sun, 4 Dec 2022 15:11:56 -0600 Subject: [PATCH 3/5] Add files via upload --- Proyecto2_GildaRIA_Try.ipynb | 421 +++++++++++++++++++++++++++++++++++ 1 file changed, 421 insertions(+) create mode 100644 Proyecto2_GildaRIA_Try.ipynb diff --git a/Proyecto2_GildaRIA_Try.ipynb b/Proyecto2_GildaRIA_Try.ipynb new file mode 100644 index 0000000..40b6211 --- /dev/null +++ b/Proyecto2_GildaRIA_Try.ipynb @@ -0,0 +1,421 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "c483e8a0-576e-4f21-a19f-6fb8fa42fa14", + "metadata": {}, + "outputs": [], + "source": [ + "from bs4 import BeautifulSoup\n", + "import requests\n", + "import selenium\n", + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "3b69ee34-618c-4570-a45d-ce60b05a4353", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Requirement already satisfied: html5lib in c:\\anaconda\\lib\\site-packages (1.1)\n", + "Requirement already satisfied: webencodings in c:\\anaconda\\lib\\site-packages (from html5lib) (0.5.1)\n", + "Requirement already satisfied: six>=1.9 in c:\\anaconda\\lib\\site-packages (from html5lib) (1.16.0)\n", + "Requirement already satisfied: lxml in c:\\anaconda\\lib\\site-packages (4.8.0)\n" + ] + } + ], + "source": [ + "!pip install html5lib\n", + "!pip install lxml" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "a114183e-9356-4213-91fb-60a782bce915", + "metadata": {}, + "outputs": [], + "source": [ + "from selenium import webdriver\n", + "browser = webdriver.Chrome()" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "5f60973b-6658-4ec5-baa2-862eab88fd7b", + "metadata": {}, + "outputs": [], + "source": [ + "driver = webdriver.Chrome()" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "9e25c2fa-d714-4d5f-875d-644a534caf37", + "metadata": {}, + "outputs": [], + "source": [ + "url = 'http://wdi.worldbank.org/table/4.2'" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "909356bb-33df-42c7-b010-84f460b81b4e", + "metadata": {}, + "outputs": [], + "source": [ + "driver.get(url)" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "f637afb6-9ff0-4116-af43-554ebd65084b", + "metadata": {}, + "outputs": [], + "source": [ + "sopa = BeautifulSoup(driver.page_source)" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "id": "af6cae88-e924-4d40-9a0c-3e2efe2e1803", + "metadata": {}, + "outputs": [], + "source": [ + "datos_tabla1 = sopa.select('table')" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "e09fd631-90d9-4db7-8482-8d999c4bc4e0", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[
Economy
4.2
\n", + " World Development Indicators:\n", + " Structure of value added
,\n", + "
Structure of value added
$ billions
% of GDP
% of GDP
% of GDP
% of GDP
2010
2020
2010
2020
2010
2020
2010
2020
2010
2020
,\n", + "
15.9
20.1
26.2
26.8
21.2
14.0
12.5
7.7
48.9
54.7
11.9
15.1
18.0
19.3
24.9
20.0
5.5
6.0
44.0
48.4
161.2
145.0
8.5
14.1
40.0
20.3
39.0
18.8
39.2
48.7
0.6
0.7
..
..
..
..
7.2
12.2
..
..
3.4
2.9
..
0.6
..
12.7
..
3.7
..
79.8
81.7
53.6
6.2
9.1
52.4
45.7
4.5
6.9
41.9
45.4
1.1
1.4
1.6
2.2
16.2
21.1
2.2
2.4
70.7
65.3
423.6
389.6
7.1
5.9
25.3
23.3
15.8
15.4
51.5
54.6
9.3
12.6
17.9
11.2
27.8
27.1
9.4
12.4
45.7
53.2
2.5
2.5
0.4
..
15.8
..
3.1
..
68.1
..
1,147.6
1,327.8
2.2
2.0
25.2
25.5
8.0
5.7
65.7
66.3
392.3
433.3
1.3
1.1
25.5
25.5
16.5
16.3
62.3
63.1
52.9
42.7
5.5
6.7
59.8
42.0
4.7
6.1
27.9
42.4
10.1
9.7
1.1
0.8
11.5
12.0
2.1
1.4
81.1
79.1
25.7
34.7
0.3
0.3
45.0
40.3
14.5
18.1
53.7
56.6
115.3
373.9
17.0
12.0
25.0
32.9
16.1
20.6
53.5
51.5
4.5
4.7
1.3
1.5
14.1
12.8
5.8
4.9
..
..
57.2
61.5
8.9
7.1
35.4
30.8
22.5
21.5
43.5
49.5
481.4
521.7
0.8
0.6
20.9
19.5
13.3
12.4
67.7
69.6
1.4
1.6
11.6
11.5
19.0
14.2
12.3
5.7
60.6
61.2
9.5
15.7
25.8
27.1
18.0
16.3
11.7
9.7
44.5
47.9
6.6
6.9
0.3
0.3
6.6
5.6
0.9
0.3
88.9
90.3
1.5
2.3
14.8
19.2
43.8
34.4
8.9
5.9
37.3
43.7
19.6
36.6
10.4
14.0
30.1
23.5
11.3
11.0
43.6
52.8
17.2
20.0
6.8
6.1
22.5
24.6
10.9
13.1
55.5
55.8
12.8
14.9
2.5
2.1
31.9
27.8
6.4
5.7
55.0
65.8
2,208.8
1,448.6
4.1
5.9
23.3
17.7
12.7
9.7
57.6
62.8
13.7
12.0
0.7
1.2
68.7
59.1
14.9
15.8
32.5
41.5
50.7
69.9
4.0
3.5
23.8
21.9
..
..
59.5
61.3
10.1
17.9
24.1
18.4
26.1
32.6
12.1
9.3
42.1
40.8
2.0
2.8
38.4
28.6
15.4
10.7
9.2
..
37.0
45.5
1.7
1.7
8.0
4.9
18.1
23.1
5.4
7.3
61.2
58.9
11.2
25.9
33.9
22.7
21.9
34.6
14.7
16.2
38.3
36.6
27.5
40.8
17.3
17.4
25.8
23.3
14.5
13.3
50.6
52.0
1,617.3
1,645.4
1.5
1.7
26.4
24.6
10.0
9.9
65.7
66.9
4.2
5.6
0.3
0.4
7.1
8.0
0.8
0.9
87.6
86.9
2.1
2.3
37.4
29.5
24.5
20.4
18.4
17.7
29.3
40.0
10.7
10.7
51.9
46.8
12.0
16.0
1.0
3.2
33.4
43.6
..
..
..
..
..
..
..
..
..
..
217.1
252.7
3.5
4.1
33.5
30.0
9.9
8.9
53.8
56.1
6,087.2
14,687.7
9.3
7.7
46.5
37.8
31.6
26.3
44.2
54.5
228.6
344.9
0.1
0.1
6.8
6.1
1.7
0.9
90.9
89.6
28.2
25.6
..
..
4.8
8.4
0.6
0.9
94.0
88.7
286.6
270.3
6.3
7.4
31.4
23.8
14.0
10.9
53.4
59.9
0.9
1.2
30.4
35.8
11.8
8.1
..
..
53.2
51.4
21.6
48.7
21.4
20.9
38.7
41.2
16.2
19.0
35.4
35.7
13.1
10.5
4.0
7.6
66.2
48.2
5.3
8.1
25.4
40.4
37.7
62.2
6.5
4.4
23.3
20.1
14.6
12.7
61.9
68.4
34.9
61.3
17.5
21.4
16.0
20.9
9.0
11.2
37.8
42.1
60.4
57.2
3.7
3.2
21.4
21.2
13.0
12.1
59.8
59.3
59.6
107.4
3.6
2.8
22.9
23.0
15.6
11.2
72.5
73.5
2.9
2.5
0.4
0.2
15.0
15.0
6.1
4.1
77.0
74.9
25.7
24.7
2.1
1.9
14.5
12.6
5.1
5.5
71.6
74.3
209.1
245.3
1.5
1.9
33.2
30.8
21.0
21.9
55.8
58.3
322.0
356.1
1.2
1.3
19.7
21.2
10.9
14.0
65.4
64.6
1.1
3.2
..
1.7
..
14.9
..
4.4
..
77.3
0.5
0.5
11.5
15.2
11.7
12.2
2.4
2.9
60.3
57.9
53.9
78.8
6.1
6.0
27.9
30.3
15.3
14.4
59.3
57.2
69.6
99.3
9.7
9.8
34.7
30.7
13.4
16.5
51.1
53.3
219.0
365.3
13.3
11.6
35.8
32.0
16.1
16.4
46.2
51.8
18.4
24.6
7.0
5.1
25.3
23.8
16.1
14.9
59.5
61.5
16.3
10.1
1.1
2.9
74.7
45.4
21.0
20.1
24.7
51.5
1.6
..
14.1
..
21.8
..
5.5
..
..
..
19.5
30.7
3.2
2.2
24.4
22.7
13.7
12.9
59.9
62.7
4.4
4.0
10.2
8.4
37.7
31.3
32.5
26.5
49.6
53.6
29.9
107.7
41.4
35.6
9.4
23.1
4.0
5.3
41.8
36.8
2.3
3.2
14.9
13.6
14.2
20.5
5.4
6.9
58.1
53.9
3.1
4.6
9.4
14.5
17.0
17.0
12.3
11.6
57.5
53.7
249.4
271.8
2.4
2.4
26.2
24.0
17.0
14.3
58.9
60.1
2,645.2
2,630.3
1.6
1.6
17.8
16.4
10.3
9.4
70.7
71.2
..
5.7
..
..
..
..
..
..
..
..
14.4
15.3
3.9
6.7
55.2
40.7
17.1
18.3
30.8
45.7
1.5
1.8
35.2
21.0
9.8
19.0
4.6
2.9
49.2
52.2
12.2
15.8
8.5
7.3
16.9
21.2
9.1
9.3
63.1
59.1
3,399.7
3,846.4
0.8
0.7
26.8
26.5
19.7
18.2
62.3
63.3
32.2
70.0
28.0
18.9
18.0
29.9
6.4
11.0
48.2
45.2
297.1
188.8
3.0
4.2
14.9
15.0
7.9
8.9
70.3
68.6
2.5
3.1
13.4
17.3
18.1
18.1
4.3
3.4
65.6
60.7
0.8
1.0
4.5
4.9
14.7
13.1
3.5
3.1
68.4
66.8
4.9
5.8
..
..
..
..
..
..
..
..
40.7
77.6
11.2
10.2
27.5
22.1
18.9
14.1
59.5
61.9
6.9
14.2
17.5
25.7
32.3
28.3
10.6
9.6
43.4
37.6
0.8
1.4
45.1
30.9
13.1
13.5
11.3
9.1
39.4
50.2
3.4
5.5
28.5
16.9
24.9
38.8
5.7
4.2
41.6
38.9
11.9
14.5
20.2
20.4
23.5
23.3
14.5
17.6
52.5
53.9
15.8
23.8
11.6
12.1
25.6
26.0
16.5
16.0
60.6
58.3
132.2
156.7
3.0
3.4
25.2
24.6
18.1
17.5
56.7
56.6
13.8
21.7
6.3
4.3
22.0
19.7
13.0
8.7
61.9
66.2
1,675.6
2,667.7
17.0
18.2
30.7
24.5
17.0
13.7
45.0
48.4
755.1
1,058.7
13.9
13.7
42.8
38.3
22.0
19.9
40.7
44.4
486.8
231.5
6.5
12.8
44.2
35.7
12.8
20.0
51.1
49.0
138.5
184.4
5.2
6.0
55.8
41.3
2.3
2.7
39.7
54.3
221.9
425.9
1.0
0.9
23.3
38.0
19.5
34.5
66.7
54.8
5.9
7.3
0.6
0.3
9.2
7.6
3.6
2.1
93.0
93.9
234.7
407.1
1.6
1.2
20.8
18.6
14.1
11.3
66.8
71.4
2,136.1
1,892.6
1.8
2.0
21.9
21.6
14.2
14.8
66.3
66.8
13.2
13.8
5.3
8.7
18.0
20.4
7.8
8.0
66.5
59.7
5,759.1
5,040.1
1.1
1.0
28.3
29.0
20.8
19.7
70.5
69.5
27.1
43.7
3.6
5.2
26.3
23.9
18.9
17.3
59.1
61.6
148.0
171.1
4.5
5.4
40.6
33.1
11.3
13.1
51.7
56.1
45.4
100.7
17.6
22.6
18.6
17.4
11.2
7.6
57.0
53.9
0.2
0.2
24.2
26.2
11.9
9.8
5.6
4.4
63.9
67.9
..
..
..
..
..
..
..
..
..
..
1,144.1
1,637.9
2.1
1.8
34.1
32.6
27.4
24.8
54.7
57.1
5.3
7.7
9.5
7.4
27.0
27.6
13.8
13.4
45.9
47.6
115.4
106.0
0.5
0.5
66.1
45.4
6.0
6.6
47.0
69.1
4.8
7.8
17.4
13.6
26.3
29.2
16.9
14.5
49.3
49.8
7.1
19.0
22.6
16.3
30.5
32.4
11.1
7.7
43.6
41.0
24.0
33.6
4.1
4.0
20.4
19.4
11.9
10.9
64.5
63.5
38.4
25.9
3.9
8.9
13.8
17.6
7.7
12.3
71.9
81.3
2.2
2.3
4.9
4.7
31.5
35.5
13.1
14.8
53.8
43.7
2.0
3.0
44.8
41.1
5.0
17.7
2.6
..
50.2
41.6
75.4
52.3
1.8
4.1
75.7
48.3
4.0
2.9
32.2
55.8
5.1
6.4
..
0.1
..
44.2
..
38.7
..
52.2
37.1
56.5
3.0
3.2
26.2
25.0
16.9
15.7
60.7
61.6
56.2
73.4
0.3
0.2
11.0
11.2
5.0
4.6
78.9
79.7
10.0
13.2
29.1
24.8
18.0
16.4
9.5
10.7
48.8
51.8
7.0
12.2
29.6
22.7
15.2
18.5
9.9
11.5
47.9
52.6
255.0
337.0
10.1
8.2
40.5
35.9
23.4
22.3
48.5
54.8
2.6
3.7
5.6
8.0
9.4
11.8
2.3
2.5
77.7
70.8
10.7
17.5
33.0
36.2
22.7
21.2
6.7
6.8
35.5
34.4
9.0
14.9
1.3
0.4
17.6
13.4
11.2
7.5
69.3
76.9
0.2
0.2
11.6
21.8
13.7
12.8
3.7
3.4
71.5
67.2
5.6
7.9
16.7
20.2
38.2
28.8
6.7
6.1
39.9
42.5
10.0
10.9
3.6
3.4
22.5
16.6
14.2
10.7
62.9
68.2
1,057.8
1,087.1
3.2
3.8
32.4
29.6
15.6
17.2
60.4
60.3
0.3
0.4
24.7
22.5
7.2
4.9
0.4
0.5
60.7
66.8
7.0
11.9
11.2
8.7
20.4
22.8
10.0
10.5
54.5
55.5
5.4
6.8
..
..
12.9
14.9
..
..
87.1
76.7
7.2
13.3
11.7
13.0
33.2
37.0
6.8
7.8
44.8
40.5
4.1
4.8
7.7
7.6
17.1
17.3
4.6
4.1
58.6
58.0
93.2
114.7
12.9
11.7
25.7
26.1
15.6
15.3
51.0
50.8
11.1
14.0
26.8
25.6
16.4
21.8
10.0
8.1
47.0
41.5
37.8
78.9
37.4
20.9
25.6
38.6
19.0
24.8
37.0
40.5
11.4
10.6
8.5
9.2
27.4
25.8
12.3
11.1
54.0
58.8
16.0
33.4
33.2
22.2
14.2
12.0
5.9
4.5
46.4
53.9
847.4
913.9
1.8
1.6
19.7
17.8
10.5
10.8
68.4
69.8
9.4
9.4
1.3
1.8
26.2
22.4
5.6
..
64.9
65.5
146.5
211.7
6.6
5.7
21.2
20.4
10.8
9.8
64.4
65.6
8.8
12.6
17.0
15.6
22.0
25.8
14.3
13.5
51.7
48.8
7.9
13.7
35.8
38.4
23.0
20.2
6.9
7.3
35.1
36.2
361.5
432.3
23.9
24.1
25.3
28.2
6.6
12.7
50.8
46.4
9.4
12.1
10.1
8.6
21.0
22.8
9.9
13.2
55.1
56.2
0.8
1.2
..
..
..
..
..
..
..
..
428.8
362.2
1.6
1.8
34.8
26.0
7.2
6.5
52.7
60.3
65.0
74.0
1.2
2.6
63.3
47.5
10.0
8.0
39.9
54.7
177.2
300.3
23.3
21.9
19.7
18.6
13.1
11.4
52.8
53.7
0.2
0.3
3.8
3.3
9.3
13.4
0.8
1.0
76.7
73.7
29.4
54.0
3.6
2.8
18.4
23.9
7.1
5.8
72.9
70.1
14.3
24.7
19.6
17.0
33.2
36.7
2.4
1.7
44.1
41.8
27.1
35.4
13.3
11.1
34.3
33.8
18.6
18.7
45.3
48.2
147.5
201.7
6.8
7.7
35.8
30.2
15.6
12.2
48.9
54.4
208.4
361.8
13.7
10.2
32.3
28.4
21.9
17.7
53.9
61.4
479.8
596.6
2.9
2.5
28.9
27.7
15.3
16.0
56.3
57.8
238.1
228.5
1.9
2.1
20.0
19.4
11.6
11.9
66.1
65.7
98.4
103.1
0.8
0.6
50.9
51.1
47.3
48.2
48.6
48.8
125.1
144.4
0.1
0.3
73.2
52.3
12.5
7.9
28.6
52.7
166.3
249.5
5.0
4.0
38.0
26.9
23.0
16.3
46.2
59.8
1,524.9
1,488.3
3.3
4.0
30.0
29.8
12.8
13.4
53.1
56.1
6.1
10.2
24.3
26.6
16.3
18.6
8.2
8.7
49.9
46.6
0.7
0.8
10.4
10.2
17.8
14.9
10.2
5.4
71.8
74.9
1.9
1.5
..
0.0
..
..
..
31.5
..
..
0.2
0.5
11.3
14.0
17.4
13.2
8.5
5.6
67.1
70.8
528.2
703.4
2.6
2.5
58.4
40.1
11.0
12.1
39.2
53.9
16.1
24.5
15.9
16.2
21.8
23.2
15.6
14.3
52.4
50.3
41.8
53.3
6.6
6.3
25.3
24.9
15.3
13.3
51.7
51.9
1.0
1.2
2.3
2.5
14.0
15.6
8.0
6.5
68.5
67.6
2.6
4.1
52.9
59.5
7.8
5.2
2.2
1.9
35.3
31.0
239.8
345.3
0.0
0.0
26.6
23.6
20.8
20.0
67.8
71.7
0.9
1.2
0.1
..
12.9
..
1.5
..
77.8
..
90.8
105.2
1.6
1.8
30.6
27.4
18.0
17.5
58.4
60.4
48.2
53.6
1.9
2.1
26.5
29.4
17.5
20.7
58.8
56.9
0.8
1.5
..
..
..
..
..
..
..
..
..
7.0
..
..
..
..
..
..
..
..
417.4
335.4
2.1
2.5
25.3
23.4
13.9
11.7
64.3
64.6
14.6
..
5.3
9.6
61.1
36.9
2.3
..
33.6
53.5
1,422.1
1,281.5
2.4
3.1
23.2
20.4
11.4
11.0
66.3
67.8
56.7
81.0
8.5
8.6
26.6
26.2
18.1
16.1
54.6
59.5
0.8
1.0
1.3
1.3
22.5
20.9
8.3
4.6
65.8
67.6
1.5
1.6
2.7
2.2
11.9
11.0
3.4
3.8
73.9
72.6
0.8
..
..
..
..
..
..
..
..
..
0.7
0.9
6.3
8.6
15.9
12.9
4.9
3.9
64.0
63.0
74.2
27.0
31.9
20.4
21.1
23.4
5.1
..
30.8
36.3
4.4
2.9
9.5
8.2
35.2
35.2
21.0
22.0
48.2
53.1
495.8
541.5
1.6
1.4
23.8
21.1
14.7
12.1
62.8
66.1
603.4
752.2
0.7
0.7
24.9
25.2
18.2
18.1
70.8
71.3
252.5
21.4
19.4
39.0
30.4
18.6
..
..
50.1
42.5
5.6
8.1
19.6
24.0
25.0
33.8
9.7
15.6
45.1
35.3
32.0
62.4
25.6
26.7
23.6
28.7
8.7
8.5
43.3
36.3
341.1
499.7
10.5
8.7
39.9
33.2
30.9
25.5
49.6
58.1
0.9
1.9
25.6
15.4
9.1
25.4
1.0
1.7
68.9
55.2
3.4
7.6
28.7
18.8
15.0
22.7
7.2
14.4
56.3
49.3
0.4
0.5
16.4
17.7
18.0
14.8
6.0
5.6
53.6
51.2
22.2
21.4
0.5
1.1
53.8
34.1
19.2
16.5
45.5
62.6
46.2
42.5
6.8
10.2
29.5
21.6
15.7
13.8
55.9
60.1
777.0
720.0
9.0
6.7
24.5
28.0
15.1
19.1
54.5
54.2
22.6
45.2
11.3
10.8
59.1
42.0
..
..
28.1
47.2
0.7
0.9
0.6
0.4
11.9
15.7
1.3
0.7
83.4
72.7
0.0
0.1
26.5
..
5.5
..
1.1
..
..
..
26.7
37.6
32.3
23.9
24.7
26.5
16.7
15.8
44.8
42.8
141.2
156.6
7.4
9.3
25.6
20.8
13.1
10.1
55.5
55.8
289.8
358.9
0.8
0.9
52.5
40.9
7.9
9.7
46.7
58.2
2,491.1
2,756.9
0.6
0.6
18.9
17.1
9.5
8.7
70.6
72.7
15,049.0
20,893.7
1.0
1.1
19.3
18.4
11.9
11.2
76.3
80.1
40.3
53.6
7.2
7.3
24.5
18.1
13.5
10.3
58.2
63.0
49.8
59.9
26.9
25.1
21.2
31.7
10.2
19.6
39.9
35.8
0.7
0.9
19.5
21.2
12.9
10.0
5.0
2.8
61.7
59.8
393.2
..
5.4
..
48.4
..
11.9
..
39.0
..
147.2
343.2
..
..
..
..
..
..
..
..
4.3
4.2
..
..
..
..
..
..
..
..
9.7
15.5
9.0
7.1
18.6
17.0
12.2
11.0
57.7
60.6
30.9
18.8
8.2
5.0
43.8
35.6
8.0
..
27.4
16.8
20.3
18.1
9.4
3.0
32.2
40.3
7.6
7.7
52.8
53.6
12.0
18.1
9.6
7.6
20.7
35.8
9.2
18.4
57.8
49.9
66,596.1
84,906.8
3.9
4.4
27.6
26.3
15.9
16.0
62.8
65.7
17,063.3
27,118.7
5.5
5.9
35.9
34.1
24.2
22.8
57.0
58.2
21,025.8
22,133.9
2.1
2.1
23.6
22.9
13.7
13.9
64.0
65.2
5,347.1
4,743.2
4.7
6.5
29.1
28.3
14.3
15.7
55.7
67.7
2,973.1
3,106.9
5.9
5.4
46.3
34.7
11.7
12.2
47.0
56.9
16,672.9
22,546.0
1.1
1.1
20.0
19.0
11.7
11.1
75.3
79.7
2,060.8
3,482.5
17.5
17.7
29.1
24.8
16.5
14.1
46.5
49.6
1,451.8
1,706.1
15.9
18.5
27.1
26.5
9.8
11.2
50.9
48.9
613.2
481.0
23.6
26.8
28.3
25.9
4.8
10.7
42.9
39.1
5,246.9
7,585.5
15.3
16.1
33.0
27.8
16.4
14.9
46.8
48.1
14,604.0
22,848.3
6.9
7.0
36.7
34.1
21.7
22.1
50.5
55.9
45,752.2
53,699.8
1.3
1.3
23.9
22.4
14.1
13.4
69.0
71.8
]" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "datos_tabla1" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "2a1f5079-cc0b-401e-90f5-a811fba87bcc", + "metadata": {}, + "outputs": [], + "source": [ + "df = pd.read_html(str(sopa.select('div.scrollable')[0]))[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "id": "cfaf6513-1dfa-416c-a614-dce7217648ec", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
012345678910
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
\n", + "
" + ], + "text/plain": [ + " 0 1 2 3 4 5 6 7 8 9 \\\n", + "0 Afghanistan 15.9 20.1 26.2 26.8 21.2 14.0 12.5 7.7 48.9 \n", + "1 Albania 11.9 15.1 18.0 19.3 24.9 20.0 5.5 6.0 44.0 \n", + "2 Algeria 161.2 145.0 8.5 14.1 40.0 20.3 39.0 18.8 39.2 \n", + "3 American Samoa 0.6 0.7 .. .. .. .. 7.2 12.2 .. \n", + "4 Andorra 3.4 2.9 .. 0.6 .. 12.7 .. 3.7 .. \n", + "\n", + " 10 \n", + "0 54.7 \n", + "1 48.4 \n", + "2 48.7 \n", + "3 .. \n", + "4 79.8 " + ] + }, + "execution_count": 21, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 37, + "id": "0c4a8bbb-7a16-477d-b860-201834ae2216", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Int64Index([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10], dtype='int64')" + ] + }, + "execution_count": 37, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.columns" + ] + }, + { + "cell_type": "code", + "execution_count": 44, + "id": "78cb7ee7-8825-443b-8394-eec9f680a1aa", + "metadata": {}, + "outputs": [], + "source": [ + "df_header = pd.read_html(str(sopa.select('div.fixed')[0]))[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 45, + "id": "f4edcffc-d4df-4e97-98c9-ccad9d782883", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Unnamed: 0_level_0Gross domestic productAgricultureIndustryManufacturingServices
Unnamed: 0_level_1$ billions% of GDP% of GDP% of GDP% of GDP
Unnamed: 0_level_22010202020102020201020202010202020102020
\n", + "
" + ], + "text/plain": [ + "Empty DataFrame\n", + "Columns: [(Unnamed: 0_level_0, Unnamed: 0_level_1, Unnamed: 0_level_2), (Gross domestic product, $ billions, 2010), (Gross domestic product, $ billions, 2020), (Agriculture, % of GDP, 2010), (Agriculture, % of GDP, 2020), (Industry, % of GDP, 2010), (Industry, % of GDP, 2020), (Manufacturing, % of GDP, 2010), (Manufacturing, % of GDP, 2020), (Services, % of GDP, 2010), (Services, % of GDP, 2020)]\n", + "Index: []" + ] + }, + "execution_count": 45, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_header.head()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e6cb0036-eacf-4da3-85cd-32eae80cab85", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "974c3764-b484-4eae-a854-555ef7d952dc", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} From beb7f5aded0947a56d49c33993a354819a793764 Mon Sep 17 00:00:00 2001 From: GildaRIA <114354041+GildaRIA@users.noreply.github.com> Date: Sun, 4 Dec 2022 17:17:28 -0600 Subject: [PATCH 4/5] Delete Proyecto2_GildaRIA_Try.ipynb --- Proyecto2_GildaRIA_Try.ipynb | 421 ----------------------------------- 1 file changed, 421 deletions(-) delete mode 100644 Proyecto2_GildaRIA_Try.ipynb diff --git a/Proyecto2_GildaRIA_Try.ipynb b/Proyecto2_GildaRIA_Try.ipynb deleted file mode 100644 index 40b6211..0000000 --- a/Proyecto2_GildaRIA_Try.ipynb +++ /dev/null @@ -1,421 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": 1, - "id": "c483e8a0-576e-4f21-a19f-6fb8fa42fa14", - "metadata": {}, - "outputs": [], - "source": [ - "from bs4 import BeautifulSoup\n", - "import requests\n", - "import selenium\n", - "import pandas as pd" - ] - }, - { - "cell_type": "code", - "execution_count": 2, - "id": "3b69ee34-618c-4570-a45d-ce60b05a4353", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Requirement already satisfied: html5lib in c:\\anaconda\\lib\\site-packages (1.1)\n", - "Requirement already satisfied: webencodings in c:\\anaconda\\lib\\site-packages (from html5lib) (0.5.1)\n", - "Requirement already satisfied: six>=1.9 in c:\\anaconda\\lib\\site-packages (from html5lib) (1.16.0)\n", - "Requirement already satisfied: lxml in c:\\anaconda\\lib\\site-packages (4.8.0)\n" - ] - } - ], - "source": [ - "!pip install html5lib\n", - "!pip install lxml" - ] - }, - { - "cell_type": "code", - "execution_count": 3, - "id": "a114183e-9356-4213-91fb-60a782bce915", - "metadata": {}, - "outputs": [], - "source": [ - "from selenium import webdriver\n", - "browser = webdriver.Chrome()" - ] - }, - { - "cell_type": "code", - "execution_count": 4, - "id": "5f60973b-6658-4ec5-baa2-862eab88fd7b", - "metadata": {}, - "outputs": [], - "source": [ - "driver = webdriver.Chrome()" - ] - }, - { - "cell_type": "code", - "execution_count": 11, - "id": "9e25c2fa-d714-4d5f-875d-644a534caf37", - "metadata": {}, - "outputs": [], - "source": [ - "url = 'http://wdi.worldbank.org/table/4.2'" - ] - }, - { - "cell_type": "code", - "execution_count": 12, - "id": "909356bb-33df-42c7-b010-84f460b81b4e", - "metadata": {}, - "outputs": [], - "source": [ - "driver.get(url)" - ] - }, - { - "cell_type": "code", - "execution_count": 13, - "id": "f637afb6-9ff0-4116-af43-554ebd65084b", - "metadata": {}, - "outputs": [], - "source": [ - "sopa = BeautifulSoup(driver.page_source)" - ] - }, - { - "cell_type": "code", - "execution_count": 14, - "id": "af6cae88-e924-4d40-9a0c-3e2efe2e1803", - "metadata": {}, - "outputs": [], - "source": [ - "datos_tabla1 = sopa.select('table')" - ] - }, - { - "cell_type": "code", - "execution_count": 15, - "id": "e09fd631-90d9-4db7-8482-8d999c4bc4e0", - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "[
Economy
4.2
\n", - " World Development Indicators:\n", - " Structure of value added
,\n", - "
Structure of value added
$ billions
% of GDP
% of GDP
% of GDP
% of GDP
2010
2020
2010
2020
2010
2020
2010
2020
2010
2020
,\n", - "
15.9
20.1
26.2
26.8
21.2
14.0
12.5
7.7
48.9
54.7
11.9
15.1
18.0
19.3
24.9
20.0
5.5
6.0
44.0
48.4
161.2
145.0
8.5
14.1
40.0
20.3
39.0
18.8
39.2
48.7
0.6
0.7
..
..
..
..
7.2
12.2
..
..
3.4
2.9
..
0.6
..
12.7
..
3.7
..
79.8
81.7
53.6
6.2
9.1
52.4
45.7
4.5
6.9
41.9
45.4
1.1
1.4
1.6
2.2
16.2
21.1
2.2
2.4
70.7
65.3
423.6
389.6
7.1
5.9
25.3
23.3
15.8
15.4
51.5
54.6
9.3
12.6
17.9
11.2
27.8
27.1
9.4
12.4
45.7
53.2
2.5
2.5
0.4
..
15.8
..
3.1
..
68.1
..
1,147.6
1,327.8
2.2
2.0
25.2
25.5
8.0
5.7
65.7
66.3
392.3
433.3
1.3
1.1
25.5
25.5
16.5
16.3
62.3
63.1
52.9
42.7
5.5
6.7
59.8
42.0
4.7
6.1
27.9
42.4
10.1
9.7
1.1
0.8
11.5
12.0
2.1
1.4
81.1
79.1
25.7
34.7
0.3
0.3
45.0
40.3
14.5
18.1
53.7
56.6
115.3
373.9
17.0
12.0
25.0
32.9
16.1
20.6
53.5
51.5
4.5
4.7
1.3
1.5
14.1
12.8
5.8
4.9
..
..
57.2
61.5
8.9
7.1
35.4
30.8
22.5
21.5
43.5
49.5
481.4
521.7
0.8
0.6
20.9
19.5
13.3
12.4
67.7
69.6
1.4
1.6
11.6
11.5
19.0
14.2
12.3
5.7
60.6
61.2
9.5
15.7
25.8
27.1
18.0
16.3
11.7
9.7
44.5
47.9
6.6
6.9
0.3
0.3
6.6
5.6
0.9
0.3
88.9
90.3
1.5
2.3
14.8
19.2
43.8
34.4
8.9
5.9
37.3
43.7
19.6
36.6
10.4
14.0
30.1
23.5
11.3
11.0
43.6
52.8
17.2
20.0
6.8
6.1
22.5
24.6
10.9
13.1
55.5
55.8
12.8
14.9
2.5
2.1
31.9
27.8
6.4
5.7
55.0
65.8
2,208.8
1,448.6
4.1
5.9
23.3
17.7
12.7
9.7
57.6
62.8
13.7
12.0
0.7
1.2
68.7
59.1
14.9
15.8
32.5
41.5
50.7
69.9
4.0
3.5
23.8
21.9
..
..
59.5
61.3
10.1
17.9
24.1
18.4
26.1
32.6
12.1
9.3
42.1
40.8
2.0
2.8
38.4
28.6
15.4
10.7
9.2
..
37.0
45.5
1.7
1.7
8.0
4.9
18.1
23.1
5.4
7.3
61.2
58.9
11.2
25.9
33.9
22.7
21.9
34.6
14.7
16.2
38.3
36.6
27.5
40.8
17.3
17.4
25.8
23.3
14.5
13.3
50.6
52.0
1,617.3
1,645.4
1.5
1.7
26.4
24.6
10.0
9.9
65.7
66.9
4.2
5.6
0.3
0.4
7.1
8.0
0.8
0.9
87.6
86.9
2.1
2.3
37.4
29.5
24.5
20.4
18.4
17.7
29.3
40.0
10.7
10.7
51.9
46.8
12.0
16.0
1.0
3.2
33.4
43.6
..
..
..
..
..
..
..
..
..
..
217.1
252.7
3.5
4.1
33.5
30.0
9.9
8.9
53.8
56.1
6,087.2
14,687.7
9.3
7.7
46.5
37.8
31.6
26.3
44.2
54.5
228.6
344.9
0.1
0.1
6.8
6.1
1.7
0.9
90.9
89.6
28.2
25.6
..
..
4.8
8.4
0.6
0.9
94.0
88.7
286.6
270.3
6.3
7.4
31.4
23.8
14.0
10.9
53.4
59.9
0.9
1.2
30.4
35.8
11.8
8.1
..
..
53.2
51.4
21.6
48.7
21.4
20.9
38.7
41.2
16.2
19.0
35.4
35.7
13.1
10.5
4.0
7.6
66.2
48.2
5.3
8.1
25.4
40.4
37.7
62.2
6.5
4.4
23.3
20.1
14.6
12.7
61.9
68.4
34.9
61.3
17.5
21.4
16.0
20.9
9.0
11.2
37.8
42.1
60.4
57.2
3.7
3.2
21.4
21.2
13.0
12.1
59.8
59.3
59.6
107.4
3.6
2.8
22.9
23.0
15.6
11.2
72.5
73.5
2.9
2.5
0.4
0.2
15.0
15.0
6.1
4.1
77.0
74.9
25.7
24.7
2.1
1.9
14.5
12.6
5.1
5.5
71.6
74.3
209.1
245.3
1.5
1.9
33.2
30.8
21.0
21.9
55.8
58.3
322.0
356.1
1.2
1.3
19.7
21.2
10.9
14.0
65.4
64.6
1.1
3.2
..
1.7
..
14.9
..
4.4
..
77.3
0.5
0.5
11.5
15.2
11.7
12.2
2.4
2.9
60.3
57.9
53.9
78.8
6.1
6.0
27.9
30.3
15.3
14.4
59.3
57.2
69.6
99.3
9.7
9.8
34.7
30.7
13.4
16.5
51.1
53.3
219.0
365.3
13.3
11.6
35.8
32.0
16.1
16.4
46.2
51.8
18.4
24.6
7.0
5.1
25.3
23.8
16.1
14.9
59.5
61.5
16.3
10.1
1.1
2.9
74.7
45.4
21.0
20.1
24.7
51.5
1.6
..
14.1
..
21.8
..
5.5
..
..
..
19.5
30.7
3.2
2.2
24.4
22.7
13.7
12.9
59.9
62.7
4.4
4.0
10.2
8.4
37.7
31.3
32.5
26.5
49.6
53.6
29.9
107.7
41.4
35.6
9.4
23.1
4.0
5.3
41.8
36.8
2.3
3.2
14.9
13.6
14.2
20.5
5.4
6.9
58.1
53.9
3.1
4.6
9.4
14.5
17.0
17.0
12.3
11.6
57.5
53.7
249.4
271.8
2.4
2.4
26.2
24.0
17.0
14.3
58.9
60.1
2,645.2
2,630.3
1.6
1.6
17.8
16.4
10.3
9.4
70.7
71.2
..
5.7
..
..
..
..
..
..
..
..
14.4
15.3
3.9
6.7
55.2
40.7
17.1
18.3
30.8
45.7
1.5
1.8
35.2
21.0
9.8
19.0
4.6
2.9
49.2
52.2
12.2
15.8
8.5
7.3
16.9
21.2
9.1
9.3
63.1
59.1
3,399.7
3,846.4
0.8
0.7
26.8
26.5
19.7
18.2
62.3
63.3
32.2
70.0
28.0
18.9
18.0
29.9
6.4
11.0
48.2
45.2
297.1
188.8
3.0
4.2
14.9
15.0
7.9
8.9
70.3
68.6
2.5
3.1
13.4
17.3
18.1
18.1
4.3
3.4
65.6
60.7
0.8
1.0
4.5
4.9
14.7
13.1
3.5
3.1
68.4
66.8
4.9
5.8
..
..
..
..
..
..
..
..
40.7
77.6
11.2
10.2
27.5
22.1
18.9
14.1
59.5
61.9
6.9
14.2
17.5
25.7
32.3
28.3
10.6
9.6
43.4
37.6
0.8
1.4
45.1
30.9
13.1
13.5
11.3
9.1
39.4
50.2
3.4
5.5
28.5
16.9
24.9
38.8
5.7
4.2
41.6
38.9
11.9
14.5
20.2
20.4
23.5
23.3
14.5
17.6
52.5
53.9
15.8
23.8
11.6
12.1
25.6
26.0
16.5
16.0
60.6
58.3
132.2
156.7
3.0
3.4
25.2
24.6
18.1
17.5
56.7
56.6
13.8
21.7
6.3
4.3
22.0
19.7
13.0
8.7
61.9
66.2
1,675.6
2,667.7
17.0
18.2
30.7
24.5
17.0
13.7
45.0
48.4
755.1
1,058.7
13.9
13.7
42.8
38.3
22.0
19.9
40.7
44.4
486.8
231.5
6.5
12.8
44.2
35.7
12.8
20.0
51.1
49.0
138.5
184.4
5.2
6.0
55.8
41.3
2.3
2.7
39.7
54.3
221.9
425.9
1.0
0.9
23.3
38.0
19.5
34.5
66.7
54.8
5.9
7.3
0.6
0.3
9.2
7.6
3.6
2.1
93.0
93.9
234.7
407.1
1.6
1.2
20.8
18.6
14.1
11.3
66.8
71.4
2,136.1
1,892.6
1.8
2.0
21.9
21.6
14.2
14.8
66.3
66.8
13.2
13.8
5.3
8.7
18.0
20.4
7.8
8.0
66.5
59.7
5,759.1
5,040.1
1.1
1.0
28.3
29.0
20.8
19.7
70.5
69.5
27.1
43.7
3.6
5.2
26.3
23.9
18.9
17.3
59.1
61.6
148.0
171.1
4.5
5.4
40.6
33.1
11.3
13.1
51.7
56.1
45.4
100.7
17.6
22.6
18.6
17.4
11.2
7.6
57.0
53.9
0.2
0.2
24.2
26.2
11.9
9.8
5.6
4.4
63.9
67.9
..
..
..
..
..
..
..
..
..
..
1,144.1
1,637.9
2.1
1.8
34.1
32.6
27.4
24.8
54.7
57.1
5.3
7.7
9.5
7.4
27.0
27.6
13.8
13.4
45.9
47.6
115.4
106.0
0.5
0.5
66.1
45.4
6.0
6.6
47.0
69.1
4.8
7.8
17.4
13.6
26.3
29.2
16.9
14.5
49.3
49.8
7.1
19.0
22.6
16.3
30.5
32.4
11.1
7.7
43.6
41.0
24.0
33.6
4.1
4.0
20.4
19.4
11.9
10.9
64.5
63.5
38.4
25.9
3.9
8.9
13.8
17.6
7.7
12.3
71.9
81.3
2.2
2.3
4.9
4.7
31.5
35.5
13.1
14.8
53.8
43.7
2.0
3.0
44.8
41.1
5.0
17.7
2.6
..
50.2
41.6
75.4
52.3
1.8
4.1
75.7
48.3
4.0
2.9
32.2
55.8
5.1
6.4
..
0.1
..
44.2
..
38.7
..
52.2
37.1
56.5
3.0
3.2
26.2
25.0
16.9
15.7
60.7
61.6
56.2
73.4
0.3
0.2
11.0
11.2
5.0
4.6
78.9
79.7
10.0
13.2
29.1
24.8
18.0
16.4
9.5
10.7
48.8
51.8
7.0
12.2
29.6
22.7
15.2
18.5
9.9
11.5
47.9
52.6
255.0
337.0
10.1
8.2
40.5
35.9
23.4
22.3
48.5
54.8
2.6
3.7
5.6
8.0
9.4
11.8
2.3
2.5
77.7
70.8
10.7
17.5
33.0
36.2
22.7
21.2
6.7
6.8
35.5
34.4
9.0
14.9
1.3
0.4
17.6
13.4
11.2
7.5
69.3
76.9
0.2
0.2
11.6
21.8
13.7
12.8
3.7
3.4
71.5
67.2
5.6
7.9
16.7
20.2
38.2
28.8
6.7
6.1
39.9
42.5
10.0
10.9
3.6
3.4
22.5
16.6
14.2
10.7
62.9
68.2
1,057.8
1,087.1
3.2
3.8
32.4
29.6
15.6
17.2
60.4
60.3
0.3
0.4
24.7
22.5
7.2
4.9
0.4
0.5
60.7
66.8
7.0
11.9
11.2
8.7
20.4
22.8
10.0
10.5
54.5
55.5
5.4
6.8
..
..
12.9
14.9
..
..
87.1
76.7
7.2
13.3
11.7
13.0
33.2
37.0
6.8
7.8
44.8
40.5
4.1
4.8
7.7
7.6
17.1
17.3
4.6
4.1
58.6
58.0
93.2
114.7
12.9
11.7
25.7
26.1
15.6
15.3
51.0
50.8
11.1
14.0
26.8
25.6
16.4
21.8
10.0
8.1
47.0
41.5
37.8
78.9
37.4
20.9
25.6
38.6
19.0
24.8
37.0
40.5
11.4
10.6
8.5
9.2
27.4
25.8
12.3
11.1
54.0
58.8
16.0
33.4
33.2
22.2
14.2
12.0
5.9
4.5
46.4
53.9
847.4
913.9
1.8
1.6
19.7
17.8
10.5
10.8
68.4
69.8
9.4
9.4
1.3
1.8
26.2
22.4
5.6
..
64.9
65.5
146.5
211.7
6.6
5.7
21.2
20.4
10.8
9.8
64.4
65.6
8.8
12.6
17.0
15.6
22.0
25.8
14.3
13.5
51.7
48.8
7.9
13.7
35.8
38.4
23.0
20.2
6.9
7.3
35.1
36.2
361.5
432.3
23.9
24.1
25.3
28.2
6.6
12.7
50.8
46.4
9.4
12.1
10.1
8.6
21.0
22.8
9.9
13.2
55.1
56.2
0.8
1.2
..
..
..
..
..
..
..
..
428.8
362.2
1.6
1.8
34.8
26.0
7.2
6.5
52.7
60.3
65.0
74.0
1.2
2.6
63.3
47.5
10.0
8.0
39.9
54.7
177.2
300.3
23.3
21.9
19.7
18.6
13.1
11.4
52.8
53.7
0.2
0.3
3.8
3.3
9.3
13.4
0.8
1.0
76.7
73.7
29.4
54.0
3.6
2.8
18.4
23.9
7.1
5.8
72.9
70.1
14.3
24.7
19.6
17.0
33.2
36.7
2.4
1.7
44.1
41.8
27.1
35.4
13.3
11.1
34.3
33.8
18.6
18.7
45.3
48.2
147.5
201.7
6.8
7.7
35.8
30.2
15.6
12.2
48.9
54.4
208.4
361.8
13.7
10.2
32.3
28.4
21.9
17.7
53.9
61.4
479.8
596.6
2.9
2.5
28.9
27.7
15.3
16.0
56.3
57.8
238.1
228.5
1.9
2.1
20.0
19.4
11.6
11.9
66.1
65.7
98.4
103.1
0.8
0.6
50.9
51.1
47.3
48.2
48.6
48.8
125.1
144.4
0.1
0.3
73.2
52.3
12.5
7.9
28.6
52.7
166.3
249.5
5.0
4.0
38.0
26.9
23.0
16.3
46.2
59.8
1,524.9
1,488.3
3.3
4.0
30.0
29.8
12.8
13.4
53.1
56.1
6.1
10.2
24.3
26.6
16.3
18.6
8.2
8.7
49.9
46.6
0.7
0.8
10.4
10.2
17.8
14.9
10.2
5.4
71.8
74.9
1.9
1.5
..
0.0
..
..
..
31.5
..
..
0.2
0.5
11.3
14.0
17.4
13.2
8.5
5.6
67.1
70.8
528.2
703.4
2.6
2.5
58.4
40.1
11.0
12.1
39.2
53.9
16.1
24.5
15.9
16.2
21.8
23.2
15.6
14.3
52.4
50.3
41.8
53.3
6.6
6.3
25.3
24.9
15.3
13.3
51.7
51.9
1.0
1.2
2.3
2.5
14.0
15.6
8.0
6.5
68.5
67.6
2.6
4.1
52.9
59.5
7.8
5.2
2.2
1.9
35.3
31.0
239.8
345.3
0.0
0.0
26.6
23.6
20.8
20.0
67.8
71.7
0.9
1.2
0.1
..
12.9
..
1.5
..
77.8
..
90.8
105.2
1.6
1.8
30.6
27.4
18.0
17.5
58.4
60.4
48.2
53.6
1.9
2.1
26.5
29.4
17.5
20.7
58.8
56.9
0.8
1.5
..
..
..
..
..
..
..
..
..
7.0
..
..
..
..
..
..
..
..
417.4
335.4
2.1
2.5
25.3
23.4
13.9
11.7
64.3
64.6
14.6
..
5.3
9.6
61.1
36.9
2.3
..
33.6
53.5
1,422.1
1,281.5
2.4
3.1
23.2
20.4
11.4
11.0
66.3
67.8
56.7
81.0
8.5
8.6
26.6
26.2
18.1
16.1
54.6
59.5
0.8
1.0
1.3
1.3
22.5
20.9
8.3
4.6
65.8
67.6
1.5
1.6
2.7
2.2
11.9
11.0
3.4
3.8
73.9
72.6
0.8
..
..
..
..
..
..
..
..
..
0.7
0.9
6.3
8.6
15.9
12.9
4.9
3.9
64.0
63.0
74.2
27.0
31.9
20.4
21.1
23.4
5.1
..
30.8
36.3
4.4
2.9
9.5
8.2
35.2
35.2
21.0
22.0
48.2
53.1
495.8
541.5
1.6
1.4
23.8
21.1
14.7
12.1
62.8
66.1
603.4
752.2
0.7
0.7
24.9
25.2
18.2
18.1
70.8
71.3
252.5
21.4
19.4
39.0
30.4
18.6
..
..
50.1
42.5
5.6
8.1
19.6
24.0
25.0
33.8
9.7
15.6
45.1
35.3
32.0
62.4
25.6
26.7
23.6
28.7
8.7
8.5
43.3
36.3
341.1
499.7
10.5
8.7
39.9
33.2
30.9
25.5
49.6
58.1
0.9
1.9
25.6
15.4
9.1
25.4
1.0
1.7
68.9
55.2
3.4
7.6
28.7
18.8
15.0
22.7
7.2
14.4
56.3
49.3
0.4
0.5
16.4
17.7
18.0
14.8
6.0
5.6
53.6
51.2
22.2
21.4
0.5
1.1
53.8
34.1
19.2
16.5
45.5
62.6
46.2
42.5
6.8
10.2
29.5
21.6
15.7
13.8
55.9
60.1
777.0
720.0
9.0
6.7
24.5
28.0
15.1
19.1
54.5
54.2
22.6
45.2
11.3
10.8
59.1
42.0
..
..
28.1
47.2
0.7
0.9
0.6
0.4
11.9
15.7
1.3
0.7
83.4
72.7
0.0
0.1
26.5
..
5.5
..
1.1
..
..
..
26.7
37.6
32.3
23.9
24.7
26.5
16.7
15.8
44.8
42.8
141.2
156.6
7.4
9.3
25.6
20.8
13.1
10.1
55.5
55.8
289.8
358.9
0.8
0.9
52.5
40.9
7.9
9.7
46.7
58.2
2,491.1
2,756.9
0.6
0.6
18.9
17.1
9.5
8.7
70.6
72.7
15,049.0
20,893.7
1.0
1.1
19.3
18.4
11.9
11.2
76.3
80.1
40.3
53.6
7.2
7.3
24.5
18.1
13.5
10.3
58.2
63.0
49.8
59.9
26.9
25.1
21.2
31.7
10.2
19.6
39.9
35.8
0.7
0.9
19.5
21.2
12.9
10.0
5.0
2.8
61.7
59.8
393.2
..
5.4
..
48.4
..
11.9
..
39.0
..
147.2
343.2
..
..
..
..
..
..
..
..
4.3
4.2
..
..
..
..
..
..
..
..
9.7
15.5
9.0
7.1
18.6
17.0
12.2
11.0
57.7
60.6
30.9
18.8
8.2
5.0
43.8
35.6
8.0
..
27.4
16.8
20.3
18.1
9.4
3.0
32.2
40.3
7.6
7.7
52.8
53.6
12.0
18.1
9.6
7.6
20.7
35.8
9.2
18.4
57.8
49.9
66,596.1
84,906.8
3.9
4.4
27.6
26.3
15.9
16.0
62.8
65.7
17,063.3
27,118.7
5.5
5.9
35.9
34.1
24.2
22.8
57.0
58.2
21,025.8
22,133.9
2.1
2.1
23.6
22.9
13.7
13.9
64.0
65.2
5,347.1
4,743.2
4.7
6.5
29.1
28.3
14.3
15.7
55.7
67.7
2,973.1
3,106.9
5.9
5.4
46.3
34.7
11.7
12.2
47.0
56.9
16,672.9
22,546.0
1.1
1.1
20.0
19.0
11.7
11.1
75.3
79.7
2,060.8
3,482.5
17.5
17.7
29.1
24.8
16.5
14.1
46.5
49.6
1,451.8
1,706.1
15.9
18.5
27.1
26.5
9.8
11.2
50.9
48.9
613.2
481.0
23.6
26.8
28.3
25.9
4.8
10.7
42.9
39.1
5,246.9
7,585.5
15.3
16.1
33.0
27.8
16.4
14.9
46.8
48.1
14,604.0
22,848.3
6.9
7.0
36.7
34.1
21.7
22.1
50.5
55.9
45,752.2
53,699.8
1.3
1.3
23.9
22.4
14.1
13.4
69.0
71.8
]" - ] - }, - "execution_count": 15, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "datos_tabla1" - ] - }, - { - "cell_type": "code", - "execution_count": 20, - "id": "2a1f5079-cc0b-401e-90f5-a811fba87bcc", - "metadata": {}, - "outputs": [], - "source": [ - "df = pd.read_html(str(sopa.select('div.scrollable')[0]))[0]" - ] - }, - { - "cell_type": "code", - "execution_count": 21, - "id": "cfaf6513-1dfa-416c-a614-dce7217648ec", - "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
012345678910
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
\n", - "
" - ], - "text/plain": [ - " 0 1 2 3 4 5 6 7 8 9 \\\n", - "0 Afghanistan 15.9 20.1 26.2 26.8 21.2 14.0 12.5 7.7 48.9 \n", - "1 Albania 11.9 15.1 18.0 19.3 24.9 20.0 5.5 6.0 44.0 \n", - "2 Algeria 161.2 145.0 8.5 14.1 40.0 20.3 39.0 18.8 39.2 \n", - "3 American Samoa 0.6 0.7 .. .. .. .. 7.2 12.2 .. \n", - "4 Andorra 3.4 2.9 .. 0.6 .. 12.7 .. 3.7 .. \n", - "\n", - " 10 \n", - "0 54.7 \n", - "1 48.4 \n", - "2 48.7 \n", - "3 .. \n", - "4 79.8 " - ] - }, - "execution_count": 21, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "df.head()" - ] - }, - { - "cell_type": "code", - "execution_count": 37, - "id": "0c4a8bbb-7a16-477d-b860-201834ae2216", - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "Int64Index([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10], dtype='int64')" - ] - }, - "execution_count": 37, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "df.columns" - ] - }, - { - "cell_type": "code", - "execution_count": 44, - "id": "78cb7ee7-8825-443b-8394-eec9f680a1aa", - "metadata": {}, - "outputs": [], - "source": [ - "df_header = pd.read_html(str(sopa.select('div.fixed')[0]))[0]" - ] - }, - { - "cell_type": "code", - "execution_count": 45, - "id": "f4edcffc-d4df-4e97-98c9-ccad9d782883", - "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
Unnamed: 0_level_0Gross domestic productAgricultureIndustryManufacturingServices
Unnamed: 0_level_1$ billions% of GDP% of GDP% of GDP% of GDP
Unnamed: 0_level_22010202020102020201020202010202020102020
\n", - "
" - ], - "text/plain": [ - "Empty DataFrame\n", - "Columns: [(Unnamed: 0_level_0, Unnamed: 0_level_1, Unnamed: 0_level_2), (Gross domestic product, $ billions, 2010), (Gross domestic product, $ billions, 2020), (Agriculture, % of GDP, 2010), (Agriculture, % of GDP, 2020), (Industry, % of GDP, 2010), (Industry, % of GDP, 2020), (Manufacturing, % of GDP, 2010), (Manufacturing, % of GDP, 2020), (Services, % of GDP, 2010), (Services, % of GDP, 2020)]\n", - "Index: []" - ] - }, - "execution_count": 45, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "df_header.head()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "e6cb0036-eacf-4da3-85cd-32eae80cab85", - "metadata": {}, - "outputs": [], - "source": [] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "974c3764-b484-4eae-a854-555ef7d952dc", - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.9.12" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} From aaea99d41d8cb602563114dc4cf1d764b276f4d8 Mon Sep 17 00:00:00 2001 From: GildaRIA <114354041+GildaRIA@users.noreply.github.com> Date: Sun, 4 Dec 2022 17:18:13 -0600 Subject: [PATCH 5/5] Add files via upload --- Proyecto2_GildaRIA_Try.ipynb | 7494 ++++++++++++++++++++++++++++++++++ README_ProyectoGilda.md | 10 + 2 files changed, 7504 insertions(+) create mode 100644 Proyecto2_GildaRIA_Try.ipynb create mode 100644 README_ProyectoGilda.md diff --git a/Proyecto2_GildaRIA_Try.ipynb b/Proyecto2_GildaRIA_Try.ipynb new file mode 100644 index 0000000..85e0029 --- /dev/null +++ b/Proyecto2_GildaRIA_Try.ipynb @@ -0,0 +1,7494 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "c483e8a0-576e-4f21-a19f-6fb8fa42fa14", + "metadata": {}, + "outputs": [], + "source": [ + "from bs4 import BeautifulSoup\n", + "import requests\n", + "import selenium\n", + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "3b69ee34-618c-4570-a45d-ce60b05a4353", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Requirement already satisfied: html5lib in c:\\anaconda\\lib\\site-packages (1.1)\n", + "Requirement already satisfied: webencodings in c:\\anaconda\\lib\\site-packages (from html5lib) (0.5.1)\n", + "Requirement already satisfied: six>=1.9 in c:\\anaconda\\lib\\site-packages (from html5lib) (1.16.0)\n", + "Requirement already satisfied: lxml in c:\\anaconda\\lib\\site-packages (4.8.0)\n" + ] + } + ], + "source": [ + "!pip install html5lib\n", + "!pip install lxml" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "a114183e-9356-4213-91fb-60a782bce915", + "metadata": {}, + "outputs": [], + "source": [ + "from selenium import webdriver\n", + "browser = webdriver.Chrome()" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "5f60973b-6658-4ec5-baa2-862eab88fd7b", + "metadata": {}, + "outputs": [], + "source": [ + "driver = webdriver.Chrome()" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "9e25c2fa-d714-4d5f-875d-644a534caf37", + "metadata": {}, + "outputs": [], + "source": [ + "url = 'http://wdi.worldbank.org/table/4.2'" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "909356bb-33df-42c7-b010-84f460b81b4e", + "metadata": {}, + "outputs": [], + "source": [ + "driver.get(url)" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "f637afb6-9ff0-4116-af43-554ebd65084b", + "metadata": {}, + "outputs": [], + "source": [ + "sopa = BeautifulSoup(driver.page_source)" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "id": "af6cae88-e924-4d40-9a0c-3e2efe2e1803", + "metadata": {}, + "outputs": [], + "source": [ + "datos_tabla1 = sopa.select('table')" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "e09fd631-90d9-4db7-8482-8d999c4bc4e0", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[
Economy
4.2
\n", + " World Development Indicators:\n", + " Structure of value added
,\n", + "
Structure of value added
$ billions
% of GDP
% of GDP
% of GDP
% of GDP
2010
2020
2010
2020
2010
2020
2010
2020
2010
2020
,\n", + "
15.9
20.1
26.2
26.8
21.2
14.0
12.5
7.7
48.9
54.7
11.9
15.1
18.0
19.3
24.9
20.0
5.5
6.0
44.0
48.4
161.2
145.0
8.5
14.1
40.0
20.3
39.0
18.8
39.2
48.7
0.6
0.7
..
..
..
..
7.2
12.2
..
..
3.4
2.9
..
0.6
..
12.7
..
3.7
..
79.8
81.7
53.6
6.2
9.1
52.4
45.7
4.5
6.9
41.9
45.4
1.1
1.4
1.6
2.2
16.2
21.1
2.2
2.4
70.7
65.3
423.6
389.6
7.1
5.9
25.3
23.3
15.8
15.4
51.5
54.6
9.3
12.6
17.9
11.2
27.8
27.1
9.4
12.4
45.7
53.2
2.5
2.5
0.4
..
15.8
..
3.1
..
68.1
..
1,147.6
1,327.8
2.2
2.0
25.2
25.5
8.0
5.7
65.7
66.3
392.3
433.3
1.3
1.1
25.5
25.5
16.5
16.3
62.3
63.1
52.9
42.7
5.5
6.7
59.8
42.0
4.7
6.1
27.9
42.4
10.1
9.7
1.1
0.8
11.5
12.0
2.1
1.4
81.1
79.1
25.7
34.7
0.3
0.3
45.0
40.3
14.5
18.1
53.7
56.6
115.3
373.9
17.0
12.0
25.0
32.9
16.1
20.6
53.5
51.5
4.5
4.7
1.3
1.5
14.1
12.8
5.8
4.9
..
..
57.2
61.5
8.9
7.1
35.4
30.8
22.5
21.5
43.5
49.5
481.4
521.7
0.8
0.6
20.9
19.5
13.3
12.4
67.7
69.6
1.4
1.6
11.6
11.5
19.0
14.2
12.3
5.7
60.6
61.2
9.5
15.7
25.8
27.1
18.0
16.3
11.7
9.7
44.5
47.9
6.6
6.9
0.3
0.3
6.6
5.6
0.9
0.3
88.9
90.3
1.5
2.3
14.8
19.2
43.8
34.4
8.9
5.9
37.3
43.7
19.6
36.6
10.4
14.0
30.1
23.5
11.3
11.0
43.6
52.8
17.2
20.0
6.8
6.1
22.5
24.6
10.9
13.1
55.5
55.8
12.8
14.9
2.5
2.1
31.9
27.8
6.4
5.7
55.0
65.8
2,208.8
1,448.6
4.1
5.9
23.3
17.7
12.7
9.7
57.6
62.8
13.7
12.0
0.7
1.2
68.7
59.1
14.9
15.8
32.5
41.5
50.7
69.9
4.0
3.5
23.8
21.9
..
..
59.5
61.3
10.1
17.9
24.1
18.4
26.1
32.6
12.1
9.3
42.1
40.8
2.0
2.8
38.4
28.6
15.4
10.7
9.2
..
37.0
45.5
1.7
1.7
8.0
4.9
18.1
23.1
5.4
7.3
61.2
58.9
11.2
25.9
33.9
22.7
21.9
34.6
14.7
16.2
38.3
36.6
27.5
40.8
17.3
17.4
25.8
23.3
14.5
13.3
50.6
52.0
1,617.3
1,645.4
1.5
1.7
26.4
24.6
10.0
9.9
65.7
66.9
4.2
5.6
0.3
0.4
7.1
8.0
0.8
0.9
87.6
86.9
2.1
2.3
37.4
29.5
24.5
20.4
18.4
17.7
29.3
40.0
10.7
10.7
51.9
46.8
12.0
16.0
1.0
3.2
33.4
43.6
..
..
..
..
..
..
..
..
..
..
217.1
252.7
3.5
4.1
33.5
30.0
9.9
8.9
53.8
56.1
6,087.2
14,687.7
9.3
7.7
46.5
37.8
31.6
26.3
44.2
54.5
228.6
344.9
0.1
0.1
6.8
6.1
1.7
0.9
90.9
89.6
28.2
25.6
..
..
4.8
8.4
0.6
0.9
94.0
88.7
286.6
270.3
6.3
7.4
31.4
23.8
14.0
10.9
53.4
59.9
0.9
1.2
30.4
35.8
11.8
8.1
..
..
53.2
51.4
21.6
48.7
21.4
20.9
38.7
41.2
16.2
19.0
35.4
35.7
13.1
10.5
4.0
7.6
66.2
48.2
5.3
8.1
25.4
40.4
37.7
62.2
6.5
4.4
23.3
20.1
14.6
12.7
61.9
68.4
34.9
61.3
17.5
21.4
16.0
20.9
9.0
11.2
37.8
42.1
60.4
57.2
3.7
3.2
21.4
21.2
13.0
12.1
59.8
59.3
59.6
107.4
3.6
2.8
22.9
23.0
15.6
11.2
72.5
73.5
2.9
2.5
0.4
0.2
15.0
15.0
6.1
4.1
77.0
74.9
25.7
24.7
2.1
1.9
14.5
12.6
5.1
5.5
71.6
74.3
209.1
245.3
1.5
1.9
33.2
30.8
21.0
21.9
55.8
58.3
322.0
356.1
1.2
1.3
19.7
21.2
10.9
14.0
65.4
64.6
1.1
3.2
..
1.7
..
14.9
..
4.4
..
77.3
0.5
0.5
11.5
15.2
11.7
12.2
2.4
2.9
60.3
57.9
53.9
78.8
6.1
6.0
27.9
30.3
15.3
14.4
59.3
57.2
69.6
99.3
9.7
9.8
34.7
30.7
13.4
16.5
51.1
53.3
219.0
365.3
13.3
11.6
35.8
32.0
16.1
16.4
46.2
51.8
18.4
24.6
7.0
5.1
25.3
23.8
16.1
14.9
59.5
61.5
16.3
10.1
1.1
2.9
74.7
45.4
21.0
20.1
24.7
51.5
1.6
..
14.1
..
21.8
..
5.5
..
..
..
19.5
30.7
3.2
2.2
24.4
22.7
13.7
12.9
59.9
62.7
4.4
4.0
10.2
8.4
37.7
31.3
32.5
26.5
49.6
53.6
29.9
107.7
41.4
35.6
9.4
23.1
4.0
5.3
41.8
36.8
2.3
3.2
14.9
13.6
14.2
20.5
5.4
6.9
58.1
53.9
3.1
4.6
9.4
14.5
17.0
17.0
12.3
11.6
57.5
53.7
249.4
271.8
2.4
2.4
26.2
24.0
17.0
14.3
58.9
60.1
2,645.2
2,630.3
1.6
1.6
17.8
16.4
10.3
9.4
70.7
71.2
..
5.7
..
..
..
..
..
..
..
..
14.4
15.3
3.9
6.7
55.2
40.7
17.1
18.3
30.8
45.7
1.5
1.8
35.2
21.0
9.8
19.0
4.6
2.9
49.2
52.2
12.2
15.8
8.5
7.3
16.9
21.2
9.1
9.3
63.1
59.1
3,399.7
3,846.4
0.8
0.7
26.8
26.5
19.7
18.2
62.3
63.3
32.2
70.0
28.0
18.9
18.0
29.9
6.4
11.0
48.2
45.2
297.1
188.8
3.0
4.2
14.9
15.0
7.9
8.9
70.3
68.6
2.5
3.1
13.4
17.3
18.1
18.1
4.3
3.4
65.6
60.7
0.8
1.0
4.5
4.9
14.7
13.1
3.5
3.1
68.4
66.8
4.9
5.8
..
..
..
..
..
..
..
..
40.7
77.6
11.2
10.2
27.5
22.1
18.9
14.1
59.5
61.9
6.9
14.2
17.5
25.7
32.3
28.3
10.6
9.6
43.4
37.6
0.8
1.4
45.1
30.9
13.1
13.5
11.3
9.1
39.4
50.2
3.4
5.5
28.5
16.9
24.9
38.8
5.7
4.2
41.6
38.9
11.9
14.5
20.2
20.4
23.5
23.3
14.5
17.6
52.5
53.9
15.8
23.8
11.6
12.1
25.6
26.0
16.5
16.0
60.6
58.3
132.2
156.7
3.0
3.4
25.2
24.6
18.1
17.5
56.7
56.6
13.8
21.7
6.3
4.3
22.0
19.7
13.0
8.7
61.9
66.2
1,675.6
2,667.7
17.0
18.2
30.7
24.5
17.0
13.7
45.0
48.4
755.1
1,058.7
13.9
13.7
42.8
38.3
22.0
19.9
40.7
44.4
486.8
231.5
6.5
12.8
44.2
35.7
12.8
20.0
51.1
49.0
138.5
184.4
5.2
6.0
55.8
41.3
2.3
2.7
39.7
54.3
221.9
425.9
1.0
0.9
23.3
38.0
19.5
34.5
66.7
54.8
5.9
7.3
0.6
0.3
9.2
7.6
3.6
2.1
93.0
93.9
234.7
407.1
1.6
1.2
20.8
18.6
14.1
11.3
66.8
71.4
2,136.1
1,892.6
1.8
2.0
21.9
21.6
14.2
14.8
66.3
66.8
13.2
13.8
5.3
8.7
18.0
20.4
7.8
8.0
66.5
59.7
5,759.1
5,040.1
1.1
1.0
28.3
29.0
20.8
19.7
70.5
69.5
27.1
43.7
3.6
5.2
26.3
23.9
18.9
17.3
59.1
61.6
148.0
171.1
4.5
5.4
40.6
33.1
11.3
13.1
51.7
56.1
45.4
100.7
17.6
22.6
18.6
17.4
11.2
7.6
57.0
53.9
0.2
0.2
24.2
26.2
11.9
9.8
5.6
4.4
63.9
67.9
..
..
..
..
..
..
..
..
..
..
1,144.1
1,637.9
2.1
1.8
34.1
32.6
27.4
24.8
54.7
57.1
5.3
7.7
9.5
7.4
27.0
27.6
13.8
13.4
45.9
47.6
115.4
106.0
0.5
0.5
66.1
45.4
6.0
6.6
47.0
69.1
4.8
7.8
17.4
13.6
26.3
29.2
16.9
14.5
49.3
49.8
7.1
19.0
22.6
16.3
30.5
32.4
11.1
7.7
43.6
41.0
24.0
33.6
4.1
4.0
20.4
19.4
11.9
10.9
64.5
63.5
38.4
25.9
3.9
8.9
13.8
17.6
7.7
12.3
71.9
81.3
2.2
2.3
4.9
4.7
31.5
35.5
13.1
14.8
53.8
43.7
2.0
3.0
44.8
41.1
5.0
17.7
2.6
..
50.2
41.6
75.4
52.3
1.8
4.1
75.7
48.3
4.0
2.9
32.2
55.8
5.1
6.4
..
0.1
..
44.2
..
38.7
..
52.2
37.1
56.5
3.0
3.2
26.2
25.0
16.9
15.7
60.7
61.6
56.2
73.4
0.3
0.2
11.0
11.2
5.0
4.6
78.9
79.7
10.0
13.2
29.1
24.8
18.0
16.4
9.5
10.7
48.8
51.8
7.0
12.2
29.6
22.7
15.2
18.5
9.9
11.5
47.9
52.6
255.0
337.0
10.1
8.2
40.5
35.9
23.4
22.3
48.5
54.8
2.6
3.7
5.6
8.0
9.4
11.8
2.3
2.5
77.7
70.8
10.7
17.5
33.0
36.2
22.7
21.2
6.7
6.8
35.5
34.4
9.0
14.9
1.3
0.4
17.6
13.4
11.2
7.5
69.3
76.9
0.2
0.2
11.6
21.8
13.7
12.8
3.7
3.4
71.5
67.2
5.6
7.9
16.7
20.2
38.2
28.8
6.7
6.1
39.9
42.5
10.0
10.9
3.6
3.4
22.5
16.6
14.2
10.7
62.9
68.2
1,057.8
1,087.1
3.2
3.8
32.4
29.6
15.6
17.2
60.4
60.3
0.3
0.4
24.7
22.5
7.2
4.9
0.4
0.5
60.7
66.8
7.0
11.9
11.2
8.7
20.4
22.8
10.0
10.5
54.5
55.5
5.4
6.8
..
..
12.9
14.9
..
..
87.1
76.7
7.2
13.3
11.7
13.0
33.2
37.0
6.8
7.8
44.8
40.5
4.1
4.8
7.7
7.6
17.1
17.3
4.6
4.1
58.6
58.0
93.2
114.7
12.9
11.7
25.7
26.1
15.6
15.3
51.0
50.8
11.1
14.0
26.8
25.6
16.4
21.8
10.0
8.1
47.0
41.5
37.8
78.9
37.4
20.9
25.6
38.6
19.0
24.8
37.0
40.5
11.4
10.6
8.5
9.2
27.4
25.8
12.3
11.1
54.0
58.8
16.0
33.4
33.2
22.2
14.2
12.0
5.9
4.5
46.4
53.9
847.4
913.9
1.8
1.6
19.7
17.8
10.5
10.8
68.4
69.8
9.4
9.4
1.3
1.8
26.2
22.4
5.6
..
64.9
65.5
146.5
211.7
6.6
5.7
21.2
20.4
10.8
9.8
64.4
65.6
8.8
12.6
17.0
15.6
22.0
25.8
14.3
13.5
51.7
48.8
7.9
13.7
35.8
38.4
23.0
20.2
6.9
7.3
35.1
36.2
361.5
432.3
23.9
24.1
25.3
28.2
6.6
12.7
50.8
46.4
9.4
12.1
10.1
8.6
21.0
22.8
9.9
13.2
55.1
56.2
0.8
1.2
..
..
..
..
..
..
..
..
428.8
362.2
1.6
1.8
34.8
26.0
7.2
6.5
52.7
60.3
65.0
74.0
1.2
2.6
63.3
47.5
10.0
8.0
39.9
54.7
177.2
300.3
23.3
21.9
19.7
18.6
13.1
11.4
52.8
53.7
0.2
0.3
3.8
3.3
9.3
13.4
0.8
1.0
76.7
73.7
29.4
54.0
3.6
2.8
18.4
23.9
7.1
5.8
72.9
70.1
14.3
24.7
19.6
17.0
33.2
36.7
2.4
1.7
44.1
41.8
27.1
35.4
13.3
11.1
34.3
33.8
18.6
18.7
45.3
48.2
147.5
201.7
6.8
7.7
35.8
30.2
15.6
12.2
48.9
54.4
208.4
361.8
13.7
10.2
32.3
28.4
21.9
17.7
53.9
61.4
479.8
596.6
2.9
2.5
28.9
27.7
15.3
16.0
56.3
57.8
238.1
228.5
1.9
2.1
20.0
19.4
11.6
11.9
66.1
65.7
98.4
103.1
0.8
0.6
50.9
51.1
47.3
48.2
48.6
48.8
125.1
144.4
0.1
0.3
73.2
52.3
12.5
7.9
28.6
52.7
166.3
249.5
5.0
4.0
38.0
26.9
23.0
16.3
46.2
59.8
1,524.9
1,488.3
3.3
4.0
30.0
29.8
12.8
13.4
53.1
56.1
6.1
10.2
24.3
26.6
16.3
18.6
8.2
8.7
49.9
46.6
0.7
0.8
10.4
10.2
17.8
14.9
10.2
5.4
71.8
74.9
1.9
1.5
..
0.0
..
..
..
31.5
..
..
0.2
0.5
11.3
14.0
17.4
13.2
8.5
5.6
67.1
70.8
528.2
703.4
2.6
2.5
58.4
40.1
11.0
12.1
39.2
53.9
16.1
24.5
15.9
16.2
21.8
23.2
15.6
14.3
52.4
50.3
41.8
53.3
6.6
6.3
25.3
24.9
15.3
13.3
51.7
51.9
1.0
1.2
2.3
2.5
14.0
15.6
8.0
6.5
68.5
67.6
2.6
4.1
52.9
59.5
7.8
5.2
2.2
1.9
35.3
31.0
239.8
345.3
0.0
0.0
26.6
23.6
20.8
20.0
67.8
71.7
0.9
1.2
0.1
..
12.9
..
1.5
..
77.8
..
90.8
105.2
1.6
1.8
30.6
27.4
18.0
17.5
58.4
60.4
48.2
53.6
1.9
2.1
26.5
29.4
17.5
20.7
58.8
56.9
0.8
1.5
..
..
..
..
..
..
..
..
..
7.0
..
..
..
..
..
..
..
..
417.4
335.4
2.1
2.5
25.3
23.4
13.9
11.7
64.3
64.6
14.6
..
5.3
9.6
61.1
36.9
2.3
..
33.6
53.5
1,422.1
1,281.5
2.4
3.1
23.2
20.4
11.4
11.0
66.3
67.8
56.7
81.0
8.5
8.6
26.6
26.2
18.1
16.1
54.6
59.5
0.8
1.0
1.3
1.3
22.5
20.9
8.3
4.6
65.8
67.6
1.5
1.6
2.7
2.2
11.9
11.0
3.4
3.8
73.9
72.6
0.8
..
..
..
..
..
..
..
..
..
0.7
0.9
6.3
8.6
15.9
12.9
4.9
3.9
64.0
63.0
74.2
27.0
31.9
20.4
21.1
23.4
5.1
..
30.8
36.3
4.4
2.9
9.5
8.2
35.2
35.2
21.0
22.0
48.2
53.1
495.8
541.5
1.6
1.4
23.8
21.1
14.7
12.1
62.8
66.1
603.4
752.2
0.7
0.7
24.9
25.2
18.2
18.1
70.8
71.3
252.5
21.4
19.4
39.0
30.4
18.6
..
..
50.1
42.5
5.6
8.1
19.6
24.0
25.0
33.8
9.7
15.6
45.1
35.3
32.0
62.4
25.6
26.7
23.6
28.7
8.7
8.5
43.3
36.3
341.1
499.7
10.5
8.7
39.9
33.2
30.9
25.5
49.6
58.1
0.9
1.9
25.6
15.4
9.1
25.4
1.0
1.7
68.9
55.2
3.4
7.6
28.7
18.8
15.0
22.7
7.2
14.4
56.3
49.3
0.4
0.5
16.4
17.7
18.0
14.8
6.0
5.6
53.6
51.2
22.2
21.4
0.5
1.1
53.8
34.1
19.2
16.5
45.5
62.6
46.2
42.5
6.8
10.2
29.5
21.6
15.7
13.8
55.9
60.1
777.0
720.0
9.0
6.7
24.5
28.0
15.1
19.1
54.5
54.2
22.6
45.2
11.3
10.8
59.1
42.0
..
..
28.1
47.2
0.7
0.9
0.6
0.4
11.9
15.7
1.3
0.7
83.4
72.7
0.0
0.1
26.5
..
5.5
..
1.1
..
..
..
26.7
37.6
32.3
23.9
24.7
26.5
16.7
15.8
44.8
42.8
141.2
156.6
7.4
9.3
25.6
20.8
13.1
10.1
55.5
55.8
289.8
358.9
0.8
0.9
52.5
40.9
7.9
9.7
46.7
58.2
2,491.1
2,756.9
0.6
0.6
18.9
17.1
9.5
8.7
70.6
72.7
15,049.0
20,893.7
1.0
1.1
19.3
18.4
11.9
11.2
76.3
80.1
40.3
53.6
7.2
7.3
24.5
18.1
13.5
10.3
58.2
63.0
49.8
59.9
26.9
25.1
21.2
31.7
10.2
19.6
39.9
35.8
0.7
0.9
19.5
21.2
12.9
10.0
5.0
2.8
61.7
59.8
393.2
..
5.4
..
48.4
..
11.9
..
39.0
..
147.2
343.2
..
..
..
..
..
..
..
..
4.3
4.2
..
..
..
..
..
..
..
..
9.7
15.5
9.0
7.1
18.6
17.0
12.2
11.0
57.7
60.6
30.9
18.8
8.2
5.0
43.8
35.6
8.0
..
27.4
16.8
20.3
18.1
9.4
3.0
32.2
40.3
7.6
7.7
52.8
53.6
12.0
18.1
9.6
7.6
20.7
35.8
9.2
18.4
57.8
49.9
66,596.1
84,906.8
3.9
4.4
27.6
26.3
15.9
16.0
62.8
65.7
17,063.3
27,118.7
5.5
5.9
35.9
34.1
24.2
22.8
57.0
58.2
21,025.8
22,133.9
2.1
2.1
23.6
22.9
13.7
13.9
64.0
65.2
5,347.1
4,743.2
4.7
6.5
29.1
28.3
14.3
15.7
55.7
67.7
2,973.1
3,106.9
5.9
5.4
46.3
34.7
11.7
12.2
47.0
56.9
16,672.9
22,546.0
1.1
1.1
20.0
19.0
11.7
11.1
75.3
79.7
2,060.8
3,482.5
17.5
17.7
29.1
24.8
16.5
14.1
46.5
49.6
1,451.8
1,706.1
15.9
18.5
27.1
26.5
9.8
11.2
50.9
48.9
613.2
481.0
23.6
26.8
28.3
25.9
4.8
10.7
42.9
39.1
5,246.9
7,585.5
15.3
16.1
33.0
27.8
16.4
14.9
46.8
48.1
14,604.0
22,848.3
6.9
7.0
36.7
34.1
21.7
22.1
50.5
55.9
45,752.2
53,699.8
1.3
1.3
23.9
22.4
14.1
13.4
69.0
71.8
]" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "datos_tabla1" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "2a1f5079-cc0b-401e-90f5-a811fba87bcc", + "metadata": {}, + "outputs": [], + "source": [ + "df = pd.read_html(str(sopa.select('div.scrollable')[0]))[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "id": "cfaf6513-1dfa-416c-a614-dce7217648ec", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
012345678910
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
\n", + "
" + ], + "text/plain": [ + " 0 1 2 3 4 5 6 7 8 9 \\\n", + "0 Afghanistan 15.9 20.1 26.2 26.8 21.2 14.0 12.5 7.7 48.9 \n", + "1 Albania 11.9 15.1 18.0 19.3 24.9 20.0 5.5 6.0 44.0 \n", + "2 Algeria 161.2 145.0 8.5 14.1 40.0 20.3 39.0 18.8 39.2 \n", + "3 American Samoa 0.6 0.7 .. .. .. .. 7.2 12.2 .. \n", + "4 Andorra 3.4 2.9 .. 0.6 .. 12.7 .. 3.7 .. \n", + "\n", + " 10 \n", + "0 54.7 \n", + "1 48.4 \n", + "2 48.7 \n", + "3 .. \n", + "4 79.8 " + ] + }, + "execution_count": 21, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 37, + "id": "0c4a8bbb-7a16-477d-b860-201834ae2216", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Int64Index([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10], dtype='int64')" + ] + }, + "execution_count": 37, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.columns" + ] + }, + { + "cell_type": "code", + "execution_count": 44, + "id": "78cb7ee7-8825-443b-8394-eec9f680a1aa", + "metadata": {}, + "outputs": [], + "source": [ + "df_header = pd.read_html(str(sopa.select('div.fixed')[0]))[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 45, + "id": "f4edcffc-d4df-4e97-98c9-ccad9d782883", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Unnamed: 0_level_0Gross domestic productAgricultureIndustryManufacturingServices
Unnamed: 0_level_1$ billions% of GDP% of GDP% of GDP% of GDP
Unnamed: 0_level_22010202020102020201020202010202020102020
\n", + "
" + ], + "text/plain": [ + "Empty DataFrame\n", + "Columns: [(Unnamed: 0_level_0, Unnamed: 0_level_1, Unnamed: 0_level_2), (Gross domestic product, $ billions, 2010), (Gross domestic product, $ billions, 2020), (Agriculture, % of GDP, 2010), (Agriculture, % of GDP, 2020), (Industry, % of GDP, 2010), (Industry, % of GDP, 2020), (Manufacturing, % of GDP, 2010), (Manufacturing, % of GDP, 2020), (Services, % of GDP, 2010), (Services, % of GDP, 2020)]\n", + "Index: []" + ] + }, + "execution_count": 45, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_header.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 55, + "id": "e6cb0036-eacf-4da3-85cd-32eae80cab85", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
País12345678910
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " País 1 2 3 4 5 6 7 \\\n", + "0 Afghanistan 15.9 20.1 26.2 26.8 21.2 14.0 12.5 \n", + "1 Albania 11.9 15.1 18.0 19.3 24.9 20.0 5.5 \n", + "2 Algeria 161.2 145.0 8.5 14.1 40.0 20.3 39.0 \n", + "3 American Samoa 0.6 0.7 .. .. .. .. 7.2 \n", + "4 Andorra 3.4 2.9 .. 0.6 .. 12.7 .. \n", + ".. ... ... ... ... ... ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 15.9 18.5 27.1 26.5 9.8 \n", + "222 Low income 613.2 481.0 23.6 26.8 28.3 25.9 4.8 \n", + "223 Lower middle income 5246.9 7585.5 15.3 16.1 33.0 27.8 16.4 \n", + "224 Upper middle income 14604.0 22848.3 6.9 7.0 36.7 34.1 21.7 \n", + "225 High income 45752.2 53699.8 1.3 1.3 23.9 22.4 14.1 \n", + "\n", + " 8 9 10 \n", + "0 7.7 48.9 54.7 \n", + "1 6.0 44.0 48.4 \n", + "2 18.8 39.2 48.7 \n", + "3 12.2 .. .. \n", + "4 3.7 .. 79.8 \n", + ".. ... ... ... \n", + "221 11.2 50.9 48.9 \n", + "222 10.7 42.9 39.1 \n", + "223 14.9 46.8 48.1 \n", + "224 22.1 50.5 55.9 \n", + "225 13.4 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 55, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.rename({'País': 0}, inplace = True)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 60, + "id": "974c3764-b484-4eae-a854-555ef7d952dc", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 .. .. .. \n", + "4 .. 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 60, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.columns = [\"Country\", \"GDP $billions 2010\", \"GDP $billions 2020\", \"Agriculture GDP% 2010\", \"Agriculture GDP% 2020\", \"Industry GDP% 2010\", \"Industry GDP% 2020\", \"Manufacturing GDP% 2010\", \"Manufacturing GDP% 2020\", \"Services GDP% 2010\", \"Services GDP% 2020\"]\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 68, + "id": "48c5b1b5-4929-49fa-a1e0-4f625549446f", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Country object\n", + "GDP $billions 2010 object\n", + "GDP $billions 2020 object\n", + "Agriculture GDP% 2010 object\n", + "Agriculture GDP% 2020 object\n", + "Industry GDP% 2010 object\n", + "Industry GDP% 2020 object\n", + "Manufacturing GDP% 2010 object\n", + "Manufacturing GDP% 2020 object\n", + "Services GDP% 2010 object\n", + "Services GDP% 2020 object\n", + "dtype: object" + ] + }, + "execution_count": 68, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.dtypes" + ] + }, + { + "cell_type": "code", + "execution_count": 92, + "id": "1162d94c-5fd5-4eb3-87ba-e0a05d332e5e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.70.00.00.00.07.212.20.00.0
4Andorra3.42.90.00.60.012.70.03.70.079.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 0.0 0.0 0.0 \n", + "4 0.0 0.6 0.0 \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 0.0 7.2 12.2 \n", + "4 12.7 0.0 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 0.0 0.0 \n", + "4 0.0 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 92, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.replace(['..'], 0.0)" + ] + }, + { + "cell_type": "code", + "execution_count": 96, + "id": "cdacd32d-065c-4536-816d-dfa1125b52bd", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 .. .. .. \n", + "4 .. 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 96, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['GDP $billions 2010'] = pd.to_numeric(df['GDP $billions 2010'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 97, + "id": "eaa9a40a-9eac-48c0-a91c-4042c8282240", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 .. .. .. \n", + "4 .. 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 97, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['GDP $billions 2010'] = df['GDP $billions 2010'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 98, + "id": "2a6a7db3-babd-4838-b04b-de475b635521", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 .. .. .. \n", + "4 .. 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 98, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['GDP $billions 2020'] = pd.to_numeric(df['GDP $billions 2020'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 99, + "id": "e3b9bdb1-474b-4ebd-bab0-dbc78b1693e6", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 .. .. .. \n", + "4 .. 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 99, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['GDP $billions 2020'] = df['GDP $billions 2020'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 100, + "id": "ac437d6d-5488-4205-89ec-5dd355adbf31", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaN......7.212.2....
4Andorra3.42.9NaN0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN .. .. \n", + "4 NaN 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 100, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Agriculture GDP% 2010'] = pd.to_numeric(df['Agriculture GDP% 2010'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 101, + "id": "21dbcdb6-042a-4dc8-9d7d-a588389c37da", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaN......7.212.2....
4Andorra3.42.9NaN0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN .. .. \n", + "4 NaN 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 101, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Agriculture GDP% 2010'] = df['Agriculture GDP% 2010'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 102, + "id": "c628c010-645e-40bb-97be-4300447672cc", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaN....7.212.2....
4Andorra3.42.9NaN0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN .. \n", + "4 NaN 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 102, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Agriculture GDP% 2020'] = pd.to_numeric(df['Agriculture GDP% 2020'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 103, + "id": "2acdb2ef-f665-4f46-af23-7666f07c3153", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaN....7.212.2....
4Andorra3.42.9NaN0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN .. \n", + "4 NaN 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 103, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Agriculture GDP% 2020'] = df['Agriculture GDP% 2020'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 104, + "id": "678d56f6-7f44-4f71-8c3b-5574751b0bf3", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaN..7.212.2....
4Andorra3.42.9NaN0.6NaN12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 104, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Industry GDP% 2010'] = pd.to_numeric(df['Industry GDP% 2010'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 106, + "id": "4e969618-eaa1-4c13-800a-ce5399c544b3", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaN..7.212.2....
4Andorra3.42.9NaN0.6NaN12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 106, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Industry GDP% 2010'] = df['Industry GDP% 2010'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 107, + "id": "3363a224-1919-4e00-9648-f1aad31ed4ff", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2....
4Andorra3.42.9NaN0.6NaN12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 107, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Industry GDP% 2020'] = pd.to_numeric(df['Industry GDP% 2020'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 108, + "id": "68611546-7a5c-438e-9df3-1dc15559161e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2....
4Andorra3.42.9NaN0.6NaN12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 108, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Industry GDP% 2020'] = df['Industry GDP% 2020'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 109, + "id": "aff3ff0f-66f2-4c25-aff3-84a89b46326b", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2....
4Andorra3.42.9NaN0.6NaN12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 109, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Manufacturing GDP% 2020'] = pd.to_numeric(df['Manufacturing GDP% 2020'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 110, + "id": "839788fb-c614-4d9b-a922-02b7c015a4b7", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2....
4Andorra3.42.9NaN0.6NaN12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 110, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Manufacturing GDP% 2020'] = df['Manufacturing GDP% 2020'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 111, + "id": "74d3c2a7-1d2c-4512-b481-c53d907cd232", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2....
4Andorra3.42.9NaN0.6NaN12.7NaN3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 NaN 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 111, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Manufacturing GDP% 2010'] = pd.to_numeric(df['Manufacturing GDP% 2010'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 112, + "id": "a5b54422-1b0f-47e9-8bb1-438038c2dcbd", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2....
4Andorra3.42.9NaN0.6NaN12.7NaN3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 NaN 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 112, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Manufacturing GDP% 2010'] = df['Manufacturing GDP% 2010'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 113, + "id": "999a3505-f285-444d-b843-515693f132a0", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2..NaN
4Andorra3.42.9NaN0.6NaN12.7NaN3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 NaN 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. NaN \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 113, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Services GDP% 2020'] = pd.to_numeric(df['Services GDP% 2020'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 114, + "id": "2ee4ef2a-f840-459a-8857-1dae6ade7a4f", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2..NaN
4Andorra3.42.9NaN0.6NaN12.7NaN3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 NaN 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. NaN \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 114, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Services GDP% 2020'] = df['Services GDP% 2020'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 115, + "id": "7d609d41-d5d8-4670-b7ca-0ea66e04a7ff", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2NaNNaN
4Andorra3.42.9NaN0.6NaN12.7NaN3.7NaN79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 NaN 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 NaN NaN \n", + "4 NaN 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 115, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Services GDP% 2010'] = pd.to_numeric(df['Services GDP% 2010'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 116, + "id": "74502001-0f67-4b6b-b80c-4a949b7009fb", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2NaNNaN
4Andorra3.42.9NaN0.6NaN12.7NaN3.7NaN79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 NaN 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 NaN NaN \n", + "4 NaN 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 116, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Services GDP% 2010'] = df['Services GDP% 2010'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 118, + "id": "82a2235f-e62d-42b4-a77c-68ea6a8b658e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Country object\n", + "GDP $billions 2010 float64\n", + "GDP $billions 2020 float64\n", + "Agriculture GDP% 2010 float64\n", + "Agriculture GDP% 2020 float64\n", + "Industry GDP% 2010 float64\n", + "Industry GDP% 2020 float64\n", + "Manufacturing GDP% 2010 float64\n", + "Manufacturing GDP% 2020 float64\n", + "Services GDP% 2010 float64\n", + "Services GDP% 2020 float64\n", + "dtype: object" + ] + }, + "execution_count": 118, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.dtypes" + ] + }, + { + "cell_type": "code", + "execution_count": 119, + "id": "d411b755-49d6-401c-b151-d61ff330143e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
GDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
count222.000000220.000000209.000000208.000000211.000000209.000000207.000000200.00000208.000000208.000000
mean1196.0594591537.55909110.97607710.38557726.59099524.88756011.56618411.7715055.11730857.306731
std5962.6633797607.17806111.20007710.29035413.7630039.9199756.9786587.1013313.63659112.313578
min0.0000000.1000000.0000000.0000004.8000004.9000000.4000000.3000024.70000016.800000
25%5.3250007.2250002.2000002.20000018.00000018.1000006.4000006.5750045.85000049.450000
50%25.70000032.0500006.8000007.20000024.50000023.50000011.30000011.2000054.50000056.400000
75%218.525000257.10000017.00000016.45000031.70000030.70000015.60000015.8000064.32500065.700000
max66596.10000084906.80000052.90000059.50000075.70000059.10000047.30000048.2000094.00000093.900000
\n", + "
" + ], + "text/plain": [ + " GDP $billions 2010 GDP $billions 2020 Agriculture GDP% 2010 \\\n", + "count 222.000000 220.000000 209.000000 \n", + "mean 1196.059459 1537.559091 10.976077 \n", + "std 5962.663379 7607.178061 11.200077 \n", + "min 0.000000 0.100000 0.000000 \n", + "25% 5.325000 7.225000 2.200000 \n", + "50% 25.700000 32.050000 6.800000 \n", + "75% 218.525000 257.100000 17.000000 \n", + "max 66596.100000 84906.800000 52.900000 \n", + "\n", + " Agriculture GDP% 2020 Industry GDP% 2010 Industry GDP% 2020 \\\n", + "count 208.000000 211.000000 209.000000 \n", + "mean 10.385577 26.590995 24.887560 \n", + "std 10.290354 13.763003 9.919975 \n", + "min 0.000000 4.800000 4.900000 \n", + "25% 2.200000 18.000000 18.100000 \n", + "50% 7.200000 24.500000 23.500000 \n", + "75% 16.450000 31.700000 30.700000 \n", + "max 59.500000 75.700000 59.100000 \n", + "\n", + " Manufacturing GDP% 2010 Manufacturing GDP% 2020 Services GDP% 2010 \\\n", + "count 207.000000 200.00000 208.000000 \n", + "mean 11.566184 11.77150 55.117308 \n", + "std 6.978658 7.10133 13.636591 \n", + "min 0.400000 0.30000 24.700000 \n", + "25% 6.400000 6.57500 45.850000 \n", + "50% 11.300000 11.20000 54.500000 \n", + "75% 15.600000 15.80000 64.325000 \n", + "max 47.300000 48.20000 94.000000 \n", + "\n", + " Services GDP% 2020 \n", + "count 208.000000 \n", + "mean 57.306731 \n", + "std 12.313578 \n", + "min 16.800000 \n", + "25% 49.450000 \n", + "50% 56.400000 \n", + "75% 65.700000 \n", + "max 93.900000 " + ] + }, + "execution_count": 119, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.describe()" + ] + }, + { + "cell_type": "code", + "execution_count": 126, + "id": "22807eba-83ff-4560-bd82-14da13ba452a", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
125Mexico1057.81087.13.23.832.429.615.617.260.460.3
\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 Agriculture GDP% 2010 \\\n", + "125 Mexico 1057.8 1087.1 3.2 \n", + "\n", + " Agriculture GDP% 2020 Industry GDP% 2010 Industry GDP% 2020 \\\n", + "125 3.8 32.4 29.6 \n", + "\n", + " Manufacturing GDP% 2010 Manufacturing GDP% 2020 Services GDP% 2010 \\\n", + "125 15.6 17.2 60.4 \n", + "\n", + " Services GDP% 2020 \n", + "125 60.3 " + ] + }, + "execution_count": 126, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df[df['Country']=='Mexico']" + ] + }, + { + "cell_type": "code", + "execution_count": 122, + "id": "60eda7b7-6038-4b2a-85aa-ff2f6369eef4", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.0" + ] + }, + "execution_count": 122, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "min_gdp10 = df['GDP $billions 2010'].min()\n", + "min_gdp10" + ] + }, + { + "cell_type": "code", + "execution_count": 123, + "id": "723f8d8c-bb94-41d6-8538-4af2077d8fb0", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010
198Tuvalu0.0
\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010\n", + "198 Tuvalu 0.0" + ] + }, + "execution_count": 123, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.loc[(df['GDP $billions 2010']==min_gdp10), ['Country', 'GDP $billions 2010']]" + ] + }, + { + "cell_type": "code", + "execution_count": 128, + "id": "06170cea-9078-4f06-bedc-c2d194aaa6c1", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.1" + ] + }, + "execution_count": 128, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "min_gdp20 = df['GDP $billions 2020'].min()\n", + "min_gdp20" + ] + }, + { + "cell_type": "code", + "execution_count": 129, + "id": "63fd3d6a-2829-4e07-9568-cc91137767ea", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2020
198Tuvalu0.1
\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2020\n", + "198 Tuvalu 0.1" + ] + }, + "execution_count": 129, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.loc[(df['GDP $billions 2020']==min_gdp20), ['Country', 'GDP $billions 2020']]" + ] + }, + { + "cell_type": "code", + "execution_count": 131, + "id": "d9b12970-f61f-4e05-9cae-2733bcb4c8b3", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020
3American Samoa0.60.7
6Antigua and Barbuda1.11.4
9Aruba2.52.5
19Belize1.41.6
22Bhutan1.52.3
30Burundi2.02.8
31Cabo Verde1.71.7
36Central African Republic2.12.3
44Comoros0.91.2
51Curacao2.92.5
55Djibouti1.13.2
56Dominica0.50.5
62Eritrea1.6NaN
66Faroe Islands2.33.2
72Gambia, The1.51.8
77Greenland2.53.1
78Grenada0.81.0
82Guinea-Bissau0.81.4
101Kiribati0.20.2
110Lesotho2.22.3
111Liberia2.03.0
119Maldives2.63.7
122Marshall Islands0.20.2
126Micronesia, Fed. Sts.0.30.4
143Northern Mariana Islands0.81.2
147Palau0.20.3
160Samoa0.70.8
161San Marino1.91.5
162Sao Tome and Principe0.20.5
166Seychelles1.01.2
167Sierra Leone2.64.1
169Sint Maarten (Dutch part)0.91.2
172Solomon Islands0.81.5
178St. Kitts and Nevis0.81.0
179St. Lucia1.51.6
180St. Martin (French part)0.8NaN
181St. Vincent and the Grenadines0.70.9
190Timor-Leste0.91.9
192Tonga0.40.5
197Turks and Caicos Islands0.70.9
206Vanuatu0.70.9
\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020\n", + "3 American Samoa 0.6 0.7\n", + "6 Antigua and Barbuda 1.1 1.4\n", + "9 Aruba 2.5 2.5\n", + "19 Belize 1.4 1.6\n", + "22 Bhutan 1.5 2.3\n", + "30 Burundi 2.0 2.8\n", + "31 Cabo Verde 1.7 1.7\n", + "36 Central African Republic 2.1 2.3\n", + "44 Comoros 0.9 1.2\n", + "51 Curacao 2.9 2.5\n", + "55 Djibouti 1.1 3.2\n", + "56 Dominica 0.5 0.5\n", + "62 Eritrea 1.6 NaN\n", + "66 Faroe Islands 2.3 3.2\n", + "72 Gambia, The 1.5 1.8\n", + "77 Greenland 2.5 3.1\n", + "78 Grenada 0.8 1.0\n", + "82 Guinea-Bissau 0.8 1.4\n", + "101 Kiribati 0.2 0.2\n", + "110 Lesotho 2.2 2.3\n", + "111 Liberia 2.0 3.0\n", + "119 Maldives 2.6 3.7\n", + "122 Marshall Islands 0.2 0.2\n", + "126 Micronesia, Fed. Sts. 0.3 0.4\n", + "143 Northern Mariana Islands 0.8 1.2\n", + "147 Palau 0.2 0.3\n", + "160 Samoa 0.7 0.8\n", + "161 San Marino 1.9 1.5\n", + "162 Sao Tome and Principe 0.2 0.5\n", + "166 Seychelles 1.0 1.2\n", + "167 Sierra Leone 2.6 4.1\n", + "169 Sint Maarten (Dutch part) 0.9 1.2\n", + "172 Solomon Islands 0.8 1.5\n", + "178 St. Kitts and Nevis 0.8 1.0\n", + "179 St. Lucia 1.5 1.6\n", + "180 St. Martin (French part) 0.8 NaN\n", + "181 St. Vincent and the Grenadines 0.7 0.9\n", + "190 Timor-Leste 0.9 1.9\n", + "192 Tonga 0.4 0.5\n", + "197 Turks and Caicos Islands 0.7 0.9\n", + "206 Vanuatu 0.7 0.9" + ] + }, + "execution_count": 131, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "paises_lowgdp = df.loc[(df['GDP $billions 2010']>0) & (df['GDP $billions 2010']<3), ['Country', 'GDP $billions 2010', 'GDP $billions 2020']]\n", + "paises_lowgdp" + ] + }, + { + "cell_type": "code", + "execution_count": 132, + "id": "08fb78a2-c682-4176-86a4-48ada7fa0775", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "66596.1" + ] + }, + "execution_count": 132, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "max_gdp10 = df['GDP $billions 2010'].max()\n", + "max_gdp10" + ] + }, + { + "cell_type": "code", + "execution_count": 150, + "id": "d6cfedee-10dc-4bdb-8893-07e7f664a3cd", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020
40China6087.214687.7
97Japan5759.15040.1
203United States15049.020893.7
215East Asia & Pacific17063.327118.7
216Europe & Central Asia21025.822133.9
217Latin America & Caribbean5347.14743.2
219North America16672.922546.0
223Lower middle income5246.97585.5
224Upper middle income14604.022848.3
225High income45752.253699.8
\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020\n", + "40 China 6087.2 14687.7\n", + "97 Japan 5759.1 5040.1\n", + "203 United States 15049.0 20893.7\n", + "215 East Asia & Pacific 17063.3 27118.7\n", + "216 Europe & Central Asia 21025.8 22133.9\n", + "217 Latin America & Caribbean 5347.1 4743.2\n", + "219 North America 16672.9 22546.0\n", + "223 Lower middle income 5246.9 7585.5\n", + "224 Upper middle income 14604.0 22848.3\n", + "225 High income 45752.2 53699.8" + ] + }, + "execution_count": 150, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "paises_maxgdp = df.loc[(df['GDP $billions 2010']>5000) & (df['GDP $billions 2010']<66596.1), ['Country', 'GDP $billions 2010', 'GDP $billions 2020']]\n", + "paises_maxgdp" + ] + }, + { + "cell_type": "code", + "execution_count": 151, + "id": "92fd5f20-9505-4e8b-aca4-55ce5aa6a747", + "metadata": {}, + "outputs": [], + "source": [ + "df.to_csv('ProyectoGDP_Paises.csv')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0a50003e-d0a4-40a5-9dc4-621bdfebfce9", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/README_ProyectoGilda.md b/README_ProyectoGilda.md new file mode 100644 index 0000000..ae6b8c4 --- /dev/null +++ b/README_ProyectoGilda.md @@ -0,0 +1,10 @@ +### Proyecto web scrapping + +## Web scraapping + +Los problemas que encontré al resolver este trabajo fueron: + +>Encontrar una web que me interesara con datos numéricos. +>Encontrar una web cuyos datos estuvieran en tablas. +>Cuando extraje los datos, me di cuenta de que estaban guardados como strings y para mí fue difícil convertirlos en float. +>Al final pude trabajar con los datos y el dataframe.