diff --git a/Proyecto2_GildaRIA_Try.ipynb b/Proyecto2_GildaRIA_Try.ipynb new file mode 100644 index 0000000..85e0029 --- /dev/null +++ b/Proyecto2_GildaRIA_Try.ipynb @@ -0,0 +1,7494 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "c483e8a0-576e-4f21-a19f-6fb8fa42fa14", + "metadata": {}, + "outputs": [], + "source": [ + "from bs4 import BeautifulSoup\n", + "import requests\n", + "import selenium\n", + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "3b69ee34-618c-4570-a45d-ce60b05a4353", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Requirement already satisfied: html5lib in c:\\anaconda\\lib\\site-packages (1.1)\n", + "Requirement already satisfied: webencodings in c:\\anaconda\\lib\\site-packages (from html5lib) (0.5.1)\n", + "Requirement already satisfied: six>=1.9 in c:\\anaconda\\lib\\site-packages (from html5lib) (1.16.0)\n", + "Requirement already satisfied: lxml in c:\\anaconda\\lib\\site-packages (4.8.0)\n" + ] + } + ], + "source": [ + "!pip install html5lib\n", + "!pip install lxml" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "a114183e-9356-4213-91fb-60a782bce915", + "metadata": {}, + "outputs": [], + "source": [ + "from selenium import webdriver\n", + "browser = webdriver.Chrome()" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "5f60973b-6658-4ec5-baa2-862eab88fd7b", + "metadata": {}, + "outputs": [], + "source": [ + "driver = webdriver.Chrome()" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "9e25c2fa-d714-4d5f-875d-644a534caf37", + "metadata": {}, + "outputs": [], + "source": [ + "url = 'http://wdi.worldbank.org/table/4.2'" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "909356bb-33df-42c7-b010-84f460b81b4e", + "metadata": {}, + "outputs": [], + "source": [ + "driver.get(url)" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "f637afb6-9ff0-4116-af43-554ebd65084b", + "metadata": {}, + "outputs": [], + "source": [ + "sopa = BeautifulSoup(driver.page_source)" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "id": "af6cae88-e924-4d40-9a0c-3e2efe2e1803", + "metadata": {}, + "outputs": [], + "source": [ + "datos_tabla1 = sopa.select('table')" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "e09fd631-90d9-4db7-8482-8d999c4bc4e0", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[
Economy
4.2
\n", + " World Development Indicators:\n", + " Structure of value added
,\n", + "
Structure of value added
$ billions
% of GDP
% of GDP
% of GDP
% of GDP
2010
2020
2010
2020
2010
2020
2010
2020
2010
2020
,\n", + "
15.9
20.1
26.2
26.8
21.2
14.0
12.5
7.7
48.9
54.7
11.9
15.1
18.0
19.3
24.9
20.0
5.5
6.0
44.0
48.4
161.2
145.0
8.5
14.1
40.0
20.3
39.0
18.8
39.2
48.7
0.6
0.7
..
..
..
..
7.2
12.2
..
..
3.4
2.9
..
0.6
..
12.7
..
3.7
..
79.8
81.7
53.6
6.2
9.1
52.4
45.7
4.5
6.9
41.9
45.4
1.1
1.4
1.6
2.2
16.2
21.1
2.2
2.4
70.7
65.3
423.6
389.6
7.1
5.9
25.3
23.3
15.8
15.4
51.5
54.6
9.3
12.6
17.9
11.2
27.8
27.1
9.4
12.4
45.7
53.2
2.5
2.5
0.4
..
15.8
..
3.1
..
68.1
..
1,147.6
1,327.8
2.2
2.0
25.2
25.5
8.0
5.7
65.7
66.3
392.3
433.3
1.3
1.1
25.5
25.5
16.5
16.3
62.3
63.1
52.9
42.7
5.5
6.7
59.8
42.0
4.7
6.1
27.9
42.4
10.1
9.7
1.1
0.8
11.5
12.0
2.1
1.4
81.1
79.1
25.7
34.7
0.3
0.3
45.0
40.3
14.5
18.1
53.7
56.6
115.3
373.9
17.0
12.0
25.0
32.9
16.1
20.6
53.5
51.5
4.5
4.7
1.3
1.5
14.1
12.8
5.8
4.9
..
..
57.2
61.5
8.9
7.1
35.4
30.8
22.5
21.5
43.5
49.5
481.4
521.7
0.8
0.6
20.9
19.5
13.3
12.4
67.7
69.6
1.4
1.6
11.6
11.5
19.0
14.2
12.3
5.7
60.6
61.2
9.5
15.7
25.8
27.1
18.0
16.3
11.7
9.7
44.5
47.9
6.6
6.9
0.3
0.3
6.6
5.6
0.9
0.3
88.9
90.3
1.5
2.3
14.8
19.2
43.8
34.4
8.9
5.9
37.3
43.7
19.6
36.6
10.4
14.0
30.1
23.5
11.3
11.0
43.6
52.8
17.2
20.0
6.8
6.1
22.5
24.6
10.9
13.1
55.5
55.8
12.8
14.9
2.5
2.1
31.9
27.8
6.4
5.7
55.0
65.8
2,208.8
1,448.6
4.1
5.9
23.3
17.7
12.7
9.7
57.6
62.8
13.7
12.0
0.7
1.2
68.7
59.1
14.9
15.8
32.5
41.5
50.7
69.9
4.0
3.5
23.8
21.9
..
..
59.5
61.3
10.1
17.9
24.1
18.4
26.1
32.6
12.1
9.3
42.1
40.8
2.0
2.8
38.4
28.6
15.4
10.7
9.2
..
37.0
45.5
1.7
1.7
8.0
4.9
18.1
23.1
5.4
7.3
61.2
58.9
11.2
25.9
33.9
22.7
21.9
34.6
14.7
16.2
38.3
36.6
27.5
40.8
17.3
17.4
25.8
23.3
14.5
13.3
50.6
52.0
1,617.3
1,645.4
1.5
1.7
26.4
24.6
10.0
9.9
65.7
66.9
4.2
5.6
0.3
0.4
7.1
8.0
0.8
0.9
87.6
86.9
2.1
2.3
37.4
29.5
24.5
20.4
18.4
17.7
29.3
40.0
10.7
10.7
51.9
46.8
12.0
16.0
1.0
3.2
33.4
43.6
..
..
..
..
..
..
..
..
..
..
217.1
252.7
3.5
4.1
33.5
30.0
9.9
8.9
53.8
56.1
6,087.2
14,687.7
9.3
7.7
46.5
37.8
31.6
26.3
44.2
54.5
228.6
344.9
0.1
0.1
6.8
6.1
1.7
0.9
90.9
89.6
28.2
25.6
..
..
4.8
8.4
0.6
0.9
94.0
88.7
286.6
270.3
6.3
7.4
31.4
23.8
14.0
10.9
53.4
59.9
0.9
1.2
30.4
35.8
11.8
8.1
..
..
53.2
51.4
21.6
48.7
21.4
20.9
38.7
41.2
16.2
19.0
35.4
35.7
13.1
10.5
4.0
7.6
66.2
48.2
5.3
8.1
25.4
40.4
37.7
62.2
6.5
4.4
23.3
20.1
14.6
12.7
61.9
68.4
34.9
61.3
17.5
21.4
16.0
20.9
9.0
11.2
37.8
42.1
60.4
57.2
3.7
3.2
21.4
21.2
13.0
12.1
59.8
59.3
59.6
107.4
3.6
2.8
22.9
23.0
15.6
11.2
72.5
73.5
2.9
2.5
0.4
0.2
15.0
15.0
6.1
4.1
77.0
74.9
25.7
24.7
2.1
1.9
14.5
12.6
5.1
5.5
71.6
74.3
209.1
245.3
1.5
1.9
33.2
30.8
21.0
21.9
55.8
58.3
322.0
356.1
1.2
1.3
19.7
21.2
10.9
14.0
65.4
64.6
1.1
3.2
..
1.7
..
14.9
..
4.4
..
77.3
0.5
0.5
11.5
15.2
11.7
12.2
2.4
2.9
60.3
57.9
53.9
78.8
6.1
6.0
27.9
30.3
15.3
14.4
59.3
57.2
69.6
99.3
9.7
9.8
34.7
30.7
13.4
16.5
51.1
53.3
219.0
365.3
13.3
11.6
35.8
32.0
16.1
16.4
46.2
51.8
18.4
24.6
7.0
5.1
25.3
23.8
16.1
14.9
59.5
61.5
16.3
10.1
1.1
2.9
74.7
45.4
21.0
20.1
24.7
51.5
1.6
..
14.1
..
21.8
..
5.5
..
..
..
19.5
30.7
3.2
2.2
24.4
22.7
13.7
12.9
59.9
62.7
4.4
4.0
10.2
8.4
37.7
31.3
32.5
26.5
49.6
53.6
29.9
107.7
41.4
35.6
9.4
23.1
4.0
5.3
41.8
36.8
2.3
3.2
14.9
13.6
14.2
20.5
5.4
6.9
58.1
53.9
3.1
4.6
9.4
14.5
17.0
17.0
12.3
11.6
57.5
53.7
249.4
271.8
2.4
2.4
26.2
24.0
17.0
14.3
58.9
60.1
2,645.2
2,630.3
1.6
1.6
17.8
16.4
10.3
9.4
70.7
71.2
..
5.7
..
..
..
..
..
..
..
..
14.4
15.3
3.9
6.7
55.2
40.7
17.1
18.3
30.8
45.7
1.5
1.8
35.2
21.0
9.8
19.0
4.6
2.9
49.2
52.2
12.2
15.8
8.5
7.3
16.9
21.2
9.1
9.3
63.1
59.1
3,399.7
3,846.4
0.8
0.7
26.8
26.5
19.7
18.2
62.3
63.3
32.2
70.0
28.0
18.9
18.0
29.9
6.4
11.0
48.2
45.2
297.1
188.8
3.0
4.2
14.9
15.0
7.9
8.9
70.3
68.6
2.5
3.1
13.4
17.3
18.1
18.1
4.3
3.4
65.6
60.7
0.8
1.0
4.5
4.9
14.7
13.1
3.5
3.1
68.4
66.8
4.9
5.8
..
..
..
..
..
..
..
..
40.7
77.6
11.2
10.2
27.5
22.1
18.9
14.1
59.5
61.9
6.9
14.2
17.5
25.7
32.3
28.3
10.6
9.6
43.4
37.6
0.8
1.4
45.1
30.9
13.1
13.5
11.3
9.1
39.4
50.2
3.4
5.5
28.5
16.9
24.9
38.8
5.7
4.2
41.6
38.9
11.9
14.5
20.2
20.4
23.5
23.3
14.5
17.6
52.5
53.9
15.8
23.8
11.6
12.1
25.6
26.0
16.5
16.0
60.6
58.3
132.2
156.7
3.0
3.4
25.2
24.6
18.1
17.5
56.7
56.6
13.8
21.7
6.3
4.3
22.0
19.7
13.0
8.7
61.9
66.2
1,675.6
2,667.7
17.0
18.2
30.7
24.5
17.0
13.7
45.0
48.4
755.1
1,058.7
13.9
13.7
42.8
38.3
22.0
19.9
40.7
44.4
486.8
231.5
6.5
12.8
44.2
35.7
12.8
20.0
51.1
49.0
138.5
184.4
5.2
6.0
55.8
41.3
2.3
2.7
39.7
54.3
221.9
425.9
1.0
0.9
23.3
38.0
19.5
34.5
66.7
54.8
5.9
7.3
0.6
0.3
9.2
7.6
3.6
2.1
93.0
93.9
234.7
407.1
1.6
1.2
20.8
18.6
14.1
11.3
66.8
71.4
2,136.1
1,892.6
1.8
2.0
21.9
21.6
14.2
14.8
66.3
66.8
13.2
13.8
5.3
8.7
18.0
20.4
7.8
8.0
66.5
59.7
5,759.1
5,040.1
1.1
1.0
28.3
29.0
20.8
19.7
70.5
69.5
27.1
43.7
3.6
5.2
26.3
23.9
18.9
17.3
59.1
61.6
148.0
171.1
4.5
5.4
40.6
33.1
11.3
13.1
51.7
56.1
45.4
100.7
17.6
22.6
18.6
17.4
11.2
7.6
57.0
53.9
0.2
0.2
24.2
26.2
11.9
9.8
5.6
4.4
63.9
67.9
..
..
..
..
..
..
..
..
..
..
1,144.1
1,637.9
2.1
1.8
34.1
32.6
27.4
24.8
54.7
57.1
5.3
7.7
9.5
7.4
27.0
27.6
13.8
13.4
45.9
47.6
115.4
106.0
0.5
0.5
66.1
45.4
6.0
6.6
47.0
69.1
4.8
7.8
17.4
13.6
26.3
29.2
16.9
14.5
49.3
49.8
7.1
19.0
22.6
16.3
30.5
32.4
11.1
7.7
43.6
41.0
24.0
33.6
4.1
4.0
20.4
19.4
11.9
10.9
64.5
63.5
38.4
25.9
3.9
8.9
13.8
17.6
7.7
12.3
71.9
81.3
2.2
2.3
4.9
4.7
31.5
35.5
13.1
14.8
53.8
43.7
2.0
3.0
44.8
41.1
5.0
17.7
2.6
..
50.2
41.6
75.4
52.3
1.8
4.1
75.7
48.3
4.0
2.9
32.2
55.8
5.1
6.4
..
0.1
..
44.2
..
38.7
..
52.2
37.1
56.5
3.0
3.2
26.2
25.0
16.9
15.7
60.7
61.6
56.2
73.4
0.3
0.2
11.0
11.2
5.0
4.6
78.9
79.7
10.0
13.2
29.1
24.8
18.0
16.4
9.5
10.7
48.8
51.8
7.0
12.2
29.6
22.7
15.2
18.5
9.9
11.5
47.9
52.6
255.0
337.0
10.1
8.2
40.5
35.9
23.4
22.3
48.5
54.8
2.6
3.7
5.6
8.0
9.4
11.8
2.3
2.5
77.7
70.8
10.7
17.5
33.0
36.2
22.7
21.2
6.7
6.8
35.5
34.4
9.0
14.9
1.3
0.4
17.6
13.4
11.2
7.5
69.3
76.9
0.2
0.2
11.6
21.8
13.7
12.8
3.7
3.4
71.5
67.2
5.6
7.9
16.7
20.2
38.2
28.8
6.7
6.1
39.9
42.5
10.0
10.9
3.6
3.4
22.5
16.6
14.2
10.7
62.9
68.2
1,057.8
1,087.1
3.2
3.8
32.4
29.6
15.6
17.2
60.4
60.3
0.3
0.4
24.7
22.5
7.2
4.9
0.4
0.5
60.7
66.8
7.0
11.9
11.2
8.7
20.4
22.8
10.0
10.5
54.5
55.5
5.4
6.8
..
..
12.9
14.9
..
..
87.1
76.7
7.2
13.3
11.7
13.0
33.2
37.0
6.8
7.8
44.8
40.5
4.1
4.8
7.7
7.6
17.1
17.3
4.6
4.1
58.6
58.0
93.2
114.7
12.9
11.7
25.7
26.1
15.6
15.3
51.0
50.8
11.1
14.0
26.8
25.6
16.4
21.8
10.0
8.1
47.0
41.5
37.8
78.9
37.4
20.9
25.6
38.6
19.0
24.8
37.0
40.5
11.4
10.6
8.5
9.2
27.4
25.8
12.3
11.1
54.0
58.8
16.0
33.4
33.2
22.2
14.2
12.0
5.9
4.5
46.4
53.9
847.4
913.9
1.8
1.6
19.7
17.8
10.5
10.8
68.4
69.8
9.4
9.4
1.3
1.8
26.2
22.4
5.6
..
64.9
65.5
146.5
211.7
6.6
5.7
21.2
20.4
10.8
9.8
64.4
65.6
8.8
12.6
17.0
15.6
22.0
25.8
14.3
13.5
51.7
48.8
7.9
13.7
35.8
38.4
23.0
20.2
6.9
7.3
35.1
36.2
361.5
432.3
23.9
24.1
25.3
28.2
6.6
12.7
50.8
46.4
9.4
12.1
10.1
8.6
21.0
22.8
9.9
13.2
55.1
56.2
0.8
1.2
..
..
..
..
..
..
..
..
428.8
362.2
1.6
1.8
34.8
26.0
7.2
6.5
52.7
60.3
65.0
74.0
1.2
2.6
63.3
47.5
10.0
8.0
39.9
54.7
177.2
300.3
23.3
21.9
19.7
18.6
13.1
11.4
52.8
53.7
0.2
0.3
3.8
3.3
9.3
13.4
0.8
1.0
76.7
73.7
29.4
54.0
3.6
2.8
18.4
23.9
7.1
5.8
72.9
70.1
14.3
24.7
19.6
17.0
33.2
36.7
2.4
1.7
44.1
41.8
27.1
35.4
13.3
11.1
34.3
33.8
18.6
18.7
45.3
48.2
147.5
201.7
6.8
7.7
35.8
30.2
15.6
12.2
48.9
54.4
208.4
361.8
13.7
10.2
32.3
28.4
21.9
17.7
53.9
61.4
479.8
596.6
2.9
2.5
28.9
27.7
15.3
16.0
56.3
57.8
238.1
228.5
1.9
2.1
20.0
19.4
11.6
11.9
66.1
65.7
98.4
103.1
0.8
0.6
50.9
51.1
47.3
48.2
48.6
48.8
125.1
144.4
0.1
0.3
73.2
52.3
12.5
7.9
28.6
52.7
166.3
249.5
5.0
4.0
38.0
26.9
23.0
16.3
46.2
59.8
1,524.9
1,488.3
3.3
4.0
30.0
29.8
12.8
13.4
53.1
56.1
6.1
10.2
24.3
26.6
16.3
18.6
8.2
8.7
49.9
46.6
0.7
0.8
10.4
10.2
17.8
14.9
10.2
5.4
71.8
74.9
1.9
1.5
..
0.0
..
..
..
31.5
..
..
0.2
0.5
11.3
14.0
17.4
13.2
8.5
5.6
67.1
70.8
528.2
703.4
2.6
2.5
58.4
40.1
11.0
12.1
39.2
53.9
16.1
24.5
15.9
16.2
21.8
23.2
15.6
14.3
52.4
50.3
41.8
53.3
6.6
6.3
25.3
24.9
15.3
13.3
51.7
51.9
1.0
1.2
2.3
2.5
14.0
15.6
8.0
6.5
68.5
67.6
2.6
4.1
52.9
59.5
7.8
5.2
2.2
1.9
35.3
31.0
239.8
345.3
0.0
0.0
26.6
23.6
20.8
20.0
67.8
71.7
0.9
1.2
0.1
..
12.9
..
1.5
..
77.8
..
90.8
105.2
1.6
1.8
30.6
27.4
18.0
17.5
58.4
60.4
48.2
53.6
1.9
2.1
26.5
29.4
17.5
20.7
58.8
56.9
0.8
1.5
..
..
..
..
..
..
..
..
..
7.0
..
..
..
..
..
..
..
..
417.4
335.4
2.1
2.5
25.3
23.4
13.9
11.7
64.3
64.6
14.6
..
5.3
9.6
61.1
36.9
2.3
..
33.6
53.5
1,422.1
1,281.5
2.4
3.1
23.2
20.4
11.4
11.0
66.3
67.8
56.7
81.0
8.5
8.6
26.6
26.2
18.1
16.1
54.6
59.5
0.8
1.0
1.3
1.3
22.5
20.9
8.3
4.6
65.8
67.6
1.5
1.6
2.7
2.2
11.9
11.0
3.4
3.8
73.9
72.6
0.8
..
..
..
..
..
..
..
..
..
0.7
0.9
6.3
8.6
15.9
12.9
4.9
3.9
64.0
63.0
74.2
27.0
31.9
20.4
21.1
23.4
5.1
..
30.8
36.3
4.4
2.9
9.5
8.2
35.2
35.2
21.0
22.0
48.2
53.1
495.8
541.5
1.6
1.4
23.8
21.1
14.7
12.1
62.8
66.1
603.4
752.2
0.7
0.7
24.9
25.2
18.2
18.1
70.8
71.3
252.5
21.4
19.4
39.0
30.4
18.6
..
..
50.1
42.5
5.6
8.1
19.6
24.0
25.0
33.8
9.7
15.6
45.1
35.3
32.0
62.4
25.6
26.7
23.6
28.7
8.7
8.5
43.3
36.3
341.1
499.7
10.5
8.7
39.9
33.2
30.9
25.5
49.6
58.1
0.9
1.9
25.6
15.4
9.1
25.4
1.0
1.7
68.9
55.2
3.4
7.6
28.7
18.8
15.0
22.7
7.2
14.4
56.3
49.3
0.4
0.5
16.4
17.7
18.0
14.8
6.0
5.6
53.6
51.2
22.2
21.4
0.5
1.1
53.8
34.1
19.2
16.5
45.5
62.6
46.2
42.5
6.8
10.2
29.5
21.6
15.7
13.8
55.9
60.1
777.0
720.0
9.0
6.7
24.5
28.0
15.1
19.1
54.5
54.2
22.6
45.2
11.3
10.8
59.1
42.0
..
..
28.1
47.2
0.7
0.9
0.6
0.4
11.9
15.7
1.3
0.7
83.4
72.7
0.0
0.1
26.5
..
5.5
..
1.1
..
..
..
26.7
37.6
32.3
23.9
24.7
26.5
16.7
15.8
44.8
42.8
141.2
156.6
7.4
9.3
25.6
20.8
13.1
10.1
55.5
55.8
289.8
358.9
0.8
0.9
52.5
40.9
7.9
9.7
46.7
58.2
2,491.1
2,756.9
0.6
0.6
18.9
17.1
9.5
8.7
70.6
72.7
15,049.0
20,893.7
1.0
1.1
19.3
18.4
11.9
11.2
76.3
80.1
40.3
53.6
7.2
7.3
24.5
18.1
13.5
10.3
58.2
63.0
49.8
59.9
26.9
25.1
21.2
31.7
10.2
19.6
39.9
35.8
0.7
0.9
19.5
21.2
12.9
10.0
5.0
2.8
61.7
59.8
393.2
..
5.4
..
48.4
..
11.9
..
39.0
..
147.2
343.2
..
..
..
..
..
..
..
..
4.3
4.2
..
..
..
..
..
..
..
..
9.7
15.5
9.0
7.1
18.6
17.0
12.2
11.0
57.7
60.6
30.9
18.8
8.2
5.0
43.8
35.6
8.0
..
27.4
16.8
20.3
18.1
9.4
3.0
32.2
40.3
7.6
7.7
52.8
53.6
12.0
18.1
9.6
7.6
20.7
35.8
9.2
18.4
57.8
49.9
66,596.1
84,906.8
3.9
4.4
27.6
26.3
15.9
16.0
62.8
65.7
17,063.3
27,118.7
5.5
5.9
35.9
34.1
24.2
22.8
57.0
58.2
21,025.8
22,133.9
2.1
2.1
23.6
22.9
13.7
13.9
64.0
65.2
5,347.1
4,743.2
4.7
6.5
29.1
28.3
14.3
15.7
55.7
67.7
2,973.1
3,106.9
5.9
5.4
46.3
34.7
11.7
12.2
47.0
56.9
16,672.9
22,546.0
1.1
1.1
20.0
19.0
11.7
11.1
75.3
79.7
2,060.8
3,482.5
17.5
17.7
29.1
24.8
16.5
14.1
46.5
49.6
1,451.8
1,706.1
15.9
18.5
27.1
26.5
9.8
11.2
50.9
48.9
613.2
481.0
23.6
26.8
28.3
25.9
4.8
10.7
42.9
39.1
5,246.9
7,585.5
15.3
16.1
33.0
27.8
16.4
14.9
46.8
48.1
14,604.0
22,848.3
6.9
7.0
36.7
34.1
21.7
22.1
50.5
55.9
45,752.2
53,699.8
1.3
1.3
23.9
22.4
14.1
13.4
69.0
71.8
]" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "datos_tabla1" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "2a1f5079-cc0b-401e-90f5-a811fba87bcc", + "metadata": {}, + "outputs": [], + "source": [ + "df = pd.read_html(str(sopa.select('div.scrollable')[0]))[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "id": "cfaf6513-1dfa-416c-a614-dce7217648ec", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
012345678910
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
\n", + "
" + ], + "text/plain": [ + " 0 1 2 3 4 5 6 7 8 9 \\\n", + "0 Afghanistan 15.9 20.1 26.2 26.8 21.2 14.0 12.5 7.7 48.9 \n", + "1 Albania 11.9 15.1 18.0 19.3 24.9 20.0 5.5 6.0 44.0 \n", + "2 Algeria 161.2 145.0 8.5 14.1 40.0 20.3 39.0 18.8 39.2 \n", + "3 American Samoa 0.6 0.7 .. .. .. .. 7.2 12.2 .. \n", + "4 Andorra 3.4 2.9 .. 0.6 .. 12.7 .. 3.7 .. \n", + "\n", + " 10 \n", + "0 54.7 \n", + "1 48.4 \n", + "2 48.7 \n", + "3 .. \n", + "4 79.8 " + ] + }, + "execution_count": 21, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 37, + "id": "0c4a8bbb-7a16-477d-b860-201834ae2216", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Int64Index([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10], dtype='int64')" + ] + }, + "execution_count": 37, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.columns" + ] + }, + { + "cell_type": "code", + "execution_count": 44, + "id": "78cb7ee7-8825-443b-8394-eec9f680a1aa", + "metadata": {}, + "outputs": [], + "source": [ + "df_header = pd.read_html(str(sopa.select('div.fixed')[0]))[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 45, + "id": "f4edcffc-d4df-4e97-98c9-ccad9d782883", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Unnamed: 0_level_0Gross domestic productAgricultureIndustryManufacturingServices
Unnamed: 0_level_1$ billions% of GDP% of GDP% of GDP% of GDP
Unnamed: 0_level_22010202020102020201020202010202020102020
\n", + "
" + ], + "text/plain": [ + "Empty DataFrame\n", + "Columns: [(Unnamed: 0_level_0, Unnamed: 0_level_1, Unnamed: 0_level_2), (Gross domestic product, $ billions, 2010), (Gross domestic product, $ billions, 2020), (Agriculture, % of GDP, 2010), (Agriculture, % of GDP, 2020), (Industry, % of GDP, 2010), (Industry, % of GDP, 2020), (Manufacturing, % of GDP, 2010), (Manufacturing, % of GDP, 2020), (Services, % of GDP, 2010), (Services, % of GDP, 2020)]\n", + "Index: []" + ] + }, + "execution_count": 45, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_header.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 55, + "id": "e6cb0036-eacf-4da3-85cd-32eae80cab85", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
País12345678910
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " País 1 2 3 4 5 6 7 \\\n", + "0 Afghanistan 15.9 20.1 26.2 26.8 21.2 14.0 12.5 \n", + "1 Albania 11.9 15.1 18.0 19.3 24.9 20.0 5.5 \n", + "2 Algeria 161.2 145.0 8.5 14.1 40.0 20.3 39.0 \n", + "3 American Samoa 0.6 0.7 .. .. .. .. 7.2 \n", + "4 Andorra 3.4 2.9 .. 0.6 .. 12.7 .. \n", + ".. ... ... ... ... ... ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 15.9 18.5 27.1 26.5 9.8 \n", + "222 Low income 613.2 481.0 23.6 26.8 28.3 25.9 4.8 \n", + "223 Lower middle income 5246.9 7585.5 15.3 16.1 33.0 27.8 16.4 \n", + "224 Upper middle income 14604.0 22848.3 6.9 7.0 36.7 34.1 21.7 \n", + "225 High income 45752.2 53699.8 1.3 1.3 23.9 22.4 14.1 \n", + "\n", + " 8 9 10 \n", + "0 7.7 48.9 54.7 \n", + "1 6.0 44.0 48.4 \n", + "2 18.8 39.2 48.7 \n", + "3 12.2 .. .. \n", + "4 3.7 .. 79.8 \n", + ".. ... ... ... \n", + "221 11.2 50.9 48.9 \n", + "222 10.7 42.9 39.1 \n", + "223 14.9 46.8 48.1 \n", + "224 22.1 50.5 55.9 \n", + "225 13.4 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 55, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.rename({'País': 0}, inplace = True)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 60, + "id": "974c3764-b484-4eae-a854-555ef7d952dc", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 .. .. .. \n", + "4 .. 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 60, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.columns = [\"Country\", \"GDP $billions 2010\", \"GDP $billions 2020\", \"Agriculture GDP% 2010\", \"Agriculture GDP% 2020\", \"Industry GDP% 2010\", \"Industry GDP% 2020\", \"Manufacturing GDP% 2010\", \"Manufacturing GDP% 2020\", \"Services GDP% 2010\", \"Services GDP% 2020\"]\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 68, + "id": "48c5b1b5-4929-49fa-a1e0-4f625549446f", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Country object\n", + "GDP $billions 2010 object\n", + "GDP $billions 2020 object\n", + "Agriculture GDP% 2010 object\n", + "Agriculture GDP% 2020 object\n", + "Industry GDP% 2010 object\n", + "Industry GDP% 2020 object\n", + "Manufacturing GDP% 2010 object\n", + "Manufacturing GDP% 2020 object\n", + "Services GDP% 2010 object\n", + "Services GDP% 2020 object\n", + "dtype: object" + ] + }, + "execution_count": 68, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.dtypes" + ] + }, + { + "cell_type": "code", + "execution_count": 92, + "id": "1162d94c-5fd5-4eb3-87ba-e0a05d332e5e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.70.00.00.00.07.212.20.00.0
4Andorra3.42.90.00.60.012.70.03.70.079.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 0.0 0.0 0.0 \n", + "4 0.0 0.6 0.0 \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 0.0 7.2 12.2 \n", + "4 12.7 0.0 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 0.0 0.0 \n", + "4 0.0 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 92, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.replace(['..'], 0.0)" + ] + }, + { + "cell_type": "code", + "execution_count": 96, + "id": "cdacd32d-065c-4536-816d-dfa1125b52bd", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 .. .. .. \n", + "4 .. 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 96, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['GDP $billions 2010'] = pd.to_numeric(df['GDP $billions 2010'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 97, + "id": "eaa9a40a-9eac-48c0-a91c-4042c8282240", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 .. .. .. \n", + "4 .. 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 97, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['GDP $billions 2010'] = df['GDP $billions 2010'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 98, + "id": "2a6a7db3-babd-4838-b04b-de475b635521", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 .. .. .. \n", + "4 .. 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 98, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['GDP $billions 2020'] = pd.to_numeric(df['GDP $billions 2020'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 99, + "id": "e3b9bdb1-474b-4ebd-bab0-dbc78b1693e6", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7........7.212.2....
4Andorra3.42.9..0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 .. .. .. \n", + "4 .. 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 99, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['GDP $billions 2020'] = df['GDP $billions 2020'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 100, + "id": "ac437d6d-5488-4205-89ec-5dd355adbf31", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaN......7.212.2....
4Andorra3.42.9NaN0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN .. .. \n", + "4 NaN 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 100, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Agriculture GDP% 2010'] = pd.to_numeric(df['Agriculture GDP% 2010'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 101, + "id": "21dbcdb6-042a-4dc8-9d7d-a588389c37da", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaN......7.212.2....
4Andorra3.42.9NaN0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN .. .. \n", + "4 NaN 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 101, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Agriculture GDP% 2010'] = df['Agriculture GDP% 2010'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 102, + "id": "c628c010-645e-40bb-97be-4300447672cc", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaN....7.212.2....
4Andorra3.42.9NaN0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN .. \n", + "4 NaN 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 102, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Agriculture GDP% 2020'] = pd.to_numeric(df['Agriculture GDP% 2020'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 103, + "id": "2acdb2ef-f665-4f46-af23-7666f07c3153", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaN....7.212.2....
4Andorra3.42.9NaN0.6..12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN .. \n", + "4 NaN 0.6 .. \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 103, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Agriculture GDP% 2020'] = df['Agriculture GDP% 2020'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 104, + "id": "678d56f6-7f44-4f71-8c3b-5574751b0bf3", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaN..7.212.2....
4Andorra3.42.9NaN0.6NaN12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 104, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Industry GDP% 2010'] = pd.to_numeric(df['Industry GDP% 2010'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 106, + "id": "4e969618-eaa1-4c13-800a-ce5399c544b3", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaN..7.212.2....
4Andorra3.42.9NaN0.6NaN12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 .. 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 106, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Industry GDP% 2010'] = df['Industry GDP% 2010'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 107, + "id": "3363a224-1919-4e00-9648-f1aad31ed4ff", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2....
4Andorra3.42.9NaN0.6NaN12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 107, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Industry GDP% 2020'] = pd.to_numeric(df['Industry GDP% 2020'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 108, + "id": "68611546-7a5c-438e-9df3-1dc15559161e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2....
4Andorra3.42.9NaN0.6NaN12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 108, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Industry GDP% 2020'] = df['Industry GDP% 2020'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 109, + "id": "aff3ff0f-66f2-4c25-aff3-84a89b46326b", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2....
4Andorra3.42.9NaN0.6NaN12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 109, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Manufacturing GDP% 2020'] = pd.to_numeric(df['Manufacturing GDP% 2020'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 110, + "id": "839788fb-c614-4d9b-a922-02b7c015a4b7", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2....
4Andorra3.42.9NaN0.6NaN12.7..3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 .. 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 110, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Manufacturing GDP% 2020'] = df['Manufacturing GDP% 2020'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 111, + "id": "74d3c2a7-1d2c-4512-b481-c53d907cd232", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2....
4Andorra3.42.9NaN0.6NaN12.7NaN3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 NaN 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 111, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Manufacturing GDP% 2010'] = pd.to_numeric(df['Manufacturing GDP% 2010'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 112, + "id": "a5b54422-1b0f-47e9-8bb1-438038c2dcbd", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2....
4Andorra3.42.9NaN0.6NaN12.7NaN3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 NaN 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. .. \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 112, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Manufacturing GDP% 2010'] = df['Manufacturing GDP% 2010'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 113, + "id": "999a3505-f285-444d-b843-515693f132a0", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2..NaN
4Andorra3.42.9NaN0.6NaN12.7NaN3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 NaN 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. NaN \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 113, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Services GDP% 2020'] = pd.to_numeric(df['Services GDP% 2020'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 114, + "id": "2ee4ef2a-f840-459a-8857-1dae6ade7a4f", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2..NaN
4Andorra3.42.9NaN0.6NaN12.7NaN3.7..79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 NaN 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 .. NaN \n", + "4 .. 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 114, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Services GDP% 2020'] = df['Services GDP% 2020'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 115, + "id": "7d609d41-d5d8-4670-b7ca-0ea66e04a7ff", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2NaNNaN
4Andorra3.42.9NaN0.6NaN12.7NaN3.7NaN79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 NaN 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 NaN NaN \n", + "4 NaN 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 115, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Services GDP% 2010'] = pd.to_numeric(df['Services GDP% 2010'], errors='coerce')\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 116, + "id": "74502001-0f67-4b6b-b80c-4a949b7009fb", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
0Afghanistan15.920.126.226.821.214.012.57.748.954.7
1Albania11.915.118.019.324.920.05.56.044.048.4
2Algeria161.2145.08.514.140.020.339.018.839.248.7
3American Samoa0.60.7NaNNaNNaNNaN7.212.2NaNNaN
4Andorra3.42.9NaN0.6NaN12.7NaN3.7NaN79.8
....................................
221Sub-Saharan Africa1451.81706.115.918.527.126.59.811.250.948.9
222Low income613.2481.023.626.828.325.94.810.742.939.1
223Lower middle income5246.97585.515.316.133.027.816.414.946.848.1
224Upper middle income14604.022848.36.97.036.734.121.722.150.555.9
225High income45752.253699.81.31.323.922.414.113.469.071.8
\n", + "

226 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 \\\n", + "0 Afghanistan 15.9 20.1 \n", + "1 Albania 11.9 15.1 \n", + "2 Algeria 161.2 145.0 \n", + "3 American Samoa 0.6 0.7 \n", + "4 Andorra 3.4 2.9 \n", + ".. ... ... ... \n", + "221 Sub-Saharan Africa 1451.8 1706.1 \n", + "222 Low income 613.2 481.0 \n", + "223 Lower middle income 5246.9 7585.5 \n", + "224 Upper middle income 14604.0 22848.3 \n", + "225 High income 45752.2 53699.8 \n", + "\n", + " Agriculture GDP% 2010 Agriculture GDP% 2020 Industry GDP% 2010 \\\n", + "0 26.2 26.8 21.2 \n", + "1 18.0 19.3 24.9 \n", + "2 8.5 14.1 40.0 \n", + "3 NaN NaN NaN \n", + "4 NaN 0.6 NaN \n", + ".. ... ... ... \n", + "221 15.9 18.5 27.1 \n", + "222 23.6 26.8 28.3 \n", + "223 15.3 16.1 33.0 \n", + "224 6.9 7.0 36.7 \n", + "225 1.3 1.3 23.9 \n", + "\n", + " Industry GDP% 2020 Manufacturing GDP% 2010 Manufacturing GDP% 2020 \\\n", + "0 14.0 12.5 7.7 \n", + "1 20.0 5.5 6.0 \n", + "2 20.3 39.0 18.8 \n", + "3 NaN 7.2 12.2 \n", + "4 12.7 NaN 3.7 \n", + ".. ... ... ... \n", + "221 26.5 9.8 11.2 \n", + "222 25.9 4.8 10.7 \n", + "223 27.8 16.4 14.9 \n", + "224 34.1 21.7 22.1 \n", + "225 22.4 14.1 13.4 \n", + "\n", + " Services GDP% 2010 Services GDP% 2020 \n", + "0 48.9 54.7 \n", + "1 44.0 48.4 \n", + "2 39.2 48.7 \n", + "3 NaN NaN \n", + "4 NaN 79.8 \n", + ".. ... ... \n", + "221 50.9 48.9 \n", + "222 42.9 39.1 \n", + "223 46.8 48.1 \n", + "224 50.5 55.9 \n", + "225 69.0 71.8 \n", + "\n", + "[226 rows x 11 columns]" + ] + }, + "execution_count": 116, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Services GDP% 2010'] = df['Services GDP% 2010'].astype(float)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 118, + "id": "82a2235f-e62d-42b4-a77c-68ea6a8b658e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Country object\n", + "GDP $billions 2010 float64\n", + "GDP $billions 2020 float64\n", + "Agriculture GDP% 2010 float64\n", + "Agriculture GDP% 2020 float64\n", + "Industry GDP% 2010 float64\n", + "Industry GDP% 2020 float64\n", + "Manufacturing GDP% 2010 float64\n", + "Manufacturing GDP% 2020 float64\n", + "Services GDP% 2010 float64\n", + "Services GDP% 2020 float64\n", + "dtype: object" + ] + }, + "execution_count": 118, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.dtypes" + ] + }, + { + "cell_type": "code", + "execution_count": 119, + "id": "d411b755-49d6-401c-b151-d61ff330143e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
GDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
count222.000000220.000000209.000000208.000000211.000000209.000000207.000000200.00000208.000000208.000000
mean1196.0594591537.55909110.97607710.38557726.59099524.88756011.56618411.7715055.11730857.306731
std5962.6633797607.17806111.20007710.29035413.7630039.9199756.9786587.1013313.63659112.313578
min0.0000000.1000000.0000000.0000004.8000004.9000000.4000000.3000024.70000016.800000
25%5.3250007.2250002.2000002.20000018.00000018.1000006.4000006.5750045.85000049.450000
50%25.70000032.0500006.8000007.20000024.50000023.50000011.30000011.2000054.50000056.400000
75%218.525000257.10000017.00000016.45000031.70000030.70000015.60000015.8000064.32500065.700000
max66596.10000084906.80000052.90000059.50000075.70000059.10000047.30000048.2000094.00000093.900000
\n", + "
" + ], + "text/plain": [ + " GDP $billions 2010 GDP $billions 2020 Agriculture GDP% 2010 \\\n", + "count 222.000000 220.000000 209.000000 \n", + "mean 1196.059459 1537.559091 10.976077 \n", + "std 5962.663379 7607.178061 11.200077 \n", + "min 0.000000 0.100000 0.000000 \n", + "25% 5.325000 7.225000 2.200000 \n", + "50% 25.700000 32.050000 6.800000 \n", + "75% 218.525000 257.100000 17.000000 \n", + "max 66596.100000 84906.800000 52.900000 \n", + "\n", + " Agriculture GDP% 2020 Industry GDP% 2010 Industry GDP% 2020 \\\n", + "count 208.000000 211.000000 209.000000 \n", + "mean 10.385577 26.590995 24.887560 \n", + "std 10.290354 13.763003 9.919975 \n", + "min 0.000000 4.800000 4.900000 \n", + "25% 2.200000 18.000000 18.100000 \n", + "50% 7.200000 24.500000 23.500000 \n", + "75% 16.450000 31.700000 30.700000 \n", + "max 59.500000 75.700000 59.100000 \n", + "\n", + " Manufacturing GDP% 2010 Manufacturing GDP% 2020 Services GDP% 2010 \\\n", + "count 207.000000 200.00000 208.000000 \n", + "mean 11.566184 11.77150 55.117308 \n", + "std 6.978658 7.10133 13.636591 \n", + "min 0.400000 0.30000 24.700000 \n", + "25% 6.400000 6.57500 45.850000 \n", + "50% 11.300000 11.20000 54.500000 \n", + "75% 15.600000 15.80000 64.325000 \n", + "max 47.300000 48.20000 94.000000 \n", + "\n", + " Services GDP% 2020 \n", + "count 208.000000 \n", + "mean 57.306731 \n", + "std 12.313578 \n", + "min 16.800000 \n", + "25% 49.450000 \n", + "50% 56.400000 \n", + "75% 65.700000 \n", + "max 93.900000 " + ] + }, + "execution_count": 119, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.describe()" + ] + }, + { + "cell_type": "code", + "execution_count": 126, + "id": "22807eba-83ff-4560-bd82-14da13ba452a", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020Agriculture GDP% 2010Agriculture GDP% 2020Industry GDP% 2010Industry GDP% 2020Manufacturing GDP% 2010Manufacturing GDP% 2020Services GDP% 2010Services GDP% 2020
125Mexico1057.81087.13.23.832.429.615.617.260.460.3
\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020 Agriculture GDP% 2010 \\\n", + "125 Mexico 1057.8 1087.1 3.2 \n", + "\n", + " Agriculture GDP% 2020 Industry GDP% 2010 Industry GDP% 2020 \\\n", + "125 3.8 32.4 29.6 \n", + "\n", + " Manufacturing GDP% 2010 Manufacturing GDP% 2020 Services GDP% 2010 \\\n", + "125 15.6 17.2 60.4 \n", + "\n", + " Services GDP% 2020 \n", + "125 60.3 " + ] + }, + "execution_count": 126, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df[df['Country']=='Mexico']" + ] + }, + { + "cell_type": "code", + "execution_count": 122, + "id": "60eda7b7-6038-4b2a-85aa-ff2f6369eef4", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.0" + ] + }, + "execution_count": 122, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "min_gdp10 = df['GDP $billions 2010'].min()\n", + "min_gdp10" + ] + }, + { + "cell_type": "code", + "execution_count": 123, + "id": "723f8d8c-bb94-41d6-8538-4af2077d8fb0", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010
198Tuvalu0.0
\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010\n", + "198 Tuvalu 0.0" + ] + }, + "execution_count": 123, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.loc[(df['GDP $billions 2010']==min_gdp10), ['Country', 'GDP $billions 2010']]" + ] + }, + { + "cell_type": "code", + "execution_count": 128, + "id": "06170cea-9078-4f06-bedc-c2d194aaa6c1", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.1" + ] + }, + "execution_count": 128, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "min_gdp20 = df['GDP $billions 2020'].min()\n", + "min_gdp20" + ] + }, + { + "cell_type": "code", + "execution_count": 129, + "id": "63fd3d6a-2829-4e07-9568-cc91137767ea", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2020
198Tuvalu0.1
\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2020\n", + "198 Tuvalu 0.1" + ] + }, + "execution_count": 129, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.loc[(df['GDP $billions 2020']==min_gdp20), ['Country', 'GDP $billions 2020']]" + ] + }, + { + "cell_type": "code", + "execution_count": 131, + "id": "d9b12970-f61f-4e05-9cae-2733bcb4c8b3", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020
3American Samoa0.60.7
6Antigua and Barbuda1.11.4
9Aruba2.52.5
19Belize1.41.6
22Bhutan1.52.3
30Burundi2.02.8
31Cabo Verde1.71.7
36Central African Republic2.12.3
44Comoros0.91.2
51Curacao2.92.5
55Djibouti1.13.2
56Dominica0.50.5
62Eritrea1.6NaN
66Faroe Islands2.33.2
72Gambia, The1.51.8
77Greenland2.53.1
78Grenada0.81.0
82Guinea-Bissau0.81.4
101Kiribati0.20.2
110Lesotho2.22.3
111Liberia2.03.0
119Maldives2.63.7
122Marshall Islands0.20.2
126Micronesia, Fed. Sts.0.30.4
143Northern Mariana Islands0.81.2
147Palau0.20.3
160Samoa0.70.8
161San Marino1.91.5
162Sao Tome and Principe0.20.5
166Seychelles1.01.2
167Sierra Leone2.64.1
169Sint Maarten (Dutch part)0.91.2
172Solomon Islands0.81.5
178St. Kitts and Nevis0.81.0
179St. Lucia1.51.6
180St. Martin (French part)0.8NaN
181St. Vincent and the Grenadines0.70.9
190Timor-Leste0.91.9
192Tonga0.40.5
197Turks and Caicos Islands0.70.9
206Vanuatu0.70.9
\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020\n", + "3 American Samoa 0.6 0.7\n", + "6 Antigua and Barbuda 1.1 1.4\n", + "9 Aruba 2.5 2.5\n", + "19 Belize 1.4 1.6\n", + "22 Bhutan 1.5 2.3\n", + "30 Burundi 2.0 2.8\n", + "31 Cabo Verde 1.7 1.7\n", + "36 Central African Republic 2.1 2.3\n", + "44 Comoros 0.9 1.2\n", + "51 Curacao 2.9 2.5\n", + "55 Djibouti 1.1 3.2\n", + "56 Dominica 0.5 0.5\n", + "62 Eritrea 1.6 NaN\n", + "66 Faroe Islands 2.3 3.2\n", + "72 Gambia, The 1.5 1.8\n", + "77 Greenland 2.5 3.1\n", + "78 Grenada 0.8 1.0\n", + "82 Guinea-Bissau 0.8 1.4\n", + "101 Kiribati 0.2 0.2\n", + "110 Lesotho 2.2 2.3\n", + "111 Liberia 2.0 3.0\n", + "119 Maldives 2.6 3.7\n", + "122 Marshall Islands 0.2 0.2\n", + "126 Micronesia, Fed. Sts. 0.3 0.4\n", + "143 Northern Mariana Islands 0.8 1.2\n", + "147 Palau 0.2 0.3\n", + "160 Samoa 0.7 0.8\n", + "161 San Marino 1.9 1.5\n", + "162 Sao Tome and Principe 0.2 0.5\n", + "166 Seychelles 1.0 1.2\n", + "167 Sierra Leone 2.6 4.1\n", + "169 Sint Maarten (Dutch part) 0.9 1.2\n", + "172 Solomon Islands 0.8 1.5\n", + "178 St. Kitts and Nevis 0.8 1.0\n", + "179 St. Lucia 1.5 1.6\n", + "180 St. Martin (French part) 0.8 NaN\n", + "181 St. Vincent and the Grenadines 0.7 0.9\n", + "190 Timor-Leste 0.9 1.9\n", + "192 Tonga 0.4 0.5\n", + "197 Turks and Caicos Islands 0.7 0.9\n", + "206 Vanuatu 0.7 0.9" + ] + }, + "execution_count": 131, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "paises_lowgdp = df.loc[(df['GDP $billions 2010']>0) & (df['GDP $billions 2010']<3), ['Country', 'GDP $billions 2010', 'GDP $billions 2020']]\n", + "paises_lowgdp" + ] + }, + { + "cell_type": "code", + "execution_count": 132, + "id": "08fb78a2-c682-4176-86a4-48ada7fa0775", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "66596.1" + ] + }, + "execution_count": 132, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "max_gdp10 = df['GDP $billions 2010'].max()\n", + "max_gdp10" + ] + }, + { + "cell_type": "code", + "execution_count": 150, + "id": "d6cfedee-10dc-4bdb-8893-07e7f664a3cd", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CountryGDP $billions 2010GDP $billions 2020
40China6087.214687.7
97Japan5759.15040.1
203United States15049.020893.7
215East Asia & Pacific17063.327118.7
216Europe & Central Asia21025.822133.9
217Latin America & Caribbean5347.14743.2
219North America16672.922546.0
223Lower middle income5246.97585.5
224Upper middle income14604.022848.3
225High income45752.253699.8
\n", + "
" + ], + "text/plain": [ + " Country GDP $billions 2010 GDP $billions 2020\n", + "40 China 6087.2 14687.7\n", + "97 Japan 5759.1 5040.1\n", + "203 United States 15049.0 20893.7\n", + "215 East Asia & Pacific 17063.3 27118.7\n", + "216 Europe & Central Asia 21025.8 22133.9\n", + "217 Latin America & Caribbean 5347.1 4743.2\n", + "219 North America 16672.9 22546.0\n", + "223 Lower middle income 5246.9 7585.5\n", + "224 Upper middle income 14604.0 22848.3\n", + "225 High income 45752.2 53699.8" + ] + }, + "execution_count": 150, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "paises_maxgdp = df.loc[(df['GDP $billions 2010']>5000) & (df['GDP $billions 2010']<66596.1), ['Country', 'GDP $billions 2010', 'GDP $billions 2020']]\n", + "paises_maxgdp" + ] + }, + { + "cell_type": "code", + "execution_count": 151, + "id": "92fd5f20-9505-4e8b-aca4-55ce5aa6a747", + "metadata": {}, + "outputs": [], + "source": [ + "df.to_csv('ProyectoGDP_Paises.csv')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0a50003e-d0a4-40a5-9dc4-621bdfebfce9", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/README_ProyectoGilda.md b/README_ProyectoGilda.md new file mode 100644 index 0000000..ae6b8c4 --- /dev/null +++ b/README_ProyectoGilda.md @@ -0,0 +1,10 @@ +### Proyecto web scrapping + +## Web scraapping + +Los problemas que encontré al resolver este trabajo fueron: + +>Encontrar una web que me interesara con datos numéricos. +>Encontrar una web cuyos datos estuvieran en tablas. +>Cuando extraje los datos, me di cuenta de que estaban guardados como strings y para mí fue difícil convertirlos en float. +>Al final pude trabajar con los datos y el dataframe.