diff --git a/your-code/main.ipynb b/your-code/main.ipynb index a2958dd..a3befab 100644 --- a/your-code/main.ipynb +++ b/your-code/main.ipynb @@ -12,11 +12,13 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 27, "metadata": {}, "outputs": [], "source": [ - "# Import reduce from functools, numpy and pandas" + "from functools import reduce\n", + "import pandas as pd\n", + "import numpy as np" ] }, { @@ -32,7 +34,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 7, "metadata": {}, "outputs": [], "source": [ @@ -54,11 +56,13 @@ }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, + "execution_count": 8, + "metadata": { + "scrolled": false + }, "outputs": [], "source": [ - "# your code here" + "prophet = prophet[568:]" ] }, { @@ -70,11 +74,32 @@ }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "# your code here" + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "PROPHET\n", + "\n", + "|Almustafa,\n", + "the{7}\n", + "chosen\n", + "and\n", + "the\n", + "beloved,\n", + "who\n", + "was\n", + "a\n", + "dawn\n", + "unto\n" + ] + } + ], + "source": [ + "for i in range(10):\n", + " print(prophet[i])" ] }, { @@ -88,7 +113,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 10, "metadata": {}, "outputs": [], "source": [ @@ -101,8 +126,7 @@ " Input: 'the{7}'\n", " Output: 'the'\n", " '''\n", - " \n", - " # your code here" + " return x.split(\"{\")[0]" ] }, { @@ -114,11 +138,11 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 11, "metadata": {}, "outputs": [], "source": [ - "# your code here" + "prophet_reference = list(map(reference, prophet))" ] }, { @@ -130,7 +154,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 12, "metadata": {}, "outputs": [], "source": [ @@ -143,8 +167,7 @@ " Input: 'the\\nbeloved'\n", " Output: ['the', 'beloved']\n", " '''\n", - " \n", - " # your code here" + " return x.split(\"\\n\")" ] }, { @@ -156,11 +179,11 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 13, "metadata": {}, "outputs": [], "source": [ - "# your code here" + "prophet_line = list(map(line_break,prophet_reference))" ] }, { @@ -172,11 +195,11 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 14, "metadata": {}, "outputs": [], "source": [ - "# your code here" + "prophet_flat = [j for i in prophet_line for j in i]" ] }, { @@ -190,7 +213,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 15, "metadata": {}, "outputs": [], "source": [ @@ -210,8 +233,10 @@ " '''\n", " \n", " word_list = ['and', 'the', 'a', 'an']\n", - " \n", - " # your code here" + " if x in word_list:\n", + " return False\n", + " else:\n", + " return True" ] }, { @@ -221,6 +246,15 @@ "Use the `filter()` function to filter out the words speficied in the `word_filter()` function. Store the filtered list in the variable `prophet_filter`." ] }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [], + "source": [ + "prophet_filter = list(filter(word_filter, prophet_flat))" + ] + }, { "cell_type": "markdown", "metadata": {}, @@ -232,7 +266,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 17, "metadata": {}, "outputs": [], "source": [ @@ -240,7 +274,11 @@ " \n", " word_list = ['and', 'the', 'a', 'an']\n", " \n", - " # your code here" + " if x.lower() in word_list:\n", + " return False\n", + " else:\n", + " return True\n", + "prophet_filter_case = list(filter(word_filter_case, prophet_filter))" ] }, { @@ -256,7 +294,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 18, "metadata": {}, "outputs": [], "source": [ @@ -269,8 +307,7 @@ " Input: 'John', 'Smith'\n", " Output: 'John Smith'\n", " '''\n", - " \n", - " # your code here" + " return a + \" \" + b" ] }, { @@ -282,11 +319,11 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 19, "metadata": {}, "outputs": [], "source": [ - "# your code here" + "prophet_string = reduce(concat_space,prophet_filter_case)" ] }, { @@ -302,7 +339,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 20, "metadata": {}, "outputs": [], "source": [ @@ -316,15 +353,6 @@ "You'll need to import pandas" ] }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "# your code here" - ] - }, { "cell_type": "markdown", "metadata": {}, @@ -334,10 +362,12 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 21, "metadata": {}, "outputs": [], - "source": [] + "source": [ + "df = pd.read_csv(\"https://archive.ics.uci.edu/ml/machine-learning-databases/00381/PRSA_data_2010.1.1-2014.12.31.csv\")" + ] }, { "cell_type": "markdown", @@ -348,11 +378,146 @@ }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "# your code here" + "execution_count": 22, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
| \n", + " | No | \n", + "year | \n", + "month | \n", + "day | \n", + "hour | \n", + "pm2.5 | \n", + "DEWP | \n", + "TEMP | \n", + "PRES | \n", + "cbwd | \n", + "Iws | \n", + "Is | \n", + "Ir | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "1 | \n", + "2010 | \n", + "1 | \n", + "1 | \n", + "0 | \n", + "NaN | \n", + "-21 | \n", + "-11.0 | \n", + "1021.0 | \n", + "NW | \n", + "1.79 | \n", + "0 | \n", + "0 | \n", + "
| 1 | \n", + "2 | \n", + "2010 | \n", + "1 | \n", + "1 | \n", + "1 | \n", + "NaN | \n", + "-21 | \n", + "-12.0 | \n", + "1020.0 | \n", + "NW | \n", + "4.92 | \n", + "0 | \n", + "0 | \n", + "
| 2 | \n", + "3 | \n", + "2010 | \n", + "1 | \n", + "1 | \n", + "2 | \n", + "NaN | \n", + "-21 | \n", + "-11.0 | \n", + "1019.0 | \n", + "NW | \n", + "6.71 | \n", + "0 | \n", + "0 | \n", + "
| 3 | \n", + "4 | \n", + "2010 | \n", + "1 | \n", + "1 | \n", + "3 | \n", + "NaN | \n", + "-21 | \n", + "-14.0 | \n", + "1019.0 | \n", + "NW | \n", + "9.84 | \n", + "0 | \n", + "0 | \n", + "
| 4 | \n", + "5 | \n", + "2010 | \n", + "1 | \n", + "1 | \n", + "4 | \n", + "NaN | \n", + "-20 | \n", + "-12.0 | \n", + "1018.0 | \n", + "NW | \n", + "12.97 | \n", + "0 | \n", + "0 | \n", + "