diff --git a/your-code/main.ipynb b/your-code/main.ipynb index a2958dd..c1f1cca 100644 --- a/your-code/main.ipynb +++ b/your-code/main.ipynb @@ -12,11 +12,15 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 12, "metadata": {}, "outputs": [], "source": [ - "# Import reduce from functools, numpy and pandas" + "# Import reduce from functools, numpy and pandas\n", + "\n", + "import numpy as np\n", + "from functools import reduce\n", + "import pandas as pd" ] }, { @@ -32,7 +36,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 2, "metadata": {}, "outputs": [], "source": [ @@ -54,11 +58,11 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 3, "metadata": {}, "outputs": [], "source": [ - "# your code here" + "del prophet[0:568]\n" ] }, { @@ -70,11 +74,31 @@ }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "# your code here" + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['PROPHET\\n\\n|Almustafa,',\n", + " 'the{7}',\n", + " 'chosen',\n", + " 'and',\n", + " 'the\\nbeloved,',\n", + " 'who',\n", + " 'was',\n", + " 'a',\n", + " 'dawn',\n", + " 'unto']" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "prophet[0:10]" ] }, { @@ -88,7 +112,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ @@ -96,13 +120,18 @@ " '''\n", " Input: A string\n", " Output: The string with references removed\n", - " \n", + "\n", " Example:\n", " Input: 'the{7}'\n", " Output: 'the'\n", " '''\n", - " \n", - " # your code here" + " clean_word = ''\n", + " if \"{\" in x:\n", + " v_index = x.index(\"{\")\n", + " clean_word = x[0:v_index]\n", + " else:\n", + " clean_word = x\n", + " return clean_word\n" ] }, { @@ -114,11 +143,11 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 6, "metadata": {}, "outputs": [], "source": [ - "# your code here" + "prophet_reference = list(map(reference,prophet))\n" ] }, { @@ -130,7 +159,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 7, "metadata": {}, "outputs": [], "source": [ @@ -143,8 +172,7 @@ " Input: 'the\\nbeloved'\n", " Output: ['the', 'beloved']\n", " '''\n", - " \n", - " # your code here" + " return x.split(\"\\n\")" ] }, { @@ -156,11 +184,11 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 8, "metadata": {}, "outputs": [], "source": [ - "# your code here" + "prophet_line = list(map(line_break,prophet_reference))" ] }, { @@ -172,11 +200,11 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 9, "metadata": {}, "outputs": [], "source": [ - "# your code here" + "prophet_flat= [x for i in prophet_line for x in i]" ] }, { @@ -190,7 +218,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 10, "metadata": {}, "outputs": [], "source": [ @@ -210,8 +238,15 @@ " '''\n", " \n", " word_list = ['and', 'the', 'a', 'an']\n", + " if x in word_list:\n", + " return False\n", + " else:\n", + " return True\n", " \n", - " # your code here" + " \n", + "prophet_filter = list(filter(word_filter,prophet_flat))\n", + "\n", + " " ] }, { @@ -232,15 +267,21 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 18, "metadata": {}, "outputs": [], "source": [ "def word_filter_case(x):\n", " \n", " word_list = ['and', 'the', 'a', 'an']\n", + " \n", + " if x.lower() in word_list:\n", + " return False\n", + " else:\n", + " return True\n", " \n", - " # your code here" + " \n", + "prophet_filter = list(filter(word_filter_case,prophet_flat))" ] }, { @@ -256,7 +297,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 19, "metadata": {}, "outputs": [], "source": [ @@ -270,7 +311,8 @@ " Output: 'John Smith'\n", " '''\n", " \n", - " # your code here" + " output = a +\" \"+b\n", + " return output" ] }, { @@ -282,11 +324,11 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 20, "metadata": {}, "outputs": [], "source": [ - "# your code here" + "prophet_string = reduce(concat_space,prophet_filter)" ] }, { @@ -302,7 +344,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 34, "metadata": {}, "outputs": [], "source": [ @@ -318,11 +360,12 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 35, "metadata": {}, "outputs": [], "source": [ - "# your code here" + "import pandas as pd\n", + "import numpy as np" ] }, { @@ -334,10 +377,12 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 36, "metadata": {}, "outputs": [], - "source": [] + "source": [ + "df = pd.read_csv(url)" + ] }, { "cell_type": "markdown", @@ -348,11 +393,146 @@ }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "# your code here" + "execution_count": 37, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
| \n", + " | No | \n", + "year | \n", + "month | \n", + "day | \n", + "hour | \n", + "pm2.5 | \n", + "DEWP | \n", + "TEMP | \n", + "PRES | \n", + "cbwd | \n", + "Iws | \n", + "Is | \n", + "Ir | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "1 | \n", + "2010 | \n", + "1 | \n", + "1 | \n", + "0 | \n", + "NaN | \n", + "-21 | \n", + "-11.0 | \n", + "1021.0 | \n", + "NW | \n", + "1.79 | \n", + "0 | \n", + "0 | \n", + "
| 1 | \n", + "2 | \n", + "2010 | \n", + "1 | \n", + "1 | \n", + "1 | \n", + "NaN | \n", + "-21 | \n", + "-12.0 | \n", + "1020.0 | \n", + "NW | \n", + "4.92 | \n", + "0 | \n", + "0 | \n", + "
| 2 | \n", + "3 | \n", + "2010 | \n", + "1 | \n", + "1 | \n", + "2 | \n", + "NaN | \n", + "-21 | \n", + "-11.0 | \n", + "1019.0 | \n", + "NW | \n", + "6.71 | \n", + "0 | \n", + "0 | \n", + "
| 3 | \n", + "4 | \n", + "2010 | \n", + "1 | \n", + "1 | \n", + "3 | \n", + "NaN | \n", + "-21 | \n", + "-14.0 | \n", + "1019.0 | \n", + "NW | \n", + "9.84 | \n", + "0 | \n", + "0 | \n", + "
| 4 | \n", + "5 | \n", + "2010 | \n", + "1 | \n", + "1 | \n", + "4 | \n", + "NaN | \n", + "-20 | \n", + "-12.0 | \n", + "1018.0 | \n", + "NW | \n", + "12.97 | \n", + "0 | \n", + "0 | \n", + "