From 1843deede8319b7db09d19e3b2d6a1e75bd35c26 Mon Sep 17 00:00:00 2001 From: palean Date: Tue, 16 Jul 2019 17:52:51 -0500 Subject: [PATCH] Adding morning lab --- .../.ipynb_checkpoints/main-checkpoint.ipynb | 5327 ++++++++++++++++- your-code/main.ipynb | 5327 ++++++++++++++++- 2 files changed, 10410 insertions(+), 244 deletions(-) diff --git a/your-code/.ipynb_checkpoints/main-checkpoint.ipynb b/your-code/.ipynb_checkpoints/main-checkpoint.ipynb index 812f7a4..5a88557 100644 --- a/your-code/.ipynb_checkpoints/main-checkpoint.ipynb +++ b/your-code/.ipynb_checkpoints/main-checkpoint.ipynb @@ -40,9 +40,32 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 1, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Requirement already satisfied: bs4 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (0.0.1)\n", + "Requirement already satisfied: requests in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (2.22.0)\n", + "Requirement already satisfied: pandas in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (0.24.2)\n", + "Requirement already satisfied: html5lib in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (1.0.1)\n", + "Requirement already satisfied: lxml in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (4.3.4)\n", + "Requirement already satisfied: beautifulsoup4 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from bs4) (4.7.1)\n", + "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from requests) (1.25.3)\n", + "Requirement already satisfied: certifi>=2017.4.17 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from requests) (2019.6.16)\n", + "Requirement already satisfied: idna<2.9,>=2.5 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from requests) (2.8)\n", + "Requirement already satisfied: chardet<3.1.0,>=3.0.2 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from requests) (3.0.4)\n", + "Requirement already satisfied: numpy>=1.12.0 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from pandas) (1.16.4)\n", + "Requirement already satisfied: pytz>=2011k in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from pandas) (2019.1)\n", + "Requirement already satisfied: python-dateutil>=2.5.0 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from pandas) (2.8.0)\n", + "Requirement already satisfied: webencodings in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from html5lib) (0.5.1)\n", + "Requirement already satisfied: six>=1.9 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from html5lib) (1.12.0)\n", + "Requirement already satisfied: soupsieve>=1.2 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from beautifulsoup4->bs4) (1.9.2)\n" + ] + } + ], "source": [ "import requests\n", "from bs4 import BeautifulSoup\n", @@ -52,9 +75,11 @@ "# from lxml.html import fromstring\n", "# import urllib.request\n", "# from urllib.request import urlopen\n", - "# import random\n", + "import random\n", "# import re\n", - "# import scrapy" + "#import scrapy\n", + "import sys\n", + "!{sys.executable} -m pip install bs4 requests pandas html5lib lxml" ] }, { @@ -66,12 +91,3793 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'https://github.com/trending/developers'" + "url = 'https://github.com/trending/developers'\n", + "html = requests.get(url).content" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "Trending developers on GitHub today · GitHub\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
\n", + "Skip to content\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "\n", + " Sign up\n", + " \n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "

Trending

\n", + "

\n", + " These are the\n", + " developers\n", + " building the hot tools today.\n", + "

\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " Language:\n", + "\n", + " \n", + "\n", + " Any\n", + " \n", + "\n", + "\n", + "\n", + "
\n", + "Select a language\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "C++\n", + "\n", + "\n", + "\n", + "HTML\n", + "\n", + "\n", + "\n", + "Java\n", + "\n", + "\n", + "\n", + "JavaScript\n", + "\n", + "\n", + "\n", + "PHP\n", + "\n", + "\n", + "\n", + "Python\n", + "\n", + "\n", + "\n", + "Ruby\n", + "\n", + "\n", + "\n", + "Unknown languages\n", + "\n", + "\n", + "\n", + "1C Enterprise\n", + "\n", + "\n", + "\n", + "ABAP\n", + "\n", + "\n", + "\n", + "ABNF\n", + "\n", + "\n", + "\n", + "ActionScript\n", + "\n", + "\n", + "\n", + "Ada\n", + "\n", + "\n", + "\n", + "Adobe Font Metrics\n", + "\n", + "\n", + "\n", + "Agda\n", + "\n", + "\n", + "\n", + "AGS Script\n", + "\n", + "\n", + "\n", + "Alloy\n", + "\n", + "\n", + "\n", + "Alpine Abuild\n", + "\n", + "\n", + "\n", + "Altium Designer\n", + "\n", + "\n", + "\n", + "AMPL\n", + "\n", + "\n", + "\n", + "AngelScript\n", + "\n", + "\n", + "\n", + "Ant Build System\n", + "\n", + "\n", + "\n", + "ANTLR\n", + "\n", + "\n", + "\n", + "ApacheConf\n", + "\n", + "\n", + "\n", + "Apex\n", + "\n", + "\n", + "\n", + "API Blueprint\n", + "\n", + "\n", + "\n", + "APL\n", + "\n", + "\n", + "\n", + "Apollo Guidance Computer\n", + "\n", + "\n", + "\n", + "AppleScript\n", + "\n", + "\n", + "\n", + "Arc\n", + "\n", + "\n", + "\n", + "AsciiDoc\n", + "\n", + "\n", + "\n", + "ASN.1\n", + "\n", + "\n", + "\n", + "ASP\n", + "\n", + "\n", + "\n", + "AspectJ\n", + "\n", + "\n", + "\n", + "Assembly\n", + "\n", + "\n", + "\n", + "Asymptote\n", + "\n", + "\n", + "\n", + "ATS\n", + "\n", + "\n", + "\n", + "Augeas\n", + "\n", + "\n", + "\n", + "AutoHotkey\n", + "\n", + "\n", + "\n", + "AutoIt\n", + "\n", + "\n", + "\n", + "Awk\n", + "\n", + "\n", + "\n", + "Ballerina\n", + "\n", + "\n", + "\n", + "Batchfile\n", + "\n", + "\n", + "\n", + "Befunge\n", + "\n", + "\n", + "\n", + "Bison\n", + "\n", + "\n", + "\n", + "BitBake\n", + "\n", + "\n", + "\n", + "Blade\n", + "\n", + "\n", + "\n", + "BlitzBasic\n", + "\n", + "\n", + "\n", + "BlitzMax\n", + "\n", + "\n", + "\n", + "Bluespec\n", + "\n", + "\n", + "\n", + "Boo\n", + "\n", + "\n", + "\n", + "Brainfuck\n", + "\n", + "\n", + "\n", + "Brightscript\n", + "\n", + "\n", + "\n", + "Zeek\n", + "\n", + "\n", + "\n", + "C\n", + "\n", + "\n", + "\n", + "C#\n", + "\n", + "\n", + "\n", + "C++\n", + "\n", + "\n", + "\n", + "C-ObjDump\n", + "\n", + "\n", + "\n", + "C2hs Haskell\n", + "\n", + "\n", + "\n", + "Cabal Config\n", + "\n", + "\n", + "\n", + "Cap'n Proto\n", + "\n", + "\n", + "\n", + "CartoCSS\n", + "\n", + "\n", + "\n", + "Ceylon\n", + "\n", + "\n", + "\n", + "Chapel\n", + "\n", + "\n", + "\n", + "Charity\n", + "\n", + "\n", + "\n", + "ChucK\n", + "\n", + "\n", + "\n", + "Cirru\n", + "\n", + "\n", + "\n", + "Clarion\n", + "\n", + "\n", + "\n", + "Clean\n", + "\n", + "\n", + "\n", + "Click\n", + "\n", + "\n", + "\n", + "CLIPS\n", + "\n", + "\n", + "\n", + "Clojure\n", + "\n", + "\n", + "\n", + "Closure Templates\n", + "\n", + "\n", + "\n", + "Cloud Firestore Security Rules\n", + "\n", + "\n", + "\n", + "CMake\n", + "\n", + "\n", + "\n", + "COBOL\n", + "\n", + "\n", + "\n", + "CoffeeScript\n", + "\n", + "\n", + "\n", + "ColdFusion\n", + "\n", + "\n", + "\n", + "ColdFusion CFC\n", + "\n", + "\n", + "\n", + "COLLADA\n", + "\n", + "\n", + "\n", + "Common Lisp\n", + "\n", + "\n", + "\n", + "Common Workflow Language\n", + "\n", + "\n", + "\n", + "Component Pascal\n", + "\n", + "\n", + "\n", + "CoNLL-U\n", + "\n", + "\n", + "\n", + "Cool\n", + "\n", + "\n", + "\n", + "Coq\n", + "\n", + "\n", + "\n", + "Cpp-ObjDump\n", + "\n", + "\n", + "\n", + "Creole\n", + "\n", + "\n", + "\n", + "Crystal\n", + "\n", + "\n", + "\n", + "CSON\n", + "\n", + "\n", + "\n", + "Csound\n", + "\n", + "\n", + "\n", + "Csound Document\n", + "\n", + "\n", + "\n", + "Csound Score\n", + "\n", + "\n", + "\n", + "CSS\n", + "\n", + "\n", + "\n", + "CSV\n", + "\n", + "\n", + "\n", + "Cuda\n", + "\n", + "\n", + "\n", + "CWeb\n", + "\n", + "\n", + "\n", + "Cycript\n", + "\n", + "\n", + "\n", + "Cython\n", + "\n", + "\n", + "\n", + "D\n", + "\n", + "\n", + "\n", + "D-ObjDump\n", + "\n", + "\n", + "\n", + "Darcs Patch\n", + "\n", + "\n", + "\n", + "Dart\n", + "\n", + "\n", + "\n", + "DataWeave\n", + "\n", + "\n", + "\n", + "desktop\n", + "\n", + "\n", + "\n", + "Dhall\n", + "\n", + "\n", + "\n", + "Diff\n", + "\n", + "\n", + "\n", + "DIGITAL Command Language\n", + "\n", + "\n", + "\n", + "DM\n", + "\n", + "\n", + "\n", + "DNS Zone\n", + "\n", + "\n", + "\n", + "Dockerfile\n", + "\n", + "\n", + "\n", + "Dogescript\n", + "\n", + "\n", + "\n", + "DTrace\n", + "\n", + "\n", + "\n", + "Dylan\n", + "\n", + "\n", + "\n", + "E\n", + "\n", + "\n", + "\n", + "Eagle\n", + "\n", + "\n", + "\n", + "Easybuild\n", + "\n", + "\n", + "\n", + "EBNF\n", + "\n", + "\n", + "\n", + "eC\n", + "\n", + "\n", + "\n", + "Ecere Projects\n", + "\n", + "\n", + "\n", + "ECL\n", + "\n", + "\n", + "\n", + "ECLiPSe\n", + "\n", + "\n", + "\n", + "Edje Data Collection\n", + "\n", + "\n", + "\n", + "edn\n", + "\n", + "\n", + "\n", + "Eiffel\n", + "\n", + "\n", + "\n", + "EJS\n", + "\n", + "\n", + "\n", + "Elixir\n", + "\n", + "\n", + "\n", + "Elm\n", + "\n", + "\n", + "\n", + "Emacs Lisp\n", + "\n", + "\n", + "\n", + "EmberScript\n", + "\n", + "\n", + "\n", + "EML\n", + "\n", + "\n", + "\n", + "EQ\n", + "\n", + "\n", + "\n", + "Erlang\n", + "\n", + "\n", + "\n", + "F#\n", + "\n", + "\n", + "\n", + "F*\n", + "\n", + "\n", + "\n", + "Factor\n", + "\n", + "\n", + "\n", + "Fancy\n", + "\n", + "\n", + "\n", + "Fantom\n", + "\n", + "\n", + "\n", + "FIGlet Font\n", + "\n", + "\n", + "\n", + "Filebench WML\n", + "\n", + "\n", + "\n", + "Filterscript\n", + "\n", + "\n", + "\n", + "fish\n", + "\n", + "\n", + "\n", + "FLUX\n", + "\n", + "\n", + "\n", + "Formatted\n", + "\n", + "\n", + "\n", + "Forth\n", + "\n", + "\n", + "\n", + "Fortran\n", + "\n", + "\n", + "\n", + "FreeMarker\n", + "\n", + "\n", + "\n", + "Frege\n", + "\n", + "\n", + "\n", + "G-code\n", + "\n", + "\n", + "\n", + "Game Maker Language\n", + "\n", + "\n", + "\n", + "GAMS\n", + "\n", + "\n", + "\n", + "GAP\n", + "\n", + "\n", + "\n", + "GCC Machine Description\n", + "\n", + "\n", + "\n", + "GDB\n", + "\n", + "\n", + "\n", + "GDScript\n", + "\n", + "\n", + "\n", + "Genie\n", + "\n", + "\n", + "\n", + "Genshi\n", + "\n", + "\n", + "\n", + "Gentoo Ebuild\n", + "\n", + "\n", + "\n", + "Gentoo Eclass\n", + "\n", + "\n", + "\n", + "Gerber Image\n", + "\n", + "\n", + "\n", + "Gettext Catalog\n", + "\n", + "\n", + "\n", + "Gherkin\n", + "\n", + "\n", + "\n", + "Git Attributes\n", + "\n", + "\n", + "\n", + "Git Config\n", + "\n", + "\n", + "\n", + "GLSL\n", + "\n", + "\n", + "\n", + "Glyph\n", + "\n", + "\n", + "\n", + "Glyph Bitmap Distribution Format\n", + "\n", + "\n", + "\n", + "GN\n", + "\n", + "\n", + "\n", + "Gnuplot\n", + "\n", + "\n", + "\n", + "Go\n", + "\n", + "\n", + "\n", + "Golo\n", + "\n", + "\n", + "\n", + "Gosu\n", + "\n", + "\n", + "\n", + "Grace\n", + "\n", + "\n", + "\n", + "Gradle\n", + "\n", + "\n", + "\n", + "Grammatical Framework\n", + "\n", + "\n", + "\n", + "Graph Modeling Language\n", + "\n", + "\n", + "\n", + "GraphQL\n", + "\n", + "\n", + "\n", + "Graphviz (DOT)\n", + "\n", + "\n", + "\n", + "Groovy\n", + "\n", + "\n", + "\n", + "Groovy Server Pages\n", + "\n", + "\n", + "\n", + "Hack\n", + "\n", + "\n", + "\n", + "Haml\n", + "\n", + "\n", + "\n", + "Handlebars\n", + "\n", + "\n", + "\n", + "HAProxy\n", + "\n", + "\n", + "\n", + "Harbour\n", + "\n", + "\n", + "\n", + "Haskell\n", + "\n", + "\n", + "\n", + "Haxe\n", + "\n", + "\n", + "\n", + "HCL\n", + "\n", + "\n", + "\n", + "HiveQL\n", + "\n", + "\n", + "\n", + "HLSL\n", + "\n", + "\n", + "\n", + "HolyC\n", + "\n", + "\n", + "\n", + "HTML\n", + "\n", + "\n", + "\n", + "HTML+Django\n", + "\n", + "\n", + "\n", + "HTML+ECR\n", + "\n", + "\n", + "\n", + "HTML+EEX\n", + "\n", + "\n", + "\n", + "HTML+ERB\n", + "\n", + "\n", + "\n", + "HTML+PHP\n", + "\n", + "\n", + "\n", + "HTML+Razor\n", + "\n", + "\n", + "\n", + "HTTP\n", + "\n", + "\n", + "\n", + "HXML\n", + "\n", + "\n", + "\n", + "Hy\n", + "\n", + "\n", + "\n", + "HyPhy\n", + "\n", + "\n", + "\n", + "IDL\n", + "\n", + "\n", + "\n", + "Idris\n", + "\n", + "\n", + "\n", + "IGOR Pro\n", + "\n", + "\n", + "\n", + "Inform 7\n", + "\n", + "\n", + "\n", + "INI\n", + "\n", + "\n", + "\n", + "Inno Setup\n", + "\n", + "\n", + "\n", + "Io\n", + "\n", + "\n", + "\n", + "Ioke\n", + "\n", + "\n", + "\n", + "IRC log\n", + "\n", + "\n", + "\n", + "Isabelle\n", + "\n", + "\n", + "\n", + "Isabelle ROOT\n", + "\n", + "\n", + "\n", + "J\n", + "\n", + "\n", + "\n", + "Jasmin\n", + "\n", + "\n", + "\n", + "Java\n", + "\n", + "\n", + "\n", + "Java Properties\n", + "\n", + "\n", + "\n", + "Java Server Pages\n", + "\n", + "\n", + "\n", + "JavaScript\n", + "\n", + "\n", + "\n", + "JavaScript+ERB\n", + "\n", + "\n", + "\n", + "JFlex\n", + "\n", + "\n", + "\n", + "Jison\n", + "\n", + "\n", + "\n", + "Jison Lex\n", + "\n", + "\n", + "\n", + "Jolie\n", + "\n", + "\n", + "\n", + "JSON\n", + "\n", + "\n", + "\n", + "JSON with Comments\n", + "\n", + "\n", + "\n", + "JSON5\n", + "\n", + "\n", + "\n", + "JSONiq\n", + "\n", + "\n", + "\n", + "JSONLD\n", + "\n", + "\n", + "\n", + "Jsonnet\n", + "\n", + "\n", + "\n", + "JSX\n", + "\n", + "\n", + "\n", + "Julia\n", + "\n", + "\n", + "\n", + "Jupyter Notebook\n", + "\n", + "\n", + "\n", + "KiCad Layout\n", + "\n", + "\n", + "\n", + "KiCad Legacy Layout\n", + "\n", + "\n", + "\n", + "KiCad Schematic\n", + "\n", + "\n", + "\n", + "Kit\n", + "\n", + "\n", + "\n", + "Kotlin\n", + "\n", + "\n", + "\n", + "KRL\n", + "\n", + "\n", + "\n", + "LabVIEW\n", + "\n", + "\n", + "\n", + "Lasso\n", + "\n", + "\n", + "\n", + "Latte\n", + "\n", + "\n", + "\n", + "Lean\n", + "\n", + "\n", + "\n", + "Less\n", + "\n", + "\n", + "\n", + "Lex\n", + "\n", + "\n", + "\n", + "LFE\n", + "\n", + "\n", + "\n", + "LilyPond\n", + "\n", + "\n", + "\n", + "Limbo\n", + "\n", + "\n", + "\n", + "Linker Script\n", + "\n", + "\n", + "\n", + "Linux Kernel Module\n", + "\n", + "\n", + "\n", + "Liquid\n", + "\n", + "\n", + "\n", + "Literate Agda\n", + "\n", + "\n", + "\n", + "Literate CoffeeScript\n", + "\n", + "\n", + "\n", + "Literate Haskell\n", + "\n", + "\n", + "\n", + "LiveScript\n", + "\n", + "\n", + "\n", + "LLVM\n", + "\n", + "\n", + "\n", + "Logos\n", + "\n", + "\n", + "\n", + "Logtalk\n", + "\n", + "\n", + "\n", + "LOLCODE\n", + "\n", + "\n", + "\n", + "LookML\n", + "\n", + "\n", + "\n", + "LoomScript\n", + "\n", + "\n", + "\n", + "LSL\n", + "\n", + "\n", + "\n", + "Lua\n", + "\n", + "\n", + "\n", + "M\n", + "\n", + "\n", + "\n", + "M4\n", + "\n", + "\n", + "\n", + "M4Sugar\n", + "\n", + "\n", + "\n", + "Makefile\n", + "\n", + "\n", + "\n", + "Mako\n", + "\n", + "\n", + "\n", + "Markdown\n", + "\n", + "\n", + "\n", + "Marko\n", + "\n", + "\n", + "\n", + "Mask\n", + "\n", + "\n", + "\n", + "Mathematica\n", + "\n", + "\n", + "\n", + "MATLAB\n", + "\n", + "\n", + "\n", + "Maven POM\n", + "\n", + "\n", + "\n", + "Max\n", + "\n", + "\n", + "\n", + "MAXScript\n", + "\n", + "\n", + "\n", + "mcfunction\n", + "\n", + "\n", + "\n", + "MediaWiki\n", + "\n", + "\n", + "\n", + "Mercury\n", + "\n", + "\n", + "\n", + "Meson\n", + "\n", + "\n", + "\n", + "Metal\n", + "\n", + "\n", + "\n", + "MiniD\n", + "\n", + "\n", + "\n", + "Mirah\n", + "\n", + "\n", + "\n", + "Modelica\n", + "\n", + "\n", + "\n", + "Modula-2\n", + "\n", + "\n", + "\n", + "Modula-3\n", + "\n", + "\n", + "\n", + "Module Management System\n", + "\n", + "\n", + "\n", + "Monkey\n", + "\n", + "\n", + "\n", + "Moocode\n", + "\n", + "\n", + "\n", + "MoonScript\n", + "\n", + "\n", + "\n", + "Motorola 68K Assembly\n", + "\n", + "\n", + "\n", + "MQL4\n", + "\n", + "\n", + "\n", + "MQL5\n", + "\n", + "\n", + "\n", + "MTML\n", + "\n", + "\n", + "\n", + "MUF\n", + "\n", + "\n", + "\n", + "mupad\n", + "\n", + "\n", + "\n", + "Myghty\n", + "\n", + "\n", + "\n", + "nanorc\n", + "\n", + "\n", + "\n", + "NCL\n", + "\n", + "\n", + "\n", + "Nearley\n", + "\n", + "\n", + "\n", + "Nemerle\n", + "\n", + "\n", + "\n", + "nesC\n", + "\n", + "\n", + "\n", + "NetLinx\n", + "\n", + "\n", + "\n", + "NetLinx+ERB\n", + "\n", + "\n", + "\n", + "NetLogo\n", + "\n", + "\n", + "\n", + "NewLisp\n", + "\n", + "\n", + "\n", + "Nextflow\n", + "\n", + "\n", + "\n", + "Nginx\n", + "\n", + "\n", + "\n", + "Nim\n", + "\n", + "\n", + "\n", + "Ninja\n", + "\n", + "\n", + "\n", + "Nit\n", + "\n", + "\n", + "\n", + "Nix\n", + "\n", + "\n", + "\n", + "NL\n", + "\n", + "\n", + "\n", + "NSIS\n", + "\n", + "\n", + "\n", + "Nu\n", + "\n", + "\n", + "\n", + "NumPy\n", + "\n", + "\n", + "\n", + "ObjDump\n", + "\n", + "\n", + "\n", + "Objective-C\n", + "\n", + "\n", + "\n", + "Objective-C++\n", + "\n", + "\n", + "\n", + "Objective-J\n", + "\n", + "\n", + "\n", + "ObjectScript\n", + "\n", + "\n", + "\n", + "OCaml\n", + "\n", + "\n", + "\n", + "Omgrofl\n", + "\n", + "\n", + "\n", + "ooc\n", + "\n", + "\n", + "\n", + "Opa\n", + "\n", + "\n", + "\n", + "Opal\n", + "\n", + "\n", + "\n", + "OpenCL\n", + "\n", + "\n", + "\n", + "OpenEdge ABL\n", + "\n", + "\n", + "\n", + "OpenRC runscript\n", + "\n", + "\n", + "\n", + "OpenSCAD\n", + "\n", + "\n", + "\n", + "OpenType Feature File\n", + "\n", + "\n", + "\n", + "Org\n", + "\n", + "\n", + "\n", + "Ox\n", + "\n", + "\n", + "\n", + "Oxygene\n", + "\n", + "\n", + "\n", + "Oz\n", + "\n", + "\n", + "\n", + "P4\n", + "\n", + "\n", + "\n", + "Pan\n", + "\n", + "\n", + "\n", + "Papyrus\n", + "\n", + "\n", + "\n", + "Parrot\n", + "\n", + "\n", + "\n", + "Parrot Assembly\n", + "\n", + "\n", + "\n", + "Parrot Internal Representation\n", + "\n", + "\n", + "\n", + "Pascal\n", + "\n", + "\n", + "\n", + "Pawn\n", + "\n", + "\n", + "\n", + "Pep8\n", + "\n", + "\n", + "\n", + "Perl\n", + "\n", + "\n", + "\n", + "Perl 6\n", + "\n", + "\n", + "\n", + "PHP\n", + "\n", + "\n", + "\n", + "Pic\n", + "\n", + "\n", + "\n", + "Pickle\n", + "\n", + "\n", + "\n", + "PicoLisp\n", + "\n", + "\n", + "\n", + "PigLatin\n", + "\n", + "\n", + "\n", + "Pike\n", + "\n", + "\n", + "\n", + "PLpgSQL\n", + "\n", + "\n", + "\n", + "PLSQL\n", + "\n", + "\n", + "\n", + "Pod\n", + "\n", + "\n", + "\n", + "Pod 6\n", + "\n", + "\n", + "\n", + "PogoScript\n", + "\n", + "\n", + "\n", + "Pony\n", + "\n", + "\n", + "\n", + "PostCSS\n", + "\n", + "\n", + "\n", + "PostScript\n", + "\n", + "\n", + "\n", + "POV-Ray SDL\n", + "\n", + "\n", + "\n", + "PowerBuilder\n", + "\n", + "\n", + "\n", + "PowerShell\n", + "\n", + "\n", + "\n", + "Processing\n", + "\n", + "\n", + "\n", + "Prolog\n", + "\n", + "\n", + "\n", + "Propeller Spin\n", + "\n", + "\n", + "\n", + "Protocol Buffer\n", + "\n", + "\n", + "\n", + "Public Key\n", + "\n", + "\n", + "\n", + "Pug\n", + "\n", + "\n", + "\n", + "Puppet\n", + "\n", + "\n", + "\n", + "Pure Data\n", + "\n", + "\n", + "\n", + "PureBasic\n", + "\n", + "\n", + "\n", + "PureScript\n", + "\n", + "\n", + "\n", + "Python\n", + "\n", + "\n", + "\n", + "Python console\n", + "\n", + "\n", + "\n", + "Python traceback\n", + "\n", + "\n", + "\n", + "q\n", + "\n", + "\n", + "\n", + "QMake\n", + "\n", + "\n", + "\n", + "QML\n", + "\n", + "\n", + "\n", + "Quake\n", + "\n", + "\n", + "\n", + "R\n", + "\n", + "\n", + "\n", + "Racket\n", + "\n", + "\n", + "\n", + "Ragel\n", + "\n", + "\n", + "\n", + "RAML\n", + "\n", + "\n", + "\n", + "Rascal\n", + "\n", + "\n", + "\n", + "Raw token data\n", + "\n", + "\n", + "\n", + "RDoc\n", + "\n", + "\n", + "\n", + "REALbasic\n", + "\n", + "\n", + "\n", + "Reason\n", + "\n", + "\n", + "\n", + "Rebol\n", + "\n", + "\n", + "\n", + "Red\n", + "\n", + "\n", + "\n", + "Redcode\n", + "\n", + "\n", + "\n", + "Regular Expression\n", + "\n", + "\n", + "\n", + "Ren'Py\n", + "\n", + "\n", + "\n", + "RenderScript\n", + "\n", + "\n", + "\n", + "reStructuredText\n", + "\n", + "\n", + "\n", + "REXX\n", + "\n", + "\n", + "\n", + "RHTML\n", + "\n", + "\n", + "\n", + "Rich Text Format\n", + "\n", + "\n", + "\n", + "Ring\n", + "\n", + "\n", + "\n", + "RMarkdown\n", + "\n", + "\n", + "\n", + "RobotFramework\n", + "\n", + "\n", + "\n", + "Roff\n", + "\n", + "\n", + "\n", + "Roff Manpage\n", + "\n", + "\n", + "\n", + "Rouge\n", + "\n", + "\n", + "\n", + "RPC\n", + "\n", + "\n", + "\n", + "RPM Spec\n", + "\n", + "\n", + "\n", + "Ruby\n", + "\n", + "\n", + "\n", + "RUNOFF\n", + "\n", + "\n", + "\n", + "Rust\n", + "\n", + "\n", + "\n", + "Sage\n", + "\n", + "\n", + "\n", + "SaltStack\n", + "\n", + "\n", + "\n", + "SAS\n", + "\n", + "\n", + "\n", + "Sass\n", + "\n", + "\n", + "\n", + "Scala\n", + "\n", + "\n", + "\n", + "Scaml\n", + "\n", + "\n", + "\n", + "Scheme\n", + "\n", + "\n", + "\n", + "Scilab\n", + "\n", + "\n", + "\n", + "SCSS\n", + "\n", + "\n", + "\n", + "sed\n", + "\n", + "\n", + "\n", + "Self\n", + "\n", + "\n", + "\n", + "ShaderLab\n", + "\n", + "\n", + "\n", + "Shell\n", + "\n", + "\n", + "\n", + "ShellSession\n", + "\n", + "\n", + "\n", + "Shen\n", + "\n", + "\n", + "\n", + "Slash\n", + "\n", + "\n", + "\n", + "Slice\n", + "\n", + "\n", + "\n", + "Slim\n", + "\n", + "\n", + "\n", + "Smali\n", + "\n", + "\n", + "\n", + "Smalltalk\n", + "\n", + "\n", + "\n", + "Smarty\n", + "\n", + "\n", + "\n", + "SMT\n", + "\n", + "\n", + "\n", + "Solidity\n", + "\n", + "\n", + "\n", + "SourcePawn\n", + "\n", + "\n", + "\n", + "SPARQL\n", + "\n", + "\n", + "\n", + "Spline Font Database\n", + "\n", + "\n", + "\n", + "SQF\n", + "\n", + "\n", + "\n", + "SQL\n", + "\n", + "\n", + "\n", + "SQLPL\n", + "\n", + "\n", + "\n", + "Squirrel\n", + "\n", + "\n", + "\n", + "SRecode Template\n", + "\n", + "\n", + "\n", + "SSH Config\n", + "\n", + "\n", + "\n", + "Stan\n", + "\n", + "\n", + "\n", + "Standard ML\n", + "\n", + "\n", + "\n", + "Stata\n", + "\n", + "\n", + "\n", + "STON\n", + "\n", + "\n", + "\n", + "Stylus\n", + "\n", + "\n", + "\n", + "SubRip Text\n", + "\n", + "\n", + "\n", + "SugarSS\n", + "\n", + "\n", + "\n", + "SuperCollider\n", + "\n", + "\n", + "\n", + "SVG\n", + "\n", + "\n", + "\n", + "Swift\n", + "\n", + "\n", + "\n", + "SystemVerilog\n", + "\n", + "\n", + "\n", + "Tcl\n", + "\n", + "\n", + "\n", + "Tcsh\n", + "\n", + "\n", + "\n", + "Tea\n", + "\n", + "\n", + "\n", + "Terra\n", + "\n", + "\n", + "\n", + "TeX\n", + "\n", + "\n", + "\n", + "Text\n", + "\n", + "\n", + "\n", + "Textile\n", + "\n", + "\n", + "\n", + "Thrift\n", + "\n", + "\n", + "\n", + "TI Program\n", + "\n", + "\n", + "\n", + "TLA\n", + "\n", + "\n", + "\n", + "TOML\n", + "\n", + "\n", + "\n", + "TSQL\n", + "\n", + "\n", + "\n", + "TSX\n", + "\n", + "\n", + "\n", + "Turing\n", + "\n", + "\n", + "\n", + "Turtle\n", + "\n", + "\n", + "\n", + "Twig\n", + "\n", + "\n", + "\n", + "TXL\n", + "\n", + "\n", + "\n", + "Type Language\n", + "\n", + "\n", + "\n", + "TypeScript\n", + "\n", + "\n", + "\n", + "Unified Parallel C\n", + "\n", + "\n", + "\n", + "Unity3D Asset\n", + "\n", + "\n", + "\n", + "Unix Assembly\n", + "\n", + "\n", + "\n", + "Uno\n", + "\n", + "\n", + "\n", + "UnrealScript\n", + "\n", + "\n", + "\n", + "UrWeb\n", + "\n", + "\n", + "\n", + "Vala\n", + "\n", + "\n", + "\n", + "VCL\n", + "\n", + "\n", + "\n", + "Verilog\n", + "\n", + "\n", + "\n", + "VHDL\n", + "\n", + "\n", + "\n", + "Vim script\n", + "\n", + "\n", + "\n", + "Visual Basic\n", + "\n", + "\n", + "\n", + "Volt\n", + "\n", + "\n", + "\n", + "Vue\n", + "\n", + "\n", + "\n", + "Wavefront Material\n", + "\n", + "\n", + "\n", + "Wavefront Object\n", + "\n", + "\n", + "\n", + "wdl\n", + "\n", + "\n", + "\n", + "Web Ontology Language\n", + "\n", + "\n", + "\n", + "WebAssembly\n", + "\n", + "\n", + "\n", + "WebIDL\n", + "\n", + "\n", + "\n", + "WebVTT\n", + "\n", + "\n", + "\n", + "Windows Registry Entries\n", + "\n", + "\n", + "\n", + "wisp\n", + "\n", + "\n", + "\n", + "Wollok\n", + "\n", + "\n", + "\n", + "World of Warcraft Addon Data\n", + "\n", + "\n", + "\n", + "X BitMap\n", + "\n", + "\n", + "\n", + "X Font Directory Index\n", + "\n", + "\n", + "\n", + "X PixMap\n", + "\n", + "\n", + "\n", + "X10\n", + "\n", + "\n", + "\n", + "xBase\n", + "\n", + "\n", + "\n", + "XC\n", + "\n", + "\n", + "\n", + "XCompose\n", + "\n", + "\n", + "\n", + "XML\n", + "\n", + "\n", + "\n", + "Xojo\n", + "\n", + "\n", + "\n", + "XPages\n", + "\n", + "\n", + "\n", + "XProc\n", + "\n", + "\n", + "\n", + "XQuery\n", + "\n", + "\n", + "\n", + "XS\n", + "\n", + "\n", + "\n", + "XSLT\n", + "\n", + "\n", + "\n", + "Xtend\n", + "\n", + "\n", + "\n", + "Yacc\n", + "\n", + "\n", + "\n", + "YAML\n", + "\n", + "\n", + "\n", + "YANG\n", + "\n", + "\n", + "\n", + "YARA\n", + "\n", + "\n", + "\n", + "YASnippet\n", + "\n", + "\n", + "\n", + "ZAP\n", + "\n", + "\n", + "\n", + "Zeek\n", + "\n", + "\n", + "\n", + "ZenScript\n", + "\n", + "\n", + "\n", + "Zephir\n", + "\n", + "\n", + "\n", + "Zig\n", + "\n", + "\n", + "\n", + "ZIL\n", + "\n", + "\n", + "\n", + "Zimpl\n", + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " Date range:\n", + " Today\n", + "\n", + "\n", + "
\n", + "Adjust time span\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + " 2\n", + " \n", + "
\n", + "\"@bfred-it\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Federico Brigante

\n", + "

\n", + "bfred-it\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + " 4\n", + " \n", + "
\n", + "\"@olleolleolle\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Olle Jonsson

\n", + "

\n", + "olleolleolle\n", + "

\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
Popular repo
\n", + "

\n", + "\n", + "\n", + "\n", + " wav2c\n", + " \n", + "

\n", + "
\n", + " wav2c makes arrays out of sounds - useful for Arduino SMAPLER v2 (and for GameBoy Advance) etc\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + " 6\n", + " \n", + "
\n", + "\"@fthomas\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Frank S. Thomas

\n", + "

\n", + "fthomas\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 7\n", + " \n", + "
\n", + "\"@syuilo\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

syuilo

\n", + "

\n", + "syuilo\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + " 9\n", + " \n", + "
\n", + "\"@balloob\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Paulus Schoutsen

\n", + "

\n", + "balloob\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 10\n", + " \n", + "
\n", + "\"@sdras\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Sarah Drasner

\n", + "

\n", + "sdras\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 11\n", + " \n", + "
\n", + "\"@skmp\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Stefanos Kornilios Mitsis Poiitidis

\n", + "

\n", + "skmp\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "\n", + "
\n", + "\n", + " 15\n", + " \n", + "
\n", + "\"@mholt\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Matt Holt

\n", + "

\n", + "mholt\n", + "

\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
Popular repo
\n", + "

\n", + "\n", + "\n", + "\n", + " PapaParse\n", + " \n", + "

\n", + "
\n", + " Fast and powerful CSV (delimited text) parser that gracefully handles large files and malformed input\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "
\n", + "\n", + " 18\n", + " \n", + "
\n", + "\"@unixorn\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Joe Block

\n", + "

\n", + "unixorn\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + " 20\n", + " \n", + "
\n", + "\"@randombit\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Jack Lloyd

\n", + "

\n", + "randombit\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 21\n", + " \n", + "
\n", + "\"@rauchg\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Guillermo Rauch

\n", + "

\n", + "rauchg\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 22\n", + " \n", + "
\n", + "\"@tgriesser\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Tim Griesser

\n", + "

\n", + "tgriesser\n", + "

\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
Popular repo
\n", + "

\n", + "\n", + "\n", + "\n", + " knex\n", + " \n", + "

\n", + "
\n", + " A query builder for PostgreSQL, MySQL and SQLite3, designed to be flexible, portable, and fun to use.\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 23\n", + " \n", + "
\n", + "\"@vtjnash\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Jameson Nash

\n", + "

\n", + "vtjnash\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 24\n", + " \n", + "
\n", + "\"@andersy005\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Anderson Banihirwe

\n", + "

\n", + "andersy005\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + "\n", + " You can’t perform that action at this time.\n", + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "#printing the content from the Trending Developers\n", + "soup_html = BeautifulSoup(html,'html')\n", + "soup_html" ] }, { @@ -79,9 +3885,7 @@ "execution_count": null, "metadata": {}, "outputs": [], - "source": [ - "#your code" - ] + "source": [] }, { "cell_type": "markdown", @@ -134,11 +3938,58 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 7, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "['Eric Ma',\n", + " 'Federico Brigante',\n", + " 'Kyle Roach',\n", + " 'Olle Jonsson',\n", + " 'Nikita Sobolev',\n", + " 'Frank S. Thomas',\n", + " 'syuilo',\n", + " 'Ives van Hoorne',\n", + " 'Paulus Schoutsen',\n", + " 'Sarah Drasner',\n", + " 'Stefanos Kornilios Mitsis Poiitidis',\n", + " 'Jan Hovancik',\n", + " 'Andreas Mueller',\n", + " 'Guillaume Gomez',\n", + " 'Matt Holt',\n", + " 'Clifford Wolf',\n", + " 'Franck Nijhof',\n", + " 'Joe Block',\n", + " 'Andrei Neagoie',\n", + " 'Jack Lloyd',\n", + " 'Guillermo Rauch',\n", + " 'Tim Griesser',\n", + " 'Jameson Nash',\n", + " 'Anderson Banihirwe',\n", + " 'Danny Ryan']" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "#your code" + "#To reach the names\n", + "tags = ['h1'] #esto es una lista!\n", + "texto = soup_html.find_all(tags,{'class':'h3 lh-condensed'})\n", + "\n", + "#Método largo\n", + "#names = []\n", + "#for t in texto:\n", + "# names.append(t.text)\n", + "#names \n", + " \n", + "#list comprenhension\n", + "names = [t.text for t in texto]\n", + "names" ] }, { @@ -152,7 +4003,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 8, "metadata": {}, "outputs": [], "source": [ @@ -162,37 +4013,148 @@ }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], + "execution_count": 9, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "b'\\n\\n\\n\\n\\n\\n\\n\\n \\n \\n \\n \\n \\n \\n \\n \\n \\n\\n\\n\\n \\n \\n \\n \\n \\n \\n \\n\\n \\n \\n Trending Python repositories on GitHub today \\xc2\\xb7 GitHub\\n \\n \\n \\n \\n\\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n\\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n\\n \\n \\n \\n \\n \\n\\n\\n \\n\\n \\n\\n \\n \\n \\n\\n \\n\\n\\n\\n\\n \\n\\n\\n\\n\\n\\n\\n \\n\\n \\n \\n\\n \\n \\n\\n \\n\\n \\n\\n \\n \\n\\n \\n\\n\\n \\n\\n\\n \\n\\n \\n\\n \\n \\n\\n\\n\\n\\n\\n\\n\\n \\n\\n \\n\\n \\n \\n\\n
\\n Skip to content\\n
\\n\\n \\n \\n \\n\\n\\n
\\n
\\n
\\n \\n \\n \\n\\n
\\n \\n\\n
\\n\\n
\\n \\n Sign up\\n \\n\\n \\n
\\n
\\n\\n
\\n
\\n \\n
\\n\\n \\n\\n \\n
\\n
\\n
\\n\\n
\\n\\n
\\n\\n\\n
\\n\\n
\\n\\n\\n\\n
\\n
\\n
\\n \\n
\\n\\n\\n
\\n
\\n

Trending

\\n

See what the GitHub community is most excited about today.

\\n
\\n
\\n\\n\\n
\\n
\\n
\\n \\n\\n\\n
\\n
\\n
\\n \\n Language:\\n\\n \\n \\n Python\\n \\n \\n \\n\\n \\n
\\n Select a language\\n \\n
\\n\\n
\\n
\\n
\\n \\n
\\n
\\n
\\n\\n
\\n
\\n \\n\\n Clear language\\n
\\n\\n
\\n \\n \\n C++\\n \\n \\n \\n HTML\\n \\n \\n \\n Java\\n \\n \\n \\n JavaScript\\n \\n \\n \\n PHP\\n \\n \\n \\n Python\\n \\n \\n \\n Ruby\\n \\n\\n \\n \\n Unknown languages\\n \\n\\n \\n \\n 1C Enterprise\\n \\n \\n \\n ABAP\\n \\n \\n \\n ABNF\\n \\n \\n \\n ActionScript\\n \\n \\n \\n Ada\\n \\n \\n \\n Adobe Font Metrics\\n \\n \\n \\n Agda\\n \\n \\n \\n AGS Script\\n \\n \\n \\n Alloy\\n \\n \\n \\n Alpine Abuild\\n \\n \\n \\n Altium Designer\\n \\n \\n \\n AMPL\\n \\n \\n \\n AngelScript\\n \\n \\n \\n Ant Build System\\n \\n \\n \\n ANTLR\\n \\n \\n \\n ApacheConf\\n \\n \\n \\n Apex\\n \\n \\n \\n API Blueprint\\n \\n \\n \\n APL\\n \\n \\n \\n Apollo Guidance Computer\\n \\n \\n \\n AppleScript\\n \\n \\n \\n Arc\\n \\n \\n \\n AsciiDoc\\n \\n \\n \\n ASN.1\\n \\n \\n \\n ASP\\n \\n \\n \\n AspectJ\\n \\n \\n \\n Assembly\\n \\n \\n \\n Asymptote\\n \\n \\n \\n ATS\\n \\n \\n \\n Augeas\\n \\n \\n \\n AutoHotkey\\n \\n \\n \\n AutoIt\\n \\n \\n \\n Awk\\n \\n \\n \\n Ballerina\\n \\n \\n \\n Batchfile\\n \\n \\n \\n Befunge\\n \\n \\n \\n Bison\\n \\n \\n \\n BitBake\\n \\n \\n \\n Blade\\n \\n \\n \\n BlitzBasic\\n \\n \\n \\n BlitzMax\\n \\n \\n \\n Bluespec\\n \\n \\n \\n Boo\\n \\n \\n \\n Brainfuck\\n \\n \\n \\n Brightscript\\n \\n \\n \\n Zeek\\n \\n \\n \\n C\\n \\n \\n \\n C#\\n \\n \\n \\n C++\\n \\n \\n \\n C-ObjDump\\n \\n \\n \\n C2hs Haskell\\n \\n \\n \\n Cabal Config\\n \\n \\n \\n Cap'n Proto\\n \\n \\n \\n CartoCSS\\n \\n \\n \\n Ceylon\\n \\n \\n \\n Chapel\\n \\n \\n \\n Charity\\n \\n \\n \\n ChucK\\n \\n \\n \\n Cirru\\n \\n \\n \\n Clarion\\n \\n \\n \\n Clean\\n \\n \\n \\n Click\\n \\n \\n \\n CLIPS\\n \\n \\n \\n Clojure\\n \\n \\n \\n Closure Templates\\n \\n \\n \\n Cloud Firestore Security Rules\\n \\n \\n \\n CMake\\n \\n \\n \\n COBOL\\n \\n \\n \\n CoffeeScript\\n \\n \\n \\n ColdFusion\\n \\n \\n \\n ColdFusion CFC\\n \\n \\n \\n COLLADA\\n \\n \\n \\n Common Lisp\\n \\n \\n \\n Common Workflow Language\\n \\n \\n \\n Component Pascal\\n \\n \\n \\n CoNLL-U\\n \\n \\n \\n Cool\\n \\n \\n \\n Coq\\n \\n \\n \\n Cpp-ObjDump\\n \\n \\n \\n Creole\\n \\n \\n \\n Crystal\\n \\n \\n \\n CSON\\n \\n \\n \\n Csound\\n \\n \\n \\n Csound Document\\n \\n \\n \\n Csound Score\\n \\n \\n \\n CSS\\n \\n \\n \\n CSV\\n \\n \\n \\n Cuda\\n \\n \\n \\n CWeb\\n \\n \\n \\n Cycript\\n \\n \\n \\n Cython\\n \\n \\n \\n D\\n \\n \\n \\n D-ObjDump\\n \\n \\n \\n Darcs Patch\\n \\n \\n \\n Dart\\n \\n \\n \\n DataWeave\\n \\n \\n \\n desktop\\n \\n \\n \\n Dhall\\n \\n \\n \\n Diff\\n \\n \\n \\n DIGITAL Command Language\\n \\n \\n \\n DM\\n \\n \\n \\n DNS Zone\\n \\n \\n \\n Dockerfile\\n \\n \\n \\n Dogescript\\n \\n \\n \\n DTrace\\n \\n \\n \\n Dylan\\n \\n \\n \\n E\\n \\n \\n \\n Eagle\\n \\n \\n \\n Easybuild\\n \\n \\n \\n EBNF\\n \\n \\n \\n eC\\n \\n \\n \\n Ecere Projects\\n \\n \\n \\n ECL\\n \\n \\n \\n ECLiPSe\\n \\n \\n \\n Edje Data Collection\\n \\n \\n \\n edn\\n \\n \\n \\n Eiffel\\n \\n \\n \\n EJS\\n \\n \\n \\n Elixir\\n \\n \\n \\n Elm\\n \\n \\n \\n Emacs Lisp\\n \\n \\n \\n EmberScript\\n \\n \\n \\n EML\\n \\n \\n \\n EQ\\n \\n \\n \\n Erlang\\n \\n \\n \\n F#\\n \\n \\n \\n F*\\n \\n \\n \\n Factor\\n \\n \\n \\n Fancy\\n \\n \\n \\n Fantom\\n \\n \\n \\n FIGlet Font\\n \\n \\n \\n Filebench WML\\n \\n \\n \\n Filterscript\\n \\n \\n \\n fish\\n \\n \\n \\n FLUX\\n \\n \\n \\n Formatted\\n \\n \\n \\n Forth\\n \\n \\n \\n Fortran\\n \\n \\n \\n FreeMarker\\n \\n \\n \\n Frege\\n \\n \\n \\n G-code\\n \\n \\n \\n Game Maker Language\\n \\n \\n \\n GAMS\\n \\n \\n \\n GAP\\n \\n \\n \\n GCC Machine Description\\n \\n \\n \\n GDB\\n \\n \\n \\n GDScript\\n \\n \\n \\n Genie\\n \\n \\n \\n Genshi\\n \\n \\n \\n Gentoo Ebuild\\n \\n \\n \\n Gentoo Eclass\\n \\n \\n \\n Gerber Image\\n \\n \\n \\n Gettext Catalog\\n \\n \\n \\n Gherkin\\n \\n \\n \\n Git Attributes\\n \\n \\n \\n Git Config\\n \\n \\n \\n GLSL\\n \\n \\n \\n Glyph\\n \\n \\n \\n Glyph Bitmap Distribution Format\\n \\n \\n \\n GN\\n \\n \\n \\n Gnuplot\\n \\n \\n \\n Go\\n \\n \\n \\n Golo\\n \\n \\n \\n Gosu\\n \\n \\n \\n Grace\\n \\n \\n \\n Gradle\\n \\n \\n \\n Grammatical Framework\\n \\n \\n \\n Graph Modeling Language\\n \\n \\n \\n GraphQL\\n \\n \\n \\n Graphviz (DOT)\\n \\n \\n \\n Groovy\\n \\n \\n \\n Groovy Server Pages\\n \\n \\n \\n Hack\\n \\n \\n \\n Haml\\n \\n \\n \\n Handlebars\\n \\n \\n \\n HAProxy\\n \\n \\n \\n Harbour\\n \\n \\n \\n Haskell\\n \\n \\n \\n Haxe\\n \\n \\n \\n HCL\\n \\n \\n \\n HiveQL\\n \\n \\n \\n HLSL\\n \\n \\n \\n HolyC\\n \\n \\n \\n HTML\\n \\n \\n \\n HTML+Django\\n \\n \\n \\n HTML+ECR\\n \\n \\n \\n HTML+EEX\\n \\n \\n \\n HTML+ERB\\n \\n \\n \\n HTML+PHP\\n \\n \\n \\n HTML+Razor\\n \\n \\n \\n HTTP\\n \\n \\n \\n HXML\\n \\n \\n \\n Hy\\n \\n \\n \\n HyPhy\\n \\n \\n \\n IDL\\n \\n \\n \\n Idris\\n \\n \\n \\n IGOR Pro\\n \\n \\n \\n Inform 7\\n \\n \\n \\n INI\\n \\n \\n \\n Inno Setup\\n \\n \\n \\n Io\\n \\n \\n \\n Ioke\\n \\n \\n \\n IRC log\\n \\n \\n \\n Isabelle\\n \\n \\n \\n Isabelle ROOT\\n \\n \\n \\n J\\n \\n \\n \\n Jasmin\\n \\n \\n \\n Java\\n \\n \\n \\n Java Properties\\n \\n \\n \\n Java Server Pages\\n \\n \\n \\n JavaScript\\n \\n \\n \\n JavaScript+ERB\\n \\n \\n \\n JFlex\\n \\n \\n \\n Jison\\n \\n \\n \\n Jison Lex\\n \\n \\n \\n Jolie\\n \\n \\n \\n JSON\\n \\n \\n \\n JSON with Comments\\n \\n \\n \\n JSON5\\n \\n \\n \\n JSONiq\\n \\n \\n \\n JSONLD\\n \\n \\n \\n Jsonnet\\n \\n \\n \\n JSX\\n \\n \\n \\n Julia\\n \\n \\n \\n Jupyter Notebook\\n \\n \\n \\n KiCad Layout\\n \\n \\n \\n KiCad Legacy Layout\\n \\n \\n \\n KiCad Schematic\\n \\n \\n \\n Kit\\n \\n \\n \\n Kotlin\\n \\n \\n \\n KRL\\n \\n \\n \\n LabVIEW\\n \\n \\n \\n Lasso\\n \\n \\n \\n Latte\\n \\n \\n \\n Lean\\n \\n \\n \\n Less\\n \\n \\n \\n Lex\\n \\n \\n \\n LFE\\n \\n \\n \\n LilyPond\\n \\n \\n \\n Limbo\\n \\n \\n \\n Linker Script\\n \\n \\n \\n Linux Kernel Module\\n \\n \\n \\n Liquid\\n \\n \\n \\n Literate Agda\\n \\n \\n \\n Literate CoffeeScript\\n \\n \\n \\n Literate Haskell\\n \\n \\n \\n LiveScript\\n \\n \\n \\n LLVM\\n \\n \\n \\n Logos\\n \\n \\n \\n Logtalk\\n \\n \\n \\n LOLCODE\\n \\n \\n \\n LookML\\n \\n \\n \\n LoomScript\\n \\n \\n \\n LSL\\n \\n \\n \\n Lua\\n \\n \\n \\n M\\n \\n \\n \\n M4\\n \\n \\n \\n M4Sugar\\n \\n \\n \\n Makefile\\n \\n \\n \\n Mako\\n \\n \\n \\n Markdown\\n \\n \\n \\n Marko\\n \\n \\n \\n Mask\\n \\n \\n \\n Mathematica\\n \\n \\n \\n MATLAB\\n \\n \\n \\n Maven POM\\n \\n \\n \\n Max\\n \\n \\n \\n MAXScript\\n \\n \\n \\n mcfunction\\n \\n \\n \\n MediaWiki\\n \\n \\n \\n Mercury\\n \\n \\n \\n Meson\\n \\n \\n \\n Metal\\n \\n \\n \\n MiniD\\n \\n \\n \\n Mirah\\n \\n \\n \\n Modelica\\n \\n \\n \\n Modula-2\\n \\n \\n \\n Modula-3\\n \\n \\n \\n Module Management System\\n \\n \\n \\n Monkey\\n \\n \\n \\n Moocode\\n \\n \\n \\n MoonScript\\n \\n \\n \\n Motorola 68K Assembly\\n \\n \\n \\n MQL4\\n \\n \\n \\n MQL5\\n \\n \\n \\n MTML\\n \\n \\n \\n MUF\\n \\n \\n \\n mupad\\n \\n \\n \\n Myghty\\n \\n \\n \\n nanorc\\n \\n \\n \\n NCL\\n \\n \\n \\n Nearley\\n \\n \\n \\n Nemerle\\n \\n \\n \\n nesC\\n \\n \\n \\n NetLinx\\n \\n \\n \\n NetLinx+ERB\\n \\n \\n \\n NetLogo\\n \\n \\n \\n NewLisp\\n \\n \\n \\n Nextflow\\n \\n \\n \\n Nginx\\n \\n \\n \\n Nim\\n \\n \\n \\n Ninja\\n \\n \\n \\n Nit\\n \\n \\n \\n Nix\\n \\n \\n \\n NL\\n \\n \\n \\n NSIS\\n \\n \\n \\n Nu\\n \\n \\n \\n NumPy\\n \\n \\n \\n ObjDump\\n \\n \\n \\n Objective-C\\n \\n \\n \\n Objective-C++\\n \\n \\n \\n Objective-J\\n \\n \\n \\n ObjectScript\\n \\n \\n \\n OCaml\\n \\n \\n \\n Omgrofl\\n \\n \\n \\n ooc\\n \\n \\n \\n Opa\\n \\n \\n \\n Opal\\n \\n \\n \\n OpenCL\\n \\n \\n \\n OpenEdge ABL\\n \\n \\n \\n OpenRC runscript\\n \\n \\n \\n OpenSCAD\\n \\n \\n \\n OpenType Feature File\\n \\n \\n \\n Org\\n \\n \\n \\n Ox\\n \\n \\n \\n Oxygene\\n \\n \\n \\n Oz\\n \\n \\n \\n P4\\n \\n \\n \\n Pan\\n \\n \\n \\n Papyrus\\n \\n \\n \\n Parrot\\n \\n \\n \\n Parrot Assembly\\n \\n \\n \\n Parrot Internal Representation\\n \\n \\n \\n Pascal\\n \\n \\n \\n Pawn\\n \\n \\n \\n Pep8\\n \\n \\n \\n Perl\\n \\n \\n \\n Perl 6\\n \\n \\n \\n PHP\\n \\n \\n \\n Pic\\n \\n \\n \\n Pickle\\n \\n \\n \\n PicoLisp\\n \\n \\n \\n PigLatin\\n \\n \\n \\n Pike\\n \\n \\n \\n PLpgSQL\\n \\n \\n \\n PLSQL\\n \\n \\n \\n Pod\\n \\n \\n \\n Pod 6\\n \\n \\n \\n PogoScript\\n \\n \\n \\n Pony\\n \\n \\n \\n PostCSS\\n \\n \\n \\n PostScript\\n \\n \\n \\n POV-Ray SDL\\n \\n \\n \\n PowerBuilder\\n \\n \\n \\n PowerShell\\n \\n \\n \\n Processing\\n \\n \\n \\n Prolog\\n \\n \\n \\n Propeller Spin\\n \\n \\n \\n Protocol Buffer\\n \\n \\n \\n Public Key\\n \\n \\n \\n Pug\\n \\n \\n \\n Puppet\\n \\n \\n \\n Pure Data\\n \\n \\n \\n PureBasic\\n \\n \\n \\n PureScript\\n \\n \\n \\n Python\\n \\n \\n \\n Python console\\n \\n \\n \\n Python traceback\\n \\n \\n \\n q\\n \\n \\n \\n QMake\\n \\n \\n \\n QML\\n \\n \\n \\n Quake\\n \\n \\n \\n R\\n \\n \\n \\n Racket\\n \\n \\n \\n Ragel\\n \\n \\n \\n RAML\\n \\n \\n \\n Rascal\\n \\n \\n \\n Raw token data\\n \\n \\n \\n RDoc\\n \\n \\n \\n REALbasic\\n \\n \\n \\n Reason\\n \\n \\n \\n Rebol\\n \\n \\n \\n Red\\n \\n \\n \\n Redcode\\n \\n \\n \\n Regular Expression\\n \\n \\n \\n Ren'Py\\n \\n \\n \\n RenderScript\\n \\n \\n \\n reStructuredText\\n \\n \\n \\n REXX\\n \\n \\n \\n RHTML\\n \\n \\n \\n Rich Text Format\\n \\n \\n \\n Ring\\n \\n \\n \\n RMarkdown\\n \\n \\n \\n RobotFramework\\n \\n \\n \\n Roff\\n \\n \\n \\n Roff Manpage\\n \\n \\n \\n Rouge\\n \\n \\n \\n RPC\\n \\n \\n \\n RPM Spec\\n \\n \\n \\n Ruby\\n \\n \\n \\n RUNOFF\\n \\n \\n \\n Rust\\n \\n \\n \\n Sage\\n \\n \\n \\n SaltStack\\n \\n \\n \\n SAS\\n \\n \\n \\n Sass\\n \\n \\n \\n Scala\\n \\n \\n \\n Scaml\\n \\n \\n \\n Scheme\\n \\n \\n \\n Scilab\\n \\n \\n \\n SCSS\\n \\n \\n \\n sed\\n \\n \\n \\n Self\\n \\n \\n \\n ShaderLab\\n \\n \\n \\n Shell\\n \\n \\n \\n ShellSession\\n \\n \\n \\n Shen\\n \\n \\n \\n Slash\\n \\n \\n \\n Slice\\n \\n \\n \\n Slim\\n \\n \\n \\n Smali\\n \\n \\n \\n Smalltalk\\n \\n \\n \\n Smarty\\n \\n \\n \\n SMT\\n \\n \\n \\n Solidity\\n \\n \\n \\n SourcePawn\\n \\n \\n \\n SPARQL\\n \\n \\n \\n Spline Font Database\\n \\n \\n \\n SQF\\n \\n \\n \\n SQL\\n \\n \\n \\n SQLPL\\n \\n \\n \\n Squirrel\\n \\n \\n \\n SRecode Template\\n \\n \\n \\n SSH Config\\n \\n \\n \\n Stan\\n \\n \\n \\n Standard ML\\n \\n \\n \\n Stata\\n \\n \\n \\n STON\\n \\n \\n \\n Stylus\\n \\n \\n \\n SubRip Text\\n \\n \\n \\n SugarSS\\n \\n \\n \\n SuperCollider\\n \\n \\n \\n SVG\\n \\n \\n \\n Swift\\n \\n \\n \\n SystemVerilog\\n \\n \\n \\n Tcl\\n \\n \\n \\n Tcsh\\n \\n \\n \\n Tea\\n \\n \\n \\n Terra\\n \\n \\n \\n TeX\\n \\n \\n \\n Text\\n \\n \\n \\n Textile\\n \\n \\n \\n Thrift\\n \\n \\n \\n TI Program\\n \\n \\n \\n TLA\\n \\n \\n \\n TOML\\n \\n \\n \\n TSQL\\n \\n \\n \\n TSX\\n \\n \\n \\n Turing\\n \\n \\n \\n Turtle\\n \\n \\n \\n Twig\\n \\n \\n \\n TXL\\n \\n \\n \\n Type Language\\n \\n \\n \\n TypeScript\\n \\n \\n \\n Unified Parallel C\\n \\n \\n \\n Unity3D Asset\\n \\n \\n \\n Unix Assembly\\n \\n \\n \\n Uno\\n \\n \\n \\n UnrealScript\\n \\n \\n \\n UrWeb\\n \\n \\n \\n Vala\\n \\n \\n \\n VCL\\n \\n \\n \\n Verilog\\n \\n \\n \\n VHDL\\n \\n \\n \\n Vim script\\n \\n \\n \\n Visual Basic\\n \\n \\n \\n Volt\\n \\n \\n \\n Vue\\n \\n \\n \\n Wavefront Material\\n \\n \\n \\n Wavefront Object\\n \\n \\n \\n wdl\\n \\n \\n \\n Web Ontology Language\\n \\n \\n \\n WebAssembly\\n \\n \\n \\n WebIDL\\n \\n \\n \\n WebVTT\\n \\n \\n \\n Windows Registry Entries\\n \\n \\n \\n wisp\\n \\n \\n \\n Wollok\\n \\n \\n \\n World of Warcraft Addon Data\\n \\n \\n \\n X BitMap\\n \\n \\n \\n X Font Directory Index\\n \\n \\n \\n X PixMap\\n \\n \\n \\n X10\\n \\n \\n \\n xBase\\n \\n \\n \\n XC\\n \\n \\n \\n XCompose\\n \\n \\n \\n XML\\n \\n \\n \\n Xojo\\n \\n \\n \\n XPages\\n \\n \\n \\n XProc\\n \\n \\n \\n XQuery\\n \\n \\n \\n XS\\n \\n \\n \\n XSLT\\n \\n \\n \\n Xtend\\n \\n \\n \\n Yacc\\n \\n \\n \\n YAML\\n \\n \\n \\n YANG\\n \\n \\n \\n YARA\\n \\n \\n \\n YASnippet\\n \\n \\n \\n ZAP\\n \\n \\n \\n Zeek\\n \\n \\n \\n ZenScript\\n \\n \\n \\n Zephir\\n \\n \\n \\n Zig\\n \\n \\n \\n ZIL\\n \\n \\n \\n Zimpl\\n \\n
\\n
\\n\\n
\\n \\n
\\n
\\n
\\n\\n
\\n\\n
\\n
\\n \\n Date range:\\n Today\\n \\n \\n
\\n Adjust time span\\n \\n
\\n\\n
\\n \\n \\n Today\\n \\n \\n \\n This week\\n \\n \\n \\n This month\\n \\n
\\n
\\n
\\n\\n
\\n
\\n
\\n
\\n \\n\\n \\n\\n \\n\\n
\\n
\\n \\n \\n Star\\n\\n\\n
\\n\\n

\\n \\n \\n uber / ludwig\\n

\\n\\n

\\n Ludwig is a toolbox built on top of TensorFlow that allows to train and test deep learning models without the need to write code.\\n

\\n\\n
\\n \\n \\n Python\\n\\n\\n\\n \\n \\n 5,146\\n \\n\\n \\n \\n 547\\n \\n\\n \\n \\n Built by\\n \"@w4nderlust\"\\n \"@msaisumanth\"\\n \"@ydudin3\"\\n \"@dsblank\"\\n \"@carlogrisetti\"\\n \\n\\n \\n \\n 74 stars today\\n \\n
\\n
\\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n
\\n
\\n \\n \\n Star\\n\\n\\n
\\n\\n

\\n \\n \\n d2l-ai / d2l-zh\\n

\\n\\n

\\n \\xe3\\x80\\x8a\\xe5\\x8a\\xa8\\xe6\\x89\\x8b\\xe5\\xad\\xa6\\xe6\\xb7\\xb1\\xe5\\xba\\xa6\\xe5\\xad\\xa6\\xe4\\xb9\\xa0\\xe3\\x80\\x8b\\xef\\xbc\\x9a\\xe9\\x9d\\xa2\\xe5\\x90\\x91\\xe4\\xb8\\xad\\xe6\\x96\\x87\\xe8\\xaf\\xbb\\xe8\\x80\\x85\\xe3\\x80\\x81\\xe8\\x83\\xbd\\xe8\\xbf\\x90\\xe8\\xa1\\x8c\\xe3\\x80\\x81\\xe5\\x8f\\xaf\\xe8\\xae\\xa8\\xe8\\xae\\xba\\xe3\\x80\\x82\\xe8\\x8b\\xb1\\xe6\\x96\\x87\\xe7\\x89\\x88\\xe5\\x8d\\xb3\\xe4\\xbc\\xaf\\xe5\\x85\\x8b\\xe5\\x88\\xa9\\xe2\\x80\\x9c\\xe6\\xb7\\xb1\\xe5\\xba\\xa6\\xe5\\xad\\xa6\\xe4\\xb9\\xa0\\xe5\\xaf\\xbc\\xe8\\xae\\xba\\xef\\xbc\\x88STAT 157\\xef\\xbc\\x89\\xe2\\x80\\x9d\\xe6\\x95\\x99\\xe6\\x9d\\x90\\xe3\\x80\\x82\\n

\\n\\n
\\n \\n \\n Python\\n\\n\\n\\n \\n \\n 10,459\\n \\n\\n \\n \\n 2,665\\n \\n\\n \\n \\n Built by\\n \"@astonzhang\"\\n \"@mli\"\\n \"@szha\"\\n \"@yanwenlei\"\\n \"@XiaGenYuan\"\\n \\n\\n \\n \\n 45 stars today\\n \\n
\\n
\\n\\n \\n\\n
\\n
\\n \\n \\n Star\\n\\n\\n
\\n\\n

\\n \\n \\n beecost / bee-university\\n

\\n\\n

\\n Project thu th\\xe1\\xba\\xadp \\xc4\\x91i\\xe1\\xbb\\x83m chu\\xe1\\xba\\xa9n \\xc4\\x91\\xe1\\xba\\xa1i h\\xe1\\xbb\\x8dc 2014 - 2018 v\\xc3\\xa0 ph\\xc3\\xa2n t\\xc3\\xadch d\\xe1\\xbb\\xaf li\\xe1\\xbb\\x87u\\n

\\n\\n
\\n \\n \\n Python\\n\\n\\n\\n \\n \\n 61\\n \\n\\n \\n \\n 12\\n \\n\\n \\n \\n Built by\\n \"@tuantmtb\"\\n \\n\\n \\n \\n 5 stars today\\n \\n
\\n
\\n\\n \\n\\n
\\n
\\n
\\n
\\n
\\n\\n
\\n\\n \\n\\n\\n\\n\\n
\\n \\n \\n You can\\xe2\\x80\\x99t perform that action at this time.\\n
\\n\\n\\n \\n \\n \\n \\n \\n \\n \\n
\\n \\n You signed in with another tab or window. Reload to refresh your session.\\n You signed out in another tab or window. Reload to refresh your session.\\n
\\n \\n\\n
\\n
\\n
\\n
\\n\\n
\\n\\n \\n\\n\\n'" + ] + }, + "execution_count": 9, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "#your code" + "#your code\n", + "html = requests.get(url).content\n", + "html" ] }, { - "cell_type": "markdown", - "metadata": {}, + "cell_type": "code", + "execution_count": 10, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "['gto76/python-cheatsheet',\n", + " 'j3ssie/Osmedeus',\n", + " 'tangzixiang0304/Shielded_detector',\n", + " 'uber/ludwig',\n", + " 'xinshuoweng/AB3DMOT',\n", + " 'NVlabs/stylegan',\n", + " 'dagster-io/dagster',\n", + " 'tensorflow/models',\n", + " 'eragonruan/text-detection-ctpn',\n", + " 'sherlock-project/sherlock',\n", + " 'deepfakes/faceswap',\n", + " 'nbei/Deep-Flow-Guided-Video-Inpainting',\n", + " 'iovisor/bcc',\n", + " 'Roibal/Cryptocurrency-Trading-Bots-Python-Beginner-Advance',\n", + " 'NVIDIA/DeepLearningExamples',\n", + " 'BlackHC/tfpyth',\n", + " 'clovaai/deep-text-recognition-benchmark',\n", + " 'tkat0/PyTorch_BlazeFace',\n", + " 'OpenMined/PySyft',\n", + " 'CoreyMSchafer/code_snippets',\n", + " 'public-apis/public-apis',\n", + " 'd2l-ai/d2l-zh',\n", + " 'apache/airflow',\n", + " 'beecost/bee-university',\n", + " 'sundowndev/PhoneInfoga']" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "#### Display all the image links from Walt Disney wikipedia page" + "soup_html = BeautifulSoup(html,'html')\n", + "tags = ['h1']\n", + "texto = soup_html.find_all(tags,{'class':'h3 lh-condensed'})\n", + "\n", + "names = [t.text.replace('\\n','').replace(' ','') for t in texto]\n", + "names\n", + "\n" ] }, { - "cell_type": "code", - "execution_count": null, + "cell_type": "markdown", "metadata": {}, - "outputs": [], "source": [ - "# This is the url you will scrape in this exercise\n", - "url = 'https://en.wikipedia.org/wiki/Walt_Disney'" + "#### Display all the image links from Walt Disney wikipedia page" ] }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], + "execution_count": 11, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "['//upload.wikimedia.org/wikipedia/en/thumb/e/e7/Cscr-featured.svg/20px-Cscr-featured.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/1/1b/Semi-protection-shackle.svg/20px-Semi-protection-shackle.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/d/df/Walt_Disney_1946.JPG/220px-Walt_Disney_1946.JPG',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/8/87/Walt_Disney_1942_signature.svg/150px-Walt_Disney_1942_signature.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/c/c4/Walt_Disney_envelope_ca._1921.jpg/220px-Walt_Disney_envelope_ca._1921.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/4/4d/Newman_Laugh-O-Gram_%281921%29.webm/220px-seek%3D2-Newman_Laugh-O-Gram_%281921%29.webm.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/0/0d/Trolley_Troubles_poster.jpg/170px-Trolley_Troubles_poster.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/7/71/Walt_Disney_and_his_cartoon_creation_%22Mickey_Mouse%22_-_National_Board_of_Review_Magazine.jpg/170px-Walt_Disney_and_his_cartoon_creation_%22Mickey_Mouse%22_-_National_Board_of_Review_Magazine.jpg',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/4/4e/Steamboat-willie.jpg/170px-Steamboat-willie.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/5/57/Walt_Disney_1935.jpg/170px-Walt_Disney_1935.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/c/cd/Walt_Disney_Snow_white_1937_trailer_screenshot_%2813%29.jpg/220px-Walt_Disney_Snow_white_1937_trailer_screenshot_%2813%29.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/1/15/Disney_drawing_goofy.jpg/170px-Disney_drawing_goofy.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/1/13/DisneySchiphol1951.jpg/220px-DisneySchiphol1951.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/8/8c/WaltDisneyplansDisneylandDec1954.jpg/220px-WaltDisneyplansDisneylandDec1954.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/f/ff/Walt_disney_portrait_right.jpg/170px-Walt_disney_portrait_right.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/1/1a/Walt_Disney_Grave.JPG/170px-Walt_Disney_Grave.JPG',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/2/2d/Roy_O._Disney_with_Company_at_Press_Conference.jpg/170px-Roy_O._Disney_with_Company_at_Press_Conference.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/a/a9/Disney_Display_Case.JPG/170px-Disney_Display_Case.JPG',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/6/6c/Disney1968.jpg/170px-Disney1968.jpg',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/8/8a/OOjs_UI_icon_edit-ltr-progressive.svg/10px-OOjs_UI_icon_edit-ltr-progressive.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/d/da/Animation_disc.svg/30px-Animation_disc.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/6/69/P_vip.svg/29px-P_vip.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/1/1a/Magic_Kingdom_castle.jpg/24px-Magic_Kingdom_castle.jpg',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/e/e7/Video-x-generic.svg/30px-Video-x-generic.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/a/a3/Flag_of_Los_Angeles_County%2C_California.svg/30px-Flag_of_Los_Angeles_County%2C_California.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/a/a3/USA_flag_on_television.svg/30px-USA_flag_on_television.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/4/4a/Commons-logo.svg/22px-Commons-logo.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/f/fa/Wikiquote-logo.svg/25px-Wikiquote-logo.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/f/ff/Wikidata-logo.svg/30px-Wikidata-logo.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/8/8a/OOjs_UI_icon_edit-ltr-progressive.svg/10px-OOjs_UI_icon_edit-ltr-progressive.svg.png',\n", + " '//en.wikipedia.org/wiki/Special:CentralAutoLogin/start?type=1x1',\n", + " '/static/images/wikimedia-button.png',\n", + " '/static/images/poweredby_mediawiki_88x31.png']" + ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "#your code" + "# This is the url you will scrape in this exercise\n", + "url = 'https://en.wikipedia.org/wiki/Walt_Disney'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')\n", + "\n", + "tags = ['img']\n", + "images = soup_html.find_all(tags)\n", + "\n", + "image_list = [i.attrs['src'] for i in images]\n", + "image_list" ] }, { @@ -204,21 +4166,189 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 12, "metadata": {}, "outputs": [], "source": [ "# This is the url you will scrape in this exercise\n", - "url ='https://en.wikipedia.org/wiki/Python' " + "url ='https://en.wikipedia.org/wiki/Python'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')" ] }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], + "execution_count": 13, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "['https://en.wiktionary.org/wiki/Python',\n", + " 'https://en.wiktionary.org/wiki/python',\n", + " '/w/index.php?title=Python&action=edit§ion=1',\n", + " '/wiki/Pythonidae',\n", + " '/wiki/Python_(genus)',\n", + " '/w/index.php?title=Python&action=edit§ion=2',\n", + " '/wiki/Python_(mythology)',\n", + " '/wiki/Python_of_Aenus',\n", + " '/wiki/Python_(painter)',\n", + " '/wiki/Python_of_Byzantium',\n", + " '/wiki/Python_of_Catana',\n", + " '/w/index.php?title=Python&action=edit§ion=3',\n", + " '/wiki/Python_(film)',\n", + " '/wiki/Pythons_2',\n", + " '/wiki/Monty_Python',\n", + " '/wiki/Python_(Monty)_Pictures',\n", + " '/w/index.php?title=Python&action=edit§ion=4',\n", + " '/wiki/Python_(programming_language)',\n", + " '/wiki/CPython',\n", + " '/wiki/CMU_Common_Lisp',\n", + " '/wiki/PERQ#PERQ_3',\n", + " '/w/index.php?title=Python&action=edit§ion=5',\n", + " '/w/index.php?title=Python&action=edit§ion=6',\n", + " '/wiki/Python_(Busch_Gardens_Tampa_Bay)',\n", + " '/wiki/Python_(Coney_Island,_Cincinnati,_Ohio)',\n", + " '/wiki/Python_(Efteling)',\n", + " '/w/index.php?title=Python&action=edit§ion=7',\n", + " '/wiki/Python_(automobile_maker)',\n", + " '/wiki/Python_(Ford_prototype)',\n", + " '/w/index.php?title=Python&action=edit§ion=8',\n", + " '/wiki/Colt_Python',\n", + " '/wiki/Python_(missile)',\n", + " '/wiki/Python_(nuclear_primary)',\n", + " '/w/index.php?title=Python&action=edit§ion=9',\n", + " '/wiki/Python_Anghelo',\n", + " '/w/index.php?title=Python&action=edit§ion=10',\n", + " '/wiki/PYTHON',\n", + " '/w/index.php?title=Python&action=edit§ion=11',\n", + " '/wiki/Cython',\n", + " '/wiki/Pyton',\n", + " '/wiki/File:Disambig_gray.svg',\n", + " '/wiki/Help:Disambiguation',\n", + " '//en.wikipedia.org/w/index.php?title=Special:WhatLinksHere/Python&namespace=0',\n", + " 'https://en.wikipedia.org/w/index.php?title=Python&oldid=905477736',\n", + " '/wiki/Help:Category',\n", + " '/wiki/Category:Disambiguation_pages',\n", + " '/wiki/Category:Disambiguation_pages_with_short_description',\n", + " '/wiki/Category:All_article_disambiguation_pages',\n", + " '/wiki/Category:All_disambiguation_pages',\n", + " '/wiki/Category:Animal_common_name_disambiguation_pages',\n", + " '/wiki/Special:MyTalk',\n", + " '/wiki/Special:MyContributions',\n", + " '/w/index.php?title=Special:CreateAccount&returnto=Python',\n", + " '/w/index.php?title=Special:UserLogin&returnto=Python',\n", + " '/wiki/Python',\n", + " '/wiki/Talk:Python',\n", + " '/wiki/Python',\n", + " '/w/index.php?title=Python&action=edit',\n", + " '/w/index.php?title=Python&action=history',\n", + " '/wiki/Main_Page',\n", + " '/wiki/Main_Page',\n", + " '/wiki/Portal:Contents',\n", + " '/wiki/Portal:Featured_content',\n", + " '/wiki/Portal:Current_events',\n", + " '/wiki/Special:Random',\n", + " 'https://donate.wikimedia.org/wiki/Special:FundraiserRedirector?utm_source=donate&utm_medium=sidebar&utm_campaign=C13_en.wikipedia.org&uselang=en',\n", + " '//shop.wikimedia.org',\n", + " '/wiki/Help:Contents',\n", + " '/wiki/Wikipedia:About',\n", + " '/wiki/Wikipedia:Community_portal',\n", + " '/wiki/Special:RecentChanges',\n", + " '//en.wikipedia.org/wiki/Wikipedia:Contact_us',\n", + " '/wiki/Special:WhatLinksHere/Python',\n", + " '/wiki/Special:RecentChangesLinked/Python',\n", + " '/wiki/Wikipedia:File_Upload_Wizard',\n", + " '/wiki/Special:SpecialPages',\n", + " '/w/index.php?title=Python&oldid=905477736',\n", + " '/w/index.php?title=Python&action=info',\n", + " 'https://www.wikidata.org/wiki/Special:EntityPage/Q747452',\n", + " '/w/index.php?title=Special:CiteThisPage&page=Python&id=905477736',\n", + " 'https://commons.wikimedia.org/wiki/Category:Python',\n", + " '/w/index.php?title=Special:Book&bookcmd=book_creator&referer=Python',\n", + " '/w/index.php?title=Special:ElectronPdf&page=Python&action=show-download-screen',\n", + " '/w/index.php?title=Python&printable=yes',\n", + " 'https://af.wikipedia.org/wiki/Python',\n", + " 'https://als.wikipedia.org/wiki/Python',\n", + " 'https://az.wikipedia.org/wiki/Python',\n", + " 'https://bn.wikipedia.org/wiki/%E0%A6%AA%E0%A6%BE%E0%A6%87%E0%A6%A5%E0%A6%A8_(%E0%A6%A6%E0%A7%8D%E0%A6%AC%E0%A7%8D%E0%A6%AF%E0%A6%B0%E0%A7%8D%E0%A6%A5%E0%A6%A4%E0%A6%BE_%E0%A6%A8%E0%A6%BF%E0%A6%B0%E0%A6%B8%E0%A6%A8)',\n", + " 'https://be.wikipedia.org/wiki/Python',\n", + " 'https://bg.wikipedia.org/wiki/%D0%9F%D0%B8%D1%82%D0%BE%D0%BD_(%D0%BF%D0%BE%D1%8F%D1%81%D0%BD%D0%B5%D0%BD%D0%B8%D0%B5)',\n", + " 'https://cs.wikipedia.org/wiki/Python_(rozcestn%C3%ADk)',\n", + " 'https://da.wikipedia.org/wiki/Python',\n", + " 'https://de.wikipedia.org/wiki/Python',\n", + " 'https://eo.wikipedia.org/wiki/Pitono_(apartigilo)',\n", + " 'https://eu.wikipedia.org/wiki/Python_(argipena)',\n", + " 'https://fa.wikipedia.org/wiki/%D9%BE%D8%A7%DB%8C%D8%AA%D9%88%D9%86',\n", + " 'https://fr.wikipedia.org/wiki/Python',\n", + " 'https://ko.wikipedia.org/wiki/%ED%8C%8C%EC%9D%B4%EC%84%A0',\n", + " 'https://hr.wikipedia.org/wiki/Python_(razdvojba)',\n", + " 'https://io.wikipedia.org/wiki/Pitono',\n", + " 'https://id.wikipedia.org/wiki/Python',\n", + " 'https://ia.wikipedia.org/wiki/Python_(disambiguation)',\n", + " 'https://is.wikipedia.org/wiki/Python_(a%C3%B0greining)',\n", + " 'https://it.wikipedia.org/wiki/Python_(disambigua)',\n", + " 'https://he.wikipedia.org/wiki/%D7%A4%D7%99%D7%AA%D7%95%D7%9F',\n", + " 'https://ka.wikipedia.org/wiki/%E1%83%9E%E1%83%98%E1%83%97%E1%83%9D%E1%83%9C%E1%83%98_(%E1%83%9B%E1%83%A0%E1%83%90%E1%83%95%E1%83%90%E1%83%9A%E1%83%9B%E1%83%9C%E1%83%98%E1%83%A8%E1%83%95%E1%83%9C%E1%83%94%E1%83%9A%E1%83%9D%E1%83%95%E1%83%90%E1%83%9C%E1%83%98)',\n", + " 'https://kg.wikipedia.org/wiki/Mboma_(nyoka)',\n", + " 'https://la.wikipedia.org/wiki/Python_(discretiva)',\n", + " 'https://lb.wikipedia.org/wiki/Python',\n", + " 'https://hu.wikipedia.org/wiki/Python_(egy%C3%A9rtelm%C5%B1s%C3%ADt%C5%91_lap)',\n", + " 'https://mr.wikipedia.org/wiki/%E0%A4%AA%E0%A4%BE%E0%A4%AF%E0%A4%A5%E0%A5%89%E0%A4%A8_(%E0%A4%86%E0%A4%9C%E0%A5%8D%E0%A4%9E%E0%A4%BE%E0%A4%B5%E0%A4%B2%E0%A5%80_%E0%A4%AD%E0%A4%BE%E0%A4%B7%E0%A4%BE)',\n", + " 'https://nl.wikipedia.org/wiki/Python',\n", + " 'https://ja.wikipedia.org/wiki/%E3%83%91%E3%82%A4%E3%82%BD%E3%83%B3',\n", + " 'https://no.wikipedia.org/wiki/Pyton',\n", + " 'https://pl.wikipedia.org/wiki/Pyton',\n", + " 'https://pt.wikipedia.org/wiki/Python_(desambigua%C3%A7%C3%A3o)',\n", + " 'https://ru.wikipedia.org/wiki/Python_(%D0%B7%D0%BD%D0%B0%D1%87%D0%B5%D0%BD%D0%B8%D1%8F)',\n", + " 'https://sd.wikipedia.org/wiki/%D8%A7%D8%B1%DA%99',\n", + " 'https://sk.wikipedia.org/wiki/Python',\n", + " 'https://sh.wikipedia.org/wiki/Python',\n", + " 'https://fi.wikipedia.org/wiki/Python',\n", + " 'https://sv.wikipedia.org/wiki/Pyton',\n", + " 'https://th.wikipedia.org/wiki/%E0%B9%84%E0%B8%9E%E0%B8%97%E0%B8%AD%E0%B8%99',\n", + " 'https://tr.wikipedia.org/wiki/Python',\n", + " 'https://uk.wikipedia.org/wiki/%D0%9F%D1%96%D1%84%D0%BE%D0%BD',\n", + " 'https://ur.wikipedia.org/wiki/%D9%BE%D8%A7%D8%A6%DB%8C%D8%AA%DA%BE%D9%88%D9%86',\n", + " 'https://vi.wikipedia.org/wiki/Python',\n", + " 'https://zh.wikipedia.org/wiki/Python_(%E6%B6%88%E6%AD%A7%E4%B9%89)',\n", + " 'https://www.wikidata.org/wiki/Special:EntityPage/Q747452#sitelinks-wikipedia',\n", + " '//en.wikipedia.org/wiki/Wikipedia:Text_of_Creative_Commons_Attribution-ShareAlike_3.0_Unported_License',\n", + " '//creativecommons.org/licenses/by-sa/3.0/',\n", + " '//foundation.wikimedia.org/wiki/Terms_of_Use',\n", + " '//foundation.wikimedia.org/wiki/Privacy_policy',\n", + " '//www.wikimediafoundation.org/',\n", + " 'https://foundation.wikimedia.org/wiki/Privacy_policy',\n", + " '/wiki/Wikipedia:About',\n", + " '/wiki/Wikipedia:General_disclaimer',\n", + " '//en.wikipedia.org/wiki/Wikipedia:Contact_us',\n", + " 'https://www.mediawiki.org/wiki/Special:MyLanguage/How_to_contribute',\n", + " 'https://foundation.wikimedia.org/wiki/Cookie_statement',\n", + " '//en.m.wikipedia.org/w/index.php?title=Python&mobileaction=toggle_view_mobile',\n", + " 'https://wikimediafoundation.org/',\n", + " 'https://www.mediawiki.org/']" + ] + }, + "execution_count": 13, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "#your code" + "wiki_links = soup_html.find_all('a',{'href':True})\n", + "\n", + "wiki_links_list = [w['href'] for w in wiki_links if not w['href'].startswith('#')]\n", + "wiki_links_list\n", + "\n", + "#wiki_links_list = []\n", + "#for i in wiki_links:\n", + "# try:\n", + "# wiki_links_list.append(i.attrs['href'])\n", + "# except:\n", + "# pass\n", + "#wiki_links" ] }, { @@ -230,21 +4360,44 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 14, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "['Title 2 - The Congress',\n", + " 'Title 6 - Domestic Security',\n", + " 'Title 7 - Agriculture',\n", + " 'Title 15 - Commerce and Trade',\n", + " 'Title 16 - Conservation',\n", + " 'Title 19 - Customs Duties',\n", + " 'Title 21 - Food and Drugs',\n", + " 'Title 26 - Internal Revenue Code',\n", + " 'Title 34 - Crime Control and Law Enforcement',\n", + " \"Title 38 - Veterans' Benefits\",\n", + " 'Title 42 - The Public Health and Welfare',\n", + " 'Title 43 - Public Lands',\n", + " 'Title 48 - Territories and Insular Possessions',\n", + " 'Title 49 - Transportation',\n", + " 'Title 50 - War and National Defense']" + ] + }, + "execution_count": 14, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'http://uscode.house.gov/download/download.shtml'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#your code" + "url = 'http://uscode.house.gov/download/download.shtml'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')\n", + "\n", + "titles = soup_html.find_all('div',{'class':'usctitlechanged'})\n", + "\n", + "titles_list = [t.text.replace('\\n\\n ','').replace('\\n\\n ','') for t in titles]\n", + "titles_list" ] }, { @@ -256,21 +4409,38 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 15, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "['ALEJANDRO ROSALES CASTILLO',\n", + " 'YASER ABDEL SAID',\n", + " 'JASON DEREK BROWN',\n", + " 'RAFAEL CARO-QUINTERO',\n", + " 'ALEXIS FLORES',\n", + " 'EUGENE PALMER',\n", + " 'SANTIAGO VILLALBA MEDEROS',\n", + " 'ROBERT WILLIAM FISHER',\n", + " 'BHADRESHKUMAR CHETANBHAI PATEL',\n", + " 'ARNOLDO JIMENEZ']" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'https://www.fbi.gov/wanted/topten'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#your code " + "url = 'https://www.fbi.gov/wanted/topten'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html5lib')\n", + "\n", + "wanted = soup_html.find_all('h3',{'class':'title'})\n", + "wanted_list = [w.text.replace('\\n','') for w in wanted]\n", + "wanted_list" ] }, { @@ -282,21 +4452,654 @@ }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], + "execution_count": 16, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Date & Time UTCLatitude degreesLongitude degreesRegion name [+]
12345678910›»12345678910›»12345678910›».112345678910›»12345678910›».112345678910›»
02019-07-16 20:52:18.608min ago36.07N117.84W2.0
12019-07-16 20:49:09.111min ago36.07N117.65W2.0
22019-07-16 20:33:52.927min ago40.09N19.91E2.7
32019-07-16 20:31:33.329min ago23.45S66.86W4.5
42019-07-16 20:29:07.731min ago35.86N117.69W2.2
52019-07-16 20:23:34.737min ago36.07N117.84W2.0
62019-07-16 20:19:00.142min ago33.10N12.42W2.8
72019-07-16 20:17:51.643min ago35.55N117.43W2.8
82019-07-16 20:15:36.845min ago35.78N117.62W4.5
92019-07-16 20:11:01.550min ago37.82N121.77W4.3
102019-07-16 19:42:25.91hr 18min ago35.61N117.47W2.3
112019-07-16 19:35:57.01hr 25min ago35.62N117.45W2.1
122019-07-16 19:23:50.11hr 37min ago36.19N117.89W2.7
132019-07-16 19:20:21.41hr 40min ago38.39N16.94E3.1
142019-07-16 19:16:53.81hr 44min ago38.45N16.91E2.6
152019-07-16 19:16:15.91hr 44min ago61.27N152.44W2.4
162019-07-16 19:11:48.91hr 49min ago36.03N117.87W2.5
172019-07-16 19:04:00.21hr 57min ago35.96N117.71W2.0
182019-07-16 19:01:48.01hr 59min ago39.56N67.17E3.6
192019-07-16 19:01:00.82hr 00min ago35.68N117.54W2.5
202019-07-16 18:53:32.02hr 07min ago0.68S126.36E4.0
212019-07-16 18:50:16.22hr 10min ago43.62N75.40E3.2
222019-07-16 18:47:48.92hr 13min ago35.59N117.42W2.1
232019-07-16 18:36:26.82hr 24min ago35.74N117.56W2.7
242019-07-16 18:22:31.92hr 38min ago35.65N117.52W2.0
252019-07-16 18:15:26.52hr 45min ago28.47N56.76E4.3
262019-07-16 18:10:01.02hr 51min ago34.41S150.73E2.4
272019-07-16 17:48:24.03hr 12min ago9.93S118.23E4.1
282019-07-16 17:42:29.93hr 18min ago35.67N117.54W2.0
292019-07-16 17:39:43.03hr 21min ago0.54S127.86E4.1
302019-07-16 17:31:56.03hr 29min ago35.67N117.47W2.3
312019-07-16 17:05:45.03hr 55min ago36.20N117.90W2.9
322019-07-16 17:05:08.03hr 55min ago15.40N94.64W4.2
332019-07-16 17:01:30.83hr 59min ago36.10N117.90W2.1
342019-07-16 16:45:56.54hr 15min ago0.68S127.58E4.7
352019-07-16 16:45:55.04hr 15min ago18.99N70.09W2.9
362019-07-16 16:43:40.94hr 17min ago37.23N28.27E2.7
372019-07-16 16:43:21.74hr 17min ago36.03N117.79W2.4
382019-07-16 16:36:41.54hr 24min ago35.96N117.30W2.1
392019-07-16 16:28:38.14hr 32min ago35.92N117.68W2.3
402019-07-16 16:27:59.04hr 33min ago18.51S120.55E2.9
412019-07-16 16:26:00.54hr 35min ago30.57N141.98E4.8
422019-07-16 16:21:05.14hr 39min ago28.45N56.70E4.5
432019-07-16 16:01:04.34hr 59min ago62.22N150.00W2.3
442019-07-16 15:59:52.05hr 01min ago35.81N117.63W2.9
452019-07-16 15:57:04.45hr 03min ago36.10N117.82W3.0
462019-07-16 15:28:58.05hr 32min ago18.26S120.37E3.3
472019-07-16 15:26:26.65hr 34min ago35.68N117.51W2.0
482019-07-16 15:25:42.65hr 35min ago37.16N141.54E4.6
492019-07-16 15:13:22.15hr 47min ago35.90N117.67W2.1
50NaNNaNNaNNaNNaNNaN
5112345678910›»12345678910›»12345678910›»12345678910›»12345678910›»12345678910›»
52NaNNaNNaNNaNNaNNaN
\n", + "
" + ], + "text/plain": [ + " Date & Time UTC Latitude degrees \\\n", + " 12345678910›» 12345678910›» 12345678910›».1 \n", + "0 2019-07-16 20:52:18.608min ago 36.07 N \n", + "1 2019-07-16 20:49:09.111min ago 36.07 N \n", + "2 2019-07-16 20:33:52.927min ago 40.09 N \n", + "3 2019-07-16 20:31:33.329min ago 23.45 S \n", + "4 2019-07-16 20:29:07.731min ago 35.86 N \n", + "5 2019-07-16 20:23:34.737min ago 36.07 N \n", + "6 2019-07-16 20:19:00.142min ago 33.10 N \n", + "7 2019-07-16 20:17:51.643min ago 35.55 N \n", + "8 2019-07-16 20:15:36.845min ago 35.78 N \n", + "9 2019-07-16 20:11:01.550min ago 37.82 N \n", + "10 2019-07-16 19:42:25.91hr 18min ago 35.61 N \n", + "11 2019-07-16 19:35:57.01hr 25min ago 35.62 N \n", + "12 2019-07-16 19:23:50.11hr 37min ago 36.19 N \n", + "13 2019-07-16 19:20:21.41hr 40min ago 38.39 N \n", + "14 2019-07-16 19:16:53.81hr 44min ago 38.45 N \n", + "15 2019-07-16 19:16:15.91hr 44min ago 61.27 N \n", + "16 2019-07-16 19:11:48.91hr 49min ago 36.03 N \n", + "17 2019-07-16 19:04:00.21hr 57min ago 35.96 N \n", + "18 2019-07-16 19:01:48.01hr 59min ago 39.56 N \n", + "19 2019-07-16 19:01:00.82hr 00min ago 35.68 N \n", + "20 2019-07-16 18:53:32.02hr 07min ago 0.68 S \n", + "21 2019-07-16 18:50:16.22hr 10min ago 43.62 N \n", + "22 2019-07-16 18:47:48.92hr 13min ago 35.59 N \n", + "23 2019-07-16 18:36:26.82hr 24min ago 35.74 N \n", + "24 2019-07-16 18:22:31.92hr 38min ago 35.65 N \n", + "25 2019-07-16 18:15:26.52hr 45min ago 28.47 N \n", + "26 2019-07-16 18:10:01.02hr 51min ago 34.41 S \n", + "27 2019-07-16 17:48:24.03hr 12min ago 9.93 S \n", + "28 2019-07-16 17:42:29.93hr 18min ago 35.67 N \n", + "29 2019-07-16 17:39:43.03hr 21min ago 0.54 S \n", + "30 2019-07-16 17:31:56.03hr 29min ago 35.67 N \n", + "31 2019-07-16 17:05:45.03hr 55min ago 36.20 N \n", + "32 2019-07-16 17:05:08.03hr 55min ago 15.40 N \n", + "33 2019-07-16 17:01:30.83hr 59min ago 36.10 N \n", + "34 2019-07-16 16:45:56.54hr 15min ago 0.68 S \n", + "35 2019-07-16 16:45:55.04hr 15min ago 18.99 N \n", + "36 2019-07-16 16:43:40.94hr 17min ago 37.23 N \n", + "37 2019-07-16 16:43:21.74hr 17min ago 36.03 N \n", + "38 2019-07-16 16:36:41.54hr 24min ago 35.96 N \n", + "39 2019-07-16 16:28:38.14hr 32min ago 35.92 N \n", + "40 2019-07-16 16:27:59.04hr 33min ago 18.51 S \n", + "41 2019-07-16 16:26:00.54hr 35min ago 30.57 N \n", + "42 2019-07-16 16:21:05.14hr 39min ago 28.45 N \n", + "43 2019-07-16 16:01:04.34hr 59min ago 62.22 N \n", + "44 2019-07-16 15:59:52.05hr 01min ago 35.81 N \n", + "45 2019-07-16 15:57:04.45hr 03min ago 36.10 N \n", + "46 2019-07-16 15:28:58.05hr 32min ago 18.26 S \n", + "47 2019-07-16 15:26:26.65hr 34min ago 35.68 N \n", + "48 2019-07-16 15:25:42.65hr 35min ago 37.16 N \n", + "49 2019-07-16 15:13:22.15hr 47min ago 35.90 N \n", + "50 NaN NaN NaN \n", + "51 12345678910›» 12345678910›» 12345678910›» \n", + "52 NaN NaN NaN \n", + "\n", + " Longitude degrees Region name [+] \n", + " 12345678910›» 12345678910›».1 12345678910›» \n", + "0 117.84 W 2.0 \n", + "1 117.65 W 2.0 \n", + "2 19.91 E 2.7 \n", + "3 66.86 W 4.5 \n", + "4 117.69 W 2.2 \n", + "5 117.84 W 2.0 \n", + "6 12.42 W 2.8 \n", + "7 117.43 W 2.8 \n", + "8 117.62 W 4.5 \n", + "9 121.77 W 4.3 \n", + "10 117.47 W 2.3 \n", + "11 117.45 W 2.1 \n", + "12 117.89 W 2.7 \n", + "13 16.94 E 3.1 \n", + "14 16.91 E 2.6 \n", + "15 152.44 W 2.4 \n", + "16 117.87 W 2.5 \n", + "17 117.71 W 2.0 \n", + "18 67.17 E 3.6 \n", + "19 117.54 W 2.5 \n", + "20 126.36 E 4.0 \n", + "21 75.40 E 3.2 \n", + "22 117.42 W 2.1 \n", + "23 117.56 W 2.7 \n", + "24 117.52 W 2.0 \n", + "25 56.76 E 4.3 \n", + "26 150.73 E 2.4 \n", + "27 118.23 E 4.1 \n", + "28 117.54 W 2.0 \n", + "29 127.86 E 4.1 \n", + "30 117.47 W 2.3 \n", + "31 117.90 W 2.9 \n", + "32 94.64 W 4.2 \n", + "33 117.90 W 2.1 \n", + "34 127.58 E 4.7 \n", + "35 70.09 W 2.9 \n", + "36 28.27 E 2.7 \n", + "37 117.79 W 2.4 \n", + "38 117.30 W 2.1 \n", + "39 117.68 W 2.3 \n", + "40 120.55 E 2.9 \n", + "41 141.98 E 4.8 \n", + "42 56.70 E 4.5 \n", + "43 150.00 W 2.3 \n", + "44 117.63 W 2.9 \n", + "45 117.82 W 3.0 \n", + "46 120.37 E 3.3 \n", + "47 117.51 W 2.0 \n", + "48 141.54 E 4.6 \n", + "49 117.67 W 2.1 \n", + "50 NaN NaN NaN \n", + "51 12345678910›» 12345678910›» 12345678910›» \n", + "52 NaN NaN NaN " + ] + }, + "execution_count": 16, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'https://www.emsc-csem.org/Earthquake/'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#your code" + "url = 'https://www.emsc-csem.org/Earthquake/'\n", + "html = requests.get(url).content\n", + "df_list = pd.read_html(html)\n", + "df_list[3][['Date & Time UTC','Latitude degrees','Longitude degrees','Region name [+]']]" ] }, { @@ -308,21 +5111,88 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 17, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
01
0Code Geist Hackathon by SefrWahed[7/29/2019]
1The Code Factor[5/21/2019]
2TECHFEST MUNICH[9/6/2019]
3Galileo App Competition[1/31/2019]
\n", + "
" + ], + "text/plain": [ + " 0 1\n", + "0 Code Geist Hackathon by SefrWahed [7/29/2019]\n", + "1 The Code Factor [5/21/2019]\n", + "2 TECHFEST MUNICH [9/6/2019]\n", + "3 Galileo App Competition [1/31/2019]" + ] + }, + "execution_count": 17, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url ='https://hackevents.co/hackathons'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#your code" + "import re\n", + "\n", + "url ='https://hackevents.co/hackathons'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html5lib')\n", + "\n", + "hacks_titles = soup_html.find_all('h5',{'class':'card-title'})\n", + "hacks_fechas = soup_html.find_all('p',{'class':'card-text'})\n", + "\n", + "hacks_list = [[j.text,re.findall(r'\\d+/\\d+/\\d+',hacks_fechas[i].text)] for i,j in enumerate(hacks_titles)]\n", + "#hacks_list\n", + "\n", + "df = pd.DataFrame(hacks_list)\n", + "df" ] }, { @@ -342,22 +5212,47 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 26, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdin", + "output_type": "stream", + "text": [ + "Ingresa tu usuario de twitter: paolalean\n" + ] + } + ], "source": [ "# This is the url you will scrape in this exercise \n", "# You will need to add the account credentials to this url\n", - "url = 'https://twitter.com/'" + "usuario = input('Ingresa tu usuario de twitter: ')\n", + "url = f'https://twitter.com/{usuario}'\n", + "#para prueba de cuenta sin tweets usar la de victor: vik54076455" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 30, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "307\n" + ] + } + ], "source": [ - "#your code" + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')\n", + "tweets = soup_html.find_all('span',{'class':'ProfileNav-value'})\n", + "\n", + "try:\n", + " print(int(tweets[0].text))\n", + "except:\n", + " print(\"no tienes tweets\")\n" ] }, { @@ -377,22 +5272,38 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 34, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdin", + "output_type": "stream", + "text": [ + "Ingresa tu usuario de twitter: paolalean\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Tienes la increíble cantidad de 27 followers\n" + ] + } + ], "source": [ "# This is the url you will scrape in this exercise \n", "# You will need to add the account credentials to this url\n", - "url = 'https://twitter.com/'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#your code" + "usuario = input('Ingresa tu usuario de twitter: ')\n", + "url = f'https://twitter.com/{usuario}'\n", + "\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')\n", + "tweets = soup_html.find_all('span',{'class':'ProfileNav-value'})\n", + "\n", + "try:\n", + " print(f\"Tienes la increíble cantidad de {int(tweets[1].text)} followers\")\n", + "except:\n", + " print(\"Sin followers\")" ] }, { @@ -404,12 +5315,42 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 48, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "[['The Free Encyclopedia', '5892000'],\n", + " ['English', '1159000'],\n", + " ['日本語', '1532000'],\n", + " ['Español', '2323000'],\n", + " ['Deutsch', '1556000'],\n", + " ['Русский', '2123000'],\n", + " ['Français', '1541000'],\n", + " ['Italiano', '1065000'],\n", + " ['中文', '1010000'],\n", + " ['Português', '1346000'],\n", + " ['Polski', '1000000'],\n", + " ['Wikipedia apps are now available:', '100000']]" + ] + }, + "execution_count": 48, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'https://www.wikipedia.org/'" + "url = 'https://www.wikipedia.org/'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')\n", + "\n", + "language = soup_html.find_all('strong')\n", + "number = soup_html.find_all('bdi')\n", + "\n", + "lista = [[j.text,''.join(re.findall('\\d+', number[i].text))] for i,j in enumerate(language)]\n", + "lista" ] }, { @@ -430,21 +5371,40 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 52, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "['Business and economy',\n", + " 'Crime and justice',\n", + " 'Defence',\n", + " 'Education',\n", + " 'Environment',\n", + " 'Government',\n", + " 'Government spending',\n", + " 'Health',\n", + " 'Mapping',\n", + " 'Society',\n", + " 'Towns and cities',\n", + " 'Transport']" + ] + }, + "execution_count": 52, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'https://data.gov.uk/'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#your code " + "url = 'https://data.gov.uk/'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')\n", + "\n", + "datasets = soup_html.find_all('h2')\n", + "datas = [d.text for d in datasets]\n", + "datas" ] }, { @@ -456,12 +5416,135 @@ }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], + "execution_count": 57, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
RankLanguageSpeakers(millions)
0Chinese (macrolanguage)1311.0
11Mandarin918.0
22Spanish460.0
33English379.0
44Hindi341.0
5Arabic (macrolanguage)319.0
65Bengali228.0
76Portuguese221.0
87Russian154.0
98Japanese128.0
10Lahnda (macrolanguage)119.0
\n", + "
" + ], + "text/plain": [ + " Rank Language Speakers(millions)\n", + "0 — Chinese (macrolanguage) 1311.0\n", + "1 1 Mandarin 918.0\n", + "2 2 Spanish 460.0\n", + "3 3 English 379.0\n", + "4 4 Hindi 341.0\n", + "5 — Arabic (macrolanguage) 319.0\n", + "6 5 Bengali 228.0\n", + "7 6 Portuguese 221.0\n", + "8 7 Russian 154.0\n", + "9 8 Japanese 128.0\n", + "10 — Lahnda (macrolanguage) 119.0" + ] + }, + "execution_count": 57, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'https://en.wikipedia.org/wiki/List_of_languages_by_number_of_native_speakers'" + "url = 'https://en.wikipedia.org/wiki/List_of_languages_by_number_of_native_speakers'\n", + "html = requests.get(url).content\n", + "\n", + "df_read_tables = pd.read_html(html)\n", + "df_read_tables[0][['Rank','Language','Speakers(millions)']].head(11)\n" ] }, { @@ -608,5 +5691,5 @@ } }, "nbformat": 4, - "nbformat_minor": 2 + "nbformat_minor": 4 } diff --git a/your-code/main.ipynb b/your-code/main.ipynb index 812f7a4..5a88557 100644 --- a/your-code/main.ipynb +++ b/your-code/main.ipynb @@ -40,9 +40,32 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 1, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Requirement already satisfied: bs4 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (0.0.1)\n", + "Requirement already satisfied: requests in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (2.22.0)\n", + "Requirement already satisfied: pandas in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (0.24.2)\n", + "Requirement already satisfied: html5lib in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (1.0.1)\n", + "Requirement already satisfied: lxml in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (4.3.4)\n", + "Requirement already satisfied: beautifulsoup4 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from bs4) (4.7.1)\n", + "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from requests) (1.25.3)\n", + "Requirement already satisfied: certifi>=2017.4.17 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from requests) (2019.6.16)\n", + "Requirement already satisfied: idna<2.9,>=2.5 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from requests) (2.8)\n", + "Requirement already satisfied: chardet<3.1.0,>=3.0.2 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from requests) (3.0.4)\n", + "Requirement already satisfied: numpy>=1.12.0 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from pandas) (1.16.4)\n", + "Requirement already satisfied: pytz>=2011k in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from pandas) (2019.1)\n", + "Requirement already satisfied: python-dateutil>=2.5.0 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from pandas) (2.8.0)\n", + "Requirement already satisfied: webencodings in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from html5lib) (0.5.1)\n", + "Requirement already satisfied: six>=1.9 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from html5lib) (1.12.0)\n", + "Requirement already satisfied: soupsieve>=1.2 in c:\\users\\paola\\appdata\\local\\programs\\python\\python37\\lib\\site-packages (from beautifulsoup4->bs4) (1.9.2)\n" + ] + } + ], "source": [ "import requests\n", "from bs4 import BeautifulSoup\n", @@ -52,9 +75,11 @@ "# from lxml.html import fromstring\n", "# import urllib.request\n", "# from urllib.request import urlopen\n", - "# import random\n", + "import random\n", "# import re\n", - "# import scrapy" + "#import scrapy\n", + "import sys\n", + "!{sys.executable} -m pip install bs4 requests pandas html5lib lxml" ] }, { @@ -66,12 +91,3793 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'https://github.com/trending/developers'" + "url = 'https://github.com/trending/developers'\n", + "html = requests.get(url).content" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "Trending developers on GitHub today · GitHub\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
\n", + "Skip to content\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "\n", + " Sign up\n", + " \n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "

Trending

\n", + "

\n", + " These are the\n", + " developers\n", + " building the hot tools today.\n", + "

\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " Language:\n", + "\n", + " \n", + "\n", + " Any\n", + " \n", + "\n", + "\n", + "\n", + "
\n", + "Select a language\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "C++\n", + "\n", + "\n", + "\n", + "HTML\n", + "\n", + "\n", + "\n", + "Java\n", + "\n", + "\n", + "\n", + "JavaScript\n", + "\n", + "\n", + "\n", + "PHP\n", + "\n", + "\n", + "\n", + "Python\n", + "\n", + "\n", + "\n", + "Ruby\n", + "\n", + "\n", + "\n", + "Unknown languages\n", + "\n", + "\n", + "\n", + "1C Enterprise\n", + "\n", + "\n", + "\n", + "ABAP\n", + "\n", + "\n", + "\n", + "ABNF\n", + "\n", + "\n", + "\n", + "ActionScript\n", + "\n", + "\n", + "\n", + "Ada\n", + "\n", + "\n", + "\n", + "Adobe Font Metrics\n", + "\n", + "\n", + "\n", + "Agda\n", + "\n", + "\n", + "\n", + "AGS Script\n", + "\n", + "\n", + "\n", + "Alloy\n", + "\n", + "\n", + "\n", + "Alpine Abuild\n", + "\n", + "\n", + "\n", + "Altium Designer\n", + "\n", + "\n", + "\n", + "AMPL\n", + "\n", + "\n", + "\n", + "AngelScript\n", + "\n", + "\n", + "\n", + "Ant Build System\n", + "\n", + "\n", + "\n", + "ANTLR\n", + "\n", + "\n", + "\n", + "ApacheConf\n", + "\n", + "\n", + "\n", + "Apex\n", + "\n", + "\n", + "\n", + "API Blueprint\n", + "\n", + "\n", + "\n", + "APL\n", + "\n", + "\n", + "\n", + "Apollo Guidance Computer\n", + "\n", + "\n", + "\n", + "AppleScript\n", + "\n", + "\n", + "\n", + "Arc\n", + "\n", + "\n", + "\n", + "AsciiDoc\n", + "\n", + "\n", + "\n", + "ASN.1\n", + "\n", + "\n", + "\n", + "ASP\n", + "\n", + "\n", + "\n", + "AspectJ\n", + "\n", + "\n", + "\n", + "Assembly\n", + "\n", + "\n", + "\n", + "Asymptote\n", + "\n", + "\n", + "\n", + "ATS\n", + "\n", + "\n", + "\n", + "Augeas\n", + "\n", + "\n", + "\n", + "AutoHotkey\n", + "\n", + "\n", + "\n", + "AutoIt\n", + "\n", + "\n", + "\n", + "Awk\n", + "\n", + "\n", + "\n", + "Ballerina\n", + "\n", + "\n", + "\n", + "Batchfile\n", + "\n", + "\n", + "\n", + "Befunge\n", + "\n", + "\n", + "\n", + "Bison\n", + "\n", + "\n", + "\n", + "BitBake\n", + "\n", + "\n", + "\n", + "Blade\n", + "\n", + "\n", + "\n", + "BlitzBasic\n", + "\n", + "\n", + "\n", + "BlitzMax\n", + "\n", + "\n", + "\n", + "Bluespec\n", + "\n", + "\n", + "\n", + "Boo\n", + "\n", + "\n", + "\n", + "Brainfuck\n", + "\n", + "\n", + "\n", + "Brightscript\n", + "\n", + "\n", + "\n", + "Zeek\n", + "\n", + "\n", + "\n", + "C\n", + "\n", + "\n", + "\n", + "C#\n", + "\n", + "\n", + "\n", + "C++\n", + "\n", + "\n", + "\n", + "C-ObjDump\n", + "\n", + "\n", + "\n", + "C2hs Haskell\n", + "\n", + "\n", + "\n", + "Cabal Config\n", + "\n", + "\n", + "\n", + "Cap'n Proto\n", + "\n", + "\n", + "\n", + "CartoCSS\n", + "\n", + "\n", + "\n", + "Ceylon\n", + "\n", + "\n", + "\n", + "Chapel\n", + "\n", + "\n", + "\n", + "Charity\n", + "\n", + "\n", + "\n", + "ChucK\n", + "\n", + "\n", + "\n", + "Cirru\n", + "\n", + "\n", + "\n", + "Clarion\n", + "\n", + "\n", + "\n", + "Clean\n", + "\n", + "\n", + "\n", + "Click\n", + "\n", + "\n", + "\n", + "CLIPS\n", + "\n", + "\n", + "\n", + "Clojure\n", + "\n", + "\n", + "\n", + "Closure Templates\n", + "\n", + "\n", + "\n", + "Cloud Firestore Security Rules\n", + "\n", + "\n", + "\n", + "CMake\n", + "\n", + "\n", + "\n", + "COBOL\n", + "\n", + "\n", + "\n", + "CoffeeScript\n", + "\n", + "\n", + "\n", + "ColdFusion\n", + "\n", + "\n", + "\n", + "ColdFusion CFC\n", + "\n", + "\n", + "\n", + "COLLADA\n", + "\n", + "\n", + "\n", + "Common Lisp\n", + "\n", + "\n", + "\n", + "Common Workflow Language\n", + "\n", + "\n", + "\n", + "Component Pascal\n", + "\n", + "\n", + "\n", + "CoNLL-U\n", + "\n", + "\n", + "\n", + "Cool\n", + "\n", + "\n", + "\n", + "Coq\n", + "\n", + "\n", + "\n", + "Cpp-ObjDump\n", + "\n", + "\n", + "\n", + "Creole\n", + "\n", + "\n", + "\n", + "Crystal\n", + "\n", + "\n", + "\n", + "CSON\n", + "\n", + "\n", + "\n", + "Csound\n", + "\n", + "\n", + "\n", + "Csound Document\n", + "\n", + "\n", + "\n", + "Csound Score\n", + "\n", + "\n", + "\n", + "CSS\n", + "\n", + "\n", + "\n", + "CSV\n", + "\n", + "\n", + "\n", + "Cuda\n", + "\n", + "\n", + "\n", + "CWeb\n", + "\n", + "\n", + "\n", + "Cycript\n", + "\n", + "\n", + "\n", + "Cython\n", + "\n", + "\n", + "\n", + "D\n", + "\n", + "\n", + "\n", + "D-ObjDump\n", + "\n", + "\n", + "\n", + "Darcs Patch\n", + "\n", + "\n", + "\n", + "Dart\n", + "\n", + "\n", + "\n", + "DataWeave\n", + "\n", + "\n", + "\n", + "desktop\n", + "\n", + "\n", + "\n", + "Dhall\n", + "\n", + "\n", + "\n", + "Diff\n", + "\n", + "\n", + "\n", + "DIGITAL Command Language\n", + "\n", + "\n", + "\n", + "DM\n", + "\n", + "\n", + "\n", + "DNS Zone\n", + "\n", + "\n", + "\n", + "Dockerfile\n", + "\n", + "\n", + "\n", + "Dogescript\n", + "\n", + "\n", + "\n", + "DTrace\n", + "\n", + "\n", + "\n", + "Dylan\n", + "\n", + "\n", + "\n", + "E\n", + "\n", + "\n", + "\n", + "Eagle\n", + "\n", + "\n", + "\n", + "Easybuild\n", + "\n", + "\n", + "\n", + "EBNF\n", + "\n", + "\n", + "\n", + "eC\n", + "\n", + "\n", + "\n", + "Ecere Projects\n", + "\n", + "\n", + "\n", + "ECL\n", + "\n", + "\n", + "\n", + "ECLiPSe\n", + "\n", + "\n", + "\n", + "Edje Data Collection\n", + "\n", + "\n", + "\n", + "edn\n", + "\n", + "\n", + "\n", + "Eiffel\n", + "\n", + "\n", + "\n", + "EJS\n", + "\n", + "\n", + "\n", + "Elixir\n", + "\n", + "\n", + "\n", + "Elm\n", + "\n", + "\n", + "\n", + "Emacs Lisp\n", + "\n", + "\n", + "\n", + "EmberScript\n", + "\n", + "\n", + "\n", + "EML\n", + "\n", + "\n", + "\n", + "EQ\n", + "\n", + "\n", + "\n", + "Erlang\n", + "\n", + "\n", + "\n", + "F#\n", + "\n", + "\n", + "\n", + "F*\n", + "\n", + "\n", + "\n", + "Factor\n", + "\n", + "\n", + "\n", + "Fancy\n", + "\n", + "\n", + "\n", + "Fantom\n", + "\n", + "\n", + "\n", + "FIGlet Font\n", + "\n", + "\n", + "\n", + "Filebench WML\n", + "\n", + "\n", + "\n", + "Filterscript\n", + "\n", + "\n", + "\n", + "fish\n", + "\n", + "\n", + "\n", + "FLUX\n", + "\n", + "\n", + "\n", + "Formatted\n", + "\n", + "\n", + "\n", + "Forth\n", + "\n", + "\n", + "\n", + "Fortran\n", + "\n", + "\n", + "\n", + "FreeMarker\n", + "\n", + "\n", + "\n", + "Frege\n", + "\n", + "\n", + "\n", + "G-code\n", + "\n", + "\n", + "\n", + "Game Maker Language\n", + "\n", + "\n", + "\n", + "GAMS\n", + "\n", + "\n", + "\n", + "GAP\n", + "\n", + "\n", + "\n", + "GCC Machine Description\n", + "\n", + "\n", + "\n", + "GDB\n", + "\n", + "\n", + "\n", + "GDScript\n", + "\n", + "\n", + "\n", + "Genie\n", + "\n", + "\n", + "\n", + "Genshi\n", + "\n", + "\n", + "\n", + "Gentoo Ebuild\n", + "\n", + "\n", + "\n", + "Gentoo Eclass\n", + "\n", + "\n", + "\n", + "Gerber Image\n", + "\n", + "\n", + "\n", + "Gettext Catalog\n", + "\n", + "\n", + "\n", + "Gherkin\n", + "\n", + "\n", + "\n", + "Git Attributes\n", + "\n", + "\n", + "\n", + "Git Config\n", + "\n", + "\n", + "\n", + "GLSL\n", + "\n", + "\n", + "\n", + "Glyph\n", + "\n", + "\n", + "\n", + "Glyph Bitmap Distribution Format\n", + "\n", + "\n", + "\n", + "GN\n", + "\n", + "\n", + "\n", + "Gnuplot\n", + "\n", + "\n", + "\n", + "Go\n", + "\n", + "\n", + "\n", + "Golo\n", + "\n", + "\n", + "\n", + "Gosu\n", + "\n", + "\n", + "\n", + "Grace\n", + "\n", + "\n", + "\n", + "Gradle\n", + "\n", + "\n", + "\n", + "Grammatical Framework\n", + "\n", + "\n", + "\n", + "Graph Modeling Language\n", + "\n", + "\n", + "\n", + "GraphQL\n", + "\n", + "\n", + "\n", + "Graphviz (DOT)\n", + "\n", + "\n", + "\n", + "Groovy\n", + "\n", + "\n", + "\n", + "Groovy Server Pages\n", + "\n", + "\n", + "\n", + "Hack\n", + "\n", + "\n", + "\n", + "Haml\n", + "\n", + "\n", + "\n", + "Handlebars\n", + "\n", + "\n", + "\n", + "HAProxy\n", + "\n", + "\n", + "\n", + "Harbour\n", + "\n", + "\n", + "\n", + "Haskell\n", + "\n", + "\n", + "\n", + "Haxe\n", + "\n", + "\n", + "\n", + "HCL\n", + "\n", + "\n", + "\n", + "HiveQL\n", + "\n", + "\n", + "\n", + "HLSL\n", + "\n", + "\n", + "\n", + "HolyC\n", + "\n", + "\n", + "\n", + "HTML\n", + "\n", + "\n", + "\n", + "HTML+Django\n", + "\n", + "\n", + "\n", + "HTML+ECR\n", + "\n", + "\n", + "\n", + "HTML+EEX\n", + "\n", + "\n", + "\n", + "HTML+ERB\n", + "\n", + "\n", + "\n", + "HTML+PHP\n", + "\n", + "\n", + "\n", + "HTML+Razor\n", + "\n", + "\n", + "\n", + "HTTP\n", + "\n", + "\n", + "\n", + "HXML\n", + "\n", + "\n", + "\n", + "Hy\n", + "\n", + "\n", + "\n", + "HyPhy\n", + "\n", + "\n", + "\n", + "IDL\n", + "\n", + "\n", + "\n", + "Idris\n", + "\n", + "\n", + "\n", + "IGOR Pro\n", + "\n", + "\n", + "\n", + "Inform 7\n", + "\n", + "\n", + "\n", + "INI\n", + "\n", + "\n", + "\n", + "Inno Setup\n", + "\n", + "\n", + "\n", + "Io\n", + "\n", + "\n", + "\n", + "Ioke\n", + "\n", + "\n", + "\n", + "IRC log\n", + "\n", + "\n", + "\n", + "Isabelle\n", + "\n", + "\n", + "\n", + "Isabelle ROOT\n", + "\n", + "\n", + "\n", + "J\n", + "\n", + "\n", + "\n", + "Jasmin\n", + "\n", + "\n", + "\n", + "Java\n", + "\n", + "\n", + "\n", + "Java Properties\n", + "\n", + "\n", + "\n", + "Java Server Pages\n", + "\n", + "\n", + "\n", + "JavaScript\n", + "\n", + "\n", + "\n", + "JavaScript+ERB\n", + "\n", + "\n", + "\n", + "JFlex\n", + "\n", + "\n", + "\n", + "Jison\n", + "\n", + "\n", + "\n", + "Jison Lex\n", + "\n", + "\n", + "\n", + "Jolie\n", + "\n", + "\n", + "\n", + "JSON\n", + "\n", + "\n", + "\n", + "JSON with Comments\n", + "\n", + "\n", + "\n", + "JSON5\n", + "\n", + "\n", + "\n", + "JSONiq\n", + "\n", + "\n", + "\n", + "JSONLD\n", + "\n", + "\n", + "\n", + "Jsonnet\n", + "\n", + "\n", + "\n", + "JSX\n", + "\n", + "\n", + "\n", + "Julia\n", + "\n", + "\n", + "\n", + "Jupyter Notebook\n", + "\n", + "\n", + "\n", + "KiCad Layout\n", + "\n", + "\n", + "\n", + "KiCad Legacy Layout\n", + "\n", + "\n", + "\n", + "KiCad Schematic\n", + "\n", + "\n", + "\n", + "Kit\n", + "\n", + "\n", + "\n", + "Kotlin\n", + "\n", + "\n", + "\n", + "KRL\n", + "\n", + "\n", + "\n", + "LabVIEW\n", + "\n", + "\n", + "\n", + "Lasso\n", + "\n", + "\n", + "\n", + "Latte\n", + "\n", + "\n", + "\n", + "Lean\n", + "\n", + "\n", + "\n", + "Less\n", + "\n", + "\n", + "\n", + "Lex\n", + "\n", + "\n", + "\n", + "LFE\n", + "\n", + "\n", + "\n", + "LilyPond\n", + "\n", + "\n", + "\n", + "Limbo\n", + "\n", + "\n", + "\n", + "Linker Script\n", + "\n", + "\n", + "\n", + "Linux Kernel Module\n", + "\n", + "\n", + "\n", + "Liquid\n", + "\n", + "\n", + "\n", + "Literate Agda\n", + "\n", + "\n", + "\n", + "Literate CoffeeScript\n", + "\n", + "\n", + "\n", + "Literate Haskell\n", + "\n", + "\n", + "\n", + "LiveScript\n", + "\n", + "\n", + "\n", + "LLVM\n", + "\n", + "\n", + "\n", + "Logos\n", + "\n", + "\n", + "\n", + "Logtalk\n", + "\n", + "\n", + "\n", + "LOLCODE\n", + "\n", + "\n", + "\n", + "LookML\n", + "\n", + "\n", + "\n", + "LoomScript\n", + "\n", + "\n", + "\n", + "LSL\n", + "\n", + "\n", + "\n", + "Lua\n", + "\n", + "\n", + "\n", + "M\n", + "\n", + "\n", + "\n", + "M4\n", + "\n", + "\n", + "\n", + "M4Sugar\n", + "\n", + "\n", + "\n", + "Makefile\n", + "\n", + "\n", + "\n", + "Mako\n", + "\n", + "\n", + "\n", + "Markdown\n", + "\n", + "\n", + "\n", + "Marko\n", + "\n", + "\n", + "\n", + "Mask\n", + "\n", + "\n", + "\n", + "Mathematica\n", + "\n", + "\n", + "\n", + "MATLAB\n", + "\n", + "\n", + "\n", + "Maven POM\n", + "\n", + "\n", + "\n", + "Max\n", + "\n", + "\n", + "\n", + "MAXScript\n", + "\n", + "\n", + "\n", + "mcfunction\n", + "\n", + "\n", + "\n", + "MediaWiki\n", + "\n", + "\n", + "\n", + "Mercury\n", + "\n", + "\n", + "\n", + "Meson\n", + "\n", + "\n", + "\n", + "Metal\n", + "\n", + "\n", + "\n", + "MiniD\n", + "\n", + "\n", + "\n", + "Mirah\n", + "\n", + "\n", + "\n", + "Modelica\n", + "\n", + "\n", + "\n", + "Modula-2\n", + "\n", + "\n", + "\n", + "Modula-3\n", + "\n", + "\n", + "\n", + "Module Management System\n", + "\n", + "\n", + "\n", + "Monkey\n", + "\n", + "\n", + "\n", + "Moocode\n", + "\n", + "\n", + "\n", + "MoonScript\n", + "\n", + "\n", + "\n", + "Motorola 68K Assembly\n", + "\n", + "\n", + "\n", + "MQL4\n", + "\n", + "\n", + "\n", + "MQL5\n", + "\n", + "\n", + "\n", + "MTML\n", + "\n", + "\n", + "\n", + "MUF\n", + "\n", + "\n", + "\n", + "mupad\n", + "\n", + "\n", + "\n", + "Myghty\n", + "\n", + "\n", + "\n", + "nanorc\n", + "\n", + "\n", + "\n", + "NCL\n", + "\n", + "\n", + "\n", + "Nearley\n", + "\n", + "\n", + "\n", + "Nemerle\n", + "\n", + "\n", + "\n", + "nesC\n", + "\n", + "\n", + "\n", + "NetLinx\n", + "\n", + "\n", + "\n", + "NetLinx+ERB\n", + "\n", + "\n", + "\n", + "NetLogo\n", + "\n", + "\n", + "\n", + "NewLisp\n", + "\n", + "\n", + "\n", + "Nextflow\n", + "\n", + "\n", + "\n", + "Nginx\n", + "\n", + "\n", + "\n", + "Nim\n", + "\n", + "\n", + "\n", + "Ninja\n", + "\n", + "\n", + "\n", + "Nit\n", + "\n", + "\n", + "\n", + "Nix\n", + "\n", + "\n", + "\n", + "NL\n", + "\n", + "\n", + "\n", + "NSIS\n", + "\n", + "\n", + "\n", + "Nu\n", + "\n", + "\n", + "\n", + "NumPy\n", + "\n", + "\n", + "\n", + "ObjDump\n", + "\n", + "\n", + "\n", + "Objective-C\n", + "\n", + "\n", + "\n", + "Objective-C++\n", + "\n", + "\n", + "\n", + "Objective-J\n", + "\n", + "\n", + "\n", + "ObjectScript\n", + "\n", + "\n", + "\n", + "OCaml\n", + "\n", + "\n", + "\n", + "Omgrofl\n", + "\n", + "\n", + "\n", + "ooc\n", + "\n", + "\n", + "\n", + "Opa\n", + "\n", + "\n", + "\n", + "Opal\n", + "\n", + "\n", + "\n", + "OpenCL\n", + "\n", + "\n", + "\n", + "OpenEdge ABL\n", + "\n", + "\n", + "\n", + "OpenRC runscript\n", + "\n", + "\n", + "\n", + "OpenSCAD\n", + "\n", + "\n", + "\n", + "OpenType Feature File\n", + "\n", + "\n", + "\n", + "Org\n", + "\n", + "\n", + "\n", + "Ox\n", + "\n", + "\n", + "\n", + "Oxygene\n", + "\n", + "\n", + "\n", + "Oz\n", + "\n", + "\n", + "\n", + "P4\n", + "\n", + "\n", + "\n", + "Pan\n", + "\n", + "\n", + "\n", + "Papyrus\n", + "\n", + "\n", + "\n", + "Parrot\n", + "\n", + "\n", + "\n", + "Parrot Assembly\n", + "\n", + "\n", + "\n", + "Parrot Internal Representation\n", + "\n", + "\n", + "\n", + "Pascal\n", + "\n", + "\n", + "\n", + "Pawn\n", + "\n", + "\n", + "\n", + "Pep8\n", + "\n", + "\n", + "\n", + "Perl\n", + "\n", + "\n", + "\n", + "Perl 6\n", + "\n", + "\n", + "\n", + "PHP\n", + "\n", + "\n", + "\n", + "Pic\n", + "\n", + "\n", + "\n", + "Pickle\n", + "\n", + "\n", + "\n", + "PicoLisp\n", + "\n", + "\n", + "\n", + "PigLatin\n", + "\n", + "\n", + "\n", + "Pike\n", + "\n", + "\n", + "\n", + "PLpgSQL\n", + "\n", + "\n", + "\n", + "PLSQL\n", + "\n", + "\n", + "\n", + "Pod\n", + "\n", + "\n", + "\n", + "Pod 6\n", + "\n", + "\n", + "\n", + "PogoScript\n", + "\n", + "\n", + "\n", + "Pony\n", + "\n", + "\n", + "\n", + "PostCSS\n", + "\n", + "\n", + "\n", + "PostScript\n", + "\n", + "\n", + "\n", + "POV-Ray SDL\n", + "\n", + "\n", + "\n", + "PowerBuilder\n", + "\n", + "\n", + "\n", + "PowerShell\n", + "\n", + "\n", + "\n", + "Processing\n", + "\n", + "\n", + "\n", + "Prolog\n", + "\n", + "\n", + "\n", + "Propeller Spin\n", + "\n", + "\n", + "\n", + "Protocol Buffer\n", + "\n", + "\n", + "\n", + "Public Key\n", + "\n", + "\n", + "\n", + "Pug\n", + "\n", + "\n", + "\n", + "Puppet\n", + "\n", + "\n", + "\n", + "Pure Data\n", + "\n", + "\n", + "\n", + "PureBasic\n", + "\n", + "\n", + "\n", + "PureScript\n", + "\n", + "\n", + "\n", + "Python\n", + "\n", + "\n", + "\n", + "Python console\n", + "\n", + "\n", + "\n", + "Python traceback\n", + "\n", + "\n", + "\n", + "q\n", + "\n", + "\n", + "\n", + "QMake\n", + "\n", + "\n", + "\n", + "QML\n", + "\n", + "\n", + "\n", + "Quake\n", + "\n", + "\n", + "\n", + "R\n", + "\n", + "\n", + "\n", + "Racket\n", + "\n", + "\n", + "\n", + "Ragel\n", + "\n", + "\n", + "\n", + "RAML\n", + "\n", + "\n", + "\n", + "Rascal\n", + "\n", + "\n", + "\n", + "Raw token data\n", + "\n", + "\n", + "\n", + "RDoc\n", + "\n", + "\n", + "\n", + "REALbasic\n", + "\n", + "\n", + "\n", + "Reason\n", + "\n", + "\n", + "\n", + "Rebol\n", + "\n", + "\n", + "\n", + "Red\n", + "\n", + "\n", + "\n", + "Redcode\n", + "\n", + "\n", + "\n", + "Regular Expression\n", + "\n", + "\n", + "\n", + "Ren'Py\n", + "\n", + "\n", + "\n", + "RenderScript\n", + "\n", + "\n", + "\n", + "reStructuredText\n", + "\n", + "\n", + "\n", + "REXX\n", + "\n", + "\n", + "\n", + "RHTML\n", + "\n", + "\n", + "\n", + "Rich Text Format\n", + "\n", + "\n", + "\n", + "Ring\n", + "\n", + "\n", + "\n", + "RMarkdown\n", + "\n", + "\n", + "\n", + "RobotFramework\n", + "\n", + "\n", + "\n", + "Roff\n", + "\n", + "\n", + "\n", + "Roff Manpage\n", + "\n", + "\n", + "\n", + "Rouge\n", + "\n", + "\n", + "\n", + "RPC\n", + "\n", + "\n", + "\n", + "RPM Spec\n", + "\n", + "\n", + "\n", + "Ruby\n", + "\n", + "\n", + "\n", + "RUNOFF\n", + "\n", + "\n", + "\n", + "Rust\n", + "\n", + "\n", + "\n", + "Sage\n", + "\n", + "\n", + "\n", + "SaltStack\n", + "\n", + "\n", + "\n", + "SAS\n", + "\n", + "\n", + "\n", + "Sass\n", + "\n", + "\n", + "\n", + "Scala\n", + "\n", + "\n", + "\n", + "Scaml\n", + "\n", + "\n", + "\n", + "Scheme\n", + "\n", + "\n", + "\n", + "Scilab\n", + "\n", + "\n", + "\n", + "SCSS\n", + "\n", + "\n", + "\n", + "sed\n", + "\n", + "\n", + "\n", + "Self\n", + "\n", + "\n", + "\n", + "ShaderLab\n", + "\n", + "\n", + "\n", + "Shell\n", + "\n", + "\n", + "\n", + "ShellSession\n", + "\n", + "\n", + "\n", + "Shen\n", + "\n", + "\n", + "\n", + "Slash\n", + "\n", + "\n", + "\n", + "Slice\n", + "\n", + "\n", + "\n", + "Slim\n", + "\n", + "\n", + "\n", + "Smali\n", + "\n", + "\n", + "\n", + "Smalltalk\n", + "\n", + "\n", + "\n", + "Smarty\n", + "\n", + "\n", + "\n", + "SMT\n", + "\n", + "\n", + "\n", + "Solidity\n", + "\n", + "\n", + "\n", + "SourcePawn\n", + "\n", + "\n", + "\n", + "SPARQL\n", + "\n", + "\n", + "\n", + "Spline Font Database\n", + "\n", + "\n", + "\n", + "SQF\n", + "\n", + "\n", + "\n", + "SQL\n", + "\n", + "\n", + "\n", + "SQLPL\n", + "\n", + "\n", + "\n", + "Squirrel\n", + "\n", + "\n", + "\n", + "SRecode Template\n", + "\n", + "\n", + "\n", + "SSH Config\n", + "\n", + "\n", + "\n", + "Stan\n", + "\n", + "\n", + "\n", + "Standard ML\n", + "\n", + "\n", + "\n", + "Stata\n", + "\n", + "\n", + "\n", + "STON\n", + "\n", + "\n", + "\n", + "Stylus\n", + "\n", + "\n", + "\n", + "SubRip Text\n", + "\n", + "\n", + "\n", + "SugarSS\n", + "\n", + "\n", + "\n", + "SuperCollider\n", + "\n", + "\n", + "\n", + "SVG\n", + "\n", + "\n", + "\n", + "Swift\n", + "\n", + "\n", + "\n", + "SystemVerilog\n", + "\n", + "\n", + "\n", + "Tcl\n", + "\n", + "\n", + "\n", + "Tcsh\n", + "\n", + "\n", + "\n", + "Tea\n", + "\n", + "\n", + "\n", + "Terra\n", + "\n", + "\n", + "\n", + "TeX\n", + "\n", + "\n", + "\n", + "Text\n", + "\n", + "\n", + "\n", + "Textile\n", + "\n", + "\n", + "\n", + "Thrift\n", + "\n", + "\n", + "\n", + "TI Program\n", + "\n", + "\n", + "\n", + "TLA\n", + "\n", + "\n", + "\n", + "TOML\n", + "\n", + "\n", + "\n", + "TSQL\n", + "\n", + "\n", + "\n", + "TSX\n", + "\n", + "\n", + "\n", + "Turing\n", + "\n", + "\n", + "\n", + "Turtle\n", + "\n", + "\n", + "\n", + "Twig\n", + "\n", + "\n", + "\n", + "TXL\n", + "\n", + "\n", + "\n", + "Type Language\n", + "\n", + "\n", + "\n", + "TypeScript\n", + "\n", + "\n", + "\n", + "Unified Parallel C\n", + "\n", + "\n", + "\n", + "Unity3D Asset\n", + "\n", + "\n", + "\n", + "Unix Assembly\n", + "\n", + "\n", + "\n", + "Uno\n", + "\n", + "\n", + "\n", + "UnrealScript\n", + "\n", + "\n", + "\n", + "UrWeb\n", + "\n", + "\n", + "\n", + "Vala\n", + "\n", + "\n", + "\n", + "VCL\n", + "\n", + "\n", + "\n", + "Verilog\n", + "\n", + "\n", + "\n", + "VHDL\n", + "\n", + "\n", + "\n", + "Vim script\n", + "\n", + "\n", + "\n", + "Visual Basic\n", + "\n", + "\n", + "\n", + "Volt\n", + "\n", + "\n", + "\n", + "Vue\n", + "\n", + "\n", + "\n", + "Wavefront Material\n", + "\n", + "\n", + "\n", + "Wavefront Object\n", + "\n", + "\n", + "\n", + "wdl\n", + "\n", + "\n", + "\n", + "Web Ontology Language\n", + "\n", + "\n", + "\n", + "WebAssembly\n", + "\n", + "\n", + "\n", + "WebIDL\n", + "\n", + "\n", + "\n", + "WebVTT\n", + "\n", + "\n", + "\n", + "Windows Registry Entries\n", + "\n", + "\n", + "\n", + "wisp\n", + "\n", + "\n", + "\n", + "Wollok\n", + "\n", + "\n", + "\n", + "World of Warcraft Addon Data\n", + "\n", + "\n", + "\n", + "X BitMap\n", + "\n", + "\n", + "\n", + "X Font Directory Index\n", + "\n", + "\n", + "\n", + "X PixMap\n", + "\n", + "\n", + "\n", + "X10\n", + "\n", + "\n", + "\n", + "xBase\n", + "\n", + "\n", + "\n", + "XC\n", + "\n", + "\n", + "\n", + "XCompose\n", + "\n", + "\n", + "\n", + "XML\n", + "\n", + "\n", + "\n", + "Xojo\n", + "\n", + "\n", + "\n", + "XPages\n", + "\n", + "\n", + "\n", + "XProc\n", + "\n", + "\n", + "\n", + "XQuery\n", + "\n", + "\n", + "\n", + "XS\n", + "\n", + "\n", + "\n", + "XSLT\n", + "\n", + "\n", + "\n", + "Xtend\n", + "\n", + "\n", + "\n", + "Yacc\n", + "\n", + "\n", + "\n", + "YAML\n", + "\n", + "\n", + "\n", + "YANG\n", + "\n", + "\n", + "\n", + "YARA\n", + "\n", + "\n", + "\n", + "YASnippet\n", + "\n", + "\n", + "\n", + "ZAP\n", + "\n", + "\n", + "\n", + "Zeek\n", + "\n", + "\n", + "\n", + "ZenScript\n", + "\n", + "\n", + "\n", + "Zephir\n", + "\n", + "\n", + "\n", + "Zig\n", + "\n", + "\n", + "\n", + "ZIL\n", + "\n", + "\n", + "\n", + "Zimpl\n", + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " Date range:\n", + " Today\n", + "\n", + "\n", + "
\n", + "Adjust time span\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + " 2\n", + " \n", + "
\n", + "\"@bfred-it\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Federico Brigante

\n", + "

\n", + "bfred-it\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + " 4\n", + " \n", + "
\n", + "\"@olleolleolle\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Olle Jonsson

\n", + "

\n", + "olleolleolle\n", + "

\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
Popular repo
\n", + "

\n", + "\n", + "\n", + "\n", + " wav2c\n", + " \n", + "

\n", + "
\n", + " wav2c makes arrays out of sounds - useful for Arduino SMAPLER v2 (and for GameBoy Advance) etc\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + " 6\n", + " \n", + "
\n", + "\"@fthomas\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Frank S. Thomas

\n", + "

\n", + "fthomas\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 7\n", + " \n", + "
\n", + "\"@syuilo\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

syuilo

\n", + "

\n", + "syuilo\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + " 9\n", + " \n", + "
\n", + "\"@balloob\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Paulus Schoutsen

\n", + "

\n", + "balloob\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 10\n", + " \n", + "
\n", + "\"@sdras\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Sarah Drasner

\n", + "

\n", + "sdras\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 11\n", + " \n", + "
\n", + "\"@skmp\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Stefanos Kornilios Mitsis Poiitidis

\n", + "

\n", + "skmp\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "\n", + "
\n", + "\n", + " 15\n", + " \n", + "
\n", + "\"@mholt\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Matt Holt

\n", + "

\n", + "mholt\n", + "

\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
Popular repo
\n", + "

\n", + "\n", + "\n", + "\n", + " PapaParse\n", + " \n", + "

\n", + "
\n", + " Fast and powerful CSV (delimited text) parser that gracefully handles large files and malformed input\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "
\n", + "\n", + " 18\n", + " \n", + "
\n", + "\"@unixorn\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Joe Block

\n", + "

\n", + "unixorn\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + " 20\n", + " \n", + "
\n", + "\"@randombit\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Jack Lloyd

\n", + "

\n", + "randombit\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 21\n", + " \n", + "
\n", + "\"@rauchg\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Guillermo Rauch

\n", + "

\n", + "rauchg\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 22\n", + " \n", + "
\n", + "\"@tgriesser\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Tim Griesser

\n", + "

\n", + "tgriesser\n", + "

\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
Popular repo
\n", + "

\n", + "\n", + "\n", + "\n", + " knex\n", + " \n", + "

\n", + "
\n", + " A query builder for PostgreSQL, MySQL and SQLite3, designed to be flexible, portable, and fun to use.\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 23\n", + " \n", + "
\n", + "\"@vtjnash\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Jameson Nash

\n", + "

\n", + "vtjnash\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + " 24\n", + " \n", + "
\n", + "\"@andersy005\"\n", + "
\n", + "
\n", + "
\n", + "
\n", + "

Anderson Banihirwe

\n", + "

\n", + "andersy005\n", + "

\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + "Follow\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "
\n", + "\n", + "\n", + " You can’t perform that action at this time.\n", + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "\n", + "" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "#printing the content from the Trending Developers\n", + "soup_html = BeautifulSoup(html,'html')\n", + "soup_html" ] }, { @@ -79,9 +3885,7 @@ "execution_count": null, "metadata": {}, "outputs": [], - "source": [ - "#your code" - ] + "source": [] }, { "cell_type": "markdown", @@ -134,11 +3938,58 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 7, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "['Eric Ma',\n", + " 'Federico Brigante',\n", + " 'Kyle Roach',\n", + " 'Olle Jonsson',\n", + " 'Nikita Sobolev',\n", + " 'Frank S. Thomas',\n", + " 'syuilo',\n", + " 'Ives van Hoorne',\n", + " 'Paulus Schoutsen',\n", + " 'Sarah Drasner',\n", + " 'Stefanos Kornilios Mitsis Poiitidis',\n", + " 'Jan Hovancik',\n", + " 'Andreas Mueller',\n", + " 'Guillaume Gomez',\n", + " 'Matt Holt',\n", + " 'Clifford Wolf',\n", + " 'Franck Nijhof',\n", + " 'Joe Block',\n", + " 'Andrei Neagoie',\n", + " 'Jack Lloyd',\n", + " 'Guillermo Rauch',\n", + " 'Tim Griesser',\n", + " 'Jameson Nash',\n", + " 'Anderson Banihirwe',\n", + " 'Danny Ryan']" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "#your code" + "#To reach the names\n", + "tags = ['h1'] #esto es una lista!\n", + "texto = soup_html.find_all(tags,{'class':'h3 lh-condensed'})\n", + "\n", + "#Método largo\n", + "#names = []\n", + "#for t in texto:\n", + "# names.append(t.text)\n", + "#names \n", + " \n", + "#list comprenhension\n", + "names = [t.text for t in texto]\n", + "names" ] }, { @@ -152,7 +4003,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 8, "metadata": {}, "outputs": [], "source": [ @@ -162,37 +4013,148 @@ }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], + "execution_count": 9, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "b'\\n\\n\\n\\n\\n\\n\\n\\n \\n \\n \\n \\n \\n \\n \\n \\n \\n\\n\\n\\n \\n \\n \\n \\n \\n \\n \\n\\n \\n \\n Trending Python repositories on GitHub today \\xc2\\xb7 GitHub\\n \\n \\n \\n \\n\\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n\\n \\n \\n \\n \\n \\n \\n \\n \\n \\n \\n\\n \\n \\n \\n \\n \\n\\n\\n \\n\\n \\n\\n \\n \\n \\n\\n \\n\\n\\n\\n\\n \\n\\n\\n\\n\\n\\n\\n \\n\\n \\n \\n\\n \\n \\n\\n \\n\\n \\n\\n \\n \\n\\n \\n\\n\\n \\n\\n\\n \\n\\n \\n\\n \\n \\n\\n\\n\\n\\n\\n\\n\\n \\n\\n \\n\\n \\n \\n\\n
\\n Skip to content\\n
\\n\\n \\n \\n \\n\\n\\n
\\n
\\n
\\n \\n \\n \\n\\n
\\n \\n\\n
\\n\\n
\\n \\n Sign up\\n \\n\\n \\n
\\n
\\n\\n
\\n
\\n \\n
\\n\\n \\n\\n \\n
\\n
\\n
\\n\\n
\\n\\n
\\n\\n\\n
\\n\\n
\\n\\n\\n\\n
\\n
\\n
\\n \\n
\\n\\n\\n
\\n
\\n

Trending

\\n

See what the GitHub community is most excited about today.

\\n
\\n
\\n\\n\\n
\\n
\\n
\\n \\n\\n\\n
\\n
\\n
\\n \\n Language:\\n\\n \\n \\n Python\\n \\n \\n \\n\\n \\n
\\n Select a language\\n \\n
\\n\\n
\\n
\\n
\\n \\n
\\n
\\n
\\n\\n
\\n
\\n \\n\\n Clear language\\n
\\n\\n
\\n \\n \\n C++\\n \\n \\n \\n HTML\\n \\n \\n \\n Java\\n \\n \\n \\n JavaScript\\n \\n \\n \\n PHP\\n \\n \\n \\n Python\\n \\n \\n \\n Ruby\\n \\n\\n \\n \\n Unknown languages\\n \\n\\n \\n \\n 1C Enterprise\\n \\n \\n \\n ABAP\\n \\n \\n \\n ABNF\\n \\n \\n \\n ActionScript\\n \\n \\n \\n Ada\\n \\n \\n \\n Adobe Font Metrics\\n \\n \\n \\n Agda\\n \\n \\n \\n AGS Script\\n \\n \\n \\n Alloy\\n \\n \\n \\n Alpine Abuild\\n \\n \\n \\n Altium Designer\\n \\n \\n \\n AMPL\\n \\n \\n \\n AngelScript\\n \\n \\n \\n Ant Build System\\n \\n \\n \\n ANTLR\\n \\n \\n \\n ApacheConf\\n \\n \\n \\n Apex\\n \\n \\n \\n API Blueprint\\n \\n \\n \\n APL\\n \\n \\n \\n Apollo Guidance Computer\\n \\n \\n \\n AppleScript\\n \\n \\n \\n Arc\\n \\n \\n \\n AsciiDoc\\n \\n \\n \\n ASN.1\\n \\n \\n \\n ASP\\n \\n \\n \\n AspectJ\\n \\n \\n \\n Assembly\\n \\n \\n \\n Asymptote\\n \\n \\n \\n ATS\\n \\n \\n \\n Augeas\\n \\n \\n \\n AutoHotkey\\n \\n \\n \\n AutoIt\\n \\n \\n \\n Awk\\n \\n \\n \\n Ballerina\\n \\n \\n \\n Batchfile\\n \\n \\n \\n Befunge\\n \\n \\n \\n Bison\\n \\n \\n \\n BitBake\\n \\n \\n \\n Blade\\n \\n \\n \\n BlitzBasic\\n \\n \\n \\n BlitzMax\\n \\n \\n \\n Bluespec\\n \\n \\n \\n Boo\\n \\n \\n \\n Brainfuck\\n \\n \\n \\n Brightscript\\n \\n \\n \\n Zeek\\n \\n \\n \\n C\\n \\n \\n \\n C#\\n \\n \\n \\n C++\\n \\n \\n \\n C-ObjDump\\n \\n \\n \\n C2hs Haskell\\n \\n \\n \\n Cabal Config\\n \\n \\n \\n Cap'n Proto\\n \\n \\n \\n CartoCSS\\n \\n \\n \\n Ceylon\\n \\n \\n \\n Chapel\\n \\n \\n \\n Charity\\n \\n \\n \\n ChucK\\n \\n \\n \\n Cirru\\n \\n \\n \\n Clarion\\n \\n \\n \\n Clean\\n \\n \\n \\n Click\\n \\n \\n \\n CLIPS\\n \\n \\n \\n Clojure\\n \\n \\n \\n Closure Templates\\n \\n \\n \\n Cloud Firestore Security Rules\\n \\n \\n \\n CMake\\n \\n \\n \\n COBOL\\n \\n \\n \\n CoffeeScript\\n \\n \\n \\n ColdFusion\\n \\n \\n \\n ColdFusion CFC\\n \\n \\n \\n COLLADA\\n \\n \\n \\n Common Lisp\\n \\n \\n \\n Common Workflow Language\\n \\n \\n \\n Component Pascal\\n \\n \\n \\n CoNLL-U\\n \\n \\n \\n Cool\\n \\n \\n \\n Coq\\n \\n \\n \\n Cpp-ObjDump\\n \\n \\n \\n Creole\\n \\n \\n \\n Crystal\\n \\n \\n \\n CSON\\n \\n \\n \\n Csound\\n \\n \\n \\n Csound Document\\n \\n \\n \\n Csound Score\\n \\n \\n \\n CSS\\n \\n \\n \\n CSV\\n \\n \\n \\n Cuda\\n \\n \\n \\n CWeb\\n \\n \\n \\n Cycript\\n \\n \\n \\n Cython\\n \\n \\n \\n D\\n \\n \\n \\n D-ObjDump\\n \\n \\n \\n Darcs Patch\\n \\n \\n \\n Dart\\n \\n \\n \\n DataWeave\\n \\n \\n \\n desktop\\n \\n \\n \\n Dhall\\n \\n \\n \\n Diff\\n \\n \\n \\n DIGITAL Command Language\\n \\n \\n \\n DM\\n \\n \\n \\n DNS Zone\\n \\n \\n \\n Dockerfile\\n \\n \\n \\n Dogescript\\n \\n \\n \\n DTrace\\n \\n \\n \\n Dylan\\n \\n \\n \\n E\\n \\n \\n \\n Eagle\\n \\n \\n \\n Easybuild\\n \\n \\n \\n EBNF\\n \\n \\n \\n eC\\n \\n \\n \\n Ecere Projects\\n \\n \\n \\n ECL\\n \\n \\n \\n ECLiPSe\\n \\n \\n \\n Edje Data Collection\\n \\n \\n \\n edn\\n \\n \\n \\n Eiffel\\n \\n \\n \\n EJS\\n \\n \\n \\n Elixir\\n \\n \\n \\n Elm\\n \\n \\n \\n Emacs Lisp\\n \\n \\n \\n EmberScript\\n \\n \\n \\n EML\\n \\n \\n \\n EQ\\n \\n \\n \\n Erlang\\n \\n \\n \\n F#\\n \\n \\n \\n F*\\n \\n \\n \\n Factor\\n \\n \\n \\n Fancy\\n \\n \\n \\n Fantom\\n \\n \\n \\n FIGlet Font\\n \\n \\n \\n Filebench WML\\n \\n \\n \\n Filterscript\\n \\n \\n \\n fish\\n \\n \\n \\n FLUX\\n \\n \\n \\n Formatted\\n \\n \\n \\n Forth\\n \\n \\n \\n Fortran\\n \\n \\n \\n FreeMarker\\n \\n \\n \\n Frege\\n \\n \\n \\n G-code\\n \\n \\n \\n Game Maker Language\\n \\n \\n \\n GAMS\\n \\n \\n \\n GAP\\n \\n \\n \\n GCC Machine Description\\n \\n \\n \\n GDB\\n \\n \\n \\n GDScript\\n \\n \\n \\n Genie\\n \\n \\n \\n Genshi\\n \\n \\n \\n Gentoo Ebuild\\n \\n \\n \\n Gentoo Eclass\\n \\n \\n \\n Gerber Image\\n \\n \\n \\n Gettext Catalog\\n \\n \\n \\n Gherkin\\n \\n \\n \\n Git Attributes\\n \\n \\n \\n Git Config\\n \\n \\n \\n GLSL\\n \\n \\n \\n Glyph\\n \\n \\n \\n Glyph Bitmap Distribution Format\\n \\n \\n \\n GN\\n \\n \\n \\n Gnuplot\\n \\n \\n \\n Go\\n \\n \\n \\n Golo\\n \\n \\n \\n Gosu\\n \\n \\n \\n Grace\\n \\n \\n \\n Gradle\\n \\n \\n \\n Grammatical Framework\\n \\n \\n \\n Graph Modeling Language\\n \\n \\n \\n GraphQL\\n \\n \\n \\n Graphviz (DOT)\\n \\n \\n \\n Groovy\\n \\n \\n \\n Groovy Server Pages\\n \\n \\n \\n Hack\\n \\n \\n \\n Haml\\n \\n \\n \\n Handlebars\\n \\n \\n \\n HAProxy\\n \\n \\n \\n Harbour\\n \\n \\n \\n Haskell\\n \\n \\n \\n Haxe\\n \\n \\n \\n HCL\\n \\n \\n \\n HiveQL\\n \\n \\n \\n HLSL\\n \\n \\n \\n HolyC\\n \\n \\n \\n HTML\\n \\n \\n \\n HTML+Django\\n \\n \\n \\n HTML+ECR\\n \\n \\n \\n HTML+EEX\\n \\n \\n \\n HTML+ERB\\n \\n \\n \\n HTML+PHP\\n \\n \\n \\n HTML+Razor\\n \\n \\n \\n HTTP\\n \\n \\n \\n HXML\\n \\n \\n \\n Hy\\n \\n \\n \\n HyPhy\\n \\n \\n \\n IDL\\n \\n \\n \\n Idris\\n \\n \\n \\n IGOR Pro\\n \\n \\n \\n Inform 7\\n \\n \\n \\n INI\\n \\n \\n \\n Inno Setup\\n \\n \\n \\n Io\\n \\n \\n \\n Ioke\\n \\n \\n \\n IRC log\\n \\n \\n \\n Isabelle\\n \\n \\n \\n Isabelle ROOT\\n \\n \\n \\n J\\n \\n \\n \\n Jasmin\\n \\n \\n \\n Java\\n \\n \\n \\n Java Properties\\n \\n \\n \\n Java Server Pages\\n \\n \\n \\n JavaScript\\n \\n \\n \\n JavaScript+ERB\\n \\n \\n \\n JFlex\\n \\n \\n \\n Jison\\n \\n \\n \\n Jison Lex\\n \\n \\n \\n Jolie\\n \\n \\n \\n JSON\\n \\n \\n \\n JSON with Comments\\n \\n \\n \\n JSON5\\n \\n \\n \\n JSONiq\\n \\n \\n \\n JSONLD\\n \\n \\n \\n Jsonnet\\n \\n \\n \\n JSX\\n \\n \\n \\n Julia\\n \\n \\n \\n Jupyter Notebook\\n \\n \\n \\n KiCad Layout\\n \\n \\n \\n KiCad Legacy Layout\\n \\n \\n \\n KiCad Schematic\\n \\n \\n \\n Kit\\n \\n \\n \\n Kotlin\\n \\n \\n \\n KRL\\n \\n \\n \\n LabVIEW\\n \\n \\n \\n Lasso\\n \\n \\n \\n Latte\\n \\n \\n \\n Lean\\n \\n \\n \\n Less\\n \\n \\n \\n Lex\\n \\n \\n \\n LFE\\n \\n \\n \\n LilyPond\\n \\n \\n \\n Limbo\\n \\n \\n \\n Linker Script\\n \\n \\n \\n Linux Kernel Module\\n \\n \\n \\n Liquid\\n \\n \\n \\n Literate Agda\\n \\n \\n \\n Literate CoffeeScript\\n \\n \\n \\n Literate Haskell\\n \\n \\n \\n LiveScript\\n \\n \\n \\n LLVM\\n \\n \\n \\n Logos\\n \\n \\n \\n Logtalk\\n \\n \\n \\n LOLCODE\\n \\n \\n \\n LookML\\n \\n \\n \\n LoomScript\\n \\n \\n \\n LSL\\n \\n \\n \\n Lua\\n \\n \\n \\n M\\n \\n \\n \\n M4\\n \\n \\n \\n M4Sugar\\n \\n \\n \\n Makefile\\n \\n \\n \\n Mako\\n \\n \\n \\n Markdown\\n \\n \\n \\n Marko\\n \\n \\n \\n Mask\\n \\n \\n \\n Mathematica\\n \\n \\n \\n MATLAB\\n \\n \\n \\n Maven POM\\n \\n \\n \\n Max\\n \\n \\n \\n MAXScript\\n \\n \\n \\n mcfunction\\n \\n \\n \\n MediaWiki\\n \\n \\n \\n Mercury\\n \\n \\n \\n Meson\\n \\n \\n \\n Metal\\n \\n \\n \\n MiniD\\n \\n \\n \\n Mirah\\n \\n \\n \\n Modelica\\n \\n \\n \\n Modula-2\\n \\n \\n \\n Modula-3\\n \\n \\n \\n Module Management System\\n \\n \\n \\n Monkey\\n \\n \\n \\n Moocode\\n \\n \\n \\n MoonScript\\n \\n \\n \\n Motorola 68K Assembly\\n \\n \\n \\n MQL4\\n \\n \\n \\n MQL5\\n \\n \\n \\n MTML\\n \\n \\n \\n MUF\\n \\n \\n \\n mupad\\n \\n \\n \\n Myghty\\n \\n \\n \\n nanorc\\n \\n \\n \\n NCL\\n \\n \\n \\n Nearley\\n \\n \\n \\n Nemerle\\n \\n \\n \\n nesC\\n \\n \\n \\n NetLinx\\n \\n \\n \\n NetLinx+ERB\\n \\n \\n \\n NetLogo\\n \\n \\n \\n NewLisp\\n \\n \\n \\n Nextflow\\n \\n \\n \\n Nginx\\n \\n \\n \\n Nim\\n \\n \\n \\n Ninja\\n \\n \\n \\n Nit\\n \\n \\n \\n Nix\\n \\n \\n \\n NL\\n \\n \\n \\n NSIS\\n \\n \\n \\n Nu\\n \\n \\n \\n NumPy\\n \\n \\n \\n ObjDump\\n \\n \\n \\n Objective-C\\n \\n \\n \\n Objective-C++\\n \\n \\n \\n Objective-J\\n \\n \\n \\n ObjectScript\\n \\n \\n \\n OCaml\\n \\n \\n \\n Omgrofl\\n \\n \\n \\n ooc\\n \\n \\n \\n Opa\\n \\n \\n \\n Opal\\n \\n \\n \\n OpenCL\\n \\n \\n \\n OpenEdge ABL\\n \\n \\n \\n OpenRC runscript\\n \\n \\n \\n OpenSCAD\\n \\n \\n \\n OpenType Feature File\\n \\n \\n \\n Org\\n \\n \\n \\n Ox\\n \\n \\n \\n Oxygene\\n \\n \\n \\n Oz\\n \\n \\n \\n P4\\n \\n \\n \\n Pan\\n \\n \\n \\n Papyrus\\n \\n \\n \\n Parrot\\n \\n \\n \\n Parrot Assembly\\n \\n \\n \\n Parrot Internal Representation\\n \\n \\n \\n Pascal\\n \\n \\n \\n Pawn\\n \\n \\n \\n Pep8\\n \\n \\n \\n Perl\\n \\n \\n \\n Perl 6\\n \\n \\n \\n PHP\\n \\n \\n \\n Pic\\n \\n \\n \\n Pickle\\n \\n \\n \\n PicoLisp\\n \\n \\n \\n PigLatin\\n \\n \\n \\n Pike\\n \\n \\n \\n PLpgSQL\\n \\n \\n \\n PLSQL\\n \\n \\n \\n Pod\\n \\n \\n \\n Pod 6\\n \\n \\n \\n PogoScript\\n \\n \\n \\n Pony\\n \\n \\n \\n PostCSS\\n \\n \\n \\n PostScript\\n \\n \\n \\n POV-Ray SDL\\n \\n \\n \\n PowerBuilder\\n \\n \\n \\n PowerShell\\n \\n \\n \\n Processing\\n \\n \\n \\n Prolog\\n \\n \\n \\n Propeller Spin\\n \\n \\n \\n Protocol Buffer\\n \\n \\n \\n Public Key\\n \\n \\n \\n Pug\\n \\n \\n \\n Puppet\\n \\n \\n \\n Pure Data\\n \\n \\n \\n PureBasic\\n \\n \\n \\n PureScript\\n \\n \\n \\n Python\\n \\n \\n \\n Python console\\n \\n \\n \\n Python traceback\\n \\n \\n \\n q\\n \\n \\n \\n QMake\\n \\n \\n \\n QML\\n \\n \\n \\n Quake\\n \\n \\n \\n R\\n \\n \\n \\n Racket\\n \\n \\n \\n Ragel\\n \\n \\n \\n RAML\\n \\n \\n \\n Rascal\\n \\n \\n \\n Raw token data\\n \\n \\n \\n RDoc\\n \\n \\n \\n REALbasic\\n \\n \\n \\n Reason\\n \\n \\n \\n Rebol\\n \\n \\n \\n Red\\n \\n \\n \\n Redcode\\n \\n \\n \\n Regular Expression\\n \\n \\n \\n Ren'Py\\n \\n \\n \\n RenderScript\\n \\n \\n \\n reStructuredText\\n \\n \\n \\n REXX\\n \\n \\n \\n RHTML\\n \\n \\n \\n Rich Text Format\\n \\n \\n \\n Ring\\n \\n \\n \\n RMarkdown\\n \\n \\n \\n RobotFramework\\n \\n \\n \\n Roff\\n \\n \\n \\n Roff Manpage\\n \\n \\n \\n Rouge\\n \\n \\n \\n RPC\\n \\n \\n \\n RPM Spec\\n \\n \\n \\n Ruby\\n \\n \\n \\n RUNOFF\\n \\n \\n \\n Rust\\n \\n \\n \\n Sage\\n \\n \\n \\n SaltStack\\n \\n \\n \\n SAS\\n \\n \\n \\n Sass\\n \\n \\n \\n Scala\\n \\n \\n \\n Scaml\\n \\n \\n \\n Scheme\\n \\n \\n \\n Scilab\\n \\n \\n \\n SCSS\\n \\n \\n \\n sed\\n \\n \\n \\n Self\\n \\n \\n \\n ShaderLab\\n \\n \\n \\n Shell\\n \\n \\n \\n ShellSession\\n \\n \\n \\n Shen\\n \\n \\n \\n Slash\\n \\n \\n \\n Slice\\n \\n \\n \\n Slim\\n \\n \\n \\n Smali\\n \\n \\n \\n Smalltalk\\n \\n \\n \\n Smarty\\n \\n \\n \\n SMT\\n \\n \\n \\n Solidity\\n \\n \\n \\n SourcePawn\\n \\n \\n \\n SPARQL\\n \\n \\n \\n Spline Font Database\\n \\n \\n \\n SQF\\n \\n \\n \\n SQL\\n \\n \\n \\n SQLPL\\n \\n \\n \\n Squirrel\\n \\n \\n \\n SRecode Template\\n \\n \\n \\n SSH Config\\n \\n \\n \\n Stan\\n \\n \\n \\n Standard ML\\n \\n \\n \\n Stata\\n \\n \\n \\n STON\\n \\n \\n \\n Stylus\\n \\n \\n \\n SubRip Text\\n \\n \\n \\n SugarSS\\n \\n \\n \\n SuperCollider\\n \\n \\n \\n SVG\\n \\n \\n \\n Swift\\n \\n \\n \\n SystemVerilog\\n \\n \\n \\n Tcl\\n \\n \\n \\n Tcsh\\n \\n \\n \\n Tea\\n \\n \\n \\n Terra\\n \\n \\n \\n TeX\\n \\n \\n \\n Text\\n \\n \\n \\n Textile\\n \\n \\n \\n Thrift\\n \\n \\n \\n TI Program\\n \\n \\n \\n TLA\\n \\n \\n \\n TOML\\n \\n \\n \\n TSQL\\n \\n \\n \\n TSX\\n \\n \\n \\n Turing\\n \\n \\n \\n Turtle\\n \\n \\n \\n Twig\\n \\n \\n \\n TXL\\n \\n \\n \\n Type Language\\n \\n \\n \\n TypeScript\\n \\n \\n \\n Unified Parallel C\\n \\n \\n \\n Unity3D Asset\\n \\n \\n \\n Unix Assembly\\n \\n \\n \\n Uno\\n \\n \\n \\n UnrealScript\\n \\n \\n \\n UrWeb\\n \\n \\n \\n Vala\\n \\n \\n \\n VCL\\n \\n \\n \\n Verilog\\n \\n \\n \\n VHDL\\n \\n \\n \\n Vim script\\n \\n \\n \\n Visual Basic\\n \\n \\n \\n Volt\\n \\n \\n \\n Vue\\n \\n \\n \\n Wavefront Material\\n \\n \\n \\n Wavefront Object\\n \\n \\n \\n wdl\\n \\n \\n \\n Web Ontology Language\\n \\n \\n \\n WebAssembly\\n \\n \\n \\n WebIDL\\n \\n \\n \\n WebVTT\\n \\n \\n \\n Windows Registry Entries\\n \\n \\n \\n wisp\\n \\n \\n \\n Wollok\\n \\n \\n \\n World of Warcraft Addon Data\\n \\n \\n \\n X BitMap\\n \\n \\n \\n X Font Directory Index\\n \\n \\n \\n X PixMap\\n \\n \\n \\n X10\\n \\n \\n \\n xBase\\n \\n \\n \\n XC\\n \\n \\n \\n XCompose\\n \\n \\n \\n XML\\n \\n \\n \\n Xojo\\n \\n \\n \\n XPages\\n \\n \\n \\n XProc\\n \\n \\n \\n XQuery\\n \\n \\n \\n XS\\n \\n \\n \\n XSLT\\n \\n \\n \\n Xtend\\n \\n \\n \\n Yacc\\n \\n \\n \\n YAML\\n \\n \\n \\n YANG\\n \\n \\n \\n YARA\\n \\n \\n \\n YASnippet\\n \\n \\n \\n ZAP\\n \\n \\n \\n Zeek\\n \\n \\n \\n ZenScript\\n \\n \\n \\n Zephir\\n \\n \\n \\n Zig\\n \\n \\n \\n ZIL\\n \\n \\n \\n Zimpl\\n \\n
\\n
\\n\\n
\\n \\n
\\n
\\n
\\n\\n
\\n\\n
\\n
\\n \\n Date range:\\n Today\\n \\n \\n
\\n Adjust time span\\n \\n
\\n\\n
\\n \\n \\n Today\\n \\n \\n \\n This week\\n \\n \\n \\n This month\\n \\n
\\n
\\n
\\n\\n
\\n
\\n
\\n
\\n \\n\\n \\n\\n \\n\\n
\\n
\\n \\n \\n Star\\n\\n\\n
\\n\\n

\\n \\n \\n uber / ludwig\\n

\\n\\n

\\n Ludwig is a toolbox built on top of TensorFlow that allows to train and test deep learning models without the need to write code.\\n

\\n\\n
\\n \\n \\n Python\\n\\n\\n\\n \\n \\n 5,146\\n \\n\\n \\n \\n 547\\n \\n\\n \\n \\n Built by\\n \"@w4nderlust\"\\n \"@msaisumanth\"\\n \"@ydudin3\"\\n \"@dsblank\"\\n \"@carlogrisetti\"\\n \\n\\n \\n \\n 74 stars today\\n \\n
\\n
\\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n \\n\\n
\\n
\\n \\n \\n Star\\n\\n\\n
\\n\\n

\\n \\n \\n d2l-ai / d2l-zh\\n

\\n\\n

\\n \\xe3\\x80\\x8a\\xe5\\x8a\\xa8\\xe6\\x89\\x8b\\xe5\\xad\\xa6\\xe6\\xb7\\xb1\\xe5\\xba\\xa6\\xe5\\xad\\xa6\\xe4\\xb9\\xa0\\xe3\\x80\\x8b\\xef\\xbc\\x9a\\xe9\\x9d\\xa2\\xe5\\x90\\x91\\xe4\\xb8\\xad\\xe6\\x96\\x87\\xe8\\xaf\\xbb\\xe8\\x80\\x85\\xe3\\x80\\x81\\xe8\\x83\\xbd\\xe8\\xbf\\x90\\xe8\\xa1\\x8c\\xe3\\x80\\x81\\xe5\\x8f\\xaf\\xe8\\xae\\xa8\\xe8\\xae\\xba\\xe3\\x80\\x82\\xe8\\x8b\\xb1\\xe6\\x96\\x87\\xe7\\x89\\x88\\xe5\\x8d\\xb3\\xe4\\xbc\\xaf\\xe5\\x85\\x8b\\xe5\\x88\\xa9\\xe2\\x80\\x9c\\xe6\\xb7\\xb1\\xe5\\xba\\xa6\\xe5\\xad\\xa6\\xe4\\xb9\\xa0\\xe5\\xaf\\xbc\\xe8\\xae\\xba\\xef\\xbc\\x88STAT 157\\xef\\xbc\\x89\\xe2\\x80\\x9d\\xe6\\x95\\x99\\xe6\\x9d\\x90\\xe3\\x80\\x82\\n

\\n\\n
\\n \\n \\n Python\\n\\n\\n\\n \\n \\n 10,459\\n \\n\\n \\n \\n 2,665\\n \\n\\n \\n \\n Built by\\n \"@astonzhang\"\\n \"@mli\"\\n \"@szha\"\\n \"@yanwenlei\"\\n \"@XiaGenYuan\"\\n \\n\\n \\n \\n 45 stars today\\n \\n
\\n
\\n\\n \\n\\n
\\n
\\n \\n \\n Star\\n\\n\\n
\\n\\n

\\n \\n \\n beecost / bee-university\\n

\\n\\n

\\n Project thu th\\xe1\\xba\\xadp \\xc4\\x91i\\xe1\\xbb\\x83m chu\\xe1\\xba\\xa9n \\xc4\\x91\\xe1\\xba\\xa1i h\\xe1\\xbb\\x8dc 2014 - 2018 v\\xc3\\xa0 ph\\xc3\\xa2n t\\xc3\\xadch d\\xe1\\xbb\\xaf li\\xe1\\xbb\\x87u\\n

\\n\\n
\\n \\n \\n Python\\n\\n\\n\\n \\n \\n 61\\n \\n\\n \\n \\n 12\\n \\n\\n \\n \\n Built by\\n \"@tuantmtb\"\\n \\n\\n \\n \\n 5 stars today\\n \\n
\\n
\\n\\n \\n\\n
\\n
\\n
\\n
\\n
\\n\\n
\\n\\n \\n\\n\\n\\n\\n
\\n \\n \\n You can\\xe2\\x80\\x99t perform that action at this time.\\n
\\n\\n\\n \\n \\n \\n \\n \\n \\n \\n
\\n \\n You signed in with another tab or window. Reload to refresh your session.\\n You signed out in another tab or window. Reload to refresh your session.\\n
\\n \\n\\n
\\n
\\n
\\n
\\n\\n
\\n\\n \\n\\n\\n'" + ] + }, + "execution_count": 9, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "#your code" + "#your code\n", + "html = requests.get(url).content\n", + "html" ] }, { - "cell_type": "markdown", - "metadata": {}, + "cell_type": "code", + "execution_count": 10, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "['gto76/python-cheatsheet',\n", + " 'j3ssie/Osmedeus',\n", + " 'tangzixiang0304/Shielded_detector',\n", + " 'uber/ludwig',\n", + " 'xinshuoweng/AB3DMOT',\n", + " 'NVlabs/stylegan',\n", + " 'dagster-io/dagster',\n", + " 'tensorflow/models',\n", + " 'eragonruan/text-detection-ctpn',\n", + " 'sherlock-project/sherlock',\n", + " 'deepfakes/faceswap',\n", + " 'nbei/Deep-Flow-Guided-Video-Inpainting',\n", + " 'iovisor/bcc',\n", + " 'Roibal/Cryptocurrency-Trading-Bots-Python-Beginner-Advance',\n", + " 'NVIDIA/DeepLearningExamples',\n", + " 'BlackHC/tfpyth',\n", + " 'clovaai/deep-text-recognition-benchmark',\n", + " 'tkat0/PyTorch_BlazeFace',\n", + " 'OpenMined/PySyft',\n", + " 'CoreyMSchafer/code_snippets',\n", + " 'public-apis/public-apis',\n", + " 'd2l-ai/d2l-zh',\n", + " 'apache/airflow',\n", + " 'beecost/bee-university',\n", + " 'sundowndev/PhoneInfoga']" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "#### Display all the image links from Walt Disney wikipedia page" + "soup_html = BeautifulSoup(html,'html')\n", + "tags = ['h1']\n", + "texto = soup_html.find_all(tags,{'class':'h3 lh-condensed'})\n", + "\n", + "names = [t.text.replace('\\n','').replace(' ','') for t in texto]\n", + "names\n", + "\n" ] }, { - "cell_type": "code", - "execution_count": null, + "cell_type": "markdown", "metadata": {}, - "outputs": [], "source": [ - "# This is the url you will scrape in this exercise\n", - "url = 'https://en.wikipedia.org/wiki/Walt_Disney'" + "#### Display all the image links from Walt Disney wikipedia page" ] }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], + "execution_count": 11, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "['//upload.wikimedia.org/wikipedia/en/thumb/e/e7/Cscr-featured.svg/20px-Cscr-featured.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/1/1b/Semi-protection-shackle.svg/20px-Semi-protection-shackle.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/d/df/Walt_Disney_1946.JPG/220px-Walt_Disney_1946.JPG',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/8/87/Walt_Disney_1942_signature.svg/150px-Walt_Disney_1942_signature.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/c/c4/Walt_Disney_envelope_ca._1921.jpg/220px-Walt_Disney_envelope_ca._1921.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/4/4d/Newman_Laugh-O-Gram_%281921%29.webm/220px-seek%3D2-Newman_Laugh-O-Gram_%281921%29.webm.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/0/0d/Trolley_Troubles_poster.jpg/170px-Trolley_Troubles_poster.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/7/71/Walt_Disney_and_his_cartoon_creation_%22Mickey_Mouse%22_-_National_Board_of_Review_Magazine.jpg/170px-Walt_Disney_and_his_cartoon_creation_%22Mickey_Mouse%22_-_National_Board_of_Review_Magazine.jpg',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/4/4e/Steamboat-willie.jpg/170px-Steamboat-willie.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/5/57/Walt_Disney_1935.jpg/170px-Walt_Disney_1935.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/c/cd/Walt_Disney_Snow_white_1937_trailer_screenshot_%2813%29.jpg/220px-Walt_Disney_Snow_white_1937_trailer_screenshot_%2813%29.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/1/15/Disney_drawing_goofy.jpg/170px-Disney_drawing_goofy.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/1/13/DisneySchiphol1951.jpg/220px-DisneySchiphol1951.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/8/8c/WaltDisneyplansDisneylandDec1954.jpg/220px-WaltDisneyplansDisneylandDec1954.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/f/ff/Walt_disney_portrait_right.jpg/170px-Walt_disney_portrait_right.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/1/1a/Walt_Disney_Grave.JPG/170px-Walt_Disney_Grave.JPG',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/2/2d/Roy_O._Disney_with_Company_at_Press_Conference.jpg/170px-Roy_O._Disney_with_Company_at_Press_Conference.jpg',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/a/a9/Disney_Display_Case.JPG/170px-Disney_Display_Case.JPG',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/6/6c/Disney1968.jpg/170px-Disney1968.jpg',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/8/8a/OOjs_UI_icon_edit-ltr-progressive.svg/10px-OOjs_UI_icon_edit-ltr-progressive.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/d/da/Animation_disc.svg/30px-Animation_disc.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/6/69/P_vip.svg/29px-P_vip.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/1/1a/Magic_Kingdom_castle.jpg/24px-Magic_Kingdom_castle.jpg',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/e/e7/Video-x-generic.svg/30px-Video-x-generic.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/a/a3/Flag_of_Los_Angeles_County%2C_California.svg/30px-Flag_of_Los_Angeles_County%2C_California.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/a/a3/USA_flag_on_television.svg/30px-USA_flag_on_television.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/4/4a/Commons-logo.svg/22px-Commons-logo.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/f/fa/Wikiquote-logo.svg/25px-Wikiquote-logo.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/commons/thumb/f/ff/Wikidata-logo.svg/30px-Wikidata-logo.svg.png',\n", + " '//upload.wikimedia.org/wikipedia/en/thumb/8/8a/OOjs_UI_icon_edit-ltr-progressive.svg/10px-OOjs_UI_icon_edit-ltr-progressive.svg.png',\n", + " '//en.wikipedia.org/wiki/Special:CentralAutoLogin/start?type=1x1',\n", + " '/static/images/wikimedia-button.png',\n", + " '/static/images/poweredby_mediawiki_88x31.png']" + ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "#your code" + "# This is the url you will scrape in this exercise\n", + "url = 'https://en.wikipedia.org/wiki/Walt_Disney'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')\n", + "\n", + "tags = ['img']\n", + "images = soup_html.find_all(tags)\n", + "\n", + "image_list = [i.attrs['src'] for i in images]\n", + "image_list" ] }, { @@ -204,21 +4166,189 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 12, "metadata": {}, "outputs": [], "source": [ "# This is the url you will scrape in this exercise\n", - "url ='https://en.wikipedia.org/wiki/Python' " + "url ='https://en.wikipedia.org/wiki/Python'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')" ] }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], + "execution_count": 13, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "['https://en.wiktionary.org/wiki/Python',\n", + " 'https://en.wiktionary.org/wiki/python',\n", + " '/w/index.php?title=Python&action=edit§ion=1',\n", + " '/wiki/Pythonidae',\n", + " '/wiki/Python_(genus)',\n", + " '/w/index.php?title=Python&action=edit§ion=2',\n", + " '/wiki/Python_(mythology)',\n", + " '/wiki/Python_of_Aenus',\n", + " '/wiki/Python_(painter)',\n", + " '/wiki/Python_of_Byzantium',\n", + " '/wiki/Python_of_Catana',\n", + " '/w/index.php?title=Python&action=edit§ion=3',\n", + " '/wiki/Python_(film)',\n", + " '/wiki/Pythons_2',\n", + " '/wiki/Monty_Python',\n", + " '/wiki/Python_(Monty)_Pictures',\n", + " '/w/index.php?title=Python&action=edit§ion=4',\n", + " '/wiki/Python_(programming_language)',\n", + " '/wiki/CPython',\n", + " '/wiki/CMU_Common_Lisp',\n", + " '/wiki/PERQ#PERQ_3',\n", + " '/w/index.php?title=Python&action=edit§ion=5',\n", + " '/w/index.php?title=Python&action=edit§ion=6',\n", + " '/wiki/Python_(Busch_Gardens_Tampa_Bay)',\n", + " '/wiki/Python_(Coney_Island,_Cincinnati,_Ohio)',\n", + " '/wiki/Python_(Efteling)',\n", + " '/w/index.php?title=Python&action=edit§ion=7',\n", + " '/wiki/Python_(automobile_maker)',\n", + " '/wiki/Python_(Ford_prototype)',\n", + " '/w/index.php?title=Python&action=edit§ion=8',\n", + " '/wiki/Colt_Python',\n", + " '/wiki/Python_(missile)',\n", + " '/wiki/Python_(nuclear_primary)',\n", + " '/w/index.php?title=Python&action=edit§ion=9',\n", + " '/wiki/Python_Anghelo',\n", + " '/w/index.php?title=Python&action=edit§ion=10',\n", + " '/wiki/PYTHON',\n", + " '/w/index.php?title=Python&action=edit§ion=11',\n", + " '/wiki/Cython',\n", + " '/wiki/Pyton',\n", + " '/wiki/File:Disambig_gray.svg',\n", + " '/wiki/Help:Disambiguation',\n", + " '//en.wikipedia.org/w/index.php?title=Special:WhatLinksHere/Python&namespace=0',\n", + " 'https://en.wikipedia.org/w/index.php?title=Python&oldid=905477736',\n", + " '/wiki/Help:Category',\n", + " '/wiki/Category:Disambiguation_pages',\n", + " '/wiki/Category:Disambiguation_pages_with_short_description',\n", + " '/wiki/Category:All_article_disambiguation_pages',\n", + " '/wiki/Category:All_disambiguation_pages',\n", + " '/wiki/Category:Animal_common_name_disambiguation_pages',\n", + " '/wiki/Special:MyTalk',\n", + " '/wiki/Special:MyContributions',\n", + " '/w/index.php?title=Special:CreateAccount&returnto=Python',\n", + " '/w/index.php?title=Special:UserLogin&returnto=Python',\n", + " '/wiki/Python',\n", + " '/wiki/Talk:Python',\n", + " '/wiki/Python',\n", + " '/w/index.php?title=Python&action=edit',\n", + " '/w/index.php?title=Python&action=history',\n", + " '/wiki/Main_Page',\n", + " '/wiki/Main_Page',\n", + " '/wiki/Portal:Contents',\n", + " '/wiki/Portal:Featured_content',\n", + " '/wiki/Portal:Current_events',\n", + " '/wiki/Special:Random',\n", + " 'https://donate.wikimedia.org/wiki/Special:FundraiserRedirector?utm_source=donate&utm_medium=sidebar&utm_campaign=C13_en.wikipedia.org&uselang=en',\n", + " '//shop.wikimedia.org',\n", + " '/wiki/Help:Contents',\n", + " '/wiki/Wikipedia:About',\n", + " '/wiki/Wikipedia:Community_portal',\n", + " '/wiki/Special:RecentChanges',\n", + " '//en.wikipedia.org/wiki/Wikipedia:Contact_us',\n", + " '/wiki/Special:WhatLinksHere/Python',\n", + " '/wiki/Special:RecentChangesLinked/Python',\n", + " '/wiki/Wikipedia:File_Upload_Wizard',\n", + " '/wiki/Special:SpecialPages',\n", + " '/w/index.php?title=Python&oldid=905477736',\n", + " '/w/index.php?title=Python&action=info',\n", + " 'https://www.wikidata.org/wiki/Special:EntityPage/Q747452',\n", + " '/w/index.php?title=Special:CiteThisPage&page=Python&id=905477736',\n", + " 'https://commons.wikimedia.org/wiki/Category:Python',\n", + " '/w/index.php?title=Special:Book&bookcmd=book_creator&referer=Python',\n", + " '/w/index.php?title=Special:ElectronPdf&page=Python&action=show-download-screen',\n", + " '/w/index.php?title=Python&printable=yes',\n", + " 'https://af.wikipedia.org/wiki/Python',\n", + " 'https://als.wikipedia.org/wiki/Python',\n", + " 'https://az.wikipedia.org/wiki/Python',\n", + " 'https://bn.wikipedia.org/wiki/%E0%A6%AA%E0%A6%BE%E0%A6%87%E0%A6%A5%E0%A6%A8_(%E0%A6%A6%E0%A7%8D%E0%A6%AC%E0%A7%8D%E0%A6%AF%E0%A6%B0%E0%A7%8D%E0%A6%A5%E0%A6%A4%E0%A6%BE_%E0%A6%A8%E0%A6%BF%E0%A6%B0%E0%A6%B8%E0%A6%A8)',\n", + " 'https://be.wikipedia.org/wiki/Python',\n", + " 'https://bg.wikipedia.org/wiki/%D0%9F%D0%B8%D1%82%D0%BE%D0%BD_(%D0%BF%D0%BE%D1%8F%D1%81%D0%BD%D0%B5%D0%BD%D0%B8%D0%B5)',\n", + " 'https://cs.wikipedia.org/wiki/Python_(rozcestn%C3%ADk)',\n", + " 'https://da.wikipedia.org/wiki/Python',\n", + " 'https://de.wikipedia.org/wiki/Python',\n", + " 'https://eo.wikipedia.org/wiki/Pitono_(apartigilo)',\n", + " 'https://eu.wikipedia.org/wiki/Python_(argipena)',\n", + " 'https://fa.wikipedia.org/wiki/%D9%BE%D8%A7%DB%8C%D8%AA%D9%88%D9%86',\n", + " 'https://fr.wikipedia.org/wiki/Python',\n", + " 'https://ko.wikipedia.org/wiki/%ED%8C%8C%EC%9D%B4%EC%84%A0',\n", + " 'https://hr.wikipedia.org/wiki/Python_(razdvojba)',\n", + " 'https://io.wikipedia.org/wiki/Pitono',\n", + " 'https://id.wikipedia.org/wiki/Python',\n", + " 'https://ia.wikipedia.org/wiki/Python_(disambiguation)',\n", + " 'https://is.wikipedia.org/wiki/Python_(a%C3%B0greining)',\n", + " 'https://it.wikipedia.org/wiki/Python_(disambigua)',\n", + " 'https://he.wikipedia.org/wiki/%D7%A4%D7%99%D7%AA%D7%95%D7%9F',\n", + " 'https://ka.wikipedia.org/wiki/%E1%83%9E%E1%83%98%E1%83%97%E1%83%9D%E1%83%9C%E1%83%98_(%E1%83%9B%E1%83%A0%E1%83%90%E1%83%95%E1%83%90%E1%83%9A%E1%83%9B%E1%83%9C%E1%83%98%E1%83%A8%E1%83%95%E1%83%9C%E1%83%94%E1%83%9A%E1%83%9D%E1%83%95%E1%83%90%E1%83%9C%E1%83%98)',\n", + " 'https://kg.wikipedia.org/wiki/Mboma_(nyoka)',\n", + " 'https://la.wikipedia.org/wiki/Python_(discretiva)',\n", + " 'https://lb.wikipedia.org/wiki/Python',\n", + " 'https://hu.wikipedia.org/wiki/Python_(egy%C3%A9rtelm%C5%B1s%C3%ADt%C5%91_lap)',\n", + " 'https://mr.wikipedia.org/wiki/%E0%A4%AA%E0%A4%BE%E0%A4%AF%E0%A4%A5%E0%A5%89%E0%A4%A8_(%E0%A4%86%E0%A4%9C%E0%A5%8D%E0%A4%9E%E0%A4%BE%E0%A4%B5%E0%A4%B2%E0%A5%80_%E0%A4%AD%E0%A4%BE%E0%A4%B7%E0%A4%BE)',\n", + " 'https://nl.wikipedia.org/wiki/Python',\n", + " 'https://ja.wikipedia.org/wiki/%E3%83%91%E3%82%A4%E3%82%BD%E3%83%B3',\n", + " 'https://no.wikipedia.org/wiki/Pyton',\n", + " 'https://pl.wikipedia.org/wiki/Pyton',\n", + " 'https://pt.wikipedia.org/wiki/Python_(desambigua%C3%A7%C3%A3o)',\n", + " 'https://ru.wikipedia.org/wiki/Python_(%D0%B7%D0%BD%D0%B0%D1%87%D0%B5%D0%BD%D0%B8%D1%8F)',\n", + " 'https://sd.wikipedia.org/wiki/%D8%A7%D8%B1%DA%99',\n", + " 'https://sk.wikipedia.org/wiki/Python',\n", + " 'https://sh.wikipedia.org/wiki/Python',\n", + " 'https://fi.wikipedia.org/wiki/Python',\n", + " 'https://sv.wikipedia.org/wiki/Pyton',\n", + " 'https://th.wikipedia.org/wiki/%E0%B9%84%E0%B8%9E%E0%B8%97%E0%B8%AD%E0%B8%99',\n", + " 'https://tr.wikipedia.org/wiki/Python',\n", + " 'https://uk.wikipedia.org/wiki/%D0%9F%D1%96%D1%84%D0%BE%D0%BD',\n", + " 'https://ur.wikipedia.org/wiki/%D9%BE%D8%A7%D8%A6%DB%8C%D8%AA%DA%BE%D9%88%D9%86',\n", + " 'https://vi.wikipedia.org/wiki/Python',\n", + " 'https://zh.wikipedia.org/wiki/Python_(%E6%B6%88%E6%AD%A7%E4%B9%89)',\n", + " 'https://www.wikidata.org/wiki/Special:EntityPage/Q747452#sitelinks-wikipedia',\n", + " '//en.wikipedia.org/wiki/Wikipedia:Text_of_Creative_Commons_Attribution-ShareAlike_3.0_Unported_License',\n", + " '//creativecommons.org/licenses/by-sa/3.0/',\n", + " '//foundation.wikimedia.org/wiki/Terms_of_Use',\n", + " '//foundation.wikimedia.org/wiki/Privacy_policy',\n", + " '//www.wikimediafoundation.org/',\n", + " 'https://foundation.wikimedia.org/wiki/Privacy_policy',\n", + " '/wiki/Wikipedia:About',\n", + " '/wiki/Wikipedia:General_disclaimer',\n", + " '//en.wikipedia.org/wiki/Wikipedia:Contact_us',\n", + " 'https://www.mediawiki.org/wiki/Special:MyLanguage/How_to_contribute',\n", + " 'https://foundation.wikimedia.org/wiki/Cookie_statement',\n", + " '//en.m.wikipedia.org/w/index.php?title=Python&mobileaction=toggle_view_mobile',\n", + " 'https://wikimediafoundation.org/',\n", + " 'https://www.mediawiki.org/']" + ] + }, + "execution_count": 13, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "#your code" + "wiki_links = soup_html.find_all('a',{'href':True})\n", + "\n", + "wiki_links_list = [w['href'] for w in wiki_links if not w['href'].startswith('#')]\n", + "wiki_links_list\n", + "\n", + "#wiki_links_list = []\n", + "#for i in wiki_links:\n", + "# try:\n", + "# wiki_links_list.append(i.attrs['href'])\n", + "# except:\n", + "# pass\n", + "#wiki_links" ] }, { @@ -230,21 +4360,44 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 14, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "['Title 2 - The Congress',\n", + " 'Title 6 - Domestic Security',\n", + " 'Title 7 - Agriculture',\n", + " 'Title 15 - Commerce and Trade',\n", + " 'Title 16 - Conservation',\n", + " 'Title 19 - Customs Duties',\n", + " 'Title 21 - Food and Drugs',\n", + " 'Title 26 - Internal Revenue Code',\n", + " 'Title 34 - Crime Control and Law Enforcement',\n", + " \"Title 38 - Veterans' Benefits\",\n", + " 'Title 42 - The Public Health and Welfare',\n", + " 'Title 43 - Public Lands',\n", + " 'Title 48 - Territories and Insular Possessions',\n", + " 'Title 49 - Transportation',\n", + " 'Title 50 - War and National Defense']" + ] + }, + "execution_count": 14, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'http://uscode.house.gov/download/download.shtml'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#your code" + "url = 'http://uscode.house.gov/download/download.shtml'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')\n", + "\n", + "titles = soup_html.find_all('div',{'class':'usctitlechanged'})\n", + "\n", + "titles_list = [t.text.replace('\\n\\n ','').replace('\\n\\n ','') for t in titles]\n", + "titles_list" ] }, { @@ -256,21 +4409,38 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 15, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "['ALEJANDRO ROSALES CASTILLO',\n", + " 'YASER ABDEL SAID',\n", + " 'JASON DEREK BROWN',\n", + " 'RAFAEL CARO-QUINTERO',\n", + " 'ALEXIS FLORES',\n", + " 'EUGENE PALMER',\n", + " 'SANTIAGO VILLALBA MEDEROS',\n", + " 'ROBERT WILLIAM FISHER',\n", + " 'BHADRESHKUMAR CHETANBHAI PATEL',\n", + " 'ARNOLDO JIMENEZ']" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'https://www.fbi.gov/wanted/topten'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#your code " + "url = 'https://www.fbi.gov/wanted/topten'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html5lib')\n", + "\n", + "wanted = soup_html.find_all('h3',{'class':'title'})\n", + "wanted_list = [w.text.replace('\\n','') for w in wanted]\n", + "wanted_list" ] }, { @@ -282,21 +4452,654 @@ }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], + "execution_count": 16, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Date & Time UTCLatitude degreesLongitude degreesRegion name [+]
12345678910›»12345678910›»12345678910›».112345678910›»12345678910›».112345678910›»
02019-07-16 20:52:18.608min ago36.07N117.84W2.0
12019-07-16 20:49:09.111min ago36.07N117.65W2.0
22019-07-16 20:33:52.927min ago40.09N19.91E2.7
32019-07-16 20:31:33.329min ago23.45S66.86W4.5
42019-07-16 20:29:07.731min ago35.86N117.69W2.2
52019-07-16 20:23:34.737min ago36.07N117.84W2.0
62019-07-16 20:19:00.142min ago33.10N12.42W2.8
72019-07-16 20:17:51.643min ago35.55N117.43W2.8
82019-07-16 20:15:36.845min ago35.78N117.62W4.5
92019-07-16 20:11:01.550min ago37.82N121.77W4.3
102019-07-16 19:42:25.91hr 18min ago35.61N117.47W2.3
112019-07-16 19:35:57.01hr 25min ago35.62N117.45W2.1
122019-07-16 19:23:50.11hr 37min ago36.19N117.89W2.7
132019-07-16 19:20:21.41hr 40min ago38.39N16.94E3.1
142019-07-16 19:16:53.81hr 44min ago38.45N16.91E2.6
152019-07-16 19:16:15.91hr 44min ago61.27N152.44W2.4
162019-07-16 19:11:48.91hr 49min ago36.03N117.87W2.5
172019-07-16 19:04:00.21hr 57min ago35.96N117.71W2.0
182019-07-16 19:01:48.01hr 59min ago39.56N67.17E3.6
192019-07-16 19:01:00.82hr 00min ago35.68N117.54W2.5
202019-07-16 18:53:32.02hr 07min ago0.68S126.36E4.0
212019-07-16 18:50:16.22hr 10min ago43.62N75.40E3.2
222019-07-16 18:47:48.92hr 13min ago35.59N117.42W2.1
232019-07-16 18:36:26.82hr 24min ago35.74N117.56W2.7
242019-07-16 18:22:31.92hr 38min ago35.65N117.52W2.0
252019-07-16 18:15:26.52hr 45min ago28.47N56.76E4.3
262019-07-16 18:10:01.02hr 51min ago34.41S150.73E2.4
272019-07-16 17:48:24.03hr 12min ago9.93S118.23E4.1
282019-07-16 17:42:29.93hr 18min ago35.67N117.54W2.0
292019-07-16 17:39:43.03hr 21min ago0.54S127.86E4.1
302019-07-16 17:31:56.03hr 29min ago35.67N117.47W2.3
312019-07-16 17:05:45.03hr 55min ago36.20N117.90W2.9
322019-07-16 17:05:08.03hr 55min ago15.40N94.64W4.2
332019-07-16 17:01:30.83hr 59min ago36.10N117.90W2.1
342019-07-16 16:45:56.54hr 15min ago0.68S127.58E4.7
352019-07-16 16:45:55.04hr 15min ago18.99N70.09W2.9
362019-07-16 16:43:40.94hr 17min ago37.23N28.27E2.7
372019-07-16 16:43:21.74hr 17min ago36.03N117.79W2.4
382019-07-16 16:36:41.54hr 24min ago35.96N117.30W2.1
392019-07-16 16:28:38.14hr 32min ago35.92N117.68W2.3
402019-07-16 16:27:59.04hr 33min ago18.51S120.55E2.9
412019-07-16 16:26:00.54hr 35min ago30.57N141.98E4.8
422019-07-16 16:21:05.14hr 39min ago28.45N56.70E4.5
432019-07-16 16:01:04.34hr 59min ago62.22N150.00W2.3
442019-07-16 15:59:52.05hr 01min ago35.81N117.63W2.9
452019-07-16 15:57:04.45hr 03min ago36.10N117.82W3.0
462019-07-16 15:28:58.05hr 32min ago18.26S120.37E3.3
472019-07-16 15:26:26.65hr 34min ago35.68N117.51W2.0
482019-07-16 15:25:42.65hr 35min ago37.16N141.54E4.6
492019-07-16 15:13:22.15hr 47min ago35.90N117.67W2.1
50NaNNaNNaNNaNNaNNaN
5112345678910›»12345678910›»12345678910›»12345678910›»12345678910›»12345678910›»
52NaNNaNNaNNaNNaNNaN
\n", + "
" + ], + "text/plain": [ + " Date & Time UTC Latitude degrees \\\n", + " 12345678910›» 12345678910›» 12345678910›».1 \n", + "0 2019-07-16 20:52:18.608min ago 36.07 N \n", + "1 2019-07-16 20:49:09.111min ago 36.07 N \n", + "2 2019-07-16 20:33:52.927min ago 40.09 N \n", + "3 2019-07-16 20:31:33.329min ago 23.45 S \n", + "4 2019-07-16 20:29:07.731min ago 35.86 N \n", + "5 2019-07-16 20:23:34.737min ago 36.07 N \n", + "6 2019-07-16 20:19:00.142min ago 33.10 N \n", + "7 2019-07-16 20:17:51.643min ago 35.55 N \n", + "8 2019-07-16 20:15:36.845min ago 35.78 N \n", + "9 2019-07-16 20:11:01.550min ago 37.82 N \n", + "10 2019-07-16 19:42:25.91hr 18min ago 35.61 N \n", + "11 2019-07-16 19:35:57.01hr 25min ago 35.62 N \n", + "12 2019-07-16 19:23:50.11hr 37min ago 36.19 N \n", + "13 2019-07-16 19:20:21.41hr 40min ago 38.39 N \n", + "14 2019-07-16 19:16:53.81hr 44min ago 38.45 N \n", + "15 2019-07-16 19:16:15.91hr 44min ago 61.27 N \n", + "16 2019-07-16 19:11:48.91hr 49min ago 36.03 N \n", + "17 2019-07-16 19:04:00.21hr 57min ago 35.96 N \n", + "18 2019-07-16 19:01:48.01hr 59min ago 39.56 N \n", + "19 2019-07-16 19:01:00.82hr 00min ago 35.68 N \n", + "20 2019-07-16 18:53:32.02hr 07min ago 0.68 S \n", + "21 2019-07-16 18:50:16.22hr 10min ago 43.62 N \n", + "22 2019-07-16 18:47:48.92hr 13min ago 35.59 N \n", + "23 2019-07-16 18:36:26.82hr 24min ago 35.74 N \n", + "24 2019-07-16 18:22:31.92hr 38min ago 35.65 N \n", + "25 2019-07-16 18:15:26.52hr 45min ago 28.47 N \n", + "26 2019-07-16 18:10:01.02hr 51min ago 34.41 S \n", + "27 2019-07-16 17:48:24.03hr 12min ago 9.93 S \n", + "28 2019-07-16 17:42:29.93hr 18min ago 35.67 N \n", + "29 2019-07-16 17:39:43.03hr 21min ago 0.54 S \n", + "30 2019-07-16 17:31:56.03hr 29min ago 35.67 N \n", + "31 2019-07-16 17:05:45.03hr 55min ago 36.20 N \n", + "32 2019-07-16 17:05:08.03hr 55min ago 15.40 N \n", + "33 2019-07-16 17:01:30.83hr 59min ago 36.10 N \n", + "34 2019-07-16 16:45:56.54hr 15min ago 0.68 S \n", + "35 2019-07-16 16:45:55.04hr 15min ago 18.99 N \n", + "36 2019-07-16 16:43:40.94hr 17min ago 37.23 N \n", + "37 2019-07-16 16:43:21.74hr 17min ago 36.03 N \n", + "38 2019-07-16 16:36:41.54hr 24min ago 35.96 N \n", + "39 2019-07-16 16:28:38.14hr 32min ago 35.92 N \n", + "40 2019-07-16 16:27:59.04hr 33min ago 18.51 S \n", + "41 2019-07-16 16:26:00.54hr 35min ago 30.57 N \n", + "42 2019-07-16 16:21:05.14hr 39min ago 28.45 N \n", + "43 2019-07-16 16:01:04.34hr 59min ago 62.22 N \n", + "44 2019-07-16 15:59:52.05hr 01min ago 35.81 N \n", + "45 2019-07-16 15:57:04.45hr 03min ago 36.10 N \n", + "46 2019-07-16 15:28:58.05hr 32min ago 18.26 S \n", + "47 2019-07-16 15:26:26.65hr 34min ago 35.68 N \n", + "48 2019-07-16 15:25:42.65hr 35min ago 37.16 N \n", + "49 2019-07-16 15:13:22.15hr 47min ago 35.90 N \n", + "50 NaN NaN NaN \n", + "51 12345678910›» 12345678910›» 12345678910›» \n", + "52 NaN NaN NaN \n", + "\n", + " Longitude degrees Region name [+] \n", + " 12345678910›» 12345678910›».1 12345678910›» \n", + "0 117.84 W 2.0 \n", + "1 117.65 W 2.0 \n", + "2 19.91 E 2.7 \n", + "3 66.86 W 4.5 \n", + "4 117.69 W 2.2 \n", + "5 117.84 W 2.0 \n", + "6 12.42 W 2.8 \n", + "7 117.43 W 2.8 \n", + "8 117.62 W 4.5 \n", + "9 121.77 W 4.3 \n", + "10 117.47 W 2.3 \n", + "11 117.45 W 2.1 \n", + "12 117.89 W 2.7 \n", + "13 16.94 E 3.1 \n", + "14 16.91 E 2.6 \n", + "15 152.44 W 2.4 \n", + "16 117.87 W 2.5 \n", + "17 117.71 W 2.0 \n", + "18 67.17 E 3.6 \n", + "19 117.54 W 2.5 \n", + "20 126.36 E 4.0 \n", + "21 75.40 E 3.2 \n", + "22 117.42 W 2.1 \n", + "23 117.56 W 2.7 \n", + "24 117.52 W 2.0 \n", + "25 56.76 E 4.3 \n", + "26 150.73 E 2.4 \n", + "27 118.23 E 4.1 \n", + "28 117.54 W 2.0 \n", + "29 127.86 E 4.1 \n", + "30 117.47 W 2.3 \n", + "31 117.90 W 2.9 \n", + "32 94.64 W 4.2 \n", + "33 117.90 W 2.1 \n", + "34 127.58 E 4.7 \n", + "35 70.09 W 2.9 \n", + "36 28.27 E 2.7 \n", + "37 117.79 W 2.4 \n", + "38 117.30 W 2.1 \n", + "39 117.68 W 2.3 \n", + "40 120.55 E 2.9 \n", + "41 141.98 E 4.8 \n", + "42 56.70 E 4.5 \n", + "43 150.00 W 2.3 \n", + "44 117.63 W 2.9 \n", + "45 117.82 W 3.0 \n", + "46 120.37 E 3.3 \n", + "47 117.51 W 2.0 \n", + "48 141.54 E 4.6 \n", + "49 117.67 W 2.1 \n", + "50 NaN NaN NaN \n", + "51 12345678910›» 12345678910›» 12345678910›» \n", + "52 NaN NaN NaN " + ] + }, + "execution_count": 16, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'https://www.emsc-csem.org/Earthquake/'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#your code" + "url = 'https://www.emsc-csem.org/Earthquake/'\n", + "html = requests.get(url).content\n", + "df_list = pd.read_html(html)\n", + "df_list[3][['Date & Time UTC','Latitude degrees','Longitude degrees','Region name [+]']]" ] }, { @@ -308,21 +5111,88 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 17, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
01
0Code Geist Hackathon by SefrWahed[7/29/2019]
1The Code Factor[5/21/2019]
2TECHFEST MUNICH[9/6/2019]
3Galileo App Competition[1/31/2019]
\n", + "
" + ], + "text/plain": [ + " 0 1\n", + "0 Code Geist Hackathon by SefrWahed [7/29/2019]\n", + "1 The Code Factor [5/21/2019]\n", + "2 TECHFEST MUNICH [9/6/2019]\n", + "3 Galileo App Competition [1/31/2019]" + ] + }, + "execution_count": 17, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url ='https://hackevents.co/hackathons'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#your code" + "import re\n", + "\n", + "url ='https://hackevents.co/hackathons'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html5lib')\n", + "\n", + "hacks_titles = soup_html.find_all('h5',{'class':'card-title'})\n", + "hacks_fechas = soup_html.find_all('p',{'class':'card-text'})\n", + "\n", + "hacks_list = [[j.text,re.findall(r'\\d+/\\d+/\\d+',hacks_fechas[i].text)] for i,j in enumerate(hacks_titles)]\n", + "#hacks_list\n", + "\n", + "df = pd.DataFrame(hacks_list)\n", + "df" ] }, { @@ -342,22 +5212,47 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 26, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdin", + "output_type": "stream", + "text": [ + "Ingresa tu usuario de twitter: paolalean\n" + ] + } + ], "source": [ "# This is the url you will scrape in this exercise \n", "# You will need to add the account credentials to this url\n", - "url = 'https://twitter.com/'" + "usuario = input('Ingresa tu usuario de twitter: ')\n", + "url = f'https://twitter.com/{usuario}'\n", + "#para prueba de cuenta sin tweets usar la de victor: vik54076455" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 30, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "307\n" + ] + } + ], "source": [ - "#your code" + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')\n", + "tweets = soup_html.find_all('span',{'class':'ProfileNav-value'})\n", + "\n", + "try:\n", + " print(int(tweets[0].text))\n", + "except:\n", + " print(\"no tienes tweets\")\n" ] }, { @@ -377,22 +5272,38 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 34, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdin", + "output_type": "stream", + "text": [ + "Ingresa tu usuario de twitter: paolalean\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Tienes la increíble cantidad de 27 followers\n" + ] + } + ], "source": [ "# This is the url you will scrape in this exercise \n", "# You will need to add the account credentials to this url\n", - "url = 'https://twitter.com/'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#your code" + "usuario = input('Ingresa tu usuario de twitter: ')\n", + "url = f'https://twitter.com/{usuario}'\n", + "\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')\n", + "tweets = soup_html.find_all('span',{'class':'ProfileNav-value'})\n", + "\n", + "try:\n", + " print(f\"Tienes la increíble cantidad de {int(tweets[1].text)} followers\")\n", + "except:\n", + " print(\"Sin followers\")" ] }, { @@ -404,12 +5315,42 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 48, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "[['The Free Encyclopedia', '5892000'],\n", + " ['English', '1159000'],\n", + " ['日本語', '1532000'],\n", + " ['Español', '2323000'],\n", + " ['Deutsch', '1556000'],\n", + " ['Русский', '2123000'],\n", + " ['Français', '1541000'],\n", + " ['Italiano', '1065000'],\n", + " ['中文', '1010000'],\n", + " ['Português', '1346000'],\n", + " ['Polski', '1000000'],\n", + " ['Wikipedia apps are now available:', '100000']]" + ] + }, + "execution_count": 48, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'https://www.wikipedia.org/'" + "url = 'https://www.wikipedia.org/'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')\n", + "\n", + "language = soup_html.find_all('strong')\n", + "number = soup_html.find_all('bdi')\n", + "\n", + "lista = [[j.text,''.join(re.findall('\\d+', number[i].text))] for i,j in enumerate(language)]\n", + "lista" ] }, { @@ -430,21 +5371,40 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 52, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "['Business and economy',\n", + " 'Crime and justice',\n", + " 'Defence',\n", + " 'Education',\n", + " 'Environment',\n", + " 'Government',\n", + " 'Government spending',\n", + " 'Health',\n", + " 'Mapping',\n", + " 'Society',\n", + " 'Towns and cities',\n", + " 'Transport']" + ] + }, + "execution_count": 52, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'https://data.gov.uk/'" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "#your code " + "url = 'https://data.gov.uk/'\n", + "html = requests.get(url).content\n", + "soup_html = BeautifulSoup(html,'html')\n", + "\n", + "datasets = soup_html.find_all('h2')\n", + "datas = [d.text for d in datasets]\n", + "datas" ] }, { @@ -456,12 +5416,135 @@ }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], + "execution_count": 57, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
RankLanguageSpeakers(millions)
0Chinese (macrolanguage)1311.0
11Mandarin918.0
22Spanish460.0
33English379.0
44Hindi341.0
5Arabic (macrolanguage)319.0
65Bengali228.0
76Portuguese221.0
87Russian154.0
98Japanese128.0
10Lahnda (macrolanguage)119.0
\n", + "
" + ], + "text/plain": [ + " Rank Language Speakers(millions)\n", + "0 — Chinese (macrolanguage) 1311.0\n", + "1 1 Mandarin 918.0\n", + "2 2 Spanish 460.0\n", + "3 3 English 379.0\n", + "4 4 Hindi 341.0\n", + "5 — Arabic (macrolanguage) 319.0\n", + "6 5 Bengali 228.0\n", + "7 6 Portuguese 221.0\n", + "8 7 Russian 154.0\n", + "9 8 Japanese 128.0\n", + "10 — Lahnda (macrolanguage) 119.0" + ] + }, + "execution_count": 57, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# This is the url you will scrape in this exercise\n", - "url = 'https://en.wikipedia.org/wiki/List_of_languages_by_number_of_native_speakers'" + "url = 'https://en.wikipedia.org/wiki/List_of_languages_by_number_of_native_speakers'\n", + "html = requests.get(url).content\n", + "\n", + "df_read_tables = pd.read_html(html)\n", + "df_read_tables[0][['Rank','Language','Speakers(millions)']].head(11)\n" ] }, { @@ -608,5 +5691,5 @@ } }, "nbformat": 4, - "nbformat_minor": 2 + "nbformat_minor": 4 }