Commit dabf7132 authored by Everardo Gonzalez

changed html parser

parent bb9f5ca3
......@@ -36,8 +36,9 @@
"source": [
"# look for html class \"filename\" in URL and try download\n",
"soup = BeautifulSoup(html, \"lxml\")\n",
"# soup = BeautifulSoup(html, \"lxml\")\n",
"soup = BeautifulSoup(html, \"html.parser\") # works better \n",
"for link in soup.select('a.filename'):\n",
" href = link.get('href')\n",
