From 69b7d37fd1f5749ab4e3696e804ef4ec91a9669d Mon Sep 17 00:00:00 2001
From: SREERAM KEERTHAN PARUCHURU <cb.en.u4cse16249@cb.students.amrita.edu>
Date: Wed, 30 Jan 2019 13:05:55 +0530
Subject: [PATCH] beautiful soup

---
Note: the script body was revised during review (no-op statements removed,
request timeout and status check added); the blob id on the "index" line
below predates that revision.

 reguestss.py | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)
 create mode 100644 reguestss.py

diff --git a/reguestss.py b/reguestss.py
new file mode 100644
index 0000000..cb05eef
--- /dev/null
+++ b/reguestss.py
@@ -0,0 +1,22 @@
+"""Fetch a sample page and walk its top-level parse tree with BeautifulSoup."""
+import requests
+from bs4 import BeautifulSoup
+
+URL = "http://dataquestio.github.io/web-scraping-pages/simple.html"
+
+# A timeout keeps the script from hanging forever on a stalled connection.
+page = requests.get(URL, timeout=10)
+# Fail loudly on a 4xx/5xx response instead of parsing an error page.
+page.raise_for_status()
+
+soup = BeautifulSoup(page.content, "html.parser")
+
+# Materialise the top-level nodes once and reuse the list below.
+top_level = list(soup.children)
+print([type(item) for item in top_level])
+
+# NOTE(review): index 2 is presumably the <html> tag (after the doctype and a
+# newline) and index 3 its <body> child; confirm against the fetched page.
+html = top_level[2]
+body = list(html.children)[3]
+print(body)
-- 
GitLab