浏览代码

Refactoring scraper.py: Adding method for retrieving HTML content

David Leonard 10 年之前
父节点
当前提交
724f3988ce
共有 1 个文件被更改,包括 16 次插入和 0 次删除
  1. 16 0
      hackathon_starter/hackathon/scripts/scraper.py

+ 16 - 0
hackathon_starter/hackathon/scripts/scraper.py

@@ -7,6 +7,22 @@ import requests
 import itertools 
 from bs4 import BeautifulSoup
 
+def fetchHTML(url):
+	'''
+	Returns HTML retrieved from a URL.
+
+	Parameters:
+		url: String
+			- The URL to fetch HTML from
+
+	Returns:
+		html: String
+			- The HTML from a given URL
+	'''
+	req = requests.get(url)
+	html = req.text
+	return html
+
 def steamDiscounts():
 	req = requests.get('http://store.steampowered.com/search/?specials=1#sort_by=_ASC&sort_order=ASC&specials=1&page=1')
 	content = req.text