# 清华大佬耗费三个月吐血整理的几百G的资源,免费分享!....>>>
import re
import urllib.request


def getUrl(url):
    """Fetch ``url`` and return the response body decoded as UTF-8 text.

    Args:
        url: Address handed unchanged to ``urllib.request.urlopen``.

    Returns:
        The complete response body as a ``str``.

    Raises:
        UnicodeDecodeError: If the body is not valid UTF-8.
        Any exception raised by ``urllib.request.urlopen`` (for example
        ``urllib.error.URLError``) propagates unchanged.
    """
    # The context manager closes the response even when read() or decode()
    # fails, so the underlying connection is never leaked.
    with urllib.request.urlopen(url) as page:
        return page.read().decode('utf-8')


def getHtnlList(html):
    """Return the compiled regular expression used by this script.

    Args:
        html: Page text. It is accepted but not used by this function.

    Returns:
        The ``re.Pattern`` compiled from the pattern string below.

    NOTE(review): the name and the ``html`` parameter suggest the pattern was
    meant to be applied to ``html`` (e.g. with ``findall``) -- confirm the
    intent before changing the return value, since callers may rely on
    receiving the compiled pattern.
    """
    # NOTE(review): this literal looks like a placeholder to be replaced with
    # a real pattern -- confirm.
    reg = r'正则表达式'
    reglist = re.compile(reg)
    return reglist


if __name__ == "__main__":
    # Guarded so that importing this module does not trigger a network fetch.
    # NOTE(review): the URL literal looks like a placeholder -- confirm.
    html = getUrl("网址")
    # The original called an undefined name ``getHtml`` here (NameError);
    # ``getHtnlList`` is the only matching function defined in this file.
    getHtnlList(html)