Python爬虫,,#Author:xu
Python爬虫,,#Author:xu
# Author: xuesong li
#
# Fetches the same two pages twice -- first one after the other, then
# concurrently in gevent greenlets -- and prints the elapsed time of each run.
import gevent
from gevent import monkey

# Patch the standard library BEFORE urllib is imported, so that its blocking
# socket calls become cooperative and the greenlets can overlap their waits.
monkey.patch_all()

from urllib.request import urlopen
import time


def pa_web_page(url):
    """Download ``url``, save the raw body to the file ``test`` and report its size.

    Args:
        url: Address of the page to fetch.

    Note:
        The output file is opened in truncating mode, so every call replaces
        whatever an earlier call stored there.
    """
    print("GET url", url)
    # Context manager closes the HTTP response even if read() fails.
    with urlopen(url) as response:
        data = response.read()
    print(data)
    # read() returns bytes, so the file has to be opened in binary mode, and
    # the payload must be written (the original called f.read on a write handle).
    with open("test", "wb") as f:
        f.write(data)
    print('%d bytes received from %s.' % (len(data), url))


# Run 1: sequential downloads.
t_start = time.time()
pa_web_page("http://www.autohome.com.cn/beijing/")
pa_web_page("http://www.xiaohuar.com/")
print("time cost:", time.time() - t_start)

# Run 2: the same downloads, each in its own greenlet.
t2_start = time.time()
gevent.joinall([
    # gevent.spawn(pa_web_page, 'https://www.python.org/'),
    gevent.spawn(pa_web_page, 'http://www.autohome.com.cn/beijing/'),
    gevent.spawn(pa_web_page, 'http://www.xiaohuar.com/'),
    # gevent.spawn(pa_web_page, 'https://github.com/'),
])
print("time cost t2:", time.time() - t2_start)
Python爬虫
评论关闭