background image
self.links[text] = self.link
fp = urllib.urlopen("http://list.taobao.com/browse/cat-0.htm")
data = fp.read()
fp.close()
linkdemo = GetLinks()
linkdemo.feed(data)
linkdemo.close()
for href, link in linkdemo.links.items():
href = href.decode('gb2312').encode('utf-8')
print href, '-', link
pass
“- http://ju.atpanel.com/?url=http://list.taobao.com/market/baihuo.htm?spm=1.47613.90750.”这样的列表
2,下载豆瓣图片【多线程】:
# -*- coding: UTF-8 -*-
from HTMLParser import HTMLParser
import htmllib,urllib,formatter,string
import os,sys,time
import threading
'''
Created on 2012-10-09
@author: xing.gexing
'''
#建立线程池,并启动线程直到结束
def parallel(urls):
startTime = time.time()
threads=[]