"""Print the href target of every anchor tag found on a web page.

Run as a script, this downloads at most ``MAX_BYTES`` bytes of ``PAGE_URL``,
extracts the ``href`` value of each ``<a href="...">...</a>`` element with a
regular expression, and prints one value per line.

The code runs on both Python 2 and Python 3.
"""

import re
import urllib

try:
    # Python 3 moved urlopen into the urllib.request submodule.
    from urllib.request import urlopen
except ImportError:
    # Python 2: urlopen lives directly on the urllib module.
    urlopen = urllib.urlopen

PAGE_URL = "http://www.75271.com"
MAX_BYTES = 200000

# Limitations of this pattern (kept unchanged so the output stays the same):
#   * ``href`` must be the first attribute, right after ``<a `` ;
#   * ``.`` does not match a newline, so the opening tag, link text and
#     ``</a>`` must all sit on one line;
#   * if other attributes follow ``href``, they end up inside the captured
#     value, because the group runs up to the first ``">``.
LINK_PATTERN = re.compile(r'<a href="(.*?)">.*?</a>')


def extract_links(html):
    """Return the href values of the anchor tags in *html*, in document order.

    Args:
        html: Page markup as a text string.

    Returns:
        A list of strings, one per match of ``LINK_PATTERN``; empty when
        nothing matches.
    """
    return LINK_PATTERN.findall(html)


def fetch_page(url=PAGE_URL, max_bytes=MAX_BYTES):
    """Download up to *max_bytes* bytes of *url* and return them as ``str``.

    Args:
        url: Address of the page to download.
        max_bytes: Upper bound on the number of bytes read from the response.

    Returns:
        The payload as the interpreter's native ``str`` type.

    Raises:
        Whatever ``urlopen`` or ``read`` raises on a network failure; errors
        are deliberately not swallowed.
    """
    response = urlopen(url)
    try:
        raw = response.read(max_bytes)
    finally:
        # Always release the connection, even when the read fails.
        response.close()
    if not isinstance(raw, str):
        # Python 3 returns bytes, which a str pattern cannot search.
        # NOTE(review): UTF-8 is assumed; the page's declared charset is not
        # inspected. Undecodable bytes (including a multi-byte character cut
        # off by the size limit) become replacement characters.
        raw = raw.decode("utf-8", "replace")
    return raw


def main():
    """Fetch the configured page and print each extracted link on its own line."""
    for link in extract_links(fetch_page()):
        # Single-argument print(...) behaves the same on Python 2 and 3.
        print(link)


if __name__ == "__main__":
    main()