# This Python class searches a web page for links without using BeautifulSoup.
import urllib
import re
class Crawl:
    """Fetch a web page and print the targets of its ``<a href=...>`` links.

    Links are located with a regular expression rather than an HTML parser,
    so only the ``href`` attribute of opening ``<a>`` tags is recognised.
    """

    # Class-level default; every instance overrides it with its own value
    # in __init__, so separate crawlers no longer overwrite each other's URL.
    url = ""

    # Matches the href attribute inside an opening <a ...> tag. The value may
    # be double-quoted (group 1), single-quoted (group 2) or bare (group 3).
    # "[^>]*?" keeps the match inside a single tag, so several anchors on one
    # line are all found and nested markup in the link text is never captured.
    _HREF_RE = re.compile(
        r"""<a\b[^>]*?\shref\s*=\s*(?:"([^"]*)"|'([^']*)'|([^\s"'>]+))""",
        re.IGNORECASE
    )

    def __init__(self, url):
        """Remember the address of the page to crawl.

        Args:
            url: Address of the page whose links should be listed.
        """
        self.url = url

    def getURL(self):
        """Print the URL this crawler was created with."""
        print(self.url)

    def links(self):
        """Download the page at ``self.url`` and print one link target per line."""
        for href in self._extract_links(self._fetch()):
            print(href)

    def _fetch(self):
        """Return the body of the page at ``self.url`` as text."""
        # Imported here because urlopen lives in a different module on
        # Python 2 and Python 3, and the file-level "import urllib" alone
        # does not provide it on Python 3.
        try:
            from urllib.request import urlopen  # Python 3
        except ImportError:
            from urllib import urlopen  # Python 2

        response = urlopen(self.url)
        try:
            raw = response.read()
        finally:
            # Always release the connection, even if reading fails.
            response.close()

        # On Python 3 read() yields bytes, which the text pattern cannot
        # search; on Python 2 it is already a str and is left untouched.
        if not isinstance(raw, str):
            raw = raw.decode("utf-8", "replace")
        return raw

    @staticmethod
    def _extract_links(html):
        """Return the href values of all ``<a>`` tags in *html*, in order.

        Args:
            html: Page markup as a text string.

        Returns:
            A list of href values with surrounding quotes and whitespace
            removed. Empty href values are skipped.
        """
        found = []
        for double_quoted, single_quoted, bare in Crawl._HREF_RE.findall(html):
            # Exactly one alternative of the pattern matched; the other
            # groups are empty strings.
            href = (double_quoted or single_quoted or bare).strip()
            if href:
                found.append(href)
        return found
# Script entry: build a crawler for the sample site and print its links.
crawl = Crawl(url="http://www.sachinpuri.com")
crawl.links()
