#encoding=utf-8
"""Collect the sites linked from the wooyun.org "corps" listing pages.

Each listing page is downloaded, the targets of its http:// and https://
links are extracted with regular expressions, and the collected values are
written one per line to a text file.
"""
import re

import requests

# Capture whatever follows the scheme inside an href="..." attribute.
_HTTP_LINK = re.compile(r'href="http://(.*?)"')
_HTTPS_LINK = re.compile(r'href="https://(.*?)"')


class GetUrl(object):
    """Scrape link targets from the paginated listing and save them to disk."""

    def __init__(self, num):
        """Remember how many listing pages to fetch and build the headers.

        Args:
            num: Number of the last listing page to request (pages are
                numbered starting at 1).
        """
        self.totle = num
        # Request header information sent with every page fetch.
        self.myheader = {
            'Host': 'www.wooyun.org',
            'Connection': 'keep-alive',
            'user-agent': 'mozilla/5.0 (Windows NT 6.1) applewebkit/537.36 (khtml, like Gecko) chrome/46.0.2490.80 safari/537.36',
            'Accept': '*/*',
            'Referer': 'http://www.wooyun.com/',
            'accept-encoding': 'gzip, deflate, SDCH',
            'Accept-language': 'zh-cn,zh;q=0.8',
        }

    def beginer(self):
        """Fetch pages 1..self.totle and write every link target found.

        The results are written to 'Site.text' in the current working
        directory, replacing any previous content of that file.
        """
        print('Get Start')
        urlliset = []
        for page in range(1, self.totle + 1):
            url = 'http://www.wooyun.org/corps/page/' + str(page)
            r = requests.get(url, headers=self.myheader)
            # Keep the per-page order: http:// targets first, then https://.
            urlliset.extend(_HTTP_LINK.findall(r.text))
            urlliset.extend(_HTTPS_LINK.findall(r.text))
        self.writeqq(text=urlliset, file_dir='Site.text', mode='w')

    def writeqq(self, text, file_dir, mode):
        """Write each string in ``text`` to ``file_dir`` on its own line.

        Args:
            text: Iterable of strings to write.
            file_dir: Path of the output file.
            mode: Mode string passed straight to ``open`` (e.g. 'w' or 'a').
        """
        with open(file_dir, mode) as f:
            for site in text:
                f.write(site + "\n")


if __name__ == '__main__':
    spidre = GetUrl(44)
    spidre.beginer()
# Small Python script that collects vendor site URLs from WooYun.