[Python]代码
import os
import re
import time
import urllib.request
import webbrowser as web


def spider(url, urlpattern):
    """Open every link on the page at *url* that matches *urlpattern*.

    Args:
        url: Address of the page to scan for links.
        urlpattern: Regular expression handed to ``getURLs``; each match is
            passed to ``visitURL``.
    """
    for link in getURLs(url, urlpattern):
        visitURL(link)


def visitURL(url):
    """Open *url* in a new browser window, then pause for five seconds.

    Args:
        url: The link to open. A single trailing quote character (left over
            when the pattern captures the closing quote of an ``href``
            attribute) is removed first.
    """
    # Only strip when a quote is really there; chopping the last character
    # unconditionally would corrupt URLs captured without the closing quote.
    if url[-1:] in ('"', "'"):
        url = url[:-1]
    print(url)
    web.open(url, 1, False)  # new=1: new window; autoraise=False
    time.sleep(5)  # pause before the next link is opened


def getURLs(url, urlpattern):
    """Return the distinct matches of *urlpattern* in the page at *url*.

    Args:
        url: Address of the page to download.
        urlpattern: Regular expression (as text) applied to the page source.

    Returns:
        A list of the unique ``re.findall`` results, in order of first
        appearance.
    """
    # The context manager closes the connection even if reading fails.
    with urllib.request.urlopen(url) as response:
        charset = response.headers.get_content_charset() or "utf-8"
        raw = response.read()
    try:
        html = raw.decode(charset, errors="replace")
    except LookupError:
        # The server announced a codec Python does not know.
        html = raw.decode("utf-8", errors="replace")
    # dict.fromkeys de-duplicates while keeping a deterministic order.
    return list(dict.fromkeys(re.findall(urlpattern, html)))


def main():
    """Run nine refresh rounds over every configured blog page."""
    # Maps page URL -> regex selecting the links to open on that page.
    # The key is the original placeholder ("fill in your blog's address
    # here"). The pattern is only an example that captures absolute links
    # together with their closing quote - replace both with real values.
    urls = {
        "这里填写你blog的地址": r'href="(https?://[^"]+")',
    }
    for i in range(1, 10):
        for url, urlpattern in urls.items():
            spider(url, urlpattern)
        print("Blogs has been refreshed for ", i, " times")
        # NOTE(review): the original indentation was lost; this assumes the
        # browser is killed once per round so windows do not pile up.
        # Windows-only command.
        os.system("taskkill /F /IM chrome.exe")


if __name__ == "__main__":
    main()
原创文章,作者:ItWorker,如若转载,请注明出处:https://blog.ytso.com/8084.html