广度优先爬取数据 from bs4 import BeautifulSoup import urllib.request class Queue: def __init__(self): self.st=[] def fetch(self): return self.st.pop(0) def enter(self,obj): self.st.append(obj) def empty(self): return len(self.st)==0 def spider(url): queue=Queue() queue.enter(url) while not queue.empty(): url=queue.fetch() try: data=urllib.request.urlopen(url) data=data.read() data=data.decode() soup=BeautifulSoup(data,"lxml") print(soup.find("h3").text) links=soup.select("a") for link in links: __________________ url=start_url+"/"+href _____________________ except Exception as err: print(err) start_url="https://127.0.0.1:5000" spider(start_url) print("The End")