寫好了所有的程序,運行遇到bug,不知道怎么改
# -*- coding: utf-8 -*-
"""Crawler entry point: wires the baike_moon components into one crawl loop."""
from baike_moon import html_downloader, html_parser, html_outputer, url_manager


class SpiderMain(object):
    """Coordinate the URL manager, downloader, parser and outputer."""

    def __init__(self):
        """Create one instance of each collaborating component."""
        self.urls = url_manager.UrlManager()
        self.downloader = html_downloader.HtmlDownloader()
        self.parser = html_parser.HtmlParser()
        self.outputer = html_outputer.HtmlOutputer()

    def craw(self, root_url, max_pages=1000):
        """Crawl starting from ``root_url`` and write the collected data.

        Args:
            root_url: First URL handed to the URL manager.
            max_pages: Stop after this many pages have been processed.
                The limit is checked after a page is handled, so one page
                is always processed when the queue is non-empty.
        """
        count = 1
        self.urls.add_new_url(root_url)
        # NOTE: there is deliberately no try/except around the loop body, so
        # a failure in any component surfaces with its full traceback.
        while self.urls.has_new_url():
            new_url = self.urls.get_new_url()
            # Parenthesised single-argument form prints the same text on
            # both Python 2 and Python 3.
            print('craw %d:%s' % (count, new_url))
            html_cont = self.downloader.download(new_url)
            # parse() must return a (new_urls, new_data) pair; the tuple
            # unpacking below fails if it returns anything else.
            new_urls, new_data = self.parser.parse(new_url, html_cont)
            self.urls.add_new_urls(new_urls)
            self.outputer.collect_data(new_data)

            if count >= max_pages:
                break
            count = count + 1

        self.outputer.output_html()


if __name__ == "__main__":
    root_url = "http://baike.baidu.com/view/21087.htm"
    obj_spider = SpiderMain()
    obj_spider.craw(root_url)
報錯:
pydev_imports.execfile(file, globals, locals)  # execute the script
  File "E:\eclipse python\????\baike_moon\spider_main.py", line 38, in <module>
    obj_spider.craw(root_url)
  File "E:\eclipse python\????\baike_moon\spider_main.py", line 22, in craw
    new_urls,new_data = self.parser.parse(new_url,html_cont)
TypeError: 'set' object is not callable
2016-03-30
我找到我的原因了:在manager里面有字母打錯了,造成錯誤。你去查查你的代碼是不是有哪兒地方字母打的不對。
2016-03-30
同問啊 一模一樣的錯誤 求助啊
2016-03-08
2016-03-08
同問,不過我的錯誤是TypeError: 'NoneType' object is not iterable
2016-02-25
看一下html_parser文件有沒有加 urlparse 和 re