依赖:Python、BeautifulSoup
主文件:spider_main.py
1  | # -*- coding:utf-8 -*-  | 
网页下载器:html_downloder.py
1  | # -*- coding:utf-8 -*-  | 
网页解析器:html_parser.py
1  | # -*- coding:utf-8 -*-  | 
URL管理器:url_manager.py
1  | # -*- coding:utf-8 -*-  | 
定义路径,输出结果
1  | 
  | 

1  | # -*- coding:utf-8 -*-  | 
1  | # -*- coding:utf-8 -*-  | 
1  | # -*- coding:utf-8 -*-  | 
1  | # -*- coding:utf-8 -*-  | 
1  | 
  | 
