依赖:Python、BeautifulSoup
主文件:spider_main.py
1 | # -*- coding:utf-8 -*- |
网页下载器:html_downloder.py
1 | # -*- coding:utf-8 -*- |
网页解析器:html_parser.py
1 | # -*- coding:utf-8 -*- |
URL管理器:url_manager.py
1 | # -*- coding:utf-8 -*- |
定义输出路径并输出结果
1 |
|
1 | # -*- coding:utf-8 -*- |
1 | # -*- coding:utf-8 -*- |
1 | # -*- coding:utf-8 -*- |
1 | # -*- coding:utf-8 -*- |
1 |
|