File tree Expand file tree Collapse file tree 5 files changed +12
-131
lines changed Expand file tree Collapse file tree 5 files changed +12
-131
lines changed Load Diff This file was deleted.
Original file line number Diff line number Diff line change 1
1
import time
2
- from page_parsing import url_list
2
+ from tc_itemInfo import url_list
3
3
4
4
while True :
5
5
print url_list .find ().count ()
Original file line number Diff line number Diff line change 1
1
# coding:utf-8
2
2
from multiprocessing import Pool
3
- from channel_extact import channel_list
3
+ from tc_urlLists import channel_list
4
4
from page_parsing import get_links_from
5
5
6
6
def get_all_links_from (channel ):
Load Diff This file was deleted.
Original file line number Diff line number Diff line change 1
1
# pythonSpider
2
- some python spiders with BeautifulSoup
2
+ Some Python spiders built with BeautifulSoup & requests
3
3
4
- ## [ githubSpider ] ( github )
5
- - 爬取关注或粉丝列表 [ followXXXList] ( github/github_followXXXList.py )
6
- - 爬取用户个人信息 [ userInfo] ( github/github_userInfo.py )
4
+ ## [github](github)
5
+ - 爬取关注或粉丝列表 [followXXXList.py](github/github_followXXXList.py)
6
+ - 爬取用户个人信息 [userInfo.py](github/github_userInfo.py)
7
7
8
- ## 58同城Spider
8
+ ## [58同城](58tongcheng)
9
+ - 获取所有的二级菜单列表 [tc_urlLists.py](58tongcheng/tc_urlLists.py)
10
+ - 获取每一个url下的具体信息 [tc_itemInfo.py](58tongcheng/tc_itemInfo.py)
9
11
12
+ ## [豆瓣](douban)
13
+ - 获取单个电影的短评 [douban_comment.py](douban/douban_comment.py)
14
+ - 获取单个电影的所有大图海报 [douban_photosR.py](douban/douban_photosR.py)
You can’t perform that action at this time.
0 commit comments