Skip to content

Commit 6efd56e

Browse files
committed
7.4
1 parent c44a777 commit 6efd56e

File tree

8 files changed

+26043
-107
lines changed

8 files changed

+26043
-107
lines changed

.idea/Python.iml

Lines changed: 1 addition & 1 deletion
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

.idea/encodings.xml

Lines changed: 4 additions & 0 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

.idea/misc.xml

Lines changed: 1 addition & 1 deletion
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

.idea/workspace.xml

Lines changed: 74 additions & 83 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

douban.py

Lines changed: 38 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,38 @@
1+
# Fetch the whole JSON payload from the Douban chart API, extract the wanted
# fields of every movie, and append them to a local file.
import requests
import json

# Chart endpoint queried by this script (type=11, first 20 entries).
TOP_LIST_URL = "https://movie.douban.com/j/chart/top_list?type=11&interval_id=100%3A90&action=&start=0&limit=20"
OUTPUT_PATH = "douban.json"

# A timeout keeps the script from hanging forever on a stalled connection,
# and raise_for_status() surfaces HTTP errors instead of trying to parse an
# error page as JSON.
response = requests.get(TOP_LIST_URL, timeout=10)
response.raise_for_status()
py_data = response.json()

# Open the output file once for the whole run instead of once per movie.
with open(OUTPUT_PATH, "a", encoding="utf-8") as f:
    for i in py_data:
        items = {
            '电影名称': i['title'],
            '上映地区': i['regions'],
            '评分': i['score'],
            '上映时间': i['release_date'],
        }
        # One JSON object per line (JSON Lines). The previous ".\n" suffix
        # put a stray period after every object, so no line could be parsed
        # back with json.loads().
        content = json.dumps(items, ensure_ascii=False) + "\n"
        f.write(content)
        print(content)
14+
15+
16+
17+
18+
19+
20+
21+
22+
23+
24+
25+
26+
# import requests
27+
# import json
28+
# response=requests.get("http://image.baidu.com/pv/pv.gif?dsp=pc&tn=result&hs=2&type=prerequire&t=1556545641129")
29+
# py_data=json.loads(response.text)
30+
# for i in py_data:
31+
# print(i)
32+
# # print(items)
33+
# # content=json.dumps(items,ensure_ascii=False)+".\n"
34+
# # with open("douban.json" , "a" , encoding="utf-8") as f:
35+
# # f.write(content)
36+
# # print(content)
37+
38+

readFile.py

Lines changed: 40 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,23 +1,54 @@
1+
2+
# from time import sleep
3+
# from selenium import webdriver
4+
#
5+
# def getFile(url):
6+
# #实例化一个浏览器驱动
7+
# chrome = webdriver.Chrome()
8+
#
9+
# #访问页面
10+
# chrome.get(url)
11+
# #捕获元素
12+
#
13+
# texts = chrome.find_elements_by_xpath("//div[@class='content']/p")
14+
# for t in texts:
15+
# print(t.text)
16+
# sleep(1)
17+
# next_url = chrome.find_elements_by_xpath("//a[@class='nextchapter']")
18+
# if next_url:
19+
# next_urls = next_url[0].get_attribute("href")
20+
# getFile(next_urls)
21+
# else:
22+
# chrome.close()
23+
# return
24+
# #关闭浏览器
25+
##################################################################
26+
127
from time import sleep
228
from selenium import webdriver
329

4-
def getFile(url):
30+
def getFile(chrome, url, output_path="1.txt", delay=1):
    """Crawl a chain of chapter pages and append their text to a file.

    Starting at *url*, the heading (``//div[@class='bg']/h1``) and the body
    paragraphs (``//div[@class='content-body']/p``) of each page are appended
    to *output_path*, one per line. The crawl then follows the link whose id
    is ``xiayipian`` and stops when a page has no such link, the link has no
    ``href``, or it points at a page that was already visited.

    Args:
        chrome: WebDriver-like object providing ``get(url)``,
            ``find_elements(by, value)`` and ``close()``.
        url: Address of the first page to fetch.
        output_path: File the text is appended to (UTF-8).
        delay: Seconds to pause after each page before following the link.

    Returns:
        None. The browser window is closed before returning, including when
        an error interrupts the crawl.
    """
    title_xpath = "//div[@class='bg']/h1"
    body_xpath = "//div[@class='content-body']/p"
    next_xpath = "//a[@id='xiayipian']"

    # Iterate instead of recursing once per chapter: a long book would
    # otherwise exceed Python's recursion limit.
    visited = set()
    try:
        # Explicit UTF-8 so the text is written the same way on every
        # platform, whatever the locale's default encoding is.
        with open(output_path, "a", encoding="utf-8") as f:
            while url and url not in visited:
                visited.add(url)
                chrome.get(url)

                # find_elements(by, value) is the generic locator call; the
                # find_elements_by_* helpers no longer exist in Selenium 4.3+.
                titles = chrome.find_elements("xpath", title_xpath)
                paragraphs = chrome.find_elements("xpath", body_xpath)

                # A page without a heading is still saved rather than
                # aborting the whole crawl with an IndexError.
                if titles:
                    f.write(titles[0].text + "\n")
                f.writelines(p.text + "\n" for p in paragraphs)
                # Keep finished chapters on disk even if a later page fails.
                f.flush()

                sleep(delay)

                next_links = chrome.find_elements("xpath", next_xpath)
                url = next_links[0].get_attribute("href") if next_links else None
    finally:
        chrome.close()
2351
#关闭浏览器
52+
if __name__ == '__main__':
    # Script entry point: start a Chrome session and crawl from the first
    # chapter page.
    first_page = "http://seputu.com/biji2/127.html"
    browser = webdriver.Chrome()
    getFile(browser, first_page)

selenium使用.py

Lines changed: 34 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -1,16 +1,37 @@
1+
# from selenium import webdriver
2+
#
3+
# #实例化一个浏览器驱动
4+
# chrome = webdriver.Chrome()
5+
#
6+
# #访问页面
7+
# chrome.get("https://www.baidu.com/")
8+
# #捕获元素
9+
# inputs = chrome.find_element_by_id("kw")
10+
# #对元素进行操作
11+
# inputs.send_keys("老边饺子")
12+
# button = chrome.find_element_by_id("su")
13+
# button.click()
14+
# #关闭浏览器
15+
# chrome.close()
16+
##########################################################
117
from selenium import webdriver
2-
3-
#实例化一个浏览器驱动
18+
import time
419
# Module-level Chrome driver, created as soon as the script runs; qqzone()
# reads it as a global.
chrome = webdriver.Chrome()
5-
6-
#访问页面
7-
chrome.get("https://www.baidu.com/")
8-
#捕获元素
9-
inputs = chrome.find_element_by_id("kw")
10-
#对元素进行操作
11-
inputs.send_keys("老边饺子")
12-
button = chrome.find_element_by_id("su")
13-
button.click()
20+
def qqzone():
    """Open the QQ login page, click through it and print the app list.

    Uses the module-level ``chrome`` driver. The steps are: load the login
    page, click the first element with class ``face``, click the element
    with id ``aAppstore``, then print the text of every element with class
    ``my-app-list-item``.

    Raises:
        IndexError: If the login page shows no element with class ``face``.
    """
    # Visit the login page.
    chrome.get("https://xui.ptlogin2.qq.com/cgi-bin/xlogin?proxy_url=https%3A//qzs.qq.com/qzone/v6/portal/proxy.html&daid=5&&hide_title_bar=1&low_login=0&qlogin_auto_login=1&no_verifyimg=1&link_target=blank&appid=549000912&style=22&target=self&s_url=https%3A%2F%2Fqzs.qq.com%2Fqzone%2Fv5%2Floginsucc.html%3Fpara%3Dizone&pt_qr_app=手机QQ空间&pt_qr_link=https%3A//z.qzone.com/download.html&self_regurl=https%3A//qzs.qq.com/qzone/v6/reg/index.html&pt_qr_help_link=https%3A//z.qzone.com/download.html&pt_no_auth=0")
    time.sleep(1)

    # Locate the elements. find_element(s)(by, value) is the generic locator
    # call; the find_element(s)_by_* helpers no longer exist in Selenium 4.3+.
    faces = chrome.find_elements("class name", "face")
    if not faces:
        # Same exception type as indexing the empty list, with a clearer
        # message.
        raise IndexError("no element with class 'face' found on the login page")

    # Act on the elements.
    faces[0].click()
    time.sleep(1)
    chrome.find_element("id", "aAppstore").click()

    # find_elements returns a list, which has no .text attribute of its own;
    # print the text of each matching item instead.
    for app_item in chrome.find_elements("class name", "my-app-list-item"):
        print(app_item.text)
33+
# Run the QQ-zone flow immediately when this script is executed.
qqzone()
34+
# nongchang()
35+
# time.sleep(100)
1436
#关闭浏览器
15-
chrome.close()
16-
37+
# chrome.close()

0 commit comments

Comments
 (0)