Skip to content

Commit 3ad7044

Browse files
committed
commit code
1 parent b8ae9ba commit 3ad7044

File tree

1 file changed

+29
-0
lines changed

1 file changed

+29
-0
lines changed

chaoxi/craw_weibo/craw_weibo.py

Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
"""Scrape a Weibo search-result page with Selenium.

The script opens Weibo in Chrome, loads one fixed search-result URL, prints
the inner HTML of the first few post texts, prints how many post images were
found, lists the ``src`` of the first few images, and finally downloads those
images into the ``downloads`` directory as ``p0.jpg``, ``p1.jpg``, ...
"""
import os
import urllib.request

from selenium import webdriver
from selenium.webdriver.common.by import By

SEPARATOR = "=============================="

# The search keyword in this URL is percent-encoded twice ("%25" is an
# encoded "%"); it is passed to the browser exactly as written.
SEARCH_URL = 'https://s.weibo.com/weibo/%25E5%25A5%25A5%25E8%25BF%2590%25E4%25BC%259A?topnav=1&wvr=6&b=1'

MAX_TEXTS = 3     # upper bound on post texts printed
MAX_IMAGES = 20   # upper bound on images listed and downloaded
DOWNLOAD_DIR = "downloads"

driver = webdriver.Chrome()
try:
    # Visit the home page first, then the search-result page.
    driver.get('https://weibo.com/')
    driver.get(SEARCH_URL)

    # find_elements(By.XPATH, ...) replaces find_elements_by_xpath, which
    # newer Selenium releases no longer provide.
    contents = driver.find_elements(By.XPATH, r'//p[@class="txt"]')

    # Slicing (instead of indexing a fixed range) avoids an IndexError when
    # the page yields fewer matches than the limit.
    for content in contents[:MAX_TEXTS]:
        print(SEPARATOR)
        print(content.get_attribute('innerHTML'))

    contents = driver.find_elements(By.XPATH, r'//img[@action-type="fl_pics"]')

    print(len(contents))

    # Read each src once and reuse it for both the listing and the download.
    image_urls = [image.get_attribute('src') for image in contents[:MAX_IMAGES]]

    for image_url in image_urls:
        print(SEPARATOR)
        print(image_url)

    # urlretrieve does not create missing directories.
    os.makedirs(DOWNLOAD_DIR, exist_ok=True)

    for i, image_url in enumerate(image_urls):
        print(SEPARATOR)
        file_name = DOWNLOAD_DIR + "//p" + str(i) + ".jpg"
        print(image_url, file_name)
        if not image_url:
            # An <img> without a src has nothing to download.
            continue
        urllib.request.urlretrieve(image_url, filename=file_name)
finally:
    # Always close the browser, even if scraping or a download fails.
    driver.quit()

0 commit comments

Comments
 (0)