add doutu.py.

master
newrain001 3 years ago committed by Gitee
parent 654fb4952c
commit 4c1011d151
  1. 36
      doutu.py

@ -0,0 +1,36 @@
#!/usr/bin/env python3
#_*_ coding: utf-8 _*_
'''
***********************************************
authOr: newrain *
blog: https://blog.csdn.net/NewRain_wang *
https://newrain001.gitee.io *
github: https://github.com/newrain001 *
gitee : https://gitee.com/newrain001 *
email : newrain_wang@163.com *
***********************************************
'''
import requests
from lxml import etree
import time
def getUrl():
    """Download the images listed on the doutula.com photo list page.

    Requests https://www.doutula.com/photo/list, extracts the
    ``data-original`` attribute of every ``<img>`` matched by the XPath
    below, and writes each image to ``image/<name>``, where ``<name>`` is the
    last ``/``-separated segment of the image URL. After each saved image the
    function prints the file name and sleeps one second.

    Returns:
        None. Nothing is downloaded when the list page does not respond with
        HTTP 200.

    Raises:
        requests.RequestException: if the request for the list page itself
            fails (including a timeout). Failures of individual image
            requests are reported and skipped instead.
    """
    # Function-scope import so this block does not depend on the file header.
    import os

    header = {
        # The header value must not repeat the "User-Agent:" field name.
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/93.0.4577.63 Safari/537.36',
        # Referer is sent as an absolute URL, scheme included.
        'Referer': 'https://www.doutula.com/',
    }
    # Without a timeout, requests waits indefinitely on a stalled connection.
    timeout = 10

    html = requests.get('https://www.doutula.com/photo/list', headers=header, timeout=timeout)
    if html.status_code != 200:
        return

    # open() below does not create missing directories.
    os.makedirs('image', exist_ok=True)

    e = etree.HTML(html.text)
    url = e.xpath('//ul/li/div/div/a/img/@data-original')
    for i in url:
        name = i.split("/")[-1]
        if not name:
            # URL ends with "/": there is no file name to save under.
            continue
        try:
            result = requests.get(i, headers=header, timeout=timeout)
        except requests.RequestException:
            # One bad image should not abort the rest of the batch.
            print(name, '下载失败')
            continue
        if result.status_code != 200:
            # Do not store an error page as if it were image data.
            print(name, '下载失败')
            continue
        with open(f'image/{name}', 'wb') as f:
            f.write(result.content)
        print(name,'已完成')
        # Pause between downloads to avoid hammering the server.
        time.sleep(1)
# Script entry point: start the download when this file is executed.
# NOTE: this call is at module top level, so it also runs if the file is imported.
getUrl()
Loading…
Cancel
Save