|
import re
from urllib import request
# Listing page that is scraped for image addresses.
target_url = "http://pic.yxdown.com/list/0_0_1.html"

# Headers sent with the request; a desktop-browser User-Agent string is supplied.
request_headers = {
    "User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_3) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.100 Safari/537.36",
}
def request_target():
    """Fetch the page at ``target_url`` and return its body as text.

    The request is sent with the module-level ``request_headers``.

    Returns:
        The response body decoded as UTF-8.

    Raises:
        urllib.error.URLError: If the request cannot be completed.
        UnicodeDecodeError: If the body is not valid UTF-8.
    """
    request_html = request.Request(url=target_url, headers=request_headers)
    # The response object is a context manager; closing it releases the
    # underlying connection even if read() or decode() raises.
    with request.urlopen(request_html) as read_request:
        return read_request.read().decode("utf-8")
def analyse_page(html):
    """Extract image addresses from listing-page HTML, print and return them.

    The pattern captures the ``src`` value of the first ``<img>`` that follows
    a ``<div class="conbox">`` and then a ``<div class="cbmiddle">``.
    ``re.S`` lets ``.`` span the newlines between those tags.

    Args:
        html: Page markup as a string.

    Returns:
        The captured addresses in document order, each stripped of
        surrounding whitespace, so the caller can download them. An empty
        list is returned when nothing matches.
    """
    get_content = re.compile(
        '.*? <div class="conbox">.*? <div class="cbmiddle">.*?<img src="(.*?)"',
        re.S,
    )
    read_list = get_content.findall(html)
    # Raw captures are printed first, before stripping, as the script always did.
    print(read_list)
    image_urls = [read.strip() for read in read_list]
    for image_url in image_urls:
        print("地址列表:", image_url)
    return image_urls
# Script driver: these statements run at module level, so they also execute
# when the file is imported.
# Fetch the listing page once and keep the decoded HTML.
read_target = request_target()
# Dump the raw HTML so the markup can be inspected.
print(read_target)
# Extract the image addresses from the fetched page and print them.
analyse_page(read_target)
这段是获取图片地址的代码。你只需要在 for 循环里下载这些地址就行了。 |
|