"""Download every image linked from one vmgirls.com gallery page.

The script fetches the gallery page, uses the post title as the name of
the output directory, collects the image links found in the page, and
saves each image into that directory, pausing between requests.
"""

import os
import re
import sys
import time
from urllib.parse import urljoin

import requests

PAGE_URL = "https://www.vmgirls.com/13230.html"
HEADERS = {"User-Agent": "Admin"}

# Without a timeout, requests waits forever on a stalled connection.
REQUEST_TIMEOUT = 10  # seconds
# Pause before every image request so the server is not hammered.
DOWNLOAD_DELAY = 1  # seconds

TITLE_PATTERN = re.compile(r'<h1 class="post-title h3">(.*?)</h1>')
IMAGE_LINK_PATTERN = re.compile(r'<a href="(.*?)" alt=".*?" title=".*?">')


def _fetch(url):
    """Return the response for *url*, raising on network or HTTP errors."""
    response = requests.get(url, headers=HEADERS, timeout=REQUEST_TIMEOUT)
    # Fail loudly on 4xx/5xx instead of treating an error page as content.
    response.raise_for_status()
    return response


def _safe_dir_name(title):
    """Turn a page title into a single, safe directory name.

    The title comes from remote HTML, so path separators are replaced to
    keep the output inside the current working directory.

    Raises:
        ValueError: if the title is empty or is a special path component.
    """
    name = title
    for separator in (os.sep, os.altsep):
        if separator:
            name = name.replace(separator, "_")
    if name in ("", ".", ".."):
        raise ValueError(f"unusable directory name derived from title: {title!r}")
    return name


def main():
    """Fetch the gallery page and save every linked image to disk."""
    html = _fetch(PAGE_URL).text

    titles = TITLE_PATTERN.findall(html)
    if not titles:
        # The original indexed [-1] unconditionally and died with IndexError.
        raise SystemExit("post title not found; the page layout may have changed")
    dir_name = _safe_dir_name(titles[-1])
    # exist_ok avoids the race between checking for and creating the directory.
    os.makedirs(dir_name, exist_ok=True)

    urls = IMAGE_LINK_PATTERN.findall(html)
    print(urls)

    for url in urls:
        file_name = url.split('/')[-1]
        if not file_name:
            # A link ending in "/" has no file name to save under.
            print(f"skipping {url!r}: no file name in URL", file=sys.stderr)
            continue

        time.sleep(DOWNLOAD_DELAY)
        try:
            # urljoin leaves absolute URLs untouched and resolves relative
            # or protocol-relative links against the gallery page.
            response = _fetch(urljoin(PAGE_URL, url))
        except requests.RequestException as exc:
            # One broken image should not abort the remaining downloads.
            print(f"failed to download {url!r}: {exc}", file=sys.stderr)
            continue

        with open(os.path.join(dir_name, file_name), 'wb') as f:
            f.write(response.content)


if __name__ == "__main__":
    main()