import os
import requests
from lxml import html
# XPath selecting every <a> element that directly wraps an <img> whose class
# attribute contains "img preview"; the anchor's href is what gets downloaded.
IMG_HREF_XPATH = '//a[img[contains(@class, "img preview")]]'
# Site root that is prepended to each href found in the thread page.
WEB_ROOT = 'https://2...content-available-to-author-only...h.hk'
# Directory (relative to the current working directory) receiving the files.
MEDIA_DIR = 'media'
# Seconds to wait for the server to connect / send data before giving up, so
# a stalled connection cannot hang the script forever.
REQUEST_TIMEOUT = 30
# Bytes per streamed chunk. Iterating a Response object directly yields
# 128-byte pieces, which means many tiny writes for large media files.
CHUNK_SIZE = 64 * 1024

thread_url = input('Введите ссылку на тред\n')
requests_obj = requests.get(thread_url, timeout=REQUEST_TIMEOUT)
# Fail loudly on an HTTP error instead of parsing an error page and silently
# finding no media in it.
requests_obj.raise_for_status()
thread_source = html.fromstring(requests_obj.text)

# exist_ok=True removes the check-then-create race of a separate exists() test.
os.makedirs(MEDIA_DIR, exist_ok=True)

for elem in thread_source.xpath(IMG_HREF_XPATH):
    href = elem.get('href')
    if not href:
        # Anchor without a usable href: nothing to download.
        continue

    # The last path segment of the href is used as the local file name.
    media_name = href.split('/')[-1]
    if not media_name:
        # href ends with '/', so there is no file name to write to.
        continue

    media_url = WEB_ROOT + href

    # The context manager releases the streamed connection even when writing
    # the file fails part-way through.
    with requests.get(media_url, stream=True,
                      timeout=REQUEST_TIMEOUT) as response:
        if not response.ok:
            # Do not store the body of an error response as if it were media.
            print('Failed ({}): {}'.format(response.status_code, media_url))
            continue

        # Plain 'wb' is enough: the file is only written, never read back.
        with open(os.path.join(MEDIA_DIR, media_name), 'wb') as out_file:
            for chunk in response.iter_content(chunk_size=CHUNK_SIZE):
                out_file.write(chunk)

    print('Downloaded: {}'.format(media_url))
aW1wb3J0IG9zCgppbXBvcnQgcmVxdWVzdHMKZnJvbSBseG1sIGltcG9ydCBodG1sCgpJTUdfSFJFRl9YUEFUSCA9ICcvL2FbaW1nW2NvbnRhaW5zKEBjbGFzcywgImltZyBwcmV2aWV3IildXScKV0VCX1JPT1QgPSAnaHR0cHM6Ly8yLi4uY29udGVudC1hdmFpbGFibGUtdG8tYXV0aG9yLW9ubHkuLi5oLmhrJwoKdGhyZWFkX3VybCA9IGlucHV0KCfQktCy0LXQtNC40YLQtSDRgdGB0YvQu9C60YMg0L3QsCDRgtGA0LXQtFxuJykKcmVxdWVzdHNfb2JqID0gcmVxdWVzdHMuZ2V0KHRocmVhZF91cmwpCnRocmVhZF9zb3VyY2UgPSBodG1sLmZyb21zdHJpbmcocmVxdWVzdHNfb2JqLnRleHQpCgppZiBub3Qgb3MucGF0aC5leGlzdHMoJ21lZGlhJyk6CiAgICBvcy5tYWtlZGlycygnbWVkaWEnKQoKZm9yIGVsZW0gaW4gdGhyZWFkX3NvdXJjZS54cGF0aChJTUdfSFJFRl9YUEFUSCk6CgogICAgbWVkaWFfbmFtZSA9IGVsZW0uZ2V0KCdocmVmJykuc3BsaXQoJy8nKVstMV0KICAgIG1lZGlhX3VybCA9IFdFQl9ST09UICsgZWxlbS5nZXQoJ2hyZWYnKQogICAgcmVzcG9uc2UgPSByZXF1ZXN0cy5nZXQobWVkaWFfdXJsLCBzdHJlYW09VHJ1ZSkKICAgIAogICAgd2l0aCBvcGVuKCdtZWRpYS97fScuZm9ybWF0KG1lZGlhX25hbWUpLCAnd2IrJykgYXMgZmlsZToKICAgICAgICBmb3IgY2h1bmsgaW4gcmVzcG9uc2U6CiAgICAgICAgICAgIGZpbGUud3JpdGUoY2h1bmspCiAgICAgICAgICAgIAogICAgcHJpbnQoJ0Rvd25sb2FkZWQ6IHt9Jy5mb3JtYXQobWVkaWFfdXJsKSkK