Randomize user agent

This commit is contained in:
Kevin F 2023-08-23 13:44:22 -05:00
parent 0a4bd99771
commit b8eb526782
4 changed files with 16 additions and 5 deletions

View File

@ -1,5 +1,9 @@
# Changelog # Changelog
## 0.0.5
* Randomize user agent to circumvent rate limit
## 0.0.4 ## 0.0.4
* Improved image scraping (Thanks https://austinhuang.me/) * Improved image scraping (Thanks https://austinhuang.me/)

View File

@ -2,11 +2,11 @@ import sys
from os import remove, write from os import remove, write
from threading import Thread from threading import Thread
#from gevent import sleep
from time import sleep from time import sleep
import requests import requests
import bs4 import bs4
from .useragents import get_random_user_agent
from .config import IMAGE_CACHE, SINGLE_IMAGE_DELETE_AFTER_SECS from .config import IMAGE_CACHE, SINGLE_IMAGE_DELETE_AFTER_SECS
def delete_file(path): def delete_file(path):
@ -23,6 +23,7 @@ def error(msg):
sys.stderr.flush() sys.stderr.flush()
def get(url: str, write_dir: str, delete=True): def get(url: str, write_dir: str, delete=True):
ua = get_random_user_agent()
orig_url = url orig_url = url
if not url.startswith('https://imgur.com/'): if not url.startswith('https://imgur.com/'):
url = 'https://imgur.com/' + url url = 'https://imgur.com/' + url
@ -38,7 +39,7 @@ def get(url: str, write_dir: str, delete=True):
print('Getting img', url) print('Getting img', url)
url = 'https://i.imgur.com/' + url.rsplit('/', 1)[-1] url = 'https://i.imgur.com/' + url.rsplit('/', 1)[-1]
with open(f'{write_dir}/{url[-11:]}', 'wb') as img: with open(f'{write_dir}/{url[-11:]}', 'wb') as img:
img.write(requests.get(url).content) img.write(requests.get(url, headers={'User-Agent': ua}).content)
if delete: if delete:
Thread(target=delete_file, args=[f"{write_dir}/{url[-11:]}"]).start() Thread(target=delete_file, args=[f"{write_dir}/{url[-11:]}"]).start()
return None return None
@ -49,7 +50,7 @@ def get(url: str, write_dir: str, delete=True):
title = '' title = ''
metas = [] metas = []
print('Detecting album/gallery images (contentUrl)', url) print('Detecting album/gallery images (contentUrl)', url)
soup = bs4.BeautifulSoup(requests.get(url).text, 'html.parser') soup = bs4.BeautifulSoup(requests.get(url, headers={'User-Agent': ua}).text, 'html.parser')
try: try:
title = soup.select('meta[property="og:title"]')[0]['content'] title = soup.select('meta[property="og:title"]')[0]['content']
if title == "Imgur": if title == "Imgur":
@ -78,7 +79,7 @@ def get(url: str, write_dir: str, delete=True):
print("Writing image", f"{write_dir}{found_url[-11:]}") print("Writing image", f"{write_dir}{found_url[-11:]}")
with open(f"{write_dir}{found_url[-11:]}", "wb") as f: with open(f"{write_dir}{found_url[-11:]}", "wb") as f:
f.write(requests.get(found_url).content) f.write(requests.get(found_url, headers={'User-Agent': ua}).content)
if delete: if delete:
Thread(target=delete_file, args=[f"{write_dir}{found_url[-11:]}"]).start() Thread(target=delete_file, args=[f"{write_dir}{found_url[-11:]}"]).start()

6
imgin/useragents.py Normal file

File diff suppressed because one or more lines are too long

View File

@ -39,7 +39,7 @@
<p>Or, run it with python by installing the requirements.txt and ./run.py. Or use the Dockerfile. Contact me if you want help or find a bug.</p> <p>Or, run it with python by installing the requirements.txt and ./run.py. Or use the Dockerfile. Contact me if you want help or find a bug.</p>
<footer> <footer>
<small> <small>
<p>Imgin Version 0.0.4</p> <p>Imgin Version 0.0.5</p>
Powered by <a href="https://voidnet.tech/">VoidNetwork LLC</a><br> Powered by <a href="https://voidnet.tech/">VoidNetwork LLC</a><br>
This website does not claim ownership of any media. This website does not claim ownership of any media.
<br>This service simply acts as a proxy to Imgur.com and does not store images aside from a brief cache. <br>This service simply acts as a proxy to Imgur.com and does not store images aside from a brief cache.