petyasoft · eihosusss · Sep 24, 2024
diff --git a/CatPhotosFromReddit.py b/CatPhotosFromReddit.py
@@ -0,0 +1,99 @@
+import praw
+import requests
+import os
+import hashlib
+from urllib.parse import urlparse
+from fake_useragent import UserAgent
+
+ua = UserAgent()
+fake_user_agent = ua.random  # Generate a random user agent
+# NOTE(review): the same random browser string is also sent to the Reddit API
+# below; confirm this is acceptable under Reddit's API rules, which ask for a
+# unique, descriptive user agent.
+
+# Reddit API credentials
+CLIENT_ID = 'CLIENT_ID'
+CLIENT_SECRET = 'CLIENT_SECRET'
+
+reddit = praw.Reddit(client_id=CLIENT_ID,
+                     client_secret=CLIENT_SECRET,
+                     user_agent=fake_user_agent)
+
+# List of subreddits from where the photos will be downloaded
+subreddits = ['cat', 'cats']
+
+# File extensions (lower-case, with the dot) treated as downloadable images
+IMAGE_EXTENSIONS = ('.jpg', '.jpeg', '.png')
+
+# Seconds to wait for the image host before giving up on a download
+REQUEST_TIMEOUT = 10
+
+photos_dir = "photos"
+# exist_ok avoids the check-then-create race of a separate os.path.exists test
+os.makedirs(photos_dir, exist_ok=True)
+
+# MD5 hex digests of saved images (filled by load_existing_hashes and download_image)
+downloaded_images = set()
+
+
+def get_image_hash(image_content):
+    """Return the MD5 hex digest of the raw image bytes (used only for de-duplication)."""
+    return hashlib.md5(image_content).hexdigest()
+
+
+def load_existing_hashes():
+    """Hash every regular file in photos_dir and record it in downloaded_images."""
+    for filename in os.listdir(photos_dir):
+        filepath = os.path.join(photos_dir, filename)
+        if os.path.isfile(filepath):
+            with open(filepath, 'rb') as img_file:
+                downloaded_images.add(get_image_hash(img_file.read()))
+
+
+def download_image(url, filepath):
+    """Download url to filepath unless identical content was already saved.
+
+    Returns True when a new file was written, False when the download failed
+    or the content duplicates an image that is already in downloaded_images.
+    """
+    headers = {'User-Agent': fake_user_agent}
+    try:
+        # Without a timeout a stalled server would hang the whole script.
+        response = requests.get(url, headers=headers, timeout=REQUEST_TIMEOUT)
+    except requests.RequestException as exc:
+        # One unreachable host must not abort the remaining downloads.
+        print(f"Failed to download {url}: {exc}")
+        return False
+
+    if response.status_code != 200:
+        print(f"Failed to download {url}")
+        return False
+
+    image_hash = get_image_hash(response.content)
+    if image_hash in downloaded_images:
+        print(f"Image already downloaded, skipping: {url}")
+        return False
+
+    with open(filepath, 'wb') as f:
+        f.write(response.content)
+    downloaded_images.add(image_hash)
+    print(f"Downloaded {filepath}")
+    return True
+
+
+load_existing_hashes()
+
+
+for subreddit in subreddits:
+    print(f"Fetching latest posts from {subreddit}")
+    for submission in reddit.subreddit(subreddit).new(limit=10):  # Change the limit to get the desired amount of photos
+        # Inspect only the URL path so query strings and upper-case extensions do not hide an image.
+        url_path = urlparse(submission.url).path
+        if not url_path.lower().endswith(IMAGE_EXTENSIONS):
+            continue
+        image_name = os.path.basename(url_path)
+        file_path = os.path.join(photos_dir, image_name)
+        if not os.path.exists(file_path):
+            download_image(submission.url, file_path)
+
+print("Download complete.")
diff --git a/README.md b/README.md
@@ -4,6 +4,7 @@
 ## Requirements
 - Python 3.11 (you can install it [here](https://www.python.org/downloads/release/python-3110/))
 - Telegram API_ID and API_HASH (you can get them [here](https://my.telegram.org/auth?to=apps))
+- Reddit account with an API client ID and secret (you can get them [here](https://www.reddit.com/prefs/apps))
 
 
 
@@ -49,6 +50,8 @@
 
 5. IMPORTANT Create a `sessions` folder
 
+6. To get cat photos using CatPhotosFromReddit.py, you need to register a Reddit account and create an app to obtain the Reddit API client ID and secret. Visit [Reddit Apps](https://www.reddit.com/prefs/apps) to generate these credentials.
+
 
 
 ## Usage

diff --git a/requirements.txt b/requirements.txt
@@ -4,4 +4,4 @@ loguru==0.7.2
 aiohttp==3.9.5
 fake-useragent==1.5.1
 requests==2.28.1
-
+praw