reddit-save/utilities.py

import os
import praw
import requests
import youtube_dl
import re
from datetime import datetime
from secrets import REDDIT_USERNAME, REDDIT_PASSWORD
from secrets import REDDIT_CLIENT_ID, REDDIT_SECRET

# URL/file extensions that save_media downloads directly (except imgur
# ".gifv" links) and that add_media_preview_to_html embeds with an <img> tag.
IMAGE_EXTENSIONS = ["jpg", "jpeg", "png", "gif", "gifv"]
# URL/file extensions that save_media downloads directly and that
# add_media_preview_to_html embeds with a <video> tag.
VIDEO_EXTENSIONS = ["mp4"]
# Last two labels of the host name for sites whose links save_media passes
# to youtube-dl instead of downloading directly.
PLATFORMS = ["redgifs.com", "gfycat.com", "imgur.com"]

def make_client():
    """Build a ``praw.Reddit`` client from the imported ``REDDIT_*`` settings.

    Returns:
        The ``praw.Reddit`` instance, created with the user agent
        ``"reddit-save"``.
    """
    credentials = {
        "username": REDDIT_USERNAME,
        "password": REDDIT_PASSWORD,
        "client_id": REDDIT_CLIENT_ID,
        "client_secret": REDDIT_SECRET,
    }
    return praw.Reddit(user_agent="reddit-save", **credentials)


def get_saved_posts(client):
    """Return the saved items of ``client.user.me()`` that are submissions.

    Every item yielded by ``saved(limit=None)`` is inspected; only those
    whose class is named ``Submission`` are kept, in the order received.

    Args:
        client: Object exposing ``user.me().saved(limit=None)``.

    Returns:
        A list of the retained items.
    """
    posts = []
    for item in client.user.me().saved(limit=None):
        # Compare by class name so no model class has to be imported here.
        if item.__class__.__name__ != "Submission":
            continue
        posts.append(item)
    return posts


def get_upvoted_posts(client):
    """Return the upvoted items of ``client.user.me()`` that are submissions.

    Every item yielded by ``upvoted(limit=None)`` is inspected; only those
    whose class is named ``Submission`` are kept, in the order received.

    Args:
        client: Object exposing ``user.me().upvoted(limit=None)``.

    Returns:
        A list of the retained items.
    """
    return [
        upvoted for upvoted in client.user.me().upvoted(limit=None)
        # The filter must test the loop variable itself; it previously
        # referenced an undefined name and raised NameError.
        if upvoted.__class__.__name__ == "Submission"
    ]


def get_post_html(post):
    """Fill the ``html/post.html`` template with the details of one post.

    The template path is relative to the current working directory. Each
    ``<!--name-->`` placeholder is replaced, in a fixed order, with the
    matching value from ``post``. The ``<!--preview-->`` placeholder is not
    touched here.

    Args:
        post: Object providing ``title``, ``subreddit``, ``author`` (falsy
            when unavailable, otherwise has ``name``), ``permalink``,
            ``url``, ``selftext_html`` (may be ``None``) and ``created_utc``
            (a POSIX timestamp).

    Returns:
        The populated HTML as a string.

    Raises:
        OSError: If the template file cannot be opened.
    """
    # Imported locally because the module binds no ``html`` name at the top
    # level; the local result is called ``page`` to avoid shadowing it.
    from html import escape

    # Read the template as UTF-8 explicitly so the result does not depend on
    # the platform's default locale encoding.
    with open(os.path.join("html", "post.html"), encoding="utf-8") as f:
        page = f.read()

    dt = datetime.utcfromtimestamp(post.created_utc)
    author = f"/u/{post.author.name}" if post.author else "[deleted]"
    substitutions = [
        # Title and URL are free text from the post; escape them so
        # characters such as < & " cannot break or inject markup.
        ("<!--title-->", escape(post.title)),
        ("<!--subreddit-->", f"/r/{str(post.subreddit)}"),
        ("<!--user-->", author),
        ("<!--link-->", f"https://reddit.com{post.permalink}"),
        ("<!--content-link-->", escape(post.url)),
        # selftext_html is inserted as-is: it is already HTML.
        ("<!--body-->", post.selftext_html or ""),
        ("<!--timestamp-->", str(dt)),
        ("<!--date-->", dt.strftime("%d %B, %Y")),
    ]
    for placeholder, value in substitutions:
        page = page.replace(placeholder, value)
    return page


def save_media(post, location):
    """Download the media a post links to into ``<location>/media``.

    Two strategies are used:

    * If the URL's extension is in ``IMAGE_EXTENSIONS`` or
      ``VIDEO_EXTENSIONS`` (and it is not an imgur ``.gifv`` link), the URL
      is fetched directly with ``requests``.
    * Otherwise, if the URL's domain is in ``PLATFORMS`` (redgifs, gfycat,
      imgur), the download is delegated to youtube-dl.

    The ``media`` subdirectory is not created here, so it must already exist.

    Args:
        post: Object providing ``url``, ``permalink`` and ``id``.
        location: Directory containing the ``media`` subdirectory.

    Returns:
        The name of the saved file inside ``<location>/media``, or ``None``
        when nothing was saved.
    """
    media_extensions = IMAGE_EXTENSIONS + VIDEO_EXTENSIONS
    # Extension of the URL path, ignoring any query string.
    extension = post.url.split("?")[0].split(".")[-1].lower()
    # Last non-empty permalink segment, used as a human-readable file stem.
    readable_name = list(filter(bool, post.permalink.split("/")))[-1]
    # Last two labels of the host, e.g. "i.imgur.com" -> "imgur.com".
    domain = ".".join(post.url.split("/")[2].split(".")[-2:])
    media_dir = os.path.join(location, "media")
    stem = f"{readable_name}_{post.id}"

    is_imgur_gifv = extension == "gifv" and domain == "imgur.com"
    if extension in media_extensions and not is_imgur_gifv:
        # Fetch before opening the output file so a failed request does not
        # leave an empty file behind.
        response = requests.get(post.url)
        if not response.ok:
            # Do not store an HTTP error page under a media file name.
            return None
        filename = f"{stem}.{extension}"
        with open(os.path.join(media_dir, filename), "wb") as f:
            f.write(response.content)
        return filename

    if domain not in PLATFORMS:
        return None

    url = post.url
    if domain == "gfycat.com":
        html = requests.get(post.url).content
        # Small pages are scanned for a direct .mp4 link; larger pages are
        # passed to youtube-dl with the original URL.
        if len(html) < 50000:
            match = re.search(
                r"http([\dA-Za-z\+\:\/\.]+)\.mp4", html.decode()
            )
            if match is None:
                return None
            url = match.group()

    options = {
        "nocheckcertificate": True, "quiet": True, "no_warnings": True,
        "ignoreerrors": True,
        "outtmpl": os.path.join(media_dir, stem + ".%(ext)s"),
    }
    with youtube_dl.YoutubeDL(options) as ydl:
        try:
            ydl.download([url])
        except Exception:
            # Best effort: a failed download just means no file is found
            # below. Unlike a bare ``except``, this lets KeyboardInterrupt
            # and SystemExit propagate.
            pass

    # youtube-dl chooses the extension, so locate the output by its stem.
    for name in os.listdir(media_dir):
        if name.startswith(stem):
            return name
    return None


def add_media_preview_to_html(post_html, media):
    """Insert a preview element for ``media`` into a post's HTML.

    The ``<!--preview-->`` placeholder is replaced with an ``<img>`` tag when
    the file extension is in ``IMAGE_EXTENSIONS``, or a ``<video>`` tag when
    it is in ``VIDEO_EXTENSIONS``. The source points at ``media/<media>``.

    Args:
        post_html: HTML text containing the placeholder.
        media: File name of the saved media.

    Returns:
        The updated HTML, or ``post_html`` unchanged when the extension
        matches neither list.
    """
    suffix = media.rsplit(".", 1)[-1]
    src = f"media/{media}"
    if suffix in IMAGE_EXTENSIONS:
        tag = f'<img src="{src}">'
    elif suffix in VIDEO_EXTENSIONS:
        tag = f'<video controls><source src="{src}"></video>'
    else:
        return post_html
    return post_html.replace("<!--preview-->", tag)
Get saved posts 2020-12-30 23:59:55 +01:00			`import os`
			`import praw`
Display image previews 2020-12-31 01:33:30 +01:00			`import requests`
Youtube DL for videos 2020-12-31 02:32:06 +01:00			`import youtube_dl`
Handle gfycat links 2020-12-31 03:18:48 +01:00			`import re`
Get saved posts 2020-12-30 23:59:55 +01:00			`from datetime import datetime`
Handle imgur errors 2020-12-31 03:58:31 +01:00			`from secrets import REDDIT_USERNAME, REDDIT_PASSWORD`
			`from secrets import REDDIT_CLIENT_ID, REDDIT_SECRET`
Get saved posts 2020-12-30 23:59:55 +01:00
Handle imgur errors 2020-12-31 03:58:31 +01:00			`IMAGE_EXTENSIONS = ["jpg", "jpeg", "png", "gif", "gifv"]`
Display image previews 2020-12-31 01:33:30 +01:00			`VIDEO_EXTENSIONS = ["mp4"]`
Handle imgur errors 2020-12-31 03:58:31 +01:00			`PLATFORMS = ["redgifs.com", "gfycat.com", "imgur.com"]`
Display image previews 2020-12-31 01:33:30 +01:00
Get saved posts 2020-12-30 23:59:55 +01:00			`def make_client():`
			`return praw.Reddit(`
			`username=REDDIT_USERNAME,`
			`password=REDDIT_PASSWORD,`
			`client_id=REDDIT_CLIENT_ID,`
			`client_secret=REDDIT_SECRET,`
			`user_agent="reddit-save",`
			`)`


			`def get_saved_posts(client):`
Handle gfycat links 2020-12-31 03:18:48 +01:00			`return [`
Handle imgur errors 2020-12-31 03:58:31 +01:00			`saved for saved in client.user.me().saved(limit=None)`
Handle gfycat links 2020-12-31 03:18:48 +01:00			`if saved.__class__.__name__ == "Submission"`
			`]`
Get saved posts 2020-12-30 23:59:55 +01:00

Get upvoted posts 2020-12-31 00:05:45 +01:00			`def get_upvoted_posts(client):`
Handle gfycat links 2020-12-31 03:18:48 +01:00			`return [`
			`upvoted for upvoted in client.user.me().upvoted(limit=None)`
			`if saved.__class__.__name__ == "Submission"`
			`]`
Get upvoted posts 2020-12-31 00:05:45 +01:00

Get saved posts 2020-12-30 23:59:55 +01:00			`def get_post_html(post):`
			`with open(os.path.join("html", "post.html")) as f:`
			`html = f.read()`
			`dt = datetime.utcfromtimestamp(post.created_utc)`
			`html = html.replace("<!--title-->", post.title)`
Save post content 2020-12-31 00:47:15 +01:00			`html = html.replace("<!--subreddit-->", f"/r/{str(post.subreddit)}")`
			`html = html.replace("<!--user-->", f"/u/{post.author.name}" if post.author else "[deleted]")`
			`html = html.replace("<!--link-->", f"https://reddit.com{post.permalink}")`
Content links 2020-12-31 00:54:04 +01:00			`html = html.replace("<!--content-link-->", post.url)`
Save post content 2020-12-31 00:47:15 +01:00			`html = html.replace("<!--body-->", post.selftext_html or "")`
Get saved posts 2020-12-30 23:59:55 +01:00			`html = html.replace("<!--timestamp-->", str(dt))`
			`html = html.replace("<!--date-->", dt.strftime("%d %B, %Y"))`
Display image previews 2020-12-31 01:33:30 +01:00			`return html`


Youtube DL for videos 2020-12-31 02:32:06 +01:00			`def save_media(post, location):`
Display image previews 2020-12-31 01:33:30 +01:00			`media_extensions = IMAGE_EXTENSIONS + VIDEO_EXTENSIONS`
Handle imgur errors 2020-12-31 03:58:31 +01:00			`extension = post.url.split("?")[0].split(".")[-1].lower()`
Display image previews 2020-12-31 01:33:30 +01:00			`readable_name = list(filter(bool, post.permalink.split("/")))[-1]`
Handle imgur errors 2020-12-31 03:58:31 +01:00			`domain = ".".join(post.url.split("/")[2].split(".")[-2:])`
			`if extension in media_extensions and not (extension == "gifv" and domain == "imgur.com"):`
Youtube DL for videos 2020-12-31 02:32:06 +01:00			`filename = f"{readable_name}_{post.id}.{extension}"`
			`with open(os.path.join(location, "media", filename), "wb") as f:`
			`f.write(requests.get(post.url).content)`
			`return filename`
			`else:`
			`if domain in PLATFORMS:`
Handle gfycat links 2020-12-31 03:18:48 +01:00			`url = post.url`
			`if domain == "gfycat.com":`
			`html = requests.get(post.url).content`
			`if len(html) < 50000:`
			`match = re.search(`
			`r"http([\dA-Za-z\+\:\/\.]+)\.mp4", html.decode()`
			`)`
			`if match:`
			`url = match.group()`
			`else: return None`
Youtube DL for videos 2020-12-31 02:32:06 +01:00			`options = {`
			`"nocheckcertificate": True, "quiet": True, "no_warnings": True,`
Handle imgur errors 2020-12-31 03:58:31 +01:00			`"ignoreerrors": True,`
Youtube DL for videos 2020-12-31 02:32:06 +01:00			`"outtmpl": os.path.join(`
			`location, "media", f"{readable_name}_{post.id}" + ".%(ext)s"`
			`)`
			`}`
			`with youtube_dl.YoutubeDL(options) as ydl:`
Handle imgur errors 2020-12-31 03:58:31 +01:00			`try:`
			`ydl.download([url])`
			`except: pass`
Youtube DL for videos 2020-12-31 02:32:06 +01:00			`for f in os.listdir(os.path.join(location, "media")):`
			`if f.startswith(f"{readable_name}_{post.id}"):`
			`return f`
Display image previews 2020-12-31 01:33:30 +01:00
			`# gyfcat, v.reddit, imgur, redgifs`


			`def add_media_preview_to_html(post_html, media):`
Youtube DL for videos 2020-12-31 02:32:06 +01:00			`extension = media.split(".")[-1]`
			`location = "/".join(["media", media])`
Display image previews 2020-12-31 01:33:30 +01:00			`if extension in IMAGE_EXTENSIONS:`
			`return post_html.replace(`
			`"<!--preview-->",`
			`f'<img src="{location}">'`
			`)`
Youtube DL for videos 2020-12-31 02:32:06 +01:00			`if extension in VIDEO_EXTENSIONS:`
			`return post_html.replace(`
			`"<!--preview-->",`
			`f'<video controls><source src="{location}"></video>'`
Handle imgur errors 2020-12-31 03:58:31 +01:00			`)`
			`return post_html`