reddit-save/utilities.py

import os
import praw
import requests
from redvid import Downloader
import youtube_dl
import re
from datetime import datetime

try:
    from logindata import REDDIT_USERNAME, REDDIT_PASSWORD
    from logindata import REDDIT_CLIENT_ID, REDDIT_SECRET
except ImportError:
    REDDIT_USERNAME = os.getenv("REDDIT_USERNAME")
    REDDIT_PASSWORD = os.getenv("REDDIT_PASSWORD")
    REDDIT_CLIENT_ID = os.getenv("REDDIT_CLIENT_ID")
    REDDIT_SECRET = os.getenv("REDDIT_SECRET")

IMAGE_EXTENSIONS = ["gif", "gifv", "jpg", "jpeg", "png"]
VIDEO_EXTENSIONS = ["mp4"]
PLATFORMS = ["redgifs.com", "gfycat.com", "imgur.com", "youtube.com"]


def make_client():
    """Build a PRAW client from the module-level Reddit credentials.

    The ``REDDIT_*`` values are imported from the ``logindata`` module when it
    is available and read from environment variables of the same names
    otherwise.
    """

    credentials = {
        "username": REDDIT_USERNAME,
        "password": REDDIT_PASSWORD,
        "client_id": REDDIT_CLIENT_ID,
        "client_secret": REDDIT_SECRET,
        "user_agent": "reddit-save",
    }
    return praw.Reddit(**credentials)


def get_saved_posts(client):
    """Return the user's saved items that are posts, as a list.

    All saved items are requested (no limit); an item counts as a post when
    its class is named "Submission".
    """

    posts = []
    for item in client.user.me().saved(limit=None):
        if item.__class__.__name__ == "Submission":
            posts.append(item)
    return posts


def get_upvoted_posts(client):
    """Return the user's upvoted items that are posts, as a list.

    All upvoted items are requested (no limit); an item counts as a post when
    its class is named "Submission".
    """

    posts = []
    for item in client.user.me().upvoted(limit=None):
        if item.__class__.__name__ != "Submission":
            continue
        posts.append(item)
    return posts


def get_saved_comments(client):
    """Return the user's saved items that are not posts, as a list.

    All saved items are requested (no limit); anything whose class is not
    named "Submission" is kept.
    """

    comments = []
    for item in client.user.me().saved(limit=None):
        if item.__class__.__name__ == "Submission":
            continue
        comments.append(item)
    return comments


def get_post_html(post):
    """Render the HTML block for a post, without the media preview.

    The ``html/post-div.html`` template (path relative to the current working
    directory) is read and its ``<!--name-->`` placeholders are filled in from
    the post, in the order listed below.

    The title is inserted as text, so it is HTML-escaped: characters such as
    ``<`` and ``&`` are shown literally and cannot form markup or one of the
    template placeholders. ``selftext_html`` is inserted as markup, with
    relative ``/r/`` links pointed at reddit.com.

    Args:
        post: object providing ``title``, ``subreddit``, ``author`` (falsy
            when there is none), ``id``, ``permalink``, ``url``,
            ``selftext_html`` and ``created_utc``.

    Returns:
        The filled-in template as a string.
    """

    # Imported here because the name ``html`` is used for the page text below.
    from html import escape

    with open(os.path.join("html", "post-div.html"), encoding="utf-8") as f:
        html = f.read()
    dt = datetime.utcfromtimestamp(post.created_utc)
    author = f"/u/{post.author.name}" if post.author else "[deleted]"
    body = (post.selftext_html or "").replace(
        '<a href="/r/', '<a href="https://reddit.com/r/'
    )
    replacements = (
        ("<!--title-->", escape(post.title)),
        ("<!--subreddit-->", f"/r/{str(post.subreddit)}"),
        ("<!--user-->", author),
        ("<!--link-->", f"posts/{post.id}.html"),
        ("<!--reddit-link-->", f"https://reddit.com{post.permalink}"),
        ("<!--content-link-->", post.url),
        ("<!--id-->", post.id),
        ("<!--body-->", body),
        ("<!--timestamp-->", str(dt)),
        ("<!--date-->", dt.strftime("%d %B, %Y")),
    )
    for placeholder, value in replacements:
        html = html.replace(placeholder, value)
    return html


def save_media(post, location):
    """Try to download the image/video a post links to.

    Strategies are attempted in this order, each falling through to the next
    when it does not produce a file:

    1. fetch the URL directly when it ends in a known image/video extension
       and the response's Content-Type is image or video;
    2. hand redd.it links to redvid;
    3. for gfycat, look for an ``.mp4`` address in the page and use that URL;
    4. for imgur (except ``.gifv``), guess direct image URLs by appending each
       image extension;
    5. let youtube_dl try when the domain is listed in ``PLATFORMS``.

    Args:
        post: object providing ``url``, ``permalink`` and ``id``.
        location: directory containing the ``media`` folder files are
            written into.

    Returns:
        The name of the file stored in ``<location>/media``, or None when
        nothing was saved.
    """

    url = post.url
    stripped_url = url.split("?")[0]
    # The post links to itself, so there is no external media to fetch.
    if url.endswith(post.permalink):
        return None

    # What is the key information?
    extension = stripped_url.split(".")[-1].lower()
    domain = ".".join(post.url.split("/")[2].split(".")[-2:])
    readable_name = list(filter(bool, post.permalink.split("/")))[-1]
    media_dir = os.path.join(location, "media")
    basename = f"{readable_name}_{post.id}"

    # If it's an imgur gallery, forget it
    if domain == "imgur.com" and "gallery" in url:
        return None

    # Can the media be obtained directly?
    if extension in IMAGE_EXTENSIONS + VIDEO_EXTENSIONS:
        response = requests.get(post.url)
        media_type = response.headers.get("Content-Type", "")
        if media_type.startswith(("image", "video")):
            filename = f"{basename}.{extension}"
            with open(os.path.join(media_dir, filename), "wb") as f:
                f.write(response.content)
            return filename

    # Is this a v.redd.it link?
    if domain == "redd.it":
        downloader = Downloader(max_q=True, log=False)
        downloader.url = url
        current = os.getcwd()
        try:
            name = downloader.download()
            downloaded_extension = name.split(".")[-1]
            filename = f"{basename}.{downloaded_extension}"
            os.rename(name, os.path.join(media_dir, filename))
            return filename
        except KeyboardInterrupt:
            # Let the user abort the run instead of treating Ctrl-C as a
            # failed download.
            raise
        except BaseException:
            # NOTE(review): kept as broad as the original bare except because
            # redvid's failure modes are not visible from here - confirm
            # whether this can be narrowed to Exception.
            return None
        finally:
            # Restore the working directory on every path, not only on
            # failure, so later relative paths keep resolving.
            os.chdir(current)

    # Is it a gfycat link that redirects? Update the URL if possible
    if domain == "gfycat.com":
        page = requests.get(post.url).content
        if len(page) < 50000:
            match = re.search(r"http([\dA-Za-z\+\:\/\.]+)\.mp4", page.decode())
            if match:
                url = match.group()
            else:
                return None

    # Is this an imgur image?
    if domain == "imgur.com" and extension != "gifv":
        # A separate loop variable keeps ``extension`` (the URL's own
        # extension) intact.
        for candidate in IMAGE_EXTENSIONS:
            direct_url = f'https://i.{url[url.find("//") + 2:]}.{candidate}'
            direct_url = direct_url.replace("i.imgur.com", "imgur.com")
            direct_url = direct_url.replace("m.imgur.com", "imgur.com")
            response = requests.get(direct_url)
            if response.status_code == 200:
                filename = f"{basename}.{candidate}"
                with open(os.path.join(media_dir, filename), "wb") as f:
                    f.write(response.content)
                return filename

    # Try to use youtube_dl if it's one of the possible domains
    if domain in PLATFORMS:
        options = {
            "nocheckcertificate": True, "quiet": True, "no_warnings": True,
            "ignoreerrors": True,
            "outtmpl": os.path.join(media_dir, basename + ".%(ext)s"),
        }
        with youtube_dl.YoutubeDL(options) as ydl:
            try:
                ydl.download([url])
            except Exception:
                # Best effort: a failed download just means no file is found
                # below. Ctrl-C and interpreter exit are no longer swallowed.
                pass
        # youtube_dl picks the extension, so find the file by its prefix.
        for f in os.listdir(media_dir):
            if f.startswith(basename):
                return f

    return None


def add_media_preview_to_html(post_html, media):
    """Return post HTML with the preview placeholder filled in for a file.

    Files whose extension is in IMAGE_EXTENSIONS get an ``<img>`` tag, those
    in VIDEO_EXTENSIONS a ``<video>`` tag; for any other extension the HTML is
    returned unchanged.
    """

    extension = media.rpartition(".")[2]
    location = f"media/{media}"
    if extension in IMAGE_EXTENSIONS:
        preview = f'<img src="{location}">'
    elif extension in VIDEO_EXTENSIONS:
        preview = f'<video controls><source src="{location}"></video>'
    else:
        return post_html
    return post_html.replace("<!--preview-->", preview)


def create_post_page_html(post, post_html):
    """Create the HTML for a post's own page.

    The ``html/post.html`` template (path relative to the current working
    directory) is filled with the post's title, the given post HTML, the
    contents of ``html/style.css`` and ``html/main.js``, and the rendered
    top-level comments.

    The title is inserted as text, so it is HTML-escaped: characters such as
    ``<`` and ``&`` are shown literally and cannot form markup or one of the
    template placeholders.

    Args:
        post: object providing ``title``, ``author`` (falsy when there is
            none) and ``comments`` (iterable, with ``replace_more``).
        post_html: HTML of the post as shown in the listing.

    Returns:
        The complete page as a string.
    """

    # Imported here because the name ``html`` is used for the page text below.
    from html import escape

    with open(os.path.join("html", "post.html"), encoding="utf-8") as f:
        html = f.read()
    html = html.replace("<!--title-->", escape(post.title))

    # On its own page the post heading becomes an h1, and media paths gain a
    # "../" prefix.
    page_post_html = (
        post_html.replace("h2>", "h1>")
        .replace('<img src="media/', '<img src="../media/')
        .replace('<source src="media/', '<source src="../media/')
    )
    html = html.replace("<!--post-->", page_post_html)
    # Don't link to the post page from the post page itself.
    html = re.sub(r'<a href="posts(.+?)</a>', "", html)

    with open(os.path.join("html", "style.css"), encoding="utf-8") as f:
        html = html.replace("<style></style>", f"<style>\n{f.read()}\n</style>")
    with open(os.path.join("html", "main.js"), encoding="utf-8") as f:
        html = html.replace("<script></script>", f"<script>\n{f.read()}\n</script>")

    # The OP's name is the same for every comment, so work it out once.
    op = post.author.name if post.author else None
    post.comments.replace_more(limit=0)
    comments_html = [
        get_comment_html(comment, op=op) for comment in post.comments
    ]
    html = html.replace("<!--comments-->", "\n".join(comments_html))
    return html


def get_comment_html(comment, children=True, op=None):
    """Render the HTML for a comment from the ``html/comment-div.html``
    template.

    When ``children`` is true the comment's replies are rendered too (one
    level only, since they are rendered with ``children=False``) and placed
    at the ``<!--children-->`` placeholder. An author equal to ``op`` is
    wrapped in a span with class "op"; a comment without an author is shown
    as "[deleted]"."""

    with open(os.path.join("html", "comment-div.html"), encoding="utf-8") as template:
        html = template.read()
    dt = datetime.utcfromtimestamp(comment.created_utc)

    if not comment.author:
        author = "[deleted]"
    elif comment.author == op:
        author = f'<span class="op">/u/{comment.author.name}</span>'
    else:
        author = f"/u/{comment.author.name}"

    body = (comment.body_html or "").replace(
        '<a href="/r/', '<a href="https://reddit.com/r/'
    )

    # Applied in this order, one placeholder at a time.
    substitutions = [
        ("<!--user-->", author),
        ("<!--body-->", body),
        ("<!--score-->", str(comment.score)),
        ("<!--link-->", f"https://reddit.com{comment.permalink}"),
        ("<!--timestamp-->", str(dt)),
        ("<!--id-->", comment.id),
        ("<!--date-->", dt.strftime("%H:%M - %d %B, %Y")),
    ]
    for marker, value in substitutions:
        html = html.replace(marker, value)

    if not children:
        return html
    rendered_replies = [
        get_comment_html(reply, children=False, op=op)
        for reply in comment.replies
    ]
    return html.replace("<!--children-->", "\n".join(rendered_replies))
Get saved posts 2020-12-30 23:59:55 +01:00			`import os`
			`import praw`
Display image previews 2020-12-31 01:33:30 +01:00			`import requests`
Support v.redd.it 2021-01-01 22:44:40 +01:00			`from redvid import Downloader`
Youtube DL for videos 2020-12-31 02:32:06 +01:00			`import youtube_dl`
Handle gfycat links 2020-12-31 03:18:48 +01:00			`import re`
Get saved posts 2020-12-30 23:59:55 +01:00			`from datetime import datetime`
Add docker support Replaced secrets.py with docker environment variables. Set location as a default "./archive/" while inside docker container. 2021-01-27 09:39:19 +01:00
Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00			`try:`
			`from logindata import REDDIT_USERNAME, REDDIT_PASSWORD`
			`from logindata import REDDIT_CLIENT_ID, REDDIT_SECRET`
Add docker support Replaced secrets.py with docker environment variables. Set location as a default "./archive/" while inside docker container. 2021-01-27 09:39:19 +01:00			`except ImportError:`
			`REDDIT_USERNAME = os.getenv("REDDIT_USERNAME")`
			`REDDIT_PASSWORD = os.getenv("REDDIT_PASSWORD")`
			`REDDIT_CLIENT_ID = os.getenv("REDDIT_CLIENT_ID")`
			`REDDIT_SECRET = os.getenv("REDDIT_SECRET")`
Get saved posts 2020-12-30 23:59:55 +01:00
Don't do previously saved items 2021-01-02 23:33:47 +01:00			`IMAGE_EXTENSIONS = ["gif", "gifv", "jpg", "jpeg", "png"]`
Display image previews 2020-12-31 01:33:30 +01:00			`VIDEO_EXTENSIONS = ["mp4"]`
Support v.redd.it 2021-01-01 22:44:40 +01:00			`PLATFORMS = ["redgifs.com", "gfycat.com", "imgur.com", "youtube.com"]`
Display image previews 2020-12-31 01:33:30 +01:00
Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00
Get saved posts 2020-12-30 23:59:55 +01:00			`def make_client():`
Support v.redd.it 2021-01-01 22:44:40 +01:00			`"""Creates a PRAW client with the details in the secrets.py file."""`

Get saved posts 2020-12-30 23:59:55 +01:00			`return praw.Reddit(`
			`username=REDDIT_USERNAME,`
			`password=REDDIT_PASSWORD,`
			`client_id=REDDIT_CLIENT_ID,`
			`client_secret=REDDIT_SECRET,`
			`user_agent="reddit-save",`
			`)`


			`def get_saved_posts(client):`
Support v.redd.it 2021-01-01 22:44:40 +01:00			`"""Gets a list of posts that the user has saved."""`

Handle gfycat links 2020-12-31 03:18:48 +01:00			`return [`
README 2021-01-03 23:50:31 +01:00			`saved for saved in client.user.me().saved(limit=None)`
Handle gfycat links 2020-12-31 03:18:48 +01:00			`if saved.__class__.__name__ == "Submission"`
			`]`
Get saved posts 2020-12-30 23:59:55 +01:00

Get upvoted posts 2020-12-31 00:05:45 +01:00			`def get_upvoted_posts(client):`
Saved comments 2021-01-03 01:20:15 +01:00			`"""Gets a list of posts that the user has upvoted."""`
Support v.redd.it 2021-01-01 22:44:40 +01:00
Handle gfycat links 2020-12-31 03:18:48 +01:00			`return [`
			`upvoted for upvoted in client.user.me().upvoted(limit=None)`
Don't do previously saved items 2021-01-02 23:33:47 +01:00			`if upvoted.__class__.__name__ == "Submission"`
Handle gfycat links 2020-12-31 03:18:48 +01:00			`]`
Get upvoted posts 2020-12-31 00:05:45 +01:00

Saved comments 2021-01-03 01:20:15 +01:00			`def get_saved_comments(client):`
			`"""Gets a list of comments that the user has saved."""`

			`return [`
			`saved for saved in client.user.me().saved(limit=None)`
			`if saved.__class__.__name__ != "Submission"`
			`]`


Get saved posts 2020-12-30 23:59:55 +01:00			`def get_post_html(post):`
Support v.redd.it 2021-01-01 22:44:40 +01:00			`"""Takes a post object and creates a HTML for it - but not including the`
			`preview HTML."""`

Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00			`with open(os.path.join("html", "post-div.html"), encoding="utf-8") as f:`
Get saved posts 2020-12-30 23:59:55 +01:00			`html = f.read()`
			`dt = datetime.utcfromtimestamp(post.created_utc)`
			`html = html.replace("<!--title-->", post.title)`
Save post content 2020-12-31 00:47:15 +01:00			`html = html.replace("<!--subreddit-->", f"/r/{str(post.subreddit)}")`
			`html = html.replace("<!--user-->", f"/u/{post.author.name}" if post.author else "[deleted]")`
Post pages 2021-01-02 23:46:36 +01:00			`html = html.replace("<!--link-->", f"posts/{post.id}.html")`
			`html = html.replace("<!--reddit-link-->", f"https://reddit.com{post.permalink}")`
Content links 2020-12-31 00:54:04 +01:00			`html = html.replace("<!--content-link-->", post.url)`
Don't do previously saved items 2021-01-02 23:33:47 +01:00			`html = html.replace("<!--id-->", post.id)`
Correct inline reddit links 2021-01-03 23:12:49 +01:00			`html = html.replace("<!--body-->", (post.selftext_html or "").replace(`
			`'<a href="/r/', '<a href="https://reddit.com/r/'`
			`))`
Get saved posts 2020-12-30 23:59:55 +01:00			`html = html.replace("<!--timestamp-->", str(dt))`
			`html = html.replace("<!--date-->", dt.strftime("%d %B, %Y"))`
Display image previews 2020-12-31 01:33:30 +01:00			`return html`


Youtube DL for videos 2020-12-31 02:32:06 +01:00			`def save_media(post, location):`
Support v.redd.it 2021-01-01 22:44:40 +01:00			`"""Takes a post object and tries to download any image/video it might be`
			`associated with. If it can, it will return the filename."""`

			`url = post.url`
			`stripped_url = url.split("?")[0]`
Fix imgur issues 2021-01-02 01:08:14 +01:00			`if url.endswith(post.permalink): return None`
Support v.redd.it 2021-01-01 22:44:40 +01:00
			`# What is the key information?`
			`extension = stripped_url.split(".")[-1].lower()`
Handle imgur errors 2020-12-31 03:58:31 +01:00			`domain = ".".join(post.url.split("/")[2].split(".")[-2:])`
Support v.redd.it 2021-01-01 22:44:40 +01:00			`readable_name = list(filter(bool, post.permalink.split("/")))[-1]`

Fix imgur issues 2021-01-02 01:08:14 +01:00			`# If it's an imgur gallery, forget it`
			`if domain == "imgur.com" and "gallery" in url: return None`

Support v.redd.it 2021-01-01 22:44:40 +01:00			`# Can the media be obtained directly?`
			`if extension in IMAGE_EXTENSIONS + VIDEO_EXTENSIONS:`
Youtube DL for videos 2020-12-31 02:32:06 +01:00			`filename = f"{readable_name}_{post.id}.{extension}"`
Fix imgur issues 2021-01-02 01:08:14 +01:00			`response = requests.get(post.url)`
			`media_type = response.headers.get("Content-Type", "")`
			`if media_type.startswith("image") or media_type.startswith("video"):`
			`with open(os.path.join(location, "media", filename), "wb") as f:`
Support v.redd.it 2021-01-01 22:44:40 +01:00			`f.write(response.content)`
			`return filename`
Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00
Support v.redd.it 2021-01-01 22:44:40 +01:00			`# Is this a v.redd.it link?`
			`if domain == "redd.it":`
			`downloader = Downloader(max_q=True, log=False)`
			`downloader.url = url`
Style blockquote 2021-01-03 21:56:15 +01:00			`current = os.getcwd()`
			`try:`
			`name = downloader.download()`
			`extension = name.split(".")[-1]`
			`filename = f"{readable_name}_{post.id}.{extension}"`
			`os.rename(name, os.path.join(location, "media", filename))`
			`return filename`
			`except:`
			`os.chdir(current)`
			`return None`
Support v.redd.it 2021-01-01 22:44:40 +01:00
			`# Is it a gfycat link that redirects? Update the URL if possible`
			`if domain == "gfycat.com":`
			`html = requests.get(post.url).content`
			`if len(html) < 50000:`
			`match = re.search(r"http([\dA-Za-z\+\:\/\.]+)\.mp4", html.decode())`
			`if match:`
			`url = match.group()`
Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00			`else:`
			`return None`
Support imgur downloads 2021-01-01 23:51:40 +01:00
			`# Is this an imgur image?`
Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00			`if domain == "imgur.com" and extension != "gifv":`
Support imgur downloads 2021-01-01 23:51:40 +01:00			`for extension in IMAGE_EXTENSIONS:`
			`direct_url = f'https://i.{url[url.find("//") + 2:]}.{extension}'`
Fix imgur issues 2021-01-02 01:08:14 +01:00			`direct_url = direct_url.replace("i.imgur.com", "imgur.com")`
			`direct_url = direct_url.replace("m.imgur.com", "imgur.com")`
Support imgur downloads 2021-01-01 23:51:40 +01:00			`response = requests.get(direct_url)`
			`if response.status_code == 200:`
			`filename = f"{readable_name}_{post.id}.{extension}"`
			`with open(os.path.join(location, "media", filename), "wb") as f:`
			`f.write(response.content)`
			`return filename`
Fix imgur issues 2021-01-02 01:08:14 +01:00
Support v.redd.it 2021-01-01 22:44:40 +01:00			`# Try to use youtube_dl if it's one of the possible domains`
			`if domain in PLATFORMS:`
			`options = {`
			`"nocheckcertificate": True, "quiet": True, "no_warnings": True,`
			`"ignoreerrors": True,`
			`"outtmpl": os.path.join(`
Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00			`location, "media", f"{readable_name}_{post.id}" + ".%(ext)s"`
Support v.redd.it 2021-01-01 22:44:40 +01:00			`)`
			`}`
			`with youtube_dl.YoutubeDL(options) as ydl:`
			`try:`
			`ydl.download([url])`
Fix imgur issues 2021-01-02 01:08:14 +01:00			`except:`
			`pass`
Support v.redd.it 2021-01-01 22:44:40 +01:00			`for f in os.listdir(os.path.join(location, "media")):`
			`if f.startswith(f"{readable_name}_{post.id}"):`
			`return f`
Display image previews 2020-12-31 01:33:30 +01:00

			`def add_media_preview_to_html(post_html, media):`
Support v.redd.it 2021-01-01 22:44:40 +01:00			`"""Takes post HTML and returns a modified version with the preview`
			`inserted."""`
Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00
Youtube DL for videos 2020-12-31 02:32:06 +01:00			`extension = media.split(".")[-1]`
			`location = "/".join(["media", media])`
Display image previews 2020-12-31 01:33:30 +01:00			`if extension in IMAGE_EXTENSIONS:`
			`return post_html.replace(`
			`"<!--preview-->",`
			`f'<img src="{location}">'`
			`)`
Youtube DL for videos 2020-12-31 02:32:06 +01:00			`if extension in VIDEO_EXTENSIONS:`
			`return post_html.replace(`
			`"<!--preview-->",`
			`f'<video controls><source src="{location}"></video>'`
Handle imgur errors 2020-12-31 03:58:31 +01:00			`)`
Post pages 2021-01-02 23:46:36 +01:00			`return post_html`


			`def create_post_page_html(post, post_html):`
Saved comments 2021-01-03 01:20:15 +01:00			`"""Creates the HTML for a post's own page."""`

Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00			`with open(os.path.join("html", "post.html"), encoding="utf-8") as f:`
Post pages 2021-01-02 23:46:36 +01:00			`html = f.read()`
			`html = html.replace("<!--title-->", post.title)`
			`html = html.replace("<!--post-->", post_html.replace("h2>", "h1>").replace(`
			`'<img src="media/', '<img src="../media/'`
Media zoom 2021-01-03 04:01:13 +01:00			`).replace(`
			`'<source src="media/', '<source src="../media/'`
Post pages 2021-01-02 23:46:36 +01:00			`))`
Don't link to post page on post page 2021-01-03 22:58:41 +01:00			`html = re.sub(r'<a href="posts(.+?)</a>', "", html)`
Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00			`with open(os.path.join("html", "style.css"), encoding="utf-8") as f:`
Post pages 2021-01-02 23:46:36 +01:00			`html = html.replace("<style></style>", f"<style>\n{f.read()}\n</style>")`
Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00			`with open(os.path.join("html", "main.js"), encoding="utf-8") as f:`
Start JS integration 2021-01-03 03:26:38 +01:00			`html = html.replace("<script></script>", f"<script>\n{f.read()}\n</script>")`
Save top-level comments 2021-01-03 00:18:26 +01:00			`comments_html = []`
			`post.comments.replace_more(limit=0)`
			`for comment in post.comments:`
README 2021-01-03 23:50:31 +01:00			`comments_html.append(get_comment_html(`
			`comment, op=post.author.name if post.author else None`
			`))`
Save top-level comments 2021-01-03 00:18:26 +01:00			`html = html.replace("<!--comments-->", "\n".join(comments_html))`
			`return html`


Highlight OP comment 2021-01-03 23:08:22 +01:00			`def get_comment_html(comment, children=True, op=None):`
Saved comments 2021-01-03 01:20:15 +01:00			`"""Takes a post object and creates a HTML for it - it will get its children`
			`too unless you specify otherwise."""`

Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00			`with open(os.path.join("html", "comment-div.html"), encoding="utf-8") as f:`
Save top-level comments 2021-01-03 00:18:26 +01:00			`html = f.read()`
			`dt = datetime.utcfromtimestamp(comment.created_utc)`
Highlight OP comment 2021-01-03 23:08:22 +01:00			`author = "[deleted]"`
			`if comment.author:`
			`if comment.author == op:`
			`author = f'<span class="op">/u/{comment.author.name}</span>'`
			`else:`
			`author = f"/u/{comment.author.name}"`
			`html = html.replace("<!--user-->", author)`
Correct inline reddit links 2021-01-03 23:12:49 +01:00			`html = html.replace("<!--body-->", (comment.body_html or "").replace(`
			`'<a href="/r/', '<a href="https://reddit.com/r/'`
			`))`
Save top-level comments 2021-01-03 00:18:26 +01:00			`html = html.replace("<!--score-->", str(comment.score))`
			`html = html.replace("<!--link-->", f"https://reddit.com{comment.permalink}")`
			`html = html.replace("<!--timestamp-->", str(dt))`
Saved comments 2021-01-03 01:20:15 +01:00			`html = html.replace("<!--id-->", comment.id)`
Save top-level comments 2021-01-03 00:18:26 +01:00			`html = html.replace("<!--date-->", dt.strftime("%H:%M - %d %B, %Y"))`
Level 2 comments 2021-01-03 00:40:17 +01:00			`if children:`
			`children_html = []`
			`for child in comment.replies:`
Highlight OP comment 2021-01-03 23:08:22 +01:00			`children_html.append(get_comment_html(child, children=False, op=op))`
Level 2 comments 2021-01-03 00:40:17 +01:00			`html = html.replace("<!--children-->", "\n".join(children_html))`
Fixed ImportError: cannot import name 'token_urlsafe' from 'secrets' #7 Fixed UnicodeEncodeError: 'charmap' codec can't encode characters in position 28919-28920: character maps to <undefined> 2022-07-10 22:33:02 +02:00			`return html`