From 4ecaf1aa28f7a40ad1242d38da4f2b5d38d72ffc Mon Sep 17 00:00:00 2001 From: leca Date: Mon, 2 Sep 2024 23:02:09 +0300 Subject: [PATCH] Added script for downloading all media from subreddit using libreddit (redlib) frontend --- utilities/redditdownload.py | 163 ++++++++++++++++++++++++++++++++++++ 1 file changed, 163 insertions(+) create mode 100644 utilities/redditdownload.py diff --git a/utilities/redditdownload.py b/utilities/redditdownload.py new file mode 100644 index 0000000..6197a18 --- /dev/null +++ b/utilities/redditdownload.py @@ -0,0 +1,163 @@ +import requests +import json +import os +import readme + +debug = False + +def get_image_name(url): + return url.split("/")[-1] + +def get_page_url(url, after): + return url + "?sort=hot&t=&after=t3_" + after + +def get_full_url(libreddit_instance, url): + return libreddit_instance + url + +def get_subreddit_full_url(libreddit_instance, subreddit): + return libreddit_instance + "/r/" + subreddit + +def get_posts_ids_in_page(page_content): + posts = [] + + posts_html = re.findall(r"(\
)", page_content) + for post_html in posts_html: + posts.append(re.search(r"\w{6,7}", post_html).group()) + return posts + +def get_single_videos_in_page(page_content): + videos_url = [] + + videos_html = re.findall(r"(\