forked from TheAlgorithms/Python
- Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathreddit.py
53 lines (45 loc) · 2.01 KB
/
reddit.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
from __future__ importannotations
importrequests
valid_terms=set(
"""approved_at_utc approved_by author_flair_background_color
author_flair_css_class author_flair_richtext author_flair_template_id author_fullname
author_premium can_mod_post category clicked content_categories created_utc downs
edited gilded gildings hidden hide_score is_created_from_ads_ui is_meta
is_original_content is_reddit_media_domain is_video link_flair_css_class
link_flair_richtext link_flair_text link_flair_text_color media_embed mod_reason_title
name permalink pwls quarantine saved score secure_media secure_media_embed selftext
subreddit subreddit_name_prefixed subreddit_type thumbnail title top_awarded_type
total_awards_received ups upvote_ratio url user_reports""".split()
)
defget_subreddit_data(
subreddit: str, limit: int=1, age: str="new", wanted_data: list|None=None
) ->dict:
"""
subreddit : Subreddit to query
limit : Number of posts to fetch
age : ["new", "top", "hot"]
wanted_data : Get only the required data in the list
"""
wanted_data=wanted_dataor []
ifinvalid_search_terms:=", ".join(sorted(set(wanted_data) -valid_terms)):
msg=f"Invalid search term: {invalid_search_terms}"
raiseValueError(msg)
response=requests.get(
f"https://reddit.com/r/{subreddit}/{age}.json?limit={limit}",
headers={"User-agent": "A random string"},
timeout=10,
)
ifresponse.status_code==429:
raiserequests.HTTPError(response=response)
data=response.json()
ifnotwanted_data:
return {id_: data["data"]["children"][id_] forid_inrange(limit)}
data_dict= {}
forid_inrange(limit):
data_dict[id_] = {
item: data["data"]["children"][id_]["data"][item] foriteminwanted_data
}
returndata_dict
if__name__=="__main__":
# If you get Error 429, that means you are rate limited.Try after some time
print(get_subreddit_data("learnpython", wanted_data=["title", "url", "selftext"]))