-
Notifications
You must be signed in to change notification settings - Fork 14
/
Copy pathscraper.py
27 lines (22 loc) · 1006 Bytes
/
scraper.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
import praw
class Scraper:
def __init__(self, env):
self.env = env
self.hotPosts = []
# Read-only instance
self.reddit = praw.Reddit(client_id=env['CLIENT_ID'],
client_secret=env['CLIENT_SECRET'],
user_agent=env['USER_AGENT'])
self.reddit.read_only = True
self.subreddit = self.reddit.subreddit(env['SUBREDDIT'])
self.minPostLength = int(env['MIN_POST_LENGTH'])
self.maxPostLength = int(env['MAX_POST_LENGTH'])
def getHotPosts(self):
for post in self.subreddit.hot():
if not post.stickied and post.is_self and (self.minPostLength <= len(post.selftext) <= self.maxPostLength) and len(self.hotPosts) < 2:
self.hotPosts.append(post)
if len(self.hotPosts) >= 2:
break
self.hotPosts = self.hotPosts[:1]
post = self.hotPosts[0]
return (post.title, post.title+"\n"+post.selftext)