You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
49 lines
1.4 KiB
49 lines
1.4 KiB
4 years ago
|
import praw
|
||
|
import urllib
|
||
|
from urllib import request,parse
|
||
|
|
||
|
# Module-level accumulator of post URLs.
# NOTE: this list is shared state. The functions in this module append to it
# and return this same list object, so URLs gathered by earlier calls are
# still present on later calls.
url_opn_list = []

# HTTP headers attached to every outgoing request built in this module.
# A browser-like User-Agent is supplied instead of urllib's default one.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/47.0.2526.111 Safari/537.36',
}
|
||
|
|
||
|
def reddit_parse_hot(reddit, sub, many):
    """Collect the URLs of the "hot" posts of a subreddit.

    For every post yielded by ``reddit.subreddit(sub).hot(limit=many)`` the
    post URL is printed, requested once with the module-level ``headers``,
    and appended to the module-level ``url_opn_list``.

    Args:
        reddit: Client object exposing ``subreddit(name)`` (presumably a
            ``praw.Reddit`` instance -- confirm against the caller).
        sub: Subreddit name passed to ``reddit.subreddit``.
        many: Value forwarded as ``limit`` to the ``hot`` listing.

    Returns:
        The module-level ``url_opn_list`` (the same list object, which also
        holds URLs appended by earlier calls).

    Raises:
        Whatever ``urllib.request.urlopen`` raises for a failing URL; the
        exception is not caught here, so the failing URL is not appended and
        the remaining posts are not processed.
    """
    target = reddit.subreddit(sub)
    for post in target.hot(limit=many):
        post_url = post.url
        print(post_url)
        req = request.Request(post_url, headers=headers)
        # The response body is not used; the request is only issued.
        # Open it in a ``with`` block so the connection is closed right away
        # instead of leaking one open handle per post.
        with request.urlopen(req):
            pass
        url_opn_list.append(post_url)
    return url_opn_list
|
||
|
|
||
|
def reddit_parse_time(reddit, sub, many):
    """Collect the URLs of the newest posts of a subreddit.

    For every post yielded by ``reddit.subreddit(sub).new(limit=many)`` the
    post URL is printed, requested once with the module-level ``headers``,
    and appended to the module-level ``url_opn_list``.

    Args:
        reddit: Client object exposing ``subreddit(name)`` (presumably a
            ``praw.Reddit`` instance -- confirm against the caller).
        sub: Subreddit name passed to ``reddit.subreddit``.
        many: Value forwarded as ``limit`` to the ``new`` listing.

    Returns:
        The module-level ``url_opn_list`` (the same list object, which also
        holds URLs appended by earlier calls).

    Raises:
        Whatever ``urllib.request.urlopen`` raises for a failing URL; the
        exception is not caught here, so the failing URL is not appended and
        the remaining posts are not processed.
    """
    target = reddit.subreddit(sub)
    for post in target.new(limit=many):
        post_url = post.url
        print(post_url)
        req = request.Request(post_url, headers=headers)
        # The response body is not used; the request is only issued.
        # Open it in a ``with`` block so the connection is closed right away
        # instead of leaking one open handle per post.
        with request.urlopen(req):
            pass
        url_opn_list.append(post_url)
    return url_opn_list
|
||
|
|
||
|
|
||
|
def random_subreddit(reddit, many):
    """Collect the URLs of the "hot" posts of the ``'random'`` subreddit.

    Looks up ``reddit.subreddit('random')`` and, for every post yielded by
    its ``hot(limit=many)`` listing, prints the post URL, requests it once
    with the module-level ``headers``, and appends it to the module-level
    ``url_opn_list``.

    Args:
        reddit: Client object exposing ``subreddit(name)`` (presumably a
            ``praw.Reddit`` instance -- confirm against the caller).
        many: Value forwarded as ``limit`` to the ``hot`` listing.

    Returns:
        A 2-tuple ``(url_opn_list, subreddit)``: the module-level URL list
        (the same list object, which also holds URLs appended by earlier
        calls) and the object returned by ``reddit.subreddit('random')``.

    Raises:
        Whatever ``urllib.request.urlopen`` raises for a failing URL; the
        exception is not caught here, so the failing URL is not appended and
        the remaining posts are not processed.
    """
    what_to_parse = reddit.subreddit('random')
    for post in what_to_parse.hot(limit=many):
        post_url = post.url
        print(post_url)
        req = request.Request(post_url, headers=headers)
        # The response body is not used; the request is only issued.
        # Open it in a ``with`` block so the connection is closed right away
        # instead of leaking one open handle per post.
        with request.urlopen(req):
            pass
        url_opn_list.append(post_url)
    return url_opn_list, what_to_parse
|