# binaryPUNCH/RedditComments-LinkScraper.py

## RedditComments-LinkScraper.py
# Super simple URL/link scraper for any Reddit comment thread, enjoy!
# Requires PRAW and BeautifulSoup4, only tested on Python 2.7

threadID = "3rns3d"  # Change threadID to the one you wish to scrape (hint: the ID is in the url)

import praw
import codecs
import pprint
import HTMLParser
from bs4 import BeautifulSoup

# Create a single Reddit client. The script used to build two in a row and
# throw the first away; keep one, with the descriptive user agent that names
# the script and its author.
r = praw.Reddit(user_agent='RedditComments-LinkScraper by /u/binaryPUNCH')

# Fetch the thread, replace the "more comments" placeholders (no limit on how
# many, threshold of 0) and flatten the comment tree into a plain list.
submission = r.get_submission(submission_id=threadID)
submission.replace_more_comments(limit=None, threshold=0)
comments = praw.helpers.flatten_tree(submission.comments)

# Open the results file once for the whole run instead of once per link.
# Append mode is kept on purpose so repeated runs keep adding to the same
# file; note the file is now created even if the thread contains no links.
with codecs.open("results-%s.txt" % threadID, "a", "utf-8") as fout:
    for comment in comments:
        soup = BeautifulSoup(comment.body_html, 'html.parser')
        # href=True skips anchors that have no href attribute; previously
        # those yielded None and crashed the string concatenation.
        for link in soup.find_all('a', href=True):
            fout.write(link['href'] + u"\r\n")