Skip to content

Instantly share code, notes, and snippets.

@chfoo
Last active February 8, 2016 06:12
Show Gist options
  • Save chfoo/3806f2aef3a8b9dc0657 to your computer and use it in GitHub Desktop.
Save chfoo/3806f2aef3a8b9dc0657 to your computer and use it in GitHub Desktop.
Download Reddit Live Thread Post JSON
'''Download Reddit Live Thread Post JSON'''
# reddit_live_download.py
#
# This is free and unencumbered software released into the public domain.
#
# Anyone is free to copy, modify, publish, use, compile, sell, or
# distribute this software, either in source code form or as a compiled
# binary, for any purpose, commercial or non-commercial, and by any
# means.
#
# In jurisdictions that recognize copyright laws, the author or authors
# of this software dedicate any and all copyright interest in the
# software to the public domain. We make this dedication for the benefit
# of the public at large and to the detriment of our heirs and
# successors. We intend this dedication to be an overt act of
# relinquishment in perpetuity of all present and future rights to this
# software under copyright law.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
# IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR
# OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
# ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
# OTHER DEALINGS IN THE SOFTWARE.
#
# For more information, please refer to <http://unlicense.org>
import argparse
import json
import requests
import time
# Version of this script; interpolated into the User-Agent string below.
__version__ = '1.0.1'
# Value of the User-Agent header that main() sends with each request to
# Reddit; it names the script, its version and the author's Reddit account.
USER_AGENT = 'Download live thread script {} (by /u/chfoo)'.format(__version__)
def main(argv=None):
    '''Download every update of a Reddit live thread and print it as JSON.

    The thread listing is fetched page by page (100 updates per request).
    For each update, its ``data`` object is written to standard output as
    one JSON document per line. Paging follows the listing's ``after``
    cursor and stops when a page is empty or no further cursor is returned.

    Args:
        argv: Optional list of command-line arguments, excluding the program
            name. When ``None`` (the default) argparse reads ``sys.argv``.

    Raises:
        SystemExit: If the command-line arguments are invalid.
        requests.HTTPError: If Reddit answers with a 4xx/5xx status code.
        requests.Timeout: If a request does not complete within the timeout.
    '''
    arg_parser = argparse.ArgumentParser()
    arg_parser.add_argument('live_thread_id')
    args = arg_parser.parse_args(argv)

    headers = {'User-Agent': USER_AGENT}
    params = {'limit': 100}
    url = 'https://www.reddit.com/live/{}/.json'.format(args.live_thread_id)

    while True:
        # Without a timeout a stalled connection would block forever.
        response = requests.get(
            url, headers=headers, params=params, timeout=60
        )
        # Surface HTTP errors (rate limiting, unknown thread id, ...) as such
        # instead of failing later while decoding or indexing the body.
        response.raise_for_status()

        listing = response.json()['data']
        children = listing['children']
        if not children:
            break

        for child in children:
            print(json.dumps(child['data']))

        # A missing/empty cursor means there is no further page to request.
        after = listing['after']
        if not after:
            break
        params['after'] = after

        # Pause between page requests (presumably to stay polite towards
        # Reddit's rate limits).
        time.sleep(2)
# Run the downloader only when executed as a script, not when imported.
if __name__ == '__main__':
    main()
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment