Skip to content

Instantly share code, notes, and snippets.

Created January 31, 2012 12:21
Show Gist options
  • Save DrAzraelTod/1710255 to your computer and use it in GitHub Desktop.
Save DrAzraelTod/1710255 to your computer and use it in GitHub Desktop.
yturl - a YouTube video URL extractor written in Python. I found it months ago and don't remember where to get it now.
#!/usr/bin/env python
# vim: set fileencoding=utf-8 :
# (c) Christopher Down 2011
# See the COPYING file for copyright information.
""" Prints direct URLs to YouTube media. """
from urllib import urlopen
from urlparse import parse_qs
from os.path import basename
import sys
# Module metadata: author, copyright line (built from the author name),
# license and version.
__author__ = 'Christopher Down'
__copyright__ = 'Copyright 2011 %s' % __author__
__license__ = 'BSD'
# NOTE(review): the version is stored as a float rather than a string.
__version__ = 1.01
class YTURL(object):
    """Look up direct media URLs for a YouTube video.

    The class bundles three things: normalising user input to a video ID
    (stripYouTubeURL / checkIsValidVideoID), fetching and parsing the
    per-format URL map for that ID (getVideoItags), and ordering itags by
    preference (checkIsValidItag / getPreferredItagOrder).
    """

    def __init__(self):
        # Format string for the video-info request; getVideoItags() fills in
        # the video ID with ``%``.
        # NOTE(review): this literal is empty in this copy of the file, so the
        # ``%`` formatting in getVideoItags() raises TypeError.  The real
        # endpoint (containing exactly one ``%s``) must be restored from the
        # upstream project before anything can be fetched.
        self.youtubeQueryURL = ''
        # Key of the response field holding the comma-separated format list.
        self.videoURLListKey = 'url_encoded_fmt_stream_map'
        # Query-string keys that may carry the video ID in a pasted URL.
        self.videoIDKeys = [ 'v', 'video_id' ]
        # Every itag this tool knows about; the attribute name suggests the
        # list is ordered by quality (presumably best first -- TODO confirm).
        self.videoItagQualityOrder = [ 38, 37, 22, 45, 44, 35, 18, 34, 43, 5, 17 ]
        # Lower-case only: checkIsValidVideoID() lower-cases each character
        # before testing membership.
        self.allowedVideoIDCharacters = '-_abcdefghijklmnopqrstuvwxyz0123456789'

    def getVideoItags(self, videoID):
        """Fetch the formats available for *videoID*.

        Returns a dict mapping each itag (int) to its media URL (str), or
        False when the response has no format list or when any entry in the
        list lacks a 'url' or 'itag' field.

        Raises whatever urlopen() raises on network failure, and TypeError
        while youtubeQueryURL contains no ``%s`` placeholder.
        """
        response = urlopen(self.youtubeQueryURL % videoID)
        try:
            rawResponse = response.read()
        finally:
            # Always release the connection, even if read() fails.
            response.close()
        # Python 3 hands back bytes; parse_qs() would then produce bytes keys
        # that never match the str keys used below.
        if not isinstance(rawResponse, str):
            rawResponse = rawResponse.decode('utf-8', 'replace')

        parsedResponse = parse_qs(rawResponse)
        if self.videoURLListKey not in parsedResponse:
            return False

        availableFormats = {}
        for encodedFormat in parsedResponse[self.videoURLListKey][0].split(','):
            # Each list entry is itself a URL-encoded query string.
            videoFormat = parse_qs(encodedFormat)
            if 'url' not in videoFormat or 'itag' not in videoFormat:
                return False
            availableFormats[int(videoFormat['itag'][0])] = videoFormat['url'][0]
        return availableFormats

    def checkIsValidItag(self, itag):
        """Return True if *itag* (an int) is one of the known itags."""
        return itag in self.videoItagQualityOrder

    def getPreferredItagOrder(self, preferredItags):
        """Return the order in which itags should be tried.

        * No preference: the default quality order (the list object itself).
        * Exactly one preferred itag: a tuple of all known itags sorted by
          their distance from the preferred one in the default order, ties
          keeping their default-order position.  Raises ValueError if the
          itag is not a known one.
        * Several preferred itags: a list with the preferred itags first,
          followed by the complete default order.
        """
        defaultOrder = self.videoItagQualityOrder
        if len(preferredItags) == 1:
            pivot = defaultOrder.index(preferredItags[0])
            # sorted() is stable, so equally distant itags stay in their
            # default-order sequence.
            ranked = sorted(enumerate(defaultOrder),
                            key=lambda pair: abs(pivot - pair[0]))
            return tuple(itag for _, itag in ranked)
        if len(preferredItags) > 1:
            return list(preferredItags) + list(defaultOrder)
        return defaultOrder

    def checkIsValidVideoID(self, videoID):
        """Return True if *videoID* is syntactically valid.

        Valid means exactly 11 characters, each of which is (ignoring case)
        one of allowedVideoIDCharacters.
        """
        if len(videoID) != 11:
            return False
        return all(c.lower() in self.allowedVideoIDCharacters for c in videoID)

    def stripYouTubeURL(self, url):
        """Reduce a YouTube URL (or a bare video ID) to the video ID.

        The ID is taken from the 'v' or 'video_id' query parameter when
        present.  Otherwise the scheme, a leading 'www.' and a leading
        'youtu.be/' or 'youtube.com/v/' are stripped from the part before
        the query string and the remainder is returned.  The result is not
        validated; use checkIsValidVideoID() for that.
        """
        path, separator, query = url.partition('?')
        # Without a '?', the whole argument is parsed as a query string so
        # that input such as "v=<id>" still works.
        urlPost = parse_qs(query if separator else url)
        for key in self.videoIDKeys:
            if key in urlPost:
                return urlPost[key][0]

        # No ID in the query: fall back to the path, ignoring any query
        # string (e.g. "youtu.be/<id>?t=10").
        for scheme in ('http://', 'https://'):
            if path.startswith(scheme):
                path = path[len(scheme):]
                break
        if path.startswith('www.'):
            path = path[4:]
        # These prefixes were empty strings in this copy, which made the
        # first test always true and chopped 9 characters off every input.
        # The original slice lengths (9 and 14) match these two prefixes.
        for prefix in ('youtu.be/', 'youtube.com/v/'):
            if path.startswith(prefix):
                return path[len(prefix):]
        return path
def main():
    """Command-line entry point: print the best direct media URL.

    Usage: ``<prog> id [itag ...]`` where *id* is a video ID or YouTube URL
    and the optional itags state the preferred formats.

    On success the URL of the first available format, in preference order,
    is written to stdout and the function returns normally.  Every failure
    writes a message to stderr and exits with a distinct status:

    * 1 -- no arguments given
    * 2 -- the video ID is syntactically invalid
    * 3 -- an itag argument is not a known itag
    * 4 -- no media URL could be obtained
    """
    if len(sys.argv) == 1:
        sys.stderr.write('Usage: %s id [itag ...]\n' % basename(sys.argv[0]))
        # Stop here: there is no sys.argv[1] to work with.
        sys.exit(1)

    y = YTURL()
    videoID = y.stripYouTubeURL(sys.argv[1])
    if not y.checkIsValidVideoID(videoID):
        sys.stderr.write('Invalid video ID.\n')
        sys.exit(2)

    for itag in sys.argv[2:]:
        # isdigit() guards the int() conversion against non-numeric input.
        if not itag.isdigit() or not y.checkIsValidItag(int(itag)):
            sys.stderr.write('%s is not a valid itag.\n' % itag)
            sys.exit(3)
    # A real list (not a lazy map object) because getPreferredItagOrder()
    # takes its len() and concatenates it.
    preferredItags = [int(itag) for itag in sys.argv[2:]]

    availableFormats = y.getVideoItags(videoID)
    if availableFormats is not False:
        for itag in y.getPreferredItagOrder(preferredItags):
            if itag in availableFormats:
                # Only the most preferred available format is reported.
                sys.stdout.write('%s\n' % availableFormats[itag])
                return

    # Reached only when nothing was printed above.
    sys.stderr.write(' The YouTube API returned data from which no\n'
                     'media URL could be retrieved. \n')
    sys.exit(4)
# Run the command-line interface only when executed as a script, not when
# the module is imported.
if __name__ == '__main__':
    main()
Copy link

cdown commented May 11, 2012

This is an old version; I keep it updated at [link missing from this copy] :-)

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment