you-get/src/you_get/extractors/youtube.py

#!/usr/bin/env python

from ..common import *
from ..extractor import VideoExtractor

class YouTube(VideoExtractor):
    name = "YouTube"

    # YouTube media encoding options, in descending quality order.
    # http://en.wikipedia.org/wiki/YouTube#Quality_and_codecs. Retrieved July 17, 2014.
    #
    # Each entry describes one stream format and is identified by its 'itag'
    # string. Every value is a string; an empty string means the value is not
    # recorded in this table. The entries that are commented out are exactly
    # the ones whose 'video_profile' is '3D'.
    stream_types = [
        {'itag': '38', 'container': 'MP4', 'video_resolution': '3072p', 'video_encoding': 'H.264', 'video_profile': 'High', 'video_bitrate': '3.5-5', 'audio_encoding': 'AAC', 'audio_bitrate': '192'},
        #{'itag': '85', 'container': 'MP4', 'video_resolution': '1080p', 'video_encoding': 'H.264', 'video_profile': '3D', 'video_bitrate': '3-4', 'audio_encoding': 'AAC', 'audio_bitrate': '192'},
        {'itag': '46', 'container': 'WebM', 'video_resolution': '1080p', 'video_encoding': 'VP8', 'video_profile': '', 'video_bitrate': '', 'audio_encoding': 'Vorbis', 'audio_bitrate': '192'},
        {'itag': '37', 'container': 'MP4', 'video_resolution': '1080p', 'video_encoding': 'H.264', 'video_profile': 'High', 'video_bitrate': '3-4.3', 'audio_encoding': 'AAC', 'audio_bitrate': '192'},
        #{'itag': '102', 'container': 'WebM', 'video_resolution': '720p', 'video_encoding': 'VP8', 'video_profile': '3D', 'video_bitrate': '', 'audio_encoding': 'Vorbis', 'audio_bitrate': '192'},
        {'itag': '45', 'container': 'WebM', 'video_resolution': '720p', 'video_encoding': 'VP8', 'video_profile': '', 'video_bitrate': '2', 'audio_encoding': 'Vorbis', 'audio_bitrate': '192'},
        #{'itag': '84', 'container': 'MP4', 'video_resolution': '720p', 'video_encoding': 'H.264', 'video_profile': '3D', 'video_bitrate': '2-3', 'audio_encoding': 'AAC', 'audio_bitrate': '192'},
        {'itag': '22', 'container': 'MP4', 'video_resolution': '720p', 'video_encoding': 'H.264', 'video_profile': 'High', 'video_bitrate': '2-3', 'audio_encoding': 'AAC', 'audio_bitrate': '192'},
        {'itag': '120', 'container': 'FLV', 'video_resolution': '720p', 'video_encoding': 'H.264', 'video_profile': 'Main@L3.1', 'video_bitrate': '2', 'audio_encoding': 'AAC', 'audio_bitrate': '128'}, # Live streaming only
        {'itag': '44', 'container': 'WebM', 'video_resolution': '480p', 'video_encoding': 'VP8', 'video_profile': '', 'video_bitrate': '1', 'audio_encoding': 'Vorbis', 'audio_bitrate': '128'},
        {'itag': '35', 'container': 'FLV', 'video_resolution': '480p', 'video_encoding': 'H.264', 'video_profile': 'Main', 'video_bitrate': '0.8-1', 'audio_encoding': 'AAC', 'audio_bitrate': '128'},
        #{'itag': '101', 'container': 'WebM', 'video_resolution': '360p', 'video_encoding': 'VP8', 'video_profile': '3D', 'video_bitrate': '', 'audio_encoding': 'Vorbis', 'audio_bitrate': '192'},
        #{'itag': '100', 'container': 'WebM', 'video_resolution': '360p', 'video_encoding': 'VP8', 'video_profile': '3D', 'video_bitrate': '', 'audio_encoding': 'Vorbis', 'audio_bitrate': '128'},
        {'itag': '43', 'container': 'WebM', 'video_resolution': '360p', 'video_encoding': 'VP8', 'video_profile': '', 'video_bitrate': '0.5', 'audio_encoding': 'Vorbis', 'audio_bitrate': '128'},
        {'itag': '34', 'container': 'FLV', 'video_resolution': '360p', 'video_encoding': 'H.264', 'video_profile': 'Main', 'video_bitrate': '0.5', 'audio_encoding': 'AAC', 'audio_bitrate': '128'},
        #{'itag': '82', 'container': 'MP4', 'video_resolution': '360p', 'video_encoding': 'H.264', 'video_profile': '3D', 'video_bitrate': '0.5', 'audio_encoding': 'AAC', 'audio_bitrate': '96'},
        {'itag': '18', 'container': 'MP4', 'video_resolution': '270p/360p', 'video_encoding': 'H.264', 'video_profile': 'Baseline', 'video_bitrate': '0.5', 'audio_encoding': 'AAC', 'audio_bitrate': '96'},
        {'itag': '6', 'container': 'FLV', 'video_resolution': '270p', 'video_encoding': 'Sorenson H.263', 'video_profile': '', 'video_bitrate': '0.8', 'audio_encoding': 'MP3', 'audio_bitrate': '64'},
        #{'itag': '83', 'container': 'MP4', 'video_resolution': '240p', 'video_encoding': 'H.264', 'video_profile': '3D', 'video_bitrate': '0.5', 'audio_encoding': 'AAC', 'audio_bitrate': '96'},
        {'itag': '13', 'container': '3GP', 'video_resolution': '', 'video_encoding': 'MPEG-4 Visual', 'video_profile': '', 'video_bitrate': '0.5', 'audio_encoding': 'AAC', 'audio_bitrate': ''},
        {'itag': '5', 'container': 'FLV', 'video_resolution': '240p', 'video_encoding': 'Sorenson H.263', 'video_profile': '', 'video_bitrate': '0.25', 'audio_encoding': 'MP3', 'audio_bitrate': '64'},
        {'itag': '36', 'container': '3GP', 'video_resolution': '240p', 'video_encoding': 'MPEG-4 Visual', 'video_profile': 'Simple', 'video_bitrate': '0.175', 'audio_encoding': 'AAC', 'audio_bitrate': '36'},
        {'itag': '17', 'container': '3GP', 'video_resolution': '144p', 'video_encoding': 'MPEG-4 Visual', 'video_profile': 'Simple', 'video_bitrate': '0.05', 'audio_encoding': 'AAC', 'audio_bitrate': '24'},
    ]

    def decipher(js, s):
        """Decipher an encrypted stream signature using the player script.

        Locates the signature function in ``js``, rewrites it and the helper
        functions it calls into Python source with a handful of regex
        substitutions, executes the result and returns what it computes
        for ``s``.

        NOTE(security): this calls ``exec`` on code derived from a downloaded
        script. The code runs in its own namespace dictionary, but it is not
        sandboxed in any way.

        js -- source text of the HTML5 player script.
        s -- the encrypted signature string.

        Returns the deciphered signature.
        Raises ValueError when the signature function, or a helper it calls,
        cannot be located in ``js``.
        """
        def py_name(js_name):
            # '$' is legal in JavaScript identifiers but not in Python ones.
            return js_name.replace('$', '_dollar')

        def tr_js(code):
            # Translate the small JavaScript subset used by the signature
            # code into Python source, one construct at a time.
            code = re.sub(r'function', r'def', code)
            code = re.sub(r'\$', '_dollar', code)
            code = re.sub(r'\{', r':\n\t', code)
            code = re.sub(r'\}', r'\n', code)
            code = re.sub(r'var\s+', r'', code)
            code = re.sub(r'(\w+)\.join\(""\)', r'"".join(\1)', code)
            code = re.sub(r'(\w+)\.length', r'len(\1)', code)
            code = re.sub(r'(\w+)\.slice\((\w+)\)', r'\1[\2:]', code)
            code = re.sub(r'(\w+)\.splice\((\w+),(\w+)\)', r'del \1[\2:\2+\3]', code)
            code = re.sub(r'(\w+)\.split\(""\)', r'list(\1)', code)
            return code

        # Name of the main signature function, taken from "x.sig||NAME(x.y)".
        found = re.search(r'\w+\.sig\|\|([$\w]+)\(\w+\.\w+\)', js)
        if found is None:
            raise ValueError('signature function not found in player script')
        f1 = found.group(1)

        found = re.search(r'(function %s\(\w+\)\{[^\{]+\})' % re.escape(f1), js)
        if found is None:
            raise ValueError('definition of signature function %r not found' % f1)
        # Drop the object qualifier from helper calls: "obj.fn(a,1)" -> "fn(a,1)".
        f1def = re.sub(r'([$\w]+\.)([$\w]+\(\w+,\d+\))', r'\2', found.group(1))
        code = tr_js(f1def)

        f2s = set(re.findall(r'([$\w]+)\(\w+,\d+\)', f1def))
        for f2 in f2s:
            # The escaped name is only for building regexes; the generated
            # source must use the plain name, otherwise the backslashes added
            # by re.escape end up in the Python code.
            f2e = re.escape(f2)
            f2def = re.search(r'[^$\w]%s:function\((\w+,\w+)\)(\{[^\{\}]+\})' % f2e, js)
            if f2def:
                f2def = 'function {}({}){}'.format(f2, f2def.group(1), f2def.group(2))
            else:
                # One-parameter helper: add a dummy second parameter because
                # the caller always passes two arguments.
                f2def = re.search(r'[^$\w]%s:function\((\w+)\)(\{[^\{\}]+\})' % f2e, js)
                if f2def is None:
                    raise ValueError('definition of helper function %r not found' % f2)
                f2def = 'function {}({},b){}'.format(f2, f2def.group(1), f2def.group(2))
            code = code + 'global %s\n' % py_name(f2) + tr_js(f2def)

        code = code + 'sig=%s(s)' % py_name(f1)

        # Run in a dedicated namespace. Writing through locals() is not
        # reliable (it returns independent snapshots on Python 3.13+), and
        # executing against globals() would leak the helpers into this module.
        namespace = {'s': s}
        exec(code, namespace)
        return namespace['sig']

    def get_url_from_vid(vid):
        """Builds the short youtu.be URL for the given video ID.
        """
        template = 'http://youtu.be/{}'
        return template.format(vid)

    def get_vid_from_url(url):
        """Extracts video ID from URL.

        The following forms are tried in order and the first truthy result
        is returned:

          1. youtu.be/<id>
          2. youtube.com/embed/<id>
          3. youtube.com/v/<id>
          4. the 'v' query parameter of the URL
          5. the 'v' query parameter of the URL stored in the 'u' parameter

        When none of them yields a value, the result of the last lookup is
        returned (prepare() compares it against None).
        """
        # Path-based IDs stop at '/' or '?', so a trailing query string such
        # as "youtu.be/<id>?t=10" is not swallowed into the ID.
        return match1(url, r'youtu\.be/([^/?]+)') or \
          match1(url, r'youtube\.com/embed/([^/?]+)') or \
          match1(url, r'youtube\.com/v/([^/?]+)') or \
          parse_query_param(url, 'v') or \
          parse_query_param(parse_query_param(url, 'u'), 'v')

    def get_playlist_id_from_url(url):
        """Extracts playlist ID from URL.

        Looks at the 'list' query parameter first and falls back to 'p'.
        """
        playlist_id = None
        for key in ('list', 'p'):
            playlist_id = parse_query_param(url, key)
            if playlist_id:
                break
        # Either the first truthy value, or whatever the 'p' lookup gave.
        return playlist_id

    def download_playlist_by_url(self, url, **kwargs):
        """Downloads every video of the playlist referenced by ``url``.

        Fetches the playlist page, collects the "/watch?..." links that carry
        an 'index' query parameter, orders them by that index and downloads
        each one with a fresh extractor instance.

        url -- a URL carrying the playlist ID in its 'list' or 'p' parameter.
        kwargs -- passed through unchanged to download_by_url().

        Sets self.url and self.title (the playlist title from the page).
        """
        try:
            from html import unescape
        except ImportError:
            # Python < 3.4 has no html.unescape; HTMLParser.unescape is the
            # older spelling (removed again in Python 3.9).
            from html.parser import HTMLParser
            unescape = HTMLParser().unescape

        self.url = url

        playlist_id = __class__.get_playlist_id_from_url(self.url)
        if playlist_id is None:
            log.wtf('[Failed] Unsupported URL pattern.')

        video_page = get_content('http://www.youtube.com/playlist?list=%s' % playlist_id)

        def playlist_index(video):
            return parse_query_param(video, 'index')

        def sort_key(video):
            # Order numerically so that index 10 comes after index 2; anything
            # that is not a plain number sorts after the numeric entries.
            index = playlist_index(video)
            if index.isdigit():
                return (0, int(index), index)
            return (1, 0, index)

        # Unescape first: in the page source the parameters are separated by
        # "&amp;", which would hide 'index' from a parser splitting on "&".
        links = [unescape(link)
                 for link in re.findall(r'<a href="(/watch\?[^"]+)"', video_page)]
        videos = sorted([video for video in links if playlist_index(video)],
                        key=sort_key)

        self.title = re.search(r'<meta name="title" content="([^"]+)"', video_page).group(1)
        self.p_playlist()
        for video in videos:
            vid = parse_query_param(video, 'v')
            index = parse_query_param(video, 'index')
            __class__().download_by_url(__class__.get_url_from_vid(vid), index=index, **kwargs)

    def prepare(self, **kwargs):
        """Collects title and stream metadata for the video.

        Requires self.url or self.vid to be set. When only the URL is known
        the video ID is derived from it; if no ID can be derived, the URL is
        handed to download_playlist_by_url() and the process exits with
        status 0.

        The metadata comes from the get_video_info endpoint. When that
        response says the signature is ciphered, or fails with error code
        150, the watch page is fetched and its embedded ytplayer.config JSON
        is used instead; in those cases self.html5player is set to the
        player script URL.

        On success self.title is set and self.streams gets one entry per
        stream, keyed by itag, with the keys 'itag', 'url', 'sig', 's',
        'quality', 'type', 'mime' and 'container'.

        Failures are reported through log.wtf().
        NOTE(review): the code after the status checks relies on log.wtf()
        not returning -- confirm; otherwise stream_list would be unbound.
        """
        assert self.url or self.vid

        if not self.vid and self.url:
            self.vid = __class__.get_vid_from_url(self.url)

            if self.vid is None:
                self.download_playlist_by_url(self.url, **kwargs)
                exit(0)

        video_info = parse.parse_qs(get_content('http://www.youtube.com/get_video_info?video_id={}'.format(self.vid)))

        if 'status' not in video_info:
            log.wtf('[Failed] Unknown status.')

        elif video_info['status'] == ['ok']:
            if 'use_cipher_signature' not in video_info or video_info['use_cipher_signature'] == ['False']:
                self.title = parse.unquote_plus(video_info['title'][0])
                stream_list = video_info['url_encoded_fmt_stream_map'][0].split(',')

            else:
                # Parse video page instead
                video_page = get_content('http://www.youtube.com/watch?v=%s' % self.vid)
                # Raw string: "\s" is not a valid escape in a normal literal.
                ytplayer_config = json.loads(re.search(r'ytplayer.config\s*=\s*([^\n]+?});', video_page).group(1))

                self.title = ytplayer_config['args']['title']
                self.html5player = 'http:' + ytplayer_config['assets']['js']
                stream_list = ytplayer_config['args']['url_encoded_fmt_stream_map'].split(',')

        elif video_info['status'] == ['fail']:
            if video_info['errorcode'] == ['150']:
                video_page = get_content('http://www.youtube.com/watch?v=%s' % self.vid)
                ytplayer_config = json.loads(re.search(r'ytplayer.config\s*=\s*([^\n]+});ytplayer', video_page).group(1))

                if 'title' in ytplayer_config['args']:
                    # 150 Restricted from playback on certain sites
                    # Parse video page instead
                    self.title = ytplayer_config['args']['title']
                    self.html5player = 'http:' + ytplayer_config['assets']['js']
                    stream_list = ytplayer_config['args']['url_encoded_fmt_stream_map'].split(',')
                else:
                    log.wtf('[Error] The uploader has not made this video available in your country.')
                    #self.title = re.search('<meta name="title" content="([^"]+)"', video_page).group(1)
                    #stream_list = []

            elif video_info['errorcode'] == ['100']:
                log.wtf('[Failed] This video does not exist.', exit_code=int(video_info['errorcode'][0]))

            else:
                log.wtf('[Failed] %s' % video_info['reason'][0], exit_code=int(video_info['errorcode'][0]))

        else:
            log.wtf('[Failed] Invalid status.')

        for stream in stream_list:
            # Each stream is itself a URL-encoded query string.
            metadata = parse.parse_qs(stream)
            stream_itag = metadata['itag'][0]
            stream_type = metadata['type'][0]
            # The MIME type is the part of 'type' before the first ';'.
            mime = stream_type.split(';')[0]
            self.streams[stream_itag] = {
                'itag': stream_itag,
                'url': metadata['url'][0],
                # 'sig' is a ready-to-use signature, 's' a ciphered one;
                # either may be absent.
                'sig': metadata['sig'][0] if 'sig' in metadata else None,
                's': metadata['s'][0] if 's' in metadata else None,
                'quality': metadata['quality'][0],
                'type': stream_type,
                'mime': mime,
                'container': mime_to_container(mime),
            }

    def extract(self, **kwargs):
        """Resolves the download URL and size of one stream.

        The stream is the one named by the 'stream_id' keyword argument when
        given (and non-empty), otherwise the first entry of
        self.streams_sorted. The chosen entry of self.streams receives a
        'src' list holding the final URL and a 'size' value.

        Does nothing when self.streams_sorted is empty. Exits with status 2
        when the requested stream ID is unknown.
        """
        if not self.streams_sorted:
            # No stream is available
            return

        requested = kwargs.get('stream_id')
        if requested:
            # Extract the stream
            if requested not in self.streams:
                log.e('[Error] Invalid video format.')
                log.e('Run \'-i\' command with no specific video format to view all available formats.')
                exit(2)
            stream_id = requested
        else:
            # Extract stream with the best quality
            stream_id = self.streams_sorted[0]['itag']

        entry = self.streams[stream_id]

        # A plain signature is used as-is; a ciphered one has to be run
        # through the player script first; with neither, the URL is final.
        suffix = ''
        if entry['sig'] is not None:
            suffix = '&signature={}'.format(entry['sig'])
        elif entry['s'] is not None:
            player_js = get_content(self.html5player)
            suffix = '&signature={}'.format(__class__.decipher(player_js, entry['s']))

        entry['src'] = [entry['url'] + suffix]
        entry['size'] = urls_size(entry['src'])

# Module-level entry points: one shared extractor instance and its bound
# download methods.
# NOTE(review): download_by_url is not defined in this file -- presumably
# inherited from VideoExtractor; confirm.
site = YouTube()
download = site.download_by_url
download_playlist = site.download_playlist_by_url
refactor for Python packaging 2012-08-31 19:20:38 +04:00			`#!/usr/bin/env python`
initial commit 2012-08-20 19:54:03 +04:00
refactor for Python packaging 2012-08-31 19:20:38 +04:00			`from ..common import *`
Major refactoring * Change entry point to you_get.__main__:main * New entry point for development (you-get-dev): you_get.__main__:main_dev * you_get.extractor -> you_get.extractors 2014-07-21 04:39:40 +04:00			`from ..extractor import VideoExtractor`
initial commit 2012-08-20 19:54:03 +04:00
YouTube: OOP style 2014-07-17 11:01:44 +04:00			`class YouTube(VideoExtractor):`
			`name = "YouTube"`

			`# YouTube media encoding options, in descending quality order.`
			`# http://en.wikipedia.org/wiki/YouTube#Quality_and_codecs. Retrieved July 17, 2014.`
			`stream_types = [`
			`{'itag': '38', 'container': 'MP4', 'video_resolution': '3072p', 'video_encoding': 'H.264', 'video_profile': 'High', 'video_bitrate': '3.5-5', 'audio_encoding': 'AAC', 'audio_bitrate': '192'},`
			`#{'itag': '85', 'container': 'MP4', 'video_resolution': '1080p', 'video_encoding': 'H.264', 'video_profile': '3D', 'video_bitrate': '3-4', 'audio_encoding': 'AAC', 'audio_bitrate': '192'},`
			`{'itag': '46', 'container': 'WebM', 'video_resolution': '1080p', 'video_encoding': 'VP8', 'video_profile': '', 'video_bitrate': '', 'audio_encoding': 'Vorbis', 'audio_bitrate': '192'},`
			`{'itag': '37', 'container': 'MP4', 'video_resolution': '1080p', 'video_encoding': 'H.264', 'video_profile': 'High', 'video_bitrate': '3-4.3', 'audio_encoding': 'AAC', 'audio_bitrate': '192'},`
			`#{'itag': '102', 'container': 'WebM', 'video_resolution': '720p', 'video_encoding': 'VP8', 'video_profile': '3D', 'video_bitrate': '', 'audio_encoding': 'Vorbis', 'audio_bitrate': '192'},`
			`{'itag': '45', 'container': 'WebM', 'video_resolution': '720p', 'video_encoding': 'VP8', 'video_profile': '', 'video_bitrate': '2', 'audio_encoding': 'Vorbis', 'audio_bitrate': '192'},`
			`#{'itag': '84', 'container': 'MP4', 'video_resolution': '720p', 'video_encoding': 'H.264', 'video_profile': '3D', 'video_bitrate': '2-3', 'audio_encoding': 'AAC', 'audio_bitrate': '192'},`
			`{'itag': '22', 'container': 'MP4', 'video_resolution': '720p', 'video_encoding': 'H.264', 'video_profile': 'High', 'video_bitrate': '2-3', 'audio_encoding': 'AAC', 'audio_bitrate': '192'},`
			`{'itag': '120', 'container': 'FLV', 'video_resolution': '720p', 'video_encoding': 'H.264', 'video_profile': 'Main@L3.1', 'video_bitrate': '2', 'audio_encoding': 'AAC', 'audio_bitrate': '128'}, # Live streaming only`
			`{'itag': '44', 'container': 'WebM', 'video_resolution': '480p', 'video_encoding': 'VP8', 'video_profile': '', 'video_bitrate': '1', 'audio_encoding': 'Vorbis', 'audio_bitrate': '128'},`
			`{'itag': '35', 'container': 'FLV', 'video_resolution': '480p', 'video_encoding': 'H.264', 'video_profile': 'Main', 'video_bitrate': '0.8-1', 'audio_encoding': 'AAC', 'audio_bitrate': '128'},`
			`#{'itag': '101', 'container': 'WebM', 'video_resolution': '360p', 'video_encoding': 'VP8', 'video_profile': '3D', 'video_bitrate': '', 'audio_encoding': 'Vorbis', 'audio_bitrate': '192'},`
			`#{'itag': '100', 'container': 'WebM', 'video_resolution': '360p', 'video_encoding': 'VP8', 'video_profile': '3D', 'video_bitrate': '', 'audio_encoding': 'Vorbis', 'audio_bitrate': '128'},`
			`{'itag': '43', 'container': 'WebM', 'video_resolution': '360p', 'video_encoding': 'VP8', 'video_profile': '', 'video_bitrate': '0.5', 'audio_encoding': 'Vorbis', 'audio_bitrate': '128'},`
			`{'itag': '34', 'container': 'FLV', 'video_resolution': '360p', 'video_encoding': 'H.264', 'video_profile': 'Main', 'video_bitrate': '0.5', 'audio_encoding': 'AAC', 'audio_bitrate': '128'},`
			`#{'itag': '82', 'container': 'MP4', 'video_resolution': '360p', 'video_encoding': 'H.264', 'video_profile': '3D', 'video_bitrate': '0.5', 'audio_encoding': 'AAC', 'audio_bitrate': '96'},`
			`{'itag': '18', 'container': 'MP4', 'video_resolution': '270p/360p', 'video_encoding': 'H.264', 'video_profile': 'Baseline', 'video_bitrate': '0.5', 'audio_encoding': 'AAC', 'audio_bitrate': '96'},`
			`{'itag': '6', 'container': 'FLV', 'video_resolution': '270p', 'video_encoding': 'Sorenson H.263', 'video_profile': '', 'video_bitrate': '0.8', 'audio_encoding': 'MP3', 'audio_bitrate': '64'},`
			`#{'itag': '83', 'container': 'MP4', 'video_resolution': '240p', 'video_encoding': 'H.264', 'video_profile': '3D', 'video_bitrate': '0.5', 'audio_encoding': 'AAC', 'audio_bitrate': '96'},`
			`{'itag': '13', 'container': '3GP', 'video_resolution': '', 'video_encoding': 'MPEG-4 Visual', 'video_profile': '', 'video_bitrate': '0.5', 'audio_encoding': 'AAC', 'audio_bitrate': ''},`
			`{'itag': '5', 'container': 'FLV', 'video_resolution': '240p', 'video_encoding': 'Sorenson H.263', 'video_profile': '', 'video_bitrate': '0.25', 'audio_encoding': 'MP3', 'audio_bitrate': '64'},`
			`{'itag': '36', 'container': '3GP', 'video_resolution': '240p', 'video_encoding': 'MPEG-4 Visual', 'video_profile': 'Simple', 'video_bitrate': '0.175', 'audio_encoding': 'AAC', 'audio_bitrate': '36'},`
			`{'itag': '17', 'container': '3GP', 'video_resolution': '144p', 'video_encoding': 'MPEG-4 Visual', 'video_profile': 'Simple', 'video_bitrate': '0.05', 'audio_encoding': 'AAC', 'audio_bitrate': '24'},`
			`]`

			`def decipher(js, s):`
			`def tr_js(code):`
			`code = re.sub(r'function', r'def', code)`
			`code = re.sub(r'\$', '_dollar', code)`
			`code = re.sub(r'\{', r':\n\t', code)`
			`code = re.sub(r'\}', r'\n', code)`
			`code = re.sub(r'var\s+', r'', code)`
			`code = re.sub(r'(\w+).join\(""\)', r'"".join(\1)', code)`
			`code = re.sub(r'(\w+).length', r'len(\1)', code)`
			`code = re.sub(r'(\w+).slice\((\w+)\)', r'\1[\2:]', code)`
Fix (partly) #373 * Handle JavaScript: Array.prototype.splice() * Python has a list.reverse() method 2014-07-24 19:09:08 +04:00			`code = re.sub(r'(\w+).splice\((\w+),(\w+)\)', r'del \1[\2:\2+\3]', code)`
YouTube: OOP style 2014-07-17 11:01:44 +04:00			`code = re.sub(r'(\w+).split\(""\)', r'list(\1)', code)`
			`return code`

			`f1 = match1(js, r'\w+\.sig\\|\\|([$\w]+)\(\w+\.\w+\)')`
			`f1def = match1(js, r'(function %s\(\w+\)\{[^\{]+\})' % re.escape(f1))`
			`f1def = re.sub(r'([$\w]+\.)([$\w]+\(\w+,\d+\))', r'\2', f1def)`
			`code = tr_js(f1def)`
			`f2s = set(re.findall(r'([$\w]+)\(\w+,\d+\)', f1def))`
			`for f2 in f2s:`
			`f2e = re.escape(f2)`
			`f2def = re.search(r'[^$\w]%s:function\((\w+,\w+)\)(\{[^\{\}]+\})' % f2e, js)`
			`if f2def:`
			`f2def = 'function {}({}){}'.format(f2e, f2def.group(1), f2def.group(2))`
			`else:`
			`f2def = re.search(r'[^$\w]%s:function\((\w+)\)(\{[^\{\}]+\})' % f2e, js)`
			`f2def = 'function {}({},b){}'.format(f2e, f2def.group(1), f2def.group(2))`
			`f2 = re.sub(r'\$', '_dollar', f2)`
			`code = code + 'global %s\n' % f2 + tr_js(f2def)`

			`code = code + 'sig=%s(s)' % re.sub(r'\$', '_dollar', f1)`
			`exec(code, globals(), locals())`
			`return locals()['sig']`

			`def get_url_from_vid(vid):`
			`return 'http://youtu.be/{}'.format(vid)`

			`def get_vid_from_url(url):`
			`"""Extracts video ID from URL.`
			`"""`
			`return match1(url, r'youtu\.be/([^/]+)') or \`
			`match1(url, r'youtube\.com/embed/([^/?]+)') or \`
			`match1(url, r'youtube\.com/v/([^/?]+)') or \`
			`parse_query_param(url, 'v') or \`
			`parse_query_param(parse_query_param(url, 'u'), 'v')`

			`def get_playlist_id_from_url(url):`
			`"""Extracts playlist ID from URL.`
			`"""`
			`return parse_query_param(url, 'list') or \`
YouTube: fix #282 2013-12-21 07:00:07 +04:00			`parse_query_param(url, 'p')`
Handle $ symbol in js function name 2014-02-06 08:03:51 +04:00
YouTube: OOP style 2014-07-17 11:01:44 +04:00			`def download_playlist_by_url(self, url, **kwargs):`
			`self.url = url`

			`playlist_id = __class__.get_playlist_id_from_url(self.url)`
			`if playlist_id is None:`
			`log.wtf('[Failed] Unsupported URL pattern.')`

			`video_page = get_content('http://www.youtube.com/playlist?list=%s' % playlist_id)`
			`from html.parser import HTMLParser`
			`videos = sorted([HTMLParser().unescape(video)`
			`for video in re.findall(r'<a href="(/watch\?[^"]+)"', video_page)`
			`if parse_query_param(video, 'index')],`
			`key=lambda video: parse_query_param(video, 'index'))`
			`self.title = re.search(r'<meta name="title" content="([^"]+)"', video_page).group(1)`
			`self.p_playlist()`
			`for video in videos:`
			`vid = parse_query_param(video, 'v')`
			`index = parse_query_param(video, 'index')`
			`__class__().download_by_url(__class__.get_url_from_vid(vid), index=index, **kwargs)`

			`def prepare(self, **kwargs):`
			`assert self.url or self.vid`

			`if not self.vid and self.url:`
			`self.vid = __class__.get_vid_from_url(self.url)`

			`if self.vid is None:`
			`self.download_playlist_by_url(self.url, **kwargs)`
			`exit(0)`

			`video_info = parse.parse_qs(get_content('http://www.youtube.com/get_video_info?video_id={}'.format(self.vid)))`

			`if 'status' not in video_info:`
			`log.wtf('[Failed] Unknown status.')`

			`elif video_info['status'] == ['ok']:`
			`if 'use_cipher_signature' not in video_info or video_info['use_cipher_signature'] == ['False']:`
			`self.title = parse.unquote_plus(video_info['title'][0])`
			`stream_list = video_info['url_encoded_fmt_stream_map'][0].split(',')`

			`else:`
			`# Parse video page instead`
			`video_page = get_content('http://www.youtube.com/watch?v=%s' % self.vid)`
YouTube: non-greedy regex, fix #394 2014-08-20 07:46:03 +04:00			`ytplayer_config = json.loads(re.search('ytplayer.config\s=\s([^\n]+?});', video_page).group(1))`
YouTube: OOP style 2014-07-17 11:01:44 +04:00
			`self.title = ytplayer_config['args']['title']`
			`self.html5player = 'http:' + ytplayer_config['assets']['js']`
			`stream_list = ytplayer_config['args']['url_encoded_fmt_stream_map'].split(',')`

			`elif video_info['status'] == ['fail']:`
			`if video_info['errorcode'] == ['150']:`
			`video_page = get_content('http://www.youtube.com/watch?v=%s' % self.vid)`
YouTube: fix regex 2014-09-20 20:59:55 +04:00			`ytplayer_config = json.loads(re.search('ytplayer.config\s=\s([^\n]+});ytplayer', video_page).group(1))`
YouTube: OOP style 2014-07-17 11:01:44 +04:00
			`if 'title' in ytplayer_config['args']:`
			`# 150 Restricted from playback on certain sites`
			`# Parse video page instead`
			`self.title = ytplayer_config['args']['title']`
			`self.html5player = 'http:' + ytplayer_config['assets']['js']`
			`stream_list = ytplayer_config['args']['url_encoded_fmt_stream_map'].split(',')`
			`else:`
			`log.wtf('[Error] The uploader has not made this video available in your country.')`
			`#self.title = re.search('<meta name="title" content="([^"]+)"', video_page).group(1)`
			`#stream_list = []`

			`elif video_info['errorcode'] == ['100']:`
			`log.wtf('[Failed] This video does not exist.', exit_code=int(video_info['errorcode'][0]))`

			`else:`
			`log.wtf('[Failed] %s' % video_info['reason'][0], exit_code=int(video_info['errorcode'][0]))`

			`else:`
			`log.wtf('[Failed] Invalid status.')`

			`for stream in stream_list:`
			`metadata = parse.parse_qs(stream)`
			`stream_itag = metadata['itag'][0]`
			`self.streams[stream_itag] = {`
			`'itag': metadata['itag'][0],`
			`'url': metadata['url'][0],`
			`'sig': metadata['sig'][0] if 'sig' in metadata else None,`
			`'s': metadata['s'][0] if 's' in metadata else None,`
			`'quality': metadata['quality'][0],`
			`'type': metadata['type'][0],`
			`'mime': metadata['type'][0].split(';')[0],`
			`'container': mime_to_container(metadata['type'][0].split(';')[0]),`
			`}`

			`def extract(self, **kwargs):`
			`if not self.streams_sorted:`
			`# No stream is available`
			`return`

			`if 'stream_id' in kwargs and kwargs['stream_id']:`
			`# Extract the stream`
			`stream_id = kwargs['stream_id']`
			`if stream_id not in self.streams:`
			`log.e('[Error] Invalid video format.')`
change "[Error] Invalid video format." message 2014-07-30 05:48:26 +04:00			`log.e('Run \'-i\' command with no specific video format to view all available formats.')`
YouTube: OOP style 2014-07-17 11:01:44 +04:00			`exit(2)`
			`else:`
			`# Extract stream with the best quality`
			`stream_id = self.streams_sorted[0]['itag']`

			`src = self.streams[stream_id]['url']`

			`if self.streams[stream_id]['sig'] is not None:`
			`sig = self.streams[stream_id]['sig']`
			`src += '&signature={}'.format(sig)`

			`elif self.streams[stream_id]['s'] is not None:`
			`s = self.streams[stream_id]['s']`
			`js = get_content(self.html5player)`
			`sig = __class__.decipher(js, s)`
			`src += '&signature={}'.format(sig)`

			`self.streams[stream_id]['src'] = [src]`
			`self.streams[stream_id]['size'] = urls_size(self.streams[stream_id]['src'])`
initial commit 2012-08-20 19:54:03 +04:00
YouTube: OOP style 2014-07-17 11:01:44 +04:00			`site = YouTube()`
			`download = site.download_by_url`
			`download_playlist = site.download_playlist_by_url`