you-get/src/you_get/extractors/acfun.py

#!/usr/bin/env python

# Names exported by `from <this module> import *`: only the URL-based
# entry point; the by-vid helper and get_srt_json are not listed.
__all__ = ['acfun_download']

from ..common import *

from .le import letvcloud_download_by_vu
from .qq import qq_download_by_vid
from .sina import sina_download_by_vid
from .tudou import tudou_download_by_iid
from .youku import youku_download_by_vid, youku_open_download_by_vid

import json, re

def get_srt_json(id):
    """Fetch the danmaku (comment) data for the given id.

    Builds the danmu.aixifan.com V2 URL for ``id`` and returns whatever
    get_html returns for it, without parsing.
    """
    return get_html('http://danmu.aixifan.com/V2/%s' % id)

def acfun_download_by_vid(vid, title, output_dir='.', merge=True, info_only=False, **kwargs):
    """str, str, str, bool, bool ->None

    Download Acfun video by vid.

    Call Acfun API, decide which site to use, and pass the job to its
    extractor. Afterwards, unless info_only or dry_run is set, try to
    save the danmaku (comments) as '<title>.cmt.json' in output_dir.

    vid        -- Acfun video id; concatenated into the API URLs, so it
                  must be a str.
    title      -- title passed to the extractor and used to name the
                  danmaku file.
    output_dir -- directory for the danmaku file; also forwarded to the
                  extractor.
    merge      -- forwarded to the extractor.
    info_only  -- forwarded to the extractor; when true the danmaku step
                  is skipped.
    kwargs     -- forwarded to the youku extractors. 'caption' controls
                  the danmaku step: a falsy value skips it, a missing key
                  is treated as enabled.

    Raises KeyError if the API response lacks 'sourceType', or lacks
    'sourceId' for a source type that needs it, and NotImplementedError
    for an unknown source type.
    """

    # First call the main parsing API.
    info = json.loads(get_html('http://www.acfun.tv/video/getVideo.aspx?id=' + vid))

    sourceType = info['sourceType']

    # Decide sourceId to know which video to ask the extractor for.
    # 'sourceId' may be absent from the response (the 'zhuzhan' branch
    # fetches its own), so read it defensively and fail with a clear
    # KeyError instead of an UnboundLocalError further down.
    sourceId = info.get('sourceId')
    if sourceId is None and sourceType in ('sina', 'youku', 'tudou', 'qq', 'letv'):
        raise KeyError('sourceId')
    # danmakuId = info['danmakuId']

    # Call the extractor decided by sourceType.
    if sourceType == 'sina':
        sina_download_by_vid(sourceId, title, output_dir=output_dir, merge=merge, info_only=info_only)
    elif sourceType == 'youku':
        youku_download_by_vid(sourceId, title=title, output_dir=output_dir, merge=merge, info_only=info_only, **kwargs)
    elif sourceType == 'tudou':
        tudou_download_by_iid(sourceId, title, output_dir=output_dir, merge=merge, info_only=info_only)
    elif sourceType == 'qq':
        qq_download_by_vid(sourceId, title, output_dir=output_dir, merge=merge, info_only=info_only)
    elif sourceType == 'letv':
        letvcloud_download_by_vu(sourceId, '2d8c027396', title, output_dir=output_dir, merge=merge, info_only=info_only)
    elif sourceType == 'zhuzhan':
        # As of Jul.28.2016, Acfun uses embsig for anti-hotlinking, so it
        # has to be passed on to the Youku extractor.
        embsig = info['encode']
        a = 'http://api.aixifan.com/plays/%s' % vid
        s = json.loads(get_content(a, headers={'deviceType': '2'}))
        # NOTE(review): any other s['data']['source'] value downloads no
        # video at all and falls through to the danmaku step silently.
        if s['data']['source'] == "zhuzhan-youku":
            sourceId = s['data']['sourceId']
            youku_open_download_by_vid(client_id='908a519d032263f8', vid=sourceId, title=title, output_dir=output_dir, merge=merge, info_only=info_only, embsig=embsig, **kwargs)
    else:
        raise NotImplementedError(sourceType)

    if not info_only and not dry_run:
        # A missing 'caption' key is treated as enabled rather than
        # raising KeyError after the video has already been downloaded.
        if not kwargs.get('caption', True):
            print('Skipping danmaku.')
            return
        try:
            title = get_filename(title)
            print('Downloading %s ...\n' % (title + '.cmt.json'))
            cmt = get_srt_json(vid)
            with open(os.path.join(output_dir, title + '.cmt.json'), 'w', encoding='utf-8') as x:
                x.write(cmt)
        except Exception:
            # Danmaku is best-effort: a failure here must not fail the
            # whole download, but KeyboardInterrupt/SystemExit should
            # still propagate (a bare except would swallow them too).
            print('Failed to download danmaku; skipping.')

def acfun_download(url, output_dir='.', merge=True, info_only=False, **kwargs):
    """str, str, bool, bool ->None

    Download every video part listed on an Acfun video page.

    Fetch the page at url, read the page title, find all
    (data-vid, part title) pairs in the HTML and hand each one to
    acfun_download_by_vid. Each part is titled '<page title> - <part title>',
    except that a part whose title is the placeholder '删除标签' uses the
    page title alone.

    output_dir, merge, info_only and kwargs are forwarded unchanged to
    acfun_download_by_vid.

    Raises AssertionError if url does not look like an Acfun video URL
    or no title can be read from the page.
    """
    assert re.match(r'http://[^\.]+.acfun.[^\.]+/\D/\D\D(\d+)', url)
    html = get_html(url)

    title = r1(r'<h1 id="txt-title-view">([^<>]+)<', html)
    # Check the raw match before post-processing, so a page without the
    # title element fails here rather than inside the helpers below
    # (assumes r1 yields a falsy value on no match -- confirm in common).
    assert title
    title = unescape_html(title)
    title = escape_file_path(title)
    assert title

    # Raw string: '\d' in a normal string literal is an invalid escape
    # sequence. The pattern itself is unchanged.
    videos = re.findall(r'data-vid="(\d+)".*href="[^"]+".*title="([^"]+)"', html)
    for p_vid, part_title in videos:
        if part_title != '删除标签':
            p_title = title + " - " + part_title
        else:
            p_title = title
        acfun_download_by_vid(p_vid, p_title,
                              output_dir=output_dir,
                              merge=merge,
                              info_only=info_only,
                              **kwargs)

# Module-level attributes describing this extractor; presumably looked up
# by name by the you-get dispatcher -- confirm against ..common.
site_info = "AcFun.tv"
download = acfun_download
# playlist_not_supported is not defined in this file; it can only come from
# the star import of ..common. Its return value is used as the playlist entry point.
download_playlist = playlist_not_supported('acfun')
add support for AcFun 2012-09-01 23:38:23 +04:00			`#!/usr/bin/env python`

			`__all__ = ['acfun_download']`

			`from ..common import *`

[letv] fix #947 2016-03-03 23:49:47 +03:00			`from .le import letvcloud_download_by_vu`
[qq] fix support 2015-06-19 06:46:43 +03:00			`from .qq import qq_download_by_vid`
Sina: fix #207 for video.sina.com 2013-07-14 19:34:42 +04:00			`from .sina import sina_download_by_vid`
add support for AcFun 2012-09-01 23:38:23 +04:00			`from .tudou import tudou_download_by_iid`
[Acfun]Fix Acfun Youku COOP, fix #1069 2016-04-28 08:29:22 +03:00			`from .youku import youku_download_by_vid, youku_open_download_by_vid`
add support for AcFun 2012-09-01 23:38:23 +04:00
			`import json, re`

			`def get_srt_json(id):`
[acfun] fix #776 2016-01-11 02:18:49 +03:00			`url = 'http://danmu.aixifan.com/V2/%s' % id`
add support for AcFun 2012-09-01 23:38:23 +04:00			`return get_html(url)`

[acfun] fix #776 2016-01-11 02:18:49 +03:00			`def acfun_download_by_vid(vid, title, output_dir='.', merge=True, info_only=False, **kwargs):`
[Acfun] Update embsig with Youku COOP to bypass anti hot linking 2016-07-28 11:24:12 +03:00			`"""str, str, str, bool, bool ->None`

			`Download Acfun video by vid.`

			`Call Acfun API, decide which site to use, and pass the job to its`
			`extractor.`
			`"""`

			`#first call the main parasing API`
Fix Acfun, add uu to Letvcloud, update key(fix #530, #495,#525, #528) 2015-05-28 05:29:49 +03:00			`info = json.loads(get_html('http://www.acfun.tv/video/getVideo.aspx?id=' + vid))`
[Acfun] Update embsig with Youku COOP to bypass anti hot linking 2016-07-28 11:24:12 +03:00
Fix Acfun, add uu to Letvcloud, update key(fix #530, #495,#525, #528) 2015-05-28 05:29:49 +03:00			`sourceType = info['sourceType']`
[Acfun] Update embsig with Youku COOP to bypass anti hot linking 2016-07-28 11:24:12 +03:00
			`#decide sourceId to know which extractor to use`
[acfun] fix #745 2015-11-11 03:41:16 +03:00			`if 'sourceId' in info: sourceId = info['sourceId']`
Fix Acfun, add uu to Letvcloud, update key(fix #530, #495,#525, #528) 2015-05-28 05:29:49 +03:00			`# danmakuId = info['danmakuId']`
[Acfun] Update embsig with Youku COOP to bypass anti hot linking 2016-07-28 11:24:12 +03:00
			`#call extractor decided by sourceId`
Fix Acfun, add uu to Letvcloud, update key(fix #530, #495,#525, #528) 2015-05-28 05:29:49 +03:00			`if sourceType == 'sina':`
			`sina_download_by_vid(sourceId, title, output_dir=output_dir, merge=merge, info_only=info_only)`
			`elif sourceType == 'youku':`
[acfun] fix exception when caption not present in youku source 2016-02-25 22:14:59 +03:00			`youku_download_by_vid(sourceId, title=title, output_dir=output_dir, merge=merge, info_only=info_only, **kwargs)`
Fix Acfun, add uu to Letvcloud, update key(fix #530, #495,#525, #528) 2015-05-28 05:29:49 +03:00			`elif sourceType == 'tudou':`
			`tudou_download_by_iid(sourceId, title, output_dir=output_dir, merge=merge, info_only=info_only)`
			`elif sourceType == 'qq':`
[qq] fix support 2015-06-19 06:46:43 +03:00			`qq_download_by_vid(sourceId, title, output_dir=output_dir, merge=merge, info_only=info_only)`
Fix Acfun, add uu to Letvcloud, update key(fix #530, #495,#525, #528) 2015-05-28 05:29:49 +03:00			`elif sourceType == 'letv':`
			`letvcloud_download_by_vu(sourceId, '2d8c027396', title, output_dir=output_dir, merge=merge, info_only=info_only)`
[acfun] fix #745 2015-11-11 03:41:16 +03:00			`elif sourceType == 'zhuzhan':`
[Acfun] Update embsig with Youku COOP to bypass anti hot linking 2016-07-28 11:24:12 +03:00			`#As in Jul.28.2016, Acfun is using embsig to anti hotlink so we need to pass this`
			`embsig = info['encode']`
[Acfun]Fix Acfun Youku COOP, fix #1069 2016-04-28 08:29:22 +03:00			`a = 'http://api.aixifan.com/plays/%s' % vid`
			`s = json.loads(get_content(a, headers={'deviceType': '2'}))`
			`if s['data']['source'] == "zhuzhan-youku":`
			`sourceId = s['data']['sourceId']`
[Acfun] Update embsig with Youku COOP to bypass anti hot linking 2016-07-28 11:24:12 +03:00			`youku_open_download_by_vid(client_id='908a519d032263f8', vid=sourceId, title=title, output_dir=output_dir,merge=merge, info_only=info_only, embsig = embsig, **kwargs)`
add support for AcFun 2012-09-01 23:38:23 +04:00			`else:`
Fix Acfun, add uu to Letvcloud, update key(fix #530, #495,#525, #528) 2015-05-28 05:29:49 +03:00			`raise NotImplementedError(sourceType)`
AcFun: fix #295 2014-02-14 05:20:06 +04:00
[acfun] fix #776 2016-01-11 02:18:49 +03:00			`if not info_only and not dry_run:`
			`if not kwargs['caption']:`
			`print('Skipping danmaku.')`
			`return`
Acfun: mute the exception if .cmt.json not available 2013-12-16 15:08:38 +04:00			`try:`
[acfun] fix #776 2016-01-11 02:18:49 +03:00			`title = get_filename(title)`
Acfun & Bilibili: 'Downloading %s ...\n' 2014-05-29 04:42:57 +04:00			`print('Downloading %s ...\n' % (title + '.cmt.json'))`
quick fix for acfun danmaku #408 2014-09-18 09:38:50 +04:00			`cmt = get_srt_json(vid)`
[acfun] fix #776 2016-01-11 02:18:49 +03:00			`with open(os.path.join(output_dir, title + '.cmt.json'), 'w', encoding='utf-8') as x:`
Acfun: mute the exception if .cmt.json not available 2013-12-16 15:08:38 +04:00			`x.write(cmt)`
			`except:`
			`pass`
format code 2015-01-27 18:44:45 +03:00
[acfun] fix "unexpected keyword argument 'json_output'" 2015-09-30 23:03:39 +03:00			`def acfun_download(url, output_dir='.', merge=True, info_only=False, **kwargs):`
AcFun: fix #475 2015-01-20 06:39:29 +03:00			`assert re.match(r'http://[^\.]+.acfun.[^\.]+/\D/\D\D(\d+)', url)`
add support for AcFun 2012-09-01 23:38:23 +04:00			`html = get_html(url)`
AcFun: fix #295 2014-02-14 05:20:06 +04:00
AcFun: fix #321 2014-04-13 15:31:21 +04:00			`title = r1(r'<h1 id="txt-title-view">([^<>]+)<', html)`
add support for AcFun 2012-09-01 23:38:23 +04:00			`title = unescape_html(title)`
			`title = escape_file_path(title)`
AcFun: fix #295 2014-02-14 05:20:06 +04:00			`assert title`

AcFun: fixed 2014-08-21 17:35:18 +04:00			`videos = re.findall("data-vid=\"(\d+)\".href=\"[^\"]+\".title=\"([^\"]+)\"", html)`
[acfun] fix #776 2016-01-11 02:18:49 +03:00			`for video in videos:`
			`p_vid = video[0]`
			`p_title = title + " - " + video[1] if video[1] != '删除标签' else title`
			`acfun_download_by_vid(p_vid, p_title,`
			`output_dir=output_dir,`
			`merge=merge,`
			`info_only=info_only,`
			`**kwargs)`
add support for AcFun 2012-09-01 23:38:23 +04:00
AcFun: fix 2014-07-19 01:53:48 +04:00			`site_info = "AcFun.tv"`
add support for AcFun 2012-09-01 23:38:23 +04:00			`download = acfun_download`
			`download_playlist = playlist_not_supported('acfun')`