pornhub commit

2025-02-09 03:37:52 +03:00 · 2020-05-28 14:45:19 +08:00 · 2020-05-28 14:45:19 +08:00 · f047840d24
commit f047840d24
parent eca7a1d569
2 changed files with 59 additions and 0 deletions
--- a/src/you_get/common.py
+++ b/src/you_get/common.py
@@ -125,6 +125,7 @@ SITES = {
    'zhanqi'           : 'zhanqi',
    'zhibo'            : 'zhibo',
    'zhihu'            : 'zhihu',
    'pornhub'          : 'pornhub',
 }
 dry_run = False
--- a/src/you_get/extractors/pornhub.py
+++ b/src/you_get/extractors/pornhub.py
@@ -0,0 +1,58 @@
 #!/usr/bin/env python
 __all__ = ['pornhub_download']
 import urllib.request, urllib.parse
 from ..common import *
 def pornhub_download(url, output_dir='.', merge=False, info_only=False, **kwargs):
    """Resolve and download the video referenced by a ``viewkey`` URL.

    The embed page ``https://www.pornhub.com/embed/<viewkey>`` is fetched and
    its first ``<script>`` block is scanned for ``name=value`` statements.
    The value of the chosen quality variable is a `` + ``-separated list of
    other variable names; concatenating the values of those variables gives
    the media URL.

    Args:
        url: Page URL; its query string must carry a ``viewkey`` parameter.
        output_dir: Directory handed to ``download_urls``.
        merge: Forwarded to ``download_urls`` as ``merge``.
        info_only: When true, only print the stream info and do not download.
        **kwargs: Accepted for interface compatibility; not used here.

    Raises:
        KeyError: If ``url`` has no ``viewkey`` parameter, or the quality
            variable names a URL fragment that was not found in the script.
        IndexError: If the page has no ``<title>`` or no ``<script>`` block.
        Exception: ``'Resource not found!'`` when none of the known quality
            variables is present in the script.
    """
    query = dict(urllib.parse.parse_qsl(urllib.parse.urlsplit(url).query))
    viewkey = query["viewkey"]
    html = get_html('https://www.pornhub.com/embed/' + viewkey)
    title = re.findall(r'<title>(.*?)</title>', html)[0]

    # Only the first inline script is inspected.
    scripts = re.findall(r"<script>(.*?)</script>", html, re.DOTALL)
    script = scripts[0].replace('\n', '').replace('\t', '')

    # Drop /* ... */ comments and the ``var `` keyword so that each
    # ';'-separated statement reads as a plain ``name=value`` pair.
    script = re.sub(r'/\*(.*?)\*/', "", script, flags=re.DOTALL)
    statements = script.replace(r'var ', '').split(";")

    param_dict = {}
    for statement in statements:
        if "=" in statement:
            name, value = statement.split("=", 1)
            # String literals are written as "a" + "b"; glue the pieces
            # together and remove the outer quotes.
            param_dict[name] = value.replace(r'" + "', '').strip(r'"')

    # Quality variables in order of preference: the first one present wins.
    fragment_names = []
    for quality in ("mp4480p", "mp4720p", "mp41080p"):
        if quality in param_dict:
            fragment_names = param_dict[quality].split(r' + ')
            break
    if not fragment_names:
        raise Exception('Resource not found!')

    # Each fragment name refers to another script variable holding a piece
    # of the final URL.
    real_url = "".join(param_dict[name] for name in fragment_names)

    media_type, ext, size = url_info(real_url)
    print_info(site_info, title, media_type, size)
    if not info_only:
        download_urls([real_url], title, ext, size, output_dir, merge=merge)
 # Site label that pornhub_download passes to print_info().
 site_info = "pornhub.com"
 # Module-level aliases for this extractor; presumably the names the you-get
 # dispatcher looks up on an extractor module -- confirm against common.py.
 download = pornhub_download
 # Result of the playlist_not_supported() helper imported from ..common.
 download_playlist = playlist_not_supported('pornhub')