mirror of
https://github.com/soimort/you-get.git
synced 2025-02-11 12:42:29 +03:00
133 lines
5.6 KiB
Python
133 lines
5.6 KiB
Python
#!/usr/bin/env python
|
|
import base64
|
|
|
|
import binascii
|
|
|
|
from ..common import *
|
|
import random
|
|
import ctypes
|
|
from json import loads
|
|
|
|
__all__ = ['ixigua_download', 'ixigua_download_playlist_by_url']
|
|
|
|
headers = {
|
|
"user-agent": "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/66.0.3359.139 "
|
|
"Safari/537.36",
|
|
}
|
|
|
|
|
|
def int_overflow(val):
|
|
maxint = 2147483647
|
|
if not -maxint - 1 <= val <= maxint:
|
|
val = (val + (maxint + 1)) % (2 * (maxint + 1)) - maxint - 1
|
|
return val
|
|
|
|
|
|
def unsigned_right_shitf(n, i):
|
|
if n < 0:
|
|
n = ctypes.c_uint32(n).value
|
|
if i < 0:
|
|
return -int_overflow(n << abs(i))
|
|
return int_overflow(n >> i)
|
|
|
|
|
|
def get_video_url_from_video_id(video_id):
|
|
"""Splicing URLs according to video ID to get video details"""
|
|
# from js
|
|
data = [""] * 256
|
|
for index, _ in enumerate(data):
|
|
t = index
|
|
for i in range(8):
|
|
t = -306674912 ^ unsigned_right_shitf(t, 1) if 1 & t else unsigned_right_shitf(t, 1)
|
|
data[index] = t
|
|
|
|
def tmp():
|
|
rand_num = random.random()
|
|
path = "/video/urls/v/1/toutiao/mp4/{video_id}?r={random_num}".format(video_id=video_id,
|
|
random_num=str(rand_num)[2:])
|
|
e = o = r = -1
|
|
i, a = 0, len(path)
|
|
while i < a:
|
|
e = ord(path[i])
|
|
i += 1
|
|
if e < 128:
|
|
r = unsigned_right_shitf(r, 8) ^ data[255 & (r ^ e)]
|
|
else:
|
|
if e < 2048:
|
|
r = unsigned_right_shitf(r, 8) ^ data[255 & (r ^ (192 | e >> 6 & 31))]
|
|
r = unsigned_right_shitf(r, 8) ^ data[255 & (r ^ (128 | 63 & e))]
|
|
else:
|
|
if 55296 <= e < 57344:
|
|
e = (1023 & e) + 64
|
|
i += 1
|
|
o = 1023 & t.url(i)
|
|
r = unsigned_right_shitf(r, 8) ^ data[255 & (r ^ (240 | e >> 8 & 7))]
|
|
r = unsigned_right_shitf(r, 8) ^ data[255 & (r ^ (128 | e >> 2 & 63))]
|
|
r = unsigned_right_shitf(r, 8) ^ data[255 & (r ^ (128 | o >> 6 & 15 | (3 & e) << 4))]
|
|
r = unsigned_right_shitf(r, 8) ^ data[255 & (r ^ (128 | 63 & o))]
|
|
else:
|
|
r = unsigned_right_shitf(r, 8) ^ data[255 & (r ^ (224 | e >> 12 & 15))]
|
|
r = unsigned_right_shitf(r, 8) ^ data[255 & (r ^ (128 | e >> 6 & 63))]
|
|
r = unsigned_right_shitf(r, 8) ^ data[255 & (r ^ (128 | 63 & e))]
|
|
|
|
return "https://ib.365yg.com{path}&s={param}".format(path=path, param=unsigned_right_shitf(r ^ -1, 0))
|
|
|
|
while 1:
|
|
url = tmp()
|
|
if url.split("=")[-1][0] != "-": # 参数s不能为负数
|
|
return url
|
|
|
|
|
|
def ixigua_download(url, output_dir='.', merge=True, info_only=False, **kwargs):
|
|
# example url: https://www.ixigua.com/i6631065141750268420/#mid=63024814422
|
|
html = get_html(url, faker=True)
|
|
video_id = match1(html, r"videoId\s*:\s*'([^']+)'")
|
|
title = match1(html, r"title: '(\S+)',")
|
|
if not video_id:
|
|
log.e("video_id not found, url:{}".format(url))
|
|
return
|
|
video_info_url = get_video_url_from_video_id(video_id)
|
|
video_info = loads(get_content(video_info_url))
|
|
if video_info.get("code", 1) != 0:
|
|
log.e("Get video info from {} error: server return code {}".format(video_info_url, video_info.get("code", 1)))
|
|
return
|
|
if not video_info.get("data", None):
|
|
log.e("Get video info from {} error: The server returns JSON value"
|
|
" without data or data is empty".format(video_info_url))
|
|
return
|
|
if not video_info["data"].get("video_list", None):
|
|
log.e("Get video info from {} error: The server returns JSON value"
|
|
" without data.video_list or data.video_list is empty".format(video_info_url))
|
|
return
|
|
if not video_info["data"]["video_list"].get("video_1", None):
|
|
log.e("Get video info from {} error: The server returns JSON value"
|
|
" without data.video_list.video_1 or data.video_list.video_1 is empty".format(video_info_url))
|
|
return
|
|
size = int(video_info["data"]["video_list"]["video_1"]["size"])
|
|
print_info(site_info=site_info, title=title, type="mp4", size=size) # 该网站只有mp4类型文件
|
|
if not info_only:
|
|
video_url = base64.b64decode(video_info["data"]["video_list"]["video_1"]["main_url"].encode("utf-8"))
|
|
download_urls([video_url.decode("utf-8")], title, "mp4", size, output_dir, merge=merge, headers=headers, **kwargs)
|
|
|
|
|
|
def ixigua_download_playlist_by_url(url, output_dir='.', merge=True, info_only=False, **kwargs):
|
|
assert "user" in url, "Only support users to publish video list,Please provide a similar url:" \
|
|
"https://www.ixigua.com/c/user/6907091136/"
|
|
|
|
user_id = url.split("/")[-2] if url[-1] == "/" else url.split("/")[-1]
|
|
params = {"max_behot_time": "0", "max_repin_time": "0", "count": "20", "page_type": "0", "user_id": user_id}
|
|
while 1:
|
|
url = "https://www.ixigua.com/c/user/article/?" + "&".join(["{}={}".format(k, v) for k, v in params.items()])
|
|
video_list = loads(get_content(url, headers=headers))
|
|
params["max_behot_time"] = video_list["next"]["max_behot_time"]
|
|
for video in video_list["data"]:
|
|
ixigua_download("https://www.ixigua.com/i{}/".format(video["item_id"]), output_dir, merge, info_only,
|
|
**kwargs)
|
|
if video_list["next"]["max_behot_time"] == 0:
|
|
break
|
|
|
|
|
|
site_info = "ixigua.com"
|
|
download = ixigua_download
|
|
download_playlist = ixigua_download_playlist_by_url
|