mirror of
https://github.com/soimort/you-get.git
synced 2025-02-02 16:24:00 +03:00
Merge branch 'pinterest' into develop (close #744)
This commit is contained in:
commit
312bfc9b8c
@ -47,6 +47,7 @@ SITES = {
|
|||||||
'mtv81' : 'mtv81',
|
'mtv81' : 'mtv81',
|
||||||
'7gogo' : 'nanagogo',
|
'7gogo' : 'nanagogo',
|
||||||
'nicovideo' : 'nicovideo',
|
'nicovideo' : 'nicovideo',
|
||||||
|
'pinterest' : 'pinterest',
|
||||||
'pixnet' : 'pixnet',
|
'pixnet' : 'pixnet',
|
||||||
'pptv' : 'pptv',
|
'pptv' : 'pptv',
|
||||||
'qianmo' : 'qianmo',
|
'qianmo' : 'qianmo',
|
||||||
|
@ -40,6 +40,7 @@ from .mtv81 import *
|
|||||||
from .nanagogo import *
|
from .nanagogo import *
|
||||||
from .netease import *
|
from .netease import *
|
||||||
from .nicovideo import *
|
from .nicovideo import *
|
||||||
|
from .pinterest import *
|
||||||
from .pixnet import *
|
from .pixnet import *
|
||||||
from .pptv import *
|
from .pptv import *
|
||||||
from .qianmo import *
|
from .qianmo import *
|
||||||
|
47
src/you_get/extractors/pinterest.py
Normal file
47
src/you_get/extractors/pinterest.py
Normal file
@ -0,0 +1,47 @@
|
|||||||
|
#!/usr/bin/env python
|
||||||
|
|
||||||
|
from ..common import *
|
||||||
|
from ..extractor import VideoExtractor
|
||||||
|
|
||||||
|
class Pinterest(VideoExtractor):
|
||||||
|
# site name
|
||||||
|
name = "Pinterest"
|
||||||
|
|
||||||
|
# ordered list of supported stream types / qualities on this site
|
||||||
|
# order: high quality -> low quality
|
||||||
|
stream_types = [
|
||||||
|
{'id': 'original'}, # contains an 'id' or 'itag' field at minimum
|
||||||
|
{'id': 'small'},
|
||||||
|
]
|
||||||
|
|
||||||
|
def prepare(self, **kwargs):
|
||||||
|
# scrape the html
|
||||||
|
content = get_content(self.url)
|
||||||
|
|
||||||
|
# extract title
|
||||||
|
self.title = match1(content,
|
||||||
|
r'<meta property="og:description" name="og:description" content="([^"]+)"')
|
||||||
|
|
||||||
|
# extract raw urls
|
||||||
|
orig_img = match1(content,
|
||||||
|
r'<meta itemprop="image" content="([^"]+/originals/[^"]+)"')
|
||||||
|
twit_img = match1(content,
|
||||||
|
r'<meta property="twitter:image:src" name="twitter:image:src" content="([^"]+)"')
|
||||||
|
|
||||||
|
# construct available streams
|
||||||
|
if orig_img: self.streams['original'] = {'url': orig_img}
|
||||||
|
if twit_img: self.streams['small'] = {'url': twit_img}
|
||||||
|
|
||||||
|
def extract(self, **kwargs):
|
||||||
|
for i in self.streams:
|
||||||
|
# for each available stream
|
||||||
|
s = self.streams[i]
|
||||||
|
# fill in 'container' field and 'size' field (optional)
|
||||||
|
_, s['container'], s['size'] = url_info(s['url'])
|
||||||
|
# 'src' field is a list of processed urls for direct downloading
|
||||||
|
# usually derived from 'url'
|
||||||
|
s['src'] = [s['url']]
|
||||||
|
|
||||||
|
site = Pinterest()
|
||||||
|
download = site.download_by_url
|
||||||
|
# TBD: implement download_playlist
|
Loading…
Reference in New Issue
Block a user