you-get/src/you_get/extractors/pinterest.py

#!/usr/bin/env python

from ..common import *
from ..extractor import VideoExtractor

class Pinterest(VideoExtractor):
    # site name
    name = "Pinterest"

    # ordered list of supported stream types / qualities on this site
    # order: high quality -> low quality
    stream_types = [
        {'id': 'original'}, # contains an 'id' or 'itag' field at minimum
        {'id': 'small'},
    ]

    def prepare(self, **kwargs):
        # scrape the html
        content = get_content(self.url)

        # extract title
        self.title = match1(content,
                            r'<meta property="og:description" name="og:description" content="([^"]+)"')

        # extract raw urls
        orig_img = match1(content,
                         r'<meta itemprop="image" content="([^"]+/originals/[^"]+)"')
        twit_img = match1(content,
                          r'<meta property="twitter:image:src" name="twitter:image:src" content="([^"]+)"')

        # construct available streams
        if orig_img: self.streams['original'] = {'url': orig_img}
        if twit_img: self.streams['small'] = {'url': twit_img}

    def extract(self, **kwargs):
        for i in self.streams:
            # for each available stream
            s = self.streams[i]
            # fill in 'container' field and 'size' field (optional)
            _, s['container'], s['size'] = url_info(s['url'])
            # 'src' field is a list of processed urls for direct downloading
            # usually derived from 'url'
            s['src'] = [s['url']]

site = Pinterest()
download = site.download_by_url
# TBD: implement download_playlist
[pinterest] new site support (using VideoExtractor) 2015-11-10 04:56:53 +03:00			`#!/usr/bin/env python`

			`from ..common import *`
			`from ..extractor import VideoExtractor`

			`class Pinterest(VideoExtractor):`
			`# site name`
			`name = "Pinterest"`

			`# ordered list of supported stream types / qualities on this site`
			`# order: high quality -> low quality`
			`stream_types = [`
			`{'id': 'original'}, # contains an 'id' or 'itag' field at minimum`
			`{'id': 'small'},`
			`]`

			`def prepare(self, **kwargs):`
			`# scrape the html`
			`content = get_content(self.url)`

			`# extract title`
			`self.title = match1(content,`
			`r'<meta property="og:description" name="og:description" content="([^"]+)"')`

			`# extract raw urls`
			`orig_img = match1(content,`
			`r'<meta itemprop="image" content="([^"]+/originals/[^"]+)"')`
			`twit_img = match1(content,`
			`r'<meta property="twitter:image:src" name="twitter:image:src" content="([^"]+)"')`

			`# construct available streams`
			`if orig_img: self.streams['original'] = {'url': orig_img}`
			`if twit_img: self.streams['small'] = {'url': twit_img}`

			`def extract(self, **kwargs):`
			`for i in self.streams:`
			`# for each available stream`
			`s = self.streams[i]`
			`# fill in 'container' field and 'size' field (optional)`
			`_, s['container'], s['size'] = url_info(s['url'])`
			`# 'src' field is a list of processed urls for direct downloading`
			`# usually derived from 'url'`
			`s['src'] = [s['url']]`

			`site = Pinterest()`
			`download = site.download_by_url`
			`# TBD: implement download_playlist`