2013-03-02 21:26:28 +01:00
|
|
|
# ex:ts=4:sw=4:sts=4:et
|
|
|
|
# -*- tab-width: 4; c-basic-offset: 4; indent-tabs-mode: nil -*-
|
2013-03-01 23:39:42 +01:00
|
|
|
from __future__ import absolute_import
|
2013-03-23 16:11:36 +01:00
|
|
|
import re
|
2014-01-05 17:28:00 +01:00
|
|
|
from svtplay_dl.utils.urllib import urlparse
|
2014-08-17 10:57:08 +02:00
|
|
|
from svtplay_dl.utils import download_thumbnail, get_http_data
|
|
|
|
|
2014-01-19 14:26:48 +01:00
|
|
|
import logging
|
|
|
|
|
|
|
|
log = logging.getLogger('svtplay_dl')
|
2013-03-23 16:11:36 +01:00
|
|
|
|
|
|
|
class Service(object):
    """
    Base class for site handlers.

    An instance wraps one page URL and fetches its content lazily.
    Subclasses list the hosts they accept in the two class attributes
    below and override the hooks at the bottom of the class.
    """

    # Host names (compared against the URL's netloc) accepted as-is;
    # handles() also accepts each of them with a "www." prefix.
    supported_domains = []

    # Regular expressions applied with match() to the netloc, for hosts
    # that cannot be enumerated up front.
    supported_domains_re = []

    def __init__(self, _url):
        """Store the URL; nothing is downloaded until get_urldata()."""
        self._urldata = None
        self._url = _url

    @property
    def url(self):
        """The URL this handler was created for."""
        return self._url

    def get_urldata(self):
        """Return get_http_data(self.url), reusing a previously stored result."""
        if self._urldata is not None:
            return self._urldata
        self._urldata = get_http_data(self.url)
        return self._urldata

    @classmethod
    def handles(cls, url):
        """Return True if the netloc of url belongs to this service."""
        netloc = urlparse(url).netloc

        # Apply supported_domains_re to the netloc. This is meant for
        # 'dynamic' domains, e.g. containing country information etc.
        # All patterns are compiled before any of them is tried.
        compiled = [re.compile(pattern) for pattern in cls.supported_domains_re]
        if any(regex.match(netloc) for regex in compiled):
            return True

        domains = cls.supported_domains
        if netloc in domains:
            return True

        # Every listed domain is also accepted with a www. subdomain.
        return netloc in ['www.' + domain for domain in domains]

    def get_subtitle(self, options):
        """Hook for subtitle retrieval; the base implementation does nothing."""
        pass

    # options is part of the interface even though this default
    # implementation never reads it, hence the pylint ignore.
    def find_all_episodes(self, options):  # pylint: disable-msg=unused-argument
        """Default for services without episode listing: warn, return own URL."""
        log.warning("--all-episodes not implemented for this service")
        return [self.url]
|
2014-01-19 14:26:48 +01:00
|
|
|
|
2014-02-18 16:17:02 +01:00
|
|
|
def opengraph_get(html, prop):
    """
    Extract specified OpenGraph property from html.

    Looks for a <meta> tag whose property="og:<prop>" attribute is
    directly followed by the content="..." attribute and, if none is
    found anywhere in html, for one where content directly precedes
    property. prop is matched literally.

    Returns the content value as a string, or None if neither form
    is present.

        >>> opengraph_get('<html><head><meta property="og:image" content="http://example.com/img.jpg"><meta ...', "image")
        'http://example.com/img.jpg'
        >>> opengraph_get('<html><head><meta content="http://example.com/img2.jpg" property="og:image"><meta ...', "image")
        'http://example.com/img2.jpg'
        >>> opengraph_get('<html><head><meta name="og:image" property="og:image" content="http://example.com/img3.jpg"><meta ...', "image")
        'http://example.com/img3.jpg'
    """
    # Escape prop so names containing regex metacharacters (e.g. the "."
    # in "image.width") neither match unrelated properties nor produce
    # an invalid pattern.
    property_attr = 'property="og:' + re.escape(prop) + '"'
    content_attr = 'content="([^"]*)"'

    # Order matters: property-before-content is searched over the whole
    # document first, content-before-property only as a fallback.
    patterns = (
        '<meta [^>]*' + property_attr + ' ' + content_attr,
        '<meta [^>]*' + content_attr + ' ' + property_attr,
    )
    for pattern in patterns:
        match = re.search(pattern, html)
        if match is not None:
            return match.group(1)
    return None
|
|
|
|
|
|
|
|
|
2014-01-19 14:26:48 +01:00
|
|
|
class OpenGraphThumbMixin(object):
    """
    Mixin for service classes whose thumbnail is the page's OpenGraph image.

    Relies on the class it is mixed into to provide get_urldata().
    """

    def get_thumbnail(self, options):
        """Download the og:image of the page, if the page declares one."""
        thumbnail_url = opengraph_get(self.get_urldata(), "image")
        if thumbnail_url is not None:
            download_thumbnail(options, thumbnail_url)
|
2014-01-19 14:26:48 +01:00
|
|
|
|
|
|
|
|
2013-03-23 15:56:25 +01:00
|
|
|
from svtplay_dl.service.aftonbladet import Aftonbladet
|
2014-08-17 10:57:08 +02:00
|
|
|
from svtplay_dl.service.bambuser import Bambuser
|
|
|
|
from svtplay_dl.service.dbtv import Dbtv
|
2013-03-23 15:56:25 +01:00
|
|
|
from svtplay_dl.service.dr import Dr
|
|
|
|
from svtplay_dl.service.expressen import Expressen
|
|
|
|
from svtplay_dl.service.hbo import Hbo
|
|
|
|
from svtplay_dl.service.justin import Justin
|
|
|
|
from svtplay_dl.service.kanal5 import Kanal5
|
2014-08-17 10:57:08 +02:00
|
|
|
from svtplay_dl.service.lemonwhale import Lemonwhale
|
|
|
|
from svtplay_dl.service.mtvnn import Mtvnn
|
2013-04-21 21:51:45 +02:00
|
|
|
from svtplay_dl.service.mtvservices import Mtvservices
|
2013-03-23 15:56:25 +01:00
|
|
|
from svtplay_dl.service.nrk import Nrk
|
2014-08-17 10:57:08 +02:00
|
|
|
from svtplay_dl.service.oppetarkiv import OppetArkiv
|
2014-03-25 15:37:41 +01:00
|
|
|
from svtplay_dl.service.picsearch import Picsearch
|
2014-08-17 10:57:08 +02:00
|
|
|
from svtplay_dl.service.qbrick import Qbrick
|
2013-03-23 15:56:25 +01:00
|
|
|
from svtplay_dl.service.radioplay import Radioplay
|
2014-08-17 10:57:08 +02:00
|
|
|
from svtplay_dl.service.ruv import Ruv
|
2013-03-23 15:56:25 +01:00
|
|
|
from svtplay_dl.service.sr import Sr
|
|
|
|
from svtplay_dl.service.svtplay import Svtplay
|
|
|
|
from svtplay_dl.service.tv4play import Tv4play
|
|
|
|
from svtplay_dl.service.urplay import Urplay
|
2014-08-17 10:57:08 +02:00
|
|
|
from svtplay_dl.service.vg import Vg
|
2013-03-23 15:56:25 +01:00
|
|
|
from svtplay_dl.service.viaplay import Viaplay
|
|
|
|
from svtplay_dl.service.vimeo import Vimeo
|
|
|
|
|
2013-03-23 15:58:15 +01:00
|
|
|
# Registry of service classes. Lookups walk this list from the top and use
# the first class whose handles() accepts the URL, so the order is
# significant and must be kept.
sites = [
    Aftonbladet,
    Bambuser,
    Dbtv,
    Dr,
    Expressen,
    Hbo,
    Justin,
    Lemonwhale,
    Kanal5,
    Mtvservices,
    Mtvnn,
    Nrk,
    Qbrick,
    Picsearch,
    Ruv,
    Radioplay,
    Sr,
    Svtplay,
    OppetArkiv,
    Tv4play,
    Urplay,
    Viaplay,
    Vimeo,
    Vg,
]
|
2013-03-23 15:58:15 +01:00
|
|
|
|
2013-02-28 21:44:28 +01:00
|
|
|
|
2013-03-10 13:28:31 +01:00
|
|
|
class Generic(object):
    ''' Videos embed in sites '''

    @staticmethod
    def _find_site(url):
        """Return the first class in ``sites`` whose handles() accepts url, else None."""
        for site in sites:
            if site.handles(url):
                return site
        return None

    def get(self, url):
        """
        Download the page at url and look for a known embedded player.

        The embed patterns are tried in a fixed order; the first one
        that yields a URL accepted by a registered service wins.

        Returns a tuple (media_url, handler) where handler is an
        instance of the matching service class created for media_url.
        If nothing usable is found, handler is None and the first
        element is the URL last derived from the page (or the original
        url if no pattern matched at all).
        """
        data = get_http_data(url)

        # SVT widget embedded via a src attribute.
        match = re.search(r"src=\"(http://www.svt.se/wd.*)\" height", data)
        if match:
            url = match.group(1)
            site = self._find_site(url)
            if site is not None:
                # The URL was lifted out of an HTML attribute, where "&"
                # is written as the entity "&amp;"; decode it before use.
                url = url.replace("&amp;", "&")
                return url, site(url)

        # Vimeo player iframe.
        match = re.search(r"src=\"(http://player.vimeo.com/video/[0-9]+)\" ", data)
        if match:
            player_url = match.group(1)
            site = self._find_site(player_url)
            if site is not None:
                # Hand the handler the player URL it was matched on, like
                # every other branch, not the embedding page's URL.
                return player_url, site(player_url)

        # TV4 Play iframe. The id group is mandatory so that a page without
        # an id cannot yield a "video_id=None" URL.
        match = re.search(r"tv4play.se/iframe/video/(\d+)", data)
        if match:
            url = "http://www.tv4play.se/?video_id=%s" % match.group(1)
            site = self._find_site(url)
            if site is not None:
                return url, site(url)

        # Bambuser broadcast embed.
        match = re.search(r"embed.bambuser.com/broadcast/(\d+)", data)
        if match:
            url = "http://bambuser.com/v/%s" % match.group(1)
            site = self._find_site(url)
            if site is not None:
                return url, site(url)

        # Aftonbladet TV, embedded as an iframe ...
        match = re.search(r'iframe src="(http://tv.aftonbladet[^"]*)"', data)
        if match:
            url = match.group(1)
            site = self._find_site(url)
            if site is not None:
                return url, site(url)

        # ... or linked through an anchor whose class starts with "abVi".
        match = re.search(r'a href="(http://tv.aftonbladet[^"]*)" class="abVi', data)
        if match:
            url = match.group(1)
            site = self._find_site(url)
            if site is not None:
                return url, site(url)

        # SVT Play iframe (single-quoted src).
        match = re.search(r"iframe src='(http://www.svtplay[^']*)'", data)
        if match:
            url = match.group(1)
            site = self._find_site(url)
            if site is not None:
                return url, site(url)

        # No embed could be resolved to a service.
        return url, None
|
|
|
|
|
2013-02-28 21:44:28 +01:00
|
|
|
def service_handler(url):
    """
    Create a handler for url from the first matching entry in ``sites``.

    Returns an instance of that service class constructed with url, or
    None when no registered class reports that it handles the URL.
    """
    for site in sites:
        if site.handles(url):
            return site(url)
    return None
|