2013-03-02 21:26:28 +01:00
|
|
|
# ex:ts=4:sw=4:sts=4:et
|
|
|
|
# -*- tab-width: 4; c-basic-offset: 4; indent-tabs-mode: nil -*-
|
2013-04-27 13:17:00 +02:00
|
|
|
|
|
|
|
# pylint has issues with urlparse: "some types could not be inferred"
|
|
|
|
# pylint: disable=E1103
|
|
|
|
|
2013-03-01 23:39:42 +01:00
|
|
|
from __future__ import absolute_import
|
2013-02-12 19:43:37 +01:00
|
|
|
import re
|
2014-03-25 20:21:52 +01:00
|
|
|
import json
|
2014-06-07 20:43:40 +02:00
|
|
|
import copy
|
2015-10-24 21:55:33 +02:00
|
|
|
import os
|
2018-01-30 22:07:21 +01:00
|
|
|
from urllib.parse import urlparse
|
|
|
|
|
2013-02-12 19:43:37 +01:00
|
|
|
|
2018-03-13 00:33:39 +01:00
|
|
|
from svtplay_dl.utils.text import filenamify
|
2014-01-26 01:54:20 +01:00
|
|
|
from svtplay_dl.service import Service, OpenGraphThumbMixin
|
2014-04-21 17:13:38 +02:00
|
|
|
from svtplay_dl.fetcher.rtmp import RTMP
|
2014-05-01 16:52:05 +02:00
|
|
|
from svtplay_dl.fetcher.hds import hdsparse
|
2015-10-24 21:55:33 +02:00
|
|
|
from svtplay_dl.fetcher.hls import hlsparse
|
2014-08-31 01:20:36 +02:00
|
|
|
from svtplay_dl.subtitle import subtitle
|
2015-09-06 14:19:10 +02:00
|
|
|
from svtplay_dl.error import ServiceError
|
2013-02-12 19:43:37 +01:00
|
|
|
|
2015-09-15 20:10:32 +02:00
|
|
|
|
2014-01-26 01:54:20 +01:00
|
|
|
class Viaplay(Service, OpenGraphThumbMixin):
|
2014-01-01 14:57:17 +01:00
|
|
|
# Domains this service class declares support for (one entry per line,
# original order preserved).
supported_domains = [
    "tv3play.se",
    "tv6play.se",
    "tv8play.se",
    "tv10play.se",
    "tv3play.no",
    "tv3play.dk",
    "tv6play.no",
    "viasat4play.no",
    "tv3play.ee",
    "tv3play.lv",
    "tv3play.lt",
    "tvplay.lv",
    "viagame.com",
    "juicyplay.se",
    "viafree.se",
    "viafree.dk",
    "viafree.no",
    "viafree.fi",
    "play.tv3.lt",
    "tv3play.tv3.ee",
    "tvplay.skaties.lv",
]
|
2013-01-17 00:21:47 +01:00
|
|
|
|
2017-04-21 19:34:43 +02:00
|
|
|
def _get_video_id(self, url=None):
|
2014-03-09 15:56:00 +01:00
|
|
|
"""
|
|
|
|
Extract video id. It will try to avoid making an HTTP request
|
|
|
|
if it can find the ID in the URL, but otherwise it will try
|
|
|
|
to scrape it from the HTML document. Returns None in case it's
|
|
|
|
unable to extract the ID at all.
|
|
|
|
"""
|
2017-04-21 19:34:43 +02:00
|
|
|
if url:
|
|
|
|
html_data = self.http.request("get", url).text
|
|
|
|
else:
|
|
|
|
html_data = self.get_urldata()
|
2015-08-31 17:14:08 +02:00
|
|
|
html_data = self.get_urldata()
|
2014-06-22 22:46:00 +02:00
|
|
|
match = re.search(r'data-video-id="([0-9]+)"', html_data)
|
2014-06-26 22:04:16 +02:00
|
|
|
if match:
|
|
|
|
return match.group(1)
|
|
|
|
match = re.search(r'data-videoid="([0-9]+)', html_data)
|
2014-03-09 15:56:00 +01:00
|
|
|
if match:
|
|
|
|
return match.group(1)
|
|
|
|
|
2016-08-17 00:43:34 +02:00
|
|
|
clips = False
|
2018-03-04 12:25:44 +01:00
|
|
|
slug = None
|
2016-08-17 00:43:34 +02:00
|
|
|
match = re.search('params":({.*}),"query', self.get_urldata())
|
2016-08-15 19:32:52 +02:00
|
|
|
if match:
|
2016-08-17 00:43:34 +02:00
|
|
|
jansson = json.loads(match.group(1))
|
2016-09-14 20:52:14 +02:00
|
|
|
if "seasonNumberOrVideoId" in jansson:
|
|
|
|
season = jansson["seasonNumberOrVideoId"]
|
2016-09-28 12:48:56 +02:00
|
|
|
match = re.search("\w-(\d+)$", season)
|
|
|
|
if match:
|
|
|
|
season = match.group(1)
|
2016-09-14 20:52:14 +02:00
|
|
|
else:
|
|
|
|
return False
|
2016-08-20 17:16:40 +02:00
|
|
|
if "videoIdOrEpisodeNumber" in jansson:
|
|
|
|
videp = jansson["videoIdOrEpisodeNumber"]
|
2016-09-28 12:48:56 +02:00
|
|
|
match = re.search('(\w+)-(\d+)', videp)
|
2016-08-20 17:16:40 +02:00
|
|
|
if match:
|
|
|
|
episodenr = match.group(2)
|
|
|
|
else:
|
|
|
|
episodenr = videp
|
|
|
|
clips = True
|
2016-09-14 20:52:14 +02:00
|
|
|
match = re.search('(s\w+)-(\d+)', season)
|
|
|
|
if match:
|
|
|
|
season = match.group(2)
|
2016-08-17 00:43:34 +02:00
|
|
|
else:
|
2016-10-01 12:33:20 +02:00
|
|
|
# sometimes videoIdOrEpisodeNumber does not work.. this is a workaround
|
|
|
|
match = re.search('(episode|avsnitt)-(\d+)', self.url)
|
|
|
|
if match:
|
|
|
|
episodenr = match.group(2)
|
|
|
|
else:
|
|
|
|
episodenr = season
|
2018-03-04 12:25:44 +01:00
|
|
|
if "slug" in jansson:
|
|
|
|
slug = jansson["slug"]
|
2016-08-17 00:43:34 +02:00
|
|
|
|
|
|
|
if clips:
|
|
|
|
return episodenr
|
|
|
|
else:
|
2018-03-06 19:37:36 +01:00
|
|
|
match = self._conentpage(self.get_urldata())
|
2016-08-17 00:43:34 +02:00
|
|
|
if match:
|
|
|
|
janson = json.loads(match.group(1))
|
2016-09-03 18:39:49 +02:00
|
|
|
for i in janson["format"]["videos"].keys():
|
2017-02-02 14:20:33 +01:00
|
|
|
if "program" in janson["format"]["videos"][str(i)]:
|
|
|
|
for n in janson["format"]["videos"][i]["program"]:
|
|
|
|
if str(n["episodeNumber"]) and int(episodenr) == n["episodeNumber"] and int(season) == n["seasonNumber"]:
|
2018-03-04 12:25:44 +01:00
|
|
|
if slug is None or slug == n["formatSlug"]:
|
|
|
|
return n["id"]
|
2017-02-02 14:20:33 +01:00
|
|
|
elif n["id"] == episodenr:
|
|
|
|
return episodenr
|
2016-08-21 01:08:39 +02:00
|
|
|
|
2014-06-02 22:13:11 +02:00
|
|
|
parse = urlparse(self.url)
|
2014-09-11 23:45:08 +02:00
|
|
|
match = re.search(r'/\w+/(\d+)', parse.path)
|
2015-09-10 21:57:55 +02:00
|
|
|
if match:
|
|
|
|
return match.group(1)
|
2016-02-22 20:43:57 +01:00
|
|
|
match = re.search(r'iframe src="http://play.juicyplay.se[^\"]+id=(\d+)', html_data)
|
2014-03-09 15:56:00 +01:00
|
|
|
if match:
|
|
|
|
return match.group(1)
|
2018-05-06 15:30:41 +02:00
|
|
|
|
|
|
|
match = re.search(r'<meta property="og:image" content="([\S]+)"', html_data)
|
|
|
|
if match:
|
|
|
|
return match.group(1).split("/")[-2]
|
|
|
|
|
2014-03-09 15:56:00 +01:00
|
|
|
return None
|
2018-01-30 20:11:37 +01:00
|
|
|
|
2015-12-26 11:46:14 +01:00
|
|
|
def get(self):
    """
    Generator yielding what can be downloaded for ``self.url``.

    Yields a single ``ServiceError`` and stops when the video id cannot be
    found, when either API answer has status 403 or carries a ``msg`` key,
    when ``self.exclude()`` is true, or when an RTMP URL cannot be split.
    Otherwise yields subtitle objects first, then the HDS or RTMP stream(s)
    built from the ``medium`` stream URL, then the HLS streams.
    """
    video_id = self._get_video_id()
    if video_id is None:
        yield ServiceError("Can't find video file for: {0}".format(self.url))
        return

    meta_response = self._get_video_data(video_id)
    if meta_response.status_code == 403:
        yield ServiceError("Can't play this because the video is geoblocked.")
        return

    meta = json.loads(meta_response.text)
    if "msg" in meta:
        yield ServiceError(meta["msg"])
        return

    if meta["type"] == "live":
        self.options.live = True

    if self.options.output_auto:
        self.options.output = self.outputfilename(meta, video_id, self.options.output)

    if self.exclude():
        yield ServiceError("Excluding video")
        return

    stream_response = self.http.request("get", "http://playapi.mtgx.tv/v3/videos/stream/{0}".format(video_id))
    if stream_response.status_code == 403:
        yield ServiceError("Can't play this because the video is geoblocked.")
        return

    stream_info = json.loads(stream_response.text)
    if "msg" in stream_info:
        yield ServiceError("Can't play this because the video is either not found or geoblocked.")
        return

    # Subtitles: a path ending in "vtt" is handed over as "wrst", anything
    # else as "sami".
    if meta["sami_path"]:
        sami_kind = "wrst" if meta["sami_path"].endswith("vtt") else "sami"
        yield subtitle(copy.copy(self.options), sami_kind, meta["sami_path"])

    if meta["subtitles_webvtt"]:
        yield subtitle(copy.copy(self.options), "wrst", meta["subtitles_webvtt"])

    if meta["subtitles_for_hearing_impaired"]:
        sdh_kind = "wrst" if meta["subtitles_for_hearing_impaired"].endswith("vtt") else "sami"
        if self.options.get_all_subtitles:
            yield subtitle(copy.copy(self.options), sdh_kind, meta["subtitles_for_hearing_impaired"], "-SDH")
        else:
            yield subtitle(copy.copy(self.options), sdh_kind, meta["subtitles_for_hearing_impaired"])

    if stream_info["streams"]["medium"]:
        medium_url = stream_info["streams"]["medium"]
        if ".f4m" in medium_url:
            hds_streams = hdsparse(self.options, self.http.request("get", medium_url, params={"hdcore": "3.7.0"}), medium_url)
            if hds_streams:
                for key in list(hds_streams.keys()):
                    yield hds_streams[key]
        else:
            # Non-f4m URL: split the path into "/<first segment>" and the
            # remainder, which is passed on through the "-y" option.
            parts = urlparse(medium_url)
            split_path = re.search("^(/[^/]+)/(.*)", parts.path)
            if not split_path:
                yield ServiceError("Can't get rtmpparse info")
                return
            rtmp_url = "{0}://{1}:{2}{3}".format(parts.scheme, parts.hostname, parts.port, split_path.group(1))
            playpath = "-y {0}".format(split_path.group(2))
            self.options.other = "-W http://flvplayer.viastream.viasat.tv/flvplayer/play/swf/player.swf {0}".format(playpath)
            yield RTMP(copy.copy(self.options), rtmp_url, 800)

    if stream_info["streams"]["hls"]:
        hls_streams = hlsparse(self.options, self.http.request("get", stream_info["streams"]["hls"]), stream_info["streams"]["hls"])
        if hls_streams:
            for key in list(hls_streams.keys()):
                yield hls_streams[key]
|
2014-01-11 23:02:47 +01:00
|
|
|
|
2014-03-25 20:21:52 +01:00
|
|
|
def find_all_episodes(self, options):
    """
    Collect the episode URLs belonging to the show at ``self.url``.

    When the URL path carries a season marker (``saeson-N``, ``sasong-N``
    or ``sesong-N`` -- the same three spellings ``_grab_episodes`` and
    ``_isswe`` use) only that season is listed. Otherwise every season
    found in the page's ``ContentPageProgramStore`` JSON is listed.

    :param options: object providing ``all_last`` here and passed on to
        ``self._grab_episodes``.
    :returns: the last ``options.all_last`` collected URLs (in collection
        order) when ``all_last`` is positive, else all URLs sorted.
    """
    season_match = re.search(r"(saeson|sasong|sesong)-(\d+)", urlparse(self.url).path)
    if season_match:
        seasons = [season_match.group(2)]
    else:
        seasons = []
        store = self._conentpage(self.get_urldata())
        if store:
            listing = json.loads(store.group(1))
            seasons = [entry["seasonNumber"] for entry in listing["format"]["seasons"]]

    episodes = self._grab_episodes(options, seasons)
    if options.all_last > 0:
        return episodes[-options.all_last:]
    return sorted(episodes)
|
2017-09-08 18:59:18 +02:00
|
|
|
|
|
|
|
def _grab_episodes(self, options, seasons):
|
|
|
|
episodes = []
|
|
|
|
baseurl = self.url
|
2018-03-06 19:37:36 +01:00
|
|
|
match = re.search("(saeson|sasong|sesong)-\d+", urlparse(self.url).path)
|
2017-09-08 18:59:18 +02:00
|
|
|
if match:
|
|
|
|
baseurl = self.url[:self.url.rfind("/")]
|
2018-02-22 04:44:19 +01:00
|
|
|
baseurl = baseurl[:baseurl.rfind("/")]
|
2017-09-08 18:59:18 +02:00
|
|
|
|
|
|
|
for i in seasons:
|
|
|
|
url = "{0}/{1}-{2}".format(baseurl, self._isswe(self.url), i)
|
|
|
|
res = self.http.get(url)
|
|
|
|
if res:
|
|
|
|
match = self._conentpage(res.text)
|
|
|
|
if match:
|
|
|
|
janson = json.loads(match.group(1))
|
|
|
|
if "program" in janson["format"]["videos"][str(i)]:
|
|
|
|
for n in janson["format"]["videos"][str(i)]["program"]:
|
2018-01-30 20:11:37 +01:00
|
|
|
episodes = self._videos_to_list(n["sharingUrl"], n["id"], episodes)
|
2017-09-08 18:59:18 +02:00
|
|
|
if options.include_clips:
|
|
|
|
if "clip" in janson["format"]["videos"][str(i)]:
|
|
|
|
for n in janson["format"]["videos"][str(i)]["clip"]:
|
2018-01-30 20:11:37 +01:00
|
|
|
episodes = self._videos_to_list(n["sharingUrl"], n["id"], episodes)
|
2017-09-08 18:59:18 +02:00
|
|
|
return episodes
|
|
|
|
|
|
|
|
def _isswe(self, url):
|
|
|
|
if re.search(".se$", urlparse(url).netloc):
|
|
|
|
return "sasong"
|
2018-03-06 19:37:36 +01:00
|
|
|
elif re.search(".dk$", urlparse(url).netloc):
|
|
|
|
return "saeson"
|
2017-09-08 18:59:18 +02:00
|
|
|
else:
|
|
|
|
return "sesong"
|
|
|
|
|
|
|
|
def _conentpage(self, data):
|
2018-03-06 19:37:36 +01:00
|
|
|
return re.search('"ContentPageProgramStore":({.*}),[ ]*"ApplicationStore', data)
|
2017-09-08 18:59:18 +02:00
|
|
|
|
2018-01-30 20:11:37 +01:00
|
|
|
def _videos_to_list(self, url, vid, episodes):
|
2017-04-21 19:34:43 +02:00
|
|
|
dataj = json.loads(self._get_video_data(vid).text)
|
2018-01-30 20:11:37 +01:00
|
|
|
if "msg" not in dataj:
|
2017-04-21 19:34:43 +02:00
|
|
|
filename = self.outputfilename(dataj, vid, self.options.output)
|
|
|
|
if not self.exclude2(filename) and url not in episodes:
|
|
|
|
episodes.append(url)
|
|
|
|
return episodes
|
2018-01-30 20:11:37 +01:00
|
|
|
|
2017-04-21 19:34:43 +02:00
|
|
|
def _get_video_data(self, vid):
|
2017-10-09 22:35:13 +02:00
|
|
|
url = "http://playapi.mtgx.tv/v3/videos/{0}".format(vid)
|
2017-04-21 19:34:43 +02:00
|
|
|
self.options.other = ""
|
|
|
|
data = self.http.request("get", url)
|
|
|
|
return data
|
2018-01-30 20:11:37 +01:00
|
|
|
|
|
|
|
def outputfilename(self, data, vid, filename):
    """
    Build the output name ``<autoname>-<vid>-<service>`` for a video.

    Sets ``self.options.service`` to ``"viafree"`` as a side effect. When
    *filename* has a directory part, the generated name is placed inside
    that directory.

    :param data: video metadata, passed to ``self._autoname``.
    :param vid: video id embedded in the name.
    :param filename: currently configured output path; may be empty/None.
    :returns: the generated output path.
    """
    self.options.service = "viafree"
    directory = os.path.dirname(filename) if filename else ""

    title = "{0}-{1}-{2}".format(self._autoname(data), vid, self.options.service)
    if not directory:
        return title
    return os.path.join(directory, title)
|
2017-05-07 14:43:06 +02:00
|
|
|
|
2015-10-24 21:55:33 +02:00
|
|
|
def _autoname(self, dataj):
    """
    Build the base file name ``<program>[.sNN][eNN][.<title>]``.

    Season and episode come from ``dataj["format_position"]``. An episode
    value that is not a number is used as the title instead. For clips the
    title is taken from ``dataj["title"]`` (text before the last ``-`` when
    there is one) and, if the clip has a ``derived_from_id``, season and
    episode may be taken from that parent video, which is fetched over HTTP.

    :param dataj: decoded video metadata; must provide ``format_slug``,
        ``format_position``, ``type`` and ``title``.
    :returns: the generated name (components passed through ``filenamify``).
    """
    # NOTE(review): the source this was reconstructed from had lost its
    # indentation; the nesting of the "if episode / else" pair and of the
    # "derived_from_id" section follows the most plausible reading --
    # confirm against the repository.
    program = dataj["format_slug"]
    season = None
    episode = None
    title = None

    position = dataj["format_position"]
    if "season" in position and position["season"] > 0:
        season = position["season"]

    if season:
        if len(position["episode"]) > 0:
            episode = position["episode"]
        if episode:
            try:
                episode = int(episode)
            except (TypeError, ValueError):
                # int() raises ValueError for non-numeric text; the episode
                # field then holds a title rather than a number.
                title = filenamify(episode)
                episode = None
        else:
            title = filenamify(dataj["title"])

    if dataj["type"] == "clip":
        # Removes the show name from the end of the filename
        # e.g. Showname.S0X.title instead of Showname.S07.title-showname
        match = re.search(r'(.+)-', dataj["title"])
        title = filenamify(match.group(1) if match else dataj["title"])

        parent_id = dataj.get("derived_from_id")
        if parent_id:
            parent_episode = self.http.request("get", "http://playapi.mtgx.tv/v3/videos/{0}".format(parent_id))
            if parent_episode.status_code != 403:  # if not geoblocked
                parent_position = json.loads(parent_episode.text)["format_position"]
                if not season and parent_position["season"] > 0:
                    season = parent_position["season"]
                if len(parent_position["episode"]) > 0:
                    episode = parent_position["episode"]

    name = filenamify(program)
    if season:
        name = "{0}.s{1:02d}".format(name, int(season))
    if episode:
        name = "{0}e{1:02d}".format(name, int(episode))
    if title:
        name = "{0}.{1}".format(name, title)

    return name
|