mirror of
https://github.com/spaam/svtplay-dl.git
synced 2024-11-24 04:05:39 +01:00
309 lines
12 KiB
Python
309 lines
12 KiB
Python
# ex:ts=4:sw=4:sts=4:et
|
|
# -*- tab-width: 4; c-basic-offset: 4; indent-tabs-mode: nil -*-
|
|
|
|
# pylint has issues with urlparse: "some types could not be inferred"
|
|
# pylint: disable=E1103
|
|
|
|
from __future__ import absolute_import
|
|
import re
|
|
import json
|
|
import copy
|
|
import os
|
|
|
|
from svtplay_dl.utils import filenamify
|
|
from svtplay_dl.utils.urllib import urlparse
|
|
from svtplay_dl.service import Service, OpenGraphThumbMixin
|
|
from svtplay_dl.log import log
|
|
from svtplay_dl.fetcher.rtmp import RTMP
|
|
from svtplay_dl.fetcher.hds import hdsparse
|
|
from svtplay_dl.fetcher.hls import hlsparse
|
|
from svtplay_dl.subtitle import subtitle
|
|
from svtplay_dl.error import ServiceError
|
|
|
|
|
|
class Viaplay(Service, OpenGraphThumbMixin):
    """
    Service handler for the sites listed in ``supported_domains``.

    A video id is resolved from the page, after which metadata and stream
    locations are requested from the ``playapi.mtgx.tv`` v3 API.
    """

    supported_domains = [
        'tv3play.se', 'tv6play.se', 'tv8play.se', 'tv10play.se',
        'tv3play.no', 'tv3play.dk', 'tv6play.no', 'viasat4play.no',
        'tv3play.ee', 'tv3play.lv', 'tv3play.lt', 'tvplay.lv', 'viagame.com',
        'juicyplay.se', 'viafree.se', 'viafree.dk', 'viafree.no', 'viafree.fi',
        'play.tv3.lt', 'tv3play.tv3.ee', 'tvplay.skaties.lv'
    ]

    def _get_video_id(self, url=None):
        """
        Extract video id.

        The lookup order is: ``data-video-id`` / ``data-videoid`` attributes
        in the page markup, the ``params`` and ``ContentPageProgramStore``
        JSON embedded in the page behind ``self.url``, the path of
        ``self.url`` and finally an embedded juicyplay iframe.

        :param url: optional page to download and scan for the markup
            attributes and the iframe instead of the cached page data.
            The embedded JSON and URL path checks always use ``self.url``.
        :returns: the video id, or None in case it's unable to extract
            the ID at all.
        """
        if url:
            html_data = self.http.request("get", url).text
        else:
            html_data = self.get_urldata()

        for pattern in (r'data-video-id="([0-9]+)"', r'data-videoid="([0-9]+)'):
            match = re.search(pattern, html_data)
            if match:
                return match.group(1)

        match = re.search('params":({.*}),"query', self.get_urldata())
        if match:
            params = json.loads(match.group(1))
            if "seasonNumberOrVideoId" not in params:
                # get() only recognises None as "no id found".
                return None

            season = params["seasonNumberOrVideoId"]
            match = re.search(r"\w-(\d+)$", season)
            if match:
                season = match.group(1)

            clips = False
            if "videoIdOrEpisodeNumber" in params:
                videp = params["videoIdOrEpisodeNumber"]
                match = re.search(r'(\w+)-(\d+)', videp)
                if match:
                    episodenr = match.group(2)
                else:
                    # No "<word>-<digits>" form: the value itself is used as
                    # the id and returned without consulting the program list.
                    episodenr = videp
                    clips = True
                match = re.search(r'(s\w+)-(\d+)', season)
                if match:
                    season = match.group(2)
            else:
                # sometimes videoIdOrEpisodeNumber does not work.. this is a workaround
                match = re.search(r'(episode|avsnitt)-(\d+)', self.url)
                if match:
                    episodenr = match.group(2)
                else:
                    episodenr = season

            if clips:
                return episodenr

            match = self._conentpage(self.get_urldata())
            if match:
                store = json.loads(match.group(1))
                # Non-numeric slugs cannot be compared with episode/season
                # numbers; fall back to the id comparison instead of raising.
                try:
                    episode_int = int(episodenr)
                    season_int = int(season)
                    numeric = True
                except (TypeError, ValueError):
                    numeric = False

                for entry in store["format"]["videos"].values():
                    if "program" not in entry:
                        continue
                    for n in entry["program"]:
                        if (numeric and str(n["episodeNumber"])
                                and episode_int == n["episodeNumber"]
                                and season_int == n["seasonNumber"]):
                            return n["id"]
                        elif n["id"] == episodenr:
                            return episodenr

        parse = urlparse(self.url)
        match = re.search(r'/\w+/(\d+)', parse.path)
        if match:
            return match.group(1)
        match = re.search(r'iframe src="http://play.juicyplay.se[^\"]+id=(\d+)', html_data)
        if match:
            return match.group(1)
        return None

    def get(self):
        """
        Yield the subtitles and streams available for the video.

        A ``ServiceError`` is yielded (and iteration stops) when the video
        id cannot be found, the API answers 403 or returns a ``msg`` field,
        the video is excluded, or the RTMP path cannot be parsed.
        """
        vid = self._get_video_id()
        if vid is None:
            yield ServiceError("Can't find video file for: {0}".format(self.url))
            return

        data = self._get_video_data(vid)
        if data.status_code == 403:
            yield ServiceError("Can't play this because the video is geoblocked.")
            return
        dataj = json.loads(data.text)

        if "msg" in dataj:
            yield ServiceError(dataj["msg"])
            return

        if dataj["type"] == "live":
            self.options.live = True

        if self.options.output_auto:
            self.options.output = self.outputfilename(dataj, vid, self.options.output)

        if self.exclude():
            yield ServiceError("Excluding video")
            return

        stream_res = self.http.request("get", "http://playapi.mtgx.tv/v3/videos/stream/{0}".format(vid))
        if stream_res.status_code == 403:
            yield ServiceError("Can't play this because the video is geoblocked.")
            return
        streamj = json.loads(stream_res.text)

        if "msg" in streamj:
            yield ServiceError("Can't play this because the video is either not found or geoblocked.")
            return

        if dataj["sami_path"]:
            if dataj["sami_path"].endswith("vtt"):
                subtype = "wrst"
            else:
                subtype = "sami"
            yield subtitle(copy.copy(self.options), subtype, dataj["sami_path"])
        if dataj["subtitles_webvtt"]:
            yield subtitle(copy.copy(self.options), "wrst", dataj["subtitles_webvtt"])
        if dataj["subtitles_for_hearing_impaired"]:
            if dataj["subtitles_for_hearing_impaired"].endswith("vtt"):
                subtype = "wrst"
            else:
                subtype = "sami"
            if self.options.get_all_subtitles:
                yield subtitle(copy.copy(self.options), subtype, dataj["subtitles_for_hearing_impaired"], "-SDH")
            else:
                yield subtitle(copy.copy(self.options), subtype, dataj["subtitles_for_hearing_impaired"])

        if streamj["streams"]["medium"]:
            filename = streamj["streams"]["medium"]
            if ".f4m" in filename:
                streams = hdsparse(self.options, self.http.request("get", filename, params={"hdcore": "3.7.0"}), filename)
                if streams:
                    for n in list(streams.keys()):
                        yield streams[n]
            else:
                parse = urlparse(filename)
                match = re.search("^(/[^/]+)/(.*)", parse.path)
                if not match:
                    yield ServiceError("Can't get rtmpparse info")
                    return
                # parse.port is None when the URL has no explicit port;
                # formatting it blindly would produce "host:None".
                host = parse.hostname
                if parse.port is not None:
                    host = "{0}:{1}".format(host, parse.port)
                filename = "{0}://{1}{2}".format(parse.scheme, host, match.group(1))
                path = "-y {0}".format(match.group(2))
                self.options.other = "-W http://flvplayer.viastream.viasat.tv/flvplayer/play/swf/player.swf {0}".format(path)
                yield RTMP(copy.copy(self.options), filename, 800)

        if streamj["streams"]["hls"]:
            streams = hlsparse(self.options, self.http.request("get", streamj["streams"]["hls"]), streamj["streams"]["hls"])
            if streams:
                for n in list(streams.keys()):
                    yield streams[n]

    def find_all_episodes(self, options):
        """
        Return the sorted episode URLs for the show behind ``self.url``.

        The season is taken from the URL path when it contains
        ``sasong-N`` / ``sesong-N``; otherwise every season listed in the
        page's ``ContentPageProgramStore`` JSON is used. When
        ``options.all_last`` is positive only that many trailing entries
        of the sorted list are returned.
        """
        seasons = []
        match = re.search(r"(sasong|sesong)-(\d+)", urlparse(self.url).path)
        if match:
            seasons.append(match.group(2))
        else:
            match = self._conentpage(self.get_urldata())
            if match:
                janson = json.loads(match.group(1))
                for i in janson["format"]["seasons"]:
                    seasons.append(i["seasonNumber"])

        episodes = sorted(self._grab_episodes(options, seasons))
        if options.all_last > 0:
            return episodes[-options.all_last:]
        return episodes

    def _grab_episodes(self, options, seasons):
        """
        Collect episode URLs (and clip URLs when ``options.include_clips``
        is set) from the season pages of the given ``seasons``.

        :param seasons: iterable of season numbers; each is appended to
            the show's base URL as ``sasong-N`` or ``sesong-N``.
        :returns: list of sharing URLs accepted by ``_videos_to_list``.
        """
        episodes = []
        baseurl = self.url
        match = re.search(r"(sasong|sesong)-\d+", urlparse(self.url).path)
        if match:
            # Strip the trailing path component to get the show's base URL.
            baseurl = self.url[:self.url.rfind("/")]

        for i in seasons:
            url = "{0}/{1}-{2}".format(baseurl, self._isswe(self.url), i)
            res = self.http.get(url)
            if not res:
                continue
            match = self._conentpage(res.text)
            if not match:
                continue
            janson = json.loads(match.group(1))
            # A season without an entry in the videos map is treated as empty.
            videos = janson["format"]["videos"].get(str(i), {})
            if "program" in videos:
                for n in videos["program"]:
                    episodes = self._videos_to_list(n["sharingUrl"], n["id"], episodes)
            if options.include_clips:
                if "clip" in videos:
                    for n in videos["clip"]:
                        episodes = self._videos_to_list(n["sharingUrl"], n["id"], episodes)
        return episodes

    def _isswe(self, url):
        """
        Return the season path keyword for ``url``: ``"sasong"`` when the
        network location ends in ``.se``, otherwise ``"sesong"``.
        """
        if re.search(r"\.se$", urlparse(url).netloc):
            return "sasong"
        else:
            return "sesong"

    def _conentpage(self, data):
        """
        Search ``data`` for the embedded ``ContentPageProgramStore`` JSON.

        :returns: the regex match (group 1 holds the JSON text) or None.
        """
        return re.search('"ContentPageProgramStore":({.*}),"StartPageStore', data)

    def _videos_to_list(self, url, vid, episodes):
        """
        Append ``url`` to ``episodes`` unless the API reports a ``msg`` for
        ``vid``, the generated filename is excluded, or the URL is already
        present.

        :returns: the (possibly extended) ``episodes`` list.
        """
        dataj = json.loads(self._get_video_data(vid).text)
        if "msg" not in dataj:
            filename = self.outputfilename(dataj, vid, self.options.output)
            if not self.exclude2(filename) and url not in episodes:
                episodes.append(url)
        return episodes

    def _get_video_data(self, vid):
        """
        Request the metadata document for ``vid`` from the API.

        Also resets ``self.options.other`` to an empty string.

        :returns: the HTTP response object.
        """
        url = "http://playapi.mtgx.tv/v3/videos/{0}".format(vid)
        self.options.other = ""
        data = self.http.request("get", url)

        return data

    def outputfilename(self, data, vid, filename):
        """
        Build the automatic output name ``<autoname>-<vid>-<service>``.

        Sets ``self.options.service`` to ``"viafree"``. When ``filename``
        has a directory part, the generated name is placed in that
        directory.
        """
        self.options.service = "viafree"
        if filename:
            directory = os.path.dirname(filename)
        else:
            directory = ""

        basename = self._autoname(data)
        title = "{0}-{1}-{2}".format(basename, vid, self.options.service)
        if directory:
            return os.path.join(directory, title)
        return title

    def _autoname(self, dataj):
        """
        Derive a base name of the form ``program[.sNN[eNN]][.title]`` from
        the video metadata ``dataj``.

        For clips, the title is taken from ``dataj["title"]`` and missing
        season/episode numbers are looked up on the parent video named by
        ``derived_from_id`` (unless that request answers 403).
        """
        program = dataj["format_slug"]
        season = None
        episode = None
        title = None

        position = dataj["format_position"]
        if "season" in position:
            if position["season"] > 0:
                season = position["season"]
        if season:
            if len(position["episode"]) > 0:
                episode = position["episode"]
                try:
                    episode = int(episode)
                except ValueError:
                    # A non-numeric episode value becomes the title part.
                    title = filenamify(episode)
                    episode = None

        if dataj["type"] == "clip":
            # Removes the show name from the end of the filename
            # e.g. Showname.S0X.title instead of Showname.S07.title-showname
            match = re.search(r'(.+)-', dataj["title"])
            if match:
                title = filenamify(match.group(1))
            else:
                title = filenamify(dataj["title"])
            if "derived_from_id" in dataj:
                if dataj["derived_from_id"]:
                    parent_id = dataj["derived_from_id"]
                    parent_episode = self.http.request("get", "http://playapi.mtgx.tv/v3/videos/{0}".format(parent_id))
                    if parent_episode.status_code != 403:  # if not geoblocked
                        datajparent = json.loads(parent_episode.text)
                        if not season and datajparent["format_position"]["season"] > 0:
                            season = datajparent["format_position"]["season"]
                        if len(datajparent["format_position"]["episode"]) > 0:
                            episode = datajparent["format_position"]["episode"]

        name = filenamify(program)
        if season:
            name = "{0}.s{1:02d}".format(name, int(season))
        if episode:
            name = "{0}e{1:02d}".format(name, int(episode))
        if title:
            name = "{0}.{1}".format(name, title)

        return name
|