1
0
mirror of https://github.com/spaam/svtplay-dl.git synced 2024-11-24 12:15:40 +01:00
svtplay-dl/lib/svtplay_dl/service/urplay.py

98 lines
3.8 KiB
Python
Raw Normal View History

2013-03-02 21:26:28 +01:00
# ex:ts=4:sw=4:sts=4:et
# -*- tab-width: 4; c-basic-offset: 4; indent-tabs-mode: nil -*-
from __future__ import absolute_import
import re
import json
2014-06-07 20:43:40 +02:00
import copy
2014-04-03 21:09:42 +02:00
import xml.etree.ElementTree as ET
from svtplay_dl.service import Service, OpenGraphThumbMixin
from svtplay_dl.utils.urllib import urljoin
from svtplay_dl.fetcher.hls import hlsparse
2015-09-06 22:41:29 +02:00
from svtplay_dl.log import log
from svtplay_dl.error import ServiceError
from svtplay_dl.subtitle import subtitle
from svtplay_dl.utils import filenamify
2015-09-15 20:10:32 +02:00
class Urplay(Service, OpenGraphThumbMixin):
    """Service implementation for the domains in ``supported_domains``.

    ``get`` reads the player configuration embedded in the page and
    yields subtitle and HLS stream objects.  ``find_all_episodes`` lists
    episode URLs, using the RSS feed linked from the page when there is
    one and falling back to scraping the page markup otherwise.
    """

    supported_domains = ['urplay.se', 'ur.se', 'betaplay.ur.se', 'urskola.se']

    def get(self):
        """Yield the subtitles and HLS streams found on the current page.

        A ``ServiceError`` is yielded (and iteration stops) when the
        ``urPlayer.init(...)`` JSON cannot be located in the page or when
        ``self.exclude()`` is true.
        """
        data = self.get_urldata()
        match = re.search(r"urPlayer.init\((.*)\);", data)
        if not match:
            yield ServiceError("Can't find json info")
            return

        if self.exclude():
            yield ServiceError("Excluding video")
            return

        jsondata = json.loads(match.group(1))

        # A missing or null "subtitles" entry simply means no subtitles.
        for sub in jsondata.get("subtitles") or []:
            if "label" not in sub:
                continue
            # Only the part of "file" before the first comma is used.
            suburl = sub["file"].split(",")[0]
            if self.options.get_all_subtitles:
                # The label is appended so that several subtitles can be
                # told apart.
                yield subtitle(copy.copy(self.options), "tt", suburl, "-" + filenamify(sub["label"]))
            else:
                yield subtitle(copy.copy(self.options), "tt", suburl)

        config = jsondata["streaming_config"]
        if "streamer" in config:
            basedomain = config["streamer"]["redirect"]
        else:
            # No streamer entry: ask the load balancer which host to use.
            lbjson = json.loads(self.http.request("get", config["loadbalancer"]).text)
            basedomain = lbjson["redirect"]

        hls_file = config["http_streaming"]["hls_file"]

        # Standard playlist first, then the HD one when the page has it.
        playlists = ["http://%s/%s%s" % (basedomain, jsondata["file_http"], hls_file)]
        if jsondata.get("file_http_hd"):
            playlists.append("http://%s/%s%s" % (basedomain, jsondata["file_http_hd"], hls_file))

        for playlist in playlists:
            streams = hlsparse(self.options, self.http.request("get", playlist), playlist)
            for stream in list(streams.values()):
                yield stream

    def scrape_episodes(self, options):
        """Return episode URLs scraped from the page markup.

        Links are resolved against ``self.url``.  ``options.all_last``
        limits the result to the last N links; ``-1`` means no limit and
        ``0`` yields an empty list, matching the RSS path in
        ``find_all_episodes``.
        """
        page = self.get_urldata()
        patterns = (
            r'<a class="puff tv video"\s+title="[^"]*"\s+href="([^"]*)"',
            r'<a class="card program"\s+href="([^"]*)"',
        )

        res = []
        for pattern in patterns:
            for relurl in re.findall(pattern, page):
                res.append(urljoin(self.url, relurl.replace("&amp;", "&")))

        if options.all_last == 0:
            # res[-0:] would be the whole list, not "the last zero".
            return []
        if options.all_last != -1:
            res = res[-options.all_last:]
        return res

    def find_all_episodes(self, options):
        """Return the unique episode URLs of the series on this page.

        The RSS feed advertised by the page is used when present;
        otherwise the page itself is scraped with ``scrape_episodes``.
        At most ``options.all_last`` unique URLs are returned from the
        feed, in feed order; a value that is never reached (such as
        ``-1``) returns them all.
        """
        match = re.search(r'<link rel="alternate" type="application/rss\+xml" [^>]*href="([^"]+)"',
                          self.get_urldata())
        if match is None:
            log.info("Couldn't retrieve episode list as rss, trying to scrape")
            return self.scrape_episodes(options)

        # urljoin gives the same result as plain concatenation for
        # site-relative hrefs and keeps absolute hrefs intact.
        url = urljoin("http://urplay.se", match.group(1).replace("&amp;", "&"))
        xml = ET.XML(self.http.request("get", url).content)

        episodes = []
        seen = set()
        for link in xml.findall(".//item/link"):
            # Count unique results so duplicates never use up the limit.
            if len(episodes) == options.all_last:
                break
            if link.text not in seen:
                seen.add(link.text)
                episodes.append(link.text)
        return episodes