1
0
mirror of https://github.com/spaam/svtplay-dl.git synced 2024-11-24 04:05:39 +01:00
svtplay-dl/lib/svtplay_dl/service/picsearch.py

115 lines
4.9 KiB
Python
Raw Normal View History

# ex:ts=4:sw=4:sts=4:et
# -*- tab-width: 4; c-basic-offset: 4; indent-tabs-mode: nil -*-
2014-06-07 20:43:40 +02:00
import copy
2019-08-25 00:40:39 +02:00
import json
import re
2018-01-30 22:07:21 +01:00
from urllib.parse import urlparse
2019-08-25 00:40:39 +02:00
from svtplay_dl.error import ServiceError
2016-04-19 21:08:17 +02:00
from svtplay_dl.fetcher.hls import hlsparse
from svtplay_dl.fetcher.http import HTTP
2019-08-25 00:40:39 +02:00
from svtplay_dl.service import OpenGraphThumbMixin
from svtplay_dl.service import Service
2015-09-15 20:10:32 +02:00
class Picsearch(Service, OpenGraphThumbMixin):
    """Service handler for Picsearch / Screen9 video embeds.

    The auth token and the media id are scraped from the page markup
    (or from a secondary script / iframe document the page points at) and
    then used to query the Screen9 player endpoint for stream URLs.
    """

    supported_domains = ["dn.se", "mobil.dn.se", "di.se", "csp.picsearch.com", "csp.screen9.com"]

    # URL of the secondary document (REST script or iframe) fetched by
    # get_auth(); when set, get() also queries it for extra HLS streams.
    backupapi = None

    def get(self):
        """Yield the available streams, or a ServiceError when lookup fails.

        Failures to locate the auth token or the media id are reported by
        yielding a ServiceError instead of raising.
        """
        auth = self.get_auth()
        if not auth:
            yield ServiceError("Cant find token for video")
            return

        mediaid = self.get_mediaid()
        if not mediaid:
            yield ServiceError("Cant find media id")
            return

        # get_mediaid() hands back either a regex match object or, as a last
        # resort, the plain URL fragment string.
        media_key = mediaid if isinstance(mediaid, str) else mediaid.group(1)

        player_url = f"http://csp.screen9.com/player?eventParam=1&ajaxauth={auth.group(1)}&method=embed&mediaid={media_key}"
        payload = json.loads(self.http.request("get", player_url).text)

        if "data" in payload:
            details = payload["data"]
            status = details["publishing_status"]
            if "live" in status:
                self.config.set("live", status["live"])

            for stream in details["streams"]:
                if "application/x-mpegurl" in stream:
                    hls_url = stream["application/x-mpegurl"]
                    yield from hlsparse(
                        self.config,
                        self.http.request("get", hls_url),
                        hls_url,
                        output=self.output,
                    )
                # Deliberately a separate `if`: one entry may carry both formats.
                if "video/mp4" in stream:
                    # NOTE(review): 800 is presumably the bitrate reported for
                    # the progressive download - confirm against HTTP's signature.
                    yield HTTP(copy.copy(self.config), stream["video/mp4"], 800, output=self.output)

        if not self.backupapi:
            return

        # The backup endpoint answers with a script call wrapping the JSON
        # object; strip the wrapper and everything after the last comma so
        # that only the JSON object is left to parse.
        response = self.http.get(self.backupapi.replace("i=", ""), params={"i": "object"})
        wrapped = response.text.replace("ps.embedHandler(", "").replace('"");', "")
        embed = json.loads(wrapped[: wrapped.rfind(",")])
        for entry in embed["media"]["playerconfig"]["playlist"]:
            if "provider" in entry and entry["provider"] == "httpstreaming":
                yield from hlsparse(self.config, self.http.request("get", entry["url"]), entry["url"], output=self.output)

    def get_auth(self):
        """Return a regex match whose group(1) is the ajax auth token, or None.

        The page markup is tried first. If that fails, the REST script and
        then the Screen9 iframe referenced by the page are downloaded and
        searched; whichever of those is fetched is remembered in
        ``self.backupapi``.
        """
        page_patterns = (
            r"picsearch_ajax_auth[ ]*=[ ]*['\"]([^'\"]+)['\"]",
            r'screen9-ajax-auth="([^"]+)"',
            'screen9"[ ]*:[ ]*"([^"]+)"',
            'data-auth="([^"]+)"',
        )
        for pattern in page_patterns:
            found = re.search(pattern, self.get_urldata())
            if found:
                return found

        script = re.search('s.src="(https://csp-ssl.picsearch.com[^"]+|http://csp.picsearch.com/rest[^"]+)', self.get_urldata())
        if script:
            rest_url = script.group(1)
            response = self.http.request("get", rest_url)
            self.backupapi = rest_url
            found = re.search(r'ajaxAuth": "([^"]+)"', response.text)
            if found:
                return found

        frame = re.search('iframe src="(//csp.screen9.com[^"]+)"', self.get_urldata())
        if not frame:
            return None

        # The iframe source is protocol-relative, so prefix a scheme.
        url = f"http:{frame.group(1)}"
        response = self.http.request("get", url)
        self.backupapi = url
        found = re.search(r"picsearch_ajax_auth = '([^']+)'", response.text)
        if found:
            return found
        return re.search(r"screen9_ajax_auth = '([^']+)'", response.text)

    def get_mediaid(self):
        """Return the media id as a regex match, or the URL fragment string.

        The page markup is tried first, then the REST script and the Screen9
        iframe referenced by the page. When nothing matches, the fragment of
        ``self.url`` is returned as a plain string (empty when the URL has
        no fragment).
        """
        page_patterns = (
            r"mediaId = '([^']+)';",
            r'media-id="([^"]+)"',
            r'screen9-mid="([^"]+)"',
            r'data-id="([^"]+)"',
            r"data-id=([^ ]+) ",
            r'data-videoid="([^"]+)"',
        )
        for pattern in page_patterns:
            found = re.search(pattern, self.get_urldata())
            if found:
                return found

        script = re.search('s.src="(https://csp-ssl.picsearch.com[^"]+|http://csp.picsearch.com/rest[^"]+)', self.get_urldata())
        if script:
            response = self.http.request("get", script.group(1))
            found = re.search(r'mediaid": "([^"]+)"', response.text)
            if found:
                return found

        frame = re.search('iframe src="(//csp.screen9.com[^"]+)"', self.get_urldata())
        if frame:
            # The iframe source is protocol-relative, so prefix a scheme.
            url = f"http:{frame.group(1)}"
            response = self.http.request("get", url)
            found = re.search(r"mediaid: '([^']+)'", response.text)
            if found:
                return found

        # Last resort: treat the URL fragment as the media id.
        return urlparse(self.url).fragment