svtplay-dl/lib/svtplay_dl/service/dr.py

# ex:ts=4:sw=4:sts=4:et
# -*- tab-width: 4; c-basic-offset: 4; indent-tabs-mode: nil -*-
from __future__ import absolute_import
import base64
import re
import json
import copy
import binascii
import hashlib
from urllib.parse import urljoin, urlparse

from cryptography.hazmat.primitives.ciphers import Cipher, algorithms, modes
from cryptography.hazmat.backends import default_backend

from svtplay_dl.service import Service, OpenGraphThumbMixin
from svtplay_dl.fetcher.hls import hlsparse
from svtplay_dl.fetcher.hds import hdsparse
from svtplay_dl.subtitle import subtitle
from svtplay_dl.error import ServiceError


class Dr(Service, OpenGraphThumbMixin):
    """Service implementation for videos published on dr.dk."""

    supported_domains = ["dr.dk"]

    def get(self):
        """Yield the streams (and subtitle, if any) found for the current page.

        Two page layouts are handled:

        * a ``resource: "<url>",`` entry, whose JSON is handed straight to
          :meth:`find_stream`;
        * a ``resource="<url>"`` attribute, whose JSON may carry a
          ``SubtitlesList``, a ``Data`` section (handled by
          :meth:`find_stream`) or a flat ``Links`` list of HDS/HLS targets.

        Problems are reported by yielding a ``ServiceError`` instead of
        raising.
        """
        data = self.get_urldata()

        match = re.search(r'resource:[ ]*"([^"]*)",', data)
        if match:
            resource_url = match.group(1)
            resource_data = self.http.request("get", resource_url).content
            resource = json.loads(resource_data)
            yield from self.find_stream(self.config, resource)
            return

        match = re.search(r'resource="([^"]*)"', data)
        if not match:
            yield ServiceError("Cant find resource info for this video")
            return

        resource_url = match.group(1)
        if resource_url[:4] != "http":
            # Anything not starting with "http" gets an explicit "http:" prefix
            # (presumably scheme-relative "//host/..." URLs - verify).
            resource_url = "http:{}".format(resource_url)
        resource_data = self.http.request("get", resource_url).text
        resource = json.loads(resource_data)

        if "Links" not in resource:
            yield ServiceError("Cant access this video. its geoblocked.")
            return
        if "SubtitlesList" in resource and len(resource["SubtitlesList"]) > 0:
            suburl = resource["SubtitlesList"][0]["Uri"]
            yield subtitle(copy.copy(self.config), "wrst", suburl, output=self.output)

        if "Data" in resource:
            yield from self.find_stream(self.config, resource)
            return

        for stream in resource["Links"]:
            uri = stream["Uri"]
            if uri is None:
                # No plain URI is given; fall back to the encrypted one.
                uri = self._decrypt(stream["EncryptedUri"])

            if stream["Target"] == "HDS":
                streams = hdsparse(copy.copy(self.config), self.http.request("get", uri, params={"hdcore": "3.7.0"}), uri, output=self.output)
                # The HDS result is only iterated when it is truthy.
                if streams:
                    yield from streams.values()
            if stream["Target"] == "HLS":
                streams = hlsparse(self.config, self.http.request("get", uri), uri, output=self.output)
                yield from streams.values()

    def find_all_episodes(self, config):
        """Return a list of episode URLs for the show the current page belongs to.

        The "show more" button on the page carries a base64-encoded partial
        URL; it is rewritten to request up to 1000 entries and the resulting
        fragment is scanned for ``program-link`` anchors.  If that yields
        nothing, the ``program-link`` anchors of the page itself are used,
        restricted to those sharing the parent path of ``self.url``.

        When ``config.get("all_last")`` is not ``-1`` the list is cut to that
        many entries; otherwise it is returned in reversed order.
        """
        episodes = []
        buttons = re.findall(r'<button class="show-more" data-url="([^"]+)" data-partial="([^"]+)"', self.get_urldata())
        for encpath, enccomp in buttons:
            newstyle = "_" in encpath
            if newstyle:
                # New style: "<base64 path>_<base64 params>".
                encbasepath = encpath.split("_")[0]
                path = base64.b64decode(encbasepath + "===").decode("latin1")
            else:
                path = base64.b64decode(encpath + "===").decode("latin1")

            if "/view/" in path:
                continue

            params = "offset=0&limit=1000"
            if newstyle:
                encparams = base64.b64encode(params.encode("latin1")).decode("latin1").rstrip("=")
                encpath = "{}_{}".format(encbasepath, encparams)
            else:
                path = "{}?{}".format(urlparse(path).path, params)
                encpath = base64.b64encode(path.encode("latin1")).decode("latin1").rstrip("=")

            url = urljoin("https://www.dr.dk/tv/partial/", "{}/{}".format(enccomp, encpath))
            data = self.http.request("get", url).content.decode("latin1")

            links = re.findall(r'"program-link" href="([^"]+)">', data)
            episodes = [urljoin("https://www.dr.dk/", link) for link in links]
            # Only the first usable button is consulted.
            break

        if not episodes:
            prefix = "/".join(urlparse(self.url).path.rstrip("/").split("/")[:-1])
            links = re.findall(r'"program-link" href="([^"]+)">', self.get_urldata())
            episodes = [urljoin("https://www.dr.dk/", link) for link in links if link.startswith(prefix)]

        if config.get("all_last") != -1:
            episodes = episodes[: config.get("all_last")]
        else:
            episodes.reverse()

        return episodes

    def find_stream(self, config, resource):
        """Yield HLS streams for the video asset described by ``resource``.

        The first entry of ``resource["Data"]`` is inspected; its ``Assets``
        list also contains non-video entries (images), so the first asset of
        kind ``VideoResource`` is picked and each of its ``Ios``/``HLS``
        links is parsed with ``hlsparse``.  Nothing is yielded when no
        ``VideoResource`` asset exists.
        """
        # Default to no links so a resource without a VideoResource asset
        # produces no streams instead of raising UnboundLocalError.
        links = []
        for asset in resource["Data"][0]["Assets"]:
            if asset["Kind"] == "VideoResource":
                links = asset["Links"]
                break

        for link in links:
            if link["Target"] in ("Ios", "HLS"):
                streams = hlsparse(config, self.http.request("get", link["Uri"]), link["Uri"], output=self.output)
                yield from streams.values()

    def _decrypt(self, url):
        """Decrypt an ``EncryptedUri`` value and return the plain URL string.

        Layout of ``url`` as read by this method:

        * characters 2-9: length ``n`` of the ciphertext, as a hex number;
        * the next ``n`` characters: hex-encoded ciphertext;
        * the remainder: hex-encoded IV.

        The AES key is the SHA-256 digest of ``"<iv hex>:<fixed secret>"`` and
        the cipher runs in CBC mode.  The final byte of the plaintext gives
        the number of trailing bytes to strip (looks like PKCS#7 padding).
        """
        n = int(url[2:10], 16)
        ciphertext_hex = url[10 : 10 + n]
        iv_hex = url[10 + n :]

        data = binascii.a2b_hex(ciphertext_hex.encode("ascii"))
        key = hashlib.sha256(("%s:sRBzYNXBzkKgnjj8pGtkACch" % iv_hex).encode("utf-8")).digest()
        iv = bytes.fromhex(iv_hex)

        cipher = Cipher(algorithms.AES(key), modes.CBC(iv), backend=default_backend())
        decryptor = cipher.decryptor()
        # finalize() closes the context and rejects ciphertext that is not a
        # whole number of blocks instead of silently dropping the tail.
        decrypted = decryptor.update(data) + decryptor.finalize()
        return decrypted[: -decrypted[-1]].decode("utf-8")
Add editor modelines 2013-03-02 21:26:28 +01:00			`# ex:ts=4:sw=4:sts=4:et`
			`# -*- tab-width: 4; c-basic-offset: 4; indent-tabs-mode: nil -*-`
Use absolute_import from __future__ everywhere 2013-03-01 23:39:42 +01:00			`from __future__ import absolute_import`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00			`import base64`
Add minimal set of imports for services to work 2013-02-12 19:43:37 +01:00			`import re`
			`import json`
service: copy options to fetcher 2014-06-07 20:43:40 +02:00			`import copy`
dr: they have started to use encrypted url’s Fixes: #1056 Fixes: #1047 2019-03-24 21:06:23 +01:00			`import binascii`
			`import hashlib`
No need for utils.urllib anymore 2018-01-30 22:07:21 +01:00			`from urllib.parse import urljoin, urlparse`
Add minimal set of imports for services to work 2013-02-12 19:43:37 +01:00
dr: they have started to use encrypted url’s Fixes: #1056 Fixes: #1047 2019-03-24 21:06:23 +01:00			`from cryptography.hazmat.primitives.ciphers import Cipher, algorithms, modes`
			`from cryptography.hazmat.backends import default_backend`

dr: support for thumbnail 2014-01-26 01:51:53 +01:00			`from svtplay_dl.service import Service, OpenGraphThumbMixin`
reorder arguments for hlsparse and hdsparse 2015-10-04 14:37:16 +02:00			`from svtplay_dl.fetcher.hls import hlsparse`
dr.dk: support for the new site. 2014-06-02 21:43:22 +02:00			`from svtplay_dl.fetcher.hds import hdsparse`
dr: subtitle support this fixes #214 2015-03-01 21:46:22 +01:00			`from svtplay_dl.subtitle import subtitle`
Show only one error message instead of two 2015-09-06 14:19:10 +02:00			`from svtplay_dl.error import ServiceError`
pip8. expected 2 lines found 1 2015-09-15 20:10:32 +02:00
Flake8 fixes 2018-01-30 20:11:37 +01:00
dr: support for thumbnail 2014-01-26 01:51:53 +01:00			`class Dr(Service, OpenGraphThumbMixin):`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`supported_domains = ["dr.dk"]`
Initial work on splitting script to modules Does not work reliably (downloading SVTPlay videos with HDS may work if you're lucky). 2013-01-17 00:21:47 +01:00
Move options to when we init the service class 2015-12-26 11:46:14 +01:00			`def get(self):`
adding request support. still need some more work 2015-08-30 00:06:20 +02:00			`data = self.get_urldata()`
Support for exclude filenames with WORD in them. this fixes #190 2014-12-22 17:41:40 +01:00
Initial work on splitting script to modules Does not work reliably (downloading SVTPlay videos with HDS may work if you're lucky). 2013-01-17 00:21:47 +01:00			`match = re.search(r'resource:[ ]*"([^"]*)",', data)`
dr.dk: News still use the old thing 2013-09-14 22:39:37 +02:00			`if match:`
			`resource_url = match.group(1)`
replace self.http.get with our own function with debug info 2015-08-31 19:45:15 +02:00			`resource_data = self.http.request("get", resource_url).content`
dr.dk: News still use the old thing 2013-09-14 22:39:37 +02:00			`resource = json.loads(resource_data)`
Some more options to config 2018-05-22 00:02:20 +02:00			`streams = self.find_stream(self.config, resource)`
pre-commit: pyupgrade 2019-08-25 00:33:51 +02:00			`yield from streams`
dr.dk: Support for more qualities 2013-09-14 21:58:55 +02:00			`else:`
dr.dk: News still use the old thing 2013-09-14 22:39:37 +02:00			`match = re.search(r'resource="([^"]*)"', data)`
			`if not match:`
Show only one error message instead of two 2015-09-06 14:19:10 +02:00			`yield ServiceError("Cant find resource info for this video")`
service: replace sys.exit with return 2014-10-06 23:21:43 +02:00			`return`
dr.dk: fix url parsing for some urls fixes #277 2015-10-08 09:52:36 +02:00			`if match.group(1)[:4] != "http":`
pre-commit: pyupgrade 2019-08-25 00:33:51 +02:00			`resource_url = "http:{}".format(match.group(1))`
dr.dk: fix url parsing for some urls fixes #277 2015-10-08 09:52:36 +02:00			`else:`
			`resource_url = match.group(1)`
dr: use text for json and send the url to the playlist 2015-09-01 00:37:06 +02:00			`resource_data = self.http.request("get", resource_url).text`
dr.dk: News still use the old thing 2013-09-14 22:39:37 +02:00			`resource = json.loads(resource_data)`
dr.dk: Support for more qualities 2013-09-14 21:58:55 +02:00
dr.dk: geoblock check 2015-10-08 09:54:07 +02:00			`if "Links" not in resource:`
			`yield ServiceError("Cant access this video. its geoblocked.")`
			`return`
dr: dont crash when there is no subtitles. 2015-11-15 15:21:42 +01:00			`if "SubtitlesList" in resource and len(resource["SubtitlesList"]) > 0:`
dr: subtitle support this fixes #214 2015-03-01 21:46:22 +01:00			`suburl = resource["SubtitlesList"][0]["Uri"]`
dr: missing output 2018-06-03 01:18:15 +02:00			`yield subtitle(copy.copy(self.config), "wrst", suburl, output=self.output)`
dr.dk: fixed a crash when looking on news videos 2014-08-11 19:46:56 +02:00			`if "Data" in resource:`
Options to config 2018-05-13 13:06:45 +02:00			`streams = self.find_stream(self.config, resource)`
pre-commit: pyupgrade 2019-08-25 00:33:51 +02:00			`yield from streams`
dr.dk: fixed a crash when looking on news videos 2014-08-11 19:46:56 +02:00			`else:`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`for stream in resource["Links"]:`
dr: they have started to use encrypted url’s Fixes: #1056 Fixes: #1047 2019-03-24 21:06:23 +01:00			`uri = stream["Uri"]`
			`if uri is None:`
			`uri = self._decrypt(stream["EncryptedUri"])`

dr.dk: fixed a crash when looking on news videos 2014-08-11 19:46:56 +02:00			`if stream["Target"] == "HDS":`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`streams = hdsparse(copy.copy(self.config), self.http.request("get", uri, params={"hdcore": "3.7.0"}), uri, output=self.output)`
HDS: show an error message when we see DRM files. 2014-10-12 23:31:02 +02:00			`if streams:`
			`for n in list(streams.keys()):`
			`yield streams[n]`
dr.dk: fixed a crash when looking on news videos 2014-08-11 19:46:56 +02:00			`if stream["Target"] == "HLS":`
dr: they have started to use encrypted url’s Fixes: #1056 Fixes: #1047 2019-03-24 21:06:23 +01:00			`streams = hlsparse(self.config, self.http.request("get", uri), uri, output=self.output)`
dr.dk: fixed a crash when looking on news videos 2014-08-11 19:46:56 +02:00			`for n in list(streams.keys()):`
reorder arguments for hlsparse and hdsparse 2015-10-04 14:37:16 +02:00			`yield streams[n]`
dr.dk: fixed a crash when looking on news videos 2014-08-11 19:46:56 +02:00
Some more options to config 2018-05-22 00:02:20 +02:00			`def find_all_episodes(self, config):`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00			`episodes = []`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`matches = re.findall(r'<button class="show-more" data-url="([^"]+)" data-partial="([^"]+)"', self.get_urldata())`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00			`for encpath, enccomp in matches:`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`newstyle = "_" in encpath`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00			`if newstyle:`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`encbasepath = encpath.split("_")[0]`
			`path = base64.b64decode(encbasepath + "===").decode("latin1")`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00			`else:`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`path = base64.b64decode(encpath + "===").decode("latin1")`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`if "/view/" in path:`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00			`continue`

pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`params = "offset=0&limit=1000"`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00			`if newstyle:`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`encparams = base64.b64encode(params.encode("latin1")).decode("latin1").rstrip("=")`
pre-commit: pyupgrade 2019-08-25 00:33:51 +02:00			`encpath = "{}_{}".format(encbasepath, encparams)`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00			`else:`
pre-commit: pyupgrade 2019-08-25 00:33:51 +02:00			`path = "{}?{}".format(urlparse(path).path, params)`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`encpath = base64.b64encode(path.encode("latin1")).decode("latin1").rstrip("=")`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00
pre-commit: pyupgrade 2019-08-25 00:33:51 +02:00			`url = urljoin("https://www.dr.dk/tv/partial/", "{}/{}".format(enccomp, encpath))`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`data = self.http.request("get", url).content.decode("latin1")`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00
			`matches = re.findall(r'"program-link" href="([^"]+)">', data)`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`episodes = [urljoin("https://www.dr.dk/", url) for url in matches]`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00			`break`

			`if not episodes:`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`prefix = "/".join(urlparse(self.url).path.rstrip("/").split("/")[:-1])`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00			`matches = re.findall(r'"program-link" href="([^"]+)">', self.get_urldata())`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`episodes = [urljoin("https://www.dr.dk/", url) for url in matches if url.startswith(prefix)]`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00
Some more options to config 2018-05-22 00:02:20 +02:00			`if config.get("all_last") != -1:`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`episodes = episodes[: config.get("all_last")]`
dr: support --all-episodes 2016-06-29 23:58:37 +02:00			`else:`
			`episodes.reverse()`

			`return episodes`

Options to config 2018-05-13 13:06:45 +02:00			`def find_stream(self, config, resource):`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`tempresource = resource["Data"][0]["Assets"]`
dr: use text for json and send the url to the playlist 2015-09-01 00:37:06 +02:00			`# To find the VideoResource, they have Images as well`
			`for resources in tempresource:`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`if resources["Kind"] == "VideoResource":`
			`links = resources["Links"]`
dr: use text for json and send the url to the playlist 2015-09-01 00:37:06 +02:00			`break`
			`for i in links:`
			`if i["Target"] == "Ios" or i["Target"] == "HLS":`
services: add output variable to fetchers 2018-05-21 00:56:22 +02:00			`streams = hlsparse(config, self.http.request("get", i["Uri"]), i["Uri"], output=self.output)`
dr: use text for json and send the url to the playlist 2015-09-01 00:37:06 +02:00			`for n in list(streams.keys()):`
reorder arguments for hlsparse and hdsparse 2015-10-04 14:37:16 +02:00			`yield streams[n]`
dr: they have started to use encrypted url’s Fixes: #1056 Fixes: #1047 2019-03-24 21:06:23 +01:00
			`def _decrypt(self, url):`
			`n = int(url[2:10], 16)`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`iv_hex = url[10 + n :]`
			`data = binascii.a2b_hex(url[10 : 10 + n].encode("ascii"))`
			`key = hashlib.sha256(("%s:sRBzYNXBzkKgnjj8pGtkACch" % iv_hex).encode("utf-8")).digest()`
dr: they have started to use encrypted url’s Fixes: #1056 Fixes: #1047 2019-03-24 21:06:23 +01:00			`iv = bytes.fromhex(iv_hex)`

			`backend = default_backend()`
			`cipher = Cipher(algorithms.AES(key), modes.CBC(iv), backend=backend)`
			`decryptor = cipher.decryptor()`
			`decrypted = decryptor.update(data)`
pre-commit: black fixes 2019-08-25 00:27:31 +02:00			`return decrypted[: -decrypted[-1]].decode("utf-8")`