youtube-dl/youtube_dl/extractor/npo.py

# coding: utf-8
from __future__ import unicode_literals

import json
import re

from .common import InfoExtractor
from ..utils import ExtractorError


class NPOIE(InfoExtractor):
    """Extractor for series episodes on npo.nl/start.

    The other extractors in this file subclass it to reuse
    ``_get_token`` and ``_extract_formats_by_product_id``: they only have to
    find a product id for their own site.
    """
    IE_NAME = 'npo'
    IE_DESC = 'npo.nl'
    _VALID_URL = r'https?://(?:www\.)?npo\.nl/start/serie/'

    _TESTS = [{
        'url': 'https://npo.nl/start/serie/zembla/seizoen-2015/wie-is-de-mol-2/',
        'md5': 'f9ce9c43cc8bc3b8138df1562b99c379',
        'info_dict': {
            'description': 'Wie is de mol? (2)',
            'duration': 2439,
            'ext': 'm4v',
            'id': 'wie-is-de-mol-2',
            'thumbnail': 'https://assets-start.npo.nl/resources/2023/07/01/e723c3cf-3e42-418a-9ba5-f6dbb64b516a.jpg',
            'title': 'Wie is de mol? (2)'
        }
    }, {
        'url': 'https://npo.nl/start/serie/vpro-tegenlicht/seizoen-11/zwart-geld-de-toekomst-komt-uit-afrika',
        'md5': 'c84d054219c4888ed53b4ee3d01b2d93',
        'info_dict': {
            'id': 'zwart-geld-de-toekomst-komt-uit-afrika',
            'title': 'Zwart geld: de toekomst komt uit Afrika',
            'ext': 'mp4',
            'description': 'Zwart geld: de toekomst komt uit Afrika',
            'thumbnail': 'https://assets-start.npo.nl/resources/2023/06/30/d9879593-1944-4249-990c-1561dac14d8e.jpg',
            'duration': 3000
        },
    }]

    def _get_token(self, video_id):
        """Fetch the player token for a product id.

        :param video_id: the product id to request a token for
        :returns: the value of the ``token`` field of the response
        :raises ExtractorError: when the response carries no token
        """
        # Pass the id via ``query`` (as the program-detail request does) so
        # that it gets URL-encoded instead of being pasted into the URL.
        token_response = self._download_json(
            'https://npo.nl/start/api/domain/player-token',
            video_id,
            note='Downloading token',
            query={'productId': video_id})
        token = token_response.get('token') if isinstance(token_response, dict) else None
        if not token:
            raise ExtractorError('No player token received for product id: %s' % video_id)
        return token

    def _real_extract(self, url):
        """Resolve an episode URL to an info dict.

        The last path segment (ignoring an optional ``/afspelen`` suffix) is
        used as slug for the program-detail lookup and as the video id.

        :raises ExtractorError: when the metadata holds no ``productId``
        """
        # str.removesuffix would be the natural tool here, but it was only
        # introduced in Python 3.9 and youtube-dl supports much older versions.
        url = re.sub(r'/afspelen/?\Z', '', url).rstrip('/')
        slug = url.rpartition('/')[2]

        program_metadata = self._download_json(
            'https://npo.nl/start/api/domain/program-detail',
            slug, query={'slug': slug})

        product_id = program_metadata.get('productId')
        if not product_id:
            raise ExtractorError('No productId found for slug: %s' % slug)

        # ``images`` and ``description`` may be absent or null: treat both
        # cases as "no data" rather than crashing on None.
        thumbnail = None
        for image in program_metadata.get('images') or []:
            if isinstance(image, dict) and image.get('url'):
                thumbnail = image['url']
                break

        title = program_metadata.get('title')
        descriptions = program_metadata.get('description') or {}
        description = (
            descriptions.get('long')
            or descriptions.get('short')
            or descriptions.get('brief'))

        formats = self._extract_formats_by_product_id(product_id, slug, url)

        return {
            'id': slug,
            'formats': formats,
            'title': title or slug,
            'description': description or title or slug,
            'thumbnail': thumbnail,
            'duration': program_metadata.get('durationInSeconds'),
        }

    def _extract_formats_by_product_id(self, product_id, slug, url=None):
        """Collect the DASH formats for a product id.

        :param product_id: product id to request a token and stream link for
        :param slug: identifier used as video id in the download messages
        :param url: page URL sent as ``referrerUrl`` (empty string if omitted)
        :returns: a (possibly empty) list of format dicts
        :raises ExtractorError: when ``product_id`` is empty or no token
            could be obtained
        """
        if not product_id:
            raise ExtractorError('No product id found for: %s' % slug)

        token = self._get_token(product_id)
        formats = []
        for profile in (
                'dash',
                # 'hls' is available too, but implementing it doesn't add much
                # As far as I know 'dash' is always available
        ):
            stream_link = self._download_json(
                'https://prod.npoplayer.nl/stream-link', video_id=slug,
                data=json.dumps({
                    'profileName': profile,
                    'referrerUrl': url or '',
                }).encode('utf8'),
                headers={
                    'Authorization': token,
                    'Content-Type': 'application/json',
                },
                fatal=False,
            )
            # With fatal=False a failed download does not yield a dict, so
            # skip this profile instead of calling .get() on the failure value.
            if not isinstance(stream_link, dict):
                continue
            stream_url = (stream_link.get('stream') or {}).get('streamURL')
            if not stream_url:
                continue
            formats.extend(self._extract_mpd_formats(stream_url, slug, mpd_id='dash', fatal=False))
        return formats


class BNNVaraIE(NPOIE):
    """Extractor for bnnvara.nl video pages.

    Looks up the POMS product id through the BNNVARA GraphQL endpoint and
    hands it to the shared NPO format extraction.
    """
    IE_NAME = 'bnnvara'
    IE_DESC = 'bnnvara.nl'
    # Require at least one digit: ``[0-9]*`` also matched a URL without an id.
    _VALID_URL = r'https?://(?:www\.)?bnnvara\.nl/videos/(?P<id>[0-9]+)'
    _TESTS = [{
        'url': 'https://www.bnnvara.nl/videos/27455',
        'md5': '392dd367877739e49b9e0a9a550b178a',
        'info_dict': {
            'id': 'VARA_101369808',
            'thumbnail': 'https://media.vara.nl/files/thumbnails/321291_custom_zembla__wie_is_de_mol_680x383.jpg',
            'title': 'Zembla - Wie is de mol?',
            'ext': 'mp4',
        }
    }]

    def _real_extract(self, url):
        """Resolve a bnnvara.nl video URL to an info dict.

        :raises ExtractorError: when the API reports an error or returns no
            ``pomsProductId``
        """
        video_id = self._match_id(url)

        media = self._download_json('https://api.bnnvara.nl/bff/graphql',
                                    video_id,
                                    data=json.dumps(
                                        {
                                            'operationName': 'getMedia',
                                            'variables': {
                                                'id': video_id,
                                                'hasAdConsent': False,
                                                'atInternetId': 70
                                            },
                                            'query': 'query getMedia($id: ID!, $mediaUrl: String, $hasAdConsent: Boolean!, $atInternetId: Int) {\n  player(\n    id: $id\n    mediaUrl: $mediaUrl\n    hasAdConsent: $hasAdConsent\n    atInternetId: $atInternetId\n  ) {\n    ... on PlayerSucces {\n      brand {\n        name\n        slug\n        broadcastsEnabled\n        __typename\n      }\n      title\n      programTitle\n      pomsProductId\n      broadcasters {\n        name\n        __typename\n      }\n      duration\n      classifications {\n        title\n        imageUrl\n        type\n        __typename\n      }\n      image {\n        title\n        url\n        __typename\n      }\n      cta {\n        title\n        url\n        __typename\n      }\n      genres {\n        name\n        __typename\n      }\n      subtitles {\n        url\n        language\n        __typename\n      }\n      sources {\n        name\n        url\n        ratio\n        __typename\n      }\n      type\n      token\n      __typename\n    }\n    ... on PlayerError {\n      error\n      __typename\n    }\n    __typename\n  }\n}'
                                        }).encode('utf8'),
                                    headers={
                                        'Content-Type': 'application/json',
                                    })

        # Any level may be null in the response, so fall back to an empty
        # dict at each step instead of chaining .get() on None.
        player = (media.get('data') or {}).get('player') or {}
        product_id = player.get('pomsProductId')

        if not product_id:
            # The query asks for the PlayerError variant as well; report its
            # message when that is what came back.
            error = player.get('error')
            if error:
                raise ExtractorError('BNNVARA player returned an error: %s' % error)
            raise ExtractorError('No pomsProductId found for video: %s' % video_id)

        formats = self._extract_formats_by_product_id(product_id, video_id)

        return {
            'id': product_id,
            'title': player.get('title'),
            'formats': formats,
            'thumbnail': (player.get('image') or {}).get('url'),
        }


class ONIE(NPOIE):
    """Extractor for ongehoordnederland.tv pages.

    Scrapes the product ids from ``page: '...'`` occurrences in the page
    source and collects the formats of every id found.
    """
    IE_NAME = 'on'
    IE_DESC = 'ongehoordnederland.tv'
    # The dot before ``tv`` is escaped so it only matches a literal dot.
    _VALID_URL = r'https?://(?:www\.)?ongehoordnederland\.tv/.*'
    _TESTS = [{
        'url': 'https://ongehoordnederland.tv/2024/03/01/korte-clips/heeft-preppen-zin-betwijfel-dat-je-daar-echt-iets-aan-zult-hebben-bij-oorlog-lydia-daniel/',
        'md5': 'a85ebd50fa86fe5cbce654655f7dbb12',
        'info_dict': {

        }
    }]

    def _real_extract(self, url):
        """Resolve a page URL to an info dict; the last path segment is the id.

        :raises ExtractorError: when no formats could be extracted
        """
        video_id = url.rstrip('/').split('/')[-1]
        page = self._download_webpage(url, video_id)

        # ``[^']+`` stops at the closing quote; a greedy ``.+`` would run on
        # to the last quote of the line and capture more than the id.
        product_ids = []
        for product_id in re.findall(r"page: '([^']+)'", page):
            # Keep the first occurrence only, so a repeated id does not
            # produce duplicate formats.
            if product_id not in product_ids:
                product_ids.append(product_id)

        formats = []
        for product_id in product_ids:
            formats.extend(self._extract_formats_by_product_id(product_id, video_id))

        if not formats:
            raise ExtractorError('Could not find a POMS product id in the provided URL, '
                                 'perhaps because all stream URLs are DRM protected.')

        return {
            'id': video_id,
            'title': video_id,
            'formats': formats,
        }


class ZAPPIE(NPOIE):
    """Extractor for zapp.nl pages.

    The last path segment of the URL is used directly as the product id.
    """
    IE_NAME = 'zapp'
    IE_DESC = 'zapp.nl'
    # The dot is escaped so it only matches a literal dot.
    _VALID_URL = r'https?://(?:www\.)?zapp\.nl/.*'

    _TESTS = [{
        'url': 'https://www.zapp.nl/programmas/zappsport/gemist/POMS_AT_811523',
        'md5': '9eb2d8b6f88b72b6b986ea2c26a81588',
        'info_dict': {
            'id': 'POMS_AT_811523',
            'title': 'POMS_AT_811523',
        },
    }]

    def _real_extract(self, url):
        """Resolve a zapp.nl URL to an info dict.

        :raises ExtractorError: when no formats could be extracted
        """
        video_id = url.rstrip('/').split('/')[-1]

        formats = self._extract_formats_by_product_id(video_id, video_id, url=url)

        # Report an empty result the same way the sibling extractors do.
        if not formats:
            raise ExtractorError('Could not find a POMS product id in the provided URL, '
                                 'perhaps because all stream URLs are DRM protected.')

        return {
            'id': video_id,
            'title': video_id,
            'formats': formats,
        }


class SchoolTVIE(NPOIE):
    """Extractor for schooltv.nl item pages.

    Reads the item metadata from the site's ``_next/data`` JSON and uses its
    ``poms_mid`` field as the product id.
    """
    IE_NAME = 'schooltv'
    IE_DESC = 'schooltv.nl'
    # The dot is escaped so it only matches a literal dot.
    _VALID_URL = r'https?://(?:www\.)?schooltv\.nl/item/.*'

    _TESTS = [{
        'url': 'https://schooltv.nl/item/zapp-music-challenge-2015-zapp-music-challenge-2015',
        'md5': 'e9ef151c4886994e2bea23593348cb14',
        'info_dict': {
            'id': 'zapp-music-challenge-2015-zapp-music-challenge-2015',
            'title': 'Zapp Music Challenge 2015 - Alain Clark & Yaell',
            'description': "Een nummer schrijven met de super bekende soulzanger en producer Alain Clark? Dat is de uitdaging voor de dertienjarige Yaell uit Delft. En als het dan echt goed is, mag hij het ook nog eens live gaan spelen op de speelplaats bij Giel Beelen! Muziek is heel erg belangrijk in het leven van Yaell. 'Als er geen muziek zou zijn, dan zou ik heel veel niet kunnen.' Hij is dan ook altijd aan het schrijven, vaak over zijn eigen leven. Maar soms is het best lastig om die teksten te verzinnen. Vindt hij de inspiratie om een hit te maken met Alain?"
        },
    }]

    def _real_extract(self, url):
        """Resolve a schooltv.nl item URL to an info dict.

        :raises ExtractorError: when the metadata has no ``poms_mid`` or no
            formats could be extracted
        """
        video_id = url.rstrip('/').split('/')[-1]

        # TODO Find out how we could obtain this automatically
        #      Otherwise this extractor might break each time SchoolTV deploys a new release
        build_id = 'b7eHUzAVO7wHXCopYxQhV'

        metadata_url = 'https://schooltv.nl/_next/data/%s/item/%s.json' % (build_id, video_id)

        # ``pageProps`` / ``data`` may be missing or null; use an empty dict
        # in that case so the lookups below do not fail on None.
        page_data = self._download_json(metadata_url, video_id)
        metadata = (page_data.get('pageProps') or {}).get('data') or {}

        product_id = metadata.get('poms_mid')
        if not product_id:
            raise ExtractorError('No poms_mid found for item: %s' % video_id)

        formats = self._extract_formats_by_product_id(product_id, video_id)

        if not formats:
            raise ExtractorError('Could not find a POMS product id in the provided URL, '
                                 'perhaps because all stream URLs are DRM protected.')

        # Join only the parts that are present: this avoids a dangling ' - '
        # and a TypeError when either value is null.
        title_parts = [
            part for part in (metadata.get('title'), metadata.get('subtitle'))
            if part]

        return {
            'id': video_id,
            'title': ' - '.join(title_parts) or video_id,
            'description': metadata.get('description') or metadata.get('short_description'),
            'formats': formats,
        }


class NTRSubsiteIE(NPOIE):
    """Shared extraction logic for sites that embed a ``data-mid`` attribute.

    It defines no ``_VALID_URL`` of its own; subclasses supply the
    site-specific attributes.
    """

    def _real_extract(self, url):
        """Resolve a page URL to an info dict using its first ``data-mid``.

        :raises ExtractorError: when no formats could be extracted
        """
        video_id = url.rstrip('/').split('/')[-1]

        page = self._download_webpage(url, video_id)

        # ``[^"]+`` keeps the match inside one attribute value; a greedy
        # ``.+`` could run on to a later quote on the same line.
        product_ids = re.findall(r'data-mid="([^"]+_[^"]+)"', page)

        # Only the first product id on the page is used.
        formats = []
        if product_ids:
            formats = self._extract_formats_by_product_id(product_ids[0], video_id)

        if not formats:
            raise ExtractorError('Could not find a POMS product id in the provided URL, '
                                 'perhaps because all stream URLs are DRM protected.')

        return {
            'id': video_id,
            'title': video_id,
            'formats': formats,
        }


class HetKlokhuisIE(NTRSubsiteIE):
    """hetklokhuis.nl extractor; the extraction itself is inherited."""
    _VALID_URL = r'https?://(?:www\.)?hetklokhuis\.nl/.*'
    IE_DESC = 'hetklokhuis.nl'
    IE_NAME = 'hetklokhuis'

    # Id and title are both the last path segment of the URL.
    _TESTS = [
        {
            'url': 'https://hetklokhuis.nl/dossier/142/zoek-het-uit/tv-uitzending/2987/aliens',
            'info_dict': {
                'title': 'aliens',
                'id': 'aliens',
            },
            'md5': '4664b54ed4e05183b1e4f2f4290d551e',
        },
    ]


class VPROIE(NPOIE):
    """Extractor for vpro.nl pages.

    Scrapes the product id from the first ``data-media-id`` attribute in the
    page source.
    """
    IE_NAME = 'vpro'
    IE_DESC = 'vpro.nl'
    # The dot is escaped so it only matches a literal dot.
    _VALID_URL = r'https?://(?:www\.)?vpro\.nl/.*'
    _TESTS = [{
        'url': 'https://www.vpro.nl/programmas/tegenlicht/kijk/afleveringen/2015-2016/offline-als-luxe.html',
        'md5': 'cf302e066b5313cfaf8d5adf50d64f13',
        'info_dict': {
            'id': 'offline-als-luxe.html',
            'title': 'offline-als-luxe.html',
            'ext': 'm4v',
        },
    }]

    def _real_extract(self, url):
        """Resolve a vpro.nl URL to an info dict; the last path segment is the id.

        :raises ExtractorError: when no formats could be extracted
        """
        video_id = url.rstrip('/').split('/')[-1]
        page = self._download_webpage(url, video_id)
        media_ids = re.findall(r'data-media-id="([a-zA-Z0-9_]+)"\s', page)

        # TODO find a better solution, VPRO pages can have multiple videos embedded
        # For now only the first media id on the page is used.
        formats = []
        if media_ids:
            formats = self._extract_formats_by_product_id(media_ids[0], video_id)

        if not formats:
            raise ExtractorError('Could not find a POMS product id in the provided URL, '
                                 'perhaps because all stream URLs are DRM protected.')

        return {
            'id': video_id,
            'title': video_id,
            'formats': formats,
        }


class AndereTijdenIE(NTRSubsiteIE):
    """anderetijden.nl extractor; the extraction itself is inherited."""
    _VALID_URL = r'https?://(?:www\.)?anderetijden\.nl/.*'
    IE_DESC = 'anderetijden.nl'
    IE_NAME = 'anderetijden'

    # Id and title are both the last path segment of the URL.
    _TESTS = [
        {
            'url': 'https://anderetijden.nl/programma/1/Andere-Tijden/aflevering/676/Duitse-soldaten-over-de-Slag-bij-Arnhem',
            'info_dict': {
                'title': 'Duitse-soldaten-over-de-Slag-bij-Arnhem',
                'id': 'Duitse-soldaten-over-de-Slag-bij-Arnhem',
            },
            'md5': '3d607b16e00b459156b4ab6e163dccd7',
        },
    ]
Encoding suggestion from PR 3 months ago			`# coding: utf-8`
[npo] Add extractor (closes #3145) 10 years ago			`from __future__ import unicode_literals`

Convert the description into code 3 months ago			`import json`
Add Ongehoord Nederland and test URL for BNNVARA 3 months ago			`import re`
[npo] Add support for omroepwnl fragments 9 years ago
[npo:radio] Move to extractor to common npo place and add extractor for fragments 9 years ago			`from .common import InfoExtractor`
First version of a VPRO regex 3 months ago			`from ..utils import ExtractorError`
[npo] Add extractor (closes #3145) 10 years ago

Delete all broken extractors Re-implementing these is quicker for the cases where that's even still possible 3 months ago			`class NPOIE(InfoExtractor):`
[npo] Extend _VALID_URL to support ntr.nl (Closes #6248) 9 years ago			`IE_NAME = 'npo'`
Delete all broken extractors Re-implementing these is quicker for the cases where that's even still possible 3 months ago			`IE_DESC = 'npo.nl'`
Make regex more specific and remove redundant .* 3 months ago			`_VALID_URL = r'https?://(?:www\.)?npo\.nl/start/serie/'`
[npo] Add extractor (closes #3145) 10 years ago
[npo] Improve extraction and update tests 7 years ago			`_TESTS = [{`
Add notes on new npo.nl site 3 months ago			`'url': 'https://npo.nl/start/serie/zembla/seizoen-2015/wie-is-de-mol-2/',`
Update unit tests 3 months ago			`'md5': 'f9ce9c43cc8bc3b8138df1562b99c379',`
			`'info_dict': {`
			`'description': 'Wie is de mol? (2)',`
			`'duration': 2439,`
Resolve some of the pull request feedback 3 months ago			`'ext': 'm4v',`
Update unit tests 3 months ago			`'id': 'wie-is-de-mol-2',`
			`'thumbnail': 'https://assets-start.npo.nl/resources/2023/07/01/e723c3cf-3e42-418a-9ba5-f6dbb64b516a.jpg',`
			`'title': 'Wie is de mol? (2)'`
			`}`
[npo] Improve extraction and update tests 7 years ago			`}, {`
Add notes on new npo.nl site 3 months ago			`'url': 'https://npo.nl/start/serie/vpro-tegenlicht/seizoen-11/zwart-geld-de-toekomst-komt-uit-afrika',`
Update unit tests 3 months ago			`'md5': 'c84d054219c4888ed53b4ee3d01b2d93',`
[npo] Improve extraction and update tests 7 years ago			`'info_dict': {`
Update unit tests 3 months ago			`'id': 'zwart-geld-de-toekomst-komt-uit-afrika',`
			`'title': 'Zwart geld: de toekomst komt uit Afrika',`
Resolve some of the pull request feedback 3 months ago			`'ext': 'mp4',`
Update unit tests 3 months ago			`'description': 'Zwart geld: de toekomst komt uit Afrika',`
			`'thumbnail': 'https://assets-start.npo.nl/resources/2023/06/30/d9879593-1944-4249-990c-1561dac14d8e.jpg',`
			`'duration': 3000`
[npo] Add support for streams (Closes #4276) 10 years ago			`},`
[npo] Improve extraction and update tests 7 years ago			`}]`
[npo] Add extractor (closes #3145) 10 years ago
Delete all broken extractors Re-implementing these is quicker for the cases where that's even still possible 3 months ago			`def _get_token(self, video_id):`
			`return self._download_json(`
			`'https://npo.nl/start/api/domain/player-token?productId=%s' % video_id,`
			`video_id,`
			`note='Downloading token')['token']`
[npo] Extend _VALID_URL (closes #16682) 6 years ago
[npo] Add extractor (closes #3145) 10 years ago			`def _real_extract(self, url):`
Convert the description into code 3 months ago			`# You might want to use removesuffix here,`
			`# but removesuffix is introduced in Python 3.9`
			`# and youtube-dl supports Python 3.2+`
			`if url.endswith('/afspelen'):`
			`url = url[:-9]`
			`elif url.endswith('/afspelen/'):`
			`url = url[:-10]`
Comply with coding conventions a bit more 3 months ago			`url = url.rstrip('/')`
Convert the description into code 3 months ago			`slug = url.split('/')[-1]`
Use program-detail endpoint and remove a test 3 months ago
			`program_metadata = self._download_json('https://npo.nl/start/api/domain/program-detail',`
Adhere to code style Co-authored-by: dirkf <fieldhouse@gmx.net> 3 months ago			`slug, query={'slug': slug})`
Use program-detail endpoint and remove a test 3 months ago			`product_id = program_metadata.get('productId')`
			`images = program_metadata.get('images')`
			`thumbnail = None`
			`for image in images:`
			`thumbnail = image.get('url')`
			`break`
			`title = program_metadata.get('title')`
			`descriptions = program_metadata.get('description', {})`
			`description = descriptions.get('long') or descriptions.get('short') or descriptions.get('brief')`
			`duration = program_metadata.get('durationInSeconds')`

Convert the description into code 3 months ago			`if not product_id:`
			`raise ExtractorError('No productId found for slug: %s' % slug)`

Resolve some of the pull request feedback 3 months ago			`formats = self._extract_formats_by_product_id(product_id, slug, url)`
Refactor into reusable method 3 months ago
			`return {`
			`'id': slug,`
			`'formats': formats,`
			`'title': title or slug,`
Use program-detail endpoint and remove a test 3 months ago			`'description': description or title or slug,`
Refactor into reusable method 3 months ago			`'thumbnail': thumbnail,`
Use program-detail endpoint and remove a test 3 months ago			`'duration': duration,`
Refactor into reusable method 3 months ago			`}`
Convert the description into code 3 months ago
Resolve some of the pull request feedback 3 months ago			`def _extract_formats_by_product_id(self, product_id, slug, url=None):`
Refactor into reusable method 3 months ago			`token = self._get_token(product_id)`
Add the possibility to add 'hls' later 3 months ago			`formats = []`
			`for profile in (`
Re-add SchoolTV 3 months ago			`'dash',`
			`# 'hls' is available too, but implementing it doesn't add much`
			`# As far as I know 'dash' is always available`
Add the possibility to add 'hls' later 3 months ago			`):`
			`stream_link = self._download_json(`
			`'https://prod.npoplayer.nl/stream-link', video_id=slug,`
			`data=json.dumps({`
			`'profileName': profile,`
Refactor into reusable method 3 months ago			`'referrerUrl': url or '',`
Add the possibility to add 'hls' later 3 months ago			`}).encode('utf8'),`
			`headers={`
			`'Authorization': token,`
			`'Content-Type': 'application/json',`
Fix zapp extractor 3 months ago			`},`
			`fatal=False,`
Add the possibility to add 'hls' later 3 months ago			`)`
			`stream_url = stream_link.get('stream', {}).get('streamURL')`
			`formats.extend(self._extract_mpd_formats(stream_url, slug, mpd_id='dash', fatal=False))`
Refactor into reusable method 3 months ago			`return formats`


			`class BNNVaraIE(NPOIE):`
			`IE_NAME = 'bnnvara'`
			`IE_DESC = 'bnnvara.nl'`
			`_VALID_URL = r'https?://(?:www\.)?bnnvara\.nl/videos/[0-9]*'`
Add Ongehoord Nederland and test URL for BNNVARA 3 months ago			`_TESTS = [{`
			`'url': 'https://www.bnnvara.nl/videos/27455',`
Update unit tests 3 months ago			`'md5': '392dd367877739e49b9e0a9a550b178a',`
			`'info_dict': {`
			`'id': 'VARA_101369808',`
			`'thumbnail': 'https://media.vara.nl/files/thumbnails/321291_custom_zembla__wie_is_de_mol_680x383.jpg',`
Resolve some of the pull request feedback 3 months ago			`'title': 'Zembla - Wie is de mol?',`
			`'ext': 'mp4',`
Update unit tests 3 months ago			`}`
Add Ongehoord Nederland and test URL for BNNVARA 3 months ago			`}]`
Refactor into reusable method 3 months ago
			`def _real_extract(self, url):`
			`url = url.rstrip('/')`
			`video_id = url.split('/')[-1]`

			`media = self._download_json('https://api.bnnvara.nl/bff/graphql',`
			`video_id,`
			`data=json.dumps(`
			`{`
			`'operationName': 'getMedia',`
			`'variables': {`
			`'id': video_id,`
			`'hasAdConsent': False,`
			`'atInternetId': 70`
			`},`
			'query': 'query getMedia($id: ID!, $mediaUrl: String, $hasAdConsent: Boolean!, $atInternetId: Int) {\n player(\n id: $id\n mediaUrl: $mediaUrl\n hasAdConsent: $hasAdConsent\n atInternetId: $atInternetId\n ) {\n ... on PlayerSucces {\n brand {\n name\n slug\n broadcastsEnabled\n __typename\n }\n title\n programTitle\n pomsProductId\n broadcasters {\n name\n __typename\n }\n duration\n classifications {\n title\n imageUrl\n type\n __typename\n }\n image {\n title\n url\n __typename\n }\n cta {\n title\n url\n __typename\n }\n genres {\n name\n __typename\n }\n subtitles {\n url\n language\n __typename\n }\n sources {\n name\n url\n ratio\n __typename\n }\n type\n token\n __typename\n }\n ... on PlayerError {\n error\n __typename\n }\n __typename\n }\n}'
			`}).encode('utf8'),`
			`headers={`
			`'Content-Type': 'application/json',`
			`})`
			`product_id = media.get('data', {}).get('player', {}).get('pomsProductId')`

Resolve some of the pull request feedback 3 months ago			`formats = self._extract_formats_by_product_id(product_id, video_id)`
[npo] Add extractor (closes #3145) 10 years ago
			`return {`
Refactor into reusable method 3 months ago			`'id': product_id,`
			`'title': media.get('data', {}).get('player', {}).get('title'),`
Add the possibility to add 'hls' later 3 months ago			`'formats': formats,`
Refactor into reusable method 3 months ago			`'thumbnail': media.get('data', {}).get('player', {}).get('image').get('url'),`
[npo] Add extractor (closes #3145) 10 years ago			`}`
Add Ongehoord Nederland and test URL for BNNVARA 3 months ago

			`class ONIE(NPOIE):`
			`IE_NAME = 'on'`
			`IE_DESC = 'ongehoordnederland.tv'`
			`_VALID_URL = r'https?://(?:www\.)?ongehoordnederland.tv/.*'`
			`_TESTS = [{`
			`'url': 'https://ongehoordnederland.tv/2024/03/01/korte-clips/heeft-preppen-zin-betwijfel-dat-je-daar-echt-iets-aan-zult-hebben-bij-oorlog-lydia-daniel/',`
Add an MD5 3 months ago			`'md5': 'a85ebd50fa86fe5cbce654655f7dbb12',`
			`'info_dict': {`

			`}`
Add Ongehoord Nederland and test URL for BNNVARA 3 months ago			`}]`

			`def _real_extract(self, url):`
			`video_id = url.rstrip('/').split('/')[-1]`
			`page, _ = self._download_webpage_handle(url, video_id)`
			`results = re.findall("page: '(.+)'", page)`
			`formats = []`
			`for result in results:`
Resolve some of the pull request feedback 3 months ago			`formats.extend(self._extract_formats_by_product_id(result, video_id))`
Add Ongehoord Nederland and test URL for BNNVARA 3 months ago
			`if not formats:`
Fix flake8 and better error reporting 3 months ago			`raise ExtractorError('Could not find a POMS product id in the provided URL, '`
			`'perhaps because all stream URLs are DRM protected.')`
Add Ongehoord Nederland and test URL for BNNVARA 3 months ago
			`return {`
			`'id': video_id,`
			`'title': video_id,`
			`'formats': formats,`
			`}`
First version of a VPRO regex 3 months ago

Re-add Zapp 3 months ago			`class ZAPPIE(NPOIE):`
			`IE_NAME = 'zapp'`
			`IE_DESC = 'zapp.nl'`
			`_VALID_URL = r'https?://(?:www\.)?zapp.nl/.*'`

			`_TESTS = [{`
Fix zapp extractor 3 months ago			`'url': 'https://www.zapp.nl/programmas/zappsport/gemist/POMS_AT_811523',`
			`'md5': '9eb2d8b6f88b72b6b986ea2c26a81588',`
			`'info_dict': {`
			`'id': 'POMS_AT_811523',`
			`'title': 'POMS_AT_811523',`
			`},`
Re-add Zapp 3 months ago			`}]`

			`def _real_extract(self, url):`
			`video_id = url.rstrip('/').split('/')[-1]`

Resolve some of the pull request feedback 3 months ago			`formats = self._extract_formats_by_product_id(video_id, video_id, url=url)`
Re-add Zapp 3 months ago
			`return {`
			`'id': video_id,`
			`'title': video_id,`
			`'formats': formats,`
			`}`
Re-add SchoolTV 3 months ago

			`class SchoolTVIE(NPOIE):`
			`IE_NAME = 'schooltv'`
			`IE_DESC = 'schooltv.nl'`
			`_VALID_URL = r'https?://(?:www\.)?schooltv.nl/item/.*'`

			`_TESTS = [{`
			`'url': 'https://schooltv.nl/item/zapp-music-challenge-2015-zapp-music-challenge-2015',`
Work work 3 months ago			`'md5': 'e9ef151c4886994e2bea23593348cb14',`
			`'info_dict': {`
			`'id': 'zapp-music-challenge-2015-zapp-music-challenge-2015',`
			`'title': 'Zapp Music Challenge 2015 - Alain Clark & Yaell',`
			'description': "Een nummer schrijven met de super bekende soulzanger en producer Alain Clark? Dat is de uitdaging voor de dertienjarige Yaell uit Delft. En als het dan echt goed is, mag hij het ook nog eens live gaan spelen op de speelplaats bij Giel Beelen! Muziek is heel erg belangrijk in het leven van Yaell. 'Als er geen muziek zou zijn, dan zou ik heel veel niet kunnen.' Hij is dan ook altijd aan het schrijven, vaak over zijn eigen leven. Maar soms is het best lastig om die teksten te verzinnen. Vindt hij de inspiratie om een hit te maken met Alain?"
			`},`
Re-add SchoolTV 3 months ago			`}]`

			`def _real_extract(self, url):`
			`video_id = url.rstrip('/').split('/')[-1]`

Fix flake8 and better error reporting 3 months ago			`# TODO Find out how we could obtain this automatically`
			`# Otherwise this extractor might break each time SchoolTV deploys a new release`
Re-add SchoolTV 3 months ago			`build_id = 'b7eHUzAVO7wHXCopYxQhV'`

			`metadata_url = 'https://schooltv.nl/_next/data/' \`
			`+ build_id \`
			`+ '/item/' \`
			`+ video_id + '.json'`

			`metadata = self._download_json(metadata_url,`
			`video_id).get('pageProps', {}).get('data', {})`

Resolve some of the pull request feedback 3 months ago			`formats = self._extract_formats_by_product_id(metadata.get('poms_mid'), video_id)`
Re-add SchoolTV 3 months ago
			`if not formats:`
Fix flake8 and better error reporting 3 months ago			`raise ExtractorError('Could not find a POMS product id in the provided URL, '`
			`'perhaps because all stream URLs are DRM protected.')`
Re-add SchoolTV 3 months ago
			`return {`
			`'id': video_id,`
			`'title': metadata.get('title', '') + ' - ' + metadata.get('subtitle', ''),`
			`'description': metadata.get('description') or metadata.get('short_description'),`
			`'formats': formats,`
			`}`
Add scaffolding for last few extractors and change order so the PR diff looks nice 3 months ago

Reusable code for two NTR sites 3 months ago			`class NTRSubsiteIE(NPOIE):`
Add scaffolding for last few extractors and change order so the PR diff looks nice 3 months ago			`def _real_extract(self, url):`
Reusable code for two NTR sites 3 months ago			`video_id = url.rstrip('/').split('/')[-1]`

Work work 3 months ago			`page, _ = self._download_webpage_handle(url, video_id)`
Reusable code for two NTR sites 3 months ago			`results = re.findall(r'data-mid="(.+_.+)"', page)`
			`formats = []`
			`for result in results:`
Resolve some of the pull request feedback 3 months ago			`formats.extend(self._extract_formats_by_product_id(result, video_id))`
Reusable code for two NTR sites 3 months ago			`break`

			`if not formats:`
			`raise ExtractorError('Could not find a POMS product id in the provided URL, '`
			`'perhaps because all stream URLs are DRM protected.')`

			`return {`
			`'id': video_id,`
			`'title': video_id,`
			`'formats': formats,`
			`}`


			`class HetKlokhuisIE(NTRSubsiteIE):`
Work work 3 months ago			`IE_NAME = 'hetklokhuis'`
Reusable code for two NTR sites 3 months ago			`IE_DESC = 'hetklokhuis.nl'`
Work work 3 months ago			`_VALID_URL = r'https?://(?:www\.)?hetklokhuis\.nl/.*'`
Reusable code for two NTR sites 3 months ago			`_TESTS = [{`
Work work 3 months ago			`'url': 'https://hetklokhuis.nl/dossier/142/zoek-het-uit/tv-uitzending/2987/aliens',`
			`'md5': '4664b54ed4e05183b1e4f2f4290d551e',`
			`'info_dict': {`
			`'id': 'aliens',`
Fix zapp extractor 3 months ago			`'title': 'aliens',`
			`},`
Reusable code for two NTR sites 3 months ago			`}]`
Add scaffolding for last few extractors and change order so the PR diff looks nice 3 months ago

			`class VPROIE(NPOIE):`
			`IE_NAME = 'vpro'`
			`IE_DESC = 'vpro.nl'`
			`_VALID_URL = r'https?://(?:www\.)?vpro.nl/.*'`
			`_TESTS = [{`
			`'url': 'https://www.vpro.nl/programmas/tegenlicht/kijk/afleveringen/2015-2016/offline-als-luxe.html',`
Update unit tests 3 months ago			`'md5': 'cf302e066b5313cfaf8d5adf50d64f13',`
			`'info_dict': {`
			`'id': 'offline-als-luxe.html',`
			`'title': 'offline-als-luxe.html',`
			`'ext': 'm4v',`
Fix zapp extractor 3 months ago			`},`
Add scaffolding for last few extractors and change order so the PR diff looks nice 3 months ago			`}]`

			`def _real_extract(self, url):`
			`video_id = url.rstrip('/').split('/')[-1]`
			`page, _ = self._download_webpage_handle(url, video_id)`
Improve regex Co-authored-by: Roy <git@rvsit.nl> 3 months ago			`results = re.findall(r'data-media-id="([a-zA-Z0-9_]+)"\s', page)`
Add scaffolding for last few extractors and change order so the PR diff looks nice 3 months ago			`formats = []`
			`for result in results:`
Resolve some of the pull request feedback 3 months ago			`formats.extend(self._extract_formats_by_product_id(result, video_id))`
Add scaffolding for last few extractors and change order so the PR diff looks nice 3 months ago			`break # TODO find a better solution, VPRO pages can have multiple videos embedded`

			`if not formats:`
			`raise ExtractorError('Could not find a POMS product id in the provided URL, '`
			`'perhaps because all stream URLs are DRM protected.')`

			`return {`
			`'id': video_id,`
			`'title': video_id,`
			`'formats': formats,`
			`}`


Reusable code for two NTR sites 3 months ago			`class AndereTijdenIE(NTRSubsiteIE):`
			`IE_NAME = 'anderetijden'`
			`IE_DESC = 'anderetijden.nl'`
			`_VALID_URL = r'https?://(?:www\.)?anderetijden\.nl/.*'`
			`_TESTS = [{`
Work work 3 months ago			`'url': 'https://anderetijden.nl/programma/1/Andere-Tijden/aflevering/676/Duitse-soldaten-over-de-Slag-bij-Arnhem',`
			`'md5': '3d607b16e00b459156b4ab6e163dccd7',`
			`'info_dict': {`
			`'id': 'Duitse-soldaten-over-de-Slag-bij-Arnhem',`
Fix zapp extractor 3 months ago			`'title': 'Duitse-soldaten-over-de-Slag-bij-Arnhem',`
			`},`
Reusable code for two NTR sites 3 months ago			`}]`