bpb Add new extractor

2024-01-07 17:16:08 +00:00 · 2014-11-24 20:02:00 +01:00 · 2014-11-24 20:02:00 +01:00 · 355682be01
parent b74e86f48a
commit 355682be01
2 changed files with 42 additions and 0 deletions
--- a/youtube_dl/extractor/__init__.py
+++ b/youtube_dl/extractor/__init__.py
@@ -32,6 +32,7 @@ from .bilibili import BiliBiliIE
 from .blinkx import BlinkxIE
 from .bliptv import BlipTVIE, BlipTVUserIE
 from .bloomberg import BloombergIE
 from .bpb import BpbIE
 from .br import BRIE
 from .breakcom import BreakIE
 from .brightcove import BrightcoveIE
--- a/youtube_dl/extractor/bpb.py
+++ b/youtube_dl/extractor/bpb.py
@@ -0,0 +1,41 @@
 # coding: utf-8
 from __future__ import unicode_literals
 import re
 from .common import InfoExtractor
 class BpbIE(InfoExtractor):
 	"""Extractor for videos in the bpb.de Mediathek.

 	The Mediathek page is scraped for its headline, its Open Graph
 	description and the link to the MP4 file hosted on film.bpb.de.
 	"""

 	# NOTE(review): this holds a long human-readable label; if the base class
 	# offers a separate description attribute (e.g. IE_DESC), the label may
 	# belong there and IE_NAME should be a short identifier -- confirm.
 	IE_NAME = 'Bundeszentrale für politische Bildung'

 	# Accepts both http and https. The numeric path segment is optional so that
 	# every URL the previous pattern accepted is still accepted; when present
 	# it is exposed as the ``id`` group and used to label log output.
 	_VALID_URL = r'https?://www\.bpb\.de/mediathek/(?P<id>[0-9]+)?.*'

 	_TEST = {
 		'url': 'http://www.bpb.de/mediathek/297/joachim-gauck-zu-1989-und-die-erinnerung-an-die-ddr',
 		'md5': '0792086e8e2bfbac9cdf27835d5f2093',
 		'info_dict': {
 			'id': '12490',
 			'ext': 'mp4',
 			'title': 'Joachim Gauck zu 1989 und die Erinnerung an die DDR',
 			'description': 'Joachim Gauck, erster Beauftragter für die Stasi-Unterlagen, spricht auf dem Geschichtsforum über die friedliche Revolution 1989 und eine "gewisse Traurigkeit" im Umgang mit der DDR-Vergangenheit.',
 		},
 	}

 	def _real_extract(self, url):
 		"""Download the Mediathek page at *url* and build the info dict.

 		Returns a dict with the keys ``id`` (the document number taken from
 		the film URL), ``url`` (the MP4 link found on the page), ``title``,
 		``description`` and ``ext``.

 		Presumably the base-class search helpers raise when the headline or
 		the film link cannot be found -- confirm against InfoExtractor.
 		"""
 		# The page number from the URL is only used to label the download in
 		# log output; fall back to the previous empty label when the URL has
 		# no numeric segment (or does not match at all).
 		mobj = re.match(self._VALID_URL, url)
 		page_id = (mobj.group('id') if mobj else None) or ''

 		webpage = self._download_webpage(url, page_id)

 		title = self._html_search_regex(
 			r'<h2 class="white">(.*?)</h2>', webpage, 'title')

 		# Take the media link exactly as it appears on the page (http or
 		# https) instead of rebuilding it from the document number.
 		video_url = self._html_search_regex(
 			r'(https?://film\.bpb\.de/player/dokument_[0-9]+\.mp4)',
 			webpage, 'video URL')
 		# Cannot fail: video_url was matched by the pattern above.
 		video_id = re.search(r'dokument_([0-9]+)\.mp4', video_url).group(1)

 		description = self._og_search_description(webpage)

 		return {
 			'id': video_id,
 			'url': video_url,
 			'title': title,
 			'description': description,
 			'ext': 'mp4',
 		}