bpb Add new extractor

This commit is contained in:
Oskar Jauch 2014-11-24 20:02:00 +01:00
parent b74e86f48a
commit 355682be01
2 changed files with 42 additions and 0 deletions

View file

@ -32,6 +32,7 @@ from .bilibili import BiliBiliIE
from .blinkx import BlinkxIE from .blinkx import BlinkxIE
from .bliptv import BlipTVIE, BlipTVUserIE from .bliptv import BlipTVIE, BlipTVUserIE
from .bloomberg import BloombergIE from .bloomberg import BloombergIE
from .bpb import BpbIE
from .br import BRIE from .br import BRIE
from .breakcom import BreakIE from .breakcom import BreakIE
from .brightcove import BrightcoveIE from .brightcove import BrightcoveIE

View file

@ -0,0 +1,41 @@
# coding: utf-8
from __future__ import unicode_literals
import re
from .common import InfoExtractor
class BpbIE(InfoExtractor):
    """Extractor for video pages under http://www.bpb.de/mediathek/.

    The media file itself is served from film.bpb.de; the page embeds a
    link of the form ``dokument_<number>.mp4`` from which both the video
    id and the download URL are derived.
    """

    # NOTE(review): this is a long human-readable name; presumably the
    # framework also offers a separate description attribute for that and
    # expects a short IE_NAME -- confirm against the base class before
    # changing, since the value is visible to users.
    IE_NAME = 'Bundeszentrale für politische Bildung'
    # The first path segment after /mediathek/ is captured so the page
    # download can be labelled with it. The group may be empty, so exactly
    # the same set of URLs is matched as without the group.
    _VALID_URL = r'http://www\.bpb\.de/mediathek/(?P<page_id>[^/?#]*).*'
    _TEST = {
        'url': 'http://www.bpb.de/mediathek/297/joachim-gauck-zu-1989-und-die-erinnerung-an-die-ddr',
        'md5': '0792086e8e2bfbac9cdf27835d5f2093',
        'info_dict': {
            'id': '12490',
            'ext': 'mp4',
            'title': 'Joachim Gauck zu 1989 und die Erinnerung an die DDR',
            'description': 'Joachim Gauck, erster Beauftragter für die Stasi-Unterlagen, spricht auf dem Geschichtsforum über die friedliche Revolution 1989 und eine "gewisse Traurigkeit" im Umgang mit der DDR-Vergangenheit.'
        }
    }

    def _real_extract(self, url):
        """Download the Mediathek page at *url* and build the info dict.

        Returns a dict with the keys ``id`` (the document number found in
        the embedded mp4 link), ``url`` (the mp4 location), ``title``,
        ``description`` and ``ext``.

        NOTE(review): the inherited search helpers are expected to raise
        when a pattern is not found -- confirm against the base class.
        """
        # Label the download with the page number from the URL instead of
        # an empty string; fall back to '' (the previous value) if the URL
        # carries no such segment.
        mobj = re.match(self._VALID_URL, url)
        page_id = mobj.group('page_id') if mobj else ''
        webpage = self._download_webpage(url, page_id)

        title = self._html_search_regex(
            r'<h2 class="white">(.*?)</h2>', webpage, 'title')
        video_id = self._html_search_regex(
            r'http://film\.bpb\.de/player/dokument_(?P<video_id>[0-9]+)\.mp4',
            webpage, 'video_id')
        # Keep the media URL separate from the page URL parameter rather
        # than overwriting ``url``.
        video_url = 'http://film.bpb.de/player/dokument_%s.mp4' % video_id
        description = self._og_search_description(webpage)

        return {
            'id': video_id,
            'url': video_url,
            'title': title,
            'description': description,
            'ext': 'mp4',
        }