release 2014.06.04

[ard] Fix format extraction (fixes #3006 and #3032)
Merge pull request #2962 from simonwjackson/patch-1
2025-12-14 10:02:42 +01:00 · 2014-06-04 06:47:57 +02:00 · 2014-06-03 21:56:49 +02:00 · 2014-06-03 16:47:59 +02:00 · 2014-06-03 19:59:08 +07:00 · 2014-06-02 20:20:21 +07:00
5 changed files with 14 additions and 21 deletions
--- a/test/test_age_restriction.py
+++ b/test/test_age_restriction.py
@@ -13,7 +13,7 @@ from youtube_dl import YoutubeDL


 def _download_restricted(url, filename, age):
-    """ Returns true iff the file has been downloaded """
+    """ Returns true if the file has been downloaded """

    params = {
        'age_limit': age,
--- a/youtube_dl/extractor/ard.py
+++ b/youtube_dl/extractor/ard.py
@@ -39,16 +39,18 @@ class ARDIE(InfoExtractor):

        title = self._html_search_regex(
            [r'<h1(?:\s+class="boxTopHeadline")?>(.*?)</h1>',
+             r'<meta name="dcterms.title" content="(.*?)"/>',
             r'<h4 class="headline">(.*?)</h4>'],
            webpage, 'title')
        description = self._html_search_meta(
            'dcterms.abstract', webpage, 'description')
        thumbnail = self._og_search_thumbnail(webpage)

-        streams = [
-            mo.groupdict()
-            for mo in re.finditer(
-                r'mediaCollection\.addMediaStream\((?P<media_type>\d+), (?P<quality>\d+), "(?P<rtmp_url>[^"]*)", "(?P<video_url>[^"]*)", "[^"]*"\)', webpage)]
+
+        media_info = self._download_json(
+            'http://www.ardmediathek.de/play/media/%s' % video_id, video_id)
+        # The second element of the _mediaArray contains the standard http urls
+        streams = media_info['_mediaArray'][1]['_mediaStreamArray']
        if not streams:
            if '"fsk"' in webpage:
                raise ExtractorError('This video is only available after 20:00')
@@ -56,21 +58,12 @@ class ARDIE(InfoExtractor):
        formats = []
        for s in streams:
            format = {
-                'quality': int(s['quality']),
+                'quality': s['_quality'],
+                'url': s['_stream'],
            }
-            if s.get('rtmp_url'):
-                format['protocol'] = 'rtmp'
-                format['url'] = s['rtmp_url']
-                format['playpath'] = s['video_url']
-            else:
-                format['url'] = s['video_url']

-            quality_name = self._search_regex(
-                r'[,.]([a-zA-Z0-9_-]+),?\.mp4', format['url'],
-                'quality name', default='NA')
-            format['format_id'] = '%s-%s-%s-%s' % (
-                determine_ext(format['url']), quality_name, s['media_type'],
-                s['quality'])
+            format['format_id'] = '%s-%s' % (
+                determine_ext(format['url']), format['quality'])

            formats.append(format)

--- a/youtube_dl/extractor/extremetube.py
+++ b/youtube_dl/extractor/extremetube.py
@@ -37,7 +37,7 @@ class ExtremeTubeIE(InfoExtractor):
        webpage = self._download_webpage(req, video_id)

        video_title = self._html_search_regex(
-            r'<h1 [^>]*?title="([^"]+)"[^>]*>\1<', webpage, 'title')
+            r'<h1 [^>]*?title="([^"]+)"[^>]*>', webpage, 'title')
        uploader = self._html_search_regex(
            r'>Posted by:(?=<)(?:\s|<[^>]*>)*(.+?)\|', webpage, 'uploader',
            fatal=False)
--- a/youtube_dl/extractor/youtube.py
+++ b/youtube_dl/extractor/youtube.py
@@ -1140,7 +1140,7 @@ class YoutubeIE(YoutubeBaseInfoExtractor, SubtitlesInfoExtractor):
        mobj = re.search(r'(?s)id="eow-date.*?>(.*?)</span>', video_webpage)
        if mobj is None:
            mobj = re.search(
-                r'(?s)id="watch-uploader-info".*?>.*?(?:Published|Uploaded) on (.*?)</strong>',
+                r'(?s)id="watch-uploader-info".*?>.*?(?:Published|Uploaded|Streamed live) on (.*?)</strong>',
                video_webpage)
        if mobj is not None:
            upload_date = ' '.join(re.sub(r'[/,-]', r' ', mobj.group(1)).split())
--- a/youtube_dl/version.py
+++ b/youtube_dl/version.py
@@ -1,2 +1,2 @@

-__version__ = '2014.06.02'
+__version__ = '2014.06.04'
Author	SHA1	Message	Date
Philipp Hagemeister	b675b32e6b	release 2014.06.04	2014-06-04 06:47:57 +02:00
Jaime Marquínez Ferrándiz	6a3fa81ffb	[ard] Fix format extraction (fixes #3006 and #3032)	2014-06-03 21:56:49 +02:00
Jaime Marquínez Ferrándiz	0d69795014	Merge pull request #2962 from simonwjackson/patch-1 Update test_age_restriction.py	2014-06-03 16:47:59 +02:00
Sergey M.	3374f3fdc2	Merge pull request #3022 from MikeCol/Extremetube_title title extraction condition less restrictive	2014-06-03 19:59:08 +07:00
Sergey M.	4bf0727b1f	Merge pull request #3033 from Forever-Young/patch-2 Recognize a third format of the upload_date in the 'watch-uploader-info'...	2014-06-02 20:20:21 +07:00
Anton Novosyolov	263bd4ec50	Recognize a third format of the upload_date in the 'watch-uploader-info' element	2014-06-02 13:30:23 +04:00
MikeCol	9c7b79acd9	title extraction condition less restrictive	2014-05-31 18:31:39 +02:00
Simon W. Jackson	8ae980807a	Update test_age_restriction.py typo	2014-05-21 16:35:49 +02:00