diff options
| author | Tithen-Firion <Tithen-Firion@users.noreply.github.com> | 2017-05-04 11:00:06 +0200 | 
|---|---|---|
| committer | GitHub <noreply@github.com> | 2017-05-04 11:00:06 +0200 | 
| commit | c89267d31ad99eb5b1a87cd354de5280a2a087b1 (patch) | |
| tree | 8bb3b01cd088d0646089344bddd3d4ff272c0065 /youtube_dl/extractor/pbs.py | |
| parent | 7552f96352f35cd877e52fd0770b77ba1856fc62 (diff) | |
| parent | 0c265486016b06342fb257966474ce591667aaff (diff) | |
Merge branch 'master' into openload-phantomjs-method
Diffstat (limited to 'youtube_dl/extractor/pbs.py')
| -rw-r--r-- | youtube_dl/extractor/pbs.py | 19 | 
1 file changed, 18 insertions, 1 deletion
```diff
diff --git a/youtube_dl/extractor/pbs.py b/youtube_dl/extractor/pbs.py
index 3e51b4dd7..0727e381b 100644
--- a/youtube_dl/extractor/pbs.py
+++ b/youtube_dl/extractor/pbs.py
@@ -8,6 +8,7 @@ from ..utils import (
     ExtractorError,
     determine_ext,
     int_or_none,
+    float_or_none,
     js_to_json,
     strip_jsonp,
     strip_or_none,
@@ -464,6 +465,7 @@ class PBSIE(InfoExtractor):
                     redirects.append(redirect)
                     redirect_urls.add(redirect_url)
 
+        chapters = []
         # Player pages may also serve different qualities
         for page in ('widget/partnerplayer', 'portalplayer'):
             player = self._download_webpage(
@@ -479,6 +481,20 @@ class PBSIE(InfoExtractor):
                     extract_redirect_urls(video_info)
                     if not info:
                         info = video_info
+                if not chapters:
+                    for chapter_data in re.findall(r'(?s)chapters\.push\(({.*?})\)', player):
+                        chapter = self._parse_json(chapter_data, video_id, js_to_json, fatal=False)
+                        if not chapter:
+                            continue
+                        start_time = float_or_none(chapter.get('start_time'), 1000)
+                        duration = float_or_none(chapter.get('duration'), 1000)
+                        if start_time is None or duration is None:
+                            continue
+                        chapters.append({
+                            'start_time': start_time,
+                            'end_time': start_time + duration,
+                            'title': chapter.get('title'),
+                        })
 
         formats = []
         http_url = None
@@ -515,7 +531,7 @@ class PBSIE(InfoExtractor):
                     http_url = format_url
         self._remove_duplicate_formats(formats)
         m3u8_formats = list(filter(
-            lambda f: f.get('protocol') == 'm3u8' and f.get('vcodec') != 'none' and f.get('resolution') != 'multiple',
+            lambda f: f.get('protocol') == 'm3u8' and f.get('vcodec') != 'none',
             formats))
         if http_url:
             for m3u8_format in m3u8_formats:
@@ -588,4 +604,5 @@ class PBSIE(InfoExtractor):
             'upload_date': upload_date,
             'formats': formats,
             'subtitles': subtitles,
+            'chapters': chapters,
         }
```
