diff options
Diffstat (limited to 'youtube_dl/extractor/common.py')
| -rw-r--r-- | youtube_dl/extractor/common.py | 68 | 
1 files changed, 65 insertions, 3 deletions
| diff --git a/youtube_dl/extractor/common.py b/youtube_dl/extractor/common.py index 0dd504444..6fa60622e 100644 --- a/youtube_dl/extractor/common.py +++ b/youtube_dl/extractor/common.py @@ -9,6 +9,7 @@ import xml.etree.ElementTree  from ..utils import (      compat_http_client,      compat_urllib_error, +    compat_urllib_parse_urlparse,      compat_str,      clean_html, @@ -37,10 +38,12 @@ class InfoExtractor(object):      id:             Video identifier.      title:          Video title, unescaped. -    Additionally, it must contain either a formats entry or url and ext: +    Additionally, it must contain either a formats entry or a url one: -    formats:        A list of dictionaries for each format available, it must -                    be ordered from worst to best quality. Potential fields: +    formats:        A list of dictionaries for each format available, ordered +                    from worst to best quality. + +                    Potential fields:                      * url        Mandatory. The URL of the video file                      * ext        Will be calculated from url if missing                      * format     A human-readable description of the format @@ -53,12 +56,21 @@ class InfoExtractor(object):                                   ("3D" or "DASH video")                      * width      Width of the video, if known                      * height     Height of the video, if known +                    * resolution Textual description of width and height +                    * tbr        Average bitrate of audio and video in KBit/s                      * abr        Average audio bitrate in KBit/s                      * acodec     Name of the audio codec in use                      * vbr        Average video bitrate in KBit/s                      * vcodec     Name of the video codec in use                      * filesize   The number of bytes, if known in advance                      * player_url SWF Player URL (used for rtmpdump). +                    * protocol   The protocol that will be used for the actual +                                 download, lower-case. +                                 "http", "https", "rtsp", "rtmp" or so. +                    * preference Order number of this format. If this field is +                                 present, the formats get sorted by this field. +                                 -1 for default (order by other properties), +                                 -2 or smaller for less than default.      url:            Final video URL.      ext:            Video filename extension.      format:         The video format, defaults to ext (used for --get-format) @@ -429,6 +441,56 @@ class InfoExtractor(object):          }          return RATING_TABLE.get(rating.lower(), None) +    def _sort_formats(self, formats): +        def _formats_key(f): +            # TODO remove the following workaround +            from ..utils import determine_ext +            if not f.get('ext') and 'url' in f: +                f['ext'] = determine_ext(f['url']) + +            preference = f.get('preference') +            if preference is None: +                proto = f.get('protocol') +                if proto is None: +                    proto = compat_urllib_parse_urlparse(f.get('url', '')).scheme + +                preference = 0 if proto in ['http', 'https'] else -0.1 +                if f.get('ext') in ['f4f', 'f4m']:  # Not yet supported +                    preference -= 0.5 + +            if f.get('vcodec') == 'none':  # audio only +                if self._downloader.params.get('prefer_free_formats'): +                    ORDER = [u'aac', u'mp3', u'm4a', u'webm', u'ogg', u'opus'] +                else: +                    ORDER = [u'webm', u'opus', u'ogg', u'mp3', u'aac', u'm4a'] +                ext_preference = 0 +                try: +                    audio_ext_preference = ORDER.index(f['ext']) +                except ValueError: +                    audio_ext_preference = -1 +            else: +                if self._downloader.params.get('prefer_free_formats'): +                    ORDER = [u'flv', u'mp4', u'webm'] +                else: +                    ORDER = [u'webm', u'flv', u'mp4'] +                try: +                    ext_preference = ORDER.index(f['ext']) +                except ValueError: +                    ext_preference = -1 +                audio_ext_preference = 0 + +            return ( +                preference, +                f.get('height') if f.get('height') is not None else -1, +                f.get('width') if f.get('width') is not None else -1, +                ext_preference, +                f.get('vbr') if f.get('vbr') is not None else -1, +                f.get('abr') if f.get('abr') is not None else -1, +                audio_ext_preference, +                f.get('filesize') if f.get('filesize') is not None else -1, +                f.get('format_id'), +            ) +        formats.sort(key=_formats_key)  class SearchInfoExtractor(InfoExtractor): | 
