diff options
Diffstat (limited to 'test')
| -rw-r--r-- | test/helper.py | 131 | ||||
| -rw-r--r-- | test/test_InfoExtractor.py | 8 | ||||
| -rw-r--r-- | test/test_YoutubeDL.py | 98 | ||||
| -rw-r--r-- | test/test_all_urls.py | 4 | ||||
| -rw-r--r-- | test/test_compat.py | 21 | ||||
| -rw-r--r-- | test/test_download.py | 6 | ||||
| -rw-r--r-- | test/test_jsinterp.py | 3 | ||||
| -rw-r--r-- | test/test_subtitles.py | 34 | ||||
| -rw-r--r-- | test/test_utils.py | 142 | ||||
| -rw-r--r-- | test/test_write_annotations.py | 2 | ||||
| -rw-r--r-- | test/test_youtube_lists.py | 9 | 
11 files changed, 378 insertions, 80 deletions
| diff --git a/test/helper.py b/test/helper.py index e1129e58f..bdd7acca4 100644 --- a/test/helper.py +++ b/test/helper.py @@ -89,66 +89,81 @@ def gettestcases(include_onlymatching=False):  md5 = lambda s: hashlib.md5(s.encode('utf-8')).hexdigest() -def expect_info_dict(self, got_dict, expected_dict): +def expect_value(self, got, expected, field): +    if isinstance(expected, compat_str) and expected.startswith('re:'): +        match_str = expected[len('re:'):] +        match_rex = re.compile(match_str) + +        self.assertTrue( +            isinstance(got, compat_str), +            'Expected a %s object, but got %s for field %s' % ( +                compat_str.__name__, type(got).__name__, field)) +        self.assertTrue( +            match_rex.match(got), +            'field %s (value: %r) should match %r' % (field, got, match_str)) +    elif isinstance(expected, compat_str) and expected.startswith('startswith:'): +        start_str = expected[len('startswith:'):] +        self.assertTrue( +            isinstance(got, compat_str), +            'Expected a %s object, but got %s for field %s' % ( +                compat_str.__name__, type(got).__name__, field)) +        self.assertTrue( +            got.startswith(start_str), +            'field %s (value: %r) should start with %r' % (field, got, start_str)) +    elif isinstance(expected, compat_str) and expected.startswith('contains:'): +        contains_str = expected[len('contains:'):] +        self.assertTrue( +            isinstance(got, compat_str), +            'Expected a %s object, but got %s for field %s' % ( +                compat_str.__name__, type(got).__name__, field)) +        self.assertTrue( +            contains_str in got, +            'field %s (value: %r) should contain %r' % (field, got, contains_str)) +    elif isinstance(expected, type): +        self.assertTrue( +            isinstance(got, expected), +            'Expected type %r for field %s, but got value %r of type %r' % (expected, field, got, type(got))) +    elif isinstance(expected, dict) and isinstance(got, dict): +        expect_dict(self, got, expected) +    elif isinstance(expected, list) and isinstance(got, list): +        self.assertEqual( +            len(expected), len(got), +            'Expect a list of length %d, but got a list of length %d for field %s' % ( +                len(expected), len(got), field)) +        for index, (item_got, item_expected) in enumerate(zip(got, expected)): +            type_got = type(item_got) +            type_expected = type(item_expected) +            self.assertEqual( +                type_expected, type_got, +                'Type mismatch for list item at index %d for field %s, expected %r, got %r' % ( +                    index, field, type_expected, type_got)) +            expect_value(self, item_got, item_expected, field) +    else: +        if isinstance(expected, compat_str) and expected.startswith('md5:'): +            got = 'md5:' + md5(got) +        elif isinstance(expected, compat_str) and expected.startswith('mincount:'): +            self.assertTrue( +                isinstance(got, (list, dict)), +                'Expected field %s to be a list or a dict, but it is of type %s' % ( +                    field, type(got).__name__)) +            expected_num = int(expected.partition(':')[2]) +            assertGreaterEqual( +                self, len(got), expected_num, +                'Expected %d items in field %s, but only got %d' % (expected_num, field, len(got))) +            return +        self.assertEqual( +            expected, got, +            'Invalid value for field %s, expected %r, got %r' % (field, expected, got)) + + +def expect_dict(self, got_dict, expected_dict):      for info_field, expected in expected_dict.items(): -        if isinstance(expected, compat_str) and expected.startswith('re:'): -            got = got_dict.get(info_field) -            match_str = expected[len('re:'):] -            match_rex = re.compile(match_str) +        got = got_dict.get(info_field) +        expect_value(self, got, expected, info_field) -            self.assertTrue( -                isinstance(got, compat_str), -                'Expected a %s object, but got %s for field %s' % ( -                    compat_str.__name__, type(got).__name__, info_field)) -            self.assertTrue( -                match_rex.match(got), -                'field %s (value: %r) should match %r' % (info_field, got, match_str)) -        elif isinstance(expected, compat_str) and expected.startswith('startswith:'): -            got = got_dict.get(info_field) -            start_str = expected[len('startswith:'):] -            self.assertTrue( -                isinstance(got, compat_str), -                'Expected a %s object, but got %s for field %s' % ( -                    compat_str.__name__, type(got).__name__, info_field)) -            self.assertTrue( -                got.startswith(start_str), -                'field %s (value: %r) should start with %r' % (info_field, got, start_str)) -        elif isinstance(expected, compat_str) and expected.startswith('contains:'): -            got = got_dict.get(info_field) -            contains_str = expected[len('contains:'):] -            self.assertTrue( -                isinstance(got, compat_str), -                'Expected a %s object, but got %s for field %s' % ( -                    compat_str.__name__, type(got).__name__, info_field)) -            self.assertTrue( -                contains_str in got, -                'field %s (value: %r) should contain %r' % (info_field, got, contains_str)) -        elif isinstance(expected, type): -            got = got_dict.get(info_field) -            self.assertTrue(isinstance(got, expected), -                            'Expected type %r for field %s, but got value %r of type %r' % (expected, info_field, got, type(got))) -        else: -            if isinstance(expected, compat_str) and expected.startswith('md5:'): -                got = 'md5:' + md5(got_dict.get(info_field)) -            elif isinstance(expected, compat_str) and expected.startswith('mincount:'): -                got = got_dict.get(info_field) -                self.assertTrue( -                    isinstance(got, list), -                    'Expected field %s to be a list, but it is of type %s' % ( -                        info_field, type(got).__name__)) -                expected_num = int(expected.partition(':')[2]) -                assertGreaterEqual( -                    self, len(got), expected_num, -                    'Expected %d items in field %s, but only got %d' % ( -                        expected_num, info_field, len(got) -                    ) -                ) -                continue -            else: -                got = got_dict.get(info_field) -            self.assertEqual(expected, got, -                             'invalid value for field %s, expected %r, got %r' % (info_field, expected, got)) +def expect_info_dict(self, got_dict, expected_dict): +    expect_dict(self, got_dict, expected_dict)      # Check for the presence of mandatory fields      if got_dict.get('_type') not in ('playlist', 'multi_video'):          for key in ('id', 'url', 'title', 'ext'): @@ -160,7 +175,7 @@ def expect_info_dict(self, got_dict, expected_dict):      # Are checkable fields missing from the test case definition?      test_info_dict = dict((key, value if not isinstance(value, compat_str) or len(value) < 250 else 'md5:' + md5(value))                            for key, value in got_dict.items() -                          if value and key in ('id', 'title', 'description', 'uploader', 'upload_date', 'timestamp', 'uploader_id', 'location')) +                          if value and key in ('id', 'title', 'description', 'uploader', 'upload_date', 'timestamp', 'uploader_id', 'location', 'age_limit'))      missing_keys = set(test_info_dict.keys()) - set(expected_dict.keys())      if missing_keys:          def _repr(v): diff --git a/test/test_InfoExtractor.py b/test/test_InfoExtractor.py index be8d12997..938466a80 100644 --- a/test/test_InfoExtractor.py +++ b/test/test_InfoExtractor.py @@ -35,10 +35,18 @@ class TestInfoExtractor(unittest.TestCase):              <meta name="og:title" content='Foo'/>              <meta content="Some video's description " name="og:description"/>              <meta property='og:image' content='http://domain.com/pic.jpg?key1=val1&key2=val2'/> +            <meta content='application/x-shockwave-flash' property='og:video:type'> +            <meta content='Foo' property=og:foobar> +            <meta name="og:test1" content='foo > < bar'/> +            <meta name="og:test2" content="foo >//< bar"/>              '''          self.assertEqual(ie._og_search_title(html), 'Foo')          self.assertEqual(ie._og_search_description(html), 'Some video\'s description ')          self.assertEqual(ie._og_search_thumbnail(html), 'http://domain.com/pic.jpg?key1=val1&key2=val2') +        self.assertEqual(ie._og_search_video_url(html, default=None), None) +        self.assertEqual(ie._og_search_property('foobar', html), 'Foo') +        self.assertEqual(ie._og_search_property('test1', html), 'foo > < bar') +        self.assertEqual(ie._og_search_property('test2', html), 'foo >//< bar')      def test_html_search_meta(self):          ie = self.ie diff --git a/test/test_YoutubeDL.py b/test/test_YoutubeDL.py index a13c09ef4..0388c0bf3 100644 --- a/test/test_YoutubeDL.py +++ b/test/test_YoutubeDL.py @@ -15,7 +15,7 @@ from youtube_dl import YoutubeDL  from youtube_dl.compat import compat_str  from youtube_dl.extractor import YoutubeIE  from youtube_dl.postprocessor.common import PostProcessor -from youtube_dl.utils import match_filter_func +from youtube_dl.utils import ExtractorError, match_filter_func  TEST_URL = 'http://localhost/sample.mp4' @@ -105,6 +105,7 @@ class TestFormatSelection(unittest.TestCase):      def test_format_selection(self):          formats = [              {'format_id': '35', 'ext': 'mp4', 'preference': 1, 'url': TEST_URL}, +            {'format_id': 'example-with-dashes', 'ext': 'webm', 'preference': 1, 'url': TEST_URL},              {'format_id': '45', 'ext': 'webm', 'preference': 2, 'url': TEST_URL},              {'format_id': '47', 'ext': 'webm', 'preference': 3, 'url': TEST_URL},              {'format_id': '2', 'ext': 'flv', 'preference': 4, 'url': TEST_URL}, @@ -136,6 +137,11 @@ class TestFormatSelection(unittest.TestCase):          downloaded = ydl.downloaded_info_dicts[0]          self.assertEqual(downloaded['format_id'], '35') +        ydl = YDL({'format': 'example-with-dashes'}) +        ydl.process_ie_result(info_dict.copy()) +        downloaded = ydl.downloaded_info_dicts[0] +        self.assertEqual(downloaded['format_id'], 'example-with-dashes') +      def test_format_selection_audio(self):          formats = [              {'format_id': 'audio-low', 'ext': 'webm', 'preference': 1, 'vcodec': 'none', 'url': TEST_URL}, @@ -229,21 +235,70 @@ class TestFormatSelection(unittest.TestCase):              '141', '172', '140', '171', '139',          ] -        for f1id, f2id in zip(order, order[1:]): -            f1 = YoutubeIE._formats[f1id].copy() -            f1['format_id'] = f1id -            f1['url'] = 'url:' + f1id -            f2 = YoutubeIE._formats[f2id].copy() -            f2['format_id'] = f2id -            f2['url'] = 'url:' + f2id +        def format_info(f_id): +            info = YoutubeIE._formats[f_id].copy() +            info['format_id'] = f_id +            info['url'] = 'url:' + f_id +            return info +        formats_order = [format_info(f_id) for f_id in order] + +        info_dict = _make_result(list(formats_order), extractor='youtube') +        ydl = YDL({'format': 'bestvideo+bestaudio'}) +        yie = YoutubeIE(ydl) +        yie._sort_formats(info_dict['formats']) +        ydl.process_ie_result(info_dict) +        downloaded = ydl.downloaded_info_dicts[0] +        self.assertEqual(downloaded['format_id'], '137+141') +        self.assertEqual(downloaded['ext'], 'mp4') + +        info_dict = _make_result(list(formats_order), extractor='youtube') +        ydl = YDL({'format': 'bestvideo[height>=999999]+bestaudio/best'}) +        yie = YoutubeIE(ydl) +        yie._sort_formats(info_dict['formats']) +        ydl.process_ie_result(info_dict) +        downloaded = ydl.downloaded_info_dicts[0] +        self.assertEqual(downloaded['format_id'], '38') + +        info_dict = _make_result(list(formats_order), extractor='youtube') +        ydl = YDL({'format': 'bestvideo/best,bestaudio'}) +        yie = YoutubeIE(ydl) +        yie._sort_formats(info_dict['formats']) +        ydl.process_ie_result(info_dict) +        downloaded_ids = [info['format_id'] for info in ydl.downloaded_info_dicts] +        self.assertEqual(downloaded_ids, ['137', '141']) + +        info_dict = _make_result(list(formats_order), extractor='youtube') +        ydl = YDL({'format': '(bestvideo[ext=mp4],bestvideo[ext=webm])+bestaudio'}) +        yie = YoutubeIE(ydl) +        yie._sort_formats(info_dict['formats']) +        ydl.process_ie_result(info_dict) +        downloaded_ids = [info['format_id'] for info in ydl.downloaded_info_dicts] +        self.assertEqual(downloaded_ids, ['137+141', '248+141']) + +        info_dict = _make_result(list(formats_order), extractor='youtube') +        ydl = YDL({'format': '(bestvideo[ext=mp4],bestvideo[ext=webm])[height<=720]+bestaudio'}) +        yie = YoutubeIE(ydl) +        yie._sort_formats(info_dict['formats']) +        ydl.process_ie_result(info_dict) +        downloaded_ids = [info['format_id'] for info in ydl.downloaded_info_dicts] +        self.assertEqual(downloaded_ids, ['136+141', '247+141']) + +        info_dict = _make_result(list(formats_order), extractor='youtube') +        ydl = YDL({'format': '(bestvideo[ext=none]/bestvideo[ext=webm])+bestaudio'}) +        yie = YoutubeIE(ydl) +        yie._sort_formats(info_dict['formats']) +        ydl.process_ie_result(info_dict) +        downloaded_ids = [info['format_id'] for info in ydl.downloaded_info_dicts] +        self.assertEqual(downloaded_ids, ['248+141']) +        for f1, f2 in zip(formats_order, formats_order[1:]):              info_dict = _make_result([f1, f2], extractor='youtube')              ydl = YDL({'format': 'best/bestvideo'})              yie = YoutubeIE(ydl)              yie._sort_formats(info_dict['formats'])              ydl.process_ie_result(info_dict)              downloaded = ydl.downloaded_info_dicts[0] -            self.assertEqual(downloaded['format_id'], f1id) +            self.assertEqual(downloaded['format_id'], f1['format_id'])              info_dict = _make_result([f2, f1], extractor='youtube')              ydl = YDL({'format': 'best/bestvideo'}) @@ -251,7 +306,18 @@ class TestFormatSelection(unittest.TestCase):              yie._sort_formats(info_dict['formats'])              ydl.process_ie_result(info_dict)              downloaded = ydl.downloaded_info_dicts[0] -            self.assertEqual(downloaded['format_id'], f1id) +            self.assertEqual(downloaded['format_id'], f1['format_id']) + +    def test_invalid_format_specs(self): +        def assert_syntax_error(format_spec): +            ydl = YDL({'format': format_spec}) +            info_dict = _make_result([{'format_id': 'foo', 'url': TEST_URL}]) +            self.assertRaises(SyntaxError, ydl.process_ie_result, info_dict) + +        assert_syntax_error('bestvideo,,best') +        assert_syntax_error('+bestaudio') +        assert_syntax_error('bestvideo+') +        assert_syntax_error('/')      def test_format_filtering(self):          formats = [ @@ -308,6 +374,18 @@ class TestFormatSelection(unittest.TestCase):          downloaded = ydl.downloaded_info_dicts[0]          self.assertEqual(downloaded['format_id'], 'G') +        ydl = YDL({'format': 'all[width>=400][width<=600]'}) +        ydl.process_ie_result(info_dict) +        downloaded_ids = [info['format_id'] for info in ydl.downloaded_info_dicts] +        self.assertEqual(downloaded_ids, ['B', 'C', 'D']) + +        ydl = YDL({'format': 'best[height<40]'}) +        try: +            ydl.process_ie_result(info_dict) +        except ExtractorError: +            pass +        self.assertEqual(ydl.downloaded_info_dicts, []) +  class TestYoutubeDL(unittest.TestCase):      def test_subtitles(self): diff --git a/test/test_all_urls.py b/test/test_all_urls.py index a9db42b30..a0c11e6c1 100644 --- a/test/test_all_urls.py +++ b/test/test_all_urls.py @@ -121,8 +121,8 @@ class TestAllURLsMatching(unittest.TestCase):      def test_pbs(self):          # https://github.com/rg3/youtube-dl/issues/2350 -        self.assertMatch('http://video.pbs.org/viralplayer/2365173446/', ['PBS']) -        self.assertMatch('http://video.pbs.org/widget/partnerplayer/980042464/', ['PBS']) +        self.assertMatch('http://video.pbs.org/viralplayer/2365173446/', ['pbs']) +        self.assertMatch('http://video.pbs.org/widget/partnerplayer/980042464/', ['pbs'])      def test_yahoo_https(self):          # https://github.com/rg3/youtube-dl/issues/2701 diff --git a/test/test_compat.py b/test/test_compat.py index c3ba8ad2e..b6bfad05e 100644 --- a/test/test_compat.py +++ b/test/test_compat.py @@ -13,7 +13,10 @@ sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))  from youtube_dl.utils import get_filesystem_encoding  from youtube_dl.compat import (      compat_getenv, +    compat_etree_fromstring,      compat_expanduser, +    compat_shlex_split, +    compat_str,      compat_urllib_parse_unquote,      compat_urllib_parse_unquote_plus,  ) @@ -67,5 +70,23 @@ class TestCompat(unittest.TestCase):          self.assertEqual(compat_urllib_parse_unquote_plus('abc%20def'), 'abc def')          self.assertEqual(compat_urllib_parse_unquote_plus('%7e/abc+def'), '~/abc def') +    def test_compat_shlex_split(self): +        self.assertEqual(compat_shlex_split('-option "one two"'), ['-option', 'one two']) + +    def test_compat_etree_fromstring(self): +        xml = ''' +            <root foo="bar" spam="中文"> +                <normal>foo</normal> +                <chinese>中文</chinese> +                <foo><bar>spam</bar></foo> +            </root> +        ''' +        doc = compat_etree_fromstring(xml.encode('utf-8')) +        self.assertTrue(isinstance(doc.attrib['foo'], compat_str)) +        self.assertTrue(isinstance(doc.attrib['spam'], compat_str)) +        self.assertTrue(isinstance(doc.find('normal').text, compat_str)) +        self.assertTrue(isinstance(doc.find('chinese').text, compat_str)) +        self.assertTrue(isinstance(doc.find('foo/bar').text, compat_str)) +  if __name__ == '__main__':      unittest.main() diff --git a/test/test_download.py b/test/test_download.py index 1110357a7..a3f1c0644 100644 --- a/test/test_download.py +++ b/test/test_download.py @@ -102,7 +102,7 @@ def generator(test_case):          params = get_params(test_case.get('params', {}))          if is_playlist and 'playlist' not in test_case: -            params.setdefault('extract_flat', True) +            params.setdefault('extract_flat', 'in_playlist')              params.setdefault('skip_download', True)          ydl = YoutubeDL(params, auto_init=False) @@ -136,7 +136,9 @@ def generator(test_case):                      # We're not using .download here sine that is just a shim                      # for outside error handling, and returns the exit code                      # instead of the result dict. -                    res_dict = ydl.extract_info(test_case['url']) +                    res_dict = ydl.extract_info( +                        test_case['url'], +                        force_generic_extractor=params.get('force_generic_extractor', False))                  except (DownloadError, ExtractorError) as err:                      # Check if the exception is not a network related one                      if not err.exc_info[0] in (compat_urllib_error.URLError, socket.timeout, UnavailableVideoError, compat_http_client.BadStatusLine) or (err.exc_info[0] == compat_HTTPError and err.exc_info[1].code == 503): diff --git a/test/test_jsinterp.py b/test/test_jsinterp.py index fc73e5dc2..63c350b8f 100644 --- a/test/test_jsinterp.py +++ b/test/test_jsinterp.py @@ -19,6 +19,9 @@ class TestJSInterpreter(unittest.TestCase):          jsi = JSInterpreter('function x3(){return 42;}')          self.assertEqual(jsi.call_function('x3'), 42) +        jsi = JSInterpreter('var x5 = function(){return 42;}') +        self.assertEqual(jsi.call_function('x5'), 42) +      def test_calc(self):          jsi = JSInterpreter('function x4(a){return 2*a+1;}')          self.assertEqual(jsi.call_function('x4', 3), 7) diff --git a/test/test_subtitles.py b/test/test_subtitles.py index c4e3adb67..75f0ea75f 100644 --- a/test/test_subtitles.py +++ b/test/test_subtitles.py @@ -25,8 +25,10 @@ from youtube_dl.extractor import (      RaiIE,      VikiIE,      ThePlatformIE, +    ThePlatformFeedIE,      RTVEALaCartaIE,      FunnyOrDieIE, +    DemocracynowIE,  ) @@ -307,6 +309,18 @@ class TestThePlatformSubtitles(BaseTestSubtitles):          self.assertEqual(md5(subtitles['en']), '97e7670cbae3c4d26ae8bcc7fdd78d4b') +class TestThePlatformFeedSubtitles(BaseTestSubtitles): +    url = 'http://feed.theplatform.com/f/7wvmTC/msnbc_video-p-test?form=json&pretty=true&range=-40&byGuid=n_hardball_5biden_140207' +    IE = ThePlatformFeedIE + +    def test_allsubtitles(self): +        self.DL.params['writesubtitles'] = True +        self.DL.params['allsubtitles'] = True +        subtitles = self.getSubtitles() +        self.assertEqual(set(subtitles.keys()), set(['en'])) +        self.assertEqual(md5(subtitles['en']), '48649a22e82b2da21c9a67a395eedade') + +  class TestRtveSubtitles(BaseTestSubtitles):      url = 'http://www.rtve.es/alacarta/videos/los-misterios-de-laura/misterios-laura-capitulo-32-misterio-del-numero-17-2-parte/2428621/'      IE = RTVEALaCartaIE @@ -333,5 +347,25 @@ class TestFunnyOrDieSubtitles(BaseTestSubtitles):          self.assertEqual(md5(subtitles['en']), 'c5593c193eacd353596c11c2d4f9ecc4') +class TestDemocracynowSubtitles(BaseTestSubtitles): +    url = 'http://www.democracynow.org/shows/2015/7/3' +    IE = DemocracynowIE + +    def test_allsubtitles(self): +        self.DL.params['writesubtitles'] = True +        self.DL.params['allsubtitles'] = True +        subtitles = self.getSubtitles() +        self.assertEqual(set(subtitles.keys()), set(['en'])) +        self.assertEqual(md5(subtitles['en']), 'acaca989e24a9e45a6719c9b3d60815c') + +    def test_subtitles_in_page(self): +        self.url = 'http://www.democracynow.org/2015/7/3/this_flag_comes_down_today_bree' +        self.DL.params['writesubtitles'] = True +        self.DL.params['allsubtitles'] = True +        subtitles = self.getSubtitles() +        self.assertEqual(set(subtitles.keys()), set(['en'])) +        self.assertEqual(md5(subtitles['en']), 'acaca989e24a9e45a6719c9b3d60815c') + +  if __name__ == '__main__':      unittest.main() diff --git a/test/test_utils.py b/test/test_utils.py index 65692a9fb..1c3290d9b 100644 --- a/test/test_utils.py +++ b/test/test_utils.py @@ -21,6 +21,8 @@ from youtube_dl.utils import (      clean_html,      DateRange,      detect_exe_version, +    determine_ext, +    encode_compat_str,      encodeFilename,      escape_rfc3986,      escape_url, @@ -42,6 +44,7 @@ from youtube_dl.utils import (      sanitize_path,      prepend_extension,      replace_extension, +    remove_quotes,      shell_quote,      smuggle_url,      str_to_int, @@ -57,11 +60,19 @@ from youtube_dl.utils import (      urlencode_postdata,      version_tuple,      xpath_with_ns, +    xpath_element,      xpath_text, +    xpath_attr,      render_table,      match_str,      parse_dfxp_time_expr,      dfxp2srt, +    cli_option, +    cli_valueless_option, +    cli_bool_option, +) +from youtube_dl.compat import ( +    compat_etree_fromstring,  ) @@ -191,6 +202,15 @@ class TestUtil(unittest.TestCase):          self.assertEqual(replace_extension('.abc', 'temp'), '.abc.temp')          self.assertEqual(replace_extension('.abc.ext', 'temp'), '.abc.temp') +    def test_remove_quotes(self): +        self.assertEqual(remove_quotes(None), None) +        self.assertEqual(remove_quotes('"'), '"') +        self.assertEqual(remove_quotes("'"), "'") +        self.assertEqual(remove_quotes(';'), ';') +        self.assertEqual(remove_quotes('";'), '";') +        self.assertEqual(remove_quotes('""'), '') +        self.assertEqual(remove_quotes('";"'), ';') +      def test_ordered_set(self):          self.assertEqual(orderedSet([1, 1, 2, 3, 4, 4, 5, 6, 7, 3, 5]), [1, 2, 3, 4, 5, 6, 7])          self.assertEqual(orderedSet([]), []) @@ -202,8 +222,8 @@ class TestUtil(unittest.TestCase):          self.assertEqual(unescapeHTML('%20;'), '%20;')          self.assertEqual(unescapeHTML('/'), '/')          self.assertEqual(unescapeHTML('/'), '/') -        self.assertEqual( -            unescapeHTML('é'), 'é') +        self.assertEqual(unescapeHTML('é'), 'é') +        self.assertEqual(unescapeHTML('�'), '�')      def test_daterange(self):          _20century = DateRange("19000101", "20000101") @@ -228,6 +248,14 @@ class TestUtil(unittest.TestCase):              unified_strdate('2/2/2015 6:47:40 PM', day_first=False),              '20150202')          self.assertEqual(unified_strdate('25-09-2014'), '20140925') +        self.assertEqual(unified_strdate('UNKNOWN DATE FORMAT'), None) + +    def test_determine_ext(self): +        self.assertEqual(determine_ext('http://example.com/foo/bar.mp4/?download'), 'mp4') +        self.assertEqual(determine_ext('http://example.com/foo/bar/?download', None), None) +        self.assertEqual(determine_ext('http://example.com/foo/bar.nonext/?download', None), None) +        self.assertEqual(determine_ext('http://example.com/foo/bar/mp4?download', None), None) +        self.assertEqual(determine_ext('http://example.com/foo/bar.m3u8//?download'), 'm3u8')      def test_find_xpath_attr(self):          testxml = '''<root> @@ -235,12 +263,21 @@ class TestUtil(unittest.TestCase):              <node x="a"/>              <node x="a" y="c" />              <node x="b" y="d" /> +            <node x="" />          </root>''' -        doc = xml.etree.ElementTree.fromstring(testxml) +        doc = compat_etree_fromstring(testxml) +        self.assertEqual(find_xpath_attr(doc, './/fourohfour', 'n'), None)          self.assertEqual(find_xpath_attr(doc, './/fourohfour', 'n', 'v'), None) +        self.assertEqual(find_xpath_attr(doc, './/node', 'n'), None) +        self.assertEqual(find_xpath_attr(doc, './/node', 'n', 'v'), None) +        self.assertEqual(find_xpath_attr(doc, './/node', 'x'), doc[1])          self.assertEqual(find_xpath_attr(doc, './/node', 'x', 'a'), doc[1]) +        self.assertEqual(find_xpath_attr(doc, './/node', 'x', 'b'), doc[3]) +        self.assertEqual(find_xpath_attr(doc, './/node', 'y'), doc[2])          self.assertEqual(find_xpath_attr(doc, './/node', 'y', 'c'), doc[2]) +        self.assertEqual(find_xpath_attr(doc, './/node', 'y', 'd'), doc[3]) +        self.assertEqual(find_xpath_attr(doc, './/node', 'x', ''), doc[4])      def test_xpath_with_ns(self):          testxml = '''<root xmlns:media="http://example.com/"> @@ -249,23 +286,56 @@ class TestUtil(unittest.TestCase):                  <url>http://server.com/download.mp3</url>              </media:song>          </root>''' -        doc = xml.etree.ElementTree.fromstring(testxml) +        doc = compat_etree_fromstring(testxml)          find = lambda p: doc.find(xpath_with_ns(p, {'media': 'http://example.com/'}))          self.assertTrue(find('media:song') is not None)          self.assertEqual(find('media:song/media:author').text, 'The Author')          self.assertEqual(find('media:song/url').text, 'http://server.com/download.mp3') +    def test_xpath_element(self): +        doc = xml.etree.ElementTree.Element('root') +        div = xml.etree.ElementTree.SubElement(doc, 'div') +        p = xml.etree.ElementTree.SubElement(div, 'p') +        p.text = 'Foo' +        self.assertEqual(xpath_element(doc, 'div/p'), p) +        self.assertEqual(xpath_element(doc, ['div/p']), p) +        self.assertEqual(xpath_element(doc, ['div/bar', 'div/p']), p) +        self.assertEqual(xpath_element(doc, 'div/bar', default='default'), 'default') +        self.assertEqual(xpath_element(doc, ['div/bar'], default='default'), 'default') +        self.assertTrue(xpath_element(doc, 'div/bar') is None) +        self.assertTrue(xpath_element(doc, ['div/bar']) is None) +        self.assertTrue(xpath_element(doc, ['div/bar'], 'div/baz') is None) +        self.assertRaises(ExtractorError, xpath_element, doc, 'div/bar', fatal=True) +        self.assertRaises(ExtractorError, xpath_element, doc, ['div/bar'], fatal=True) +        self.assertRaises(ExtractorError, xpath_element, doc, ['div/bar', 'div/baz'], fatal=True) +      def test_xpath_text(self):          testxml = '''<root>              <div>                  <p>Foo</p>              </div>          </root>''' -        doc = xml.etree.ElementTree.fromstring(testxml) +        doc = compat_etree_fromstring(testxml)          self.assertEqual(xpath_text(doc, 'div/p'), 'Foo') +        self.assertEqual(xpath_text(doc, 'div/bar', default='default'), 'default')          self.assertTrue(xpath_text(doc, 'div/bar') is None)          self.assertRaises(ExtractorError, xpath_text, doc, 'div/bar', fatal=True) +    def test_xpath_attr(self): +        testxml = '''<root> +            <div> +                <p x="a">Foo</p> +            </div> +        </root>''' +        doc = compat_etree_fromstring(testxml) +        self.assertEqual(xpath_attr(doc, 'div/p', 'x'), 'a') +        self.assertEqual(xpath_attr(doc, 'div/bar', 'x'), None) +        self.assertEqual(xpath_attr(doc, 'div/p', 'y'), None) +        self.assertEqual(xpath_attr(doc, 'div/bar', 'x', default='default'), 'default') +        self.assertEqual(xpath_attr(doc, 'div/p', 'y', default='default'), 'default') +        self.assertRaises(ExtractorError, xpath_attr, doc, 'div/bar', 'x', fatal=True) +        self.assertRaises(ExtractorError, xpath_attr, doc, 'div/p', 'y', fatal=True) +      def test_smuggle_url(self):          data = {"ö": "ö", "abc": [3]}          url = 'https://foo.bar/baz?x=y#a' @@ -380,11 +450,17 @@ class TestUtil(unittest.TestCase):          data = urlencode_postdata({'username': 'foo@bar.com', 'password': '1234'})          self.assertTrue(isinstance(data, bytes)) +    def test_encode_compat_str(self): +        self.assertEqual(encode_compat_str(b'\xd1\x82\xd0\xb5\xd1\x81\xd1\x82', 'utf-8'), 'тест') +        self.assertEqual(encode_compat_str('тест', 'utf-8'), 'тест') +      def test_parse_iso8601(self):          self.assertEqual(parse_iso8601('2014-03-23T23:04:26+0100'), 1395612266)          self.assertEqual(parse_iso8601('2014-03-23T22:04:26+0000'), 1395612266)          self.assertEqual(parse_iso8601('2014-03-23T22:04:26Z'), 1395612266)          self.assertEqual(parse_iso8601('2014-03-23T22:04:26.1234Z'), 1395612266) +        self.assertEqual(parse_iso8601('2015-09-29T08:27:31.727'), 1443515251) +        self.assertEqual(parse_iso8601('2015-09-29T08-27-31.727'), None)      def test_strip_jsonp(self):          stripped = strip_jsonp('cb ([ {"id":"532cb",\n\n\n"x":\n3}\n]\n);') @@ -455,6 +531,9 @@ class TestUtil(unittest.TestCase):              "playlist":[{"controls":{"all":null}}]          }''') +        inp = '''"The CW\\'s \\'Crazy Ex-Girlfriend\\'"''' +        self.assertEqual(js_to_json(inp), '''"The CW's 'Crazy Ex-Girlfriend'"''') +          inp = '"SAND Number: SAND 2013-7800P\\nPresenter: Tom Russo\\nHabanero Software Training - Xyce Software\\nXyce, Sandia\\u0027s"'          json_code = js_to_json(inp)          self.assertEqual(json.loads(json_code), json.loads(inp)) @@ -587,12 +666,13 @@ ffmpeg version 2.4.4 Copyright (c) 2000-2014 the FFmpeg ...'''), '2.4.4')              {'like_count': 190, 'dislike_count': 10}))      def test_parse_dfxp_time_expr(self): -        self.assertEqual(parse_dfxp_time_expr(None), 0.0) -        self.assertEqual(parse_dfxp_time_expr(''), 0.0) +        self.assertEqual(parse_dfxp_time_expr(None), None) +        self.assertEqual(parse_dfxp_time_expr(''), None)          self.assertEqual(parse_dfxp_time_expr('0.1'), 0.1)          self.assertEqual(parse_dfxp_time_expr('0.1s'), 0.1)          self.assertEqual(parse_dfxp_time_expr('00:00:01'), 1.0)          self.assertEqual(parse_dfxp_time_expr('00:00:01.100'), 1.1) +        self.assertEqual(parse_dfxp_time_expr('00:00:01:100'), 1.1)      def test_dfxp2srt(self):          dfxp_data = '''<?xml version="1.0" encoding="UTF-8"?> @@ -602,6 +682,9 @@ ffmpeg version 2.4.4 Copyright (c) 2000-2014 the FFmpeg ...'''), '2.4.4')                      <p begin="0" end="1">The following line contains Chinese characters and special symbols</p>                      <p begin="1" end="2">第二行<br/>♪♪</p>                      <p begin="2" dur="1"><span>Third<br/>Line</span></p> +                    <p begin="3" end="-1">Lines with invalid timestamps are ignored</p> +                    <p begin="-1" end="-1">Ignore, two</p> +                    <p begin="3" dur="-1">Ignored, three</p>                  </div>              </body>              </tt>''' @@ -637,6 +720,51 @@ The first line  '''          self.assertEqual(dfxp2srt(dfxp_data_no_default_namespace), srt_data) +    def test_cli_option(self): +        self.assertEqual(cli_option({'proxy': '127.0.0.1:3128'}, '--proxy', 'proxy'), ['--proxy', '127.0.0.1:3128']) +        self.assertEqual(cli_option({'proxy': None}, '--proxy', 'proxy'), []) +        self.assertEqual(cli_option({}, '--proxy', 'proxy'), []) + +    def test_cli_valueless_option(self): +        self.assertEqual(cli_valueless_option( +            {'downloader': 'external'}, '--external-downloader', 'downloader', 'external'), ['--external-downloader']) +        self.assertEqual(cli_valueless_option( +            {'downloader': 'internal'}, '--external-downloader', 'downloader', 'external'), []) +        self.assertEqual(cli_valueless_option( +            {'nocheckcertificate': True}, '--no-check-certificate', 'nocheckcertificate'), ['--no-check-certificate']) +        self.assertEqual(cli_valueless_option( +            {'nocheckcertificate': False}, '--no-check-certificate', 'nocheckcertificate'), []) +        self.assertEqual(cli_valueless_option( +            {'checkcertificate': True}, '--no-check-certificate', 'checkcertificate', False), []) +        self.assertEqual(cli_valueless_option( +            {'checkcertificate': False}, '--no-check-certificate', 'checkcertificate', False), ['--no-check-certificate']) + +    def test_cli_bool_option(self): +        self.assertEqual( +            cli_bool_option( +                {'nocheckcertificate': True}, '--no-check-certificate', 'nocheckcertificate'), +            ['--no-check-certificate', 'true']) +        self.assertEqual( +            cli_bool_option( +                {'nocheckcertificate': True}, '--no-check-certificate', 'nocheckcertificate', separator='='), +            ['--no-check-certificate=true']) +        self.assertEqual( +            cli_bool_option( +                {'nocheckcertificate': True}, '--check-certificate', 'nocheckcertificate', 'false', 'true'), +            ['--check-certificate', 'false']) +        self.assertEqual( +            cli_bool_option( +                {'nocheckcertificate': True}, '--check-certificate', 'nocheckcertificate', 'false', 'true', '='), +            ['--check-certificate=false']) +        self.assertEqual( +            cli_bool_option( +                {'nocheckcertificate': False}, '--check-certificate', 'nocheckcertificate', 'false', 'true'), +            ['--check-certificate', 'true']) +        self.assertEqual( +            cli_bool_option( +                {'nocheckcertificate': False}, '--check-certificate', 'nocheckcertificate', 'false', 'true', '='), +            ['--check-certificate=true']) +  if __name__ == '__main__':      unittest.main() diff --git a/test/test_write_annotations.py b/test/test_write_annotations.py index 780636c77..84b8f39e0 100644 --- a/test/test_write_annotations.py +++ b/test/test_write_annotations.py @@ -33,7 +33,7 @@ params = get_params({  TEST_ID = 'gr51aVj-mLg' -ANNOTATIONS_FILE = TEST_ID + '.flv.annotations.xml' +ANNOTATIONS_FILE = TEST_ID + '.annotations.xml'  EXPECTED_ANNOTATIONS = ['Speech bubble', 'Note', 'Title', 'Spotlight', 'Label'] diff --git a/test/test_youtube_lists.py b/test/test_youtube_lists.py index c889b6f15..26aadb34f 100644 --- a/test/test_youtube_lists.py +++ b/test/test_youtube_lists.py @@ -57,5 +57,14 @@ class TestYoutubeLists(unittest.TestCase):          entries = result['entries']          self.assertEqual(len(entries), 100) +    def test_youtube_flat_playlist_titles(self): +        dl = FakeYDL() +        dl.params['extract_flat'] = True +        ie = YoutubePlaylistIE(dl) +        result = ie.extract('https://www.youtube.com/playlist?list=PLwiyx1dc3P2JR9N8gQaQN_BCvlSlap7re') +        self.assertIsPlaylist(result) +        for entry in result['entries']: +            self.assertTrue(entry.get('title')) +  if __name__ == '__main__':      unittest.main() | 
