diff options
| author | Filippo Valsorda <filippo.valsorda@gmail.com> | 2012-10-28 22:47:02 +0100 | 
|---|---|---|
| committer | Filippo Valsorda <filippo.valsorda@gmail.com> | 2012-10-28 22:47:02 +0100 | 
| commit | 42cb53fcfa2e8bbc7a96bc1a0ad1e90c1917dccd (patch) | |
| tree | 39e1a4b11aeb7290f77103611dba0a6dc718a3f8 | |
| parent | fe4d68e1967cc39cc00a06c3e2e722d51b8e1419 (diff) | |
modified filename escaping to a "smarter" one
| -rw-r--r-- | test/test_utils.py | 10 | ||||
| -rw-r--r-- | youtube_dl/utils.py | 16 | 
2 files changed, 18 insertions, 8 deletions
| diff --git a/test/test_utils.py b/test/test_utils.py index eb0af703f..878840120 100644 --- a/test/test_utils.py +++ b/test/test_utils.py @@ -22,13 +22,13 @@ class TestUtil(unittest.TestCase):  		self.assertEqual(sanitize_filename(u'123'), u'123') -		self.assertEqual(u'abc_de', sanitize_filename(u'abc/de')) -		self.assertTrue(u'de' in sanitize_filename(u'abc/de')) +		self.assertEqual(u'abc-de', sanitize_filename(u'abc/de'))  		self.assertFalse(u'/' in sanitize_filename(u'abc/de///')) -		self.assertEqual(u'abc_de', sanitize_filename(u'abc\\de')) -		self.assertEqual(u'abc_de', sanitize_filename(u'abc\\de')) -		self.assertTrue(u'de' in  sanitize_filename(u'abc\\de')) +		self.assertEqual(u'abc-de', sanitize_filename(u'abc/<>\\*|de')) +		self.assertEqual(u'xxx', sanitize_filename(u'xxx/<>\\*|')) +		self.assertEqual(u'yes no', sanitize_filename(u'yes? no')) +		self.assertEqual(u'this - that', sanitize_filename(u'this: that'))  		self.assertEqual(sanitize_filename(u'ä'), u'ä')  		self.assertEqual(sanitize_filename(u'кириллица'), u'кириллица') diff --git a/youtube_dl/utils.py b/youtube_dl/utils.py index 839da17d0..a64937b4c 100644 --- a/youtube_dl/utils.py +++ b/youtube_dl/utils.py @@ -194,10 +194,20 @@ def timeconvert(timestr):  def sanitize_filename(s):  	"""Sanitizes a string so it could be used as part of a filename."""  	def replace_insane(char): -		if char in u' .\\/|?*<>:"' or ord(char) < 32: -			return '_' +		if char == '?' or ord(char) < 32 or ord(char) == 127: +			return '' +		elif char == '"': +			return '\'' +		elif char == ':': +			return ' -' +		elif char in '\\/|*<>': +			return '-'  		return char -	return u''.join(map(replace_insane, s)).strip('_') + +	result = u''.join(map(replace_insane, s)) +	while '--' in result: +		result = result.replace('--', '-') +	return result.strip('-')  def orderedSet(iterable):  	""" Remove all duplicates from the input iterable """ | 
