about summary refs log tree commit diff
diff options
context:
space:
mode:
author mars67857 <mars67857@yahoo.com> 2017-10-14 22:09:44 -0700
committer Sergey M․ <dstftw@gmail.com> 2018-05-26 21:25:21 +0700
commit 2a49d01992e0b4b87d78da8f83af2f6e57fb8ba8 (patch)
tree f7522e95fe480249e0cd872edf18d3caee53bd6b
parent 261f47306c594614edb8a5f0b8f5f3b8a87ce9c0 (diff)
download youtube-dl-2a49d01992e0b4b87d78da8f83af2f6e57fb8ba8.tar.xz
[cammodels] Add extractor
-rw-r--r-- youtube_dl/extractor/cammodels.py 93
-rw-r--r-- youtube_dl/extractor/extractors.py 1
2 files changed, 94 insertions, 0 deletions
diff --git a/youtube_dl/extractor/cammodels.py b/youtube_dl/extractor/cammodels.py
new file mode 100644
index 000000000..1711d7096
--- /dev/null
+++ b/youtube_dl/extractor/cammodels.py
@@ -0,0 +1,93 @@
+from __future__ import unicode_literals
+from .common import InfoExtractor
+from .common import ExtractorError
+import json
+import re
+from ..utils import int_or_none
+
+
+class CamModelsIE(InfoExtractor):
+    """Extractor for live cam streams hosted on cammodels.com."""
+
+    _VALID_URL = r'https?://(?:www\.)?cammodels\.com/cam/(?P<id>\w+)'
+    # The server does not return links to the video URLs unless the request
+    # carries a browser-like User-Agent.
+    _HEADERS = {
+        'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.2704.103 Safari/537.36'
+    }
+
+    def _real_extract(self, url):
+        """Return the info dict for the live room addressed by ``url``.
+
+        Raises ExtractorError when the room is offline, in a private show,
+        or when no stream link can be found.
+        """
+        video_id = self._match_id(url)
+        webpage = self._download_webpage(url, video_id, headers=self._HEADERS)
+        manifest_url_root = self._html_search_regex(
+            r'manifestUrlRoot=(?P<id>https?:\/\/(www\.)?[-a-zA-Z0-9@:%._\+~#=]{2,256}\.[a-z]{2,6}\b([-a-zA-Z0-9@:%_\+.~#?&//=]*))',
+            webpage, 'manifest', default=None, fatal=False)
+        if not manifest_url_root:
+            offline = self._html_search_regex(
+                r'(?P<id>I\'m offline, but let\'s stay connected!)',
+                webpage, 'offline indicator', default=None, fatal=False)
+            private = self._html_search_regex(
+                # \u2019 escape keeps this source file pure ASCII.
+                '(?P<id>I\u2019m in a private show right now)',
+                webpage, 'private show indicator', default=None, fatal=False)
+            if offline:
+                err = 'This user is currently offline, so nothing can be downloaded.'
+            elif private:
+                err = 'This user is doing a private show, which requires payment. This extractor currently does not support private streams.'
+            else:
+                err = 'Unable to find link to stream info on webpage. Room is not offline, so something else is wrong.'
+            # Offline/private rooms are ordinary conditions, not extractor bugs.
+            raise ExtractorError(
+                err, expected=bool(offline or private), video_id=video_id)
+        # The manifest for a room is served at <root><room id>.json.
+        manifest = self._download_json(
+            manifest_url_root + video_id + '.json', video_id,
+            'Downloading links to streams.',
+            'Link to stream URLs was found, but we couldn\'t access it.',
+            headers=self._HEADERS)
+        formats = []
+        # Preferred path: structured per-protocol lists of encodings.
+        try:
+            for fmt_name in ('mp4-rtmp', 'mp4-hls'):
+                for encoding in manifest['formats'][fmt_name]['encodings']:
+                    width = encoding.get('videoWidth')
+                    formats.append({
+                        'ext': 'mp4',
+                        'url': encoding['location'],
+                        'width': int_or_none(width),
+                        'height': int_or_none(encoding.get('videoHeight')),
+                        'vbr': int_or_none(encoding.get('videoKbps')),
+                        'abr': int_or_none(encoding.get('audioKbps')),
+                        # Avoid ids such as "mp4-rtmpNone" when width is absent.
+                        'format_id': fmt_name if width is None else '%s%s' % (fmt_name, width),
+                    })
+        except (KeyError, TypeError, AttributeError):
+            # The JSON layout is not what we expect: fall back to scraping
+            # RTMP(S) links from the raw manifest. The matches are collected
+            # eagerly because a bare finditer() iterator is always truthy.
+            stream_urls = [mobj.group('id') for mobj in re.finditer(
+                r'(?P<id>rtmps?:\/\/[-a-zA-Z0-9@:%._\+~#=]{2,256}\.[a-z]{2,6}\b([-a-zA-Z0-9@:%_\+.~#&//=]*))',
+                json.dumps(manifest))]
+            if not stream_urls:
+                raise ExtractorError(
+                    'Link to stream info was found, but we couldn\'t read the response. This is probably a bug.',
+                    expected=False, video_id=video_id)
+            formats = [{
+                'ext': 'mp4',
+                'url': stream_url,
+                # Positional separator: Python 2 split() rejects keyword args.
+                'format_id': stream_url.split('/')[-1],
+            } for stream_url in stream_urls]
+        self._sort_formats(formats)
+        return {
+            'id': video_id,
+            'title': self._live_title(video_id),
+            # Rooms are live broadcasts (the title comes from _live_title).
+            'is_live': True,
+            'formats': formats,
+        }
diff --git a/youtube_dl/extractor/extractors.py b/youtube_dl/extractor/extractors.py
index c9b49a0cd..d54e8df9f 100644
--- a/youtube_dl/extractor/extractors.py
+++ b/youtube_dl/extractor/extractors.py
@@ -145,6 +145,7 @@ from .camdemy import (
CamdemyIE,
CamdemyFolderIE
)
+from .cammodels import CamModelsIE
from .camwithher import CamWithHerIE
from .canalplus import CanalplusIE
from .canalc2 import Canalc2IE