2 from __future__ import unicode_literals
6 from .common import InfoExtractor
7 from ..compat import compat_str
19 class PeerTubeIE(InfoExtractor):
20 _INSTANCES_RE = r'''(?:
21 # Taken from https://instances.joinpeertube.org/instances
22 peertube\.rainbowswingers\.net|
26 videomensoif\.ynh\.fr|
27 peertube\.travelpandas\.eu|
28 peertube\.rachetjay\.fr|
29 peertube\.montecsys\.fr|
32 peertube\.umeahackerspace\.se|
34 video\.monsieurbidouille\.fr|
35 tube\.openalgeria\.org|
37 video\.anormallostpod\.ovh|
38 tube\.crapaud-fou\.org|
42 peertube\.snargol\.com|
47 peertube\.osureplayviewer\.xyz|
48 peertube\.mathieufamily\.ovh|
51 peertube\.fediverse\.ru|
52 peertube\.oiseauroch\.fr|
60 peertube\.chantierlibre\.org|
66 videos\.elbinario\.net|
72 peertube\.gnumeria\.eu\.org|
76 tube\.kalah-france\.org|
80 peertube\.hatthieves\.es|
81 video\.fitchfamily\.org|
86 peertube\.harmoniescreatives\.com|
89 video\.bruitbruit\.com|
90 peertube\.foxfam\.club|
93 peertube\.malbert\.xyz|
94 peertube\.bilange\.ca|
97 peertube\.fedilab\.app|
99 video\.mstddntfdn\.online|
101 peertube\.sl-network\.fr|
102 peertube\.dynlinux\.io|
103 peertube\.david\.durieux\.family|
104 peertube\.linuxrocks\.online|
106 v\.kretschmann\.social|
109 tube\.dragonpsi\.xyz|
110 peertube\.boneheadmedia\.com|
111 videos\.funkwhale\.audio|
113 peertube\.gcaillaut\.fr|
120 peertube\.simounet\.net|
124 peertube\.kerenon\.com|
126 tube\.calculate\.social|
127 peertube\.mckillop\.org|
128 tube\.netzspielplatz\.de|
132 peertube\.stephenson\.cc|
134 peertube\.kajalinifi\.de|
137 peertube\.ffs2play\.fr|
138 peertube\.leboulaire\.ovh|
139 peertube\.tronic-studio\.com|
140 peertube\.public\.cat|
141 peertube\.metalbanana\.net|
143 peertube\.alter-nativ-voll\.de|
145 tube\.worldofhauru\.xyz|
147 peertube\.teleassist\.fr|
150 media\.privacyinternational\.org|
152 video\.halle-leaks\.de|
153 video\.grosskopfgames\.de|
154 peertube\.schaeferit\.de|
155 peertube\.jackbot\.fr|
156 tube\.extinctionrebellion\.fr|
160 peertube\.zergy\.net|
161 peertube\.roflcopter\.fr|
162 peertube\.floss-marketing-school\.com|
164 peertube\.iriseden\.eu|
165 videos\.ubuntu-paris\.org|
166 peertube\.mastodon\.host|
168 peertube\.s2s\.video|
173 peertube\.normandie-libre\.fr|
175 video\.lacaveatonton\.ovh|
177 peertube\.servebeer\.com|
178 peertube\.fedi\.quebec|
183 tube\.unmondemeilleur\.eu|
190 video\.devinberg\.com|
192 peertube\.kosebamse\.com|
193 yunopeertube\.myddns\.me|
194 peertube\.varney\.fr|
195 peertube\.anon-kenkai\.com|
198 videos\.dinofly\.com|
202 video\.heromuster\.com|
203 video\.lemediatv\.fr|
208 pt\.laurentkruger\.fr|
209 video\.monarch-pass\.net|
210 peertube\.artica\.center|
211 video\.alternanet\.fr|
213 fanvid\.stopthatimp\.net|
218 peertube\.mablr\.org|
222 devtube\.dev-wiki\.de|
223 raptube\.antipub\.org|
225 peertube\.mygaia\.org|
227 peertube\.livingutopia\.org|
228 peertube\.the-penguin\.de|
229 tube\.thechangebook\.org|
233 mplayer\.demouliere\.eu|
236 peertube\.zapashcanon\.fr|
237 video\.latavernedejohnjohn\.fr|
238 peertube\.pcservice46\.fr|
239 peertube\.mazzonetto\.eu|
240 video\.irem\.univ-paris-diderot\.fr|
241 video\.livecchi\.cloud|
244 video\.cabane-libre\.org|
245 peertube\.openstreetmap\.fr|
246 videos\.alolise\.org|
252 peertube\.freeforge\.eu|
253 video\.arbitrarion\.com|
254 video\.datsemultimedia\.com|
256 peertube\.ricostrongxxx\.com|
257 docker\.videos\.lecygnenoir\.info|
258 peertube\.togart\.de|
259 tube\.postblue\.info|
260 videos\.domainepublic\.net|
261 peertube\.cyber-tribal\.com|
262 video\.gresille\.org|
263 peertube\.dsmouse\.net|
264 cinema\.yunohost\.support|
265 tube\.theocevaer\.fr|
269 peertube\.metawurst\.space|
272 video\.freeradical\.zone|
275 pt\.kircheneuenburg\.de|
278 videos\.side-ways\.net|
281 video\.taboulisme\.com|
285 video\.monsieur-a\.fr|
286 peertube\.librelois\.fr|
287 videos\.pair2jeux\.tube|
288 videos\.pueseso\.club|
289 peer\.mathdacloud\.ovh|
290 media\.assassinate-you\.net|
292 ptube\.rousset\.nom\.fr|
296 peertube\.makotoworkshop\.org|
297 peertube\.serveur\.slv-valbonne\.fr|
302 pire\.artisanlogiciel\.net|
303 videos\.numerique-en-commun\.fr|
305 video\.die-partei\.social|
307 peertube\.swarm\.solvingmaz\.es|
308 tube\.pericoloso\.ovh|
309 watching\.cypherpunk\.observer|
310 videos\.adhocmusic\.com|
312 peertube\.librelabucm\.org|
313 videos\.numericoop\.fr|
314 peertube\.koehn\.com|
315 peertube\.anarchmusicall\.net|
316 tube\.kampftoast\.de|
318 peertube\.xtenz\.xyz|
321 peertube\.nomagic\.uk|
323 videos\.koumoul\.com|
324 video\.rastapuls\.com|
325 video\.mantlepro\.com|
326 video\.deadsuperhero\.com|
327 peertube\.musicstudio\.pro|
328 peertube\.we-keys\.fr|
329 artitube\.artifaille\.fr|
330 peertube\.ethernia\.net|
334 peertube\.donnadieu\.fr|
335 argos\.aquilenet\.fr|
338 videos\.darckoune\.moe|
339 tube\.traydent\.info|
340 dev\.videos\.lecygnenoir\.info|
341 peertube\.nayya\.org|
343 peertube\.mofgao\.space|
344 video\.lequerrec\.eu|
345 peertube\.amicale\.net|
354 peertube\.heberge\.fr|
356 videos\.cloudfrancois\.fr|
365 videos\.lescommuns\.org|
369 peertube\.nogafa\.org|
370 megatube\.lilomoino\.fr|
371 peertube\.tamanoir\.foucry\.net|
372 peertube\.devosi\.org|
373 peertube\.1312\.media|
374 tube\.bootlicker\.party|
377 tube\.homecomputing\.fr|
378 tube\.ouahpiti\.info|
382 peertube\.gaialabs\.ch|
385 video\.migennes\.net|
388 videos\.iut-orsay\.fr|
389 peertube\.solidev\.net|
391 video\.passageenseine\.fr|
392 videos\.festivalparminous\.org|
393 peertube\.touhoppai\.moe|
395 peer\.hostux\.social|
397 peertube\.walkingmountains\.fr|
399 peertube\.parleur\.net|
400 peertube\.heraut\.eu|
402 peertube\.gegeweb\.eu|
405 tube\.conferences-gesticulees\.net|
406 peertube\.datagueule\.tv|
408 tube\.mochi\.academy|
410 video\.colibris-outilslibres\.org|
419 _UUID_RE = r'[\da-fA-F]{8}-[\da-fA-F]{4}-[\da-fA-F]{4}-[\da-fA-F]{4}-[\da-fA-F]{12}'
420 _API_BASE = 'https://%s/api/v1/videos/%s/%s'
421 _VALID_URL = r'''(?x)
423 peertube:(?P<host>[^:]+):|
424 https?://(?P<host_2>%s)/(?:videos/(?:watch|embed)|api/v\d/videos)/
427 ''' % (_INSTANCES_RE, _UUID_RE)
429 'url': 'https://framatube.org/videos/watch/9c9de5e8-0a1e-484a-b099-e80766180a6d',
430 'md5': '9bed8c0137913e17b86334e5885aacff',
432 'id': '9c9de5e8-0a1e-484a-b099-e80766180a6d',
434 'title': 'What is PeerTube?',
435 'description': 'md5:3fefb8dde2b189186ce0719fda6f7b10',
436 'thumbnail': r're:https?://.*\.(?:jpg|png)',
437 'timestamp': 1538391166,
438 'upload_date': '20181001',
439 'uploader': 'Framasoft',
441 'uploader_url': 'https://framatube.org/accounts/framasoft',
442 'channel': 'Les vidéos de Framasoft',
444 'channel_url': 'https://framatube.org/video-channels/bf54d359-cfad-4935-9d45-9d6be93f63e8',
446 'license': 'Attribution - Share Alike',
450 'dislike_count': int,
451 'tags': ['framasoft', 'peertube'],
452 'categories': ['Science & Technology'],
456 'url': 'peertube:spacepub.space:d8943b2d-8280-497b-85ec-bc282ec2afdc',
458 'id': 'd8943b2d-8280-497b-85ec-bc282ec2afdc',
460 'title': 'Dot matrix printer shell demo',
462 'timestamp': 1587401293,
463 'upload_date': '20200420',
464 'uploader': 'Drew DeVault',
467 'url': 'https://peertube.tamanoir.foucry.net/videos/watch/0b04f13d-1e18-4f1d-814e-4979aa7c9c44',
468 'only_matching': True,
471 'url': 'https://tube.22decembre.eu/videos/watch/9bb88cd3-9959-46d9-9ab9-33d2bb704c39',
472 'only_matching': True,
474 'url': 'https://tube.22decembre.eu/videos/embed/fed67262-6edb-4d1c-833b-daa9085c71d7',
475 'only_matching': True,
477 'url': 'https://tube.openalgeria.org/api/v1/videos/c1875674-97d0-4c94-a058-3f7e64c962e8',
478 'only_matching': True,
480 'url': 'peertube:video.blender.org:b37a5b9f-e6b5-415c-b700-04a5cd6ec205',
481 'only_matching': True,
485 def _extract_peertube_url(webpage, source_url):
487 r'https?://(?P<host>[^/]+)/videos/(?:watch|embed)/(?P<id>%s)'
488 % PeerTubeIE._UUID_RE, source_url)
489 if mobj and any(p in webpage for p in (
491 'There will be other non JS-based clients to access PeerTube',
492 '>We are sorry but it seems that PeerTube is not compatible with your web browser.<')):
493 return 'peertube:%s:%s' % mobj.group('host', 'id')
496 def _extract_urls(webpage, source_url):
497 entries = re.findall(
498 r'''(?x)<iframe[^>]+\bsrc=["\'](?P<url>(?:https?:)?//%s/videos/embed/%s)'''
499 % (PeerTubeIE._INSTANCES_RE, PeerTubeIE._UUID_RE), webpage)
501 peertube_url = PeerTubeIE._extract_peertube_url(webpage, source_url)
503 entries = [peertube_url]
506 def _call_api(self, host, video_id, path, note=None, errnote=None, fatal=True):
507 return self._download_json(
508 self._API_BASE % (host, video_id, path), video_id,
509 note=note, errnote=errnote, fatal=fatal)
511 def _get_subtitles(self, host, video_id):
512 captions = self._call_api(
513 host, video_id, 'captions', note='Downloading captions JSON',
515 if not isinstance(captions, dict):
517 data = captions.get('data')
518 if not isinstance(data, list):
522 language_id = try_get(e, lambda x: x['language']['id'], compat_str)
523 caption_url = urljoin('https://%s' % host, e.get('captionPath'))
526 subtitles.setdefault(language_id or 'en', []).append({
531 def _real_extract(self, url):
532 mobj = re.match(self._VALID_URL, url)
533 host = mobj.group('host') or mobj.group('host_2')
534 video_id = mobj.group('id')
536 video = self._call_api(
537 host, video_id, '', note='Downloading video JSON')
539 title = video['name']
542 files = video.get('files') or []
543 for playlist in (video.get('streamingPlaylists') or []):
544 if not isinstance(playlist, dict):
546 playlist_files = playlist.get('files')
547 if not (playlist_files and isinstance(playlist_files, list)):
549 files.extend(playlist_files)
551 if not isinstance(file_, dict):
553 file_url = url_or_none(file_.get('fileUrl'))
556 file_size = int_or_none(file_.get('size'))
558 file_, lambda x: x['resolution']['label'], compat_str)
559 f = parse_resolution(format_id)
562 'format_id': format_id,
563 'filesize': file_size,
565 if format_id == '0p':
568 f['fps'] = int_or_none(file_.get('fps'))
570 self._sort_formats(formats)
572 description = video.get('description')
573 if len(description) >= 250:
574 # description is shortened
575 full_description = self._call_api(
576 host, video_id, 'description', note='Downloading description JSON',
579 if isinstance(full_description, dict):
580 description = str_or_none(full_description.get('description')) or description
582 subtitles = self.extract_subtitles(host, video_id)
584 def data(section, field, type_):
585 return try_get(video, lambda x: x[section][field], type_)
587 def account_data(field, type_):
588 return data('account', field, type_)
590 def channel_data(field, type_):
591 return data('channel', field, type_)
593 category = data('category', 'label', compat_str)
594 categories = [category] if category else None
596 nsfw = video.get('nsfw')
598 age_limit = 18 if nsfw else 0
602 webpage_url = 'https://%s/videos/watch/%s' % (host, video_id)
607 'description': description,
608 'thumbnail': urljoin(webpage_url, video.get('thumbnailPath')),
609 'timestamp': unified_timestamp(video.get('publishedAt')),
610 'uploader': account_data('displayName', compat_str),
611 'uploader_id': str_or_none(account_data('id', int)),
612 'uploader_url': url_or_none(account_data('url', compat_str)),
613 'channel': channel_data('displayName', compat_str),
614 'channel_id': str_or_none(channel_data('id', int)),
615 'channel_url': url_or_none(channel_data('url', compat_str)),
616 'language': data('language', 'id', compat_str),
617 'license': data('licence', 'label', compat_str),
618 'duration': int_or_none(video.get('duration')),
619 'view_count': int_or_none(video.get('views')),
620 'like_count': int_or_none(video.get('likes')),
621 'dislike_count': int_or_none(video.get('dislikes')),
622 'age_limit': age_limit,
623 'tags': try_get(video, lambda x: x['tags'], list),
624 'categories': categories,
626 'subtitles': subtitles,
627 'webpage_url': webpage_url,