cinetecamilano.py 2.4 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162
  1. import json
  2. import urllib.error
  3. from .common import InfoExtractor
  4. from ..utils import (
  5. ExtractorError,
  6. float_or_none,
  7. parse_iso8601,
  8. strip_or_none,
  9. traverse_obj,
  10. try_get,
  11. urljoin,
  12. )
  13. class CinetecaMilanoIE(InfoExtractor):
  14. _VALID_URL = r'https?://(?:www\.)?cinetecamilano\.it/film/(?P<id>\d+)'
  15. _TESTS = [{
  16. 'url': 'https://www.cinetecamilano.it/film/1942',
  17. 'info_dict': {
  18. 'id': '1942',
  19. 'ext': 'mp4',
  20. 'title': 'Il draghetto Gris\u00f9 (4 episodi)',
  21. 'release_date': '20220129',
  22. 'thumbnail': r're:.+\.png',
  23. 'description': 'md5:5328cbe080b93224712b6f17fcaf2c01',
  24. 'modified_date': '20200520',
  25. 'duration': 3139,
  26. 'release_timestamp': 1643446208,
  27. 'modified_timestamp': int
  28. }
  29. }]
  30. def _real_extract(self, url):
  31. video_id = self._match_id(url)
  32. try:
  33. film_json = self._download_json(
  34. f'https://www.cinetecamilano.it/api/catalogo/{video_id}/?',
  35. video_id, headers={
  36. 'Referer': url,
  37. 'Authorization': try_get(self._get_cookies('https://www.cinetecamilano.it'), lambda x: f'Bearer {x["cnt-token"].value}') or ''
  38. })
  39. except ExtractorError as e:
  40. if ((isinstance(e.cause, urllib.error.HTTPError) and e.cause.code == 500)
  41. or isinstance(e.cause, json.JSONDecodeError)):
  42. self.raise_login_required(method='cookies')
  43. raise
  44. if not film_json.get('success') or not film_json.get('archive'):
  45. raise ExtractorError('Video information not found')
  46. archive = film_json['archive']
  47. return {
  48. 'id': video_id,
  49. 'title': archive.get('title'),
  50. 'description': strip_or_none(archive.get('description')),
  51. 'duration': float_or_none(archive.get('duration'), invscale=60),
  52. 'release_timestamp': parse_iso8601(archive.get('updated_at'), delimiter=' '),
  53. 'modified_timestamp': parse_iso8601(archive.get('created_at'), delimiter=' '),
  54. 'thumbnail': urljoin(url, try_get(archive, lambda x: x['thumb']['src'].replace('/public/', '/storage/'))),
  55. 'formats': self._extract_m3u8_formats(
  56. urljoin(url, traverse_obj(archive, ('drm', 'hls'))), video_id, 'mp4')
  57. }