sportdeutschland.py 2.9 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182
  1. # coding: utf-8
  2. from __future__ import unicode_literals
  3. import re
  4. from .common import InfoExtractor
  5. from ..utils import (
  6. parse_iso8601,
  7. sanitized_Request,
  8. )
  9. class SportDeutschlandIE(InfoExtractor):
  10. _VALID_URL = r'https?://sportdeutschland\.tv/(?P<sport>[^/?#]+)/(?P<id>[^?#/]+)(?:$|[?#])'
  11. _TESTS = [{
  12. 'url': 'https://sportdeutschland.tv/badminton/re-live-deutsche-meisterschaften-2020-halbfinals?playlistId=0',
  13. 'info_dict': {
  14. 'id': 're-live-deutsche-meisterschaften-2020-halbfinals',
  15. 'ext': 'mp4',
  16. 'title': 're:Re-live: Deutsche Meisterschaften 2020.*Halbfinals',
  17. 'categories': ['Badminton-Deutschland'],
  18. 'view_count': int,
  19. 'thumbnail': r're:^https?://.*\.(?:jpg|png)$',
  20. 'timestamp': int,
  21. 'upload_date': '20200201',
  22. 'description': 're:.*', # meaningless description for THIS video
  23. },
  24. }]
  25. def _real_extract(self, url):
  26. mobj = re.match(self._VALID_URL, url)
  27. video_id = mobj.group('id')
  28. sport_id = mobj.group('sport')
  29. api_url = 'https://proxy.vidibusdynamic.net/ssl/backend.sportdeutschland.tv/api/permalinks/%s/%s?access_token=true' % (
  30. sport_id, video_id)
  31. req = sanitized_Request(api_url, headers={
  32. 'Accept': 'application/vnd.vidibus.v2.html+json',
  33. 'Referer': url,
  34. })
  35. data = self._download_json(req, video_id)
  36. asset = data['asset']
  37. categories = [data['section']['title']]
  38. formats = []
  39. smil_url = asset['video']
  40. if '.smil' in smil_url:
  41. m3u8_url = smil_url.replace('.smil', '.m3u8')
  42. formats.extend(
  43. self._extract_m3u8_formats(m3u8_url, video_id, ext='mp4'))
  44. smil_doc = self._download_xml(
  45. smil_url, video_id, note='Downloading SMIL metadata')
  46. base_url_el = smil_doc.find('./head/meta')
  47. if base_url_el:
  48. base_url = base_url_el.attrib['base']
  49. formats.extend([{
  50. 'format_id': 'rmtp',
  51. 'url': base_url if base_url_el else n.attrib['src'],
  52. 'play_path': n.attrib['src'],
  53. 'ext': 'flv',
  54. 'preference': -100,
  55. 'format_note': 'Seems to fail at example stream',
  56. } for n in smil_doc.findall('./body/video')])
  57. else:
  58. formats.append({'url': smil_url})
  59. self._sort_formats(formats)
  60. return {
  61. 'id': video_id,
  62. 'formats': formats,
  63. 'title': asset['title'],
  64. 'thumbnail': asset.get('image'),
  65. 'description': asset.get('teaser'),
  66. 'duration': asset.get('duration'),
  67. 'categories': categories,
  68. 'view_count': asset.get('views'),
  69. 'rtmp_live': asset.get('live'),
  70. 'timestamp': parse_iso8601(asset.get('date')),
  71. }