amp.py 3.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384
  1. # coding: utf-8
  2. from __future__ import unicode_literals
  3. from .common import InfoExtractor
  4. from ..utils import (
  5. int_or_none,
  6. parse_iso8601,
  7. )
  8. class AMPIE(InfoExtractor):
  9. def _get_media_node(self, item, name, default=None):
  10. media_name = 'media-%s' % name
  11. media_group = item.get('media-group') or item
  12. return media_group.get(media_name) or item.get(media_name) or item.get(name, default)
  13. # parse Akamai Adaptive Media Player feed
  14. def _extract_feed_info(self, url):
  15. item = self._download_json(
  16. url, None,
  17. 'Downloading Akamai AMP feed',
  18. 'Unable to download Akamai AMP feed'
  19. )['channel']['item']
  20. video_id = item['guid']
  21. thumbnails = []
  22. media_thumbnail = self._get_media_node(item, 'thumbnail')
  23. if media_thumbnail:
  24. if isinstance(media_thumbnail, dict):
  25. media_thumbnail = [media_thumbnail]
  26. for thumbnail_data in media_thumbnail:
  27. thumbnail = thumbnail_data['@attributes']
  28. thumbnails.append({
  29. 'url': self._proto_relative_url(thumbnail['url'], 'http:'),
  30. 'width': int_or_none(thumbnail.get('width')),
  31. 'height': int_or_none(thumbnail.get('height')),
  32. })
  33. subtitles = {}
  34. media_subtitle = self._get_media_node(item, 'subTitle')
  35. if media_subtitle:
  36. if isinstance(media_subtitle, dict):
  37. media_subtitle = [media_subtitle]
  38. for subtitle_data in media_subtitle:
  39. subtitle = subtitle_data['@attributes']
  40. lang = subtitle.get('lang') or 'en'
  41. subtitles[lang] = [{'url': subtitle['href']}]
  42. formats = []
  43. media_content = self._get_media_node(item, 'content')
  44. if isinstance(media_content, dict):
  45. media_content = [media_content]
  46. for media_data in media_content:
  47. media = media_data['@attributes']
  48. media_type = media['type']
  49. if media_type == 'video/f4m':
  50. f4m_formats = self._extract_f4m_formats(media['url'] + '?hdcore=3.4.0&plugin=aasp-3.4.0.132.124', video_id, f4m_id='hds', fatal=False)
  51. if f4m_formats:
  52. formats.extend(f4m_formats)
  53. elif media_type == 'application/x-mpegURL':
  54. m3u8_formats = self._extract_m3u8_formats(media['url'], video_id, m3u8_id='hls', fatal=False)
  55. if m3u8_formats:
  56. formats.extend(m3u8_formats)
  57. else:
  58. formats.append({
  59. 'format_id': media_data['media-category']['@attributes']['label'],
  60. 'url': media['url'],
  61. 'preference': 1,
  62. 'vbr': int_or_none(media.get('bitrate')),
  63. 'filesize': int_or_none(media.get('fileSize')),
  64. })
  65. self._sort_formats(formats)
  66. return {
  67. 'id': video_id,
  68. 'title': self._get_media_node(item, 'title'),
  69. 'description': self._get_media_node(item, 'description'),
  70. 'thumbnails': thumbnails,
  71. 'timestamp': parse_iso8601(item.get('pubDate'), ' '),
  72. 'duration': int_or_none(media_content[0].get('@attributes', {}).get('duration')),
  73. 'formats': formats,
  74. }