americastestkitchen.py 3.3 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485
  1. # coding: utf-8
  2. from __future__ import unicode_literals
  3. import re
  4. from .common import InfoExtractor
  5. class AmericasTestKitchenIE(InfoExtractor):
  6. _VALID_URL = r'https?://(?:www\.)?americastestkitchen\.com/episode/(?P<id>\d+)'
  7. _TESTS = [{
  8. 'url':
  9. 'https://www.americastestkitchen.com/episode/548-summer-dinner-party',
  10. 'md5': 'b861c3e365ac38ad319cfd509c30577f',
  11. 'info_dict': {
  12. 'id': '1_5g5zua6e',
  13. 'title': 'atk_s17_e24.mp4',
  14. 'ext': 'mp4',
  15. 'description': '<p>Host Julia Collin Davison goes into the test kitchen with test cook Dan Souza to learn how to make the ultimate Grill-Roasted Beef Tenderloin. Next, equipment expert Adam Ried reviews gas grills in the Equipment Corner. Then, gadget guru Lisa McManus uncovers the best quirky gadgets. Finally, test cook Erin McMurrer shows host Bridget Lancaster how to make an elegant Pear-Walnut Upside-Down Cake.</p>',
  16. 'timestamp': 1497285541,
  17. 'upload_date': '20170612',
  18. 'uploader_id': 'roger.metcalf@americastestkitchen.com',
  19. 'release_date': '2017-06-17',
  20. 'thumbnail': 'http://d3cizcpymoenau.cloudfront.net/images/35973/e24-tenderloin-16.jpg',
  21. 'episode_number': 24,
  22. 'episode': 'Summer Dinner Party',
  23. 'episode_id': '548-summer-dinner-party',
  24. 'season_number': 17
  25. },
  26. 'params': {
  27. # m3u8 download
  28. 'skip_download': True,
  29. },
  30. }, {
  31. 'url':
  32. 'https://www.americastestkitchen.com/episode/546-a-spanish-affair',
  33. 'only_matching':
  34. True,
  35. }]
  36. def _real_extract(self, url):
  37. video_id = self._match_id(url)
  38. webpage = self._download_webpage(url, video_id)
  39. partner_id = self._search_regex(
  40. r'partner_id/(?P<partner_id>\d+)',
  41. webpage,
  42. 'partner_id',
  43. group='partner_id')
  44. video_data = self._parse_json(
  45. self._search_regex(
  46. r'window\.__INITIAL_STATE__\s*=\s*({.+?});\s*</script>',
  47. webpage, 'initial context'),
  48. video_id)
  49. episode_data = video_data['episodeDetail']['content']['data']
  50. episode_content_meta = episode_data['full_video']
  51. external_id = episode_content_meta['external_id']
  52. # photo data
  53. photo_data = episode_content_meta.get('photo')
  54. thumbnail = photo_data.get('image_url') if photo_data else None
  55. # meta
  56. release_date = episode_data.get('aired_at')
  57. description = episode_content_meta.get('description')
  58. episode_number = int(episode_content_meta.get('episode_number'))
  59. episode = episode_content_meta.get('title')
  60. episode_id = episode_content_meta.get('episode_slug')
  61. season_number = int(episode_content_meta.get('season_number'))
  62. return {
  63. '_type': 'url_transparent',
  64. 'url': 'kaltura:%s:%s' % (partner_id, external_id),
  65. 'ie_key': 'Kaltura',
  66. 'id': video_id,
  67. 'release_date': release_date,
  68. 'thumbnail': thumbnail,
  69. 'description': description,
  70. 'episode_number': episode_number,
  71. 'episode': episode,
  72. 'episode_id': episode_id,
  73. 'season_number': season_number
  74. }