indavideo.py 2.9 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879
  1. # coding: utf-8
  2. from __future__ import unicode_literals
  3. from .. import utils
  4. from .common import InfoExtractor
  class IndavideoIE(InfoExtractor):
      """Extractor for video pages under ``indavideo.hu/video/``.

      The page itself only supplies the embed link; the actual metadata
      (title, media URL, thumbnails, tags, ...) is read from the JSON
      returned by the ``getVideoData`` player endpoint.
      """

      # The id group stops at the first '/', '#' or '?' so that a query string
      # or fragment appended to the page URL does not end up in the display id.
      _VALID_URL = r'https?://(?:www\.)?indavideo\.hu/video/(?P<id>[^/#?]+)'
      _TESTS = [
          {
              'url': 'http://indavideo.hu/video/Cicatanc',
              'md5': 'c8a507a1c7410685f83a06eaeeaafeab',
              'info_dict': {
                  'id': '1837039',
                  'title': 'Cicatánc',
                  'ext': 'mp4',
                  'display_id': 'Cicatanc',
                  # Raw string: '\.' is not a valid escape in a normal literal.
                  'thumbnail': r're:^https?://.*\.jpg$',
                  'description': '',
                  'uploader': 'cukiajanlo',
                  'uploader_id': '83729',
                  'duration': 72,
                  'age_limit': 0,
                  'tags': ['tánc', 'cica', 'cuki', 'cukiajanlo', 'newsroom'],
              },
          },
          {
              'url': 'http://indavideo.hu/video/Vicces_cica_1',
              'md5': '8c82244ba85d2a2310275b318eb51eac',
              'info_dict': {
                  'id': '1335611',
                  'title': 'Vicces cica',
                  'ext': 'mp4',
                  'display_id': 'Vicces_cica_1',
                  # Raw string: '\.' is not a valid escape in a normal literal.
                  'thumbnail': r're:^https?://.*\.jpg$',
                  'description': 'Játszik a tablettel. :D',
                  'uploader': 'Jet_Pack',
                  'uploader_id': '491217',
                  'duration': 7,
                  'age_limit': 0,
                  'tags': ['vicces', 'macska', 'cica', 'ügyes', 'nevetés', 'játszik', 'Cukiság', 'Jet_Pack'],
              },
          },
      ]

      def _real_extract(self, url):
          """Build the info dict for the video page at *url*.

          Steps:
            1. Download the page and read the ``<link rel="video_src">`` href.
            2. Use the last path segment of that href as the video hash.
            3. Fetch the JSON for that hash from the ``getVideoData`` endpoint
               and read its ``data`` object.

          ``title`` and ``video_file`` are read with subscripting and are
          therefore required in the response; all other fields are optional
          and come back as ``None`` when absent.
          """
          video_disp_id = self._match_id(url)
          webpage = self._download_webpage(url, video_disp_id)

          embed_url = self._html_search_regex(
              r'<link rel="video_src" href="(.+?)"/>', webpage, 'embed_url')
          # The hash identifying the video is the final path component.
          video_hash = embed_url.split('/')[-1]

          payload = self._download_json(
              'http://amfphp.indavideo.hu/SYm0json.php/player.playerHandler.getVideoData/' + video_hash,
              video_disp_id)
          video_info = payload['data']

          # Thumbnail entries are passed through _proto_relative_url before
          # being wrapped in the {'url': ...} form.
          thumbnails = video_info.get('thumbnails')
          if thumbnails:
              thumbnails = [{'url': self._proto_relative_url(x)} for x in thumbnails]

          # Each tag entry is an object; only its 'title' is kept.
          tags = video_info.get('tags')
          if tags:
              tags = [x['title'] for x in tags]

          return {
              'id': video_info.get('id'),
              'title': video_info['title'],
              'url': video_info['video_file'],
              'ext': 'mp4',
              'display_id': video_disp_id,
              'thumbnails': thumbnails,
              'description': video_info.get('description'),
              'uploader': video_info.get('user_name'),
              # TODO: upload date (it's in CET/CEST)
              'uploader_id': video_info.get('user_id'),
              'duration': utils.int_or_none(video_info.get('length')),
              'age_limit': utils.int_or_none(video_info.get('age_limit')),
              'tags': tags,
          }