adobepass.py 7.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177
  1. # -*- coding: utf-8 -*-
  2. from __future__ import unicode_literals
  3. import re
  4. import time
  5. import xml.etree.ElementTree as etree
  6. from .common import InfoExtractor
  7. from ..compat import compat_urlparse
  8. from ..utils import (
  9. unescapeHTML,
  10. urlencode_postdata,
  11. unified_timestamp,
  12. ExtractorError,
  13. )
  14. MSO_INFO = {
  15. 'DTV': {
  16. 'name': 'DirecTV',
  17. 'username_field': 'username',
  18. 'password_field': 'password',
  19. },
  20. 'Rogers': {
  21. 'name': 'Rogers Cable',
  22. 'username_field': 'UserName',
  23. 'password_field': 'UserPassword',
  24. },
  25. }
  26. class AdobePassIE(InfoExtractor):
  27. _SERVICE_PROVIDER_TEMPLATE = 'https://sp.auth.adobe.com/adobe-services/%s'
  28. _USER_AGENT = 'Mozilla/5.0 (X11; Linux i686; rv:47.0) Gecko/20100101 Firefox/47.0'
  29. @staticmethod
  30. def _get_mvpd_resource(provider_id, title, guid, rating):
  31. channel = etree.Element('channel')
  32. channel_title = etree.SubElement(channel, 'title')
  33. channel_title.text = provider_id
  34. item = etree.SubElement(channel, 'item')
  35. resource_title = etree.SubElement(item, 'title')
  36. resource_title.text = title
  37. resource_guid = etree.SubElement(item, 'guid')
  38. resource_guid.text = guid
  39. resource_rating = etree.SubElement(item, 'media:rating')
  40. resource_rating.attrib = {'scheme': 'urn:v-chip'}
  41. resource_rating.text = rating
  42. return '<rss version="2.0" xmlns:media="http://search.yahoo.com/mrss/">' + etree.tostring(channel).decode() + '</rss>'
  43. def _extract_mvpd_auth(self, url, video_id, requestor_id, resource):
  44. def xml_text(xml_str, tag):
  45. return self._search_regex(
  46. '<%s>(.+?)</%s>' % (tag, tag), xml_str, tag)
  47. def is_expired(token, date_ele):
  48. token_expires = unified_timestamp(re.sub(r'[_ ]GMT', '', xml_text(token, date_ele)))
  49. return token_expires and token_expires <= int(time.time())
  50. def post_form(form_page_res, note, data={}):
  51. form_page, urlh = form_page_res
  52. post_url = self._html_search_regex(r'<form[^>]+action=(["\'])(?P<url>.+?)\1', form_page, 'post url', group='url')
  53. if not re.match(r'https?://', post_url):
  54. post_url = compat_urlparse.urljoin(urlh.geturl(), post_url)
  55. form_data = self._hidden_inputs(form_page)
  56. form_data.update(data)
  57. return self._download_webpage_handle(
  58. post_url, video_id, note, data=urlencode_postdata(form_data), headers={
  59. 'Content-Type': 'application/x-www-form-urlencoded',
  60. })
  61. def raise_mvpd_required():
  62. raise ExtractorError(
  63. 'This video is only available for users of participating TV providers. '
  64. 'Use --ap-mso-id to specify Adobe Pass Multiple-system operator Identifier '
  65. 'and --netrc to provide account credentials.', expected=True)
  66. mvpd_headers = {
  67. 'ap_42': 'anonymous',
  68. 'ap_11': 'Linux i686',
  69. 'ap_z': self._USER_AGENT,
  70. 'User-Agent': self._USER_AGENT,
  71. }
  72. guid = xml_text(resource, 'guid')
  73. retries = self._downloader.params.get('ap_retries', 3)
  74. count = 0
  75. while count < retries:
  76. requestor_info = self._downloader.cache.load('mvpd', requestor_id) or {}
  77. authn_token = requestor_info.get('authn_token')
  78. if authn_token and is_expired(authn_token, 'simpleTokenExpires'):
  79. authn_token = None
  80. if not authn_token:
  81. # TODO add support for other TV Providers
  82. mso_id = self._downloader.params.get('ap_mso_id')
  83. if not mso_id:
  84. raise_mvpd_required()
  85. if mso_id not in MSO_INFO:
  86. raise ExtractorError(
  87. 'Unsupported TV Provider, use --list-ap-mso-ids to get a list of supported TV Providers' % mso_id, expected=True)
  88. username, password = self._get_login_info('ap_username', 'ap_password', mso_id)
  89. if not username or not password:
  90. raise_mvpd_required()
  91. mso_info = MSO_INFO[mso_id]
  92. provider_redirect_page_res = self._download_webpage_handle(
  93. self._SERVICE_PROVIDER_TEMPLATE % 'authenticate/saml', video_id,
  94. 'Downloading Provider Redirect Page', query={
  95. 'noflash': 'true',
  96. 'mso_id': mso_id,
  97. 'requestor_id': requestor_id,
  98. 'no_iframe': 'false',
  99. 'domain_name': 'adobe.com',
  100. 'redirect_url': url,
  101. })
  102. provider_login_page_res = post_form(
  103. provider_redirect_page_res, 'Downloading Provider Login Page')
  104. mvpd_confirm_page_res = post_form(provider_login_page_res, 'Logging in', {
  105. mso_info['username_field']: username,
  106. mso_info['password_field']: password,
  107. })
  108. if mso_id == 'DTV':
  109. post_form(mvpd_confirm_page_res, 'Confirming Login')
  110. session = self._download_webpage(
  111. self._SERVICE_PROVIDER_TEMPLATE % 'session', video_id,
  112. 'Retrieving Session', data=urlencode_postdata({
  113. '_method': 'GET',
  114. 'requestor_id': requestor_id,
  115. }), headers=mvpd_headers)
  116. if '<pendingLogout' in session:
  117. self._downloader.cache.store('mvpd', requestor_id, {})
  118. count += 1
  119. continue
  120. authn_token = unescapeHTML(xml_text(session, 'authnToken'))
  121. requestor_info['authn_token'] = authn_token
  122. self._downloader.cache.store('mvpd', requestor_id, requestor_info)
  123. authz_token = requestor_info.get(guid)
  124. if authz_token and is_expired(authz_token, 'simpleTokenTTL'):
  125. authz_token = None
  126. if not authz_token:
  127. authorize = self._download_webpage(
  128. self._SERVICE_PROVIDER_TEMPLATE % 'authorize', video_id,
  129. 'Retrieving Authorization Token', data=urlencode_postdata({
  130. 'resource_id': resource,
  131. 'requestor_id': requestor_id,
  132. 'authentication_token': authn_token,
  133. 'mso_id': xml_text(authn_token, 'simpleTokenMsoID'),
  134. 'userMeta': '1',
  135. }), headers=mvpd_headers)
  136. if '<pendingLogout' in authorize:
  137. self._downloader.cache.store('mvpd', requestor_id, {})
  138. count += 1
  139. continue
  140. authz_token = unescapeHTML(xml_text(authorize, 'authzToken'))
  141. requestor_info[guid] = authz_token
  142. self._downloader.cache.store('mvpd', requestor_id, requestor_info)
  143. mvpd_headers.update({
  144. 'ap_19': xml_text(authn_token, 'simpleSamlNameID'),
  145. 'ap_23': xml_text(authn_token, 'simpleSamlSessionIndex'),
  146. })
  147. short_authorize = self._download_webpage(
  148. self._SERVICE_PROVIDER_TEMPLATE % 'shortAuthorize',
  149. video_id, 'Retrieving Media Token', data=urlencode_postdata({
  150. 'authz_token': authz_token,
  151. 'requestor_id': requestor_id,
  152. 'session_guid': xml_text(authn_token, 'simpleTokenAuthenticationGuid'),
  153. 'hashed_guid': 'false',
  154. }), headers=mvpd_headers)
  155. if '<pendingLogout' in short_authorize:
  156. self._downloader.cache.store('mvpd', requestor_id, {})
  157. count += 1
  158. continue
  159. return short_authorize