logo

oasis-root

Compiled tree of Oasis Linux, based on the maintainer's own branch at <https://hacktivis.me/git/oasis/>.

git clone https://anongit.hacktivis.me/git/oasis-root.git

mediaklikk.py (7514B)


  1. import urllib.parse
  2. from .common import InfoExtractor
  3. from ..utils import (
  4. ExtractorError,
  5. traverse_obj,
  6. unified_strdate,
  7. url_or_none,
  8. )
  9. class MediaKlikkIE(InfoExtractor):
  10. _VALID_URL = r'''(?x)https?://(?:www\.)?
  11. (?:mediaklikk|m4sport|hirado|petofilive)\.hu/.*?(?:videok?|cikk)/
  12. (?:(?P<year>[0-9]{4})/(?P<month>[0-9]{1,2})/(?P<day>[0-9]{1,2})/)?
  13. (?P<id>[^/#?_]+)'''
  14. _TESTS = [{
  15. 'url': 'https://mediaklikk.hu/filmajanlo/cikk/az-ajto/',
  16. 'info_dict': {
  17. 'id': '668177',
  18. 'title': 'Az ajtó',
  19. 'display_id': 'az-ajto',
  20. 'ext': 'mp4',
  21. 'thumbnail': 'https://cdn.cms.mtv.hu/wp-content/uploads/sites/4/2016/01/vlcsnap-2023-07-31-14h18m52s111.jpg',
  22. },
  23. }, {
  24. # (old) mediaklikk. date in html.
  25. 'url': 'https://mediaklikk.hu/video/hazajaro-delnyugat-bacska-a-duna-menten-palankatol-doroszloig/',
  26. 'info_dict': {
  27. 'id': '4754129',
  28. 'title': 'Hazajáró, DÉLNYUGAT-BÁCSKA – A Duna mentén Palánkától Doroszlóig',
  29. 'ext': 'mp4',
  30. 'upload_date': '20210901',
  31. 'thumbnail': 'http://mediaklikk.hu/wp-content/uploads/sites/4/2014/02/hazajarouj_JO.jpg',
  32. },
  33. 'skip': 'Webpage redirects to 404 page',
  34. }, {
  35. # mediaklikk. date in html.
  36. 'url': 'https://mediaklikk.hu/video/hazajaro-fabova-hegyseg-kishont-koronaja/',
  37. 'info_dict': {
  38. 'id': '6696133',
  39. 'title': 'Hazajáró, Fabova-hegység - Kishont koronája',
  40. 'display_id': 'hazajaro-fabova-hegyseg-kishont-koronaja',
  41. 'ext': 'mp4',
  42. 'upload_date': '20230903',
  43. 'thumbnail': 'https://mediaklikk.hu/wp-content/uploads/sites/4/2014/02/hazajarouj_JO.jpg',
  44. },
  45. 'skip': 'Webpage redirects to 404 page',
  46. }, {
  47. # (old) m4sport
  48. 'url': 'https://m4sport.hu/video/2021/08/30/gyemant-liga-parizs/',
  49. 'info_dict': {
  50. 'id': '4754999',
  51. 'title': 'Gyémánt Liga, Párizs',
  52. 'ext': 'mp4',
  53. 'upload_date': '20210830',
  54. 'thumbnail': 'http://m4sport.hu/wp-content/uploads/sites/4/2021/08/vlcsnap-2021-08-30-18h21m20s10-1024x576.jpg',
  55. },
  56. 'skip': 'Webpage redirects to 404 page',
  57. }, {
  58. # m4sport
  59. 'url': 'https://m4sport.hu/sportkozvetitesek/video/2023/09/08/atletika-gyemant-liga-brusszel/',
  60. 'info_dict': {
  61. 'id': '6711136',
  62. 'title': 'Atlétika – Gyémánt Liga, Brüsszel',
  63. 'display_id': 'atletika-gyemant-liga-brusszel',
  64. 'ext': 'mp4',
  65. 'upload_date': '20230908',
  66. 'thumbnail': 'https://m4sport.hu/wp-content/uploads/sites/4/2023/09/vlcsnap-2023-09-08-22h43m18s691.jpg',
  67. },
  68. 'skip': 'Webpage redirects to 404 page',
  69. }, {
  70. # m4sport with *video/ url and no date
  71. 'url': 'https://m4sport.hu/bl-video/real-madrid-chelsea-1-1/',
  72. 'info_dict': {
  73. 'id': '4492099',
  74. 'title': 'Real Madrid - Chelsea 1-1',
  75. 'display_id': 'real-madrid-chelsea-1-1',
  76. 'ext': 'mp4',
  77. 'thumbnail': 'https://m4sport.hu/wp-content/uploads/sites/4/2021/04/Sequence-01.Still001-1024x576.png',
  78. },
  79. 'skip': 'Webpage redirects to 404 page',
  80. }, {
  81. # (old) hirado
  82. 'url': 'https://hirado.hu/videok/felteteleket-szabott-a-fovaros/',
  83. 'info_dict': {
  84. 'id': '4760120',
  85. 'title': 'Feltételeket szabott a főváros',
  86. 'ext': 'mp4',
  87. 'thumbnail': 'http://hirado.hu/wp-content/uploads/sites/4/2021/09/vlcsnap-2021-09-01-20h20m37s165.jpg',
  88. },
  89. 'skip': 'Webpage redirects to video list page',
  90. }, {
  91. # hirado
  92. 'url': 'https://hirado.hu/belfold/video/2023/09/11/marad-az-eves-elszamolas-a-napelemekre-beruhazo-csaladoknal',
  93. 'info_dict': {
  94. 'id': '6716068',
  95. 'title': 'Marad az éves elszámolás a napelemekre beruházó családoknál',
  96. 'display_id': 'marad-az-eves-elszamolas-a-napelemekre-beruhazo-csaladoknal',
  97. 'ext': 'mp4',
  98. 'upload_date': '20230911',
  99. 'thumbnail': 'https://hirado.hu/wp-content/uploads/sites/4/2023/09/vlcsnap-2023-09-11-09h16m09s882.jpg',
  100. },
  101. 'skip': 'Webpage redirects to video list page',
  102. }, {
  103. # (old) petofilive
  104. 'url': 'https://petofilive.hu/video/2021/06/07/tha-shudras-az-akusztikban/',
  105. 'info_dict': {
  106. 'id': '4571948',
  107. 'title': 'Tha Shudras az Akusztikban',
  108. 'ext': 'mp4',
  109. 'upload_date': '20210607',
  110. 'thumbnail': 'http://petofilive.hu/wp-content/uploads/sites/4/2021/06/vlcsnap-2021-06-07-22h14m23s915-1024x576.jpg',
  111. },
  112. 'skip': 'Webpage redirects to empty page',
  113. }, {
  114. # petofilive
  115. 'url': 'https://petofilive.hu/video/2023/09/09/futball-fesztival-a-margitszigeten/',
  116. 'info_dict': {
  117. 'id': '6713233',
  118. 'title': 'Futball Fesztivál a Margitszigeten',
  119. 'display_id': 'futball-fesztival-a-margitszigeten',
  120. 'ext': 'mp4',
  121. 'upload_date': '20230909',
  122. 'thumbnail': 'https://petofilive.hu/wp-content/uploads/sites/4/2023/09/Clipboard11-2.jpg',
  123. },
  124. 'skip': 'Webpage redirects to video list page',
  125. }]
  126. def _real_extract(self, url):
  127. mobj = self._match_valid_url(url)
  128. display_id = mobj.group('id')
  129. webpage = self._download_webpage(url, display_id)
  130. player_data_str = self._html_search_regex(
  131. r'mtva_player_manager\.player\(document.getElementById\(.*\),\s?(\{.*\}).*\);', webpage, 'player data')
  132. player_data = self._parse_json(player_data_str, display_id, urllib.parse.unquote)
  133. video_id = str(player_data['contentId'])
  134. title = player_data.get('title') or self._og_search_title(webpage, fatal=False) or \
  135. self._html_search_regex(r'<h\d+\b[^>]+\bclass="article_title">([^<]+)<', webpage, 'title')
  136. upload_date = unified_strdate(
  137. '{}-{}-{}'.format(mobj.group('year'), mobj.group('month'), mobj.group('day')))
  138. if not upload_date:
  139. upload_date = unified_strdate(self._html_search_regex(
  140. r'<p+\b[^>]+\bclass="article_date">([^<]+)<', webpage, 'upload date', default=None))
  141. player_data['video'] = player_data.pop('token')
  142. player_page = self._download_webpage(
  143. 'https://player.mediaklikk.hu/playernew/player.php', video_id,
  144. query=player_data, headers={'Referer': url})
  145. player_json = self._search_json(
  146. r'\bpl\.setup\s*\(', player_page, 'player json', video_id, end_pattern=r'\);')
  147. playlist_url = traverse_obj(
  148. player_json, ('playlist', lambda _, v: v['type'] == 'hls', 'file', {url_or_none}), get_all=False)
  149. if not playlist_url:
  150. raise ExtractorError('Unable to extract playlist url')
  151. formats, subtitles = self._extract_m3u8_formats_and_subtitles(playlist_url, video_id)
  152. return {
  153. 'id': video_id,
  154. 'title': title,
  155. 'display_id': display_id,
  156. 'formats': formats,
  157. 'subtitles': subtitles,
  158. 'upload_date': upload_date,
  159. 'thumbnail': player_data.get('bgImage') or self._og_search_thumbnail(webpage),
  160. }