2024-12-14 22:31:47 -06:00
|
|
|
import enum
|
|
|
|
import functools
|
|
|
|
import re
|
|
|
|
import time
|
|
|
|
|
|
|
|
from .common import InfoExtractor
|
2024-12-14 23:13:44 -06:00
|
|
|
from ..utils import ExtractorError
|
2024-12-14 22:31:47 -06:00
|
|
|
|
|
|
|
|
|
|
|
class EventStatus(enum.Enum):
    """Lifecycle phase of an event relative to the current time."""

    # The explicit values are the ones enum.auto() assigns (1, 2, 3, ...),
    # so lookups by value stay unchanged.
    NOT_STARTED = 1  # current time is before the start of the event
    STARTED = 2      # the event is currently running
    REPLAY = 3       # the event is over but still inside its replay window
    ENDED = 4        # the event is over and no replay is available
    UNKNOWN = 5      # the phase could not be determined
|
|
|
|
|
|
|
|
|
|
|
|
class PeatixIE(InfoExtractor):
    """Extractor for the HLS stream (live or replay) of a peatix.com event."""

    IE_NAME = 'peatix.com'

    # `root_url` captures scheme + host so follow-up requests reuse them;
    # `id` is the numeric event id.
    _VALID_URL = r'(?P<root_url>https?://peatix\.com)/event/(?P<id>[0-9]+)'

    def _extract_var(self, variable, html):
        """Return the raw initializer of a JavaScript variable declared in `html`.

        Looks for a `var`/`let`/`const` declaration of `variable` and returns
        the source text between the `=` and the next `;`. The text is not
        evaluated, so callers receive e.g. the literal `parseInt("1")`.

        NOTE(review): the lookup goes through `self._search_regex` without a
        default, so a missing variable presumably raises - confirm against
        InfoExtractor.
        """
        return self._search_regex(
            rf'(?:var|let|const)\s+{variable}\s*=\s*(?P<value>([^;]+))\s*;?',
            html, f'variable {variable}', group='value')

    def get_event_status(self, broadcast_info, webpage):
        """Classify the event as not started, started, replayable or ended.

        @param broadcast_info   Mapping with the keys `go_live_epoch`,
                                `event_start_epoch`, `end_live_epoch` and
                                `event_end_epoch`; the values are divided by
                                1000 and compared with `time.time()`, i.e.
                                they are treated as epoch milliseconds.
        @param webpage          HTML that declares the JavaScript variables
                                `replay_enabled` and `replay_period_hr`.
        @returns                An EventStatus member. EventStatus.UNKNOWN is
                                returned when `broadcast_info` is not a
                                mapping or one of the timestamps is missing
                                or not a number.
        """
        if not isinstance(broadcast_info, dict):
            return EventStatus.UNKNOWN

        epochs = []
        for key in ('go_live_epoch', 'event_start_epoch', 'end_live_epoch', 'event_end_epoch'):
            millis = broadcast_info.get(key)
            # A missing/null timestamp cannot be compared; report UNKNOWN
            # instead of failing with a TypeError on the division below.
            if isinstance(millis, bool) or not isinstance(millis, (int, float)):
                return EventStatus.UNKNOWN
            epochs.append(millis / 1000)
        go_live_epoch, event_start_epoch, end_live_epoch, event_end_epoch = epochs

        now = int(time.time())

        if now < go_live_epoch or now < event_start_epoch:
            return EventStatus.NOT_STARTED

        if now > end_live_epoch or now > event_end_epoch:
            if self._extract_var('replay_enabled', webpage) == 'parseInt("1")':
                # Every integer found in the initializer is multiplied
                # together to obtain the replay period in hours.
                factors = re.findall(r'(\d+)', self._extract_var('replay_period_hr', webpage))
                # Without any number there is no usable replay window
                # (reduce() on an empty sequence would raise TypeError).
                if factors:
                    replay_hours = functools.reduce(lambda x, y: x * y, map(int, factors))
                    if now < event_end_epoch + replay_hours * 3600:
                        return EventStatus.REPLAY
            return EventStatus.ENDED

        if (now >= go_live_epoch or now >= event_start_epoch) and (now <= end_live_epoch or now <= event_end_epoch):
            return EventStatus.STARTED

        # Only reachable when the comparisons above are inconsistent
        # (e.g. NaN timestamps).
        return EventStatus.UNKNOWN

    def _real_extract(self, url):
        """Build the info dict for the event addressed by `url`.

        Downloads the event page (metadata), the broadcast information and
        the player page (event status), then the HLS manifest matching the
        status. Raises ExtractorError when the event has not started, has
        ended without replay, or its status cannot be determined.
        """
        video_id, root_url = self._match_valid_url(url).group('id', 'root_url')
        event_webpage = self._download_webpage(f'{root_url}/event/{video_id}', video_id)

        try:
            broadcast_response = self._download_json(
                f'{root_url}/event/{video_id}/broadcast_info', video_id,
                note='Downloading broadcast information', errnote='Failed to download broadcast information')
            # A response without `json_data` yields None here, which
            # get_event_status() maps to EventStatus.UNKNOWN.
            broadcast_info = broadcast_response.get('json_data') if isinstance(broadcast_response, dict) else None
            player_webpage = self._download_webpage(
                f'{root_url}/event/{video_id}/watch_live', video_id,
                note='Downloading player information', errnote='Failed to download player information')
            state = self.get_event_status(broadcast_info, player_webpage)
        except ExtractorError as e:
            # Keep the original exception attached as the cause.
            raise ExtractorError(e.msg, video_id=video_id) from e

        if state == EventStatus.NOT_STARTED:
            raise ExtractorError('The event has not started yet', expected=True, video_id=video_id)
        if state == EventStatus.ENDED:
            raise ExtractorError('The event has ended', expected=True, video_id=video_id)

        if state == EventStatus.REPLAY:
            m3u8_url = f'https://live-play.peatix.com/event{video_id}.m3u8'
        elif state == EventStatus.STARTED:
            # The live manifest URL carries the current time in milliseconds.
            m3u8_url = f'https://live-play.peatix.com/live2/streams/{video_id}.m3u8?v={int(time.time() * 1000)}'
        else:
            # EventStatus.UNKNOWN or any unexpected value: never continue
            # without a manifest URL.
            raise ExtractorError('The event status is unknown', video_id=video_id)

        manifest = self._download_webpage(
            m3u8_url, video_id, headers={'Referer': root_url}, note='Downloading m3u8 information', errnote='Failed to download m3u8 information')
        formats, _ = self._parse_m3u8_formats_and_subtitles(
            manifest, m3u8_url, 'mp4', m3u8_id='hls', video_id=video_id)

        return {
            'id': video_id,
            'title': self._html_extract_title(event_webpage) or self._html_search_meta(['og:title', 'twitter:title'], event_webpage, 'title', default=None),
            'thumbnail': self._html_search_meta(
                ['twitter:image', 'og:image'],
                event_webpage, 'thumbnail', default=None),
            'description': self._html_search_meta(
                ['description', 'twitter:description', 'og:description'],
                event_webpage, 'description', default=None),
            'formats': formats,
        }
|