2023-02-21 01:18:45 +00:00
import functools
2022-12-03 02:00:26 +00:00
import re
from . common import InfoExtractor
from . . utils import (
2023-02-21 01:18:45 +00:00
ExtractorError ,
OnDemandPagedList ,
2022-12-03 02:00:26 +00:00
date_from_str ,
determine_ext ,
int_or_none ,
qualities ,
traverse_obj ,
unified_strdate ,
unified_timestamp ,
update_url_query ,
url_or_none ,
urlencode_postdata ,
xpath_text ,
)
class AfreecaTVIE(InfoExtractor):
    """Extractor for AfreecaTV VOD pages (single- and multi-part videos)."""

    IE_NAME = 'afreecatv'
    IE_DESC = 'afreecatv.com'
    _VALID_URL = r'''(?x)
                    https?://
                        (?:
                            (?:(?:live|afbbs|www)\.)?afreeca(?:tv)?\.com(?::\d+)?
                            (?:
                                /app/(?:index|read_ucc_bbs)\.cgi|
                                /player/[Pp]layer\.(?:swf|html)
                            )\?.*?\bnTitleNo=|
                            vod\.afreecatv\.com/(PLAYER/STATION|player)/
                        )
                        (?P<id>\d+)
                    '''
    _NETRC_MACHINE = 'afreecatv'
    _TESTS = [{
        'url': 'http://live.afreecatv.com:8079/app/index.cgi?szType=read_ucc_bbs&szBjId=dailyapril&nStationNo=16711924&nBbsNo=18605867&nTitleNo=36164052&szSkin=',
        'md5': 'f72c89fe7ecc14c1b5ce506c4996046e',
        'info_dict': {
            'id': '36164052',
            'ext': 'mp4',
            'title': '데일리 에이프릴 요정들의 시상식!',
            'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
            'uploader': 'dailyapril',
            'uploader_id': 'dailyapril',
            'upload_date': '20160503',
        },
        'skip': 'Video is gone',
    }, {
        'url': 'http://afbbs.afreecatv.com:8080/app/read_ucc_bbs.cgi?nStationNo=16711924&nTitleNo=36153164&szBjId=dailyapril&nBbsNo=18605867',
        'info_dict': {
            'id': '36153164',
            'title': "BJ유트루와 함께하는 '팅커벨 메이크업!'",
            'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
            'uploader': 'dailyapril',
            'uploader_id': 'dailyapril',
        },
        'playlist_count': 2,
        'playlist': [{
            'md5': 'd8b7c174568da61d774ef0203159bf97',
            'info_dict': {
                'id': '36153164_1',
                'ext': 'mp4',
                'title': "BJ유트루와 함께하는 '팅커벨 메이크업!'",
                'upload_date': '20160502',
            },
        }, {
            'md5': '58f2ce7f6044e34439ab2d50612ab02b',
            'info_dict': {
                'id': '36153164_2',
                'ext': 'mp4',
                'title': "BJ유트루와 함께하는 '팅커벨 메이크업!'",
                'upload_date': '20160502',
            },
        }],
        'skip': 'Video is gone',
    }, {
        'url': 'http://vod.afreecatv.com/PLAYER/STATION/18650793',
        'info_dict': {
            'id': '18650793',
            'ext': 'mp4',
            'title': '오늘은 다르다! 쏘님의 우월한 위아래~ 댄스리액션!',
            'thumbnail': r're:^https?://.*\.jpg$',
            'uploader': '윈아디',
            'uploader_id': 'badkids',
            'duration': 107,
        },
        'params': {
            'skip_download': True,
        },
    }, {
        'url': 'http://vod.afreecatv.com/PLAYER/STATION/10481652',
        'info_dict': {
            'id': '10481652',
            'title': "BJ유트루와 함께하는 '팅커벨 메이크업!'",
            'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
            'uploader': 'dailyapril',
            'uploader_id': 'dailyapril',
            'duration': 6492,
        },
        'playlist_count': 2,
        'playlist': [{
            'md5': 'd8b7c174568da61d774ef0203159bf97',
            'info_dict': {
                'id': '20160502_c4c62b9d_174361386_1',
                'ext': 'mp4',
                'title': "BJ유트루와 함께하는 '팅커벨 메이크업!' (part 1)",
                'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
                'uploader': 'dailyapril',
                'uploader_id': 'dailyapril',
                'upload_date': '20160502',
                'duration': 3601,
            },
        }, {
            'md5': '58f2ce7f6044e34439ab2d50612ab02b',
            'info_dict': {
                'id': '20160502_39e739bb_174361386_2',
                'ext': 'mp4',
                'title': "BJ유트루와 함께하는 '팅커벨 메이크업!' (part 2)",
                'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
                'uploader': 'dailyapril',
                'uploader_id': 'dailyapril',
                'upload_date': '20160502',
                'duration': 2891,
            },
        }],
        'params': {
            'skip_download': True,
        },
    }, {
        # non standard key
        'url': 'http://vod.afreecatv.com/PLAYER/STATION/20515605',
        'info_dict': {
            'id': '20170411_BE689A0E_190960999_1_2_h',
            'ext': 'mp4',
            'title': '혼자사는여자집',
            'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
            'uploader': '♥이슬이',
            'uploader_id': 'dasl8121',
            'upload_date': '20170411',
            'duration': 213,
        },
        'params': {
            'skip_download': True,
        },
    }, {
        # PARTIAL_ADULT
        'url': 'http://vod.afreecatv.com/PLAYER/STATION/32028439',
        'info_dict': {
            'id': '20180327_27901457_202289533_1',
            'ext': 'mp4',
            'title': '[생]빨개요♥ (part 1)',
            'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
            'uploader': '[SA]서아',
            'uploader_id': 'bjdyrksu',
            'upload_date': '20180327',
            'duration': 3601,
        },
        'params': {
            'skip_download': True,
        },
        'expected_warnings': ['adult content'],
    }, {
        'url': 'http://www.afreecatv.com/player/Player.swf?szType=szBjId=djleegoon&nStationNo=11273158&nBbsNo=13161095&nTitleNo=36327652',
        'only_matching': True,
    }, {
        'url': 'http://vod.afreecatv.com/PLAYER/STATION/15055030',
        'only_matching': True,
    }, {
        'url': 'http://vod.afreecatv.com/player/15055030',
        'only_matching': True,
    }]

    @staticmethod
    def parse_video_key(key):
        """Split a file key of the form ``<8 digits>_<word>_<digits>``.

        Returns a dict with ``upload_date`` (the 8-digit prefix, as a string)
        and ``part`` (the trailing number, as an int); the dict is empty when
        the key does not have that shape.
        """
        video_key = {}
        m = re.match(r'^(?P<upload_date>\d{8})_\w+_(?P<part>\d+)$', key)
        if m:
            video_key['upload_date'] = m.group('upload_date')
            video_key['part'] = int(m.group('part'))
        return video_key

    def _perform_login(self, username, password):
        """Post the login form and raise ExtractorError unless RESULT is 1."""
        login_form = {
            'szWork': 'login',
            'szType': 'json',
            'szUid': username,
            'szPassword': password,
            'isSaveId': 'false',
            'szScriptVar': 'oLoginRet',
            'szAction': '',
        }

        response = self._download_json(
            'https://login.afreecatv.com/app/LoginAction.php', None,
            'Logging in', data=urlencode_postdata(login_form))

        # Known RESULT codes mapped to the text shown to the user; some
        # entries are URLs rather than sentences.
        _ERRORS = {
            -4: 'Your account has been suspended due to a violation of our terms and policies.',
            -5: 'https://member.afreecatv.com/app/user_delete_progress.php',
            -6: 'https://login.afreecatv.com/membership/changeMember.php',
            -8: "Hello! AfreecaTV here.\nThe username you have entered belongs to\nan account that requires a legal guardian's consent.\nIf you wish to use our services without restriction,\nplease make sure to go through the necessary verification process.",
            -9: 'https://member.afreecatv.com/app/pop_login_block.php',
            -11: 'https://login.afreecatv.com/afreeca/second_login.php',
            -12: 'https://member.afreecatv.com/app/user_security.php',
            0: 'The username does not exist or you have entered the wrong password.',
            -1: 'The username does not exist or you have entered the wrong password.',
            -3: 'You have entered your username/password incorrectly.',
            -7: 'You cannot use your Global AfreecaTV account to access Korean AfreecaTV.',
            -10: 'Sorry for the inconvenience.\nYour account has been blocked due to an unauthorized access.\nPlease contact our Help Center for assistance.',
            -32008: 'You have failed to log in. Please contact our Help Center.',
        }

        result = int_or_none(response.get('RESULT'))
        if result != 1:
            error = _ERRORS.get(result, 'You have failed to log in.')
            raise ExtractorError(
                'Unable to login: %s said: %s' % (self.IE_NAME, error),
                expected=True)

    def _real_extract(self, url):
        """Extract a VOD as a single video or a ``multi_video`` of its parts.

        Raises ExtractorError when the page reports the video as deleted,
        when the info API answers with a flag other than SUCCEED, or when
        the info XML carries no usable ``track/video`` element.
        """
        video_id = self._match_id(url)

        webpage = self._download_webpage(url, video_id)

        if re.search(r'alert\(["\']This video has been deleted', webpage):
            raise ExtractorError(
                'Video %s has been deleted' % video_id, expected=True)

        station_id = self._search_regex(
            r'nStationNo\s*=\s*(\d+)', webpage, 'station')
        bbs_id = self._search_regex(
            r'nBbsNo\s*=\s*(\d+)', webpage, 'bbs')
        video_id = self._search_regex(
            r'nTitleNo\s*=\s*(\d+)', webpage, 'title', default=video_id)

        partial_view = False
        adult_view = False
        # At most two requests: the second one retries with the adult /
        # skip-adult query parameter selected by the first response's flag.
        for _ in range(2):
            query = {
                'nTitleNo': video_id,
                'nStationNo': station_id,
                'nBbsNo': bbs_id,
            }
            if partial_view:
                query['partialView'] = 'SKIP_ADULT'
            if adult_view:
                query['adultView'] = 'ADULT_VIEW'
            video_xml = self._download_xml(
                'http://afbbs.afreecatv.com:8080/api/video/get_video_info.php',
                video_id,
                note='Downloading video info XML%s'
                % (' (skipping adult)' if partial_view else ''),
                # The video id used to be passed positionally here, which
                # made it the error note.
                errnote='Unable to download video info XML',
                headers={
                    'Referer': url,
                }, query=query)

            flag = xpath_text(video_xml, './track/flag', 'flag', default=None)
            if flag == 'SUCCEED':
                break
            if flag == 'PARTIAL_ADULT':
                self.report_warning(
                    'In accordance with local laws and regulations, underage users are restricted from watching adult content. '
                    'Only content suitable for all ages will be downloaded. '
                    'Provide account credentials if you wish to download restricted content.')
                partial_view = True
                continue
            elif flag == 'ADULT':
                if not adult_view:
                    adult_view = True
                    continue
                error = 'Only users older than 19 are able to watch this video. Provide account credentials to download this content.'
            else:
                error = flag
            raise ExtractorError(
                '%s said: %s' % (self.IE_NAME, error), expected=True)
        else:
            # Both attempts ended in `continue` without reaching SUCCEED.
            raise ExtractorError('Unable to download video info')

        # findall() returns an empty list when nothing matches, so indexing
        # it unconditionally would raise IndexError instead of the intended
        # "does not exist" error below.
        video_elements = video_xml.findall('./track/video')
        video_element = video_elements[-1] if video_elements else None
        if video_element is None or video_element.text is None:
            raise ExtractorError(
                'Video %s does not exist' % video_id, expected=True)

        video_url = video_element.text.strip()

        title = xpath_text(video_xml, './track/title', 'title', fatal=True)

        uploader = xpath_text(video_xml, './track/nickname', 'uploader')
        uploader_id = xpath_text(video_xml, './track/bj_id', 'uploader id')
        duration = int_or_none(xpath_text(
            video_xml, './track/duration', 'duration'))
        thumbnail = xpath_text(video_xml, './track/titleImage', 'thumbnail')

        # Fields shared by the top-level result and every part entry.
        common_entry = {
            'uploader': uploader,
            'uploader_id': uploader_id,
            'thumbnail': thumbnail,
        }
        info = {
            **common_entry,
            'id': video_id,
            'title': title,
            'duration': duration,
        }

        if not video_url:
            # No direct URL on the <video> element: the parts are listed as
            # <file> children instead.
            entries = []
            file_elements = video_element.findall('./file')
            one = len(file_elements) == 1
            for file_num, file_element in enumerate(file_elements, start=1):
                file_url = url_or_none(file_element.text)
                if not file_url:
                    continue
                key = file_element.get('key', '')
                upload_date = unified_strdate(self._search_regex(
                    r'^(\d{8})_', key, 'upload date', default=None))
                if upload_date is not None:
                    # sometimes the upload date isn't included in the file name
                    # instead, another random ID is, which may parse as a valid
                    # date but be wildly out of a reasonable range
                    parsed_date = date_from_str(upload_date)
                    if parsed_date.year < 2000 or parsed_date.year >= 2100:
                        upload_date = None
                file_duration = int_or_none(file_element.get('duration'))
                format_id = key if key else '%s_%s' % (video_id, file_num)
                if determine_ext(file_url) == 'm3u8':
                    formats = self._extract_m3u8_formats(
                        file_url, video_id, 'mp4', entry_protocol='m3u8_native',
                        m3u8_id='hls',
                        note='Downloading part %d m3u8 information' % file_num)
                else:
                    formats = [{
                        'url': file_url,
                        'format_id': 'http',
                    }]
                if not formats and not self.get_param('ignore_no_formats'):
                    continue
                entries.append({
                    **common_entry,
                    'id': format_id,
                    'title': title if one else '%s (part %d)' % (title, file_num),
                    'upload_date': upload_date,
                    'duration': file_duration,
                    'formats': formats,
                })
            return {
                **info,
                '_type': 'multi_video',
                'entries': entries,
            }

        if determine_ext(video_url) == 'm3u8':
            info['formats'] = self._extract_m3u8_formats(
                video_url, video_id, 'mp4', entry_protocol='m3u8_native',
                m3u8_id='hls')
        else:
            app, playpath = video_url.split('mp4:')
            info.update({
                'url': app,
                'ext': 'flv',
                'play_path': 'mp4:' + playpath,
                'rtmp_live': True,  # downloading won't end without this
            })

        return info
2023-02-21 01:18:45 +00:00
class AfreecaTVLiveIE(AfreecaTVIE):  # XXX: Do not subclass from concrete IE
    """Extractor for AfreecaTV live broadcasts (play.afreecatv.com URLs)."""

    IE_NAME = 'afreecatv:live'
    _VALID_URL = r'https?://play\.afreeca(?:tv)?\.com/(?P<id>[^/]+)(?:/(?P<bno>\d+))?'
    _TESTS = [{
        'url': 'https://play.afreecatv.com/pyh3646/237852185',
        'info_dict': {
            'id': '237852185',
            'ext': 'mp4',
            'title': '【 우루과이 오늘은 무슨일이? 】',
            'uploader': '박진우[JINU]',
            'uploader_id': 'pyh3646',
            'timestamp': 1640661495,
            'is_live': True,
        },
        'skip': 'Livestream has ended',
    }, {
        'url': 'http://play.afreeca.com/pyh3646/237852185',
        'only_matching': True,
    }, {
        'url': 'http://play.afreeca.com/pyh3646',
        'only_matching': True,
    }]

    _LIVE_API_URL = 'https://live.afreecatv.com/afreeca/player_live_api.php'

    # Stream qualities requested from the live API, in the order passed to
    # qualities() for ranking.
    _QUALITIES = ('sd', 'hd', 'hd2k', 'original')

    def _real_extract(self, url):
        """Extract the HLS formats of a live broadcast.

        Raises ExtractorError when no broadcast number can be determined, or
        when the channel reports BPWD == 'Y' and no ``videopassword`` param
        was supplied.
        """
        broadcaster_id, broadcast_no = self._match_valid_url(url).group('id', 'bno')
        password = self.get_param('videopassword')

        info = self._download_json(self._LIVE_API_URL, broadcaster_id, fatal=False,
                                   data=urlencode_postdata({'bid': broadcaster_id})) or {}
        channel_info = info.get('CHANNEL') or {}
        # Values from the API response take precedence over those in the URL.
        broadcaster_id = channel_info.get('BJID') or broadcaster_id
        broadcast_no = channel_info.get('BNO') or broadcast_no
        password_protected = channel_info.get('BPWD')
        if not broadcast_no:
            raise ExtractorError(f'Unable to extract broadcast number ({broadcaster_id} may not be live)', expected=True)
        if password_protected == 'Y' and password is None:
            raise ExtractorError(
                'This livestream is protected by a password, use the --video-password option',
                expected=True)

        # Both values are the same for every quality, so resolve them once.
        # `or` (rather than a .get() default) also covers a key that is
        # present but null/empty, mirroring how RMD is handled.
        stream_base_url = channel_info.get('RMD') or 'https://livestream-manager.afreecatv.com'
        cdn = channel_info.get('CDN') or 'gcp_cdn'

        formats = []
        quality_key = qualities(self._QUALITIES)
        for quality_str in self._QUALITIES:
            params = {
                'bno': broadcast_no,
                'stream_type': 'common',
                'type': 'aid',
                'quality': quality_str,
            }
            if password is not None:
                params['pwd'] = password
            aid_response = self._download_json(
                self._LIVE_API_URL, broadcast_no, fatal=False,
                data=urlencode_postdata(params),
                note=f'Downloading access token for {quality_str} stream',
                errnote=f'Unable to download access token for {quality_str} stream')
            aid = traverse_obj(aid_response, ('CHANNEL', 'AID'))
            if not aid:
                # No access token for this quality: skip it.
                continue

            stream_info = self._download_json(
                f'{stream_base_url}/broad_stream_assign.html', broadcast_no, fatal=False,
                query={
                    'return_type': cdn,
                    'broad_key': f'{broadcast_no}-common-{quality_str}-hls',
                },
                note=f'Downloading metadata for {quality_str} stream',
                errnote=f'Unable to download metadata for {quality_str} stream') or {}

            if stream_info.get('view_url'):
                formats.append({
                    'format_id': quality_str,
                    'url': update_url_query(stream_info['view_url'], {'aid': aid}),
                    'ext': 'mp4',
                    'protocol': 'm3u8',
                    'quality': quality_key(quality_str),
                })

        station_info = self._download_json(
            'https://st.afreecatv.com/api/get_station_status.php', broadcast_no,
            query={'szBjId': broadcaster_id}, fatal=False,
            note='Downloading channel metadata', errnote='Unable to download channel metadata') or {}

        return {
            'id': broadcast_no,
            'title': channel_info.get('TITLE') or station_info.get('station_title'),
            'uploader': channel_info.get('BJNICK') or station_info.get('station_name'),
            'uploader_id': broadcaster_id,
            'timestamp': unified_timestamp(station_info.get('broad_start')),
            'formats': formats,
            'is_live': True,
        }
2023-02-21 01:18:45 +00:00
class AfreecaTVUserIE(InfoExtractor):
    """Extractor that lists a broadcaster's VODs as a playlist."""

    IE_NAME = 'afreecatv:user'
    _VALID_URL = r'https?://bj\.afreeca(?:tv)?\.com/(?P<id>[^/]+)/vods/?(?P<slug_type>[^/]+)?'
    _TESTS = [{
        'url': 'https://bj.afreecatv.com/ryuryu24/vods/review',
        'info_dict': {
            '_type': 'playlist',
            'id': 'ryuryu24',
            'title': 'ryuryu24 - review',
        },
        'playlist_count': 218,
    }, {
        'url': 'https://bj.afreecatv.com/parang1995/vods/highlight',
        'info_dict': {
            '_type': 'playlist',
            'id': 'parang1995',
            'title': 'parang1995 - highlight',
        },
        'playlist_count': 997,
    }, {
        'url': 'https://bj.afreecatv.com/ryuryu24/vods',
        'info_dict': {
            '_type': 'playlist',
            'id': 'ryuryu24',
            'title': 'ryuryu24 - all',
        },
        'playlist_count': 221,
    }, {
        'url': 'https://bj.afreecatv.com/ryuryu24/vods/balloonclip',
        'info_dict': {
            '_type': 'playlist',
            'id': 'ryuryu24',
            'title': 'ryuryu24 - balloonclip',
        },
        'playlist_count': 0,
    }]

    # Page size requested from the API and declared to OnDemandPagedList.
    _PER_PAGE = 60

    def _fetch_page(self, user_id, user_type, page):
        """Yield one url_result per VOD listed on the given page.

        ``page`` is incremented before being sent as the ``page`` query
        parameter (presumably the caller counts from 0 while the API counts
        from 1 -- confirm against OnDemandPagedList).
        """
        page += 1
        info = self._download_json(f'https://bjapi.afreecatv.com/api/{user_id}/vods/{user_type}', user_id,
                                   query={'page': page, 'per_page': self._PER_PAGE, 'orderby': 'reg_date'},
                                   note=f'Downloading {user_type} video page {page}')
        # A response without a "data" list is treated as an empty page
        # instead of failing with a bare KeyError.
        for item in info.get('data') or []:
            title_no = item['title_no']
            yield self.url_result(
                f'https://vod.afreecatv.com/player/{title_no}/', AfreecaTVIE, title_no)

    def _real_extract(self, url):
        """Return a lazily paged playlist of the user's VODs.

        The optional URL slug selects the VOD category; it defaults to 'all'
        when absent.
        """
        user_id, user_type = self._match_valid_url(url).group('id', 'slug_type')
        user_type = user_type or 'all'
        entries = OnDemandPagedList(functools.partial(self._fetch_page, user_id, user_type), self._PER_PAGE)
        return self.playlist_result(entries, user_id, f'{user_id} - {user_type}')