2016-05-05 03:11:04 +09:00
# coding: utf-8
from __future__ import unicode_literals
2016-05-06 12:07:29 +09:00
import re
2016-05-05 03:11:04 +09:00
from . common import InfoExtractor
2017-03-06 00:31:44 +08:00
from . . compat import compat_xpath
2016-05-05 03:11:04 +09:00
from . . utils import (
2021-08-30 12:07:34 -04:00
date_from_str ,
2017-04-11 02:05:53 +07:00
determine_ext ,
2016-05-05 03:11:04 +09:00
ExtractorError ,
int_or_none ,
2021-08-30 12:07:34 -04:00
unified_strdate ,
2018-07-21 19:08:28 +07:00
url_or_none ,
2018-04-01 22:47:39 +07:00
urlencode_postdata ,
2016-05-06 01:24:02 +09:00
xpath_text ,
2016-05-05 03:11:04 +09:00
)
class AfreecaTVIE(InfoExtractor):
    """Extractor for AfreecaTV video-on-demand pages.

    The page is scraped for the station / board / title numbers, which are
    then sent to the ``get_video_info.php`` XML endpoint.  Depending on the
    answer the result is either a single video (HLS or RTMP) or a
    ``multi_video`` made of one entry per ``<file>`` element.
    """

    IE_NAME = 'afreecatv'
    IE_DESC = 'afreecatv.com'
    # Verbose pattern: two URL families are accepted, both ending in the
    # numeric title number captured as ``id``.
    _VALID_URL = r'''(?x)
                    https?://
                        (?:
                            (?:(?:live|afbbs|www)\.)?afreeca(?:tv)?\.com(?::\d+)?
                            (?:
                                /app/(?:index|read_ucc_bbs)\.cgi|
                                /player/[Pp]layer\.(?:swf|html)
                            )\?.*?\bnTitleNo=|
                            vod\.afreecatv\.com/PLAYER/STATION/
                        )
                        (?P<id>\d+)
                    '''
    _NETRC_MACHINE = 'afreecatv'
    _TESTS = [{
        'url': 'http://live.afreecatv.com:8079/app/index.cgi?szType=read_ucc_bbs&szBjId=dailyapril&nStationNo=16711924&nBbsNo=18605867&nTitleNo=36164052&szSkin=',
        'md5': 'f72c89fe7ecc14c1b5ce506c4996046e',
        'info_dict': {
            'id': '36164052',
            'ext': 'mp4',
            'title': '데일리 에이프릴 요정들의 시상식!',
            'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
            'uploader': 'dailyapril',
            'uploader_id': 'dailyapril',
            'upload_date': '20160503',
        },
        'skip': 'Video is gone',
    }, {
        'url': 'http://afbbs.afreecatv.com:8080/app/read_ucc_bbs.cgi?nStationNo=16711924&nTitleNo=36153164&szBjId=dailyapril&nBbsNo=18605867',
        'info_dict': {
            'id': '36153164',
            'title': "BJ유트루와 함께하는 '팅커벨 메이크업!'",
            'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
            'uploader': 'dailyapril',
            'uploader_id': 'dailyapril',
        },
        'playlist_count': 2,
        'playlist': [{
            'md5': 'd8b7c174568da61d774ef0203159bf97',
            'info_dict': {
                'id': '36153164_1',
                'ext': 'mp4',
                'title': "BJ유트루와 함께하는 '팅커벨 메이크업!'",
                'upload_date': '20160502',
            },
        }, {
            'md5': '58f2ce7f6044e34439ab2d50612ab02b',
            'info_dict': {
                'id': '36153164_2',
                'ext': 'mp4',
                'title': "BJ유트루와 함께하는 '팅커벨 메이크업!'",
                'upload_date': '20160502',
            },
        }],
        'skip': 'Video is gone',
    }, {
        'url': 'http://vod.afreecatv.com/PLAYER/STATION/18650793',
        'info_dict': {
            'id': '18650793',
            'ext': 'mp4',
            'title': '오늘은 다르다! 쏘님의 우월한 위아래~ 댄스리액션!',
            'thumbnail': r're:^https?://.*\.jpg$',
            'uploader': '윈아디',
            'uploader_id': 'badkids',
            'duration': 107,
        },
        'params': {
            'skip_download': True,
        },
    }, {
        'url': 'http://vod.afreecatv.com/PLAYER/STATION/10481652',
        'info_dict': {
            'id': '10481652',
            'title': "BJ유트루와 함께하는 '팅커벨 메이크업!'",
            'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
            'uploader': 'dailyapril',
            'uploader_id': 'dailyapril',
            'duration': 6492,
        },
        'playlist_count': 2,
        'playlist': [{
            'md5': 'd8b7c174568da61d774ef0203159bf97',
            'info_dict': {
                'id': '20160502_c4c62b9d_174361386_1',
                'ext': 'mp4',
                'title': "BJ유트루와 함께하는 '팅커벨 메이크업!' (part 1)",
                'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
                'uploader': 'dailyapril',
                'uploader_id': 'dailyapril',
                'upload_date': '20160502',
                'duration': 3601,
            },
        }, {
            'md5': '58f2ce7f6044e34439ab2d50612ab02b',
            'info_dict': {
                'id': '20160502_39e739bb_174361386_2',
                'ext': 'mp4',
                'title': "BJ유트루와 함께하는 '팅커벨 메이크업!' (part 2)",
                'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
                'uploader': 'dailyapril',
                'uploader_id': 'dailyapril',
                'upload_date': '20160502',
                'duration': 2891,
            },
        }],
        'params': {
            'skip_download': True,
        },
    }, {
        # non standard key
        'url': 'http://vod.afreecatv.com/PLAYER/STATION/20515605',
        'info_dict': {
            'id': '20170411_BE689A0E_190960999_1_2_h',
            'ext': 'mp4',
            'title': '혼자사는여자집',
            'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
            'uploader': '♥이슬이',
            'uploader_id': 'dasl8121',
            'upload_date': '20170411',
            'duration': 213,
        },
        'params': {
            'skip_download': True,
        },
    }, {
        # PARTIAL_ADULT
        'url': 'http://vod.afreecatv.com/PLAYER/STATION/32028439',
        'info_dict': {
            'id': '20180327_27901457_202289533_1',
            'ext': 'mp4',
            'title': '[생]빨개요♥ (part 1)',
            'thumbnail': 're:^https?://(?:video|st)img.afreecatv.com/.*$',
            'uploader': '[SA]서아',
            'uploader_id': 'bjdyrksu',
            'upload_date': '20180327',
            'duration': 3601,
        },
        'params': {
            'skip_download': True,
        },
        'expected_warnings': ['adult content'],
    }, {
        'url': 'http://www.afreecatv.com/player/Player.swf?szType=szBjId=djleegoon&nStationNo=11273158&nBbsNo=13161095&nTitleNo=36327652',
        'only_matching': True,
    }, {
        'url': 'http://vod.afreecatv.com/PLAYER/STATION/15055030',
        'only_matching': True,
    }]

    @staticmethod
    def parse_video_key(key):
        """Split a file key of the form ``<YYYYMMDD>_<word chars>_<part>``.

        Returns a dict with ``upload_date`` (str) and ``part`` (int) when the
        key matches that shape, and an empty dict otherwise.
        """
        video_key = {}
        m = re.match(r'^(?P<upload_date>\d{8})_\w+_(?P<part>\d+)$', key)
        if m:
            video_key['upload_date'] = m.group('upload_date')
            video_key['part'] = int(m.group('part'))
        return video_key

    def _real_initialize(self):
        """Attempt a login before extraction starts."""
        self._login()

    def _login(self):
        """Log in with the configured credentials, if there are any.

        Does nothing when no username is available.  Raises an expected
        ExtractorError when the login endpoint answers with any ``RESULT``
        other than 1.
        """
        username, password = self._get_login_info()
        if username is None:
            return

        login_form = {
            'szWork': 'login',
            'szType': 'json',
            'szUid': username,
            'szPassword': password,
            'isSaveId': 'false',
            'szScriptVar': 'oLoginRet',
            'szAction': '',
        }

        response = self._download_json(
            'https://login.afreecatv.com/app/LoginAction.php', None,
            'Logging in', data=urlencode_postdata(login_form))

        # Known RESULT codes mapped to the text reported to the user; some
        # codes only have a URL associated with them.
        _ERRORS = {
            -4: 'Your account has been suspended due to a violation of our terms and policies.',
            -5: 'https://member.afreecatv.com/app/user_delete_progress.php',
            -6: 'https://login.afreecatv.com/membership/changeMember.php',
            -8: "Hello! AfreecaTV here.\nThe username you have entered belongs to \n an account that requires a legal guardian's consent. \nIf you wish to use our services without restriction, \nplease make sure to go through the necessary verification process.",
            -9: 'https://member.afreecatv.com/app/pop_login_block.php',
            -11: 'https://login.afreecatv.com/afreeca/second_login.php',
            -12: 'https://member.afreecatv.com/app/user_security.php',
            0: 'The username does not exist or you have entered the wrong password.',
            -1: 'The username does not exist or you have entered the wrong password.',
            -3: 'You have entered your username/password incorrectly.',
            -7: 'You cannot use your Global AfreecaTV account to access Korean AfreecaTV.',
            -10: 'Sorry for the inconvenience. \nYour account has been blocked due to an unauthorized access. \nPlease contact our Help Center for assistance.',
            -32008: 'You have failed to log in. Please contact our Help Center.',
        }

        result = int_or_none(response.get('RESULT'))
        if result != 1:
            error = _ERRORS.get(result, 'You have failed to log in.')
            raise ExtractorError(
                'Unable to login: %s said: %s' % (self.IE_NAME, error),
                expected=True)

    def _real_extract(self, url):
        """Extract a single video or a multi-part video from ``url``.

        Raises an expected ExtractorError when the page reports the video as
        deleted, when the API refuses access (adult content or any other
        non-success flag) or when the API response carries no usable
        ``<video>`` element.
        """
        video_id = self._match_id(url)

        webpage = self._download_webpage(url, video_id)

        if re.search(r'alert\(["\']This video has been deleted', webpage):
            raise ExtractorError(
                'Video %s has been deleted' % video_id, expected=True)

        station_id = self._search_regex(
            r'nStationNo\s*=\s*(\d+)', webpage, 'station')
        bbs_id = self._search_regex(
            r'nBbsNo\s*=\s*(\d+)', webpage, 'bbs')
        # Prefer the title number found in the page; fall back to the URL id.
        video_id = self._search_regex(
            r'nTitleNo\s*=\s*(\d+)', webpage, 'title', default=video_id)

        partial_view = False
        adult_view = False
        # At most two requests: the second one retries with whichever extra
        # view parameter the first response asked for.
        for _ in range(2):
            query = {
                'nTitleNo': video_id,
                'nStationNo': station_id,
                'nBbsNo': bbs_id,
            }
            if partial_view:
                query['partialView'] = 'SKIP_ADULT'
            if adult_view:
                query['adultView'] = 'ADULT_VIEW'
            # Only the progress note is passed positionally; the error note
            # is left at the helper's default instead of being the video id.
            video_xml = self._download_xml(
                'http://afbbs.afreecatv.com:8080/api/video/get_video_info.php',
                video_id, 'Downloading video info XML%s'
                % (' (skipping adult)' if partial_view else ''),
                headers={
                    'Referer': url,
                }, query=query)

            flag = xpath_text(video_xml, './track/flag', 'flag', default=None)
            if flag == 'SUCCEED':
                break
            if flag == 'PARTIAL_ADULT':
                self.report_warning(
                    'In accordance with local laws and regulations, underage users are restricted from watching adult content. '
                    'Only content suitable for all ages will be downloaded. '
                    'Provide account credentials if you wish to download restricted content.')
                partial_view = True
                continue
            elif flag == 'ADULT':
                if not adult_view:
                    adult_view = True
                    continue
                error = 'Only users older than 19 are able to watch this video. Provide account credentials to download this content.'
            else:
                error = flag
            raise ExtractorError(
                '%s said: %s' % (self.IE_NAME, error), expected=True)
        else:
            # Both attempts ended in a retry request without a success flag.
            raise ExtractorError('Unable to download video info')

        # The last <video> element is the one used; guard against a response
        # without any so that the intended error below is raised instead of
        # an IndexError.
        video_elements = video_xml.findall(compat_xpath('./track/video'))
        video_element = video_elements[-1] if video_elements else None
        if video_element is None or video_element.text is None:
            raise ExtractorError(
                'Video %s does not exist' % video_id, expected=True)

        video_url = video_element.text.strip()

        title = xpath_text(video_xml, './track/title', 'title', fatal=True)

        uploader = xpath_text(video_xml, './track/nickname', 'uploader')
        uploader_id = xpath_text(video_xml, './track/bj_id', 'uploader id')
        duration = int_or_none(xpath_text(
            video_xml, './track/duration', 'duration'))
        thumbnail = xpath_text(video_xml, './track/titleImage', 'thumbnail')

        # Fields shared by the top-level result and by every part.
        common_entry = {
            'uploader': uploader,
            'uploader_id': uploader_id,
            'thumbnail': thumbnail,
        }

        info = common_entry.copy()
        info.update({
            'id': video_id,
            'title': title,
            'duration': duration,
        })

        if not video_url:
            # No direct URL: the parts are listed as <file> children.
            entries = []
            file_elements = video_element.findall(compat_xpath('./file'))
            one = len(file_elements) == 1
            for file_num, file_element in enumerate(file_elements, start=1):
                file_url = url_or_none(file_element.text)
                if not file_url:
                    continue
                key = file_element.get('key', '')
                upload_date = unified_strdate(self._search_regex(
                    r'^(\d{8})_', key, 'upload date', default=None))
                if upload_date is not None:
                    # sometimes the upload date isn't included in the file name
                    # instead, another random ID is, which may parse as a valid
                    # date but be wildly out of a reasonable range
                    parsed_date = date_from_str(upload_date)
                    if parsed_date.year < 2000 or parsed_date.year >= 2100:
                        upload_date = None
                file_duration = int_or_none(file_element.get('duration'))
                format_id = key if key else '%s_%s' % (video_id, file_num)
                if determine_ext(file_url) == 'm3u8':
                    formats = self._extract_m3u8_formats(
                        file_url, video_id, 'mp4', entry_protocol='m3u8_native',
                        m3u8_id='hls',
                        note='Downloading part %d m3u8 information' % file_num)
                else:
                    formats = [{
                        'url': file_url,
                        'format_id': 'http',
                    }]
                if not formats and not self.get_param('ignore_no_formats'):
                    continue
                self._sort_formats(formats)
                file_info = common_entry.copy()
                file_info.update({
                    'id': format_id,
                    'title': title if one else '%s (part %d)' % (title, file_num),
                    'upload_date': upload_date,
                    'duration': file_duration,
                    'formats': formats,
                })
                entries.append(file_info)
            entries_info = info.copy()
            entries_info.update({
                '_type': 'multi_video',
                'entries': entries,
            })
            return entries_info

        # Single video: ``info`` already holds id, title, uploader,
        # uploader_id, duration and thumbnail.
        if determine_ext(video_url) == 'm3u8':
            info['formats'] = self._extract_m3u8_formats(
                video_url, video_id, 'mp4', entry_protocol='m3u8_native',
                m3u8_id='hls')
        else:
            # Otherwise the URL is split at 'mp4:' into app and play path.
            app, playpath = video_url.split('mp4:')
            info.update({
                'url': app,
                'ext': 'flv',
                'play_path': 'mp4:' + playpath,
                'rtmp_live': True,  # downloading won't end without this
            })

        return info