KurtBestor
diff --git a/‎src/extractor/afreeca_downloader.py‎
Lines changed: 26 additions & 18 deletions b/‎src/extractor/afreeca_downloader.py‎
Lines changed: 26 additions & 18 deletions
diff --git a/‎src/extractor/artstation_downloader.py‎
Lines changed: 0 additions & 1 deletion b/‎src/extractor/artstation_downloader.py‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎src/extractor/bdsmlr_downloader.py‎
Lines changed: 1 addition & 1 deletion b/‎src/extractor/bdsmlr_downloader.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎src/extractor/bili_downloader.py‎
Lines changed: 6 additions & 3 deletions b/‎src/extractor/bili_downloader.py‎
Lines changed: 6 additions & 3 deletions
diff --git a/‎src/extractor/danbooru_downloader.py‎
Lines changed: 6 additions & 5 deletions b/‎src/extractor/danbooru_downloader.py‎
Lines changed: 6 additions & 5 deletions
diff --git a/‎src/extractor/etc_downloader.py‎
Lines changed: 63 additions & 22 deletions b/‎src/extractor/etc_downloader.py‎
Lines changed: 63 additions & 22 deletions
@@ -6,20 +6,21 @@
 import errors
 import utils
 import os
+import dateutil.parser
 
 
 class LoginRequired(errors.LoginRequired):
     def __init__(self, *args):
-        super().__init__(*args, method='browser', url='https://login.afreecatv.com/afreeca/login.php')
+        # Forwards the caller's args unchanged and always requests method='browser';
+        # only the host of the login page differs from the removed line.
+        super().__init__(*args, method='browser', url='https://login.sooplive.co.kr/afreeca/login.php')
 
 
 
 class Downloader_afreeca(Downloader):
     type = 'afreeca'
-    URLS = ['afreecatv.com']
+    URLS = ['afreecatv.com', 'sooplive.co.kr']
     single = True
-    display_name = 'AfreecaTV'
-    ACCEPT_COOKIES = [r'(.*\.)?afreecatv\.com']
+    display_name = 'SOOP'
+    ACCEPT_COOKIES = [r'(.*\.)?afreecatv\.com', r'(.*\.)?sooplive\.co\.kr']
 
     def init(self):
         self.session = Session()
@@ -82,23 +83,24 @@ def get(self):
             if alert:
                 raise LoginRequired(alert)
         soup = Soup(html)
+        date = None
 
         url_thumb = soup.find('meta', {'property': 'og:image'}).attrs['content']
         print_('url_thumb: {}'.format(url_thumb))
 
         vid = re.find('/player/([0-9]+)', url)
         if vid is None: # live
-            bid = re.find('afreecatv.com/([^/]+)', url, err='no bid')
+            bid = re.find('sooplive.co.kr/([^/]+)', url, err='no bid')
 
-            url_api = f'https://st.afreecatv.com/api/get_station_status.php?szBjId={bid}'
+            url_api = f'https://st.sooplive.co.kr/api/get_station_status.php?szBjId={bid}'
             r = session.post(url_api, headers={'Referer': url})
             d = json.loads(r.text)
             artist = d['DATA']['user_nick']
             if self._live_info is not None:
                 self._live_info['title'] = artist
 
-            url_api = f'https://live.afreecatv.com/afreeca/player_live_api.php?bjid={bid}'
-            #bno = re.find('afreecatv.com/[^/]+/([0-9]+)', url, err='no bno')
+            url_api = f'https://live.sooplive.co.kr/afreeca/player_live_api.php?bjid={bid}'
+            #bno = re.find('sooplive.co.kr/[^/]+/([0-9]+)', url, err='no bno')
             bno = re.find(r'nBroadNo\s=\s([0-9]+)', html, err='no bno') #6915
             r = session.post(url_api, data={'bid': bid, 'bno': bno, 'type': 'aid', 'pwd': '', 'player_type': 'html5', 'stream_type': 'common', 'quality': 'master', 'mode': 'landing', 'from_api': '0'}, headers={'Referer': url})
             d = json.loads(r.text)
@@ -110,11 +112,11 @@ def get(self):
 
             data = {}
             data['title'] = soup.find('meta', {'property': 'og:title'})['content'].strip()
-            data['files'] = [{'file': f'https://pc-web.stream.afreecatv.com/live-stm-16/auth_master_playlist.m3u8?aid={aid}'}]
+            data['files'] = [{'file': f'https://pc-web.stream.sooplive.co.kr/live-stm-16/auth_master_playlist.m3u8?aid={aid}'}]
             data['writer_nick'] = artist
             data['live'] = True
         elif f'{vid}/catch' in url: #6215
-            url_api = 'https://api.m.afreecatv.com/station/video/a/catchview'
+            url_api = 'https://api.m.sooplive.co.kr/station/video/a/catchview'
             r = session.post(url_api, data={'nPageNo': '1', 'nLimit': '10', 'nTitleNo': vid}, headers={'Referer': url})
             try:
                 s = cut_pair(r.text)
@@ -123,8 +125,9 @@ def get(self):
                 print_(r.text)
                 raise e
             data = d['data'][0]
+            date = dateutil.parser.parse(data['reg_date']) #7054
         else:
-            url_api = 'https://api.m.afreecatv.com/station/video/a/view'
+            url_api = 'https://api.m.sooplive.co.kr/station/video/a/view'
             r = session.post(url_api, data={'nTitleNo': vid, 'nApiLevel': '10', 'nPlaylistIdx': '0'}, headers={'Referer': url})
             try:
                 s = cut_pair(r.text)
@@ -133,6 +136,7 @@ def get(self):
                 print_(r.text)
                 raise e
             data = d['data']
+            date = dateutil.parser.parse(data.get('broad_start') or data['write_tm']) #7054, #7093
 
         title = data.get('full_title') or data['title']
         artist = data.get('copyright_nickname') or data.get('original_user_nick') or data['writer_nick']
@@ -150,9 +154,12 @@ def get(self):
         print_(f'urls_m3u8: {len(urls_m3u8)}')
 
         if data.get('live'):
-            hdr = session.headers.copy()
-            hdr['Referer'] = url
-            stream = utils.LiveStream(urls_m3u8[0], headers=hdr, cw=self.cw)
+            stream = playlist2stream(urls_m3u8[0], url, session=session) #6934
+            if stream.ms:
+                stream = stream.live
+                stream._cw = self.cw
+            if not stream.live:
+                stream.live = True#
         else:
             streams = []
             for url_m3u8 in urls_m3u8:
@@ -165,9 +172,10 @@ def get(self):
             for stream in streams[1:]:
                 streams[0] += stream
             stream = streams[0]
+            stream.live = None#
 
         live = data.get('live') or False
-        return {'url': stream, 'title': title, 'name': format_filename(title, vid, '.mp4', artist=artist, live=live), 'url_thumb': url_thumb, 'artist': artist, 'live': live}
+        return {'url': stream, 'title': title, 'name': format_filename(title, vid, '.mp4', artist=artist, live=live, date=date), 'url_thumb': url_thumb, 'artist': artist, 'live': live}
 
 
 
@@ -176,12 +184,12 @@ class Live_afreeca(utils.Live):
 
     @classmethod
     def is_live(cls, url):
-        return bool(re.match(r'https?://(play|bj).afreecatv.com/([^/?#]+)', url)) and url.strip('/').count('/') <= 4
+        # True when the URL starts with a play/bj/ch host on either domain followed by a
+        # non-empty first path segment, and has at most 4 slashes once leading/trailing
+        # '/' are stripped.
+        # NOTE(review): the dots in the pattern are unescaped, so each matches any character.
+        return bool(re.match(r'https?://(play|bj|ch).(afreecatv.com|sooplive.co.kr)/([^/?#]+)', url)) and url.strip('/').count('/') <= 4
 
     @classmethod
     def fix_url(cls, url):
-        bj = re.find(r'https?://(play|bj).afreecatv.com/([^/?#]+)', url)[1]
-        return f'https://play.afreecatv.com/{bj}'
+        # The pattern now has three capture groups (subdomain, domain, first path segment),
+        # so the path segment moved from index 1 to index 2.
+        # Presumably re.find returns the captured groups as an indexable sequence -- confirm.
+        bj = re.find(r'https?://(play|bj|ch).(afreecatv.com|sooplive.co.kr)/([^/?#]+)', url)[2]
+        # The result always uses the play.sooplive.co.kr host, whichever domain was matched.
+        return f'https://play.sooplive.co.kr/{bj}'
 
     @classmethod
     def check_live(cls, url, info=None):
 
@@ -86,7 +86,6 @@ def read(self):
 
 @try_n(2)
 def get_imgs(id_, title, session, cw=None):
-    print_ = get_print(cw)
     referer = f'https://www.artstation.com/{id_}'
     downloader.read_html(referer, session=session)
     #print(session.cookies.keys())
 
@@ -31,7 +31,7 @@ def id_(self):
         if 'bdsmlr.com' in url:
             if 'www.bdsmlr.com' in url:
                 raise Exception('www.bdsmlr.com')
-            gal_num = url.split('.bdsmlr.com')[0].split('/')[(-1)]
+            gal_num = url.split('.bdsmlr.com')[0].split('/')[-1]
         else:
             gal_num = url
         return gal_num
 
@@ -8,7 +8,7 @@
 import ree as re
 import ytdl
 import constants
-from putils import DIR
+import putils
 import threading
 import errors
 _VALID_URL = r'''(?x)
@@ -76,17 +76,19 @@ def get(self):
 
         mobj = re.match(_VALID_URL, self['referer'])
         video_id = mobj.group('id')
+        artist = info.get('uploader') or None
 
         info = {
             'url': f_video['url'],
             'url_thumb': url_thumb,
-            'name': format_filename(title, video_id, ext),
+            'artist': artist,
+            'name': format_filename(title, video_id, ext, artist=artist), #7127
             }
 
         if f_audio:
             def f():
                 audio = f_audio['url']
-                path = os.path.join(DIR, f'{uuid()}_a.tmp')
+                path = os.path.join(putils.DIRf, f'{uuid()}_a.tmp')
                 if cw is not None:
                     cw.trash_can.append(path)
                 if constants.FAST:
@@ -211,3 +213,4 @@ def read(self):
         n = int(math.ceil(8.0 / len(self.urls)))
         self.print_(f'n_threads: {n}')
         self.enableSegment(n_threads=n, overwrite=True)
+        self.artist = file['artist']
@@ -1,22 +1,23 @@
 #coding: utf-8
 import downloader
 import ree as re
-from utils import Downloader, get_max_range, clean_title, get_print, try_n, urljoin, check_alive, LazyUrl, get_ext, limits
+from utils import Downloader, Session, get_max_range, clean_title, get_print, try_n, urljoin, check_alive, LazyUrl, get_ext, limits
 from translator import tr_
 from urllib.parse import urlparse, parse_qs, quote
 import clf2
 
 
-
 class Downloader_danbooru(Downloader):
     type = 'danbooru'
     URLS = ['danbooru.donmai.us']
-    MAX_CORE = 6
+    MAX_CORE = 4
     _name = None
     ACCEPT_COOKIES = [r'(.*\.)?donmai\.us']
 
     def init(self):
-        self.session = clf2.solve(self.url, cw=self.cw)['session'] #5336
+        # The session is now created first and handed to clf2.solve, instead of being
+        # read from the 'session' key of solve()'s return value.
+        self.session = Session('chrome')
+        clf2.solve(self.url, session=self.session, cw=self.cw) #5336
+        # The User-Agent header is overwritten after solve() has run.
+        # NOTE(review): the literal 'Mozilla/5.' looks truncated but is tagged #7034;
+        # confirm it is deliberate before changing it.
+        self.session.headers['User-Agent'] = 'Mozilla/5.' #7034
 
     @classmethod
     def fix_url(cls, url):
@@ -95,7 +96,7 @@ def get(self, url):
         return img, None
 
 
-@limits(.5)
+@limits(1)
 def wait(cw):
     check_alive(cw)
 
 
@@ -1,6 +1,6 @@
 import downloader
 import ytdl
-from utils import Downloader, Session, try_n, LazyUrl, get_ext, format_filename, get_print, get_resolution
+from utils import Downloader, Session, try_n, LazyUrl, get_ext, format_filename, get_print, get_resolution, print_error, cut_pair, json
 from io import BytesIO
 import ree as re
 from m3u8_tools import playlist2stream, M3u8_stream
@@ -19,7 +19,8 @@ class Downloader_etc(Downloader):
     display_name = 'Etc'
     PRIORITY = 10
 
-    def init(self):
+    @try_n(2)
+    def read(self):
         self.session = Session()
         name = ytdl.get_extractor_name(self.url)
         self.print_('extractor: {}'.format(name))
@@ -28,21 +29,20 @@ def init(self):
         #if name == 'generic':
         #    raise NotImplementedError()
 
-    def read(self):
         video = get_video(self.url, self.session, self.cw)
 
         if video.artist:
             self.artist = video.artist
 
-        self.urls.append(video.url)
-
         self.print_('url_thumb: {}'.format(video.url_thumb))
         self.setIcon(video.thumb)
-        if video.header.lower() not in ['yourporn', 'spankbang']:
+        if video.header.lower() not in ['yourporn']:
             self.enableSegment()#
         if isinstance(video.url(), M3u8_stream):
             self.disableSegment()
 
+        self.urls.append(video.url)
+
         self.title = os.path.splitext(video.filename)[0].replace('：', ':')
 
 
@@ -69,17 +69,52 @@ def get_video(url, session, cw, ie_key=None):
         if isinstance(video, Exception):
             raise video
         if isinstance(video.url(), M3u8_stream):
-            c = video.url().segs[0].download(2, cw)
+            c = video.url().urls[0][1].download(cw)
             if not c:
                 raise Exception('invalid m3u8')
         return video
     except Exception as e:
         if isinstance(e, UnSupportedError):
             raise e
-        print_(e)
+        print_(print_error(e))
         return _get_video(url, session, cw, ie_key, allow_m3u8=False)
 
-@try_n(4)
+
+def extract_info_spankbang(url, session, cw): # temp fix
+    """Scrape a SpankBang page into an info dict, used in place of ydl.extract_info().
+
+    Args:
+        url: Page URL; fetched via downloader.read_soup and stored as info['url'].
+        session: Session passed to the page fetch and to get_ext_.
+        cw: Passed to get_print only.
+
+    Returns:
+        dict with 'url', 'title', 'id', 'thumbnail' and 'formats', where each
+        format is {'url': <first list element>, 'format': <resolution label>}.
+
+    Raises:
+        Exception: 'no stream_data' when no <script> contains 'var stream_data'.
+    """
+    # NOTE(review): print_ is assigned but never used in this function.
+    print_ = get_print(cw)
+    soup = downloader.read_soup(url, session=session)
+
+    # Use the first <script> whose text mentions 'var stream_data'.
+    for script in soup.findAll('script'):
+        script = script.string
+        if script and 'var stream_data'in script:
+            # Keep the text after the last 'var stream_data', trim spaces/tabs/'=' from
+            # both ends and swap single quotes for double quotes; the result is later
+            # fed to json.loads. cut_pair presumably trims it to one balanced
+            # bracket pair -- confirm against utils.
+            s = cut_pair(script.split('var stream_data')[-1].strip(' \t=').replace("'", '"'))
+            break
+    else:
+        # for/else: reached only when the loop ended without hitting break.
+        raise Exception('no stream_data')
+
+    info = {}
+    info['url'] = url
+    info['title'] = soup.find('h1').text.strip()
+    # The id is the first path segment after 'spankbang.com/' in the og:url meta content.
+    info['id'] = re.find(r'spankbang\.com/([^/]+)', soup.find('meta', {'property': 'og:url'})['content'], err='no id')
+    info['thumbnail'] = soup.find('meta', {'property': 'og:image'})['content']
+    info['formats'] = []
+    data = json.loads(s)
+    for res, item in data.items():
+        if res == 'main':
+            continue
+        # Only non-empty lists are used, and only their first element.
+        if item and isinstance(item,  list):
+            item = item[0]
+        else:
+            continue
+        # NOTE(review): ext is never read afterwards; get_ext_ is defined outside this
+        # view, so whether the call is needed for its side effects is unconfirmed.
+        ext = get_ext_(item, session, url)
+        # Rename the '4k'/'8k'/'16k' keys to '2160p'/'4320p'/'8640p'; other keys pass through.
+        res = {'4k': '2160p', '8k': '4320p', '16k': '8640p'}.get(res, res)
+        f = {'url': item, 'format': res}
+        info['formats'].append(f)
+
+    return info
+
+
+@try_n(2)
 def _get_video(url, session, cw, ie_key=None, allow_m3u8=True):
     print_ = get_print(cw)
     print_('get_video: {}, {}'.format(allow_m3u8, url))
@@ -90,14 +125,15 @@ def _get_video(url, session, cw, ie_key=None, allow_m3u8=True):
         'writesubtitles': True,
         }
     if ytdl.get_extractor_name(url) == 'spankbang':
-        options['legacyserverconnect'] = True #6545
-    ydl = ytdl.YoutubeDL(options, cw=cw)
-    try:
-        info = ydl.extract_info(url)
-    except Exception as e:
-        if 'ERROR: Unsupported URL' in str(e):
-            return UnSupportedError(str(e))
-        raise e
+        info = extract_info_spankbang(url, session, cw)
+    else:
+        ydl = ytdl.YoutubeDL(options, cw=cw)
+        try:
+            info = ydl.extract_info(url)
+        except Exception as e:
+            if 'ERROR: Unsupported URL' in str(e):
+                return UnSupportedError(str(e))
+            raise e
     if not ie_key:
         ie_key = ytdl.get_extractor_name(url)
     info['ie_key'] = ie_key
@@ -191,6 +227,7 @@ class Video:
     def __init__(self, f, f_audio, info, session, referer, cw=None):
         self.f_audio = f_audio
         self.cw = cw
+        print_ = get_print(cw)
         self.title = title = info['title']
         self.id = info['id']
         self.url = f['url']
@@ -222,15 +259,19 @@ def foo():
 
         if ext.lower() == '.m3u8':
             res = get_resolution() #4773
-            if info.get('live_status') == 'is_live':
+            ls = info.get('live_status')
+            print_(f'live_status: {ls}')
+            if ls == 'is_live':
                 url = foo()
             else:
                 try:
-                    url = playlist2stream(self.url, referer, session=session, n_thread=4)
+                    url = playlist2stream(self.url, referer, session=session)
                 except:
-                    url = M3u8_stream(self.url, referer=referer, session=session, n_thread=4)
-                if url.live is not None: #5110
-                    url = foo()
+                    url = M3u8_stream(self.url, referer=referer, session=session)
+                print_(f'mpegts: {url.mpegts}')
+                if url.ms or url.mpegts == False: #5110
+                    url = url.live
+                    url._cw = cw
             ext = '.mp4'
         elif ext.lower() == '.mpd': # TVer
             url = foo()