Separate modules
This commit is contained in:
@@ -1,31 +1,21 @@
|
|||||||
import argparse
|
import argparse
|
||||||
import asyncio
|
|
||||||
try:
|
try:
|
||||||
from asyncio import CancelledError
|
from asyncio import CancelledError
|
||||||
except ImportError:
|
except ImportError:
|
||||||
from asyncio.futures import CancelledError
|
from asyncio.futures import CancelledError
|
||||||
import os
|
import os
|
||||||
import signal
|
|
||||||
from json.decoder import JSONDecodeError
|
|
||||||
from pathlib import Path
|
|
||||||
from httpcore import ReadTimeout as HCReadTimeout, NetworkError as HCNetworkError
|
|
||||||
from .arguments import Arguments
|
from .arguments import Arguments
|
||||||
from .echo import Echo
|
from .echo import Echo
|
||||||
from .progressbar import ProgressBar
|
from .. exceptions import InvalidVideoIdException
|
||||||
from .. exceptions import InvalidVideoIdException, NoContents, PatternUnmatchError, UnknownConnectionError
|
|
||||||
from .. processors.html_archiver import HTMLArchiver
|
|
||||||
from .. tool.extract.extractor import Extractor
|
|
||||||
from .. tool.videoinfo import VideoInfo
|
|
||||||
from .. util.extract_video_id import extract_video_id
|
|
||||||
from .. import util
|
|
||||||
from .. import __version__
|
from .. import __version__
|
||||||
|
from .cli_extractor import CLIExtractor
|
||||||
|
|
||||||
|
|
||||||
'''
|
'''
|
||||||
Most of CLI modules refer to
|
Most of CLI modules refer to
|
||||||
Petter Kraabøl's Twitch-Chat-Downloader
|
Petter Kraabøl's Twitch-Chat-Downloader
|
||||||
https://github.com/PetterKraabol/Twitch-Chat-Downloader
|
https://github.com/PetterKraabol/Twitch-Chat-Downloader
|
||||||
(MIT License)
|
(MIT License)
|
||||||
|
|
||||||
'''
|
'''
|
||||||
|
|
||||||
|
|
||||||
@@ -38,20 +28,19 @@ def main():
|
|||||||
'If ID starts with a hyphen (-), enclose the ID in square brackets.')
|
'If ID starts with a hyphen (-), enclose the ID in square brackets.')
|
||||||
parser.add_argument('-o', f'--{Arguments.Name.OUTPUT}', type=str,
|
parser.add_argument('-o', f'--{Arguments.Name.OUTPUT}', type=str,
|
||||||
help='Output directory (end with "/"). default="./"', default='./')
|
help='Output directory (end with "/"). default="./"', default='./')
|
||||||
parser.add_argument(f'--{Arguments.Name.SAVE_ERROR_DATA}', action='store_true',
|
parser.add_argument(f'--{Arguments.Name.DEBUG}', action='store_true',
|
||||||
help='Save error data when error occurs(".dat" file)')
|
help='Debug mode. Stop when exceptions have occurred and save error data (".dat" file).')
|
||||||
parser.add_argument(f'--{Arguments.Name.VERSION}', action='store_true',
|
parser.add_argument(f'--{Arguments.Name.VERSION}', action='store_true',
|
||||||
help='Show version')
|
help='Show version.')
|
||||||
parser.add_argument(f'--{Arguments.Name.ECHO}', action='store_true',
|
parser.add_argument(f'--{Arguments.Name.ECHO}', action='store_true',
|
||||||
help='Show chats of specified video')
|
help='Display chats of specified video.')
|
||||||
|
|
||||||
Arguments(parser.parse_args().__dict__)
|
Arguments(parser.parse_args().__dict__)
|
||||||
|
|
||||||
if Arguments().print_version:
|
if Arguments().print_version:
|
||||||
print(f'pytchat v{__version__} © 2019,2020 taizan-hokuto')
|
print(f'pytchat v{__version__} © 2019, 2020 taizan-hokuto')
|
||||||
return
|
return
|
||||||
|
|
||||||
# Extractor
|
|
||||||
if not Arguments().video_ids:
|
if not Arguments().video_ids:
|
||||||
parser.print_help()
|
parser.print_help()
|
||||||
return
|
return
|
||||||
@@ -59,7 +48,7 @@ def main():
|
|||||||
# Echo
|
# Echo
|
||||||
if Arguments().echo:
|
if Arguments().echo:
|
||||||
if len(Arguments().video_ids) > 1:
|
if len(Arguments().video_ids) > 1:
|
||||||
print("You can specify only one video ID.")
|
print("When using --echo option, only one video ID can be specified.")
|
||||||
return
|
return
|
||||||
try:
|
try:
|
||||||
Echo(Arguments().video_ids[0]).run()
|
Echo(Arguments().video_ids[0]).run()
|
||||||
@@ -67,111 +56,16 @@ def main():
|
|||||||
print("Invalid video id:", str(e))
|
print("Invalid video id:", str(e))
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
print(type(e), str(e))
|
print(type(e), str(e))
|
||||||
|
if Arguments().debug:
|
||||||
|
raise
|
||||||
finally:
|
finally:
|
||||||
return
|
return
|
||||||
|
|
||||||
|
# Extractor
|
||||||
if not os.path.exists(Arguments().output):
|
if not os.path.exists(Arguments().output):
|
||||||
print("\nThe specified directory does not exist.:{}\n".format(Arguments().output))
|
print("\nThe specified directory does not exist.:{}\n".format(Arguments().output))
|
||||||
return
|
return
|
||||||
try:
|
try:
|
||||||
Runner().run()
|
CLIExtractor().run()
|
||||||
except CancelledError as e:
|
except CancelledError as e:
|
||||||
print(str(e))
|
print(str(e))
|
||||||
|
|
||||||
|
|
||||||
class Runner:
|
|
||||||
|
|
||||||
def run(self) -> None:
|
|
||||||
ex = None
|
|
||||||
pbar = None
|
|
||||||
for counter, video_id in enumerate(Arguments().video_ids):
|
|
||||||
if len(Arguments().video_ids) > 1:
|
|
||||||
print(f"\n{'-' * 10} video:{counter + 1} of {len(Arguments().video_ids)} {'-' * 10}")
|
|
||||||
|
|
||||||
try:
|
|
||||||
video_id = extract_video_id(video_id)
|
|
||||||
separated_path = str(Path(Arguments().output)) + os.path.sep
|
|
||||||
path = util.checkpath(separated_path + video_id + '.html')
|
|
||||||
try:
|
|
||||||
info = VideoInfo(video_id)
|
|
||||||
except (PatternUnmatchError, JSONDecodeError) as e:
|
|
||||||
print("Cannot parse video information.:{} {}".format(video_id, type(e)))
|
|
||||||
if Arguments().save_error_data:
|
|
||||||
util.save(str(e.doc), "ERR", ".dat")
|
|
||||||
continue
|
|
||||||
except Exception as e:
|
|
||||||
print("Cannot parse video information.:{} {}".format(video_id, type(e)))
|
|
||||||
continue
|
|
||||||
|
|
||||||
print(f"\n"
|
|
||||||
f" video_id: {video_id}\n"
|
|
||||||
f" channel: {info.get_channel_name()}\n"
|
|
||||||
f" title: {info.get_title()}\n"
|
|
||||||
f" output path: {path}")
|
|
||||||
|
|
||||||
duration = info.get_duration()
|
|
||||||
pbar = ProgressBar(total=(duration * 1000), status_txt="Extracting")
|
|
||||||
ex = Extractor(video_id,
|
|
||||||
callback=pbar.disp,
|
|
||||||
div=10)
|
|
||||||
signal.signal(signal.SIGINT, (lambda a, b: self.cancel(ex, pbar)))
|
|
||||||
|
|
||||||
data = ex.extract()
|
|
||||||
if data == []:
|
|
||||||
continue
|
|
||||||
pbar.reset("#", "=", total=len(data), status_txt="Rendering ")
|
|
||||||
processor = HTMLArchiver(path, callback=pbar.disp)
|
|
||||||
processor.process(
|
|
||||||
[{'video_id': None,
|
|
||||||
'timeout': 1,
|
|
||||||
'chatdata': (action["replayChatItemAction"]["actions"][0] for action in data)}]
|
|
||||||
)
|
|
||||||
processor.finalize()
|
|
||||||
pbar.reset('#', '#', status_txt='Completed ')
|
|
||||||
pbar.close()
|
|
||||||
print()
|
|
||||||
if pbar.is_cancelled():
|
|
||||||
print("\nThe extraction process has been discontinued.\n")
|
|
||||||
except InvalidVideoIdException:
|
|
||||||
print("Invalid Video ID or URL:", video_id)
|
|
||||||
except NoContents as e:
|
|
||||||
print(f"Abort:{str(e)}:[{video_id}]")
|
|
||||||
except (JSONDecodeError, PatternUnmatchError) as e:
|
|
||||||
print("{}:{}".format(e.msg, video_id))
|
|
||||||
if Arguments().save_error_data:
|
|
||||||
util.save(e.doc, "ERR_", ".dat")
|
|
||||||
except (UnknownConnectionError, HCNetworkError, HCReadTimeout) as e:
|
|
||||||
print(f"An unknown network error occurred during the processing of [{video_id}]. : " + str(e))
|
|
||||||
except Exception as e:
|
|
||||||
print(f"Abort:{str(type(e))} {str(e)[:80]}")
|
|
||||||
finally:
|
|
||||||
clear_tasks()
|
|
||||||
|
|
||||||
return
|
|
||||||
|
|
||||||
def cancel(self, ex=None, pbar=None) -> None:
|
|
||||||
'''Called when keyboard interrupted has occurred.
|
|
||||||
'''
|
|
||||||
print("\nKeyboard interrupted.\n")
|
|
||||||
if ex and pbar:
|
|
||||||
ex.cancel()
|
|
||||||
pbar.cancel()
|
|
||||||
|
|
||||||
|
|
||||||
def clear_tasks():
|
|
||||||
'''
|
|
||||||
Clear remained tasks.
|
|
||||||
Called when internal exception has occurred or
|
|
||||||
after each extraction process is completed.
|
|
||||||
'''
|
|
||||||
async def _shutdown():
|
|
||||||
tasks = [t for t in asyncio.all_tasks()
|
|
||||||
if t is not asyncio.current_task()]
|
|
||||||
for task in tasks:
|
|
||||||
task.cancel()
|
|
||||||
|
|
||||||
try:
|
|
||||||
loop = asyncio.get_event_loop()
|
|
||||||
loop.run_until_complete(_shutdown())
|
|
||||||
except Exception as e:
|
|
||||||
print(e)
|
|
||||||
|
|||||||
123
pytchat/cli/cli_extractor.py
Normal file
123
pytchat/cli/cli_extractor.py
Normal file
@@ -0,0 +1,123 @@
|
|||||||
|
import asyncio
|
||||||
|
import os
|
||||||
|
import signal
|
||||||
|
import traceback
|
||||||
|
from httpcore import ReadTimeout as HCReadTimeout, NetworkError as HCNetworkError
|
||||||
|
from json.decoder import JSONDecodeError
|
||||||
|
from pathlib import Path
|
||||||
|
from .arguments import Arguments
|
||||||
|
from .progressbar import ProgressBar
|
||||||
|
from .. import util
|
||||||
|
from .. exceptions import InvalidVideoIdException, NoContents, PatternUnmatchError, UnknownConnectionError
|
||||||
|
from .. processors.html_archiver import HTMLArchiver
|
||||||
|
from .. tool.extract.extractor import Extractor
|
||||||
|
from .. tool.videoinfo import VideoInfo
|
||||||
|
from .. util.extract_video_id import extract_video_id
|
||||||
|
|
||||||
|
|
||||||
|
class CLIExtractor:
|
||||||
|
# def __init__(self, arguments):
|
||||||
|
# self.arguments = arguments
|
||||||
|
|
||||||
|
def run(self) -> None:
|
||||||
|
ex = None
|
||||||
|
pbar = None
|
||||||
|
for counter, video_id in enumerate(Arguments().video_ids):
|
||||||
|
if len(Arguments().video_ids) > 1:
|
||||||
|
print(f"\n{'-' * 10} video:{counter + 1} of {len(Arguments().video_ids)} {'-' * 10}")
|
||||||
|
|
||||||
|
try:
|
||||||
|
video_id = extract_video_id(video_id)
|
||||||
|
separated_path = str(Path(Arguments().output)) + os.path.sep
|
||||||
|
path = util.checkpath(separated_path + video_id + '.html')
|
||||||
|
try:
|
||||||
|
info = VideoInfo(video_id)
|
||||||
|
except (PatternUnmatchError, JSONDecodeError) as e:
|
||||||
|
print("Cannot parse video information.:{} {}".format(video_id, type(e)))
|
||||||
|
if Arguments().debug:
|
||||||
|
util.save(str(e.doc), "ERR", ".dat")
|
||||||
|
continue
|
||||||
|
except Exception as e:
|
||||||
|
print("Cannot parse video information.:{} {}".format(video_id, type(e)))
|
||||||
|
continue
|
||||||
|
|
||||||
|
print(f"\n"
|
||||||
|
f" video_id: {video_id}\n"
|
||||||
|
f" channel: {info.get_channel_name()}\n"
|
||||||
|
f" title: {info.get_title()}\n"
|
||||||
|
f" output path: {path}")
|
||||||
|
|
||||||
|
duration = info.get_duration()
|
||||||
|
pbar = ProgressBar(total=(duration * 1000), status_txt="Extracting")
|
||||||
|
ex = Extractor(video_id,
|
||||||
|
callback=pbar.disp,
|
||||||
|
div=10)
|
||||||
|
signal.signal(signal.SIGINT, (lambda a, b: self.cancel(ex, pbar)))
|
||||||
|
|
||||||
|
data = ex.extract()
|
||||||
|
if data == [] or data is None:
|
||||||
|
continue
|
||||||
|
pbar.reset("#", "=", total=1000, status_txt="Rendering ")
|
||||||
|
processor = HTMLArchiver(path, callback=pbar.disp)
|
||||||
|
processor.process(
|
||||||
|
[{'video_id': None,
|
||||||
|
'timeout': 1,
|
||||||
|
'chatdata': (action["replayChatItemAction"]["actions"][0] for action in data)}]
|
||||||
|
)
|
||||||
|
processor.finalize()
|
||||||
|
pbar.reset('#', '#', status_txt='Completed ')
|
||||||
|
pbar.close()
|
||||||
|
print()
|
||||||
|
if pbar.is_cancelled():
|
||||||
|
print("\nThe extraction process has been discontinued.\n")
|
||||||
|
except InvalidVideoIdException:
|
||||||
|
print("Invalid Video ID or URL:", video_id)
|
||||||
|
except NoContents as e:
|
||||||
|
print(f"Abort:{str(e)}:[{video_id}]")
|
||||||
|
except (JSONDecodeError, PatternUnmatchError) as e:
|
||||||
|
print("{}:{}".format(e.msg, video_id))
|
||||||
|
if Arguments().debug:
|
||||||
|
filename = util.save(e.doc, "ERR_", ".dat")
|
||||||
|
traceback.print_exc()
|
||||||
|
print(f"Saved error data: {filename}")
|
||||||
|
except (UnknownConnectionError, HCNetworkError, HCReadTimeout) as e:
|
||||||
|
if Arguments().debug:
|
||||||
|
traceback.print_exc()
|
||||||
|
print(f"An unknown network error occurred during the processing of [{video_id}]. : " + str(e))
|
||||||
|
except Exception as e:
|
||||||
|
print(f"Abort:{str(type(e))} {str(e)[:80]}")
|
||||||
|
if Arguments().debug:
|
||||||
|
traceback.print_exc()
|
||||||
|
finally:
|
||||||
|
clear_tasks()
|
||||||
|
|
||||||
|
return
|
||||||
|
|
||||||
|
def cancel(self, ex=None, pbar=None) -> None:
|
||||||
|
'''Called when keyboard interrupted has occurred.
|
||||||
|
'''
|
||||||
|
print("\nKeyboard interrupted.\n")
|
||||||
|
if ex and pbar:
|
||||||
|
ex.cancel()
|
||||||
|
pbar.cancel()
|
||||||
|
|
||||||
|
|
||||||
|
def clear_tasks():
|
||||||
|
'''
|
||||||
|
Clear remained tasks.
|
||||||
|
Called when internal exception has occurred or
|
||||||
|
after each extraction process is completed.
|
||||||
|
'''
|
||||||
|
async def _shutdown():
|
||||||
|
tasks = [t for t in asyncio.all_tasks()
|
||||||
|
if t is not asyncio.current_task()]
|
||||||
|
for task in tasks:
|
||||||
|
task.cancel()
|
||||||
|
|
||||||
|
try:
|
||||||
|
loop = asyncio.get_event_loop()
|
||||||
|
loop.run_until_complete(_shutdown())
|
||||||
|
except Exception as e:
|
||||||
|
print(str(e))
|
||||||
|
if Arguments().debug:
|
||||||
|
traceback.print_exc()
|
||||||
Reference in New Issue
Block a user