From b4faa53417f49e5a6bde997aeefc17c4b3445faa Mon Sep 17 00:00:00 2001 From: William Wei <128806514+weilycoder@users.noreply.github.com> Date: Tue, 17 Dec 2024 23:10:35 +0800 Subject: [PATCH 1/2] Resolve IO.output_gen's issues (#155) * Resolve end-of-line sequence issues * Add a buffer * Add test * Fix type annotations * Rewrite output_gen * Ensure all child processes are terminated * Fix test * Rewrite output_gen test * Fix type hints; fix some io test * Use a simpler and more straightforward method to terminate the process tree --- .gitignore | 1 + .pylintrc | 2 +- cyaron/io.py | 143 ++++++++++++++++++++++++++-------------- cyaron/tests/io_test.py | 66 +++++++++++-------- poetry.lock | 2 +- 5 files changed, 132 insertions(+), 82 deletions(-) diff --git a/.gitignore b/.gitignore index bf4997a..76f1197 100644 --- a/.gitignore +++ b/.gitignore @@ -1,4 +1,5 @@ config.py +*.cpp *.in *.out *.exe diff --git a/.pylintrc b/.pylintrc index de2c0b1..61e0596 100644 --- a/.pylintrc +++ b/.pylintrc @@ -1,3 +1,3 @@ [MASTER] -py-version=3.5 +py-version=3.6 disable=R0902,R0903,R0913,R0917,R0912 \ No newline at end of file diff --git a/cyaron/io.py b/cyaron/io.py index bbfa7f9..3bee2ee 100644 --- a/cyaron/io.py +++ b/cyaron/io.py @@ -3,12 +3,14 @@ Classes: IO: IO tool class. It will process the input and output files. """ + from __future__ import absolute_import import os import re +import signal import subprocess import tempfile -from typing import Union, overload, Optional +from typing import Union, overload, Optional, List, cast from io import IOBase from . import log from .utils import list_like, make_unicode @@ -18,34 +20,39 @@ class IO: """IO tool class. It will process the input and output files.""" @overload - def __init__(self, - input_file: Optional[Union[IOBase, str, int]] = None, - output_file: Optional[Union[IOBase, str, int]] = None, - data_id: Optional[int] = None, - disable_output: bool = False, - make_dirs: bool = False): + def __init__( + self, + input_file: Optional[Union[IOBase, str, int]] = None, + output_file: Optional[Union[IOBase, str, int]] = None, + data_id: Optional[int] = None, + disable_output: bool = False, + make_dirs: bool = False, + ): ... @overload - def __init__(self, - data_id: Optional[int] = None, - file_prefix: Optional[str] = None, - input_suffix: str = '.in', - output_suffix: str = '.out', - disable_output: bool = False, - make_dirs: bool = False): + def __init__( + self, + data_id: Optional[int] = None, + file_prefix: Optional[str] = None, + input_suffix: str = ".in", + output_suffix: str = ".out", + disable_output: bool = False, + make_dirs: bool = False, + ): ... def __init__( # type: ignore - self, - input_file: Optional[Union[IOBase, str, int]] = None, - output_file: Optional[Union[IOBase, str, int]] = None, - data_id: Optional[int] = None, - file_prefix: Optional[str] = None, - input_suffix: str = '.in', - output_suffix: str = '.out', - disable_output: bool = False, - make_dirs: bool = False): + self, + input_file: Optional[Union[IOBase, str, int]] = None, + output_file: Optional[Union[IOBase, str, int]] = None, + data_id: Optional[int] = None, + file_prefix: Optional[str] = None, + input_suffix: str = ".in", + output_suffix: str = ".out", + disable_output: bool = False, + make_dirs: bool = False, + ): """ Args: input_file (optional): input file object or filename or file descriptor. @@ -84,12 +91,13 @@ def __init__( # type: ignore # if the dir "./io" not found it will be created """ self.__closed = False - self.input_file, self.output_file = None, None + self.input_file = cast(IOBase, None) + self.output_file = None if file_prefix is not None: # legacy mode - input_file = '{}{{}}{}'.format(self.__escape_format(file_prefix), + input_file = "{}{{}}{}".format(self.__escape_format(file_prefix), self.__escape_format(input_suffix)) - output_file = '{}{{}}{}'.format( + output_file = "{}{{}}{}".format( self.__escape_format(file_prefix), self.__escape_format(output_suffix)) self.input_filename, self.output_filename = None, None @@ -101,9 +109,13 @@ def __init__( # type: ignore self.output_file = None self.is_first_char = {} - def __init_file(self, f: Union[IOBase, str, int, - None], data_id: Union[int, None], - file_type: str, make_dirs: bool): + def __init_file( + self, + f: Union[IOBase, str, int, None], + data_id: Union[int, None], + file_type: str, + make_dirs: bool, + ): if isinstance(f, IOBase): # consider ``f`` as a file object if file_type == "i": @@ -112,8 +124,12 @@ def __init_file(self, f: Union[IOBase, str, int, self.output_file = f elif isinstance(f, int): # consider ``f`` as a file descor - self.__init_file(open(f, 'w+', encoding="utf-8", newline='\n'), - data_id, file_type, make_dirs) + self.__init_file( + open(f, "w+", encoding="utf-8", newline="\n"), + data_id, + file_type, + make_dirs, + ) elif f is None: # consider wanna temp file fd, self.input_filename = tempfile.mkstemp() @@ -133,8 +149,11 @@ def __init_file(self, f: Union[IOBase, str, int, else: self.output_filename = filename self.__init_file( - open(filename, 'w+', newline='\n', encoding='utf-8'), data_id, - file_type, make_dirs) + open(filename, "w+", newline="\n", encoding="utf-8"), + data_id, + file_type, + make_dirs, + ) def __escape_format(self, st: str): """replace "{}" to "{{}}" """ @@ -211,6 +230,15 @@ def __clear(self, file: IOBase, pos: int = 0): self.is_first_char[file] = True file.seek(pos) + @staticmethod + def _kill_process_and_children(proc: subprocess.Popen): + if os.name == "posix": + os.killpg(os.getpgid(proc.pid), signal.SIGKILL) + elif os.name == "nt": + os.system(f"TASKKILL /F /T /PID {proc.pid} > nul") + else: + proc.kill() # Not currently supported + def input_write(self, *args, **kwargs): """ Write every element in *args into the input file. Splits with `separator`. @@ -243,7 +271,11 @@ def input_clear_content(self, pos: int = 0): self.__clear(self.input_file, pos) - def output_gen(self, shell_cmd, time_limit=None): + def output_gen(self, + shell_cmd: Union[str, List[str]], + time_limit: Optional[float] = None, + *, + replace_EOL: bool = True): """ Run the command `shell_cmd` (usually the std program) and send it the input file as stdin. Write its output to the output file. @@ -251,30 +283,37 @@ def output_gen(self, shell_cmd, time_limit=None): shell_cmd: the command to run, usually the std program. time_limit: the time limit (seconds) of the command to run. None means infinity. Defaults to None. + replace_EOL: Set whether to replace the end-of-line sequence with `'\\n'`. + Defaults to True. """ if self.output_file is None: raise ValueError("Output file is disabled") self.flush_buffer() origin_pos = self.input_file.tell() self.input_file.seek(0) - if time_limit is not None: - subprocess.check_call( - shell_cmd, - shell=True, - timeout=time_limit, - stdin=self.input_file.fileno(), - stdout=self.output_file.fileno(), - universal_newlines=True, - ) + + proc = subprocess.Popen( + shell_cmd, + shell=True, + stdin=self.input_file.fileno(), + stdout=subprocess.PIPE, + universal_newlines=replace_EOL, + preexec_fn=os.setsid if os.name == "posix" else None, + ) + + try: + output, _ = proc.communicate(timeout=time_limit) + except subprocess.TimeoutExpired: + # proc.kill() # didn't work because `shell=True`. + self._kill_process_and_children(proc) + raise else: - subprocess.check_call( - shell_cmd, - shell=True, - stdin=self.input_file.fileno(), - stdout=self.output_file.fileno(), - universal_newlines=True, - ) - self.input_file.seek(origin_pos) + if replace_EOL: + self.output_file.write(output) + else: + os.write(self.output_file.fileno(), output) + finally: + self.input_file.seek(origin_pos) log.debug(self.output_filename, " done") @@ -309,6 +348,8 @@ def output_clear_content(self, pos: int = 0): Args: pos: Where file will truncate """ + if self.output_file is None: + raise ValueError("Output file is disabled") self.__clear(self.output_file, pos) def flush_buffer(self): diff --git a/cyaron/tests/io_test.py b/cyaron/tests/io_test.py index 42cb996..6a0032d 100644 --- a/cyaron/tests/io_test.py +++ b/cyaron/tests/io_test.py @@ -1,5 +1,7 @@ import unittest +import sys import os +import time import shutil import tempfile import subprocess @@ -68,38 +70,47 @@ def test_output_gen(self): with IO("test_gen.in", "test_gen.out") as test: test.output_gen("echo 233") - with open("test_gen.out") as f: + with open("test_gen.out", "rb") as f: output = f.read() - self.assertEqual(output.strip("\n"), "233") + self.assertEqual(output, b"233\n") def test_output_gen_time_limit_exceeded(self): - time_limit_exceeded = False - with captured_output() as (out, err): - with open("long_time.py", "w") as f: - f.write("import time\ntime.sleep(10)\nprint(1)") + with captured_output(): + TIMEOUT = 0.02 + WAIT_TIME = 0.4 # If the wait time is too short, an error may occur + with open("long_time.py", "w", encoding="utf-8") as f: + f.write("import time, os\n" + "fn = input()\n" + f"time.sleep({WAIT_TIME})\n" + "os.remove(fn)\n") - try: - with IO("test_gen.in", "test_gen.out") as test: - test.output_gen("python long_time.py", time_limit=1) - except subprocess.TimeoutExpired: - time_limit_exceeded = True - self.assertEqual(time_limit_exceeded, True) + with IO("test_gen.in", "test_gen.out") as test: + fd, input_filename = tempfile.mkstemp() + os.close(fd) + abs_input_filename: str = os.path.abspath(input_filename) + with self.assertRaises(subprocess.TimeoutExpired): + test.input_writeln(abs_input_filename) + test.output_gen(f'"{sys.executable}" long_time.py', + time_limit=TIMEOUT) + time.sleep(WAIT_TIME) + try: + os.remove(input_filename) + except FileNotFoundError: + self.fail("Child processes have not been terminated.") def test_output_gen_time_limit_not_exceeded(self): - time_limit_exceeded = False - with captured_output() as (out, err): - with open("short_time.py", "w") as f: - f.write("import time\ntime.sleep(0.2)\nprint(1)") - - try: - with IO("test_gen.in", "test_gen.out") as test: - test.output_gen("python short_time.py", time_limit=1) - except subprocess.TimeoutExpired: - time_limit_exceeded = True - with open("test_gen.out") as f: + with captured_output(): + with open("short_time.py", "w", encoding="utf-8") as f: + f.write("import time\n" + "time.sleep(0.1)\n" + "print(1)") + + with IO("test_gen.in", "test_gen.out") as test: + test.output_gen(f'"{sys.executable}" short_time.py', + time_limit=0.5) + with open("test_gen.out", encoding="utf-8") as f: output = f.read() - self.assertEqual(output.strip("\n"), "1") - self.assertEqual(time_limit_exceeded, False) + self.assertEqual(output, "1\n") def test_init_overload(self): with IO(file_prefix="data{", data_id=5) as test: @@ -124,10 +135,7 @@ def test_make_dirs(self): mkdir_false = False try: - with IO( - "./automkdir_false/data.in", - "./automkdir_false/data.out", - ): + with IO("./automkdir_false/data.in", "./automkdir_false/data.out"): pass except FileNotFoundError: mkdir_false = True diff --git a/poetry.lock b/poetry.lock index b1294ef..e9bf565 100644 --- a/poetry.lock +++ b/poetry.lock @@ -1,4 +1,4 @@ -# This file is automatically @generated by Poetry 1.8.3 and should not be changed by hand. +# This file is automatically @generated by Poetry 1.8.4 and should not be changed by hand. [[package]] name = "colorama" From a56cc266344c4433ff9e9b4813e62caf050ec63d Mon Sep 17 00:00:00 2001 From: William Wei <128806514+weilycoder@users.noreply.github.com> Date: Wed, 18 Dec 2024 16:42:50 +0800 Subject: [PATCH 2/2] Support generating a random seed from the command-line arguments. (#160) * Rewrite utils.py; Add function comments. * Support generating a random seed from the command-line arguments * Add the functions __all__ * Fix some warnings * Use another way to process args; write tests --- cyaron/tests/__init__.py | 1 + cyaron/tests/compare_test.py | 2 + cyaron/tests/general_test.py | 44 +++++++++++++++++ cyaron/tests/io_test.py | 2 + cyaron/utils.py | 96 +++++++++++++++++++++--------------- 5 files changed, 104 insertions(+), 41 deletions(-) diff --git a/cyaron/tests/__init__.py b/cyaron/tests/__init__.py index 328a930..6fcff5c 100644 --- a/cyaron/tests/__init__.py +++ b/cyaron/tests/__init__.py @@ -5,3 +5,4 @@ from .compare_test import TestCompare from .graph_test import TestGraph from .vector_test import TestVector +from .general_test import TestGeneral diff --git a/cyaron/tests/compare_test.py b/cyaron/tests/compare_test.py index c52a6a7..7b6c487 100644 --- a/cyaron/tests/compare_test.py +++ b/cyaron/tests/compare_test.py @@ -15,10 +15,12 @@ class TestCompare(unittest.TestCase): def setUp(self): + self.original_directory = os.getcwd() self.temp_directory = tempfile.mkdtemp() os.chdir(self.temp_directory) def tearDown(self): + os.chdir(self.original_directory) try: shutil.rmtree(self.temp_directory) except: diff --git a/cyaron/tests/general_test.py b/cyaron/tests/general_test.py index e69de29..69f7a7f 100644 --- a/cyaron/tests/general_test.py +++ b/cyaron/tests/general_test.py @@ -0,0 +1,44 @@ +import subprocess +import unittest +import os +import tempfile +import shutil +import sys + + +class TestGeneral(unittest.TestCase): + + def setUp(self): + self.original_directory = os.getcwd() + self.temp_directory = tempfile.mkdtemp() + os.chdir(self.temp_directory) + + def tearDown(self): + os.chdir(self.original_directory) + try: + shutil.rmtree(self.temp_directory) + except: + pass + + def test_randseed_arg(self): + with open("test_randseed.py", 'w', encoding='utf-8') as f: + f.write("import cyaron as c\n" + "c.process_args()\n" + "for i in range(10):\n" + " print(c.randint(1,1000000000),end=' ')\n") + + env = os.environ.copy() + env['PYTHONPATH'] = self.original_directory + os.pathsep + env.get( + 'PYTHONPATH', '') + result = subprocess.run([ + sys.executable, 'test_randseed.py', + '--randseed=pinkrabbit147154220' + ], + env=env, + stdout=subprocess.PIPE, + universal_newlines=True, + check=True) + self.assertEqual( + result.stdout, + "243842479 490459912 810766286 646030451 191412261 929378523 273000814 982402032 436668773 957169453 " + ) diff --git a/cyaron/tests/io_test.py b/cyaron/tests/io_test.py index 6a0032d..02b5a98 100644 --- a/cyaron/tests/io_test.py +++ b/cyaron/tests/io_test.py @@ -12,10 +12,12 @@ class TestIO(unittest.TestCase): def setUp(self): + self.original_directory = os.getcwd() self.temp_directory = tempfile.mkdtemp() os.chdir(self.temp_directory) def tearDown(self): + os.chdir(self.original_directory) try: shutil.rmtree(self.temp_directory) except: diff --git a/cyaron/utils.py b/cyaron/utils.py index 5b7cfd5..4ef5ad8 100644 --- a/cyaron/utils.py +++ b/cyaron/utils.py @@ -1,67 +1,81 @@ -def ati(array): - """ati(array) -> list - Convert all the elements in the array and return them in a list. - """ +"""Some utility functions.""" +import sys +import random +from typing import cast, Any, Dict, Iterable, Tuple, Union + +__all__ = [ + "ati", "list_like", "int_like", "strtolines", "make_unicode", + "unpack_kwargs", "process_args" +] + + +def ati(array: Iterable[Any]): + """Convert all the elements in the array and return them in a list.""" return [int(i) for i in array] -def list_like(data): - """list_like(data) -> bool - Judge whether the object data is like a list or a tuple. - object data -> the data to judge - """ +def list_like(data: Any): + """Judge whether the object data is like a list or a tuple.""" return isinstance(data, (tuple, list)) -def int_like(data): - isint = False - try: - isint = isint or isinstance(data, long) - except NameError: - pass - isint = isint or isinstance(data, int) - return isint +def int_like(data: Any): + """Judge whether the object data is like a int.""" + return isinstance(data, int) -def strtolines(str): - lines = str.split('\n') - for i in range(len(lines)): +def strtolines(string: str): + """ + Split the string by the newline character, remove trailing spaces from each line, + and remove any blank lines at the end of the the string. + """ + lines = string.split("\n") + for i, _ in enumerate(lines): lines[i] = lines[i].rstrip() - while len(lines) > 0 and len(lines[len(lines) - 1]) == 0: - del lines[len(lines) - 1] + while len(lines) > 0 and len(lines[-1]) == 0: + lines.pop() return lines -def make_unicode(data): +def make_unicode(data: Any): + """Convert the data to a string.""" return str(data) -def unpack_kwargs(funcname, kwargs, arg_pattern): +def unpack_kwargs( + funcname: str, + kwargs: Dict[str, Any], + arg_pattern: Iterable[Union[str, Tuple[str, Any]]], +): + """Parse the keyword arguments.""" rv = {} kwargs = kwargs.copy() for tp in arg_pattern: if list_like(tp): - k, v = tp - rv[k] = kwargs.get(k, v) - try: - del kwargs[k] - except KeyError: - pass + k, v = cast(Tuple[str, Any], tp) + rv[k] = kwargs.pop(k, v) else: - error = False + tp = cast(str, tp) try: - rv[tp] = kwargs[tp] - del kwargs[tp] - except KeyError as e: - error = True - if error: + rv[tp] = kwargs.pop(tp) + except KeyError: raise TypeError( - '{}() missing 1 required keyword-only argument: \'{}\''. - format(funcname, tp)) + f"{funcname}() missing 1 required keyword-only argument: '{tp}'" + ) from None if kwargs: raise TypeError( - '{}() got an unexpected keyword argument \'{}\''.format( - funcname, - next(iter(kwargs.items()))[0])) + f"{funcname}() got an unexpected keyword argument '{next(iter(kwargs.items()))[0]}'" + ) return rv + + +def process_args(): + """ + Process the command line arguments. + Now we support: + - randseed: set the random seed + """ + for s in sys.argv: + if s.startswith("--randseed="): + random.seed(s.split("=")[1])