gaogaotiantian · gaogaotiantian · Sep 8, 2022 · Aug 28, 2022 · Aug 28, 2022 · Aug 28, 2022
diff --git a/tests/test_vcompressor.py b/tests/test_vcompressor.py
@@ -2,10 +2,17 @@
 # For details: https://github.com/gaogaotiantian/viztracer/blob/master/NOTICE.txt
 
 
+import logging
+import lzma
 import os
 import tempfile
+from collections import namedtuple
+from functools import wraps
+from shutil import copyfileobj
+from typing import Callable, List, Optional, Tuple, overload
 
 from .cmdline_tmpl import CmdlineTmpl
+from .test_performance import Timer
 from .util import get_json_file_path
 
 
@@ -23,3 +30,129 @@ def test_basic(self):
                 ["viztracer", "-o", dup_json_path, "--decompress", cvf_path],
                 expected_output_file=dup_json_path
             )
+
+
+class TestVCompressorPerformance(CmdlineTmpl):
+    """Benchmark VCompressor against other compressors, logging size and time per file."""
+
+    BenchmarkResult = namedtuple("BenchmarkResult", ["file_size", "elapsed_time"])  # unit: byte, second
+
+    @overload
+    def _benchmark(benchmark_process: Callable[..., None]): ...
+
+    @overload
+    def _benchmark(repeat: int): ...
+
+    def _benchmark(*args, **kargs):
+        """Decorate ``f(self, src, dst)`` into ``f(self, src) -> BenchmarkResult``.
+
+        Use bare (``@_benchmark``, 3 timed runs) or as ``@_benchmark(n)`` / ``@_benchmark(repeat=n)``.
+        After one untimed warm-up, the result holds the last output size and the mean run time.
+        Raises TypeError without a function or count, ValueError for a non-positive count.
+        """
+        def _decorator(benchmark_process: Callable) -> Callable:
+            @wraps(benchmark_process)
+            def _wrapper(self, uncompressed_file_path: str) -> "TestVCompressorPerformance.BenchmarkResult":
+                compression_time_total = 0.
+                with tempfile.TemporaryDirectory() as tmpdir:
+                    compressed_file_path = os.path.join(tmpdir, "result.compressed")
+                    # pre-warm
+                    benchmark_process(self, uncompressed_file_path, compressed_file_path)
+                    os.remove(compressed_file_path)
+                    # real benchmark
+                    for _ in range(loop_time):
+                        with Timer() as t:
+                            benchmark_process(self, uncompressed_file_path, compressed_file_path)
+                            compression_time_total += t.get_time()
+                        compressed_file_size = os.path.getsize(compressed_file_path)
+                        os.remove(compressed_file_path)
+                return TestVCompressorPerformance.BenchmarkResult(compressed_file_size, compression_time_total / loop_time)
+            return _wrapper
+
+        if len(args) == 1 and not kargs and callable(args[0]):  # used as @_benchmark
+            loop_time = 3
+            return _decorator(args[0])
+        if "repeat" not in kargs and not args:
+            raise TypeError("_benchmark must decorate a function.")
+        # used as @_benchmark(...); reject counts that would leave nothing to measure or average
+        loop_time = kargs["repeat"] if "repeat" in kargs else args[0]
+        if not isinstance(loop_time, int) or loop_time < 1:
+            raise ValueError(f"repeat must be a positive integer, got {loop_time!r}")
+        return _decorator
+
+    @staticmethod
+    def _human_readable_filesize(filesize: int) -> str:  # filesize in bytes
+        """Format a byte count using the largest unit in which it is at least 0.8."""
+        units = [("PB", 1 << 50), ("TB", 1 << 40), ("GB", 1 << 30), ("MB", 1 << 20), ("KB", 1 << 10)]
+        for unit_name, unit_base in units:
+            norm_size = filesize / unit_base
+            if norm_size >= 0.8:
+                return f"{norm_size:8.2f}{unit_name}"
+        return f"{filesize:8.2f}B"
+
+    @classmethod
+    def _print_result(
+        cls,
+        filename: str,
+        original_size: int,
+        vcompress_result: BenchmarkResult,
+        other_results: List[Tuple[str, BenchmarkResult]],  # [(compressor_name, BenchmarkResult)]
+        subtest_idx: Optional[int] = None
+    ):
+        """Log sizes and times for one file; bracketed ratios are relative to VCompressor."""
+        readable = cls._human_readable_filesize
+        prefix = "" if subtest_idx is None else f"{subtest_idx}. "
+        logging.info(f"{prefix}On file \"{filename}\":")
+
+        # Space-wise Info
+        logging.info("    [Space]")
+        logging.info("      Uncompressed:   {}".format(readable(original_size)))
+        logging.info("      VCompressor:    {}(1.000) [CR:{:6.2f}%]".format(  # CR stands for compress ratio
+            readable(vcompress_result.file_size), vcompress_result.file_size / original_size * 100,
+        ))
+        for name, result in other_results:
+            logging.info("      {}{}({:.3f}) [CR:{:6.2f}%]".format(
+                (name + ":").ljust(16),  # same column width as the "VCompressor:    " label
+                readable(result.file_size),
+                result.file_size / vcompress_result.file_size, result.file_size / original_size * 100,
+            ))
+
+        # Time-wise Info
+        logging.info("    [Time]")
+        logging.info("      VCompressor:    {:9.3f}s(1.000)".format(vcompress_result.elapsed_time))
+        for name, result in other_results:
+            logging.info("      {}{:9.3f}s({:.3f})".format(
+                (name + ":").ljust(16), result.elapsed_time, result.elapsed_time / vcompress_result.elapsed_time,
+            ))
+
+    @_benchmark
+    def _benchmark_vcompressor(self, uncompressed_file_path: str, compressed_file_path: str) -> None:
+        """Compress via the ``viztracer --compress`` command line, passed to ``self.template``."""
+        self.template(
+            ["viztracer", "-o", compressed_file_path, "--compress", uncompressed_file_path],
+            expected_output_file=compressed_file_path, cleanup=False
+        )
+
+    @_benchmark
+    def _benchmark_lzma(self, uncompressed_file_path: str, compressed_file_path: str) -> None:
+        """Compress the file with LZMA at the default preset."""
+        with open(uncompressed_file_path, "rb") as original_file:
+            with lzma.open(compressed_file_path, "wb", preset=lzma.PRESET_DEFAULT) as compressed_file:
+                copyfileobj(original_file, compressed_file)
+
+    def test_benchmark_basic(self):
+        """Benchmark every sample trace with each compressor and log the comparison."""
+        # More testcases can be added here
+        testcases_filename = ["vdb_basic.json", "multithread.json"]
+
+        for subtest_idx, filename in enumerate(testcases_filename, start=1):
+            path = get_json_file_path(filename)
+            # Everything that can fail runs inside the subtest so a failure is reported per file.
+            with self.subTest(testcase=filename):
+                original_size = os.path.getsize(path)
+                # More compressors can be added here
+                other_results = [
+                    ("LZMA", self._benchmark_lzma(path)),
+                ]
+                vcompress_result = self._benchmark_vcompressor(path)
+                self._print_result(filename, original_size, vcompress_result, other_results, subtest_idx=subtest_idx)