From d2708ecf792aea74b4f1746e257e8a8417f9bb5d Mon Sep 17 00:00:00 2001 From: Wei Li Date: Thu, 12 Oct 2023 13:00:28 -0700 Subject: [PATCH] Enhance Python strValStore speed with generator (#264) --- pecos/utils/mmap_valstore_util.py | 15 +++++++-------- 1 file changed, 7 insertions(+), 8 deletions(-) diff --git a/pecos/utils/mmap_valstore_util.py b/pecos/utils/mmap_valstore_util.py index f306353..e152154 100644 --- a/pecos/utils/mmap_valstore_util.py +++ b/pecos/utils/mmap_valstore_util.py @@ -300,18 +300,17 @@ def __init__(self, max_row_size: int, max_col_size: int, trunc_val_len: int): for start_idx in bytes_start_loc ] - # Buffer for return string objects - self.ret_obj = np.zeros(max_row_size * max_col_size, dtype=np.object_) - def format_ret(self, n_rows, n_cols): """ Reshape return into decoded string matrix """ - for idx in range(n_rows * n_cols): - self.ret_obj[idx] = str( - self.byte_mem_views[idx][: self.vals_lens[idx]], "utf-8", "ignore" - ) - return self.ret_obj[: n_rows * n_cols].reshape(n_rows, n_cols).tolist() + ret_len = n_rows * n_cols + ret = [ + str(mem_view[:val_len], "utf-8", "ignore") + for mem_view, val_len in zip(self.byte_mem_views[:ret_len], self.vals_lens[:ret_len]) + ] + + return [ret[i : i + n_cols] for i in range(0, ret_len, n_cols)] class _MmapValStoreWrite(_MmapValStoreBase):