Skip to content

Commit 9c6118c

Browse files
committed
convert.py: Fix loading safetensors and ggml format on Windows
Calling `mmap.mmap` on Windows apparently resets the file offset of the raw file object (and makes the BufferedReader return a *negative* file offset). For safetensors, avoid using the file offset after calling mmap. For GGML format, explicitly save and restore the offset. Fixes ggml-org#966.
1 parent c85e03d commit 9c6118c

File tree

1 file changed

+4
-2
lines changed

1 file changed

+4
-2
lines changed

convert.py

+4-2
Original file line numberDiff line numberDiff line change
@@ -735,7 +735,7 @@ def lazy_load_safetensors_file(fp: IO[bytes], path: Path) -> ModelPlus:
735735
header: Dict[str, Dict[str, Any]] = json.loads(fp.read(header_size))
736736
# Use mmap for the actual data to avoid race conditions with the file offset.
737737
mapped = memoryview(mmap.mmap(fp.fileno(), 0, access=mmap.ACCESS_READ))
738-
byte_buf = mapped[fp.tell():]
738+
byte_buf = mapped[8 + header_size:]
739739

740740
def convert(info: Dict[str, Any]) -> LazyTensor:
741741
data_type = SAFETENSORS_DATA_TYPES[info['dtype']]
@@ -761,7 +761,7 @@ def must_read(fp: IO[bytes], length: int) -> bytes:
761761
return ret
762762

763763

764-
def lazy_load_ggml_file(fp: IO[bytes], path: Path) -> ModelPlus:
764+
def lazy_load_ggml_file(fp: io.BufferedReader, path: Path) -> ModelPlus:
765765
magic = must_read(fp, 4)[::-1]
766766
if magic in (b'ggmf', b'ggjt'):
767767
version, = struct.unpack("i", must_read(fp, 4))
@@ -795,7 +795,9 @@ def lazy_load_ggml_file(fp: IO[bytes], path: Path) -> ModelPlus:
795795

796796
model: LazyModel = {}
797797
# Use mmap for the actual data to avoid race conditions with the file offset.
798+
off = fp.raw.tell()
798799
mapped = memoryview(mmap.mmap(fp.fileno(), 0, access=mmap.ACCESS_READ))
800+
fp.raw.seek(off) # needed on Windows
799801

800802
def read_tensor() -> None: # this is a function so that variables captured in `load` don't change
801803
shape_len, name_len, ftype = struct.unpack("iii", must_read(fp, 12))

0 commit comments

Comments
 (0)