py : re-enable mmap in convert hf (#4732)

author Nam D. Tran <redacted>

Tue, 2 Jan 2024 09:23:38 +0000 (16:23 +0700)

committer GitHub <redacted>

Tue, 2 Jan 2024 09:23:38 +0000 (11:23 +0200)
author Nam D. Tran <redacted>
Tue, 2 Jan 2024 09:23:38 +0000 (16:23 +0700)
committer GitHub <redacted>
Tue, 2 Jan 2024 09:23:38 +0000 (11:23 +0200)
diff --git a/awq-py/requirements.txt b/awq-py/requirements.txt

index 5fe604329b354d90a7621945d7545603df2f4241..99189611607745fc6fee19501763ab1e7cd45506 100644 (file)
--- a/awq-py/requirements.txt
+++ b/awq-py/requirements.txt
@@ -1,2 +1,2 @@
-torch>=2.0.0
+torch>=2.1.1
  transformers>=4.32.0
diff --git a/convert-hf-to-gguf.py b/convert-hf-to-gguf.py

index 51724c0dfca564771c41f06f42487b9386700d50..203eaf64b3fc36a1a25dacb4fded02ea294c7102 100755 (executable)
--- a/convert-hf-to-gguf.py
+++ b/convert-hf-to-gguf.py
@@ -59,7 +59,7 @@ class Model:
                  from safetensors import safe_open
                  ctx = cast(ContextManager[Any], safe_open(self.dir_model / part_name, framework="pt", device="cpu"))
              else:
-                ctx = contextlib.nullcontext(torch.load(str(self.dir_model / part_name), map_location="cpu", weights_only=True))
+                ctx = contextlib.nullcontext(torch.load(str(self.dir_model / part_name), map_location="cpu", mmap=True, weights_only=True))
  
              with ctx as model_part:
                  for name in model_part.keys():
author	Nam D. Tran <redacted>
	Tue, 2 Jan 2024 09:23:38 +0000 (16:23 +0700)
committer	GitHub <redacted>
	Tue, 2 Jan 2024 09:23:38 +0000 (11:23 +0200)
awq-py/requirements.txt		patch | blob | history
convert-hf-to-gguf.py		patch | blob | history