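revert: can't fix that bug locally (the llama-cpp-python bug where additional_files inherit the parent file's subfolder when loading sharded GGUF models)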

zhudotexe · zhudotexe · commit 9ba2df7b3ecf · 2025-02-17T17:06:09.000-05:00
diff --git a/kani/engines/llamacpp/base.py b/kani/engines/llamacpp/base.py
@@ -65,18 +65,10 @@ def __init__(
         if match := re.match(r"(.*?)-(\d+)-of-(\d+)\.gguf", filename):
             log.info("Sharded GGUF file given - ensuring that all GGUF shards are downloaded")
             additional_files = []
-            # there is a bug in llama-cpp-python that makes the additional_files inherit the subfolder of the parent
-            *subfolders, basename = match[1].split("/")
-            if subfolders:
-                log.warning(
-                    "llama-cpp-python can fail to find additional model files in subfolders. If you see a 404 error,"
-                    ' try manually supplying `model_load_kwargs={"additional_files": [...]}` or use huggingface-cli to'
-                    " download model files."
-                )
             for n in range(1, int(match[3]) + 1):
                 if n == int(match[2]):
                     continue
-                additional_files.append(f"{basename}-*{n}-of-{match[3]}.gguf")
+                additional_files.append(f"{match[1]}-*{n}-of-{match[3]}.gguf")
             log.info(f"additional_files={additional_files}")
             model_load_kwargs.setdefault("additional_files", additional_files)
 
diff --git a/sandbox/r1-quant.py b/sandbox/r1-quant.py
@@ -26,7 +26,7 @@
     repo_id="unsloth/DeepSeek-R1-GGUF",
     filename="DeepSeek-R1-Q2_K_XS/DeepSeek-R1-Q2_K_XS-00001-of-00005.gguf",
     prompt_pipeline=pipeline,
-    model_load_kwargs={"n_gpu_layers": -1},
+    model_load_kwargs={"n_gpu_layers": -1, "additional_files": []},
 )
 
 

Original file line number	Diff line number	Diff line change
`@@ -26,7 +26,7 @@`
`26`	`26`	`repo_id="unsloth/DeepSeek-R1-GGUF",`
`27`	`27`	`filename="DeepSeek-R1-Q2_K_XS/DeepSeek-R1-Q2_K_XS-00001-of-00005.gguf",`
`28`	`28`	`prompt_pipeline=pipeline,`
`29`		`- model_load_kwargs={"n_gpu_layers": -1},`
	`29`	`+ model_load_kwargs={"n_gpu_layers": -1, "additional_files": []},`
`30`	`30`	`)`
`31`	`31`
`32`	`32`