]> git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
llava : avoid changing the original BakLLaVA model (#5577)
authorDaniel Bevenius <redacted>
Mon, 19 Feb 2024 08:31:59 +0000 (09:31 +0100)
committerGitHub <redacted>
Mon, 19 Feb 2024 08:31:59 +0000 (10:31 +0200)
This is a follup of Commit fc0c8d286a533363a9a663510b62af85ffad58b3
("llava : update surgery script to not remove tensors") but this time
the change is to the BakLLaVA specific part of the surgery script.

I've been able to test this using SkunkworksAI/BakLLaVA-1 and it works
as expected using the instructions in README.md.

Signed-off-by: Daniel Bevenius <redacted>
examples/llava/llava-surgery.py

index 8b7a62fbaa145b358ed84093685514a7557faa90..4f2da3beefff670cfd61ffcff3769651d74a551c 100644 (file)
@@ -25,9 +25,6 @@ if len(clip_tensors) > 0:
     clip = {name.replace("vision_tower.vision_tower.", ""): checkpoint[name].float() for name in clip_tensors}
     torch.save(clip, f"{args.model}/llava.clip")
 
-    # remove these tensors
-    for name in clip_tensors:
-        del checkpoint[name]
 
     # added tokens should be removed to be able to convert Mistral models
     if os.path.exists(f"{args.model}/added_tokens.json"):
@@ -35,7 +32,6 @@ if len(clip_tensors) > 0:
             f.write("{}\n")
 
 
-    torch.save(checkpoint, path)
 
 print("Done!")
 print(f"Now you can convert {args.model} to a regular LLaMA GGUF file.")