mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-12 19:50:17 +00:00
convert : identify missing model files (#9397)
Some checks failed
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/full-cuda.Dockerfile platforms:linux/amd64 tag:full-cuda]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/full.Dockerfile platforms:linux/amd64,linux/arm64 tag:full]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/llama-cli-cuda.Dockerfile platforms:linux/amd64 tag:light-cuda]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/llama-cli-intel.Dockerfile platforms:linux/amd64 tag:light-intel]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/llama-cli.Dockerfile platforms:linux/amd64,linux/arm64 tag:light]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/llama-server-cuda.Dockerfile platforms:linux/amd64 tag:server-cuda]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/llama-server-intel.Dockerfile platforms:linux/amd64 tag:server-intel]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/llama-server.Dockerfile platforms:linux/amd64,linux/arm64 tag:server]) (push) Waiting to run
Nix CI / nix-eval (macos-latest) (push) Waiting to run
Nix CI / nix-eval (ubuntu-latest) (push) Waiting to run
Nix CI / nix-build (macos-latest) (push) Waiting to run
Nix CI / nix-build (ubuntu-latest) (push) Waiting to run
Python check requirements.txt / check-requirements (push) Waiting to run
flake8 Lint / Lint (push) Waiting to run
Python Type-Check / pyright type-check (push) Waiting to run
Nix aarch64 builds / nix-build-aarch64 (push) Has been cancelled
Some checks failed
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/full-cuda.Dockerfile platforms:linux/amd64 tag:full-cuda]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/full.Dockerfile platforms:linux/amd64,linux/arm64 tag:full]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/llama-cli-cuda.Dockerfile platforms:linux/amd64 tag:light-cuda]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/llama-cli-intel.Dockerfile platforms:linux/amd64 tag:light-intel]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/llama-cli.Dockerfile platforms:linux/amd64,linux/arm64 tag:light]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/llama-server-cuda.Dockerfile platforms:linux/amd64 tag:server-cuda]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/llama-server-intel.Dockerfile platforms:linux/amd64 tag:server-intel]) (push) Waiting to run
Publish Docker image / Push Docker image to Docker Hub (map[dockerfile:.devops/llama-server.Dockerfile platforms:linux/amd64,linux/arm64 tag:server]) (push) Waiting to run
Nix CI / nix-eval (macos-latest) (push) Waiting to run
Nix CI / nix-eval (ubuntu-latest) (push) Waiting to run
Nix CI / nix-build (macos-latest) (push) Waiting to run
Nix CI / nix-build (ubuntu-latest) (push) Waiting to run
Python check requirements.txt / check-requirements (push) Waiting to run
flake8 Lint / Lint (push) Waiting to run
Python Type-Check / pyright type-check (push) Waiting to run
Nix aarch64 builds / nix-build-aarch64 (push) Has been cancelled
This commit is contained in:
parent
19514d632e
commit
d54c21df7e
@ -132,12 +132,14 @@ class Model:
|
|||||||
def get_tensors(self) -> Iterator[tuple[str, Tensor]]:
|
def get_tensors(self) -> Iterator[tuple[str, Tensor]]:
|
||||||
tensor_names_from_parts: set[str] = set()
|
tensor_names_from_parts: set[str] = set()
|
||||||
|
|
||||||
if len(self.part_names) > 1:
|
|
||||||
self.tensor_names = set()
|
|
||||||
index_name = "model.safetensors" if self.is_safetensors else "pytorch_model.bin"
|
index_name = "model.safetensors" if self.is_safetensors else "pytorch_model.bin"
|
||||||
index_name += ".index.json"
|
index_name += ".index.json"
|
||||||
|
index_file = self.dir_model / index_name
|
||||||
|
|
||||||
|
if index_file.is_file():
|
||||||
|
self.tensor_names = set()
|
||||||
logger.info(f"gguf: loading model weight map from '{index_name}'")
|
logger.info(f"gguf: loading model weight map from '{index_name}'")
|
||||||
with open(self.dir_model / index_name, "r", encoding="utf-8") as f:
|
with open(index_file, "r", encoding="utf-8") as f:
|
||||||
index: dict[str, Any] = json.load(f)
|
index: dict[str, Any] = json.load(f)
|
||||||
weight_map = index.get("weight_map")
|
weight_map = index.get("weight_map")
|
||||||
if weight_map is None or not isinstance(weight_map, dict):
|
if weight_map is None or not isinstance(weight_map, dict):
|
||||||
@ -145,6 +147,7 @@ class Model:
|
|||||||
self.tensor_names.update(weight_map.keys())
|
self.tensor_names.update(weight_map.keys())
|
||||||
else:
|
else:
|
||||||
self.tensor_names = tensor_names_from_parts
|
self.tensor_names = tensor_names_from_parts
|
||||||
|
weight_map = {}
|
||||||
|
|
||||||
for part_name in self.part_names:
|
for part_name in self.part_names:
|
||||||
logger.info(f"gguf: loading model part '{part_name}'")
|
logger.info(f"gguf: loading model part '{part_name}'")
|
||||||
@ -171,9 +174,17 @@ class Model:
|
|||||||
data = LazyTorchTensor.from_eager(data)
|
data = LazyTorchTensor.from_eager(data)
|
||||||
yield name, data
|
yield name, data
|
||||||
|
|
||||||
# only verify tensor name presence; it doesn't matter if they are not in the right files
|
# verify tensor name presence and identify potentially missing files
|
||||||
if len(sym_diff := tensor_names_from_parts.symmetric_difference(self.tensor_names)) > 0:
|
if len(tensor_names_from_parts.symmetric_difference(self.tensor_names)) > 0:
|
||||||
raise ValueError(f"Mismatch between weight map and model parts for tensor names: {sym_diff}")
|
missing = sorted(self.tensor_names.difference(tensor_names_from_parts))
|
||||||
|
extra = sorted(tensor_names_from_parts.difference(self.tensor_names))
|
||||||
|
missing_files = sorted(set(weight_map[n] for n in missing if n in weight_map))
|
||||||
|
if len(extra) == 0 and len(missing_files) > 0:
|
||||||
|
raise ValueError(f"Missing or incomplete model files: {missing_files}")
|
||||||
|
else:
|
||||||
|
raise ValueError("Mismatch between weight map and model parts for tensor names:\n"
|
||||||
|
f"Missing tensors: {missing}\n"
|
||||||
|
f"Extra tensors: {extra}")
|
||||||
|
|
||||||
def format_tensor_name(self, key: gguf.MODEL_TENSOR, bid: int | None = None, suffix: str = ".weight") -> str:
|
def format_tensor_name(self, key: gguf.MODEL_TENSOR, bid: int | None = None, suffix: str = ".weight") -> str:
|
||||||
if key not in gguf.MODEL_TENSORS[self.model_arch]:
|
if key not in gguf.MODEL_TENSORS[self.model_arch]:
|
||||||
|
Loading…
Reference in New Issue
Block a user