From e68431b7324b5ca850d8863c865bf5cf1192ac2c Mon Sep 17 00:00:00 2001
From: Gabe Goodhart
Date: Mon, 23 Sep 2024 09:32:23 -0600
Subject: [PATCH] Typo fix in docstring

Co-Authored-By: ggerganov@gmail.com
Co-authored-by: Georgi Gerganov
Signed-off-by: Gabe Goodhart
---
 convert_hf_to_gguf.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py
index ea9daca826366b..d62ecb99790806 100755
--- a/convert_hf_to_gguf.py
+++ b/convert_hf_to_gguf.py
@@ -4122,7 +4122,7 @@ class GraniteMoeModel(GraniteModel):
     def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None) -> Iterable[tuple[str, Tensor]]:
         """In modeling_granitemoe, the JetMoe implementation of parallel experts
         is used. This essentially merges w1 and w3 into a single tensor with 2x
-        the hidden size that is then split during forward. To keep compativility
+        the hidden size that is then split during forward. To keep compatibility
         with existing mixtral support, we pull them apart here.
         """
 