Skip to content

Commit fe3b812

Browse files
committed
Do not use defaultdict
1 parent f3ed732 commit fe3b812

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

convert_hf_to_gguf.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -11,7 +11,6 @@
1111
import os
1212
import re
1313
import sys
14-
from collections import defaultdict
1514
from enum import IntEnum
1615
from pathlib import Path
1716
from hashlib import sha256
@@ -8859,7 +8858,7 @@ def set_gguf_parameters(self):
88598858
self.gguf_writer.add_shortconv_l_cache(self.hparams["conv_L_cache"])
88608859

88618860
# cache for experts weights for merging
8862-
_experts_cache: dict[int, dict[str, Tensor]] | None = defaultdict(lambda: defaultdict(dict))
8861+
_experts_cache: dict[int, dict[str, Tensor]] = {}
88638862

88648863
def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None) -> Iterable[tuple[str, Tensor]]:
88658864
# conv op requires 2d tensor
@@ -8871,6 +8870,8 @@ def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None) -> Iter
88718870
n_experts = self.hparams["num_experts"]
88728871
assert bid is not None
88738872

8873+
if bid not in self._experts_cache:
8874+
self._experts_cache[bid] = {}
88748875
self._experts_cache[bid][name] = data_torch
88758876
expert_weights = ["w1", "w2", "w3"]
88768877

0 commit comments

Comments
 (0)