Skip to content

Commit 5cd85b5

Browse files
authored
convert : add BertForMaskedLM (#10919)
1 parent a91a413 commit 5cd85b5

File tree

1 file changed

+16
-1
lines changed

1 file changed

+16
-1
lines changed

convert_hf_to_gguf.py

+16 -1
Original file line number | Diff line number | Diff line change
@@ -2628,7 +2628,7 @@ def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None) -> Iter
26282628
return [(self.map_tensor_name(name), data_torch)]
26292629

26302630

2631-
@Model.register("BertModel", "CamembertModel")
2631+
@Model.register("BertModel", "BertForMaskedLM", "CamembertModel")
26322632
class BertModel(Model):
26332633
model_arch = gguf.MODEL_ARCH.BERT
26342634

@@ -2694,10 +2694,25 @@ def phantom(tok):
26942694
def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None) -> Iterable[tuple[str, Tensor]]:
26952695
del bid # unused
26962696

2697+
if name.startswith("bert."):
2698+
name = name[5:]
2699+
2700+
if name.endswith(".gamma"):
2701+
name = name[:-6] + ".weight"
2702+
2703+
if name.endswith(".beta"):
2704+
name = name[:-5] + ".bias"
2705+
26972706
# we are only using BERT for embeddings so we don't need the pooling layer
26982707
if name in ("embeddings.position_ids", "pooler.dense.weight", "pooler.dense.bias"):
26992708
return [] # we don't need these
27002709

2710+
if name.startswith("cls.predictions"):
2711+
return []
2712+
2713+
if name.startswith("cls.seq_relationship"):
2714+
return []
2715+
27012716
return [(self.map_tensor_name(name), data_torch)]
27022717

27032718

0 commit comments

Comments
 (0)