Skip to content

Commit 60e17ce

Browse files
authored
Remove identical wte/etw logic for jais (#10203)
1 parent 5107e8c commit 60e17ce

File tree

1 file changed

+0
-6
lines changed

1 file changed

+0
-6
lines changed

convert_hf_to_gguf.py

-6
Original file line number | Diff line number | Diff line change
@@ -3748,10 +3748,7 @@ def __init__(self, *args, **kwargs):
37483748

37493749
# Embeddings scale
37503750
self.embeddings_scale = 1.0
3751-
# note: For some JAIS flavors, output is tied to (same as) wte in original model
3752-
self.output_is_wte = False
37533751
if 'mup_embeddings_scale' in self.hparams:
3754-
self.output_is_wte = True # Hack (?)
37553752
self.embeddings_scale = self.hparams['mup_embeddings_scale']
37563753
elif 'embeddings_scale' in self.hparams:
37573754
self.embeddings_scale = self.hparams['embeddings_scale']
@@ -3808,10 +3805,7 @@ def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None) -> Iter
38083805

38093806
if new_name == self.format_tensor_name(gguf.MODEL_TENSOR.TOKEN_EMBD):
38103807
tensors.append((new_name, data_torch * self.embeddings_scale))
3811-
if self.output_is_wte:
3812-
tensors.append((self.format_tensor_name(gguf.MODEL_TENSOR.OUTPUT), data_torch * self.width_scale))
38133808
elif new_name == self.format_tensor_name(gguf.MODEL_TENSOR.OUTPUT):
3814-
assert not self.output_is_wte
38153809
tensors.append((new_name, data_torch * self.width_scale))
38163810
else:
38173811
tensors.append((new_name, data_torch))

0 commit comments

Comments
 (0)