Skip to content

Commit d62e4aa

Browse files
fairydreaming, sszymczy, mofosyne
authored
gguf-py : fix tensor groups for encoder-decoder models in gguf-dump.py (#8090)
Co-authored-by: Stanisław Szymczyk <[email protected]> Co-authored-by: Brian <[email protected]>
1 parent 9a590c8 commit d62e4aa

File tree

1 file changed

+7
-1
lines changed

1 file changed

+7
-1
lines changed

gguf-py/scripts/gguf-dump.py

Lines changed: 7 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -208,7 +208,9 @@ def translate_tensor_name(name):
208208
'ssm_d': 'State space model skip connection',
209209
'ssm_dt': 'State space model time step',
210210
'ssm_out': 'State space model output projection',
211-
'blk': 'Block'
211+
'blk': 'Block',
212+
'enc': 'Encoder',
213+
'dec': 'Decoder',
212214
}
213215

214216
expanded_words = []
@@ -291,6 +293,10 @@ def dump_markdown_metadata(reader: GGUFReader, args: argparse.Namespace) -> None
291293
tensor_group_name = "base"
292294
if tensor_components[0] == 'blk':
293295
tensor_group_name = f"{tensor_components[0]}.{tensor_components[1]}"
296+
elif tensor_components[0] in ['enc', 'dec'] and tensor_components[1] == 'blk':
297+
tensor_group_name = f"{tensor_components[0]}.{tensor_components[1]}.{tensor_components[2]}"
298+
elif tensor_components[0] in ['enc', 'dec']:
299+
tensor_group_name = f"{tensor_components[0]}"
294300

295301
# Check if new Tensor Group
296302
if tensor_group_name not in tensor_groups:

0 commit comments

Comments
 (0)