Skip to content

Commit 5d16abb

Browse files
Merge pull request #3528 from AI-Hypercomputer:agagik-kimi-checkpoint
PiperOrigin-RevId: 895408378
2 parents e0cb1d5 + fb99a79 commit 5d16abb

1 file changed

Lines changed: 8 additions & 4 deletions

File tree

src/maxtext/checkpoint_conversion/standalone_scripts/convert_deepseek_family_unscanned_ckpt.py

Lines changed: 8 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -70,10 +70,14 @@ def _convert_huggingface_to_jax_weights(base_model_path, model_params, mem_info)
70 70
if key.endswith("_scale_inv"):
71 71
raise ValueError("fp8 checkpoint is not supported.")
72 72
if ds_ckpt.is_key_allowed(key, ds_ckpt.MTP_KEYS_TO_SKIP):
if ds_ckpt.is_key_allowed(key, ds_ckpt.MTP_KEYS_TO_SKIP):
73-
mapped_key = ds_ckpt.hf_to_maxtext_mapping(layer, num_experts, first_num_dense_layers, base_num_decoder_layers)[
74-
key
75-
]
76-
chkpt_vars[mapped_key] = f.get_tensor(key)
73+
mapped_key = ds_ckpt.hf_to_maxtext_mapping(
74+
layer, num_experts, first_num_dense_layers, base_num_decoder_layers
75+
).get(key)
76+
if mapped_key:
77+
chkpt_vars[mapped_key] = f.get_tensor(key)
78+
else:
79+
# This catches keys that are allowed but missing from the mapping dictionary
80+
max_logging.log(f"Debug: Allowed key '{key}' (layer {layer}) has no mapping in hf_to_maxtext_mapping.")
77 81

78 82
logging.debug("Memory usage: %f GB", mem_info.memory_info().rss / (1024**3))
79 83

0 commit comments

Comments
 (0)