You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboardExpand all lines: src/maxtext/configs/types.py
+6Lines changed: 6 additions & 0 deletions
Original file line number
Diff line number
Diff line change
@@ -1126,6 +1126,12 @@ class Distillation(BaseModel):
1126
1126
distill_beta: float=Field(0.0, description="Weight for the feature loss component. Use 0.0 to disable")
1127
1127
distill_layer_indices: None|list=Field(None, description="Feature indices for feature loss.")
1128
1128
1129
+
# --- Distillation freezing filter ---
1130
+
student_params_to_update: None|list=Field(
1131
+
None,
1132
+
description="A list of model param name templates to finetune in the student model. The other parameters will be frozen if this attribute is non-empty.",
1133
+
)
1134
+
1129
1135
1130
1136
class TrainingLoop(BaseModel):
1131
1137
"""Configuration for the main training loop, evaluation, and reproducibility."""
0 commit comments