Compare commits

...

1 Commits

Author SHA1 Message Date
Ryuichi Leo Takashige
9a92eea656 Add explicit mx.eval on model parameters
If this doesn't work, we should fall back to the other strategies we have
2026-01-26 11:09:22 +00:00

View File

@@ -337,6 +337,7 @@ def tensor_auto_parallel(
if hasattr(model, "shard") and not isinstance(model, GptOssModel):
try:
model.shard(group) # type: ignore
mx.eval(model.parameters())
return patch_tensor_model(model)
except (AttributeError, TypeError, NameError):
pass