We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 239f375 commit eadaea7Copy full SHA for eadaea7
src/twinkle/model/transformers/transformers.py
@@ -955,9 +955,6 @@ def _get_full_state_dict(self) -> dict:
955
the local expert shards across the EP group to reconstruct the
956
full expert tensor (all num_experts on dim-0).
957
"""
958
- import torch
959
- import torch.distributed as dist
960
-
961
model = self.strategy.unwrap_model(self.model)
962
state_dict = {}
963
0 commit comments