-
Notifications
You must be signed in to change notification settings - Fork 11
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Signed-off-by: Mayank Mishra <[email protected]>
- Loading branch information
1 parent 917c3c6, commit 15aa971
Showing 6 changed files with 49 additions and 30 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,8 +1,8 @@ | ||
from ...mixins import CausalLMModelMixin_TP | ||
from .base import GPTDolomiteModel_TP, GPTDolomitePreTrainedModel_TP | ||
from .weights import get_gpt_dolomite_tensor_parallel_state_dict | ||
from .weights import get_gpt_dolomite_model_parallel_state_dict | ||
|
||
|
||
class GPTDolomiteForCausalLM_TP(GPTDolomitePreTrainedModel_TP, CausalLMModelMixin_TP): | ||
base_model_class = GPTDolomiteModel_TP | ||
tensor_parallel_state_dict_function = get_gpt_dolomite_tensor_parallel_state_dict | ||
model_parallel_state_dict_function = get_gpt_dolomite_model_parallel_state_dict |
2 changes: 1 addition & 1 deletion
2
dolomite_engine/hf_models/models/gpt_dolomite_TP/weights/__init__.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,2 +1,2 @@ | ||
from .shard import get_gpt_dolomite_tensor_parallel_state_dict | ||
from .shard import get_gpt_dolomite_model_parallel_state_dict | ||
from .unshard import fix_gpt_dolomite_unsharded_state_dict, unshard_gpt_dolomite_tensor_parallel_state_dicts |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters