File tree Expand file tree Collapse file tree 1 file changed +7
-6
lines changed Expand file tree Collapse file tree 1 file changed +7
-6
lines changed Original file line number Diff line number Diff line change 722
722
),
723
723
)
724
724
725
-
725
+ # Config only runs on v6e-256
726
726
llama3_1_405b_8192_fsdp_dcn = _add_to_model_dictionary (
727
727
trillium_model_dict ,
728
728
MaxTextModel (
776
776
),
777
777
)
778
778
779
+ # Config only runs on v6e-256
779
780
llama3_1_405b_8192_pure_fsdp_ici = _add_to_model_dictionary (
780
781
trillium_model_dict ,
781
782
MaxTextModel (
1524
1525
),
1525
1526
)
1526
1527
1528
+ # Config only runs on v6e-256
1527
1529
mixtral_8x22b_dropped = _add_to_model_dictionary (
1528
1530
trillium_model_dict ,
1529
1531
MaxTextModel (
1568
1570
),
1569
1571
)
1570
1572
1573
+ # Config only runs on v6e-256
1571
1574
deepseek_v3_ep16 = _add_to_model_dictionary (
1572
1575
trillium_model_dict ,
1573
1576
MaxTextModel (
1608
1611
),
1609
1612
)
1610
1613
1611
-
1614
+ # Config only runs on v6e-256
1612
1615
gemma2_9b_8192 = _add_to_model_dictionary (
1613
1616
trillium_model_dict ,
1614
1617
MaxTextModel (
1641
1644
),
1642
1645
)
1643
1646
1644
-
1647
+ # Config only runs on v6e-256
1645
1648
gemma2_27b_8192 = _add_to_model_dictionary (
1646
1649
trillium_model_dict ,
1647
1650
MaxTextModel (
1736
1739
)
1737
1740
)
1738
1741
1739
- # Customized MoE model - 700B
1742
+ # Customized MoE model - 700B, and config only runs on v6e-256
1740
1743
custom_moe_700b = _add_to_model_dictionary (
1741
1744
trillium_model_dict ,
1742
1745
MaxTextModel (
1797
1800
),
1798
1801
),
1799
1802
)
1800
-
1801
-
You can’t perform that action at this time.
0 commit comments