Skip to content

Commit 4b099d9

Browse files
author
maxtext authors
committed
Merge pull request #1830 from AI-Hypercomputer:model_comment
PiperOrigin-RevId: 771232937
2 parents 02b6b8d + be799de commit 4b099d9

File tree

1 file changed

+7
-6
lines changed

1 file changed

+7
-6
lines changed

benchmarks/maxtext_trillium_model_configs.py

Lines changed: 7 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -722,7 +722,7 @@
722722
),
723723
)
724724

725-
725+
# Config only runs on v6e-256
726726
llama3_1_405b_8192_fsdp_dcn = _add_to_model_dictionary(
727727
trillium_model_dict,
728728
MaxTextModel(
@@ -776,6 +776,7 @@
776776
),
777777
)
778778

779+
# Config only runs on v6e-256
779780
llama3_1_405b_8192_pure_fsdp_ici = _add_to_model_dictionary(
780781
trillium_model_dict,
781782
MaxTextModel(
@@ -1524,6 +1525,7 @@
15241525
),
15251526
)
15261527

1528+
# Config only runs on v6e-256
15271529
mixtral_8x22b_dropped = _add_to_model_dictionary(
15281530
trillium_model_dict,
15291531
MaxTextModel(
@@ -1568,6 +1570,7 @@
15681570
),
15691571
)
15701572

1573+
# Config only runs on v6e-256
15711574
deepseek_v3_ep16 = _add_to_model_dictionary(
15721575
trillium_model_dict,
15731576
MaxTextModel(
@@ -1608,7 +1611,7 @@
16081611
),
16091612
)
16101613

1611-
1614+
# Config only runs on v6e-256
16121615
gemma2_9b_8192 = _add_to_model_dictionary(
16131616
trillium_model_dict,
16141617
MaxTextModel(
@@ -1641,7 +1644,7 @@
16411644
),
16421645
)
16431646

1644-
1647+
# Config only runs on v6e-256
16451648
gemma2_27b_8192 = _add_to_model_dictionary(
16461649
trillium_model_dict,
16471650
MaxTextModel(
@@ -1736,7 +1739,7 @@
17361739
)
17371740
)
17381741

1739-
# Customized MoE model - 700B
1742+
# Customized MoE model - 700B, and config only runs on v6e-256
17401743
custom_moe_700b = _add_to_model_dictionary(
17411744
trillium_model_dict,
17421745
MaxTextModel(
@@ -1797,5 +1800,3 @@
17971800
),
17981801
),
17991802
)
1800-
1801-

0 commit comments

Comments
 (0)