We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 8390b01 commit f2cd562 (Copy full SHA for f2cd562)
tests/models/glm4_moe/test_modeling_glm4_moe.py
@@ -61,6 +61,7 @@ class Glm4MoeModelTest(CausalLMModelTest, unittest.TestCase):
61
model_tester_class = Glm4MoeModelTester
62
# used in `test_torch_compile_for_training`. Skip as "Dynamic control flow in MoE"
63
_torch_compile_train_cls = None
64
+ model_split_percents = [0.5, 0.85, 0.9] # it tries to offload everything with the default value
65
66
67
@require_torch_accelerator
0 commit comments