Skip to content

Commit ea529c5

Browse files
authored
Merge pull request #134 from foundation-model-stack/fix_test_scripts
Update test scripts to work with the 4-layer micro model
2 parents 24b25b0 + f997e8a commit ea529c5

File tree

1 file changed

+10
-7
lines changed

1 file changed

+10
-7
lines changed

tests/models/test_scripts.py

Lines changed: 10 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -17,9 +17,9 @@
1717
else:
1818
common_model_paths = common_model_paths.split(",")
1919

20-
common_batch_sizes = [1, 8]
20+
common_batch_sizes = [1, 4]
2121
common_seq_lengths = [64]
22-
common_max_new_tokens = [12]
22+
common_max_new_tokens = [8]
2323
common_attn_types = ["sdpa", "paged"]
2424

2525
common_params = list(
@@ -36,7 +36,10 @@
3636

3737

3838
def execute_script(execute_cmd):
39-
current_env["MAX_SHAREDPROG_ITERS"] = f"{common_max_new_tokens[0]}"
39+
# using these options temporarily
40+
current_env["VLLM_DT_MAX_BATCH_TKV_LIMIT"] = "16384"
41+
current_env["VLLM_DT_MAX_BATCH_SIZE"] = "4"
42+
current_env["VLLM_DT_MAX_CONTEXT_LEN"] = "4096"
4043

4144
with Popen(
4245
execute_cmd,
@@ -79,10 +82,10 @@ def execute_inference(model_path, batch_size, seq_length, max_new_tokens, attn_t
7982

8083

8184
common_asserts = [
82-
"### Response:\nProvide a list of instructions for preparing chicken soup",
83-
"### Response:\nExplain some popular greetings in Spanish.",
84-
"### Response:\nExplain to me why ignorance is bliss.",
85-
"### Response:\nI have just come into a very large sum of money",
85+
"### Response:\n\n1.\n\nThe following",
86+
"### Response:\n\n1.\n\nI am",
87+
"### Response:\n\nI am not sure what you",
88+
"### Response:\n\nI have just come into a",
8689
]
8790

8891

0 commit comments

Comments
 (0)