Skip to content

Commit ca0e7ef

Browse files
committed
Adding Compute-Context-Length (CCL)
Signed-off-by: Vahid Janfaza <vjanfaza@qti.qualcomm.com>
1 parent 1142eba commit ca0e7ef

File tree

1 file changed

+12
-12
lines changed

1 file changed

+12
-12
lines changed

QEfficient/cloud/infer.py

Lines changed: 12 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -336,18 +336,18 @@ def main(
336 336
"--prompt-len", "--prompt_len", default=32, type=int, help="Sequence length for text generation."
337 337
)
338 338
parser.add_argument("--ctx-len", "--ctx_len", default=128, type=int, help="Context length for text generation.")
339-
parser.add_argument('--comp-ctx-lengths-prefill',
340-
type=lambda comp_ctx_lengths_prefill:
341-
[int(x) for x in comp_ctx_lengths_prefill.split(",")],
342-
default=[512],
343-
help='Define ccl list in csv format (e.g.,'
344-
'--comp-ctx-lengths 512,1024,2048).')
345-
parser.add_argument('--comp-ctx-lengths-decode',
346-
type=lambda comp_ctx_lengths_decode:
347-
[int(x) for x in comp_ctx_lengths_decode.split(",")],
348-
default=[2048],
349-
help='Define ccl list in csv format (e.g.,'
350-
'--comp-ctx-lengths 512,1024,2048).')
339+
parser.add_argument(
340+
"--comp-ctx-lengths-prefill",
341+
type=lambda comp_ctx_lengths_prefill: [int(x) for x in comp_ctx_lengths_prefill.split(",")],
342+
default=[512],
343+
help="Define ccl list in csv format (e.g.,--comp-ctx-lengths 512,1024,2048).",
344+
)
345+
parser.add_argument(
346+
"--comp-ctx-lengths-decode",
347+
type=lambda comp_ctx_lengths_decode: [int(x) for x in comp_ctx_lengths_decode.split(",")],
348+
default=[2048],
349+
help="Define ccl list in csv format (e.g.,--comp-ctx-lengths 512,1024,2048).",
350+
)
351 351
parser.add_argument(
352 352
"--mxfp6",
353 353
"--mxfp6_matmul",

0 commit comments

Comments
 (0)