Skip to content

Commit 1142eba

Browse files
committed
Adding Compute-Context-Length(CCL)
Signed-off-by: Vahid Janfaza <vjanfaza@qti.qualcomm.com>
1 parent 0b4ee3a commit 1142eba

File tree

1 file changed

+12
-0
lines changed

1 file changed

+12
-0
lines changed

QEfficient/cloud/infer.py

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -336,6 +336,18 @@ def main(
336336
"--prompt-len", "--prompt_len", default=32, type=int, help="Sequence length for text generation."
337337
)
338338
parser.add_argument("--ctx-len", "--ctx_len", default=128, type=int, help="Context length for text generation.")
339+
# Compute-context-length (CCL) list for the prefill option. The raw CLI value
# is a comma-separated string that is split and converted to a list of ints;
# when the flag is omitted the default is [512].
# The underscore spelling is accepted too, matching --prompt-len/--prompt_len
# and --ctx-len/--ctx_len; the first name still determines the parsed
# attribute (comp_ctx_lengths_prefill).
parser.add_argument(
    "--comp-ctx-lengths-prefill",
    "--comp_ctx_lengths_prefill",
    type=lambda csv_text: [int(item) for item in csv_text.split(",")],
    default=[512],
    # The example must spell out the full flag: the bare "--comp-ctx-lengths"
    # prefix is ambiguous between the prefill and decode options.
    help="Define the prefill ccl list in csv format (e.g., --comp-ctx-lengths-prefill 512,1024,2048).",
)
345+
# Compute-context-length (CCL) list for the decode option. The raw CLI value
# is a comma-separated string that is split and converted to a list of ints;
# when the flag is omitted the default is [2048].
# The underscore spelling is accepted too, matching --prompt-len/--prompt_len
# and --ctx-len/--ctx_len; the first name still determines the parsed
# attribute (comp_ctx_lengths_decode).
parser.add_argument(
    "--comp-ctx-lengths-decode",
    "--comp_ctx_lengths_decode",
    type=lambda csv_text: [int(item) for item in csv_text.split(",")],
    default=[2048],
    # The example must spell out the full flag: the bare "--comp-ctx-lengths"
    # prefix is ambiguous between the prefill and decode options.
    help="Define the decode ccl list in csv format (e.g., --comp-ctx-lengths-decode 512,1024,2048).",
)
339351
parser.add_argument(
340352
"--mxfp6",
341353
"--mxfp6_matmul",

0 commit comments

Comments
 (0)