Adding Compute-Context-Length (CCL)

vjanfaza · vjanfaza · commit 0b4ee3a99e29 · 2025-10-14T09:47:49.000-07:00
Signed-off-by: Vahid Janfaza <vjanfaza@qti.qualcomm.com>
diff --git a/QEfficient/utils/check_ccl_specializations.py b/QEfficient/utils/check_ccl_specializations.py
@@ -7,14 +7,17 @@
 
 from typing import List, Optional
 
-def process_ccl_specializations(ccl_prefill: Optional[List[int]]=None, ccl_decode: Optional[List[int]]=None, ctx_len: Optional[int]=None):
+
+def process_ccl_specializations(
+    ccl_prefill: Optional[List[int]] = None, ccl_decode: Optional[List[int]] = None, ctx_len: Optional[int] = None
+):
     if ctx_len is None:
         raise TypeError("`ctx_len` is required when loading the model.")
     if ccl_prefill is None:
         ccl_prefill = [ctx_len]
     if ccl_decode is None:
         ccl_decode = [ctx_len]
-        
+
     # Step 1: Cap values to ctx_len
     ccl_prefill = [min(x, ctx_len) for x in ccl_prefill]
     ccl_decode = [min(x, ctx_len) for x in ccl_decode]
@@ -37,4 +40,4 @@ def process_ccl_specializations(ccl_prefill: Optional[List[int]]=None, ccl_decod
     updated_prefill.sort()
     ccl_decode.sort()
 
-    return updated_prefill, ccl_decode
+    return updated_prefill, ccl_decode