We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
block_size
1 parent c261237 commit f226a3f (Copy full SHA for f226a3f)
tests/v1/kv_connector/nixl_integration/run_accuracy_test.sh
@@ -49,8 +49,8 @@ NUM_DECODE_INSTANCES=${NUM_DECODE_INSTANCES:-1} # Default to 1
49
PREFILLER_TP_SIZE=${PREFILLER_TP_SIZE:-1}
50
DECODER_TP_SIZE=${DECODER_TP_SIZE:-1}
51
GPU_MEMORY_UTILIZATION=${GPU_MEMORY_UTILIZATION:-0.2}
52
-PREFILL_BLOCK_SIZE=${PREFILL_BLOCK_SIZE:-16}
53
-DECODE_BLOCK_SIZE=${DECODE_BLOCK_SIZE:-16}
+PREFILL_BLOCK_SIZE=${PREFILL_BLOCK_SIZE:-128}
+DECODE_BLOCK_SIZE=${DECODE_BLOCK_SIZE:-128}
54
55
# Find the git repository root directory
56
GIT_ROOT=$(git rev-parse --show-toplevel)
0 commit comments