|
16 | 16 | required: false |
17 | 17 | type: string |
18 | 18 | default: 'terminal-bench-core==0.1.1' |
19 | | - concurrency: |
20 | | - description: 'Number of concurrent tasks (--n-concurrent)' |
21 | | - required: false |
22 | | - type: string |
23 | | - default: '4' |
24 | 19 | livestream: |
25 | 20 | description: 'Enable livestream mode (verbose output to console)' |
26 | 21 | required: false |
|
30 | 25 | description: 'Number of random tasks to run (empty = all tasks)' |
31 | 26 | required: false |
32 | 27 | type: string |
| 28 | + load_threshold: |
| 29 | + description: 'Load threshold for adaptive concurrency (default: 1.0)' |
| 30 | + required: false |
| 31 | + type: string |
| 32 | + default: '1.0' |
| 33 | + check_interval: |
| 34 | + description: 'Seconds between adaptive bursts (default: 60)' |
| 35 | + required: false |
| 36 | + type: string |
| 37 | + default: '60' |
33 | 38 | extra_args: |
34 | 39 | description: 'Additional arguments to pass to terminal-bench' |
35 | 40 | required: false |
|
46 | 51 | required: false |
47 | 52 | default: 'terminal-bench-core==0.1.1' |
48 | 53 | type: string |
49 | | - concurrency: |
50 | | - description: 'Number of concurrent tasks (--n-concurrent)' |
51 | | - required: false |
52 | | - default: '4' |
53 | | - type: string |
54 | 54 | livestream: |
55 | 55 | description: 'Enable livestream mode (verbose output to console)' |
56 | 56 | required: false |
|
68 | 68 | description: 'Thinking level (off, low, medium, high)' |
69 | 69 | required: false |
70 | 70 | type: string |
| 71 | + load_threshold: |
| 72 | + description: 'Load threshold for adaptive concurrency (default: 1.0)' |
| 73 | + required: false |
| 74 | + default: '1.0' |
| 75 | + type: string |
| 76 | + check_interval: |
| 77 | + description: 'Seconds between adaptive bursts (default: 60)' |
| 78 | + required: false |
| 79 | + default: '60' |
| 80 | + type: string |
71 | 81 | extra_args: |
72 | 82 | description: 'Additional arguments to pass to terminal-bench' |
73 | 83 | required: false |
@@ -105,7 +115,8 @@ jobs: |
105 | 115 | run: make benchmark-terminal 2>&1 | tee benchmark.log |
106 | 116 | env: |
107 | 117 | TB_DATASET: ${{ inputs.dataset }} |
108 | | - TB_CONCURRENCY: ${{ inputs.concurrency }} |
| 118 | + TB_LOAD_THRESHOLD: ${{ inputs.load_threshold }} |
| 119 | + TB_CHECK_INTERVAL: ${{ inputs.check_interval }} |
109 | 120 | TB_LIVESTREAM: ${{ inputs.livestream && '1' || '' }} |
110 | 121 | TB_SAMPLE_SIZE: ${{ inputs.sample_size }} |
111 | 122 | TB_ARGS: ${{ inputs.model_name && format('--agent-kwarg model_name={0} --agent-kwarg thinking_level={1} {2}', inputs.model_name, inputs.thinking_level, inputs.extra_args) || inputs.extra_args }} |
|
0 commit comments