Skip to content

Commit 8508d15

Browse files
RobertLucian authored and vishalbollu committed
Remove unnecessary env var & reposition env var source (#1184)
(cherry picked from commit 8843326)
1 parent 5db3084 commit 8508d15

File tree

4 files changed

+11
-13
lines changed

4 files changed

+11
-13
lines changed

cli/local/docker_spec.go

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -93,7 +93,7 @@ func getAPIEnv(api *spec.API, awsClient *aws.Client) []string {
9393
"CORTEX_THREADS_PER_PROCESS="+s.Int32(api.Predictor.ThreadsPerProcess),
9494
// add 1 because it was required to achieve the target concurrency for 1 process, 1 thread
9595
"CORTEX_MAX_PROCESS_CONCURRENCY="+s.Int64(1+int64(math.Round(float64(consts.DefaultMaxReplicaConcurrency)/float64(api.Predictor.ProcessesPerReplica)))),
96-
"CORTEX_SO_MAX_CONN=1000",
96+
"CORTEX_SO_MAX_CONN="+s.Int64(consts.DefaultMaxReplicaConcurrency+100), // add a buffer to be safe
9797
"AWS_REGION="+awsClient.Region,
9898
)
9999

pkg/operator/operator/k8s_specs.go

Lines changed: 0 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -624,10 +624,6 @@ func getEnvVars(api *spec.API, container string) []kcore.EnvVar {
624624
Name: "CORTEX_THREADS_PER_PROCESS",
625625
Value: s.Int32(api.Predictor.ThreadsPerProcess),
626626
},
627-
kcore.EnvVar{
628-
Name: "CORTEX_MAX_REPLICA_CONCURRENCY",
629-
Value: s.Int64(api.Autoscaling.MaxReplicaConcurrency),
630-
},
631627
kcore.EnvVar{
632628
Name: "CORTEX_MAX_PROCESS_CONCURRENCY",
633629
// add 1 because it was required to achieve the target concurrency for 1 process, 1 thread

pkg/workloads/cortex/serve/run.sh

Lines changed: 7 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -39,6 +39,13 @@ rm -rf /mnt/workspace/api_readiness.txt
3939
# allow for the liveness check to pass until the API is running
4040
echo "9999999999" > /mnt/workspace/api_liveness.txt
4141

42+
# export environment variables
43+
if [ -f "/mnt/project/.env" ]; then
44+
set -a
45+
source /mnt/project/.env
46+
set +a
47+
fi
48+
4249
export PYTHONPATH=$PYTHONPATH:$PYTHON_PATH
4350
# ensure predictor print() statements are always flushed
4451
export PYTHONUNBUFFERED=TRUE
@@ -49,13 +56,6 @@ if [ "$CORTEX_PROVIDER" != "local" ]; then
4956
sysctl -w net.ipv4.tcp_fin_timeout=30 >/dev/null
5057
fi
5158

52-
# export environment variables
53-
if [ -f "/mnt/project/.env" ]; then
54-
set -a
55-
source /mnt/project/.env
56-
set +a
57-
fi
58-
5959
# execute script if present in project's directory
6060
if [ -f "/mnt/project/dependencies.sh" ]; then
6161
bash -e /mnt/project/dependencies.sh

pkg/workloads/cortex/serve/start_uvicorn.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -87,7 +87,9 @@ def main():
8787
host="0.0.0.0",
8888
port=int(os.environ["CORTEX_SERVING_PORT"]),
8989
workers=int(os.environ["CORTEX_PROCESSES_PER_REPLICA"]),
90-
limit_concurrency=int(os.environ["CORTEX_MAX_PROCESS_CONCURRENCY"]),
90+
limit_concurrency=int(
91+
os.environ["CORTEX_MAX_PROCESS_CONCURRENCY"]
92+
), # this is a per process limit
9193
backlog=int(os.environ["CORTEX_SO_MAX_CONN"]),
9294
log_config=log_config,
9395
log_level="info",

0 commit comments

Comments
 (0)