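Add unit tests for Triton model deployments; keep CONTAINER_TYPE in the runtime env and guard the inference_server check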

Ziqun Ye · Ziqun Ye · commit 350f0eaabed4 · 2023-04-10T12:24:53.000-07:00
diff --git a/ads/model/deployment/model_deployment.py b/ads/model/deployment/model_deployment.py
@@ -1404,7 +1404,7 @@ def _update_from_oci_model(self, oci_model_instance) -> "ModelDeployment":
             infrastructure.CONST_WEB_CONCURRENCY,
             runtime.env.get("WEB_CONCURRENCY", None),
         )
-        if runtime.env.pop("CONTAINER_TYPE", None) == "TRITON":
+        if runtime.env.get("CONTAINER_TYPE", None) == "TRITON":
             runtime.set_spec(
                 runtime.CONST_INFERENCE_SERVER, "triton"
             )
@@ -1584,7 +1584,7 @@ def _build_model_deployment_configuration_details(self) -> Dict:
                 infrastructure.web_concurrency
             )
             runtime.set_spec(runtime.CONST_ENV, environment_variables)
-        if runtime.inference_server.lower() == "triton":
+        if hasattr(runtime, "inference_server") and runtime.inference_server and runtime.inference_server.lower() == "triton":
             environment_variables["CONTAINER_TYPE"] = "TRITON"
             runtime.set_spec(runtime.CONST_ENV, environment_variables)
         environment_configuration_details = {
diff --git a/tests/unitary/default_setup/model_deployment/test_model_deployment_v2.py b/tests/unitary/default_setup/model_deployment/test_model_deployment_v2.py
@@ -308,6 +308,62 @@ def initialize_model_deployment_from_spec(self):
                 "runtime": runtime,
             }
         )
+        
+    def initialize_model_deployment_triton_builder(self):
+        infrastructure = ModelDeploymentInfrastructure()\
+            .with_compartment_id("fakeid.compartment.oc1..xxx")\
+            .with_project_id("fakeid.datascienceproject.oc1.iad.xxx")\
+            .with_shape_name("VM.Standard.E4.Flex")\
+            .with_replica(2)\
+            .with_bandwidth_mbps(10)\
+
+        runtime = ModelDeploymentContainerRuntime()\
+            .with_image("fake_image")\
+            .with_server_port(5000)\
+            .with_health_check_port(5000)\
+            .with_model_uri("fake_model_id")\
+            .with_env({"key":"value", "key2":"value2"})\
+            .with_inference_server("triton")
+        
+        deployment = ModelDeployment()\
+            .with_display_name("triton case")\
+            .with_infrastructure(infrastructure)\
+            .with_runtime(runtime)
+        return deployment
+
+    def initialize_model_deployment_triton_yaml(self):
+        yaml_string = """
+kind: deployment
+spec:
+  displayName: triton
+  infrastructure:
+    kind: infrastructure
+    spec:
+      bandwidthMbps: 10
+      compartmentId: fake_compartment_id
+      deploymentType: SINGLE_MODEL
+      policyType: FIXED_SIZE
+      replica: 2
+      shapeConfigDetails:
+        memoryInGBs: 16.0
+        ocpus: 1.0
+      shapeName: VM.Standard.E4.Flex
+    type: datascienceModelDeployment
+  runtime:
+    kind: runtime
+    spec:
+      env:
+        key: value
+        key2: value2
+      inference_server: triton
+      healthCheckPort: 8000
+      image: fake_image
+      modelUri: fake_model_id
+      serverPort: 8000
+    type: container
+"""
+        deployment_from_yaml = ModelDeployment.from_yaml(yaml_string)
+        return deployment_from_yaml
 
     def initialize_model_deployment_from_kwargs(self):
         infrastructure = (
@@ -435,11 +491,34 @@ def test_initialize_model_deployment_with_error(self):
                 },
             )
 
+
     def test_initialize_model_deployment_with_spec_kwargs(self):
         model_deployment_kwargs = self.initialize_model_deployment_from_kwargs()
         model_deployment_builder = self.initialize_model_deployment()
 
         assert model_deployment_kwargs.to_dict() == model_deployment_builder.to_dict()
+        
+        
+    def test_initialize_model_deployment_triton_builder(self):
+        temp_model_deployment = self.initialize_model_deployment_triton_builder()
+        assert isinstance(
+            temp_model_deployment.runtime, ModelDeploymentContainerRuntime
+        )
+        assert isinstance(
+            temp_model_deployment.infrastructure, ModelDeploymentInfrastructure
+        )
+        assert temp_model_deployment.runtime.inference_server == "triton"
+    
+    def test_initialize_model_deployment_triton_yaml(self):
+        temp_model_deployment = self.initialize_model_deployment_triton_yaml()
+        assert isinstance(
+            temp_model_deployment.runtime, ModelDeploymentContainerRuntime
+        )
+        assert isinstance(
+            temp_model_deployment.infrastructure, ModelDeploymentInfrastructure
+        )
+        assert temp_model_deployment.runtime.inference_server == "triton"
+        
 
     def test_model_deployment_to_dict(self):
         model_deployment = self.initialize_model_deployment()

Original file line number	Diff line number	Diff line change
`@@ -1404,7 +1404,7 @@ def _update_from_oci_model(self, oci_model_instance) -> "ModelDeployment":`
`1404`	`1404`	`infrastructure.CONST_WEB_CONCURRENCY,`
`1405`	`1405`	`runtime.env.get("WEB_CONCURRENCY", None),`
`1406`	`1406`	`)`
`1407`		`- if runtime.env.pop("CONTAINER_TYPE", None) == "TRITON":`
	`1407`	`+ if runtime.env.get("CONTAINER_TYPE", None) == "TRITON":`
`1408`	`1408`	`runtime.set_spec(`
`1409`	`1409`	`runtime.CONST_INFERENCE_SERVER, "triton"`
`1410`	`1410`	`)`
`@@ -1584,7 +1584,7 @@ def _build_model_deployment_configuration_details(self) -> Dict:`
`1584`	`1584`	`infrastructure.web_concurrency`
`1585`	`1585`	`)`
`1586`	`1586`	`runtime.set_spec(runtime.CONST_ENV, environment_variables)`
`1587`		`- if runtime.inference_server.lower() == "triton":`
	`1587`	`+ if hasattr(runtime, "inference_server") and runtime.inference_server and runtime.inference_server.lower() == "triton":`
`1588`	`1588`	`environment_variables["CONTAINER_TYPE"] = "TRITON"`
`1589`	`1589`	`runtime.set_spec(runtime.CONST_ENV, environment_variables)`
`1590`	`1590`	`environment_configuration_details = {`