Modify unit tests to include fine-tuned models

elizjo · elizjo · commit f5e1bb074b44 · 2025-05-09T15:43:37.000-07:00
diff --git a/ads/aqua/common/entities.py b/ads/aqua/common/entities.py
@@ -157,6 +157,8 @@ class AquaMultiModelRef(Serializable):
         Optional environment variables to override during deployment.
     artifact_location : Optional[str]
         Artifact path of model in the multimodel group.
+    fine_tune_artifact : Optional[str]
+        For fine-tuned models, the artifact path of the modified model weights.
     """
 
     model_id: str = Field(..., description="The model OCID to deploy.")
@@ -171,6 +173,9 @@ class AquaMultiModelRef(Serializable):
     artifact_location: Optional[str] = Field(
         None, description="Artifact path of model in the multimodel group."
     )
+    fine_tune_artifact: Optional[str] = Field(
+        None, description="For fine tuned models, the artifact path of the modified model weights"
+    )
 
     class Config:
         extra = "ignore"
diff --git a/ads/aqua/model/utils.py b/ads/aqua/model/utils.py
@@ -48,7 +48,7 @@ def set_fine_tune_env_var(aqua_model: DataScienceModel, env_var: Optional[Dict[s
     # we add the correct artifact location when using FT in Multi Model Deployment
     if model:
         model.artifact_location = base_model_path # validated later in _create_multi method in deployment.py
-        model.env_var.update({"FT_MODEL": f"{fine_tune_output_path}"})
+        model.fine_tune_artifact = fine_tune_output_path
 
     else:
         env_var.update({"FT_MODEL": f"{fine_tune_output_path}"})
diff --git a/ads/aqua/modeldeployment/deployment.py b/ads/aqua/modeldeployment/deployment.py
@@ -623,10 +623,8 @@ def _create_multi(
             if model.model_task:
                 config_data["model_task"] = model.model_task
 
-            fine_tuned_model = model.env_var.get("FT_MODEL")
-
-            if fine_tuned_model:
-                config_data["FT_MODEL"] = fine_tuned_model
+            if model.fine_tune_artifact:
+                config_data["fine_tune_path"] = model.fine_tune_artifact
 
             model_config.append(config_data)
             model_name_list.append(model.model_name)
diff --git a/tests/unitary/with_extras/aqua/test_deployment.py b/tests/unitary/with_extras/aqua/test_deployment.py
@@ -275,7 +275,7 @@ class TestDataset:
                         "environment_configuration_type": "OCIR_CONTAINER",
                         "environment_variables": {
                             "MODEL_DEPLOY_PREDICT_ENDPOINT": "/v1/completions",
-                            "MULTI_MODEL_CONFIG": '{ "models": [{ "params": "--served-model-name model_one --tensor-parallel-size 1 --max-model-len 2096", "model_path": "models/model_one/5be6479/artifact/", "model_task": "text_embedding"}, {"params": "--served-model-name model_two --tensor-parallel-size 1 --max-model-len 2096", "model_path": "models/model_two/83e9aa1/artifact/", "model_task": "image_text_to_text"}, {"params": "--served-model-name model_three --tensor-parallel-size 1 --max-model-len 2096", "model_path": "models/model_three/83e9aa1/artifact/", "model_task": "code_synthesis"}]}',
+                            "MULTI_MODEL_CONFIG": '{ "models": [{ "params": "--served-model-name model_one --tensor-parallel-size 1 --max-model-len 2096", "model_path": "models/model_one/5be6479/artifact/", "model_task": "text_embedding"}, {"params": "--served-model-name model_two --tensor-parallel-size 1 --max-model-len 2096", "model_path": "models/model_two/83e9aa1/artifact/", "model_task": "image_text_to_text"}, {"params": "--served-model-name model_three --tensor-parallel-size 1 --max-model-len 2096", "model_path": "models/model_three/83e9aa1/artifact/", "model_task": "code_synthesis", "fine_tune_path": "oci://test_bucket@test_namespace/models/ft-models/meta-llama-3b/ocid1.datasciencejob.oc1.iad.<ocid>"}]}',
                         },
                         "health_check_port": 8080,
                         "image": "dsmc://image-name:1.0.0.0",
@@ -487,6 +487,7 @@ class TestDataset:
                 "model_name": "test_model_1",
                 "model_task": "text_embedding",
                 "artifact_location": "test_location_1",
+                "fine_tune_artifact" : None
             },
             {
                 "env_var": {},
@@ -495,6 +496,7 @@ class TestDataset:
                 "model_name": "test_model_2",
                 "model_task": "image_text_to_text",
                 "artifact_location": "test_location_2",
+                "fine_tune_artifact" : None
             },
             {
                 "env_var": {},
@@ -503,12 +505,13 @@ class TestDataset:
                 "model_name": "test_model_3",
                 "model_task": "code_synthesis",
                 "artifact_location": "test_location_3",
+                "fine_tune_artifact" : "oci://test_bucket@test_namespace/models/ft-models/meta-llama-3b/ocid1.datasciencejob.oc1.iad.<ocid>"
             },
         ],
         "model_id": "ocid1.datasciencemodel.oc1.<region>.<OCID>",
         "environment_variables": {
             "MODEL_DEPLOY_PREDICT_ENDPOINT": "/v1/completions",
-            "MULTI_MODEL_CONFIG": '{ "models": [{ "params": "--served-model-name model_one --tensor-parallel-size 1 --max-model-len 2096", "model_path": "models/model_one/5be6479/artifact/", "model_task": "text_embedding"}, {"params": "--served-model-name model_two --tensor-parallel-size 1 --max-model-len 2096", "model_path": "models/model_two/83e9aa1/artifact/", "model_task": "image_text_to_text"}, {"params": "--served-model-name model_three --tensor-parallel-size 1 --max-model-len 2096", "model_path": "models/model_three/83e9aa1/artifact/", "model_task": "code_synthesis"}]}',
+            "MULTI_MODEL_CONFIG": '{ "models": [{ "params": "--served-model-name model_one --tensor-parallel-size 1 --max-model-len 2096", "model_path": "models/model_one/5be6479/artifact/", "model_task": "text_embedding"}, {"params": "--served-model-name model_two --tensor-parallel-size 1 --max-model-len 2096", "model_path": "models/model_two/83e9aa1/artifact/", "model_task": "image_text_to_text"}, {"params": "--served-model-name model_three --tensor-parallel-size 1 --max-model-len 2096", "model_path": "models/model_three/83e9aa1/artifact/", "model_task": "code_synthesis", "fine_tune_path": "oci://test_bucket@test_namespace/models/ft-models/meta-llama-3b/ocid1.datasciencejob.oc1.iad.<ocid>"}]}',
         },
         "cmd": [],
         "console_link": "https://cloud.oracle.com/data-science/model-deployments/ocid1.datasciencemodeldeployment.oc1.<region>.<MD_OCID>?region=region-name",
@@ -969,6 +972,7 @@ class TestDataset:
             "model_name": "model_one",
             "model_task": "text_embedding",
             "artifact_location": "artifact_location_one",
+            "fine_tune_artifact": None
         },
         {
             "env_var": {"--test_key_two": "test_value_two"},
@@ -977,6 +981,7 @@ class TestDataset:
             "model_name": "model_two",
             "model_task": "image_text_to_text",
             "artifact_location": "artifact_location_two",
+            "fine_tune_artifact": None
         },
         {
             "env_var": {"--test_key_three": "test_value_three"},
@@ -985,6 +990,7 @@ class TestDataset:
             "model_name": "model_three",
             "model_task": "code_synthesis",
             "artifact_location": "artifact_location_three",
+            "fine_tune_artifact" : "oci://test_bucket@test_namespace/models/ft-models/meta-llama-3b/ocid1.datasciencejob.oc1.iad.<ocid>"
         },
     ]
 
@@ -1811,6 +1817,7 @@ def test_create_deployment_for_multi_model(
             model_task="code_synthesis",
             gpu_count=2,
             artifact_location="test_location_3",
+            fine_tune_artifact= "oci://test_bucket@test_namespace/models/ft-models/meta-llama-3b/ocid1.datasciencejob.oc1.iad.<ocid>"
         )
 
         result = self.app.create(
diff --git a/tests/unitary/with_extras/aqua/test_model.py b/tests/unitary/with_extras/aqua/test_model.py
@@ -254,6 +254,74 @@ class TestDataset:
         ],
     }
 
+    fine_tuned_model_file_description = {
+        "version": "1.0",
+        "type": "modelOSSReferenceDescription",
+        "models": [
+            {
+                "namespace": "test_namespace",
+                "bucketName": "test_bucket",
+                "prefix": "models/meta-llama/Llama-3.2-3B-Instruct",
+                "objects": [
+                    {
+                        "name": "models/meta-llama/Llama-3.2-3B-Instruct/.gitattributes",
+                        "version": "bfbf278c-10af-4f2c-8240-11fed02e1322",
+                        "sizeInBytes": 1519,
+                    },
+                    {
+                        "name": "models/meta-llama/Llama-3.2-3B-Instruct/LICENSE.txt",
+                        "version": "4238d1e2-d826-4300-a344-0ead410afa27",
+                        "sizeInBytes": 7712,
+                    },
+                    {
+                        "name": "models/meta-llama/Llama-3.2-3B-Instruct/README.md",
+                        "version": "57382552-9ad0-4546-b38c-c96634f3b8a2",
+                        "sizeInBytes": 41744,
+                    },
+                ],
+            },
+            {
+                "namespace": "test_namespace",
+                "bucketName": "test_bucket",
+                "prefix": "models/meta-llama/Llama-3.2-3B-Instruct",
+                "objects": [
+                    {
+                        "name": "models/meta-llama/Llama-3.2-3B-Instruct/.gitattributes",
+                        "version": "bfbf278c-10af-4f2c-8240-11fed02e1322",
+                        "sizeInBytes": 1519,
+                    },
+                    {
+                        "name": "models/meta-llama/Llama-3.2-3B-Instruct/LICENSE.txt",
+                        "version": "4238d1e2-d826-4300-a344-0ead410afa27",
+                        "sizeInBytes": 7712,
+                    },
+                    {
+                        "name": "models/meta-llama/Llama-3.2-3B-Instruct/README.md",
+                        "version": "57382552-9ad0-4546-b38c-c96634f3b8a2",
+                        "sizeInBytes": 41744,
+                    },
+                ],
+            },
+            {
+                "namespace": "test_namespace",
+                "bucketName": "test_bucket",
+                "prefix": "models/ft-models/meta-llama-3b/ocid1.datasciencejob.oc1.iad.<ocid>",
+                "objects": [
+                    {
+                    "name": "models/ft-models/meta-llama-3b/ocid1.datasciencejob.oc1.iad.<ocid>/README.md",
+                    "version": "636b83ae-be59-445f-a8d7-da7277535ef0",
+                    "sizeInBytes": 5176
+                    },
+                    {
+                    "name": "models/ft-models/meta-llama-3b/ocid1.datasciencejob.oc1.iad.<ocid>/adapter_config.json",
+                    "version": "6d6ea6c9-05e1-44d9-bab6-0ad175c924e6",
+                    "sizeInBytes": 805
+                    }
+                ]
+            },
+        ],
+    }
+
     SERVICE_COMPARTMENT_ID = "ocid1.compartment.oc1..<OCID>"
     COMPARTMENT_ID = "ocid1.compartment.oc1..<UNIQUE_OCID>"
     SERVICE_MODEL_ID = "ocid1.datasciencemodel.oc1.iad.<OCID>"
@@ -488,9 +556,23 @@ def test_create_multimodel(
         mock_model.freeform_tags["task"] = "text-generation"
         model_info_1.model_task = "text_embedding"
 
+
+        # testing requesting metadata from fine tuned model to add to model group
+        mock_model.model_file_description = TestDataset.fine_tuned_model_file_description
+
+        # testing fine tuned model in model group
+        model_info_3 = AquaMultiModelRef(
+            model_id="test_model_id_3",
+            gpu_count=2,
+            model_task="image_text_to_text",
+            env_var={"params": "--trust-remote-code --max-model-len 32000"},
+            artifact_location="oci://test_bucket@test_namespace/models/meta-llama/Llama-3.2-3B-Instruct",
+            fine_tune_artifact="oci://test_bucket@test_namespace/models/ft-models/meta-llama-3b/ocid1.datasciencejob.oc1.iad.<ocid>"
+        )
+
         # will create a multi-model group
         model = self.app.create_multi(
-            models=[model_info_1, model_info_2],
+            models=[model_info_1, model_info_2, model_info_3],
             project_id="test_project_id",
             compartment_id="test_compartment_id",
         )
@@ -503,7 +585,7 @@ def test_create_multimodel(
         mock_create.return_value = mock_model
 
         assert model.freeform_tags == {"aqua_multimodel": "true"}
-        assert model.custom_metadata_list.get("model_group_count").value == "2"
+        assert model.custom_metadata_list.get("model_group_count").value == "3"
         assert (
             model.custom_metadata_list.get("deployment-container").value
             == "odsc-vllm-serving"