Skip to content

Commit 1e418db

Browse files
Resolve merge conflicts and ruff update
2 parents 32b73f3 + bc2e0b7 commit 1e418db

File tree

5 files changed

+106
-20
lines changed

5 files changed

+106
-20
lines changed

ads/aqua/extension/deployment_handler.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -215,9 +215,10 @@ class AquaDeploymentParamsHandler(AquaAPIhandler):
215215
def get(self, model_id):
216216
"""Handle GET request."""
217217
instance_shape = self.get_argument("instance_shape")
218+
gpu_count = self.get_argument("gpu_count", default=None)
218219
return self.finish(
219220
AquaDeploymentApp().get_deployment_default_params(
220-
model_id=model_id, instance_shape=instance_shape
221+
model_id=model_id, instance_shape=instance_shape, gpu_count=gpu_count
221222
)
222223
)
223224

ads/aqua/modeldeployment/deployment.py

Lines changed: 27 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -808,6 +808,7 @@ def get_deployment_default_params(
808808
self,
809809
model_id: str,
810810
instance_shape: str,
811+
gpu_count: int = None,
811812
) -> List[str]:
812813
"""Gets the default params set in the deployment configs for the given model and instance shape.
813814
@@ -819,6 +820,9 @@ def get_deployment_default_params(
819820
instance_shape: (str).
820821
The shape of the instance used for deployment.
821822
823+
gpu_count: (int, optional).
824+
The number of GPUs used by the Aqua model. Defaults to None.
825+
822826
Returns
823827
-------
824828
List[str]:
@@ -827,6 +831,7 @@ def get_deployment_default_params(
827831
828832
"""
829833
default_params = []
834+
config_params = {}
830835
model = DataScienceModel.from_id(model_id)
831836
try:
832837
container_type_key = model.custom_metadata_list.get(
@@ -843,12 +848,28 @@ def get_deployment_default_params(
843848
and container_type_key in InferenceContainerTypeFamily.values()
844849
):
845850
deployment_config = self.get_deployment_config(model_id)
846-
config_params = (
847-
deployment_config.get("configuration", UNKNOWN_DICT)
848-
.get(instance_shape, UNKNOWN_DICT)
849-
.get("parameters", UNKNOWN_DICT)
850-
.get(get_container_params_type(container_type_key), UNKNOWN)
851-
)
851+
852+
instance_shape_config = deployment_config.get(
853+
"configuration", UNKNOWN_DICT
854+
).get(instance_shape, UNKNOWN_DICT)
855+
856+
if "multi_model_deployment" in instance_shape_config and gpu_count:
857+
gpu_params = instance_shape_config.get(
858+
"multi_model_deployment", UNKNOWN_DICT
859+
)
860+
861+
for gpu_config in gpu_params:
862+
if gpu_config["gpu_count"] == gpu_count:
863+
config_params = gpu_config.get("parameters", UNKNOWN_DICT).get(
864+
get_container_params_type(container_type_key), UNKNOWN
865+
)
866+
break
867+
868+
else:
869+
config_params = instance_shape_config.get(
870+
"parameters", UNKNOWN_DICT
871+
).get(get_container_params_type(container_type_key), UNKNOWN)
872+
852873
if config_params:
853874
params_list = get_params_list(config_params)
854875
restricted_params_set = get_restricted_params_by_container(

tests/unitary/with_extras/aqua/test_data/deployment/deployment_config.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
{
22
"configuration": {
3-
"VM.GPU.A10.1": {
3+
"VM.GPU.A10.4": {
44
"parameters": {
55
"TGI_PARAMS": "--max-stop-sequences 6",
66
"VLLM_PARAMS": "--max-model-len 4096"
@@ -24,7 +24,7 @@
2424
}
2525
},
2626
"shape": [
27-
"VM.GPU.A10.1",
27+
"VM.GPU.A10.4",
2828
"VM.Standard.A1.Flex"
2929
]
3030
}
Lines changed: 43 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,43 @@
1+
{
2+
"shape": [
3+
"VM.GPU.A10.1",
4+
"VM.GPU.A10.2",
5+
"BM.GPU.A10.4",
6+
"BM.GPU.L40S-NC.4"
7+
],
8+
"configuration": {
9+
"VM.GPU.A10.2": {
10+
"parameters": {
11+
"VLLM_PARAMS": "--trust-remote-code --max-model-len 60000"
12+
},
13+
"multi_model_deployment": [
14+
{
15+
"gpu_count": 1
16+
}
17+
]
18+
},
19+
"BM.GPU.A10.4": {
20+
"parameters": {
21+
"VLLM_PARAMS": "--trust-remote-code --max-model-len 60000"
22+
},
23+
"multi_model_deployment": [
24+
{
25+
"gpu_count": 1
26+
},
27+
{
28+
"gpu_count": 2
29+
}
30+
]
31+
},
32+
"BM.GPU.L40S-NC.4": {
33+
"parameters": {
34+
"VLLM_PARAMS": "--trust-remote-code --max-model-len 60000"
35+
},
36+
"multi_model_deployment": [
37+
{
38+
"gpu_count": 2
39+
}
40+
]
41+
}
42+
}
43+
}

tests/unitary/with_extras/aqua/test_deployment.py

Lines changed: 32 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -40,7 +40,9 @@ class TestDataset:
4040
MODEL_DEPLOYMENT_URL = "https://modeldeployment.customer-oci.com/ocid1.datasciencemodeldeployment.oc1.<region>.<MD_OCID>"
4141
MODEL_ID = "ocid1.datasciencemodeldeployment.oc1.<region>.<MODEL_OCID>"
4242
DEPLOYMENT_IMAGE_NAME = "dsmc://image-name:1.0.0.0"
43-
DEPLOYMENT_SHAPE_NAME = "VM.GPU.A10.1"
43+
DEPLOYMENT_SHAPE_NAME = "BM.GPU.A10.4"
44+
DEPLOYMENT_GPU_COUNT = 1
45+
DEPLOYMENT_GPU_COUNT_B = 2
4446
DEPLOYMENT_SHAPE_NAME_CPU = "VM.Standard.A1.Flex"
4547

4648
model_deployment_object = [
@@ -908,24 +910,28 @@ def test_create_deployment_for_tei_byoc_embedding_model(
908910
(
909911
"VLLM_PARAMS",
910912
"odsc-vllm-serving",
913+
2,
911914
["--max-model-len 4096", "--seed 42", "--trust-remote-code"],
912915
["--max-model-len 4096", "--trust-remote-code"],
913916
),
914917
(
915918
"VLLM_PARAMS",
916919
"odsc-vllm-serving",
917-
[],
918-
[],
920+
None,
921+
["--max-model-len 4096"],
922+
["--max-model-len 4096"],
919923
),
920924
(
921925
"TGI_PARAMS",
922926
"odsc-tgi-serving",
923-
["--sharded true", "--trust-remote-code", "--max-stop-sequences"],
924-
["--max-stop-sequences"],
927+
1,
928+
[],
929+
[],
925930
),
926931
(
927932
"CUSTOM_PARAMS",
928933
"custom-container-key",
934+
None,
929935
["--max-model-len 4096", "--seed 42", "--trust-remote-code"],
930936
["--max-model-len 4096", "--seed 42", "--trust-remote-code"],
931937
),
@@ -936,21 +942,34 @@ def test_get_deployment_default_params(
936942
self,
937943
container_params_field,
938944
container_type_key,
945+
gpu_count,
939946
params,
940947
allowed_params,
941948
mock_from_id,
942949
):
943950
"""Test for fetching config details for a given deployment."""
944951

945952
config_json = os.path.join(
946-
self.curr_dir, "test_data/deployment/deployment_config.json"
953+
self.curr_dir, "test_data/deployment/deployment_gpu_config.json"
947954
)
948955
with open(config_json, "r") as _file:
949956
config = json.load(_file)
950957
# update config params for testing
951-
config["configuration"][TestDataset.DEPLOYMENT_SHAPE_NAME]["parameters"][
952-
container_params_field
953-
] = " ".join(params)
958+
if gpu_count:
959+
# build field for multi_model_deployment
960+
config["configuration"][TestDataset.DEPLOYMENT_SHAPE_NAME][
961+
"multi_model_deployment"
962+
] = [
963+
{
964+
"gpu_count": gpu_count,
965+
"parameters": {container_params_field: " ".join(params)},
966+
}
967+
]
968+
else:
969+
# build field for normal deployment
970+
config["configuration"][TestDataset.DEPLOYMENT_SHAPE_NAME]["parameters"][
971+
container_params_field
972+
] = " ".join(params)
954973

955974
mock_model = MagicMock()
956975
custom_metadata_list = ModelCustomMetadata()
@@ -961,10 +980,12 @@ def test_get_deployment_default_params(
961980
mock_from_id.return_value = mock_model
962981

963982
self.app.get_deployment_config = MagicMock(return_value=config)
983+
964984
result = self.app.get_deployment_default_params(
965-
TestDataset.MODEL_ID, TestDataset.DEPLOYMENT_SHAPE_NAME
985+
TestDataset.MODEL_ID, TestDataset.DEPLOYMENT_SHAPE_NAME, gpu_count
966986
)
967-
if container_params_field == "CUSTOM_PARAMS":
987+
988+
if container_params_field in ("CUSTOM_PARAMS", "TGI_PARAMS"):
968989
assert result == []
969990
else:
970991
assert result == allowed_params

0 commit comments

Comments (0)