File tree: 3 files changed, +35 -4 lines changed
Original file line number Diff line number Diff line change
@@ -49,6 +49,7 @@ class InferenceContainerType(ExtendedEnum):
49
49
class InferenceContainerTypeFamily (ExtendedEnum ):
50
50
AQUA_VLLM_CONTAINER_FAMILY = "odsc-vllm-serving"
51
51
AQUA_VLLM_V1_CONTAINER_FAMILY = "odsc-vllm-serving-v1"
52
+ AQUA_VLLM_LLAMA4_CONTAINER_FAMILY = "odsc-vllm-serving-llama4"
52
53
AQUA_TGI_CONTAINER_FAMILY = "odsc-tgi-serving"
53
54
AQUA_LLAMA_CPP_CONTAINER_FAMILY = "odsc-llama-cpp-serving"
54
55
@@ -119,4 +120,9 @@ class Platform(ExtendedEnum):
119
120
InferenceContainerTypeFamily .AQUA_VLLM_V1_CONTAINER_FAMILY ,
120
121
InferenceContainerTypeFamily .AQUA_VLLM_CONTAINER_FAMILY ,
121
122
],
123
+ InferenceContainerTypeFamily .AQUA_VLLM_LLAMA4_CONTAINER_FAMILY : [
124
+ InferenceContainerTypeFamily .AQUA_VLLM_LLAMA4_CONTAINER_FAMILY ,
125
+ InferenceContainerTypeFamily .AQUA_VLLM_V1_CONTAINER_FAMILY ,
126
+ InferenceContainerTypeFamily .AQUA_VLLM_CONTAINER_FAMILY ,
127
+ ],
122
128
}
Original file line number Diff line number Diff line change @@ -316,11 +316,17 @@ def create_multi(
316
316
# )
317
317
318
318
# Check whether the model is a fine-tuned model; if so, store the fine-tuned weights path in the fine_tune_weights_location pydantic field.
319
- is_fine_tuned_model = Tags .AQUA_FINE_TUNED_MODEL_TAG in source_model .freeform_tags
319
+ is_fine_tuned_model = (
320
+ Tags .AQUA_FINE_TUNED_MODEL_TAG in source_model .freeform_tags
321
+ )
320
322
321
323
if is_fine_tuned_model :
322
- model .model_id , model .model_name = extract_base_model_from_ft (source_model )
323
- model_artifact_path , model .fine_tune_weights_location = extract_fine_tune_artifacts_path (source_model )
324
+ model .model_id , model .model_name = extract_base_model_from_ft (
325
+ source_model
326
+ )
327
+ model_artifact_path , model .fine_tune_weights_location = (
328
+ extract_fine_tune_artifacts_path (source_model )
329
+ )
324
330
325
331
else :
326
332
# Retrieve model artifact for base models
@@ -380,7 +386,8 @@ def create_multi(
380
386
raise AquaValueError (
381
387
"The selected models are associated with different container families: "
382
388
f"{ list (selected_models_deployment_containers )} ."
383
- "For multi-model deployment, all models in the group must share the same container family."
389
+ "For multi-model deployment, all models in the group must belong to the same container "
390
+ "family or to compatible container families."
384
391
)
385
392
else :
386
393
deployment_container = selected_models_deployment_containers .pop ()
Original file line number Diff line number Diff line change @@ -16,8 +16,26 @@ class TestCommonUtils:
16
16
{"odsc-vllm-serving" , "odsc-vllm-serving-v1" },
17
17
"odsc-vllm-serving-v1" ,
18
18
),
19
+ (
20
+ {"odsc-vllm-serving" , "odsc-vllm-serving-llama4" },
21
+ "odsc-vllm-serving-llama4" ,
22
+ ),
23
+ (
24
+ {"odsc-vllm-serving-v1" , "odsc-vllm-serving-llama4" },
25
+ "odsc-vllm-serving-llama4" ,
26
+ ),
27
+ (
28
+ {
29
+ "odsc-vllm-serving" ,
30
+ "odsc-vllm-serving-v1" ,
31
+ "odsc-vllm-serving-llama4" ,
32
+ },
33
+ "odsc-vllm-serving-llama4" ,
34
+ ),
19
35
({"odsc-tgi-serving" , "odsc-vllm-serving" }, None ),
20
36
({"non-existing-one" , "odsc-tgi-serving" }, None ),
37
+ ({"odsc-tgi-serving" , "odsc-vllm-serving-llama4" }, None ),
38
+ ({"odsc-tgi-serving" , "odsc-vllm-serving-v1" }, None ),
21
39
],
22
40
)
23
41
def test_get_preferred_compatible_family (self , input_families , expected ):
You can’t perform that action at this time.
0 commit comments