# Patch summary (free-text preamble placed before the first "diff --git" header).
#
# Files touched, as shown by the diff headers below:
#   1. assets/models/system/phi-3.5-mini-128k-instruct/spec.yaml
#   2. assets/models/system/phi-3.5-moe-128k-instruct/spec.yaml
#
# phi-3.5-mini (one hunk, @@ -34,6 +34,9 @@):
#   - adds maas-finetuning: true, maas-finetuning-offer: true and
#     maas-finetuning-regions: eastus2.
#   - NOTE(review): no "version" change for this file is visible in this view;
#     the MoE spec below goes from 2 to 3 - confirm whether this spec needs a
#     bump as well.
#
# phi-3.5-moe (five hunks):
#   - adds finetuning-tasks: chat-completion, finetune-min-sku-spec: 24|1|220|64
#     and finetune-recommended-sku (four A100 SKUs) next to the existing
#     inference-* entries.
#   - adds the same three maas-finetuning* entries as the mini spec.
#   - adds finetune_compute_allow_list with the same four SKUs that
#     finetune-recommended-sku names.
#   - changes deepspeed_stage from 2 to 3 under model_specific_defaults.
#     NOTE(review): the reason is not stated in the patch - confirm intent.
#   - changes version from 2 to 3.
#
# NOTE(review): the new maas-finetuning / maas-finetuning-offer values are bare
# `true`, while nearby flags in the same files are quoted strings
# (freePlayground: "false", apply_deepspeed: "true"). Confirm whether the
# consumer expects a boolean or the string "true".
#
# NOTE(review): the line breaks of this patch have been collapsed; the leading
# whitespace of the hunk lines (and therefore their YAML nesting) cannot be
# recovered from this view. Regenerate the patch from the repository rather
# than re-wrapping it by hand.
diff --git a/assets/models/system/phi-3.5-mini-128k-instruct/spec.yaml b/assets/models/system/phi-3.5-mini-128k-instruct/spec.yaml index 9c4963bdd4..af6ee28a13 100644 --- a/assets/models/system/phi-3.5-mini-128k-instruct/spec.yaml +++ b/assets/models/system/phi-3.5-mini-128k-instruct/spec.yaml @@ -34,6 +34,9 @@ tags: author: microsoft SharedComputeCapacityEnabled : "" hiddenlayerscanned : "" + maas-finetuning: true + maas-finetuning-offer: true + maas-finetuning-regions: eastus2 _aml_system_vanity_registry: "azureml-phi" inference_compute_allow_list: [ diff --git a/assets/models/system/phi-3.5-moe-128k-instruct/spec.yaml b/assets/models/system/phi-3.5-moe-128k-instruct/spec.yaml index 73906b320b..e91c8d4dc6 100644 --- a/assets/models/system/phi-3.5-moe-128k-instruct/spec.yaml +++ b/assets/models/system/phi-3.5-moe-128k-instruct/spec.yaml @@ -6,6 +6,9 @@ properties: languages: en inference-min-sku-spec: 48|2|440|128 inference-recommended-sku: Standard_NC48ads_A100_v4, Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4 + finetuning-tasks: chat-completion + finetune-min-sku-spec: 24|1|220|64 + finetune-recommended-sku: Standard_NC24ads_A100_v4, Standard_NC48ads_A100_v4, Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4 tags: freePlayground: "false" displayName: "Phi-3.5 MoE instruct (128k)" @@ -27,6 +30,9 @@ tags: author: microsoft SharedComputeCapacityEnabled : "" hiddenlayerscanned : "" + maas-finetuning: true + maas-finetuning-offer: true + maas-finetuning-regions: eastus2 _aml_system_vanity_registry: "azureml-phi" inference_compute_allow_list: [ @@ -34,11 +40,18 @@ tags: Standard_ND96amsr_A100_v4, Standard_NC96ads_A100_v4 ] + finetune_compute_allow_list: + [ + Standard_NC24ads_A100_v4, + Standard_NC48ads_A100_v4, + Standard_NC96ads_A100_v4, + Standard_ND96amsr_A100_v4 + ] inference_supported_envs: - vllm model_specific_defaults: apply_deepspeed: "true" - deepspeed_stage: 2 + deepspeed_stage: 3 apply_lora: "true" apply_ort: "false" precision: 16 @@ -52,4 +65,4 
@@ tags: logging_strategy: "steps" logging_steps: 10 save_total_limit: 1 -version: 2 +version: 3