In [3]:
from azureml.core import Model, Environment
from azureml.core.model import InferenceConfig
from azureml.core.webservice import AciWebservice, Webservice
from azureml.core import Workspace

# Deploy the registered CatBoost model to Azure Container Instances (ACI)
# as a web service, using the Azure ML SDK v1 objects imported above.

# Connect to Azure ML Workspace
ws = Workspace.from_config()

# Load the registered model by name (no explicit version is requested here)
model = Model(ws, name="catboost-thrombosis-predictor")

# Define environment for deployment
env = Environment(name="catboost-env")
# NOTE(review): package versions are unpinned; consider pinning catboost to
# the version used for training so the serialized model loads identically.
env.python.conda_dependencies.add_pip_package("catboost")
env.python.conda_dependencies.add_pip_package("azureml-defaults")

# Create inference configuration
inference_config = InferenceConfig(
    entry_script="score.py",  # This script will handle requests
    environment=env,
)

# Define deployment configuration (1 CPU, 1GB RAM)
aci_config = AciWebservice.deploy_configuration(cpu_cores=1, memory_gb=1)

# Deploy model as a web service.
# overwrite=True lets this cell be re-run: without it, a second run fails
# because a service named "catboost-endpoint" already exists.
service = Model.deploy(
    workspace=ws,
    name="catboost-endpoint",
    models=[model],
    inference_config=inference_config,
    deployment_config=aci_config,
    overwrite=True,
)

try:
    service.wait_for_deployment(show_output=True)
except Exception:
    # The polling error alone rarely explains the failure; print the
    # container logs before propagating the original exception.
    print(service.get_logs())
    raise

print(f"✅ Model deployed successfully! Endpoint URL: {service.scoring_uri}")


To leverage new model deployment capabilities, AzureML recommends using CLI/SDK v2 to deploy models as online endpoint, 
please refer to respective documentations 
https://docs.microsoft.com/azure/machine-learning/how-to-deploy-managed-online-endpoints /
https://docs.microsoft.com/azure/machine-learning/how-to-attach-kubernetes-anywhere 
For more information on migration, see https://aka.ms/acimoemigration 
  service = Model.deploy(


Tips: You can try get_logs(): https://aka.ms/debugimage#dockerlog or local deployment: https://aka.ms/debugimage#debug-locally to debug if deployment takes longer than 10 minutes.
Running
2025-01-31 21:28:03+00:00 Creating Container Registry if not exists.
2025-01-31 21:28:05+00:00 Building image.