Databricks-ML-professional-S02c-Model-Lifecycle-Automation
This Notebook adds information related to the following requirements:
Model Lifecycle Automation:
- Identify the role of automated testing in ML CI/CD pipelines
- Describe how to automate the model lifecycle using Model Registry Webhooks and Databricks Jobs
- Identify advantages of using Job clusters over all-purpose clusters
- Describe how to create a Job that triggers when a model transitions between stages, given a scenario
- Describe how to connect a Webhook with a Job
- Identify which code block will trigger a shown webhook
- Identify a use case for HTTP webhooks and where the Webhook URL needs to come from
- Describe how to list all webhooks and how to delete a webhook
Download this notebook in ipynb format here.
Automated testing in ML CI/CD pipelines plays a crucial role in ensuring the reliability, robustness, and performance of machine learning models. It helps identify errors, evaluate model accuracy, and maintain consistent behavior across deployments. Automated tests can cover unit testing for individual components, integration testing for model pipelines, and end-to-end testing for overall system functionality, providing confidence in the model's performance throughout the development lifecycle. This ensures that changes introduced in the CI/CD pipeline do not adversely impact the model's effectiveness and reliability.
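To make the idea concrete, here is a small illustrative example (not from the original notebook) of the kind of unit test an ML CI/CD pipeline would run automatically on every change. The helper function and its test are hypothetical names, testing a simple feature-engineering step:

```python
# Hypothetical preprocessing helper: replace missing values with the median
# of the observed values. A unit test like this would run automatically in
# the CI/CD pipeline before any model is promoted.

def fill_missing_with_median(values):
    """Replace None entries with the median of the non-missing values."""
    observed = sorted(v for v in values if v is not None)
    mid = len(observed) // 2
    median = (observed[mid] if len(observed) % 2 == 1
              else (observed[mid - 1] + observed[mid]) / 2)
    return [median if v is None else v for v in values]

def test_fill_missing_with_median():
    # missing value is filled with the median of 1.0 and 3.0
    assert fill_missing_with_median([1.0, None, 3.0]) == [1.0, 2.0, 3.0]
    # no missing values: input comes back unchanged
    assert fill_missing_with_median([5.0, 7.0]) == [5.0, 7.0]

test_fill_missing_with_median()
```

Integration and end-to-end tests follow the same pattern at a larger scope: they assert on pipeline outputs and deployed-model behavior instead of a single function.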
A model registry webhook - also called a model registry trigger - is tied to an event occurring within the Model Registry: when that specific event occurs, a specific action is executed.
In this particular case, we are interested in executing a Databricks job when a specific event occurs in the Model Registry.
As soon as a model is moved to the Staging stage, the Databricks job is triggered and executes the notebook that contains all the tests. This is one way to automate the testing part of an ML CI/CD pipeline using Databricks.
Steps are:
- Train a model
- Log the model to MLflow
- Register the model
- Create a notebook containing some tests
- Create a job with a single task: it should execute the test notebook created in the previous step (this can be done through the UI or programmatically)
- Create a webhook that listens to the event 'when a model is moved to Staging', i.e. MODEL_VERSION_TRANSITIONED_TO_STAGING
And that's it. As soon as the model is transitioned to Staging, the test notebook is triggered and executes any tests defined there.
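The job in the steps above can also be created programmatically via the Jobs API 2.1 instead of the UI. Below is a minimal sketch: the job name, notebook path, and cluster settings are illustrative assumptions, and `instance` and `headers` would be defined as in the webhook cells further below.

```python
# Sketch: build the payload for POST /api/2.1/jobs/create.
# The notebook path and cluster settings are made-up example values.

def build_test_job_payload(job_name, notebook_path):
    """Build the JSON payload for creating a one-task job via the Jobs API 2.1."""
    return {
        "name": job_name,
        "tasks": [{
            "task_key": "run_model_tests",
            "notebook_task": {"notebook_path": notebook_path},
            # job cluster: created for this run, terminated when the run ends
            "new_cluster": {
                "spark_version": "13.3.x-cpu-ml-scala2.12",
                "node_type_id": "Standard_DS3_v2",
                "num_workers": 1,
            },
        }],
    }

payload = build_test_job_payload("webhook_test", "/Repos/me/tests/model_tests")
# then, with instance and headers defined as later in this notebook:
# response = requests.post(f"{instance}/api/2.1/jobs/create",
#                          headers=headers, json=payload)
```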
See this page for more information about webhooks, in particular the list of possible events to listen for.
See this video for a complete example.
Here is an example of code, from training a model to the creation of a webhook that fires when the model is moved to the Staging stage. The webhook then executes the test notebook via the Databricks job.
Import libraries:
import pandas as pd
import seaborn as sns
#
from pyspark.sql.functions import *
#
from pyspark.ml.feature import VectorAssembler
from pyspark.ml.regression import LinearRegression
#
import mlflow
import logging
#
import json
import requests
from mlflow.utils.rest_utils import http_request
from mlflow.utils.databricks_utils import get_databricks_host_creds
logging.getLogger("mlflow").setLevel(logging.FATAL)
Load dataset:
diamonds_df = sns.load_dataset("diamonds").drop(["cut", "color", "clarity"], axis=1)
#
diamonds_sdf = spark.createDataFrame(diamonds_df)
#
train_df, test_df = diamonds_sdf.randomSplit([.8, .2], seed=42)
Process features:
assembler_inputs = [column for column in diamonds_sdf.columns if column not in ['price']]
vec_assembler = VectorAssembler(inputCols=assembler_inputs, outputCol="features")
#
train_df_processed = vec_assembler.transform(train_df)
Instantiate ML model:
lrm = LinearRegression(featuresCol="features", labelCol='price')
Train model and log to MLflow:
model_path = 'webhook-model'
#
with mlflow.start_run(run_name="webhook-run") as run:
    model = lrm.fit(train_df_processed)
    #
    mlflow.spark.log_model(model, model_path)
Register latest logged model:
# model name
model_name = "webhook_diamonds"
#
# register the latest logged model
latest_run_id = mlflow.search_runs().sort_values(by="end_time", ascending=False)['run_id'].iloc[0]
#
mlflow.register_model(f"runs:/{latest_run_id}/{model_path}", name=model_name);
Registered model 'webhook_diamonds' already exists. Creating a new version of this model... Created version '2' of model 'webhook_diamonds'.
At this point, we manually create a test notebook and a job containing a task to execute this notebook.
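For illustration, here is a sketch of what the test notebook might contain. In a real run it would load the Staging version of the registered model with `mlflow.spark.load_model` and score a held-out set; the helper below only shows the validation logic itself, with a made-up RMSE threshold and toy numbers:

```python
# Hypothetical checks for the test notebook: predicted prices must be
# positive, and RMSE against known actuals must stay below a threshold.

def validate_predictions(predictions, actuals, max_rmse):
    """Basic sanity checks on model output; returns the computed RMSE."""
    assert all(p > 0 for p in predictions), "predicted prices must be positive"
    rmse = (sum((p - a) ** 2 for p, a in zip(predictions, actuals))
            / len(actuals)) ** 0.5
    assert rmse <= max_rmse, f"RMSE {rmse:.2f} above threshold {max_rmse}"
    return rmse

# toy usage with made-up numbers
rmse = validate_predictions([105.0, 210.0], actuals=[100.0, 205.0], max_rmse=10.0)
```

If any assertion fails, the job run fails, which is exactly the signal the CI/CD pipeline needs to block the promotion.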
The job ID is necessary for the next steps; it is available in the job definition in the UI, and it can also be retrieved programmatically with this function:
Note that the definition of the function in the next cell comes from this course.
def find_job_id(instance, headers, job_name, offset_limit=1000):
    params = {"offset": 0}
    uri = f"{instance}/api/2.1/jobs/list"
    done = False
    job_id = None
    while not done:
        done = True
        res = requests.get(uri, params=params, headers=headers)
        assert res.status_code == 200, f"Job list not returned; {res.content}"
        jobs = res.json().get("jobs", [])
        if len(jobs) > 0:
            for job in jobs:
                if job.get("settings", {}).get("name", None) == job_name:
                    job_id = job.get("job_id", None)
                    break
            # if job_id not found; update the offset and try again
            if job_id is None:
                params["offset"] += len(jobs)
                if params["offset"] < offset_limit:
                    done = False
    return job_id
We need a token for the webhook to be allowed to execute the Databricks job. The way to create a token is described in this course.
Alternatively, for the purpose of this example, a token can be retrieved with the following command:
token = dbutils.notebook.entry_point.getDbutils().notebook().getContext().apiToken().getOrElse(None)
Let's define the required parameters for the webhook definition:
# define some parameters
job_name = "webhook_test"
headers = {"Authorization": f"Bearer {token}"}
host_creds = get_databricks_host_creds("databricks")
endpoint = "/api/2.0/mlflow/registry-webhooks/create"
instance = mlflow.utils.databricks_utils.get_webapp_url()
job_id = find_job_id(instance, headers, job_name, offset_limit=1000)
Finally, let's create the webhook:
# define job_json
job_json = {"model_name": model_name,
            "events": ["MODEL_VERSION_TRANSITIONED_TO_STAGING"],
            "description": "Job webhook trigger",
            "status": "Active",
            "job_spec": {"job_id": job_id,
                         "workspace_url": instance,
                         "access_token": token}
            }
response = http_request(
host_creds=host_creds,
endpoint=endpoint,
method="POST",
json=job_json
)
assert response.status_code == 200, f"Expected HTTP 200, received {response.status_code}"
From now on, as soon as the model is transitioned to Staging, the job is executed, running the associated notebook containing the tests. The model can be transitioned to Staging either manually in the Databricks UI or programmatically by executing the function below.
client = mlflow.MlflowClient()
#
client.transition_model_version_stage(model_name, 1, 'Staging')
Out[11]: <ModelVersion: creation_timestamp=1699615322888, current_stage='Staging', description='', last_updated_timestamp=1699616004219, name='webhook_diamonds', run_id='ed6f91126eb149e7bf39c024da865a00', run_link='', source='dbfs:/databricks/mlflow-tracking/1352035400533066/ed6f91126eb149e7bf39c024da865a00/artifacts/webhook-model', status='READY', status_message='', tags={}, user_id='2329071338839022', version='1'>
- Cost Efficiency: Job clusters are ephemeral and automatically terminate after the job completes, minimizing costs compared to continuously running all-purpose clusters.
- Resource Isolation: Job clusters provide dedicated resources for a specific job, preventing interference from other workloads and ensuring consistent performance.
- Automatic Scaling: Job clusters automatically scale resources based on the job's requirements, optimizing resource utilization and improving job execution times.
- Version Isolation: Job clusters allow you to specify the Databricks Runtime version, ensuring consistent and isolated environments for each job execution.
- Ease of Management: Job clusters are managed automatically by Databricks, reducing the operational overhead of managing long-lived clusters manually.
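The advantages above show up directly in a Jobs API task definition: the only difference is whether the task points at an existing all-purpose cluster or declares a `new_cluster` to be created for the run. The cluster ID, node type, and notebook path below are made-up example values:

```python
# all-purpose cluster: long-lived and shared, billed for as long as it is up
task_on_all_purpose = {
    "task_key": "tests",
    "notebook_task": {"notebook_path": "/tests"},
    "existing_cluster_id": "0101-123456-abcdefgh",
}

# job cluster: created for this run only, auto-terminated when the job ends
task_on_job_cluster = {
    "task_key": "tests",
    "notebook_task": {"notebook_path": "/tests"},
    "new_cluster": {
        "spark_version": "13.3.x-cpu-ml-scala2.12",
        "node_type_id": "Standard_DS3_v2",
        "num_workers": 1,
    },
}
```

Because the job cluster is declared inside the job itself, its runtime version and size are pinned per job, which is what gives the cost, isolation, and versioning benefits listed above.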
See part 2 of this notebook.
A use case for an HTTP webhook is, for example, sending a notification to a Slack channel to get informed about an event.
In this particular case, the Webhook URL is provided by the Slack application. See all the steps to create a Slack application and receive notifications on this page.
And below is the code to create the webhook that sends a message to a Slack channel when a model is moved to Staging.
Note that the difference between a job webhook and an HTTP webhook is one of the keys in the JSON dictionary: the job webhook has a job_spec key, whereas the HTTP webhook has an http_url_spec key.
from mlflow.utils.rest_utils import http_request
from mlflow.utils.databricks_utils import get_databricks_host_creds
import urllib
slack_incoming_webhook = "https://hooks.slack.com/services/T00000000/B00000000/XXXXXXXXXXXXXXXXXXXXXXXX"
endpoint = "/api/2.0/mlflow/registry-webhooks/create"
host_creds = get_databricks_host_creds("databricks")
## specify http url of the slack notification
http_json = {"model_name": model_name,
             "events": ["MODEL_VERSION_TRANSITIONED_TO_STAGING"],
             "description": "HTTP webhook trigger",
             "status": "Active",
             "http_url_spec": {
                 "url": slack_incoming_webhook,
                 "enable_ssl_verification": "false"}}
response = http_request(
host_creds=host_creds,
endpoint=endpoint,
method="POST",
json=http_json
)
print(json.dumps(response.json(), indent=4))
Webhooks can be listed and deleted using the databricks-registry-webhooks library.
See also this page for another way to list and delete webhooks.
%sh
pip install databricks-registry-webhooks -q
Example of command to list webhooks:
from databricks_registry_webhooks import RegistryWebhooksClient
#
webhooks_list = RegistryWebhooksClient().list_webhooks(model_name=model_name)
#
for webhook in webhooks_list:
    print(dict(webhook))
{'creation_timestamp': 1699615877080, 'description': 'Job webhook trigger', 'events': ['MODEL_VERSION_TRANSITIONED_TO_STAGING'], 'http_url_spec': None, 'id': '574346f1870847db8a76e252030d33f1', 'job_spec': <JobSpec: access_token='', job_id='483529352125879', workspace_url='https://eastus-c3.azuredatabricks.net'>, 'last_updated_timestamp': 1699615877080, 'model_name': 'webhook_diamonds', 'status': 'ACTIVE'}
Example of a command to delete a webhook (the webhook ID comes from the list command above):
RegistryWebhooksClient().delete_webhook(id="574346f1870847db8a76e252030d33f1")
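The same list and delete operations can also be done against the Model Registry webhooks REST API directly, reusing `host_creds` and `http_request` from the earlier cells. A sketch, assuming the `/api/2.0/mlflow/registry-webhooks/list` and `/api/2.0/mlflow/registry-webhooks/delete` endpoints (the model name and webhook ID below come from the examples above):

```python
# Request descriptions for listing and deleting webhooks via the REST API.
# These dicts are unpacked into http_request; the calls themselves are
# commented out since they require a live Databricks workspace.

list_request = {
    "endpoint": "/api/2.0/mlflow/registry-webhooks/list",
    "method": "GET",
    "params": {"model_name": "webhook_diamonds"},
}

delete_request = {
    "endpoint": "/api/2.0/mlflow/registry-webhooks/delete",
    "method": "DELETE",
    "json": {"id": "574346f1870847db8a76e252030d33f1"},
}

# response = http_request(host_creds=host_creds, **list_request)
# webhooks = response.json().get("webhooks", [])
# response = http_request(host_creds=host_creds, **delete_request)
```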