
Feature/week3 #2

Open
wants to merge 15 commits into main
Binary file modified notebooks/mlops_with_databricks-0.0.1-py3-none-any.whl
Binary file not shown.
10 changes: 5 additions & 5 deletions notebooks/week1&2/05.log_and_register_fe_model.py
@@ -1,10 +1,10 @@
# Databricks notebook source
# The two cells below are only needed when running from the Databricks UI, because this possibly does not work locally in VS Code
# %pip install mlops_with_databricks-0.0.1-py3-none-any.whl
%pip install ../mlops_with_databricks-0.0.1-py3-none-any.whl

💡 Codebase verification

The relative path is incorrect and should be updated to ./mlops_with_databricks-0.0.1-py3-none-any.whl

The wheel file is actually located in the same directory as the notebook (notebooks/), not in the parent directory. The current relative path ../mlops_with_databricks-0.0.1-py3-none-any.whl is incorrect and would fail to find the package.

🔗 Analysis chain

Consider using an absolute path for package installation.

The relative path ../mlops_with_databricks-0.0.1-py3-none-any.whl might break if the notebook is run from a different working directory.

Let's verify the package location:

🏁 Scripts executed

The following scripts were executed for the analysis:

Script:

#!/bin/bash
# Find the wheel file location
fd -e whl

Length of output: 66

🧰 Tools
🪛 Ruff

3-3: SyntaxError: Expected a statement
3-3: SyntaxError: Simple statements must be separated by newlines or semicolons
3-3: SyntaxError: Expected an identifier
3-3: SyntaxError: Expected an identifier
3-3: SyntaxError: Simple statements must be separated by newlines or semicolons

# COMMAND ----------

# dbutils.library.restartPython()
dbutils.library.restartPython()

# COMMAND ----------

@@ -176,12 +176,12 @@
testing_df = testing_set.load_df().toPandas()

# Split features and target
X_train = training_df[num_features + cat_features]
X_train = training_df[num_features + cat_features + ["AverageTemperature"]]
# Don't use sleep_hours_duration, because it's covered by sleep_duration; it was just an example of using the feature function option
# X_train = training_df[num_features + cat_features + ["sleep_hours_duration"]]

y_train = training_df[target]
X_test = testing_df[num_features + cat_features]
X_test = testing_df[num_features + cat_features + ["AverageTemperature"]]
# Don't use sleep_hours_duration, because it's covered by sleep_duration; it was just an example of using the feature function option
# X_test= testing_df[num_features + cat_features + ["sleep_hours_duration"]]
y_test = testing_df[target]
@@ -226,5 +226,5 @@
signature=signature,
)
mlflow.register_model(
model_uri=f"runs:/{run_id}/lightgbm-pipeline-model-fe", name=f"{catalog_name}.{schema_name}.house_prices_model_fe"
model_uri=f"runs:/{run_id}/lightgbm-pipeline-model-fe", name=f"{catalog_name}.{schema_name}.sleep_efficiencies_model_fe"
)
263 changes: 263 additions & 0 deletions notebooks/week3/01.feature_serving.py
@@ -0,0 +1,263 @@
# Databricks notebook source
# MAGIC %pip install ../mlops_with_databricks-0.0.1-py3-none-any.whl

# COMMAND ----------

# MAGIC %restart_python

# COMMAND ----------

"""
Create feature table in unity catalog, it will be a delta table
Create online table which uses the feature delta table created in the previous step
Create a feature spec. When you create a feature spec,
you specify the source Delta table.
This allows the feature spec to be used in both offline and online scenarios.
For online lookups, the serving endpoint automatically uses the online table to perform low-latency feature lookups.
The source Delta table and the online table must use the same primary key.

"""

import random
import time
from concurrent.futures import ThreadPoolExecutor, as_completed

import mlflow
import pandas as pd
import requests
from databricks import feature_engineering
from databricks.feature_engineering import FeatureLookup
from databricks.sdk import WorkspaceClient
from databricks.sdk.service.catalog import (
OnlineTableSpec,
OnlineTableSpecTriggeredSchedulingPolicy,
)
from databricks.sdk.service.serving import EndpointCoreConfigInput, ServedEntityInput
from pyspark.sql import SparkSession

from sleep_efficiency.config import ProjectConfig

spark = SparkSession.builder.getOrCreate()

# Initialize Databricks clients
workspace = WorkspaceClient()
fe = feature_engineering.FeatureEngineeringClient()

# Set the MLflow registry URI
mlflow.set_registry_uri("databricks-uc")

# COMMAND ----------

# MAGIC %md
# MAGIC ## Load config, train and test tables

# COMMAND ----------

# Load config
config = ProjectConfig.from_yaml(config_path="../../project_config.yml")

# Get feature columns details
num_features = config.num_features
cat_features = config.cat_features
target = config.target
catalog_name = config.catalog_name
schema_name = config.schema_name

# Define table names
feature_table_name = f"{catalog_name}.{schema_name}.sleep_efficiencies_preds"
online_table_name = f"{catalog_name}.{schema_name}.sleep_efficiencies_preds_online"

# Load training and test sets from Catalog
train_set = spark.table(f"{catalog_name}.{schema_name}.train_set").toPandas()
test_set = spark.table(f"{catalog_name}.{schema_name}.test_set").toPandas()

df = pd.concat([train_set, test_set])

# COMMAND ----------

# MAGIC %md
# MAGIC ## Load a registered model

# COMMAND ----------

# Load the MLflow model for predictions
pipeline = mlflow.sklearn.load_model(f"models:/{catalog_name}.{schema_name}.sleep_efficiency_model_basic/3")

🛠️ Refactor suggestion

Consider parameterizing the model version

The model version is hardcoded to "3". Consider moving this to configuration to make it more maintainable and flexible.

-pipeline = mlflow.sklearn.load_model(f"models:/{catalog_name}.{schema_name}.sleep_efficiency_model_basic/3")
+model_version = config.model_version  # Add this to your config
+pipeline = mlflow.sklearn.load_model(f"models:/{catalog_name}.{schema_name}.sleep_efficiency_model_basic/{model_version}")

Committable suggestion skipped: line range outside the PR's diff.
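
A minimal sketch of what that could look like, assuming a hypothetical model_version entry is added to project_config.yml and exposed as a field on ProjectConfig:

# project_config.yml (hypothetical addition):
#   model_version: 3

config = ProjectConfig.from_yaml(config_path="../../project_config.yml")
model_version = config.model_version  # hypothetical config field
pipeline = mlflow.sklearn.load_model(
    f"models:/{catalog_name}.{schema_name}.sleep_efficiency_model_basic/{model_version}"
)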


# COMMAND ----------

# Prepare the DataFrame for predictions and feature table creation - these features are the ones we want to serve.
preds_df = df[["id", "sleep_duration", "awakenings", "sleep_month"]]
preds_df["Predicted_SleepEfficiency"] = pipeline.predict(df[cat_features + num_features])

preds_df = spark.createDataFrame(preds_df)

# 1. Create the feature table in Databricks

fe.create_table(
name=feature_table_name,
primary_keys=["id"],
df=preds_df,
description="Sleep efficiencies predictions feature table",
)

# Enable Change Data Feed
spark.sql(f"""
ALTER TABLE {feature_table_name}
SET TBLPROPERTIES (delta.enableChangeDataFeed = true)
""")

# COMMAND ----------

# 2. Create the online table using the feature table

spec = OnlineTableSpec(
primary_key_columns=["id"],
source_table_full_name=feature_table_name,
run_triggered=OnlineTableSpecTriggeredSchedulingPolicy.from_dict({"triggered": "true"}),
perform_full_copy=False,
)

# Create the online table in Databricks
online_table_pipeline = workspace.online_tables.create(name=online_table_name, spec=spec)

# COMMAND ----------

# 3. Create feature lookup and feature spec for the feature table

# Define features to look up from the feature table
features = [
FeatureLookup(
table_name=feature_table_name,
lookup_key="Id",
feature_names=["id", "sleep_duration", "awakenings", "sleep_month", "Predicted_SleepEfficiency"],

⚠️ Potential issue

Inconsistent use of 'Id' vs 'id' could lead to errors

There is inconsistency in the use of 'Id' (uppercase I) and 'id' (lowercase i) as key identifiers in your code. This can cause KeyError exceptions or unexpected behavior when accessing DataFrame columns or performing lookups. Ensure consistent use of 'id' (lowercase) throughout the code to match the DataFrame column names.

Apply the following changes to resolve the inconsistency:

At line 132:

-            lookup_key="Id",
+            lookup_key="id",

At line 179:

- id_list = preds_df["Id"]
+ id_list = preds_df["id"]

At line 197:

-        json={"dataframe_records": [{"Id": "2"}]},
+        json={"dataframe_records": [{"id": "2"}]},

At line 215:

-        json={"dataframe_split": {"columns": ["Id"], "data": [["2"]]}},
+        json={"dataframe_split": {"columns": ["id"], "data": [["2"]]}},

At line 237:

-            json={"dataframe_records": [{"Id": random_id}]},
+            json={"dataframe_records": [{"id": random_id}]},

Also applies to: 179-179, 197-197, 215-215, 237-237

)
]

# Create the feature spec for serving
feature_spec_name = f"{catalog_name}.{schema_name}.return_predictions"

fe.create_feature_spec(name=feature_spec_name, features=features, exclude_columns=None)

# COMMAND ----------

# MAGIC %md
# MAGIC ## Deploy Feature Serving Endpoint

# COMMAND ----------

# 4. Create endpoint using the feature spec

# Create a serving endpoint for the sleep efficiencies predictions
workspace.serving_endpoints.create(
name="sleep-efficiencies-feature-serving",
config=EndpointCoreConfigInput(
served_entities=[
ServedEntityInput(
entity_name=feature_spec_name, # feature spec name defined in the previous step
scale_to_zero_enabled=True,
workload_size="Small", # Define the workload size (Small, Medium, Large)
)
]
),
)

# COMMAND ----------

# MAGIC %md
# MAGIC ## Call The Endpoint

# COMMAND ----------


# COMMAND ----------

token = dbutils.notebook.entry_point.getDbutils().notebook().getContext().apiToken().get()
host = spark.conf.get("spark.databricks.workspaceUrl")

# COMMAND ----------

id_list = preds_df["Id"]

# COMMAND ----------

display(id_list)

# COMMAND ----------

# MAGIC %md
# MAGIC

# COMMAND ----------

start_time = time.time()
serving_endpoint = f"https://{host}/serving-endpoints/sleep-efficiencies-feature-serving/invocations"
response = requests.post(
f"{serving_endpoint}",
headers={"Authorization": f"Bearer {token}"},
json={"dataframe_records": [{"Id": "2"}]},
)

end_time = time.time()
execution_time = end_time - start_time

print("Response status:", response.status_code)
print("Reponse text:", response.text)
print("Execution time:", execution_time, "seconds")


# COMMAND ----------

# another way to call the endpoint

response = requests.post(
f"{serving_endpoint}",
headers={"Authorization": f"Bearer {token}"},
json={"dataframe_split": {"columns": ["Id"], "data": [["2"]]}},
)


## Load Test

# COMMAND ----------

# Initialize variables
serving_endpoint = f"https://{host}/serving-endpoints/sleep-efficiencies-feature-serving/invocations"
id_list = preds_df.select("Id").rdd.flatMap(lambda x: x).collect()
headers = {"Authorization": f"Bearer {token}"}
num_requests = 10


# Function to make a request and record latency
def send_request():
random_id = random.choice(id_list)
start_time = time.time()
response = requests.post(
serving_endpoint,
headers=headers,
json={"dataframe_records": [{"Id": random_id}]},
)
end_time = time.time()
latency = end_time - start_time # Calculate latency for this request
return response.status_code, latency
Comment on lines +231 to +238

🛠️ Refactor suggestion

Add exception handling to API requests in send_request function

The send_request function lacks error handling for potential exceptions during the API request. This could cause the program to crash during the load test if a network error occurs.

Consider adding exception handling to make the code more robust:

def send_request():
    random_id = random.choice(id_list)
    start_time = time.time()
    try:
        response = requests.post(
            serving_endpoint,
            headers=headers,
            json={"dataframe_records": [{"id": random_id}]},
        )
        response.raise_for_status()
        status_code = response.status_code
    except requests.exceptions.RequestException as e:
        status_code = None
        print(f"Request failed: {e}")
    end_time = time.time()
    latency = end_time - start_time  # Calculate latency for this request
    return status_code, latency



# Measure total execution time
total_start_time = time.time()
latencies = []

# Send requests concurrently
with ThreadPoolExecutor(max_workers=100) as executor:
futures = [executor.submit(send_request) for _ in range(num_requests)]

for future in as_completed(futures):
status_code, latency = future.result()
latencies.append(latency)

total_end_time = time.time()
total_execution_time = total_end_time - total_start_time

# Calculate the average latency
average_latency = sum(latencies) / len(latencies)

print("\nTotal execution time:", total_execution_time, "seconds")
print("Average latency per request:", average_latency, "seconds")