Merge 6b86f08 into e79e43c

manuelgilm · web-flow · commit e2abbe716f56 · 2025-05-18T12:38:57.000-05:00
diff --git a/README.md b/README.md
@@ -188,6 +188,13 @@ Then, run the script with the desired function as an argument:
                     - video: [43. Example 1. Custom model (multimodel)](https://youtu.be/ttm--W1OBVU)
                     - video: [44. Example 1. Custom model (multimodel) Part 2](https://youtu.be/yqvkXNADsYU)
 
+### Local Model Serving Use Cases
+
+In this section, we explore how MLflow enables local model serving. You'll learn how to launch a local MLflow server to deploy and serve ML models, making them accessible for real-time predictions via REST API endpoints. This approach is useful for testing, prototyping, and integrating models into local applications before moving to production environments.
+
+#### Iris Classifier
+
+
 
 ## Contributing
 
diff --git a/examples/iris_classifier/data.py b/examples/iris_classifier/data.py
@@ -0,0 +1,26 @@
+from sklearn.datasets import load_iris
+from sklearn.model_selection import train_test_split
+from typing import Optional
+from typing import Tuple
+import pandas as pd
+
+
+def get_train_test_data(
+    test_size: Optional[float] = 0.2, random_state: Optional[int] = 42
+) -> Tuple[pd.DataFrame, pd.DataFrame, pd.Series, pd.Series]:
+    """
+    Build a train/test partition of the scikit-learn iris dataset.
+    The dataset is loaded with ``as_frame=True`` before it is split.
+
+    :param test_size: Forwarded to ``train_test_split`` as ``test_size`` (default 0.2).
+    :param random_state: Forwarded to ``train_test_split`` as ``random_state`` (default 42).
+    :return: The tuple ``(X_train, X_test, y_train, y_test)``; features are taken
+             from ``iris.data`` and labels from ``iris.target``.
+    """
+    dataset = load_iris(as_frame=True)
+    features, labels = dataset.data, dataset.target
+    # Same order the split function emits: X_train, X_test, y_train, y_test.
+    pieces = train_test_split(
+        features, labels, test_size=test_size, random_state=random_state
+    )
+    return tuple(pieces)
diff --git a/examples/iris_classifier/inference.py b/examples/iris_classifier/inference.py
@@ -0,0 +1,21 @@
+import mlflow
+from examples.utils.decorators import mlflow_tracking_uri
+from examples.iris_classifier.data import get_train_test_data
+
+
+@mlflow_tracking_uri
+def main():
+    """
+    Score the iris test split with the registered model aliased ``production``.
+
+    Prints the first rows of the scored frame followed by a completion message.
+    """
+    _, x_test, _, _ = get_train_test_data()
+    registered_model_name = "Iris_Classifier_Model"
+    model_path = f"models:/{registered_model_name}@production"
+    model = mlflow.sklearn.load_model(model_path)
+
+    # assign() builds a new frame, so the split returned by the helper is not mutated.
+    scored = x_test.assign(predictions=model.predict(x_test))
+    print(scored.head())
+    print("Batch inference completed successfully.")
diff --git a/examples/iris_classifier/online_inference.py b/examples/iris_classifier/online_inference.py
@@ -0,0 +1,63 @@
+from examples.iris_classifier.data import get_train_test_data
+import httpx
+import json
+import pandas as pd
+
+
+def get_predictions_from_response(response):
+    """
+    Extract the ``predictions`` entry from a REST API response.
+
+    :param response: The response object from the HTTP request.
+    :return: The value stored under ``"predictions"`` in the JSON body.
+    :raises Exception: If the status code is not 200, or if the JSON body
+        has no non-null ``"predictions"`` entry.
+    """
+    # Guard clause: anything other than 200 is reported with its body text.
+    if response.status_code != 200:
+        raise Exception(f"Error: {response.status_code} - {response.text}")
+    result = response.json().get("predictions")
+    if result is None:
+        raise Exception("No predictions found in the response.")
+    return result
+
+
+def get_payload(samples: int) -> tuple:
+    """
+    Build the request payload for online inference and its matching labels.
+
+    :param samples: Number of leading test rows to include in the payload.
+    :return: A ``(payload, labels)`` tuple: the ``dataframe_split`` payload
+        dictionary and the labels of the same leading test rows.
+    """
+    _, x_test, _, y_test = get_train_test_data()
+    # Uncomment the following line to make the api call fail
+    # x_test["sepal length (cm)"] = ["" for _ in range(len(x_test))]
+    rows = x_test.iloc[0:samples]
+    payload = {"dataframe_split": rows.to_dict(orient="split")}
+    return payload, y_test.iloc[0:samples]
+
+
+def main() -> None:
+    """
+    Perform online inference against a locally served model over REST.
+
+    To deploy the model in the local server, run the following command:
+    `poetry run mlflow models serve -m models:/Iris_Classifier_Model@production --env-manager local`
+
+    The request below targets port 5000 on 127.0.0.1.
+    """
+    payload, labels = get_payload(1)
+    url = "http://127.0.0.1:5000/invocations"
+
+    print(payload)
+    headers = {"Content-Type": "application/json"}
+
+    # The body is already serialized, so it goes in `content`; httpx deprecates
+    # passing a string through `data`.
+    response = httpx.post(url, content=json.dumps(payload), headers=headers)
+    predictions = get_predictions_from_response(response)
+    results = pd.DataFrame(
+        {"predictions": predictions, "labels": labels}
+    )
+    print(results)
diff --git a/examples/iris_classifier/train.py b/examples/iris_classifier/train.py
@@ -0,0 +1,70 @@
+from sklearn.ensemble import RandomForestClassifier
+from examples.iris_classifier.data import get_train_test_data
+from examples.utils.decorators import mlflow_tracking_uri
+from examples.utils.decorators import mlflow_client
+from examples.utils.decorators import mlflow_experiment
+from typing import Optional
+from typing import Dict
+from mlflow.models import infer_signature
+import mlflow
+
+
+def train(
+    x_train, y_train, params: Optional[Dict[str, object]] = None
+) -> RandomForestClassifier:
+    """
+    Fit a Random Forest Classifier on the training data and return it.
+    :param x_train: The training features (input data).
+    :param y_train: The training labels (target data).
+    :param params: Keyword arguments for the classifier; ``None`` means defaults.
+    :return: The trained Random Forest Classifier model.
+    """
+    clf = RandomForestClassifier(**(params or {}))
+    return clf.fit(x_train, y_train)
+
+
+@mlflow_tracking_uri
+@mlflow_experiment(name="iris_classifier")
+@mlflow_client
+def main(**kwargs) -> None:
+    """
+    Train the iris classifier, register it, alias it and evaluate it.
+
+    :param kwargs: Must contain ``mlflow_client``, the client used to set the alias.
+    """
+    x_train, x_test, y_train, y_test = get_train_test_data()
+    hyperparameters = {"n_estimators": 1, "max_depth": 10}
+    classifier = train(x_train, y_train, hyperparameters)
+    signature = infer_signature(x_train, y_train)
+    # Evaluation frame: test features plus the true label in a "target" column.
+    eval_frame = x_test.assign(target=y_test)
+
+    client = kwargs["mlflow_client"]
+    registered_model_name = "Iris_Classifier_Model"
+    with mlflow.start_run(run_name="training-rfc-model") as active_run:
+        mlflow.log_params(classifier.get_params())
+        mlflow.sklearn.log_model(
+            sk_model=classifier,
+            artifact_path="model",
+            signature=signature,
+            input_example=x_train.iloc[0:3],
+            registered_model_name=registered_model_name,
+        )
+
+        # Point the "production" alias at the first version the search returns.
+        versions = mlflow.search_model_versions(
+            filter_string=f"name='{registered_model_name}'", max_results=1
+        )
+        client.set_registered_model_alias(
+            name=registered_model_name,
+            version=versions[0].version,
+            alias="production",
+        )
+
+        # Evaluate the model artifact logged by this run against the test frame.
+        mlflow.evaluate(
+            model=f"runs:/{active_run.info.run_id}/model",
+            data=eval_frame,
+            model_type="classifier",
+            targets="target",
+        )
diff --git a/mlflow_for_ml_dev/notebooks/local_model_serving/deploying_local_iris_model.ipynb b/mlflow_for_ml_dev/notebooks/local_model_serving/deploying_local_iris_model.ipynb
@@ -0,0 +1,189 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "7e44f382",
+   "metadata": {},
+   "source": [
+    "# Local Model Serving with MLflow"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 37,
+   "id": "f7c4b8ed",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import httpx \n",
+    "import json\n",
+    "import mlflow\n",
+    "from mlflow_for_ml_dev.src.utils.folder_operations import get_project_root\n",
+    "\n",
+    "# set mlflow tracking uri\n",
+    "mlflow.set_tracking_uri(uri=(get_project_root() / 'mlruns').as_uri())"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "94833c27",
+   "metadata": {},
+   "source": [
+    "```shell\n",
+    "mlflow models serve --options\n",
+    "```\n",
+    "\n",
+    "To run the code below make sure you deploy the model using.\n",
+    "\n",
+    "`poetry run mlflow models serve --model-uri models:/Iris_Classifier_Model@production --env-manager local`"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "358ba627",
+   "metadata": {},
+   "source": [
+    "## Scoring Iris Classifier Model"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 50,
+   "id": "096a2fa0",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "url = \"http://127.0.0.1:5001/invocations\"\n",
+    "\n",
+    "payload = {'dataframe_split':\n",
+    "            {\n",
+    "                'columns': ['sepal length (cm)', 'sepal width (cm)', 'petal length (cm)', 'petal width (cm)'], \n",
+    "                'data': [[6.1, 2.8, 4.7, 1.2]]\n",
+    "            }\n",
+    "        } \n",
+    "headers = {\"Content-Type\": \"application/json\"}\n",
+    "response = httpx.post(url, data=json.dumps(payload), headers=headers)\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 51,
+   "id": "4cee092a",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "<Response [200 OK]>"
+      ]
+     },
+     "execution_count": 51,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "response"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "2ce72d97",
+   "metadata": {},
+   "source": [
+    "## Signature validation"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 52,
+   "id": "cba325a0",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "url = \"http://127.0.0.1:5001/invocations\"\n",
+    "\n",
+    "payload = {'dataframe_split':\n",
+    "            {\n",
+    "                'columns': ['sepal length (cm)', 'sepal width (cm)', 'petal length (cm)', 'petal width (cm)'], \n",
+    "                'data': [[6.1, 2.8, 4.7, \"string\"]] # invalid data type\n",
+    "            }\n",
+    "        } \n",
+    "headers = {\"Content-Type\": \"application/json\"}\n",
+    "response = httpx.post(url, data=json.dumps(payload), headers=headers)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 53,
+   "id": "dadf245c",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "<Response [400 BAD REQUEST]>"
+      ]
+     },
+     "execution_count": 53,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "response"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 54,
+   "id": "da6b0d77",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "{'error_code': 'BAD_REQUEST',\n",
+       " 'message': 'Invalid input. Data is not compatible with model signature. Failed to convert column petal width (cm) to type \\'float64\\'. Error: \\'ValueError(\"could not convert string to float: \\'string\\'\")\\''}"
+      ]
+     },
+     "execution_count": 54,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "response.json()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "0b064f0c",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.9"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/pyproject.toml b/pyproject.toml