From b9ae34399bba7de4ec135b7d46fa80bcefc2ee9d Mon Sep 17 00:00:00 2001 From: copandrej Date: Fri, 28 Jun 2024 09:28:01 +0200 Subject: [PATCH] Added model deployment docker template, fixed typos. --- README.md | 6 ++-- docker_build/Dockerfile | 8 ----- docker_build/model_deployment/Dockerfile | 13 +++++++ docker_build/model_deployment/api-endpoint.py | 35 +++++++++++++++++++ .../model_deployment/requirements.txt | 11 ++++++ docker_build/ray_image/Dockerfile | 7 ++++ docker_build/{ => ray_image}/requirements.txt | 0 7 files changed, 69 insertions(+), 11 deletions(-) delete mode 100644 docker_build/Dockerfile create mode 100644 docker_build/model_deployment/Dockerfile create mode 100644 docker_build/model_deployment/api-endpoint.py create mode 100644 docker_build/model_deployment/requirements.txt create mode 100644 docker_build/ray_image/Dockerfile rename docker_build/{ => ray_image}/requirements.txt (100%) diff --git a/README.md b/README.md index 4c170da..ae53220 100644 --- a/README.md +++ b/README.md @@ -1,9 +1,9 @@ -# Self-Evolving AI/ML Workflow +# Self-Evolving AI/ML Workflow System AI/ML workflow solution is an MLOps system designed for deployment on a heterogeneous Kubernetes cluster with ARM and x86 GNU/Linux nodes, simulating distributed edge infrastructure common in RAN (Radio Access Networks), network slices and MEC (Multi-Access Edge Computing) devices. The system leverages the Ray framework for data processing, model training, and model inference, distributing the computational load on edge and non-edge nodes. -Data preparation can done with frameworks like Pandas or Ray Data while using Minio as a object store. +Data preparation can be done with frameworks like Pandas or Ray Data while using Minio as an object store. Model training, managed by Ray, supports Keras, TensorFlow, and PyTorch with minor modifications. MLflow handles model storage and management, facilitating easy access and updates. 
Trained models are deployed as inference API endpoints using Ray Serve or as Kubernetes deployments using helm charts and docker containers. @@ -11,7 +11,7 @@ Flyte orchestrates AI/ML workflows for retraining and redeployment of ML models, Prometheus and Grafana provide system monitoring. Developers register workflows with Flyte and monitor the system, while users can trigger workflows, monitor progress, and access models in MLflow. -For example, in a RAN network, the system can enhance and control network operations through periodic metrics collection and automated retraining, ensuring up-to-date AI/ML solutions. +For example, in a RAN network, the system can enhance and control network operations through periodic metrics collection and automated retraining, ensuring up-to-date AI/ML assisted solutions. This system aims to run autonomously, delivering efficient production AI/ML workflows at the network edge. The system is modular and can be adjusted to different use cases and requirements by enabling or disabling system components. diff --git a/docker_build/Dockerfile b/docker_build/Dockerfile deleted file mode 100644 index 8a55d4a..0000000 --- a/docker_build/Dockerfile +++ /dev/null @@ -1,8 +0,0 @@ -# TODO seperate docker files for both architecures, requirements and script for building images, maybe github ci/cd -# Start from the rayproject/2.9.3-py310-aarch64 image for raspberry pi - -FROM rayproject/ray:2.10.0-py310 - -# Install dependencies from requirements.txt -COPY requirements.txt . 
-RUN pip install -r requirements.txt diff --git a/docker_build/model_deployment/Dockerfile b/docker_build/model_deployment/Dockerfile new file mode 100644 index 0000000..758b3c2 --- /dev/null +++ b/docker_build/model_deployment/Dockerfile @@ -0,0 +1,13 @@ +# Use an official Python runtime as a parent image +FROM python:3.10 + +WORKDIR /app + +ADD . /app + +# Install any needed packages specified in requirements.txt, append your dependencies to requirements.txt +RUN pip install -r requirements.txt +EXPOSE 8000 + +# Run api-endpoint.py with uvicorn when the container launches +CMD ["uvicorn", "api-endpoint:app", "--host", "0.0.0.0", "--port", "8000", "--workers", "4", "--limit-concurrency", "8000", "--log-level", "error", "--backlog", "8000"] diff --git a/docker_build/model_deployment/api-endpoint.py b/docker_build/model_deployment/api-endpoint.py new file mode 100644 index 0000000..d303e68 --- /dev/null +++ b/docker_build/model_deployment/api-endpoint.py @@ -0,0 +1,35 @@ +from typing import List +from fastapi import FastAPI +import os +import mlflow + +# Add your own imports and functions here + +app = FastAPI() + +# SEMR's model store endpoint, CHANGE THIS TO YOUR OWN IP +os.environ['MLFLOW_TRACKING_URI'] = 'http://:31007' + +# Read the model version from the os variable (Defined in the helm charts) +model_version = os.getenv('MODEL_VERSION', "latest") + +# Modify the model_uri to point to the correct model name +model_uri = f"models://{model_version}" + +# Modify the MLflow loading function https://mlflow.org/docs/2.10.2/index.html +model = mlflow.pytorch.load_model(model_uri) +model.eval() +print("Model loaded!") + +@app.post("/") +async def echo(data: List[List[List[float]]]): + # Data transformations + # tensor_data = torch.tensor(data) + # tensor_data = tensor_data.unsqueeze(0) + + # Inference + # cnn_labels_array = cnn_predict(tensor_data, model) + # counts = Counter(cnn_labels_array) + + return {"prediction": str(counts)} + diff --git 
a/docker_build/model_deployment/requirements.txt b/docker_build/model_deployment/requirements.txt new file mode 100644 index 0000000..2129f0c --- /dev/null +++ b/docker_build/model_deployment/requirements.txt @@ -0,0 +1,11 @@ +# Requirements by model deployment template +fastapi +uvicorn +python-multipart +mlflow==2.10.2 + +# Add your own dependencies for model inference and data preprocessing +# numpy +# torch +# torch_geometric +# torchvision diff --git a/docker_build/ray_image/Dockerfile b/docker_build/ray_image/Dockerfile new file mode 100644 index 0000000..4f36fa2 --- /dev/null +++ b/docker_build/ray_image/Dockerfile @@ -0,0 +1,7 @@ +# Start from the rayproject/2.10.0-py310-aarch64 image for raspberry pi + +FROM rayproject/ray:2.10.0-py310 + +# Install dependencies from requirements.txt +COPY requirements.txt . +RUN pip install -r requirements.txt diff --git a/docker_build/requirements.txt b/docker_build/ray_image/requirements.txt similarity index 100% rename from docker_build/requirements.txt rename to docker_build/ray_image/requirements.txt