Spaces:

re-mind
/

DTD-XGBoost

Running

App Files Files Community

amaye15 commited on Jan 23

Commit

f9ce179

1 Parent(s): 01e7bff

Feat - Deployment

Browse files

Files changed (6) hide show

.gitignore +4 -0
Dockerfile +70 -0
README.md +3 -0
api/main.py +288 -0
api/model/saved_tuned_model.pkl +3 -0
requirements.txt +6 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,4 @@

+*env*
+*DS_Store*
+*.log
+*__pycache__*

Dockerfile ADDED Viewed

	@@ -0,0 +1,70 @@

+# Stage 1: Build stage
+FROM python:3.12-slim as builder
+# Set environment variables
+ENV PYTHONDONTWRITEBYTECODE=1 \
+    PYTHONUNBUFFERED=1 \
+    PATH="/root/.local/bin:$PATH"
+# Install system dependencies (curl and ca-certificates for uv installer)
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    curl \
+    ca-certificates \
+    && rm -rf /var/lib/apt/lists/*
+# Install uv using the official installer
+RUN curl -sSfL https://astral.sh/uv/install.sh | sh
+# Verify uv is installed and available
+RUN uv --version
+# Create a non-root user
+RUN useradd -m -u 1000 user
+# Set the working directory
+WORKDIR /app
+# Create a virtual environment
+RUN uv venv /opt/venv
+# Update PATH to include the virtual environment's bin directory
+ENV PATH="/opt/venv/bin:$PATH"
+# Copy only the requirements file first to leverage Docker cache
+COPY --chown=user ./requirements.txt /app/requirements.txt
+# Install dependencies into the virtual environment using uv
+RUN uv pip install --no-cache-dir -r requirements.txt
+# Copy the rest of the application code
+COPY --chown=user . /app
+# Stage 2: Runtime stage
+FROM python:3.12-slim
+# Create a non-root user
+RUN useradd -m -u 1000 user
+USER user
+# Set environment variables
+ENV PATH="/opt/venv/bin:$PATH" \
+    PYTHONUNBUFFERED=1
+# Set the working directory
+WORKDIR /app
+# Copy the virtual environment from the builder stage
+COPY --from=builder --chown=user /opt/venv /opt/venv
+# Copy only the necessary files from the builder stage
+COPY --from=builder --chown=user /app /app
+# Expose the port the app runs on
+EXPOSE 7860
+# Health check to ensure the application is running
+HEALTHCHECK --interval=30s --timeout=30s --start-period=5s --retries=3 \
+    CMD curl -f http://localhost:7860/health || exit 1
+# Command to run the application with hot reloading
+CMD ["uvicorn", "api.main:app", "--host", "0.0.0.0", "--port", "7860", "--reload"]

README.md CHANGED Viewed

@@ -6,6 +6,9 @@ colorTo: green
 sdk: docker
 pinned: false
 license: mit
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 sdk: docker
 pinned: false
 license: mit
+python_version: 3.11
+app_port: 7860
+app_file: api/main.py
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

api/main.py ADDED Viewed

	@@ -0,0 +1,288 @@

+# from fastapi import FastAPI, HTTPException, status, Depends
+# from fastapi.responses import RedirectResponse
+# from pydantic import BaseModel, conlist
+# import pandas as pd
+# from pycaret.classification import load_model, predict_model
+# import logging
+# from typing import Optional
+# import numpy as np
+# import os
+# # Constants
+# MODEL_PATH = "./api/model/saved_tuned_model"  # os.getenv("MODEL_PATH", "saved_tuned_model")  # Load model path from environment variable
+# EMBEDDING_DIMENSION = 1024  # Update this to match your model's expected input dimension
+# LOG_LEVEL = os.getenv("LOG_LEVEL", "INFO")  # Logging level from environment variable
+# # Configure logging
+# logging.basicConfig(level=LOG_LEVEL)
+# logger = logging.getLogger(__name__)
+# # Load the saved model
+# def load_tuned_model(model_path: str):
+#     """Load the pre-trained model from the specified path."""
+#     try:
+#         logger.info(f"Loading model from {model_path}...")
+#         model = load_model(model_path)
+#         logger.info("Model loaded successfully.")
+#         return model
+#     except Exception as e:
+#         logger.error(f"Failed to load the model: {str(e)}")
+#         raise RuntimeError(f"Model loading failed: {str(e)}")
+# tuned_model = load_tuned_model(MODEL_PATH)
+# # Define the input data model using Pydantic
+# class EmbeddingRequest(BaseModel):
+#     embedding: conlist(
+#         float, min_length=EMBEDDING_DIMENSION, max_length=EMBEDDING_DIMENSION
+#     )
+# # Define the response model
+# class PredictionResponse(BaseModel):
+#     predicted_label: int
+#     predicted_score: float
+# # Initialize FastAPI app
+# app = FastAPI(
+#     title="Embedding Prediction API",
+#     description="API for predicting labels and scores from embeddings using a pre-trained model.",
+#     version="1.0.0",
+# )
+# # Dependency for model access
+# def get_model():
+#     """Dependency to provide the loaded model to endpoints."""
+#     return tuned_model
+# # Define the prediction endpoint
+# @app.post("/predict", response_model=PredictionResponse)
+# async def predict(
+#     request: EmbeddingRequest,
+#     model=Depends(get_model),
+# ):
+#     """
+#     Predicts the label and score for a given embedding.
+#     Args:
+#         request (EmbeddingRequest): A request containing the embedding as a list of floats.
+#         model: The pre-trained model injected via dependency.
+#     Returns:
+#         PredictionResponse: A response containing the predicted label and score.
+#     """
+#     try:
+#         logger.info("Received prediction request.")
+#         # Convert the input embedding to a DataFrame
+#         input_data = pd.DataFrame(
+#             [request.embedding],
+#             columns=[f"embedding_{i}" for i in range(EMBEDDING_DIMENSION)],
+#         )
+#         # Make a prediction using the loaded model
+#         logger.info("Making prediction...")
+#         prediction = predict_model(model, data=input_data)
+#         # Extract the predicted label and score
+#         predicted_label = prediction["prediction_label"].iloc[0]
+#         predicted_score = prediction["prediction_score"].iloc[0]
+#         logger.info(
+#             f"Prediction successful: label={predicted_label}, score={predicted_score}"
+#         )
+#         return PredictionResponse(
+#             predicted_label=int(predicted_label),
+#             predicted_score=float(predicted_score),
+#         )
+#     except Exception as e:
+#         logger.error(f"Prediction failed: {str(e)}")
+#         raise HTTPException(
+#             status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+#             detail=f"An error occurred during prediction: {str(e)}",
+#         )
+# # Health check endpoint
+# @app.get("/health", status_code=status.HTTP_200_OK)
+# async def health_check():
+#     """Health check endpoint to verify the API is running."""
+#     return {"status": "healthy"}
+# # Run the FastAPI app
+# if __name__ == "__main__":
+#     import uvicorn
+#     uvicorn.run(app, host="0.0.0.0", port=8000)
+from fastapi import FastAPI, HTTPException, status, Depends
+from fastapi.responses import RedirectResponse
+from pydantic import BaseModel, conlist, ValidationError
+from pydantic_settings import BaseSettings
+import pandas as pd
+from pycaret.classification import load_model, predict_model
+import logging
+from typing import Optional, List
+import numpy as np
+import os
+# Configure structured logging
+logging.basicConfig(
+    level=logging.INFO, format="%(asctime)s - %(name)s - %(levelname)s - %(message)s"
+)
+logger = logging.getLogger(__name__)
+# Define settings using Pydantic BaseSettings
+class Settings(BaseSettings):
+    model_path: str = "./api/model/saved_tuned_model"
+    embedding_dimension: int = 1024
+    log_level: str = "INFO"
+    class Config:
+        env_file = ".env"
+        env_file_encoding = "utf-8"
+settings = Settings()
+# Load the saved model
+def load_tuned_model(model_path: str):
+    """Load the pre-trained model from the specified path."""
+    try:
+        logger.info(f"Loading model from {model_path}...")
+        model = load_model(model_path)
+        logger.info("Model loaded successfully.")
+        return model
+    except Exception as e:
+        logger.error(f"Failed to load the model: {str(e)}")
+        raise RuntimeError(f"Model loading failed: {str(e)}")
+tuned_model = load_tuned_model(settings.model_path)
+# Define the input data model using Pydantic
+class EmbeddingRequest(BaseModel):
+    embedding: conlist(
+        float,
+        min_length=settings.embedding_dimension,
+        max_length=settings.embedding_dimension,
+    )
+# Define the response model
+class PredictionResponse(BaseModel):
+    predicted_label: int
+    predicted_score: float
+# Initialize FastAPI app
+app = FastAPI(
+    title="Embedding Prediction API",
+    description="API for predicting labels and scores from embeddings using a pre-trained model.",
+    version="1.0.0",
+)
+# Dependency for model access
+def get_model():
+    """Dependency to provide the loaded model to endpoints."""
+    return tuned_model
+# Define the prediction endpoint
+@app.post("/predict", response_model=PredictionResponse)
+async def predict(
+    request: EmbeddingRequest,
+    model=Depends(get_model),
+):
+    """
+    Predicts the label and score for a given embedding.
+    Args:
+        request (EmbeddingRequest): A request containing the embedding as a list of floats.
+        model: The pre-trained model injected via dependency.
+    Returns:
+        PredictionResponse: A response containing the predicted label and score.
+    """
+    try:
+        logger.info("Received prediction request.")
+        # Convert the input embedding to a DataFrame
+        input_data = pd.DataFrame(
+            [request.embedding],
+            columns=[f"embedding_{i}" for i in range(settings.embedding_dimension)],
+        )
+        # Make a prediction using the loaded model
+        logger.info("Making prediction...")
+        prediction = predict_model(model, data=input_data)
+        # Validate the prediction output
+        if (
+            "prediction_label" not in prediction.columns
+            or "prediction_score" not in prediction.columns
+        ):
+            raise ValueError("Model prediction output is missing required columns.")
+        # Extract the predicted label and score
+        predicted_label = prediction["prediction_label"].iloc[0]
+        predicted_score = prediction["prediction_score"].iloc[0]
+        if predicted_label == 3:
+            predicted_label = 4
+        logger.info(
+            f"Prediction successful: label={predicted_label}, score={predicted_score}"
+        )
+        return PredictionResponse(
+            predicted_label=int(predicted_label),
+            predicted_score=float(predicted_score),
+        )
+    except ValidationError as e:
+        logger.error(f"Validation error: {str(e)}")
+        raise HTTPException(
+            status_code=status.HTTP_400_BAD_REQUEST,
+            detail=f"Invalid input data: {str(e)}",
+        )
+    except ValueError as e:
+        logger.error(f"Value error: {str(e)}")
+        raise HTTPException(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            detail=f"Model output validation failed: {str(e)}",
+        )
+    except Exception as e:
+        logger.error(f"Prediction failed: {str(e)}")
+        raise HTTPException(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            detail=f"An error occurred during prediction: {str(e)}",
+        )
+# Health check endpoint
+@app.get("/health", status_code=status.HTTP_200_OK)
+async def health_check():
+    """Health check endpoint to verify the API is running."""
+    return {"status": "healthy"}
+# Run the FastAPI app
+if __name__ == "__main__":
+    import uvicorn
+    uvicorn.run(app, host="0.0.0.0", port=8000)

api/model/saved_tuned_model.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8ebc64beeeb89ba17af4b68dd13e322ae5a411f858f4816435f8db96c7d46e71
+size 4142287

requirements.txt ADDED Viewed

	@@ -0,0 +1,6 @@

+pycaret==3.3.2
+fastapi==0.115.7
+uvicorn==0.34.0
+xgboost==2.1.3
+dill==0.3.9
+pydantic-settings==2.7.1