Spaces:

G44mlops
/

API

Running

API

File size: 8,178 Bytes

250a0ca

import torch
from pathlib import Path
from huggingface_hub import hf_hub_download
from PIL import Image
from torchvision import transforms
from medmnist import INFO
import gradio as gr
import os
import base64
from io import BytesIO
from huggingface_hub import HfApi
from datetime import datetime
import io

from model import resnet18, resnet50

# Inference device: prefer CUDA, then Apple MPS, and fall back to the CPU.
if torch.cuda.is_available():
    DEVICE = torch.device("cuda")
elif torch.backends.mps.is_available():
    DEVICE = torch.device("mps")
else:
    DEVICE = torch.device("cpu")

# Runtime configuration, all read from environment variables (None when unset).
AUTH_TOKEN = os.getenv("APP_TOKEN")  # password protecting access to the app
DATASET_REPO = os.getenv("Dataset_repo")  # dataset repo for uploads, e.g. "G44mlops/API_received"
HF_TOKEN = os.getenv("HF_TOKEN")  # token used to access the dataset repo
MODEL = os.getenv("Model_repo")  # model repo, e.g. "G44mlops/ResNet-medmnist"

#taken from Mikolaj code with closed PR
def load_model_from_hf(
    repo_id: str,
    filename: str,
    model_type: str,
    num_classes: int,
    in_channels: int,
    device: str,
) -> torch.nn.Module:
    """Fetch a checkpoint from the Hugging Face Hub and build the matching network.

    Args:
        repo_id: Hub repository that hosts the checkpoint.
        filename: Name of the checkpoint file inside that repository.
        model_type: ``"resnet18"`` selects ResNet-18; any other value
            selects ResNet-50.
        num_classes: Number of output classes passed to the model constructor.
        in_channels: Number of input channels passed to the model constructor.
        device: Device the checkpoint is mapped to and the model is moved to.

    Returns:
        The model with the checkpoint's ``"model_state_dict"`` loaded, moved
        to ``device`` and switched to evaluation mode.
    """
    print(f"Downloading model from Hugging Face: {repo_id}/{filename}")
    weights_file = hf_hub_download(repo_id=repo_id, filename=filename)

    # Anything that is not exactly "resnet18" falls back to the ResNet-50 builder.
    build_network = resnet18 if model_type == "resnet18" else resnet50
    net = build_network(num_classes=num_classes, in_channels=in_channels)

    # The checkpoint is a dict; only its "model_state_dict" entry is used.
    saved = torch.load(weights_file, map_location=device, weights_only=True)
    net.load_state_dict(saved["model_state_dict"])

    net.to(device)
    net.eval()
    return net
#taken from Mikolaj code with closed PR


# Image preprocessing pipeline (basic so far, can be improved)
def get_preprocessing_pipeline() -> transforms.Compose:
    """Build the transform chain applied to every image before inference."""
    # The channel count is read from the MedMNIST metadata of the reference
    # dataset ("organamnist").
    n_channels = INFO["organamnist"]["n_channels"]
    # Dataset statistics are not used: normalise with 0.5 mean/std per channel.
    half_per_channel = (0.5,) * n_channels
    steps = [
        transforms.Resize(256),
        transforms.CenterCrop(224),
        transforms.ToTensor(),
        transforms.Normalize(mean=half_per_channel, std=half_per_channel),
    ]
    return transforms.Compose(steps)
def get_class_labels(data_flag: str = "organamnist") -> dict[str, str]:
    """Return the class-label mapping of a MedMNIST dataset.

    Args:
        data_flag: Key of the dataset in ``medmnist.INFO``.

    Returns:
        The ``"label"`` entry of the dataset metadata. Callers in this file
        index it with the stringified class index (``labels[str(idx)]``), so
        it is a mapping rather than a list.

    Raises:
        KeyError: If ``data_flag`` is not a key of ``INFO``.
    """
    return INFO[data_flag]["label"]

def save_image_to_hf_folder(image_path, prediction_label):
    """Upload an image and a small metadata file to the HF dataset repo.

    Two files are written under ``uploads/`` in ``DATASET_REPO``, both
    prefixed with the same timestamp: the image itself and a
    ``<stem>_metadata.txt`` file holding the prediction and the timestamp.

    Args:
        image_path: Local path of the image file to upload.
        prediction_label: Label predicted for the image; stored in the
            metadata file.
    """
    source = Path(image_path)
    # Second-resolution local timestamp, shared by both uploaded files so the
    # image and its metadata can be paired by name.
    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
    metadata = f"prediction: {prediction_label}\ntimestamp: {timestamp}"

    api = HfApi()
    # Upload the image itself.
    api.upload_file(
        path_or_fileobj=image_path,
        path_in_repo=f"uploads/{timestamp}_{source.name}",
        repo_id=DATASET_REPO,
        repo_type="dataset",
        token=HF_TOKEN,
    )
    # Upload the metadata as a separate text file, straight from memory.
    api.upload_file(
        path_or_fileobj=io.BytesIO(metadata.encode()),
        path_in_repo=f"uploads/{timestamp}_{source.stem}_metadata.txt",
        repo_id=DATASET_REPO,
        repo_type="dataset",
        token=HF_TOKEN,
    )

def classify_images(images) -> str:
    """Classify uploaded images and return an HTML gallery of the results.

    Each image is converted to grayscale, preprocessed, run through the
    module-level ``model`` and rendered as a card showing the file name, the
    image (embedded as base64 JPEG) and the predicted label. Every classified
    image is also uploaded via ``save_image_to_hf_folder``.

    Args:
        images: A single image path, a list of image paths, or ``None``.

    Returns:
        An HTML string: a flex container with one card per image, or a short
        "no images" paragraph when nothing was uploaded.
    """
    # Local import keeps the block self-contained; the name ``html`` is not
    # used for a local variable so the stdlib module is never shadowed.
    from html import escape

    # Nothing uploaded (None or an empty list).
    if not images:
        return "<p>No images uploaded</p>"
    # A single upload may arrive as a bare path instead of a list.
    if isinstance(images, str):
        images = [images]

    cards = []
    for image_path in images:
        # Close the file handle as soon as the grayscale copy exists.
        with Image.open(image_path) as source:
            img = source.convert("L")  # the project works on grayscale images

        # The model lives on DEVICE, so the input batch must be moved there too.
        input_tensor = preprocess(img).unsqueeze(0).to(DEVICE)
        # Forward pass + softmax to get class probabilities.
        with torch.no_grad():
            output = model(input_tensor)
            probs = torch.nn.functional.softmax(output[0], dim=0)
            top_class = probs.argmax().item()
        label = class_labels[str(top_class)]

        # Base64-encode the grayscale image for inline embedding in the HTML.
        buffered = BytesIO()
        img.save(buffered, format="JPEG")
        img_str = base64.b64encode(buffered.getvalue()).decode()

        # The file name comes from the uploader: escape it (and the label)
        # before interpolating into markup.
        safe_name = escape(Path(image_path).name)
        safe_label = escape(str(label))
        cards.append(f"""
        <div style='border: 2px solid #ddd; padding: 15px; border-radius: 8px; background: #f9f9f9; width: 280px;'>
            <p style='font-size: 14px; color: #666; margin: 0 0 10px 0; text-align: center; font-weight: bold;'>{safe_name}</p>
            <img src='data:image/jpeg;base64,{img_str}' style='width: 250px; height: 250px; object-fit: contain; display: block; margin: 0 auto 10px;'>
            <p style='font-size: 18px; color: #0066cc; margin: 10px 0 0 0; text-align: center; font-weight: bold;'>{safe_label}</p>
        </div>
        """)

        # Store the image and its prediction in the HF dataset repo.
        save_image_to_hf_folder(image_path, label)

    container_open = "<div style='display: flex; flex-wrap: wrap; gap: 30px; padding: 20px; justify-content: center;'>"
    return container_open + "".join(cards) + "</div>"

###main code to launch Gradio app###

#prepare model and preprocessing pipeline (kind of backend)
# Backend: the model, preprocessing pipeline and label mapping are created once
# at module level and read as globals by classify_images.
model =  load_model_from_hf(  # loader taken from Mikolaj's code (closed PR)
            repo_id=MODEL, 
            filename="resnet18_best.pth",
            model_type="resnet18",
            # 11 classes / 1 channel are hard-coded here — presumably matching
            # the "organamnist" dataset used for preprocessing; TODO confirm.
            num_classes=11,
            in_channels=1,
            device=DEVICE,
        )
preprocess = get_preprocessing_pipeline()
class_labels = get_class_labels()
# Frontend: Gradio Blocks interface.
with gr.Blocks() as demo:
    # Page title.
    gr.Markdown("<h1 style='text-align: center;'> MLOps project - MedMNIST dataset Image Classifier</h1>")
    # Notice informing users that uploaded images are stored.
    # NOTE(review): the notice text contains typos ("agrree", "insures"); it is
    # a user-facing runtime string and is left unchanged here.
    gr.Markdown("This is a Gradio web application for MLOps course project. Given images are stored in our dataset. " \
    "By uploading images you agrree that they will be stored by us and insures that they can be stored by us. " \
    "If you somewhat passed the login and are not connected to the project, please do not upload any images. " )
    # Single-column page layout: upload area, buttons, then results.
    with gr.Column():
        # Heading of the upload section.
        gr.Markdown("<h2 style='text-align: center;'> Upload Images</h2>")
        # File picker accepting multiple image files.
        images_input = gr.File(file_count="multiple", file_types=["image"], label="Upload Images")
        # Row with the two action buttons.
        with gr.Row():
            submit_btn = gr.Button("Classify")
            reset_btn = gr.Button("Reset")
        # Heading of the results section.
        gr.Markdown("<h2 style='text-align: center;'> Results</h2>")
        # HTML component that receives the gallery returned by classify_images.
        output = gr.HTML(label="Results")
    # Reset callback: returns None for the file input and "" for the results.
    def reset():
        return None, ""
    # Wire the buttons to their callbacks.
    submit_btn.click(classify_images, inputs=images_input, outputs=output)
    reset_btn.click(reset, outputs=[images_input, output])


    # Launch the app. The bind address comes from GRADIO_SERVER_NAME and
    # defaults to 127.0.0.1. When APP_TOKEN is set, login is required with the
    # fixed user name "user" and the token as password; otherwise auth is off.
    # NOTE(review): launch() is called while still inside the `with gr.Blocks()`
    # context; Gradio's documented examples call it after the block — confirm
    # this placement is intentional.
    server_name = os.getenv("GRADIO_SERVER_NAME", "127.0.0.1")
    demo.launch(
        server_name=server_name,
        auth=[("user", AUTH_TOKEN)] if AUTH_TOKEN else None
        )