from fastapi import FastAPI, HTTPException
from fastapi.middleware.cors import CORSMiddleware
from pydantic import BaseModel
from typing import Optional
import torch
import torch.nn.functional as F
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from lime.lime_text import LimeTextExplainer
import numpy as np
import os

app = FastAPI(title="MedGuard API")

# --- NUCLEAR CORS FIX ---
# Allow EVERYTHING. This rules out CORS as the problem.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)
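# Note: the CORS spec forbids "Access-Control-Allow-Origin: *" on credentialed
# requests, so once CORS is ruled out, switch to an explicit allow-list, e.g.
# (hypothetical origin, not from the original code):
#   allow_origins=["https://medguard-frontend.example"]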

# --- CONFIGURATION ---
MODEL_PATH = "./model"
DEVICE = "cpu"

print(f"Loading Model from {MODEL_PATH}...")
model = None
tokenizer = None
try:
    tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH)
    model = AutoModelForSequenceClassification.from_pretrained(MODEL_PATH)
    model.to(DEVICE)
    model.eval()
    print("Model Loaded Successfully!")
except Exception as e:
    print(f"Error loading local model: {e}")
    # Fall back to the base checkpoint. Its classification head is freshly
    # initialized, so predictions are meaningless until the model is fine-tuned.
    MODEL_NAME = "csebuetnlp/banglabert"
    tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
    model = AutoModelForSequenceClassification.from_pretrained(MODEL_NAME, num_labels=3)
    model.to(DEVICE)
    model.eval()

# --- DATA MODELS ---
class QueryRequest(BaseModel):
    text: str

class PredictionResponse(BaseModel):
    label: str
    confidence: float
    probs: dict
    explanation: Optional[list] = None

LABELS = ["Highly Relevant", "Partially Relevant", "Not Relevant"]

def predict_proba_lime(texts):
    """Batch classifier for LIME: maps a list of strings to an (n, num_classes) array."""
    inputs = tokenizer(texts, return_tensors="pt", padding=True, truncation=True, max_length=128).to(DEVICE)
    with torch.no_grad():
        outputs = model(**inputs)
    return F.softmax(outputs.logits, dim=-1).cpu().numpy()
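
# Sanity check (hypothetical, not in the original code): LIME perturbs the input
# text and calls the function above on batches of strings, so it must return a
# probability matrix of shape (len(texts), 3):
#   assert predict_proba_lime(["demo"]).shape == (1, 3)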

@app.get("/")  # Health-check path assumed; align with whatever the frontend calls.
def health_check():
    return {"status": "active", "model": "MedGuard v1.0"}

@app.post("/predict", response_model=PredictionResponse)  # Path assumed; align with the frontend.
def predict(request: QueryRequest):
    if model is None or tokenizer is None:
        raise HTTPException(status_code=503, detail="Model not loaded")
    try:
        inputs = tokenizer(request.text, return_tensors="pt", truncation=True, max_length=128).to(DEVICE)
        with torch.no_grad():
            outputs = model(**inputs)
        probs = F.softmax(outputs.logits, dim=-1).cpu().numpy()[0]
        pred_idx = int(np.argmax(probs))

        # LIME (reduced to 20 samples for speed testing)
        explainer = LimeTextExplainer(class_names=LABELS, split_expression=lambda x: x.split())
        exp = explainer.explain_instance(request.text, predict_proba_lime, num_features=6, num_samples=20, labels=[pred_idx])
        lime_features = exp.as_list(label=pred_idx)

        return {
            "label": LABELS[pred_idx],
            "confidence": round(float(probs[pred_idx]) * 100, 2),
            "probs": {l: round(float(p), 4) for l, p in zip(LABELS, probs)},
            "explanation": lime_features,
        }
    except Exception as e:
        print(f"Server Error: {e}")  # Print error to backend terminal
        raise HTTPException(status_code=500, detail=str(e))

if __name__ == "__main__":
    import uvicorn
    # Bind to localhost specifically
    uvicorn.run(app, host="127.0.0.1", port=8000)
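
# --- Quick smoke test (hypothetical; assumes this file is saved as app.py) ---
# Start the server:
#   python app.py            # or: uvicorn app:app --host 127.0.0.1 --port 8000
# Then, from another shell:
#   curl http://127.0.0.1:8000/
#   curl -X POST http://127.0.0.1:8000/predict \
#        -H "Content-Type: application/json" \
#        -d '{"text": "sample query text"}'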