Add api/main.py

f830825 verified 3 months ago

7.25 kB

	#!/usr/bin/env python3
	"""
	RetinaSense-ViT — FastAPI Inference Server (Phase 4B)
	======================================================
	REST API for clinical retinal screening integration.

	Endpoints:
	POST /predict — single image prediction
	POST /predict/batch — multiple images
	GET /health — service health check
	"""

	import os, sys, json, io, time, tempfile, warnings
	import numpy as np
	import cv2
	import torch
	import torch.nn as nn
	import torch.nn.functional as F
	from torchvision import transforms
	from PIL import Image
	import timm
	from fastapi import FastAPI, UploadFile, File, HTTPException
	from fastapi.responses import JSONResponse
	from pydantic import BaseModel
	from typing import List, Optional
	warnings.filterwarnings('ignore')

	# ================================================================
	# CONFIG
	# ================================================================
	DEVICE = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
	IMG_SIZE = 224
	NUM_CLASSES = 5
	CLASS_NAMES = ['Normal', 'Diabetes/DR', 'Glaucoma', 'Cataract', 'AMD']
	SEVERITY_NAMES = ['No DR', 'Mild', 'Moderate', 'Severe', 'Proliferative']
	BASE_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__))) # repo root

	# Config files: look in configs/ first (committed to git), fall back to original locations
	def _cfg(name, subdir):
	committed = os.path.join(BASE_DIR, 'configs', name)
	original = os.path.join(BASE_DIR, subdir, name)
	return committed if os.path.exists(committed) else original

	# Load configs
	with open(_cfg('fundus_norm_stats.json', 'data')) as f:
	ns = json.load(f)
	NORM_MEAN, NORM_STD = ns['mean_rgb'], ns['std_rgb']
	with open(_cfg('temperature.json', 'outputs_v3')) as f:
	T_OPT = json.load(f)['temperature']
	with open(_cfg('thresholds.json', 'outputs_v3')) as f:
	THRESHOLDS = json.load(f)['thresholds']


	# ================================================================
	# MODEL
	# ================================================================
	class MultiTaskViT(nn.Module):
	def __init__(self, n_disease=5, n_severity=5, drop=0.3):
	super().__init__()
	self.backbone = timm.create_model('vit_base_patch16_224', pretrained=False, num_classes=0)
	self.drop = nn.Dropout(drop)
	self.disease_head = nn.Sequential(
	nn.Linear(768, 512), nn.BatchNorm1d(512), nn.ReLU(), nn.Dropout(0.3),
	nn.Linear(512, 256), nn.BatchNorm1d(256), nn.ReLU(), nn.Dropout(0.2),
	nn.Linear(256, n_disease),
	)
	self.severity_head = nn.Sequential(
	nn.Linear(768, 256), nn.BatchNorm1d(256), nn.ReLU(), nn.Dropout(0.3),
	nn.Linear(256, n_severity),
	)

	def forward(self, x):
	f = self.backbone(x)
	f = self.drop(f)
	return self.disease_head(f), self.severity_head(f)


	model = MultiTaskViT().to(DEVICE)
	ckpt = torch.load(os.path.join(BASE_DIR, 'outputs_v3', 'best_model.pth'),
	map_location=DEVICE, weights_only=False)
	model.load_state_dict(ckpt['model_state_dict'])
	model.eval()

	normalize = transforms.Normalize(NORM_MEAN, NORM_STD)
	val_transform = transforms.Compose([
	transforms.ToPILImage(), transforms.ToTensor(), normalize,
	])


	# ================================================================
	# HELPERS
	# ================================================================
	def preprocess(img_bytes):
	img = Image.open(io.BytesIO(img_bytes)).convert('RGB')
	img_np = cv2.resize(np.array(img), (IMG_SIZE, IMG_SIZE))
	lab = cv2.cvtColor(img_np, cv2.COLOR_RGB2LAB)
	clahe = cv2.createCLAHE(clipLimit=2.0, tileGridSize=(8, 8))
	lab[:, :, 0] = clahe.apply(lab[:, :, 0])
	processed = cv2.cvtColor(lab, cv2.COLOR_LAB2RGB)
	return val_transform(processed).unsqueeze(0)


	RECOMMENDATIONS = {
	0: 'Routine re-screening in 12 months.',
	1: {0: 'Annual diabetic eye screening.', 1: 'Re-screen in 6-9 months.',
	2: 'Refer to ophthalmologist within 3 months.',
	3: 'URGENT: Retina specialist within 2-4 weeks.',
	4: 'URGENT: Immediate anti-VEGF/PRP referral.'},
	2: 'Refer for IOP measurement and visual field test.',
	3: 'Refer for visual acuity assessment.',
	4: 'Refer for OCT and anti-VEGF evaluation.',
	}


	def get_recommendation(pred, sev=0):
	r = RECOMMENDATIONS.get(pred, '')
	return r.get(sev, r.get(0, '')) if isinstance(r, dict) else r


	@torch.no_grad()
	def run_inference(tensor):
	tensor = tensor.to(DEVICE)
	d_out, s_out = model(tensor)
	probs = torch.softmax(d_out / T_OPT, dim=1).cpu().numpy()[0]
	sev_probs = torch.softmax(s_out, dim=1).cpu().numpy()[0]
	pred = int(probs.argmax())
	conf = float(probs[pred])
	sev = int(sev_probs.argmax()) if pred == 1 else -1
	return pred, conf, probs, sev


	# ================================================================
	# FASTAPI APP
	# ================================================================
	app = FastAPI(
	title="RetinaSense-ViT API",
	description="AI-powered retinal disease screening API",
	version="3.0.0",
	)


	class PredictionResult(BaseModel):
	prediction: str
	class_index: int
	confidence: float
	severity: Optional[str] = None
	probabilities: dict
	recommendation: str
	inference_time_ms: float


	@app.get("/health")
	async def health():
	return {
	"status": "healthy",
	"model": "ViT-Base/16 (RetinaSense v3.0)",
	"device": str(DEVICE),
	"classes": CLASS_NAMES,
	"checkpoint_epoch": ckpt['epoch'] + 1,
	}


	@app.post("/predict", response_model=PredictionResult)
	async def predict(image: UploadFile = File(...)):
	if not image.content_type or not image.content_type.startswith('image/'):
	raise HTTPException(400, "File must be an image")

	img_bytes = await image.read()
	t0 = time.time()
	tensor = preprocess(img_bytes)
	pred, conf, probs, sev = run_inference(tensor)
	elapsed = (time.time() - t0) * 1000

	return PredictionResult(
	prediction=CLASS_NAMES[pred],
	class_index=pred,
	confidence=conf,
	severity=SEVERITY_NAMES[sev] if sev >= 0 else None,
	probabilities={cn: float(probs[i]) for i, cn in enumerate(CLASS_NAMES)},
	recommendation=get_recommendation(pred, max(sev, 0)),
	inference_time_ms=round(elapsed, 1),
	)


	@app.post("/predict/batch")
	async def predict_batch(images: List[UploadFile] = File(...)):
	results = []
	for image in images:
	img_bytes = await image.read()
	t0 = time.time()
	tensor = preprocess(img_bytes)
	pred, conf, probs, sev = run_inference(tensor)
	elapsed = (time.time() - t0) * 1000
	results.append({
	"filename": image.filename,
	"prediction": CLASS_NAMES[pred],
	"confidence": conf,
	"severity": SEVERITY_NAMES[sev] if sev >= 0 else None,
	"probabilities": {cn: float(probs[i]) for i, cn in enumerate(CLASS_NAMES)},
	"recommendation": get_recommendation(pred, max(sev, 0)),
	"inference_time_ms": round(elapsed, 1),
	})
	return {"results": results, "total": len(results)}


	if __name__ == '__main__':
	import uvicorn
	uvicorn.run(app, host='0.0.0.0', port=8000)