Spaces:

varunkul
/

Voice-guard

Sleeping

App Files Files Community

Voice-guard / app /api.py

varunkul

Upload 6 files

e2c61ce verified about 1 month ago

raw

history blame contribute delete

2.28 kB

	import os, io, base64
	import numpy as np
	from fastapi import FastAPI, UploadFile, File, Form
	from fastapi.middleware.cors import CORSMiddleware
	from pydantic import BaseModel
	from typing import Optional, Dict, Any
	from PIL import Image
	from matplotlib import cm

	# Select the detector implementation from the DETECTOR_BACKEND environment
	# variable (case-insensitive); "wav2vec2" is used when it is unset.
	BACKEND = os.getenv("DETECTOR_BACKEND", "wav2vec2").lower()
	try:
	    # Prefer package-relative imports.
	    if BACKEND == "wav2vec2":
	        from .inference_wav2vec import Detector  # type: ignore
	    else:
	        from .inference import Detector  # type: ignore
	except ImportError:
	    # Fall back to absolute imports when the relative form cannot be
	    # resolved. Only ImportError is caught so that any other failure raised
	    # while the inference module is loading surfaces directly instead of
	    # being hidden behind a second import attempt.
	    if BACKEND == "wav2vec2":
	        from app.inference_wav2vec import Detector  # type: ignore
	    else:
	        from app.inference import Detector  # type: ignore

	# Per-backend default weights file; MODEL_WEIGHTS_PATH overrides it.
	DEFAULT_WEIGHTS = (
	    "app/models/weights/wav2vec2_classifier.pth"
	    if BACKEND == "wav2vec2"
	    else "app/models/weights/cnn_melspec.pth"
	)
	WEIGHTS = os.getenv("MODEL_WEIGHTS_PATH", DEFAULT_WEIGHTS)

	# Constructed once at import time; the /analyze handler reuses this instance.
	det = Detector(weights_path=WEIGHTS)

	# ASGI application object; routes below are registered on it.
	app = FastAPI(
	    title="Voice Guard API",
	    version="1.1.0",
	)

	# Wide-open CORS: any origin, method and header is accepted.
	app.add_middleware(
	    CORSMiddleware,
	    allow_headers=["*"],
	    allow_methods=["*"],
	    allow_origins=["*"],  # tighten in prod
	)

	class AnalyzeResponse(BaseModel):
	    """Response schema declared for the POST /analyze endpoint.

	    Every field except ``heatmap_b64`` is expected to come from the
	    detector's ``predict_proba`` result, which the handler unpacks into the
	    response. The exact meaning of those values is defined by the detector.
	    """

	    # Scores and verdict.
	    # NOTE(review): presumably class probabilities and the chosen class name;
	    # confirm against the Detector implementation.
	    human: float
	    ai: float
	    label: str

	    # Decision threshold and, optionally, where it came from.
	    threshold: float
	    threshold_source: Optional[str] = None

	    # Which detector backend produced the result, and the caller's hint.
	    backend: str
	    source_hint: str

	    # Optional extras; they default to None when not supplied.
	    replay_score: Optional[float] = None
	    decision: Optional[str] = None
	    decision_details: Optional[Dict[str, Any]] = None

	    # PNG heatmap encoded as a "data:image/png;base64,..." URI.
	    heatmap_b64: str

	def heatmap_png_b64(cam: np.ndarray) -> str:
	    """Render an activation map as a magma-coloured PNG data URI.

	    Args:
	        cam: Array of activation values. Values outside [0, 1] are clipped.
	            NOTE(review): presumably a 2-D map; confirm against the caller.

	    Returns:
	        A ``data:image/png;base64,...`` string containing the encoded PNG.
	    """
	    # Clamp into the colormap's input range before colouring.
	    normalized = np.clip(cam, 0.0, 1.0).astype(np.float32)

	    # The colormap yields RGBA floats; keep RGB only and scale to 8-bit.
	    rgba = cm.magma(normalized)
	    rgb = (rgba[..., :3] * 255).astype(np.uint8)

	    with io.BytesIO() as png_buffer:
	        Image.fromarray(rgb).save(png_buffer, format="PNG")
	        encoded = base64.b64encode(png_buffer.getvalue())

	    return "data:image/png;base64," + encoded.decode("ascii")

	@app.post("/analyze", response_model=AnalyzeResponse)
	async def analyze(file: UploadFile = File(...), source_hint: str = Form("auto")):
	    """Score an uploaded file with the detector and attach a heatmap.

	    Args:
	        file: Uploaded file; its full contents are read into memory.
	        source_hint: Form field forwarded unchanged to the detector
	            (defaults to "auto").

	    Returns:
	        The mapping returned by ``det.predict_proba`` with an added
	        ``heatmap_b64`` entry holding the rendered heatmap data URI.

	    Raises:
	        HTTPException: 400 when the uploaded file contains no bytes.
	    """
	    # Imported here so this handler does not depend on edits to the
	    # module-level import block.
	    from fastapi import HTTPException

	    raw = await file.read()
	    if not raw:
	        # Reject empty uploads up front with a client error instead of
	        # handing zero bytes to the detector.
	        raise HTTPException(status_code=400, detail="Uploaded file is empty.")

	    proba = det.predict_proba(raw, source_hint=source_hint)
	    explanation = det.explain(raw, source_hint=source_hint)
	    cam = np.array(explanation["cam"], dtype=np.float32)
	    return {
	        **proba,
	        "heatmap_b64": heatmap_png_b64(cam),
	    }

	@app.get("/health")
	def health():
	    """Report that the service is up and which detector backend is active."""
	    status = {"ok": True, "backend": BACKEND}
	    return status