Spaces:
Sleeping
Sleeping
File size: 1,480 Bytes
05dfd9d 71eb861 b0ccf04 71eb861 b0ccf04 05dfd9d 71eb861 b0ccf04 71eb861 b0ccf04 71eb861 b0ccf04 71eb861 b0ccf04 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 |
import os
from fastapi import FastAPI, HTTPException, Depends
from pydantic import BaseModel
from fastapi.security.api_key import APIKeyHeader
from utils import retrive_context, generate_response
# Initialize FastAPI
app = FastAPI()
class QueryRequest(BaseModel):
# Asked query should be in string format
query: str
class QueryResponse(BaseModel):
# Response should be in string format
response: str
api_key_header = APIKeyHeader(name="Authorization", auto_error=False)
def get_api_key(api_key: str = Depends(api_key_header)):
if api_key == os.getenv("API_KEY"):
return api_key
else:
raise HTTPException(status_code=401, detail="Invalid API key")
@app.post("/infer", response_model=QueryResponse)
def infer(query_request: QueryRequest, api_key: str = Depends(get_api_key)):
query = query_request.query
context = retrive_context(query)
if context == 500:
raise HTTPException(status_code=500, detail="Error retrieving context")
response = generate_response(query, context)
if response == 500:
raise HTTPException(status_code=500, detail="Error generating response")
return QueryResponse(response=response)
# Root endpoint for testing
@app.get("/")
def read_root():
return {"message": "Inference API is running"}
if __name__ == "__main__":
import uvicorn
uvicorn.run(app, host="127.0.0.1", port=8000, log_level="info")
|