Shankarm08 committed on
Commit
185ec49
·
verified ·
1 Parent(s): adac503

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +19 -0
app.py ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
"""Minimal FastAPI service that exposes text generation from a causal LM."""

import threading

from transformers import AutoTokenizer, AutoModelForCausalLM
from fastapi import FastAPI, Body
from fastapi.concurrency import run_in_threadpool

# Checkpoint used for both the tokenizer and the model.
MODEL_NAME = "meta-llama/Meta-Llama-3-8B"
# Upper bound on *newly generated* tokens (the prompt is not counted).
MAX_NEW_TOKENS = 50
# Beam width passed to `model.generate`.
NUM_BEAMS = 4

app = FastAPI()

# Load pre-trained model and tokenizer once, at import time, so every request
# reuses the same objects.
tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
model = AutoModelForCausalLM.from_pretrained(MODEL_NAME)

# Generation runs in worker threads (see `generate_text`). The lock keeps
# requests strictly one-at-a-time, as they were when generation ran inline on
# the event loop, and avoids concurrent use of the shared tokenizer/model.
_generation_lock = threading.Lock()


def _generate(input_text: str) -> str:
    """Tokenize *input_text*, run beam-search generation, and decode the result.

    This is blocking work and must not be called directly from the event
    loop. The decoded string is the first returned sequence with special
    tokens stripped.
    """
    with _generation_lock:
        # Calling the tokenizer (rather than `.encode`) also yields the
        # attention mask, which is forwarded to `generate` via `**inputs`.
        inputs = tokenizer(input_text, return_tensors="pt")
        # `max_new_tokens` bounds only the continuation; `max_length` would
        # count the prompt too and leave no room for prompts >= 50 tokens.
        output = model.generate(
            **inputs,
            max_new_tokens=MAX_NEW_TOKENS,
            num_beams=NUM_BEAMS,
        )
        return tokenizer.decode(output[0], skip_special_tokens=True)


@app.post("/generate")
async def generate_text(input_text: str = Body(..., embed=True)):
    """Generate text for the prompt in the JSON body.

    Expects a JSON object with an ``input_text`` field (``embed=True``) and
    returns ``{"generated_text": <decoded output>}``.

    The blocking generation is pushed to the threadpool so the event loop
    stays free to accept and answer other requests while the model runs.
    """
    generated_text = await run_in_threadpool(_generate, input_text)
    return {"generated_text": generated_text}


if __name__ == "__main__":
    import uvicorn

    uvicorn.run(app, host="0.0.0.0", port=8000)