Gokulavelan committed on
Commit
f075bd4
·
1 Parent(s): b099d18
Files changed (2) hide show
  1. app/main.py +2 -2
  2. requirements.txt +0 -1
app/main.py CHANGED
@@ -4,7 +4,7 @@ from fastapi import FastAPI, HTTPException
4
  from pydantic import BaseModel
5
  from transformers import AutoModelForCausalLM, AutoTokenizer
6
 
7
- # Set Hugging Face cache directory (to avoid permission issues in Docker)
8
  os.environ["HF_HOME"] = "/app/huggingface_cache"
9
  os.environ["TRANSFORMERS_CACHE"] = "/app/huggingface_cache"
10
 
@@ -23,7 +23,7 @@ model = AutoModelForCausalLM.from_pretrained(
23
  model_name,
24
  trust_remote_code=True,
25
  torch_dtype=torch.float32, # Use float32 for CPU
26
- device_map="cpu" # Force CPU
27
  )
28
 
29
  @app.get("/")
 
4
  from pydantic import BaseModel
5
  from transformers import AutoModelForCausalLM, AutoTokenizer
6
 
7
+ # Set Hugging Face cache directory to avoid permission issues in Docker
8
  os.environ["HF_HOME"] = "/app/huggingface_cache"
9
  os.environ["TRANSFORMERS_CACHE"] = "/app/huggingface_cache"
10
 
 
23
  model_name,
24
  trust_remote_code=True,
25
  torch_dtype=torch.float32, # Use float32 for CPU
26
+ device_map={"": "cpu"} # Ensure CPU usage
27
  )
28
 
29
  @app.get("/")
requirements.txt CHANGED
@@ -3,4 +3,3 @@ uvicorn
3
  torch
4
  transformers
5
  accelerate
6
- bitsandbytes
 
3
  torch
4
  transformers
5
  accelerate