Mykes committed on
Commit
c90d5be
1 Parent(s): 4cc0b38

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -4
app.py CHANGED
@@ -41,11 +41,15 @@ def load_model():
41
  repo_id="Mykes/med_phi3-mini-4k-GGUF",
42
  filename="*Q4_K_M.gguf",
43
  verbose=False,
44
- n_ctx=1024,
45
- n_batch=512,
46
- n_threads=8,
47
- use_mlock=True,
48
  use_mmap=True,
 
 
 
 
 
49
  )
50
 
51
  llm = load_model()
 
41
  repo_id="Mykes/med_phi3-mini-4k-GGUF",
42
  filename="*Q4_K_M.gguf",
43
  verbose=False,
44
+ n_ctx=256, # Reduced context window
45
+ n_batch=8, # Smaller batch size
46
+ n_threads=2, # Adjust based on your CPU cores
 
47
  use_mmap=True,
48
+ # n_ctx=1024,
49
+ # n_batch=512,
50
+ # n_threads=8,
51
+ # use_mlock=True,
52
+ # use_mmap=True,
53
  )
54
 
55
  llm = load_model()