DongfuJiang committed on
Commit
f33be86
1 Parent(s): 19d0707
Files changed (1) hide show
  1. app.py +1 -0
app.py CHANGED
@@ -51,6 +51,7 @@ fuser_config.model_name = "llm-blender/gen_fuser_3b" # our pre-trained fuser
51
  fuser_config.max_length = 1024
52
  fuser_config.candidate_maxlength = DEFAULT_CANDIDATE_MAX_LENGTH
53
  blender_config = llm_blender.BlenderConfig()
 
54
  blender_config.device = "cuda" # blender ranker and fuser device
55
  blender = llm_blender.Blender(blender_config, ranker_config, fuser_config)
56
 
 
51
  fuser_config.max_length = 1024
52
  fuser_config.candidate_maxlength = DEFAULT_CANDIDATE_MAX_LENGTH
53
  blender_config = llm_blender.BlenderConfig()
54
+ blender_config.load_in_8bit = True
55
  blender_config.device = "cuda" # blender ranker and fuser device
56
  blender = llm_blender.Blender(blender_config, ranker_config, fuser_config)
57