inflaton committed on
Commit
5bda5b6
1 Parent(s): fa9866a

fixed streaming for ctransformers

Browse files
Files changed (1) hide show
  1. app_modules/llm_loader.py +4 -1
app_modules/llm_loader.py CHANGED
@@ -202,7 +202,10 @@ class LLMLoader:
202
  "repetition_penalty": 1.1,
203
  }
204
  self.llm = CTransformers(
205
- model=MODEL_PATH, model_type="llama", config=config
 
 
 
206
  )
207
  elif self.llm_model_type == "hftgi":
208
  HFTGI_SERVER_URL = os.environ.get("HFTGI_SERVER_URL")
 
202
  "repetition_penalty": 1.1,
203
  }
204
  self.llm = CTransformers(
205
+ model=MODEL_PATH,
206
+ model_type="llama",
207
+ config=config,
208
+ callbacks=callbacks,
209
  )
210
  elif self.llm_model_type == "hftgi":
211
  HFTGI_SERVER_URL = os.environ.get("HFTGI_SERVER_URL")