FortuneT committed on
Commit
46a1867
·
verified ·
1 Parent(s): 548f7ad

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -23,7 +23,7 @@ download_model()
23
  # Define OmniAI's chat function (handles two arguments: user message + history)
24
  def omni_ai_chat(user_message, history):
25
  try:
26
- llm = Llama(model_path=MODEL_PATH, n_ctx=4096) # Load locally downloaded model
27
  response = llm(user_message) # Process only the latest prompt
28
  return response["choices"][0]["text"].strip()
29
  except Exception as e:
 
23
  # Define OmniAI's chat function (handles two arguments: user message + history)
24
  def omni_ai_chat(user_message, history):
25
  try:
26
+ llm = Llama(model_path=MODEL_PATH, n_ctx=4096, n_batch=256, flash_attn=True) # Load locally downloaded model
27
  response = llm(user_message) # Process only the latest prompt
28
  return response["choices"][0]["text"].strip()
29
  except Exception as e: