Update app.py
Browse files
app.py
CHANGED
@@ -20,8 +20,7 @@ def fetch_model(model_name: str, dtype=torch.bfloat16):
|
|
20 |
model_info = load_model(model_name, dtype=dtype)
|
21 |
tokenizer, model, vl_chat_processor = model_info
|
22 |
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
|
23 |
-
|
24 |
-
model = model.to(device).eval() # Move to device and set eval mode
|
25 |
DEPLOY_MODELS[model_name] = (tokenizer, model, vl_chat_processor)
|
26 |
logger.info(f"Loaded {model_name} on {device}")
|
27 |
return DEPLOY_MODELS[model_name]
|
|
|
20 |
model_info = load_model(model_name, dtype=dtype)
|
21 |
tokenizer, model, vl_chat_processor = model_info
|
22 |
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
|
23 |
+
model = model.to(device)
|
|
|
24 |
DEPLOY_MODELS[model_name] = (tokenizer, model, vl_chat_processor)
|
25 |
logger.info(f"Loaded {model_name} on {device}")
|
26 |
return DEPLOY_MODELS[model_name]
|