Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -55,6 +55,7 @@ model = AutoModelForCausalLM.from_pretrained(
|
|
55 |
model_name,
|
56 |
# quantization_config=quantization_config_4bit, # Comment out if not using quantization
|
57 |
device_map="auto",
|
|
|
58 |
).to(torch.float16) #.to(torch.device("cuda:0"), torch.bfloat16)
|
59 |
|
60 |
print(f"Loading tokenizer: {model_name}")
|
|
|
55 |
model_name,
|
56 |
# quantization_config=quantization_config_4bit, # Comment out if not using quantization
|
57 |
device_map="auto",
|
58 |
+
offload_folder='./',
|
59 |
).to(torch.float16) #.to(torch.device("cuda:0"), torch.bfloat16)
|
60 |
|
61 |
print(f"Loading tokenizer: {model_name}")
|