ford442 committed on
Commit
a27a107
·
verified ·
1 Parent(s): 07fc14f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -0
app.py CHANGED
@@ -55,6 +55,7 @@ model = AutoModelForCausalLM.from_pretrained(
55
  model_name,
56
  # quantization_config=quantization_config_4bit, # Comment out if not using quantization
57
  device_map="auto",
 
58
  ).to(torch.float16) #.to(torch.device("cuda:0"), torch.bfloat16)
59
 
60
  print(f"Loading tokenizer: {model_name}")
 
55
  model_name,
56
  # quantization_config=quantization_config_4bit, # Comment out if not using quantization
57
  device_map="auto",
58
+ offload_folder='./',
59
  ).to(torch.float16) #.to(torch.device("cuda:0"), torch.bfloat16)
60
 
61
  print(f"Loading tokenizer: {model_name}")