Spaces:
Runtime error
Runtime error
erwold
commited on
Commit
·
3307da6
1
Parent(s):
bc9137b
Initial Commit
Browse files
app.py
CHANGED
@@ -15,6 +15,7 @@ import os
|
|
15 |
# 设置环境变量,强制禁用 accelerate 的显存管理
|
16 |
os.environ["ACCELERATE_USE_MEMORY_EFFICIENT_ATTENTION"] = "false"
|
17 |
os.environ["ACCELERATE_DISABLE_MEMORY_EFFICIENT_ATTENTION"] = "1"
|
|
|
18 |
|
19 |
from qwen2_vl.modeling_qwen2_vl import Qwen2VLSimplifiedModel
|
20 |
|
@@ -60,6 +61,9 @@ class FluxInterface:
|
|
60 |
return
|
61 |
|
62 |
logger.info("Starting model loading...")
|
|
|
|
|
|
|
63 |
|
64 |
# Load FLUX components
|
65 |
tokenizer = CLIPTokenizer.from_pretrained(self.MODEL_ID, subfolder="flux/tokenizer")
|
|
|
15 |
# 设置环境变量,强制禁用 accelerate 的显存管理
|
16 |
os.environ["ACCELERATE_USE_MEMORY_EFFICIENT_ATTENTION"] = "false"
|
17 |
os.environ["ACCELERATE_DISABLE_MEMORY_EFFICIENT_ATTENTION"] = "1"
|
18 |
+
os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "expandable_segments:True,garbage_collection_threshold:0.6,max_split_size_mb:512"
|
19 |
|
20 |
from qwen2_vl.modeling_qwen2_vl import Qwen2VLSimplifiedModel
|
21 |
|
|
|
61 |
return
|
62 |
|
63 |
logger.info("Starting model loading...")
|
64 |
+
# 3. 显式设置 PyTorch 缓存分配器的行为
|
65 |
+
torch.cuda.set_per_process_memory_fraction(0.95) # 允许使用95%的显存
|
66 |
+
torch.cuda.max_memory_allocated = lambda *args, **kwargs: 0 # 忽略已分配内存的限制
|
67 |
|
68 |
# Load FLUX components
|
69 |
tokenizer = CLIPTokenizer.from_pretrained(self.MODEL_ID, subfolder="flux/tokenizer")
|