Elea Zhong committed on
Commit
e34d60b
·
1 Parent(s): 2288967
Files changed (1) hide show
  1. app.py +9 -5
app.py CHANGED
@@ -29,11 +29,15 @@ from qwenimage.models.qwen_fa3_processor import QwenDoubleStreamAttnProcessorFA3
29
  dtype = torch.bfloat16
30
  device = "cuda" if torch.cuda.is_available() else "cpu"
31
 
32
- exp = Qwen_FA3_AoT_int8()
33
- # exp = Qwen_FA3_AoT_fp8()
34
- exp.load()
35
- exp.optimize()
36
- pipe = exp.pipe
 
 
 
 
37
 
38
 
39
  MAX_SEED = np.iinfo(np.int32).max
 
29
  dtype = torch.bfloat16
30
  device = "cuda" if torch.cuda.is_available() else "cpu"
31
 
32
+ @spaces.GPU
33
+ def load_pipe():
34
+     exp = Qwen_FA3_AoT_int8()
35
+     # exp = Qwen_FA3_AoT_fp8()
36
+     exp.load()
37
+     exp.optimize()
38
+     return exp.pipe
39
+
40
+ pipe = load_pipe()
41
 
42
 
43
  MAX_SEED = np.iinfo(np.int32).max