Elea Zhong committed on
Commit
2c9dc50
·
1 Parent(s): ab8f53b
Files changed (1) hide show
  1. app.py +6 -5
app.py CHANGED
@@ -29,15 +29,16 @@ from qwenimage.models.qwen_fa3_processor import QwenDoubleStreamAttnProcessorFA3
29
  dtype = torch.bfloat16
30
  device = "cuda" if torch.cuda.is_available() else "cpu"
31
 
 
 
 
 
32
  @spaces.GPU(duration=1500)
33
- def load_pipe():
34
- exp = Qwen_FA3_AoT_int8()
35
- # exp = Qwen_FA3_AoT_fp8()
36
- exp.load()
37
  exp.optimize()
38
  return exp.pipe
39
 
40
- pipe = load_pipe()
41
 
42
 
43
  MAX_SEED = np.iinfo(np.int32).max
 
29
  dtype = torch.bfloat16
30
  device = "cuda" if torch.cuda.is_available() else "cpu"
31
 
32
+ exp = Qwen_FA3_AoT_int8()
33
+ # exp = Qwen_FA3_AoT_fp8()
34
+ exp.load()
35
+
36
  @spaces.GPU(duration=1500)
37
+ def optim_pipe(exp):
 
 
 
38
  exp.optimize()
39
  return exp.pipe
40
 
41
+ pipe = optim_pipe(exp)
42
 
43
 
44
  MAX_SEED = np.iinfo(np.int32).max