Spaces:

kudui
/

dream-s1k-demo

Paused

App Files Community

况兑 committed on Oct 7

Commit

a769d64

1 Parent(s): a088db3

fix: cast attention_mask to bool to satisfy Dream forward/generate expectations

Browse files

Files changed (1) hide show

loss_probe.py +13 -23

loss_probe.py CHANGED Viewed

@@ -5,33 +5,27 @@ MODEL_ID = os.getenv("MODEL_ID", "Dream-org/Dream-v0-Instruct-7B")
 REV = os.getenv("REV", None)
 print(f"[INFO] Using MODEL_ID={MODEL_ID} REV={REV or '(latest)'}")
-print("[INFO] Loading tokenizer...")
 tok = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True, revision=REV)
-print("[INFO] Loading model...")
 dtype = torch.bfloat16 if torch.cuda.is_available() else torch.float32
-model = AutoModel.from_pretrained(
-    MODEL_ID, trust_remote_code=True, torch_dtype=dtype, revision=REV
-)
 device = "cuda" if torch.cuda.is_available() else "cpu"
-model = model.to(device).eval()
 def check_loss():
     msgs = [
         {"role": "system", "content": "只输出一个数字"},
         {"role": "user", "content": "Compute: 1+1"},
     ]
-    enc = tok.apply_chat_template(
-        msgs, return_tensors="pt", return_dict=True, add_generation_prompt=False
-    )
-    enc = {k: v.to(device) for k, v in enc.items()}
-    labels = enc["input_ids"].clone()
     try:
-        out = model(
-            input_ids=enc["input_ids"],
-            attention_mask=enc.get("attention_mask"),
-            labels=labels,
-        )
         has_loss = getattr(out, "loss", None) is not None
         return f"[CHECK] supports labels->loss? {has_loss} | type={type(out)}"
     except Exception as e:
@@ -41,11 +35,9 @@ def quick_infer(q: str):
     if not q.strip():
         return ""
     messages = [{"role": "user", "content": q}]
-    inputs = tok.apply_chat_template(
-        messages, return_tensors="pt", return_dict=True, add_generation_prompt=True
-    )
     input_ids = inputs.input_ids.to(device)
-    attention_mask = inputs.attention_mask.to(device)
     with torch.no_grad():
         out = model.diffusion_generate(
             input_ids,
@@ -55,9 +47,7 @@ def quick_infer(q: str):
             temperature=0.0,
             return_dict_in_generate=True,
         )
-    text = tok.decode(
-        out.sequences[0][input_ids.shape[1]:], skip_special_tokens=True
-    ).strip()
     return text
 with gr.Blocks() as demo:

 REV = os.getenv("REV", None)
 print(f"[INFO] Using MODEL_ID={MODEL_ID} REV={REV or '(latest)'}")
 tok = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True, revision=REV)
 dtype = torch.bfloat16 if torch.cuda.is_available() else torch.float32
 device = "cuda" if torch.cuda.is_available() else "cpu"
+model = AutoModel.from_pretrained(MODEL_ID, trust_remote_code=True, torch_dtype=dtype, revision=REV).to(device).eval()
 def check_loss():
     msgs = [
         {"role": "system", "content": "只输出一个数字"},
         {"role": "user", "content": "Compute: 1+1"},
     ]
+    enc = tok.apply_chat_template(msgs, return_tensors="pt", return_dict=True, add_generation_prompt=False)
+    # 保证 dtype / device 正确；attention_mask 用 bool 可兼容
+    input_ids = enc["input_ids"].to(device)
+    attn = enc.get("attention_mask", None)
+    if attn is not None:
+        attn = attn.to(device).to(torch.bool)
+    labels = input_ids.clone()
     try:
+        out = model(input_ids=input_ids, attention_mask=attn, labels=labels)
         has_loss = getattr(out, "loss", None) is not None
         return f"[CHECK] supports labels->loss? {has_loss} | type={type(out)}"
     except Exception as e:
     if not q.strip():
         return ""
     messages = [{"role": "user", "content": q}]
+    inputs = tok.apply_chat_template(messages, return_tensors="pt", return_dict=True, add_generation_prompt=True)
     input_ids = inputs.input_ids.to(device)
+    attention_mask = inputs.attention_mask.to(device).to(torch.bool)
     with torch.no_grad():
         out = model.diffusion_generate(
             input_ids,
             temperature=0.0,
             return_dict_in_generate=True,
         )
+    text = tok.decode(out.sequences[0][input_ids.shape[1]:], skip_special_tokens=True).strip()
     return text
 with gr.Blocks() as demo: