YAML Metadata Warning: empty or missing yaml metadata in repo card (https://huggingface.co/docs/hub/model-cards#model-card-metadata)

A model trained on VisionReward dataset with faster speed.

Example Code:

import os
from transformers import Qwen3VLForConditionalGeneration, AutoProcessor

# default: Load the model on the available device(s)
model = Qwen3VLForConditionalGeneration.from_pretrained(
    "weathon/smolvlm2_anti_aesthetics_7b", dtype="auto", device_map="cuda"
)

processor = AutoProcessor.from_pretrained("Qwen/Qwen3-VL-4B-Instruct")
from datasets import load_dataset

import pandas as pd

df = pd.read_csv("rules.csv")
sign = lambda x: (x > 0) - (x < 0)
import pandas as pd
import re

df.columns = df.columns.str.strip()
df['Dimension'] = df['Dimension'].ffill()

df['dim_key'] = df['Dimension'].apply(lambda x: re.search(r'\((.*?)\)', x).group(1) if re.search(r'\((.*?)\)', x) else x)

guide = {
    dim_key: {
        f"{row['Option']}: {sign(int(row['Score']))+1}": ": " +str(row['Description']).strip()
        for _, row in group.iterrows()
    }
    for dim_key, group in df.groupby('dim_key')
}

score = {
    dim_key: {
        int(row['Score']): str(row['Option']).strip()
        for _, row in group.iterrows()
    }
    for dim_key, group in df.groupby('dim_key')
}
dims = []
for dim in guide.keys():
    if dim in ["unsafe type", "hands", "face", "body", "safety", "lighting aesthetic", "symmetry"]:
        continue
    dims.append(dim)
print("Rating dimensions:", dims)

import json
import torch

def rate_single_image(image, t):
    results = {"scores": [], "preds": []}
    messages = []
    dims = []
    for dim in guide.keys():
        if dim in ["unsafe type", "hands", "face", "body", "safety", "lighting aesthetic", "symmetry"]:
            continue
        dims.append(dim)
        messages.append([
                    { 
                        "role": "user",
                        "content": [
                            {
                                "type":"text",
                                "text":f"Please rate this image for its {dim} quality. Use this guideline {guide[dim]}. Response a single number.",
                            },
                            {
                                "type": "image", 
                                "image":image.resize((512, 512))
                            }
                        ],
                    }])

    inputs = processor.apply_chat_template(
        messages,
        tokenize=True,
        add_generation_prompt=True,
        return_dict=True,
        return_tensors="pt",
        padding=True
    ) 

    inputs = inputs.to(model.device)
    id_of_interest = processor.tokenizer.convert_tokens_to_ids(["0", "1", "2"])
    id_of_interest
    with torch.no_grad():
        logits = model(**inputs).logits
    logits = logits[:, -1, id_of_interest] 
    prob = torch.softmax(logits, dim=-1)
    for i in range(len(prob)):
        prob_of_interest = prob[i]
        score = torch.dot(prob_of_interest, torch.tensor([0, 1, 2], device=prob_of_interest.device).bfloat16())
        single_pred = prob_of_interest.argmax().item() 
        # results[f"{dim}_score"] = float(score)
        # results[f"{dim}_pred"] = single_pred
        print(dims[i], float(score), t) 
        results["scores"].append(float(score))
        results["preds"].append(single_pred)
    return results



from PIL import Image
def rate_image(sample, i, idx_of_interest):
    if i not in idx_of_interest:
        return sample["rater"] if "rater" in sample else 5/0 
    image_original = sample["image"]
    result = rate_single_image(image_original, "original")
    # sample["rater"] = 
    return result

    # return sample
import tqdm
# https://huggingface.co/docs/datasets/en/process
if __name__ == "__main__":
    # dataset = load_dataset("weathon/aas_benchmark")
    dataset = load_dataset("weathon/nag_dataset")
    dataset = dataset["train"]
    # rated_dataset = dataset.map(rate_image, batched=False, writer_batch_size=3000)
    rater_results = []
    for i, sample in enumerate(tqdm.tqdm(dataset)):
        result = rate_image(sample, i, set(range(len(dataset))))  # specify indices of interest here
        rater_results.append(result)
    dataset = dataset.add_column("rater", rater_results)
    dataset.push_to_hub("weathon/nag_dataset")

Please Cite Us https://philpapers.org/rec/GUOAAR

@article{guo2025aesthetic,
  title={Aesthetic Alignment Risks Assimilation: How Image Generation and Reward Models Reinforce Beauty Bias and Ideological" Censorship"},
  author={Guo, Wenqi Marshall and Qian, Qingyun and Hasan, Khalad and Du, Shan},
  journal={arXiv preprint arXiv:2512.11883},
  year={2025}
}

Downloads last month: -; Downloads are not tracked for this model. How to track

Inference Providers NEW

This model isn't deployed by any Inference Provider. 🙋 Ask for provider support

Paper for weathon/smolvlm2_anti_aesthetics_7b

Aesthetic Alignment Risks Assimilation: How Image Generation and Reward Models Reinforce Beauty Bias and Ideological "Censorship"

Paper • 2512.11883 • Published about 1 month ago • 6