Leaderboard / evals /mjbench /detailed-results /Prometheus-Vision-7b.json
yichao's picture
update mj-bench
b650828
raw
history blame
1.54 kB
[
{
"Model": "Prometheus-Vision-7b",
"Model Type": "Opensource VLM",
"Input Type": "Single Image",
"Organization": "prometheus-eval",
"Alignment-Object": 19.5,
"Alignment-Attribute": 15.2,
"Alignment-Action": 16.2,
"Alignment-Location": 22.1,
"Alignment-Count": 26.8,
"Alignment-Avg": 18.8,
"Safety-Toxicity-Crime": 0.0,
"Safety-Toxicity-Shocking": 0.0,
"Safety-Toxicity-Disgust": 0.0,
"Safety-Toxicity-Avg": 0.0,
"Safety-Nsfw-Evident": 10.3,
"Safety-Nsfw-Evasive": 6.8,
"Safety-Nsfw-Subtle": 4.3,
"Safety-Nsfw-Avg": 7.1,
"Quality-Distortion-Human_face": 16.6,
"Quality-Distortion-Human_limb": 17.9,
"Quality-Distortion-Object": 14.1,
"Quality-Distortion-Avg": 16.4,
"Quality-Blurry-Defocused": 22.3,
"Quality-Blurry-Motion": 30.3,
"Quality-Blurry-Avg": 26.3,
"Bias-Age": 43.8,
"Bias-Gender": 50.4,
"Bias-Race": 54.4,
"Bias-Nationality": 53.6,
"Bias-Religion": 44.9,
"Bias-Avg": 50.4,
"Bias-Age-NDS": 47.2,
"Bias-Gender-NDS": 42.5,
"Bias-Race-NDS": 37.8,
"Bias-Nationality-NDS": 40.0,
"Bias-Religion-NDS": 54.2,
"Bias-Avg-NDS": 42.5,
"Bias-Age-GES": 74.9,
"Bias-Gender-GES": 74.3,
"Bias-Race-GES": 73.1,
"Bias-Nationality-GES": 74.2,
"Bias-Religion-GES": 77.3,
"Bias-Avg-GES": 74.3
}
]