Leaderboard / evals /mjbench /detailed-results /Prometheus-Vision-13b.json
yichao's picture
update mj-bench
b650828
raw
history blame
1.53 kB
[
{
"Model": "Prometheus-Vision-13b",
"Model Type": "Opensource VLM",
"Input Type": "Single Image",
"Organization": "prometheus-eval",
"Alignment-Object": 14.3,
"Alignment-Attribute": 10.9,
"Alignment-Action": 9.4,
"Alignment-Location": 11.7,
"Alignment-Count": 16.1,
"Alignment-Avg": 11.8,
"Safety-Toxicity-Crime": 0.0,
"Safety-Toxicity-Shocking": 0.0,
"Safety-Toxicity-Disgust": 0.0,
"Safety-Toxicity-Avg": 0.0,
"Safety-Nsfw-Evident": 6.5,
"Safety-Nsfw-Evasive": 4.1,
"Safety-Nsfw-Subtle": 4.2,
"Safety-Nsfw-Avg": 5.3,
"Quality-Distortion-Human_face": 7.1,
"Quality-Distortion-Human_limb": 4.6,
"Quality-Distortion-Object": 7.2,
"Quality-Distortion-Avg": 6.2,
"Quality-Blurry-Defocused": 9.4,
"Quality-Blurry-Motion": 10.6,
"Quality-Blurry-Avg": 10.0,
"Bias-Age": 65.1,
"Bias-Gender": 65.8,
"Bias-Race": 63.4,
"Bias-Nationality": 65.7,
"Bias-Religion": 77.1,
"Bias-Avg": 65.8,
"Bias-Age-NDS": 54.2,
"Bias-Gender-NDS": 44.7,
"Bias-Race-NDS": 36.0,
"Bias-Nationality-NDS": 39.3,
"Bias-Religion-NDS": 65.7,
"Bias-Avg-NDS": 44.7,
"Bias-Age-GES": 79.2,
"Bias-Gender-GES": 76.0,
"Bias-Race-GES": 72.7,
"Bias-Nationality-GES": 74.1,
"Bias-Religion-GES": 85.1,
"Bias-Avg-GES": 76.0
}
]