Skip to content

Commit cda370c

Browse files
authored
Merge pull request #27 from VectorInstitute/add_bias-in-the-picture-benchmark
Add bias-in-the-picture-benchmark repo
2 parents 9b3bde7 + 47f2264 commit cda370c

File tree

3 files changed, with 59 additions and 2 deletions.

catalog/public/data/papers.bib

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -43,4 +43,13 @@ @software{fajardo2025fedrag
4343
url = {https://github.com/VectorInstitute/fed-rag},
4444
version = {0.0.27},
4545
license = {Apache-2.0}
46+
}
47+
@misc{narayanan2025biaspicturebenchmarkingvlms,
48+
title={Bias in the Picture: Benchmarking VLMs with Social-Cue News Images and LLM-as-Judge Assessment},
49+
author={Aravind Narayanan and Vahid Reza Khazaie and Shaina Raza},
50+
year={2025},
51+
eprint={2509.19659},
52+
archivePrefix={arXiv},
53+
primaryClass={cs.CV},
54+
url={https://arxiv.org/abs/2509.19659}
4655
}

catalog/public/data/repositories.json

Lines changed: 32 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,35 @@
11
{
22
"repositories": [
3+
{
4+
"name": "bias-in-the-picture-benchmark",
5+
"repo_id": "VectorInstitute/bias-in-the-picture-benchmark",
6+
"description": "Benchmarking VLMs with Social-Cue News Images and LLM-as-Judge Assessment - evaluates how vision-language models handle real news images containing demographic and social attributes",
7+
"implementations": [
8+
{
9+
"name": "Bias in the Picture Benchmark",
10+
"url": "https://vectorinstitute.github.io/bias-in-the-picture-benchmark/"
11+
},
12+
{
13+
"name": "LLM-as-Judge Evaluation Framework",
14+
"url": null
15+
},
16+
{
17+
"name": "VLM Inference Pipeline",
18+
"url": null
19+
}
20+
],
21+
"public_datasets": [
22+
{
23+
"name": "Social-Cue News Images Dataset",
24+
"url": "https://github.com/VectorInstitute/bias-in-the-picture-benchmark/tree/main/data"
25+
}
26+
],
27+
"type": "applied-research",
28+
"year": 2025,
29+
"github_url": "https://github.com/VectorInstitute/bias-in-the-picture-benchmark",
30+
"paper_url": "https://arxiv.org/abs/2509.19659",
31+
"bibtex": "narayanan2025biaspicturebenchmarkingvlms"
32+
},
333
{
434
"name": "crisp-nam",
535
"repo_id": "VectorInstitute/crisp-nam",
@@ -920,7 +950,7 @@
920950
"github_url": "https://github.com/VectorInstitute/privacy-enhancing-techniques"
921951
}
922952
],
923-
"totalImplementations": 121,
953+
"totalImplementations": 124,
924954
"yearsOfResearch": 7,
925-
"lastUpdated": "2025-11-25T12:24:55.191063"
955+
"lastUpdated": "2025-11-25T12:31:24.825921"
926956
}
Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,18 @@
1+
name: bias-in-the-picture-benchmark
2+
repo_id: VectorInstitute/bias-in-the-picture-benchmark
3+
description: "Benchmarking VLMs with Social-Cue News Images and LLM-as-Judge Assessment - evaluates how vision-language models handle real news images containing demographic and social attributes"
4+
implementations:
5+
- name: Bias in the Picture Benchmark
6+
url: https://vectorinstitute.github.io/bias-in-the-picture-benchmark/
7+
- name: LLM-as-Judge Evaluation Framework
8+
url: null
9+
- name: VLM Inference Pipeline
10+
url: null
11+
public_datasets:
12+
- name: Social-Cue News Images Dataset
13+
url: https://github.com/VectorInstitute/bias-in-the-picture-benchmark/tree/main/data
14+
type: applied-research
15+
year: 2025
16+
github_url: https://github.com/VectorInstitute/bias-in-the-picture-benchmark
17+
paper_url: https://arxiv.org/abs/2509.19659
18+
bibtex: narayanan2025biaspicturebenchmarkingvlms

0 commit comments

Comments
 (0)