Merge pull request #27 from VectorInstitute/add_bias-in-the-picture-benchmark

amrit110 · web-flow · commit cda370c65d2e · 2025-11-25T12:40:21.000-05:00
Add bias-in-the-picture-benchmark repo
diff --git a/catalog/public/data/papers.bib b/catalog/public/data/papers.bib
@@ -43,4 +43,14 @@ @software{fajardo2025fedrag
   url = {https://github.com/VectorInstitute/fed-rag},
   version = {0.0.27},
   license = {Apache-2.0}
+}
+
+@misc{narayanan2025biaspicturebenchmarkingvlms,
+  title={Bias in the Picture: Benchmarking VLMs with Social-Cue News Images and LLM-as-Judge Assessment},
+  author={Aravind Narayanan and Vahid Reza Khazaie and Shaina Raza},
+  year={2025},
+  eprint={2509.19659},
+  archivePrefix={arXiv},
+  primaryClass={cs.CV},
+  url={https://arxiv.org/abs/2509.19659}
 }
diff --git a/catalog/public/data/repositories.json b/catalog/public/data/repositories.json
@@ -1,5 +1,35 @@
 {
   "repositories": [
+    {
+      "name": "bias-in-the-picture-benchmark",
+      "repo_id": "VectorInstitute/bias-in-the-picture-benchmark",
+      "description": "Benchmarking VLMs with Social-Cue News Images and LLM-as-Judge Assessment - evaluates how vision-language models handle real news images containing demographic and social attributes",
+      "implementations": [
+        {
+          "name": "Bias in the Picture Benchmark",
+          "url": "https://vectorinstitute.github.io/bias-in-the-picture-benchmark/"
+        },
+        {
+          "name": "LLM-as-Judge Evaluation Framework",
+          "url": null
+        },
+        {
+          "name": "VLM Inference Pipeline",
+          "url": null
+        }
+      ],
+      "public_datasets": [
+        {
+          "name": "Social-Cue News Images Dataset",
+          "url": "https://github.com/VectorInstitute/bias-in-the-picture-benchmark/tree/main/data"
+        }
+      ],
+      "type": "applied-research",
+      "year": 2025,
+      "github_url": "https://github.com/VectorInstitute/bias-in-the-picture-benchmark",
+      "paper_url": "https://arxiv.org/abs/2509.19659",
+      "bibtex": "narayanan2025biaspicturebenchmarkingvlms"
+    },
     {
       "name": "crisp-nam",
       "repo_id": "VectorInstitute/crisp-nam",
@@ -920,7 +950,7 @@
       "github_url": "https://github.com/VectorInstitute/privacy-enhancing-techniques"
     }
   ],
-  "totalImplementations": 121,
+  "totalImplementations": 124,
   "yearsOfResearch": 7,
-  "lastUpdated": "2025-11-25T12:24:55.191063"
+  "lastUpdated": "2025-11-25T12:31:24.825921"
 }
diff --git a/repositories/bias-in-the-picture-benchmark.yaml b/repositories/bias-in-the-picture-benchmark.yaml
@@ -0,0 +1,18 @@
+name: bias-in-the-picture-benchmark
+repo_id: VectorInstitute/bias-in-the-picture-benchmark
+description: "Benchmarking VLMs with Social-Cue News Images and LLM-as-Judge Assessment - evaluates how vision-language models handle real news images containing demographic and social attributes"
+implementations:
+  - name: Bias in the Picture Benchmark
+    url: https://vectorinstitute.github.io/bias-in-the-picture-benchmark/
+  - name: LLM-as-Judge Evaluation Framework
+    url: null
+  - name: VLM Inference Pipeline
+    url: null
+public_datasets:
+  - name: Social-Cue News Images Dataset
+    url: https://github.com/VectorInstitute/bias-in-the-picture-benchmark/tree/main/data
+type: applied-research
+year: 2025
+github_url: https://github.com/VectorInstitute/bias-in-the-picture-benchmark
+paper_url: https://arxiv.org/abs/2509.19659
+bibtex: narayanan2025biaspicturebenchmarkingvlms