AISmithLab
diff --git a/‎.github/workflows/sync-studies-index.yml‎
Lines changed: 23 additions & 0 deletions b/‎.github/workflows/sync-studies-index.yml‎
Lines changed: 23 additions & 0 deletions
diff --git a/‎.github/workflows/validate-studies.yml‎
Lines changed: 78 additions & 0 deletions b/‎.github/workflows/validate-studies.yml‎
Lines changed: 78 additions & 0 deletions
diff --git a/‎.gitignore‎
Lines changed: 87 additions & 0 deletions b/‎.gitignore‎
Lines changed: 87 additions & 0 deletions
diff --git a/‎LICENSE‎
Lines changed: 21 additions & 0 deletions b/‎LICENSE‎
Lines changed: 21 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 94 additions & 0 deletions b/‎README.md‎
Lines changed: 94 additions & 0 deletions
diff --git a/‎co_website/.gitignore‎
Lines changed: 41 additions & 0 deletions b/‎co_website/.gitignore‎
Lines changed: 41 additions & 0 deletions
diff --git a/‎co_website/README.md‎
Lines changed: 41 additions & 0 deletions b/‎co_website/README.md‎
Lines changed: 41 additions & 0 deletions
@@ -0,0 +1,23 @@
+name: Sync studies index
+# On pushes to dev/main that touch studies/ or the index builder, run
+# scripts/build_studies_index.py and commit co_website/data/studies_index.json
+# back to the branch if it changed.
+on:
+  push:
+    branches: [dev, main]
+    paths:
+      - "studies/**"
+      - "scripts/build_studies_index.py"
+
+# git-auto-commit-action pushes with GITHUB_TOKEN, which needs write access to
+# repository contents. The token can be read-only by default, so request the
+# permission explicitly instead of relying on repository settings.
+permissions:
+  contents: write
+
+jobs:
+  rebuild:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - uses: actions/setup-python@v5
+        with:
+          python-version: "3.11"
+      - name: Build studies index
+        run: python scripts/build_studies_index.py
+      - name: Commit updated index
+        uses: stefanzweifel/git-auto-commit-action@v5
+        with:
+          commit_message: "chore: rebuild studies_index.json"
+          # Only the generated index is staged; other working-tree changes are
+          # left uncommitted.
+          file_pattern: co_website/data/studies_index.json
@@ -0,0 +1,78 @@
+name: Validate studies
+# Runs on pull requests into dev/main that touch studies/ or the validation
+# scripts. Builds the studies index, runs scripts/verify_study.sh for every
+# changed study directory, and checks that the PR author is listed under
+# `contributors` in each changed study's index.json.
+on:
+  pull_request:
+    branches: [dev, main]
+    paths:
+      - "studies/**"
+      - "scripts/build_studies_index.py"
+      - "scripts/verify_study.sh"
+
+jobs:
+  validate:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          # Full history is needed so origin/<base branch> exists for the
+          # three-dot diffs below. With the default shallow checkout the base
+          # ref is missing, git diff fails, and no study would be validated.
+          fetch-depth: 0
+      - uses: actions/setup-python@v5
+        with:
+          python-version: "3.11"
+      - name: Install dependencies
+        run: pip install -r requirements.txt
+      - name: Build studies index
+        run: python scripts/build_studies_index.py
+      - name: Verify changed studies
+        env:
+          # Passed through the environment rather than expanded inline so the
+          # ref name is never interpreted as shell syntax.
+          BASE_REF: ${{ github.base_ref }}
+        run: |
+          # Find study directories changed in this PR.
+          # git diff runs as its own assignment so that a failure aborts the
+          # step instead of being hidden behind the grep/sort pipeline.
+          CHANGED_FILES=$(git diff --name-only "origin/$BASE_REF...HEAD" -- studies/)
+          CHANGED_STUDIES=$(printf '%s\n' "$CHANGED_FILES" | grep -oP 'studies/[^/]+' | sort -u)
+          if [ -z "$CHANGED_STUDIES" ]; then
+            echo "No study directories changed."
+            exit 0
+          fi
+          # One array entry per line: no word splitting or glob expansion.
+          mapfile -t STUDY_PATHS <<< "$CHANGED_STUDIES"
+          for study_path in "${STUDY_PATHS[@]}"; do
+            study_id=$(basename "$study_path")
+            echo "--- Verifying $study_id ---"
+            bash scripts/verify_study.sh "$study_id"
+            echo ""
+          done
+      - name: Verify contributor attribution
+        env:
+          PR_AUTHOR: ${{ github.event.pull_request.user.login }}
+          BASE_REF: ${{ github.base_ref }}
+        run: |
+          CHANGED_FILES=$(git diff --name-only "origin/$BASE_REF...HEAD" -- studies/)
+          CHANGED_STUDIES=$(printf '%s\n' "$CHANGED_FILES" | grep -oP 'studies/[^/]+' | sort -u)
+          if [ -z "$CHANGED_STUDIES" ]; then
+            exit 0
+          fi
+          mapfile -t STUDY_PATHS <<< "$CHANGED_STUDIES"
+          FAILED=0
+          for study_path in "${STUDY_PATHS[@]}"; do
+            INDEX="$study_path/index.json"
+            # Studies without an index.json are skipped by this check.
+            if [ ! -f "$INDEX" ]; then
+              continue
+            fi
+            # Check if any contributor github field contains the PR author's username.
+            # The index path and username are passed as argv, never spliced into
+            # the Python source, so a crafted directory name cannot inject code.
+            MATCH=$(python3 -c "
+          import json, sys
+          index_path, author = sys.argv[1], sys.argv[2].lower()
+          with open(index_path, encoding='utf-8') as f:
+              data = json.load(f)
+          contributors = data.get('contributors') if isinstance(data, dict) else None
+          if not contributors or not isinstance(contributors, list):
+              print('MISSING')
+              sys.exit(0)
+          for c in contributors:
+              # Tolerate malformed entries (non-dict items, null github field).
+              gh = str(c.get('github') or '').lower() if isinstance(c, dict) else ''
+              # Match 'username' or 'https://github.com/username'
+              if gh.rstrip('/').split('/')[-1] == author:
+                  print('MATCH')
+                  sys.exit(0)
+          print('MISMATCH')
+          " "$INDEX" "$PR_AUTHOR")
+            study_id=$(basename "$study_path")
+            if [ "$MATCH" = "MISSING" ] || [ "$MATCH" = "MISMATCH" ]; then
+              echo "::error file=$INDEX::Contributor check failed for $study_id. Your GitHub username is '$PR_AUTHOR'. Please add the following to your index.json:%0A%0A\"contributors\": [%0A  { \"name\": \"Your Name\", \"github\": \"$PR_AUTHOR\" }%0A]"
+              FAILED=1
+            else
+              echo "$study_id: Contributor @$PR_AUTHOR verified."
+            fi
+          done
+          # Report every failing study before failing the step.
+          if [ "$FAILED" -eq 1 ]; then
+            exit 1
+          fi
@@ -0,0 +1,87 @@
+# Python
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+
+
+# Virtual environments
+venv/
+env/
+ENV/
+.venv
+
+# IDEs
+.vscode/
+.idea/
+*.swp
+*.swo
+*~
+.DS_Store
+
+# Jupyter Notebook
+.ipynb_checkpoints
+*.ipynb_checkpoints/
+
+# Testing
+.pytest_cache/
+.coverage
+htmlcov/
+coverage.xml
+.tox/
+.nox/
+
+# Type checking
+.mypy_cache/
+.dmypy.json
+dmypy.json
+.pytype/
+
+# Results and logs
+# Ignore everything directly under results/, then re-include results/benchmark/.
+# Inside benchmark/, directories matching study_*/ and files matching
+# full_benchmark_*.json are ignored again. Pattern order matters here.
+results/*
+!results/benchmark/
+results/benchmark/study_*/
+results/benchmark/full_benchmark_*.json
+logs/
+*.log
+
+# Data (except schemas and registry)
+# Uncomment if you want to exclude large study materials
+# studies/*/materials/large_files/
+
+# Environment variables
+.env
+.env.local
+
+# OS
+Thumbs.db
+
+# AI assistants
+.claude/
+.cursor/
+CLAUDE.md
+claude.md
+
+# co_website and build artifacts (lite branch)
+co_website/.history/
+co_website/node_modules/
+co_website/.next/
+humanstudybench.egg-info/
+dist/
+site/
@@ -0,0 +1,21 @@
+MIT License
+
+Copyright (c) 2026 Xuan Liu
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
@@ -0,0 +1,94 @@
+<div align="center">
+  <img src="docs/img/new-HS-bench_logo.png" alt="HumanStudy-Bench Logo" width="300">
+
+  <h1>HumanStudy-Bench: Towards AI Agent Design for Participant Simulation</h1>
+
+  <h3><a href="https://www.hs-bench.clawder.ai">📊 See Leaderboard & Results</a> | <a href="https://arxiv.org/abs/2602.00685">📖 Read the Paper</a></h3>
+
+  [![Release v1.0.0](https://img.shields.io/github/v/release/AISmithLab/HumanStudy-Bench)](https://github.com/AISmithLab/HumanStudy-Bench/releases/tag/v1.0.0)
+  [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
+  [![Python 3.8+](https://img.shields.io/badge/python-3.8+-blue.svg)](https://www.python.org/downloads/)
+  [![Docs](https://img.shields.io/badge/docs-website-blue)](https://www.hs-bench.clawder.ai)
+
+</div>
+
+---
+
+> HumanStudy-Bench is a standardized testbed for replaying human-subject experiments with LLM agents. The benchmark currently includes **12 foundational studies**, and we need your help to grow it. This repository is the community contribution hub.
+
+## How to Contribute a Study
+
+### 1. Fork and clone
+
+```bash
+git clone https://github.com/<yourgithubid>/HumanStudy-Bench.git
+cd HumanStudy-Bench
+git checkout -b contrib-<yourgithubid>-013
+```
+
+### 2. Create your study folder
+
+Add a new directory under `studies/` with the required folders:
+
+```
+studies/<yourgithubid>_013/
+  ├── index.json
+  ├── source/
+  ├── scripts/
+  └── README.md
+```
+
+See the docs below for what goes inside each folder and the exact schemas:
+
+| # | Guide | Description |
+|---|-------|-------------|
+| 1 | [What Should I Submit?](https://www.hs-bench.clawder.ai/docs/what_to_submit) | Overview of contribution, required folders and files |
+| 2 | [How to Extract Data from a Paper](https://www.hs-bench.clawder.ai/docs/extract_from_paper) | Paper hierarchy, AI extraction prompt, walkthrough example |
+| 3 | [How to Build Your Study Files](https://www.hs-bench.clawder.ai/docs/build_study_files) | Schemas, code examples, and contracts for each file |
+| 4 | [How to Submit Your Study](https://www.hs-bench.clawder.ai/docs/submit_study) | Fork, verify, push, and open a PR |
+
+### 3. Verify locally
+
+```bash
+bash scripts/verify_study.sh <yourgithubid>_013
+```
+
+### 4. Commit and push
+
+```bash
+git add studies/<yourgithubid>_013/
+git commit -m "Add study: <Your Study Title>"
+git push origin contrib-<yourgithubid>-013
+```
+
+### 5. Open a Pull Request
+
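+Open a PR on GitHub targeting the `dev` branch. CI validates the study automatically and checks that your GitHub username is listed under `contributors` in the study's `index.json`; final acceptance is by human review. Maintainers assign the final `study_XXX` number in merge order.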
+
+You can also submit a study via **web upload** at [hs-bench.clawder.ai/contribute](https://www.hs-bench.clawder.ai/contribute).
+
+## Existing Studies
+
+The 12 foundational studies (cognition, strategic interaction, social psychology) serve as reference examples. Browse them on the [website](https://www.hs-bench.clawder.ai/contribute#studies) or locally under `studies/`.
+
+## Citation & Hugging Face
+
+If you use HumanStudy-Bench, please cite:
+
+```bibtex
+@misc{liu2026humanstudybenchaiagentdesign,
+      title={HumanStudy-Bench: Towards AI Agent Design for Participant Simulation},
+      author={Xuan Liu and Haoyang Shang and Zizhang Liu and Xinyan Liu and Yunze Xiao and Yiwen Tu and Haojian Jin},
+      year={2026},
+      eprint={2602.00685},
+      archivePrefix={arXiv},
+      primaryClass={cs.AI},
+      url={https://arxiv.org/abs/2602.00685},
+}
+```
+
+**Hugging Face:** Benchmark results and resources are available on the [Hugging Face Hub](https://huggingface.co/) under `fuyyckwhy/HS-Bench-results`.
+
+## License
+
+MIT License. See [LICENSE](LICENSE) for details.
@@ -0,0 +1,41 @@
+# See https://help.github.com/articles/ignoring-files/ for more about ignoring files.
+
+# dependencies
+/node_modules
+/.pnp
+.pnp.*
+.yarn/*
+!.yarn/patches
+!.yarn/plugins
+!.yarn/releases
+!.yarn/versions
+
+# testing
+/coverage
+
+# next.js
+/.next/
+/out/
+
+# production
+/build
+
+# misc
+.DS_Store
+*.pem
+
+# debug
+npm-debug.log*
+yarn-debug.log*
+yarn-error.log*
+.pnpm-debug.log*
+
+# env files (can opt-in for committing if needed)
+.env*
+
+# vercel
+.vercel
+
+# typescript
+*.tsbuildinfo
+next-env.d.ts
@@ -0,0 +1,41 @@
+## co_website (HumanStudy-Bench web app)
+
+Next.js app for:
+- Homepage sections (`Overview`, `Leaderboard`, `Dataset`)
+- Study catalog and study detail pages
+- Contribute flow (upload + PR creation)
+- Docs tab (`/docs`)
+
+## Local preview
+
+```bash
+cd co_website
+npm install
+npm run dev
+```
+
+Open `http://localhost:3000`.
+
+## Build checks
+
+```bash
+cd co_website
+npm run lint
+npm run build
+```
+
+## Study ZIP download
+
+ZIP downloads are served by:
+- `GET /api/studies/:studyId/zip`
+
+This endpoint packages `studies/:studyId` directly from the repository.
+
+## Refreshing effect-size plot data
+
+Homepage effect-size scatter reads:
+- `public/data/effects/gemini_flash_v4_effect_data.json`
+
+To refresh:
+1. From repo root: `python scripts/plot_single_fig3_effects.py --export-data /absolute/path/to/co_website/public/data/effects/gemini_flash_v4_effect_data.json`
+2. Rebuild/redeploy the site.