Skip to main content

Single Skill

The simplest pattern: evaluate one skill per workflow run.

# Single-skill evaluation workflow: one skill is evaluated per workflow run.
name: Skill Eval
on:
  pull_request:
    # Only trigger when files under this skill's directory change.
    paths:
      - 'skills/my-skill/**'

# Token scopes granted to this workflow.
permissions:
  contents: read
  # NOTE(review): presumably lets the eval action report results on the
  # pull request — confirm against the action's documentation.
  pull-requests: write

jobs:
  eval:
    runs-on: ubuntu-latest
    # Upper bound on how long the job may run, in minutes.
    timeout-minutes: 30
    steps:
      - uses: actions/checkout@v6

      - uses: skill-bench/skill-eval-action@v1
        with:
          skill-name: my-skill
          # Same directory as the `paths` filter above.
          skill-path: skills/my-skill
          # Read from repository secrets; never hard-code the key here.
          anthropic-api-key: ${{ secrets.ANTHROPIC_API_KEY }}
          # Quoted so it is passed as a string. Presumably a percentage —
          # TODO confirm the unit in the action's documentation.
          pass-threshold: '80'