-
Notifications
You must be signed in to change notification settings - Fork 0
60 lines (51 loc) · 1.72 KB
/
eval.yml
File metadata and controls
60 lines (51 loc) · 1.72 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
---
# Workflow: run the promptfoo evaluation suite for the ai-content-quality
# package whenever its prompts, eval definitions, analyzer, or promptfoo
# configuration change.
name: Promptfoo Eval

on:
  # Direct pushes that touch any eval-relevant file.
  push:
    paths:
      - "python/ai-content-quality/prompts/**"
      - "python/ai-content-quality/evals/**"
      - "python/ai-content-quality/src/content_quality/services/analyzer.py"
      - "python/ai-content-quality/promptfooconfig.yaml"
  # Pull requests that touch the same set of files (kept in sync with `push`).
  pull_request:
    paths:
      - "python/ai-content-quality/prompts/**"
      - "python/ai-content-quality/evals/**"
      - "python/ai-content-quality/src/content_quality/services/analyzer.py"
      - "python/ai-content-quality/promptfooconfig.yaml"

# One active run per git ref: a newer run for the same ref cancels the
# in-progress one.
concurrency:
  group: eval-${{ github.ref }}
  cancel-in-progress: true
jobs:
  # Runs the promptfoo eval suite and fails the build when fewer than 95% of
  # assertions pass. Results are uploaded as an artifact in every case.
  eval:
    runs-on: ubuntu-latest
    # Least privilege: the job only needs to read the repository contents.
    permissions:
      contents: read
    defaults:
      run:
        # Applies to `run:` steps only; `uses:` steps still resolve paths
        # relative to the workspace root.
        working-directory: python/ai-content-quality
    env:
      OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
    steps:
      - uses: actions/checkout@v4

      - uses: actions/setup-node@v4
        with:
          node-version: "20"

      # NOTE(review): `@latest` is unpinned while the pass-rate step depends
      # on promptfoo's JSON output schema - consider pinning a known-good
      # version.
      - name: Install promptfoo
        run: npm install -g promptfoo@latest

      - name: Run eval
        env:
          # promptfoo exits non-zero as soon as a single test case fails,
          # which would skip the threshold check below and turn the 95% gate
          # into a 100% gate. Report failures with exit code 0 here and let
          # "Check pass rate" decide; genuine crashes still fail this step.
          PROMPTFOO_FAILED_TEST_EXIT_CODE: "0"
        run: promptfoo eval --no-cache -o eval-results.json

      - name: Check pass rate
        run: |
          set -euo pipefail

          # `// 0` maps a missing/null stat to 0 so the guards below catch it.
          # NOTE(review): confirm these stat field names against the JSON
          # schema of the promptfoo version in use.
          TOTAL=$(jq -r '.results.stats.totalAssertions // 0' eval-results.json)
          PASSED=$(jq -r '.results.stats.totalPassedAssertions // 0' eval-results.json)

          # Fail closed on anything that is not a plain non-negative integer.
          if ! [[ "$TOTAL" =~ ^[0-9]+$ && "$PASSED" =~ ^[0-9]+$ ]]; then
            echo "::error::Could not read assertion counts from eval-results.json (total='${TOTAL}', passed='${PASSED}')"
            exit 1
          fi

          # Zero assertions would divide by zero and must not count as a pass.
          if [ "$TOTAL" -eq 0 ]; then
            echo "::error::No assertions were evaluated; cannot compute a pass rate"
            exit 1
          fi

          # bc is used for the human-readable percentage only.
          RATE=$(echo "scale=2; $PASSED * 100 / $TOTAL" | bc)
          echo "Pass rate: ${RATE}% (${PASSED}/${TOTAL})"

          # Integer form of PASSED / TOTAL >= 95 / 100.
          if [ $((PASSED * 100)) -lt $((TOTAL * 95)) ]; then
            echo "::error::Pass rate ${RATE}% is below 95% threshold"
            exit 1
          fi

      # Always publish the raw results, including when a previous step failed.
      - name: Upload eval results
        if: always()
        uses: actions/upload-artifact@v4
        with:
          name: eval-results
          # Workspace-relative path: `defaults.run.working-directory` does not
          # apply to `uses:` steps.
          path: python/ai-content-quality/eval-results.json