Skip to content

Adjustments for Lab01 and added notes for issues. #5

Adjustments for Lab01 and added notes for issues.

Adjustments for Lab01 and added notes for issues. #5

# Automated evaluation workflow (GitHub Actions).
#
# Runs the quality and safety evaluator modules when agent or evaluator code
# changes (pushes are additionally triggered by dataset changes), then
# publishes the results directory as a build artifact.
name: Automated Evaluation Pipeline

on:
  push:
    branches: [main, develop]
    paths:
      - 'src/agents/**'
      - 'src/evaluators/**'
      - 'data/datasets/**'
  pull_request:
    branches: [main]
    # NOTE(review): unlike `push`, dataset changes do not trigger PR runs.
    # Left as in the original; confirm this is intentional.
    paths:
      - 'src/agents/**'
      - 'src/evaluators/**'

# The job only checks out the repository, so restrict the GITHUB_TOKEN
# to read-only access to repository contents.
permissions:
  contents: read

jobs:
  evaluate-agents:
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4

      - name: Set up Python
        uses: actions/setup-python@v5
        with:
          # Quoted so the version is read as a string, not a float.
          python-version: '3.9'

      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          pip install -r requirements.txt

      # NOTE(review): both evaluation steps take FOUNDRY_API_KEY from the
      # secrets context. Secrets are not exposed to pull_request runs that
      # originate from forks, so these steps may fail there; confirm the
      # desired behaviour.
      - name: Run Quality Evaluations
        run: python -m src.evaluators.quality_evaluators
        env:
          FOUNDRY_API_KEY: ${{ secrets.FOUNDRY_API_KEY }}

      - name: Run Safety Evaluations
        run: python -m src.evaluators.safety_evaluators
        env:
          FOUNDRY_API_KEY: ${{ secrets.FOUNDRY_API_KEY }}

      # Upload even when an earlier step failed so that partial results can
      # be inspected; skipped only if the run was cancelled.
      # Presumably the evaluators write their output under this path; verify
      # against the evaluator modules.
      - name: Upload Evaluation Results
        if: ${{ !cancelled() }}
        uses: actions/upload-artifact@v4
        with:
          name: evaluation-results
          path: data/results/automated_evaluations/