# Listing metadata from the original file viewer: 36 lines, 895 B, YAML.
# CI workflow: installs the Python test dependencies and runs
# tests/evaluation_test.py with pytest on every push.
name: ACE Benchmark Evaluation Test
on: [push]

jobs:
  test:
    runs-on: ubuntu-latest
    strategy:
      matrix:
        # Quoted so the version stays the string "3.10" and is not read
        # as the float 3.1.
        python-version: ['3.10']

    steps:
      - name: Checkout code
        uses: actions/checkout@v4

      # Prints the working directory and its contents to the job log.
      - name: Debug directory structure
        run: |
          echo "Current directory: $(pwd)"
          ls -la

      - name: Setup Python
        uses: actions/setup-python@v4
        with:
          python-version: ${{ matrix.python-version }}

      - name: Install dependencies
        run: |
          pip install --upgrade pip
          pip install pytest pytest-asyncio pytest-mock
          pip install agentscope ray

      - name: Run tests
        env:
          # Use the github context for the workspace path: default variables
          # such as GITHUB_WORKSPACE are not exposed through the env context,
          # so reading it from there yields an empty string and a PYTHONPATH
          # of "/evaluation/ace_bench".
          PYTHONPATH: ${{ github.workspace }}/evaluation/ace_bench
          # Taken from the repository secrets; presumably consumed by the
          # code under test -- confirm against tests/evaluation_test.py.
          DASHSCOPE_API_KEY: ${{ secrets.DASHSCOPE_API_KEY }}
        run: |
          python -m pytest tests/evaluation_test.py -v