---
# Runs the evaluation test module (tests/evaluation_test.py) with pytest,
# both on a schedule and on manual dispatch.
name: ACE Benchmark Evaluation Test

on:
  schedule:
    # Minute 0, hour 0, every 3rd day-of-month (1, 4, 7, ...).
    # GitHub evaluates cron schedules in UTC.
    - cron: '0 0 */3 * *'
  # Allows the workflow to be started manually.
  workflow_dispatch:

# Least privilege: the job only needs to read the repository for checkout.
permissions:
  contents: read

jobs:
  test:
    runs-on: ubuntu-latest
    strategy:
      matrix:
        # Quoted so YAML does not parse 3.10 as the float 3.1.
        python-version: ['3.10']

    steps:
      - name: Checkout code
        uses: actions/checkout@v4

      # Prints the workspace path and contents to help diagnose path issues.
      - name: Debug directory structure
        run: |
          echo "Current directory: $(pwd)"
          ls -la

      - name: Setup Python
        # v5 keeps the same inputs as v4 but runs on a supported Node runtime.
        uses: actions/setup-python@v5
        with:
          python-version: ${{ matrix.python-version }}

      - name: Install dependencies
        # `python -m pip` targets the interpreter selected by setup-python.
        run: |
          python -m pip install --upgrade pip
          python -m pip install pytest pytest-asyncio pytest-mock
          python -m pip install agentscope ray

      - name: Run tests
        env:
          # Supplied from repository secrets; presumably read by the tests
          # to reach the DashScope API -- confirm against the test module.
          DASHSCOPE_API_KEY: ${{ secrets.DASHSCOPE_API_KEY }}
        run: |
          python -m pytest tests/evaluation_test.py -v