Skip to content

Add llm as judge mt-bench dataset and metrics #867

Add llm as judge mt-bench dataset and metrics

Add llm as judge mt-bench dataset and metrics #867

# CI workflow that installs the package from source and runs
# utils/prepare_all_artifacts.py.
# NOTE(review): presumably the script fails when a regenerated artifact
# disagrees with the checked-in catalog -- confirm against the script.
name: Test Catalog Consistency

# Run on pushes to main and on pull requests that target main.
on:
  push:
    branches: [main]
  pull_request:
    branches: [main]

jobs:
  run-catalog-consistency:
    runs-on: ubuntu-latest
    env:
      OS: ubuntu-latest
      # Placeholder value, not a real credential.
      # NOTE(review): presumably only needs to be set -- confirm.
      GENAI_KEY: "dummy"
      # Quoted so the value reaches the process as the string "True".
      UNITXT_ALLOW_PASSING_DATA_TO_REMOTE_API: "True"
    steps:
      - uses: actions/checkout@v4

      - uses: actions/setup-python@v5
        with:
          # Quoted so the version is never read as a float.
          python-version: '3.9'
          cache: 'pip'  # caching pip dependencies
          # Key the pip cache on the requirement files this job installs;
          # by default setup-python hashes requirements.txt / pyproject.toml.
          cache-dependency-path: 'requirements/*.rqr'

      - run: pip install -r requirements/base.rqr
      - run: pip install -r requirements/tests.rqr

      - name: Install Unitxt From Source
        run: pip install -e .

      - name: Run Tests
        run: python utils/prepare_all_artifacts.py