feat: add CUREv1 retrieval dataset #4150
Workflow file for this run
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# GitHub action for the mmteb contributions | |
# this way the CI related to the mmteb contributions will be separated from the linting CI | |
name: mmteb | |
on: | |
push: | |
branches: [main] | |
pull_request: | |
jobs: | |
check-points: | |
runs-on: ubuntu-latest | |
steps: | |
- uses: actions/checkout@v3 | |
- uses: actions/setup-python@v4 | |
with: | |
python-version: "3.9" | |
cache: "pip" | |
- name: Install dependencies | |
run: | | |
pip install jsonlines pydantic | |
- name: Validate jsonl points files | |
run: python docs/mmteb/validate_points.py | |
create-table: | |
# only run on push to main | |
if: github.event_name == 'push' && github.ref == 'refs/heads/main' | |
runs-on: ubuntu-latest | |
needs: check-points | |
steps: | |
- uses: actions/checkout@v3 | |
with: | |
token: ${{ secrets.RELEASE }} | |
- uses: actions/setup-python@v4 | |
with: | |
python-version: "3.9" | |
cache: "pip" | |
- name: Install dependencies | |
run: | | |
pip install pandas tabulate # for the table creation | |
- name: Create table | |
run: python docs/mmteb/create_points_table.py | |
- name: Push table | |
run: | | |
git config --global user.email "github-actions[bot]@users.noreply.github.com" | |
git config --global user.name "github-actions[bot]" | |
# Check if changes exist in points_table.md | |
if git diff --quiet; then | |
echo "No changes detected" | |
else | |
git add docs/mmteb/points_table.md | |
git commit -m "Update points table" | |
git push | |
fi | |