Skip to content

Hybrid retrieval tutorial (#241) #37

Hybrid retrieval tutorial (#241)

Hybrid retrieval tutorial (#241) #37

Workflow file for this run

name: Sync tutorial with dC workspace
on:
push:
branches:
- main
paths:
- "tutorials/[0-9]*.ipynb"
jobs:
get-tutorials:
runs-on: ubuntu-latest
outputs:
modified-matrix: ${{ steps.create_matrix.outputs.modified-matrix }}
deleted-matrix: ${{ steps.create_matrix.outputs.deleted-matrix }}
steps:
- name: Checkout
uses: actions/checkout@v3
with:
fetch-depth: 0
- name: Get changed files
id: files
uses: tj-actions/changed-files@v34
with:
json: true
files: |
./tutorials/[0-9]*.ipynb
- name: Create matrixes
id: create_matrix
run: |
echo "modified-matrix=${{ steps.files.outputs.all_changed_files }}" >> "$GITHUB_OUTPUT"
echo "deleted-matrix=${{ steps.files.outputs.deleted_files }}" >> "$GITHUB_OUTPUT"
modified:
needs: get-tutorials
if: ${{ needs.get-tutorials.outputs.modified-matrix != '[]' && needs.get-tutorials.outputs.modified-matrix != '' }}
runs-on: ubuntu-latest
strategy:
matrix:
file: ${{ fromJSON(needs.get-tutorials.outputs.modified-matrix) }}
steps:
- name: Checkout
uses: actions/checkout@v3
- uses: actions/setup-python@v4
with:
python-version: "3.11"
- name: Install requirements
run: |
pip install --upgrade pip
pip install -r requirements.txt
- name: Generate file to upload
id: file-generator
run: |
FILE="$(basename ${{ matrix.file }} .ipynb).txt"
METADATA_FILE="$(basename ${{ matrix.file }} .ipynb).yml"
echo "file=text/$FILE" >> "$GITHUB_OUTPUT"
echo "metadata_file=text/$METADATA_FILE" >> "$GITHUB_OUTPUT"
python scripts/generate_txt.py --metadata --notebooks ${{ matrix.file }}
- name: Upload tutorial to deepset Cloud
uses: silvanocerza/deepset-cloud-file-uploader@v1
with:
api-key: ${{ secrets.DEEPSET_CLOUD_API_KEY }}
workspace-name: ${{ secrets.DEEPSET_CLOUD_WORKSPACE }}
file: ${{ steps.file-generator.outputs.file }}
write-mode: OVERWRITE
meta-file: ${{ steps.file-generator.outputs.metadata_file }}
deleted:
needs: get-tutorials
if: ${{ needs.get-tutorials.outputs.deleted-matrix != '[]' && needs.get-tutorials.outputs.deleted-matrix != '' }}
runs-on: ubuntu-latest
strategy:
matrix:
file: ${{ fromJSON(needs.get-tutorials.outputs.deleted-matrix) }}
steps:
# This step is really important as when we remove a tutorial
# notebook we also want to remove the relative file from
# deepset Cloud, but since the remote file will have a .txt
# extension we must first generate the full file name with this step.
- name: Get file with correct extension
id: extension-changer
run: |
FILE="$(basename ${{ matrix.file }} .ipynb).txt"
echo "file=$FILE" >> "$GITHUB_OUTPUT"
- name: Delete file from deepset Cloud
uses: silvanocerza/deepset-cloud-file-deleter@v1
with:
api-key: ${{ secrets.DEEPSET_CLOUD_API_KEY }}
workspace-name: ${{ secrets.DEEPSET_CLOUD_WORKSPACE }}
file: ${{ steps.extension-changer.outputs.file}}