CogStack · alhendrickson · Aug 14, 2025 · Aug 13, 2025 · Aug 13, 2025
diff --git a/.github/workflows/medcat-trainer-v1_ci.yml b/.github/workflows/medcat-trainer-v1_ci.yml
@@ -0,0 +1,68 @@
+# CI for MedCAT Trainer v1: runs on pull requests that touch the v1 trainer
+# sources or any medcat-trainer-v1 workflow file.
+name: medcat-trainer-v1 ci-build
+
+on:
+  pull_request:
+    paths:
+      - 'v1/medcat-trainer/**'
+      - '.github/workflows/medcat-trainer-v1**'
+
+# Least privilege: restrict GITHUB_TOKEN to read-only repository access
+# instead of inheriting the repository default.
+permissions:
+  contents: read
+
+# Every `run` step starts in the v1 trainer directory unless it overrides this.
+defaults:
+  run:
+    working-directory: ./v1/medcat-trainer
+
+jobs:
+  # Client library: install it in editable mode, run its pytest suite,
+  # then build the distribution to prove packaging still works.
+  test-client:
+    runs-on: ubuntu-latest
+    steps:
+      - name: Checkout main
+        uses: actions/checkout@v4
+        with:
+          ref: ${{ github.ref }}
+
+      - name: Set up Python
+        uses: actions/setup-python@v4
+        with:
+          python-version: "3.10"
+
+      - name: Install dependencies
+        run: |
+          python -m pip install --upgrade pip
+          pip install requests pytest build
+
+      # The client package lives in ./client below the workflow's default
+      # working directory, so the remaining steps run from there.
+      - name: Install client package in development mode
+        working-directory: ./v1/medcat-trainer/client
+        run: pip install -e .
+
+      - name: Run client tests
+        working-directory: ./v1/medcat-trainer/client
+        run: python -m pytest tests/ -v
+
+      - name: Build client package
+        working-directory: ./v1/medcat-trainer/client
+        run: python -m build
+
+  # Build and test webapp container
+  build-and-push:
@@ -1,3 +1,5 @@
+permissions:
+  contents: read
 name: medcat-trainer-v1 ci-build
 on:
@@ -1,3 +1,5 @@
+permissions:
+  contents: read
 name: medcat-trainer-v1 ci-build

 on:
+    runs-on: ubuntu-latest
+    # Only build the image once the client tests have passed.
+    needs: test-client
+    steps:
+      - name: Checkout main
+        uses: actions/checkout@v4
+        with:
+          ref: ${{ github.ref }}
+
+      # The image is tagged dev-latest and used only by the test step below;
+      # this job has no push step.
+      - name: Build
+        run: |
+          docker build -t cogstacksystems/medcat-trainer:dev-latest webapp/.
+
+      # The Django test suite runs inside the image that was just built.
+      - name: Run Django Tests
+        run: |
+          # run tests
+          docker run --rm cogstacksystems/medcat-trainer:dev-latest python manage.py test
@@ -1,3 +1,5 @@
+permissions:
+  contents: read
 name: medcat-trainer-v1 ci-build
 on:
@@ -1,3 +1,5 @@
+permissions:
+  contents: read
 name: medcat-trainer-v1 ci-build

 on:
diff --git a/.github/workflows/medcat-trainer-v1_qa.yml b/.github/workflows/medcat-trainer-v1_qa.yml
@@ -0,0 +1,82 @@
+# QA build for MedCAT Trainer v1: runs on every push to main.
+name: medcat-trainer-v1 qa-build
+
+on:
+  push:
+    branches: [main]
+
+# Least privilege: restrict GITHUB_TOKEN to read-only repository access
+# instead of inheriting the repository default.
+permissions:
+  contents: read
+
+# Every `run` step starts in the v1 trainer directory unless it overrides this.
+defaults:
+  run:
+    working-directory: ./v1/medcat-trainer
+
+jobs:
+  # Client library: install it in editable mode, run its pytest suite,
+  # then build the distribution to prove packaging still works.
+  test-client:
+    runs-on: ubuntu-latest
+    steps:
+      - name: Checkout main
+        uses: actions/checkout@v4
+        with:
+          ref: "main"
+
+      - name: Set up Python
+        uses: actions/setup-python@v4
+        with:
+          python-version: "3.10"
+
+      - name: Install dependencies
+        run: |
+          python -m pip install --upgrade pip
+          pip install requests pytest build
+
+      # The client package lives in ./client below the workflow's default
+      # working directory, so the remaining steps run from there.
+      - name: Install client package in development mode
+        working-directory: ./v1/medcat-trainer/client
+        run: pip install -e .
+
+      - name: Run client tests
+        working-directory: ./v1/medcat-trainer/client
+        run: python -m pytest tests/ -v
+
+      - name: Build client package
+        working-directory: ./v1/medcat-trainer/client
+        run: python -m build
+
+      # Disabled: publishing of dev builds to Test PyPI.
+      # - name: Publish dev distribution to Test PyPI
+      #   uses: pypa/gh-action-pypi-publish@v1.4.2
+      #   with:
+      #     password: ${{ secrets.MEDCAT_TRAINER_TEST_PYPI_API_TOKEN }}
+      #     repository_url: https://test.pypi.org/legacy/
+      #     packages_dir: v1/medcat-trainer/client/dist
+
+  # Build and test webapp container
+  build-and-push:
@@ -1,3 +1,5 @@
+permissions:
+  contents: read
 name: medcat-trainer-v1 qa-build
 on:
@@ -1,3 +1,5 @@
+permissions:
+  contents: read
 name: medcat-trainer-v1 qa-build

 on:
+    runs-on: ubuntu-latest
+    # Image build and push only happen after the client tests pass.
+    needs: test-client
+    steps:
+      - name: Checkout main
+        uses: actions/checkout@v4
+        with:
+          ref: 'main'
+
+      - name: Build
+        run: |
+          docker build -t cogstacksystems/medcat-trainer:v1-latest webapp/.
+
+      # The tests run inside the freshly built image, so a failure here
+      # stops the job before anything is pushed.
+      - name: Run Django Tests
+        run: |
+          # run tests
+          docker run --rm cogstacksystems/medcat-trainer:v1-latest python manage.py test
+
+      - name: Login to DockerHub
+        uses: docker/login-action@v3
+        with:
+          username: ${{ secrets.DOCKERHUB_USERNAME }}
+          password: ${{ secrets.DOCKER_HUB_ACCESS_TOKEN }}
+
+      - name: Push to DockerHub
+        run: |
+          docker push cogstacksystems/medcat-trainer:v1-latest
@@ -1,3 +1,5 @@
+permissions:
+  contents: read
 name: medcat-trainer-v1 qa-build
 on:
@@ -1,3 +1,5 @@
+permissions:
+  contents: read
 name: medcat-trainer-v1 qa-build

 on:
diff --git a/.github/workflows/medcat-trainer-v1_release.yml b/.github/workflows/medcat-trainer-v1_release.yml
@@ -0,0 +1,95 @@
+# Release build for MedCAT Trainer v1: runs when a tag matching
+# medcat-trainer/v1.*.* is pushed.
+name: medcat-trainer-v1 release-build
+
+on:
+  push:
+    tags:
+      - 'medcat-trainer/v1.*.*'
+
+# Least privilege: restrict GITHUB_TOKEN to read-only repository access
+# instead of inheriting the repository default.
+permissions:
+  contents: read
+
+# Every `run` step starts in the v1 trainer directory unless it overrides this.
+defaults:
+  run:
+    working-directory: ./v1/medcat-trainer
+
+jobs:
+  # Test, build and publish client library
+  test-and-publish-client:
+    runs-on: ubuntu-latest
+    steps:
+      # Check out the ref that triggered the workflow (the pushed tag) so the
+      # published package is built from the tagged commit rather than from
+      # whatever main points at when the job runs.
+      - name: Checkout release tag
+        uses: actions/checkout@v4
+        with:
+          ref: ${{ github.ref }}
+
+      - name: Release Tag
+        # If GITHUB_REF=refs/tags/medcat-trainer/v0.1.2, this returns v0.1.2
+        # (the longest prefix matching refs/*/ is stripped). Note that it
+        # includes the leading "v", though it probably shouldn't.
+        run: echo "RELEASE_VERSION=${GITHUB_REF##refs/*/}" >> "$GITHUB_ENV"
+
+      - name: Set up Python
+        uses: actions/setup-python@v4
+        with:
+          python-version: '3.10'
+
+      - name: Install dependencies
+        run: |
+          python -m pip install --upgrade pip
+          pip install requests pytest build twine
+
+      - name: Install client package in development mode
+        run: |
+          cd client
+          pip install -e .
+
+      - name: Run client tests
+        run: |
+          cd client
+          python -m pytest tests/ -v
+
+      - name: Build client package
+        run: |
+          cd client
+          python -m build
+
+      # Uploads whatever the build step left in client/dist.
+      - name: Publish production distribution to PyPI
+        if: startsWith(github.ref, 'refs/tags') && ! github.event.release.prerelease
+        uses: pypa/gh-action-pypi-publish@v1.4.2
+        with:
+          # TODO CU-869a25n7e Use Trusted Platform Publisher based PyPI release
+          password: ${{ secrets.PYPI_API_TOKEN }}
+          packages_dir: v1/medcat-trainer/client/dist
+
+  # Build and test webapp container
+  build-and-push:
@@ -1,3 +1,5 @@
+permissions:
+  contents: read
 name: medcat-trainer-v1 release-build
 on:
@@ -1,3 +1,5 @@
+permissions:
+  contents: read
 name: medcat-trainer-v1 release-build

 on:
+    runs-on: ubuntu-latest
+    # The image is only built and pushed after the client job has succeeded.
+    needs: test-and-publish-client
+    steps:
+      # Check out the ref that triggered the workflow (the pushed tag) so the
+      # image is built from the tagged commit rather than from whatever main
+      # points at when the job runs.
+      - name: Checkout release tag
+        uses: actions/checkout@v4
+        with:
+          ref: ${{ github.ref }}
+
+      - name: Release Tag
+        # If GITHUB_REF=refs/tags/medcat-trainer/v0.1.2, this returns v0.1.2
+        # (the longest prefix matching refs/*/ is stripped). Note that it
+        # includes the leading "v", though it probably shouldn't.
+        run: echo "RELEASE_VERSION=${GITHUB_REF##refs/*/}" >> "$GITHUB_ENV"
+
+      - name: Build
+        env:
+          IMAGE_TAG: ${{ env.RELEASE_VERSION }}
+        run: |
+          docker build -t "cogstacksystems/medcat-trainer:$IMAGE_TAG" webapp/.
+
+      # The tests run inside the freshly built image, so a failure here
+      # stops the job before anything is pushed.
+      - name: Run Django Tests
+        env:
+          IMAGE_TAG: ${{ env.RELEASE_VERSION }}
+        run: |
+          # run tests
+          docker run --rm "cogstacksystems/medcat-trainer:$IMAGE_TAG" python manage.py test
+
+      - name: Login to DockerHub
+        uses: docker/login-action@v3
+        with:
+          username: ${{ secrets.DOCKERHUB_USERNAME }}
+          password: ${{ secrets.DOCKER_HUB_ACCESS_TOKEN }}
+
+      - name: Push to DockerHub
+        env:
+          IMAGE_TAG: ${{ env.RELEASE_VERSION }}
+        run: |
+          docker push "cogstacksystems/medcat-trainer:$IMAGE_TAG"
@@ -1,5 +1,8 @@
 name: medcat-trainer-v1 release-build
+permissions:
+  contents: read
+
 on:
  push:
    tags:
@@ -1,5 +1,8 @@
 name: medcat-trainer-v1 release-build

+permissions:
+  contents: read
+
 on:
  push:
    tags:
+
diff --git a/v1/medcat-trainer/.env-example b/v1/medcat-trainer/.env-example
@@ -0,0 +1,6 @@
+# MedCAT
+# Space-separated list of spaCy model names.
+# NOTE(review): presumably the models made available to the trainer; confirm against whatever reads this variable.
+SPACY_MODELS="en_core_web_sm en_core_web_md en_core_web_lg"
+
+# Ports
+# NOTE(review): presumably the host ports for the trainer web app and Solr; confirm against the compose file.
+MCTRAINER_PORT=8001
+SOLR_PORT=8983
diff --git a/v1/medcat-trainer/.gitignore b/v1/medcat-trainer/.gitignore
@@ -0,0 +1,51 @@
+# Directories to be ignored fully
+/books/
+/articles/
+/other/
+/output/
+/graphics/
+/webapp/models/*
+data/
+tmp/
+*_tmp/
+.idea
+
+# Generated frontend bundle and Django media/static output
+/webapp/frontend/dist/*
+/webapp/api/media/*
+/webapp/api/static/*
+
+# Configuration
+.env
+
+# Keep folders with this
+!.keep
+
+# tmp and similar files
+.nfs*
+*.pyc
+*.out
+*.swp
+*.swn
+tmp_*
+t_*
+*_tmp
+*.swo
+*.lyx.emergency
+*.lyx#
+*~
+*.log
+*hidden*
+db.sqlite3
+nohup.out
+tmp.py
+
+# docs outputs
+docs/_build
+
+# macOS system files
+.DS_Store
+*/.DS_Store
+
+# Jupyter Notebook checkpoints
+*/.ipynb_checkpoints/*
diff --git a/v1/medcat-trainer/.readthedocs.yaml b/v1/medcat-trainer/.readthedocs.yaml
@@ -0,0 +1,17 @@
+# .readthedocs.yaml
+# Read the Docs configuration file
+# See https://docs.readthedocs.io/en/stable/config-file/v2.html for details
+
+# Configuration file format version.
+version: 2
+
+# Build environment: OS image and Python toolchain version.
+build:
+  os: ubuntu-20.04
+  tools:
+    python: "3.9"
+
+# NOTE(review): this file sits in v1/medcat-trainer/, yet the paths below
+# start at medcat-trainer/ - confirm they still resolve after the move
+# into v1/.
+sphinx:
+  configuration: medcat-trainer/docs/conf.py
+
+# Packages installed into the docs build environment.
+python:
+  install:
+    - requirements: medcat-trainer/docs/requirements.txt