Merge pull request #466 from instructlab/port_old_tests

Add simple and full knowledge pipeline functional tests

bbrowning authored Feb 3, 2025
2 parents e04c039 + 2a62495 commit ddc8ec5
Showing 10 changed files with 346 additions and 62 deletions.
16 changes: 16 additions & 0 deletions .github/mergify.yml
@@ -59,6 +59,22 @@ pull_request_rules:
- -files~=^requirements.*\.txt$
- -files=.github/workflows/e2e-nvidia-t4-x1.yml

# functional gpu small workflow
- or:
- and:
# note this should match the triggering criteria in 'functional-gpu-nvidia-t4-x1.yml'
- check-success~=functional-gpu-small-workflow-complete
- or:
- files~=\.py$
- files=pyproject.toml
- files~=^requirements.*\.txt$
- files=.github/workflows/functional-gpu-nvidia-t4-x1.yml
- and:
- -files~=\.py$
- -files=pyproject.toml
- -files~=^requirements.*\.txt$
- -files=.github/workflows/functional-gpu-nvidia-t4-x1.yml
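      # Net effect: the GPU check must pass exactly when the PR touches a
      # file that can trigger the workflow; PRs touching none of these files
      # are not blocked on a check that never runs.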

# lint must pass if files change that would trigger this job
- or:
- and:
153 changes: 153 additions & 0 deletions .github/workflows/functional-gpu-nvidia-t4-x1.yml
@@ -0,0 +1,153 @@
# SPDX-License-Identifier: Apache-2.0

name: Functional GPU (NVIDIA Tesla T4 x1)

on:
# run against every merge commit to 'main' and release branches
push:
branches:
- main
- release-*
# only run on PRs that touch the paths matched below
pull_request_target:
branches:
- main
- release-*
paths:
# note this should match the merging criteria in 'mergify.yml'
- "**.py"
- "pyproject.toml"
- "requirements**.txt"
- "tox.ini"
- ".github/workflows/functional-gpu-nvidia-t4-x1.yml" # This workflow

concurrency:
group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
cancel-in-progress: true

env:
LC_ALL: en_US.UTF-8

defaults:
run:
shell: bash

permissions:
contents: read

jobs:
start-small-ec2-runner:
runs-on: ubuntu-latest
outputs:
label: ${{ steps.start-ec2-runner.outputs.label }}
ec2-instance-id: ${{ steps.start-ec2-runner.outputs.ec2-instance-id }}
steps:
- name: Configure AWS credentials
uses: aws-actions/configure-aws-credentials@e3dd6a429d7300a6a4c196c26e071d42e0343502 # v4.0.2
with:
aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
aws-region: ${{ vars.AWS_REGION }}

- name: Start EC2 runner
id: start-ec2-runner
uses: machulav/ec2-github-runner@1827d6ca7544d7044ddbd2e9360564651b463da2 # v2.3.7
with:
mode: start
github-token: ${{ secrets.GH_PERSONAL_ACCESS_TOKEN }}
ec2-image-id: ${{ vars.AWS_EC2_AMI }}
ec2-instance-type: g4dn.2xlarge
subnet-id: subnet-02d230cffd9385bd4
security-group-id: sg-06300447c4a5fbef3
iam-role-name: instructlab-ci-runner
aws-resource-tags: >
[
{"Key": "Name", "Value": "instructlab-ci-github-small-runner"},
{"Key": "GitHubRepository", "Value": "${{ github.repository }}"},
{"Key": "GitHubRef", "Value": "${{ github.ref }}"},
{"Key": "GitHubPR", "Value": "${{ github.event.number }}"}
]
functional-gpu-small-test:
needs:
- start-small-ec2-runner
runs-on: ${{ needs.start-small-ec2-runner.outputs.label }}

# It is important that this job has no write permissions and no
# access to any secrets, because this is where we run untrusted
# code from PRs.
permissions: {}

steps:
- name: Install Packages
run: |
cat /etc/os-release
sudo dnf install -y gcc gcc-c++ make git python3.11 python3.11-devel
- name: Checkout instructlab/sdg
uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
with:
# https://github.com/actions/checkout/issues/249
fetch-depth: 0

- name: Fetch and checkout PR
if: github.event_name == 'pull_request_target'
run: |
git fetch origin pull/${{ github.event.pull_request.number }}/merge:pr-merge-${{ github.event.pull_request.number }}
git checkout pr-merge-${{ github.event.pull_request.number }}
git log -1 --format="%H %s"
- name: Install instructlab/sdg
run: |
export PATH="/home/ec2-user/.local/bin:/usr/local/cuda/bin:$PATH"
python3.11 -m venv --upgrade-deps venv
. venv/bin/activate
nvidia-smi
python3.11 -m pip install tox "tox-gh>=1.2"
python3.11 -m pip cache remove llama_cpp_python
CMAKE_ARGS="-DLLAMA_CUDA=on" python3.11 -m pip install -r requirements-dev.txt
- name: Check disk before tests
run: |
df -h
- name: Run functional gpu tests with tox
run: |
. venv/bin/activate
tox -e py3-functional-gpu
- name: Check disk after tests
run: |
df -h
stop-small-ec2-runner:
needs:
- start-small-ec2-runner
- functional-gpu-small-test
runs-on: ubuntu-latest
if: ${{ always() }}
steps:
- name: Configure AWS credentials
uses: aws-actions/configure-aws-credentials@e3dd6a429d7300a6a4c196c26e071d42e0343502 # v4.0.2
with:
aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
aws-region: ${{ vars.AWS_REGION }}

- name: Stop EC2 runner
uses: machulav/ec2-github-runner@1827d6ca7544d7044ddbd2e9360564651b463da2 # v2.3.7
with:
mode: stop
github-token: ${{ secrets.GH_PERSONAL_ACCESS_TOKEN }}
label: ${{ needs.start-small-ec2-runner.outputs.label }}
ec2-instance-id: ${{ needs.start-small-ec2-runner.outputs.ec2-instance-id }}

functional-gpu-small-workflow-complete:
# we don't want to block PRs on failed EC2 cleanup
# so not requiring "stop-small-ec2-runner" as well
needs: ["start-small-ec2-runner", "functional-gpu-small-test"]
runs-on: ubuntu-latest
steps:
- name: Functional GPU Workflow Complete
run: echo "Functional GPU Workflow Complete"
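
The trailing no-op functional-gpu-small-workflow-complete job gives Mergify a single stable check name to require (it matches the check-success~=functional-gpu-small-workflow-complete condition added to mergify.yml above), so the required status stays the same even if the EC2 runner jobs are renamed or split later.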
5 changes: 5 additions & 0 deletions pyproject.toml
@@ -102,3 +102,8 @@ exclude = [
]
# honor excludes by not following there through imports
follow_imports = "silent"

[tool.pytest.ini_options]
markers = [
"gpu: marks tests that should run with gpus (deselect with '-m \"not gpu\"')",
]
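
Registering the marker keeps pytest from warning about the custom gpu mark and documents how to deselect it. A minimal sketch of a test opting in (hypothetical test name, shown for illustration only):

import pytest

@pytest.mark.gpu  # selected with: pytest -m gpu; skipped with: pytest -m "not gpu"
def test_requires_cuda():
    ...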
4 changes: 3 additions & 1 deletion requirements-dev.txt
@@ -2,12 +2,14 @@

 -r requirements.txt

+jsonschema
+llama-cpp-python[server]>=0.3.0,<1.0.0
 pre-commit>=3.0.4,<5.0
 pylint>=2.16.2,<4.0
 pylint-pydantic
 pytest
 pytest-asyncio
 pytest-cov
 pytest-html
+starlette>=0.30.0
 tox>=4.4.2,<5
-jsonschema
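
(The llama-cpp-python[server] and starlette additions support the in-process OpenAI-compatible test server introduced in tests/functional/llama_cpp_helpers.py below; jsonschema appears to move up simply to keep the list alphabetized.)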
52 changes: 0 additions & 52 deletions scripts/test_knowledge.py

This file was deleted.
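
Judging from the branch name (port_old_tests) and the commit message, this standalone script's knowledge-pipeline coverage is ported into the functional tests added below.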

22 changes: 22 additions & 0 deletions tests/functional/conftest.py
@@ -3,6 +3,7 @@
import typing

# Third Party
from datasets import Dataset
import pytest

TESTS_PATH = pathlib.Path(__file__).parent.parent.absolute()
@@ -19,3 +20,24 @@ def testdata_path() -> typing.Generator[pathlib.Path, None, None]:
def examples_path() -> typing.Generator[pathlib.Path, None, None]:
"""Path to examples directory"""
yield EXAMPLES_PATH


@pytest.fixture
def tonsils_knowledge_dataset():
return Dataset.from_list(
[
{
"icl_query_1": "what is the location of the tubal tonsils?",
"icl_response_1": "The location of the tubal tonsils is the roof of the pharynx.",
"icl_query_2": "How long does the adenoid grow?",
"task_description": "Teaching about human anatomy, specifically tonsils",
"icl_response_2": "The adenoid grows until the age of 5, starts to shrink at the age of 7 and becomes small in adulthood.",
"icl_query_3": "What is the immune systems first line of defense against ingested or inhaled foreign pathogens?",
"icl_response_3": "The tonsils are the immune systems first line of defense.",
"document": "The **tonsils** are a set of lymphoid organs facing into the aerodigestive tract, which is known as Waldeyer's tonsillar ring and consists of the adenoid tonsil or pharyngeal tonsil, two tubal tonsils, two palatine tonsils, and the lingual tonsils. These organs play an important role in the immune system. When used unqualified, the term most commonly refers specifically to the palatine tonsils, which are two lymphoid organs situated at either side of the back of the human throat. The palatine tonsils and the adenoid tonsil are organs consisting of lymphoepithelial tissue located near the oropharynx and nasopharynx parts of the throat",
"icl_document": "The **tonsils** are a set of lymphoid organs facing into the aerodigestive tract, which is known as Waldeyer's tonsillar ring and consists of the adenoid tonsil or pharyngeal tonsil, two tubal tonsils, two palatine tonsils, and the lingual tonsils.",
"domain": "textbook",
"document_outline": "Medical description of tonsils",
}
]
)
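
Since the fixture returns a datasets.Dataset, tests can inspect it with the usual Dataset API; a minimal hypothetical consumer:

def test_fixture_shape(tonsils_knowledge_dataset):
    # pytest injects the fixture by parameter name
    assert tonsils_knowledge_dataset.num_rows == 1
    assert "document" in tonsils_knowledge_dataset.column_names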
36 changes: 36 additions & 0 deletions tests/functional/llama_cpp_helpers.py
@@ -0,0 +1,36 @@
# Standard
from importlib import resources
import pathlib
import typing

# Third Party
from llama_cpp.server.app import create_app
from llama_cpp.server.settings import ModelSettings, ServerSettings
from openai import OpenAI
from starlette.testclient import TestClient


def llama_cpp_openai_client(model, model_repo_id):
server_settings = ServerSettings()
model_settings = [
ModelSettings(
model=model,
hf_model_repo_id=model_repo_id,
verbose=True,
)
]
app = create_app(
server_settings=server_settings,
model_settings=model_settings,
)

@app.get("/")
def read_root():
return {"message": "Hello from InstructLab! Visit us at https://instructlab.ai"}

test_client = TestClient(app)
return OpenAI(
api_key="EMPTY",
base_url="http://localhost:8000/v1",
http_client=test_client,
)
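
Because the returned OpenAI client uses Starlette's TestClient (an httpx.Client subclass) as its http_client, every request is routed in-memory to the llama-cpp server app rather than over a network socket. A hypothetical usage, with the model arguments borrowed from test_full_pipeline.py below:

client = llama_cpp_openai_client(
    "mistral-7b-instruct-v0.2.Q5_K_M.gguf",
    "TheBloke/Mistral-7B-Instruct-v0.2-GGUF",
)
print(client.models.list().data[0].id)  # id of the model the server loaded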
51 changes: 51 additions & 0 deletions tests/functional/test_full_pipeline.py
@@ -0,0 +1,51 @@
# Standard
from importlib import resources
import unittest

# Third Party
import pytest

# First Party
from src.instructlab.sdg.datamixing import _get_question_hack, _get_response_hack
from src.instructlab.sdg.pipeline import (
FULL_PIPELINES_PACKAGE,
Pipeline,
PipelineContext,
)

# Local
from .llama_cpp_helpers import llama_cpp_openai_client


@pytest.mark.gpu
class TestFullPipeline(unittest.TestCase):
@pytest.fixture(autouse=True)
def _setup_fixtures(self, tonsils_knowledge_dataset):
model = "mistral-7b-instruct-v0.2.Q5_K_M.gguf"
model_repo_id = "TheBloke/Mistral-7B-Instruct-v0.2-GGUF"
model_family = "mixtral"
client = llama_cpp_openai_client(model, model_repo_id)
teacher_model = client.models.list().data[0].id
num_instructions_to_generate = 2
max_num_tokens = 1024
context = PipelineContext(
client=client,
model_family=model_family,
model_id=teacher_model,
num_instructions_to_generate=num_instructions_to_generate,
max_num_tokens=max_num_tokens,
)
yaml_path = resources.files(FULL_PIPELINES_PACKAGE).joinpath("knowledge.yaml")
self.knowledge_dataset = tonsils_knowledge_dataset
self.knowledge_pipeline = Pipeline.from_file(context, yaml_path)

def test_knowledge(self):
samples = self.knowledge_pipeline.generate(self.knowledge_dataset)
assert len(samples) > 0
assert "question" in samples.column_names
assert "response" in samples.column_names
for sample in samples:
question = _get_question_hack(sample)
response = _get_response_hack(sample)
assert len(question) > 0
assert len(response) > 0
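
Locally, this suite runs through the same tox environment the workflow invokes (tox -e py3-functional-gpu); plain pytest -m gpu should also select it, assuming the llama-cpp-python GPU build and model download succeed.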