From 8a18de9c90300083493d4bee0ee3949e4f5b398f Mon Sep 17 00:00:00 2001 From: Saad Zaher Date: Mon, 15 Sep 2025 12:33:45 +0100 Subject: [PATCH 1/2] add localprocess backend tests Signed-off-by: Saad Zaher --- Makefile | 11 +- .../trainer/backends/localprocess/backend.py | 6 +- .../backends/localprocess/backend_test.py | 727 ++++++++++++++++++ 3 files changed, 739 insertions(+), 5 deletions(-) create mode 100644 kubeflow/trainer/backends/localprocess/backend_test.py diff --git a/Makefile b/Makefile index 507b04d5c..79c4cba36 100644 --- a/Makefile +++ b/Makefile @@ -68,8 +68,15 @@ uv-venv: .PHONY: test-python test-python: uv-venv @uv sync - @uv run coverage run --source=kubeflow.trainer.backends.kubernetes.backend,kubeflow.trainer.utils.utils -m pytest ./kubeflow/trainer/backends/kubernetes/backend_test.py ./kubeflow/trainer/utils/utils_test.py - @uv run coverage report -m kubeflow/trainer/backends/kubernetes/backend.py kubeflow/trainer/utils/utils.py + @echo "Discovering all test files..." + @TEST_FILES=$$(find ./kubeflow -name "*_test.py" -type f | tr '\n' ' '); \ + SOURCE_FILES=$$(find ./kubeflow -name "*_test.py" -type f | sed 's/_test\.py$$/.py/' | tr '\n' ' '); \ + SOURCE_MODULES=$$(find ./kubeflow -name "*_test.py" -type f | sed 's/_test\.py$$/.py/' | sed 's|^\./||g' | sed 's|/|.|g' | sed 's|\.py$$||g' | tr '\n' ','); \ + SOURCE_MODULES=$$(echo $$SOURCE_MODULES | sed 's/,$$//'); \ + echo "Running tests: $$TEST_FILES"; \ + echo "Coverage sources: $$SOURCE_MODULES"; \ + uv run coverage run --source=$$SOURCE_MODULES -m pytest $$TEST_FILES; \ + uv run coverage report -m $$(echo $$SOURCE_FILES | tr ' ' '\n' | grep -E '\.(py)$$' | tr '\n' ' ') ifeq ($(report),xml) @uv run coverage xml else diff --git a/kubeflow/trainer/backends/localprocess/backend.py b/kubeflow/trainer/backends/localprocess/backend.py index 4fbb2d465..9c80f54af 100644 --- a/kubeflow/trainer/backends/localprocess/backend.py +++ b/kubeflow/trainer/backends/localprocess/backend.py @@ -61,11 +61,11 @@ def get_runtime(self, name: str) -> types.Runtime: return runtime def get_runtime_packages(self, runtime: types.Runtime): - runtime = next((rt for rt in local_runtimes if rt.name == runtime.name), None) - if not runtime: + local_runtime = next((rt for rt in local_runtimes if rt.name == runtime.name), None) + if not local_runtime: raise ValueError(f"Runtime '{runtime.name}' not found.") - return runtime.trainer.packages + return local_runtime.trainer.packages def train( self, diff --git a/kubeflow/trainer/backends/localprocess/backend_test.py b/kubeflow/trainer/backends/localprocess/backend_test.py new file mode 100644 index 000000000..e1fa22612 --- /dev/null +++ b/kubeflow/trainer/backends/localprocess/backend_test.py @@ -0,0 +1,727 @@ +# Copyright 2025 The Kubeflow Authors. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +""" +Unit tests for the LocalProcessBackend class in the Kubeflow Trainer SDK. 
+ +This module uses pytest and unittest.mock to test LocalProcessBackend's behavior +across job creation, management, and lifecycle operations using local subprocess execution. +""" + +import random +import string +import tempfile +import uuid +from dataclasses import asdict, dataclass, field +from datetime import datetime +from typing import Any, Optional, Set, Type +from unittest.mock import Mock, patch + +import pytest + +from kubeflow.trainer.backends.localprocess.backend import LocalProcessBackend +from kubeflow.trainer.backends.localprocess.constants import local_runtimes +from kubeflow.trainer.backends.localprocess.job import LocalJob +from kubeflow.trainer.backends.localprocess.types import ( + LocalBackendJobs, + LocalBackendStep, + LocalProcessBackendConfig, +) +from kubeflow.trainer.constants import constants +from kubeflow.trainer.types import types + + +@dataclass +class TestCase: + """Test case configuration for parametrized tests.""" + name: str + expected_status: str + config: dict[str, Any] = field(default_factory=dict) + expected_output: Optional[Any] = None + expected_error: Optional[Type[Exception]] = None + __test__ = False + + +# -------------------------- +# Constants for test scenarios +# -------------------------- +SUCCESS = "success" +FAILED = "failed" +TIMEOUT = "timeout" +RUNTIME_ERROR = "runtime_error" +VALUE_ERROR = "value_error" +TORCH_RUNTIME = constants.TORCH_RUNTIME +BASIC_TRAIN_JOB_NAME = "basic-job" +TEST_VENV_DIR = "/tmp/test_venv" + + +# -------------------------- +# Fixtures +# -------------------------- + +@pytest.fixture +def local_backend(): + """Provide a LocalProcessBackend instance for testing.""" + config = LocalProcessBackendConfig(cleanup_venv=True) + return LocalProcessBackend(cfg=config) + + +# -------------------------- +# Object Creators +# -------------------------- + +def create_mock_runtime( + name: str = TORCH_RUNTIME, + framework: str = "torch", + trainer_type: types.TrainerType = types.TrainerType.CUSTOM_TRAINER, +) -> types.Runtime: + """Create a mock Runtime object for testing.""" + return types.Runtime( + name=name, + trainer=types.RuntimeTrainer( + trainer_type=trainer_type, + framework=framework, + num_nodes=1, + device=constants.UNKNOWN, + device_count=constants.UNKNOWN, + ), + pretrained_model=None, + ) + + +def create_mock_trainer( + func_name: str = "Training function", + packages: Optional[list[str]] = None, + env: Optional[dict[str, str]] = None, +) -> types.CustomTrainer: + """Create a mock CustomTrainer object for testing.""" + if packages is None: + packages = ["torch", "numpy"] + if env is None: + env = {"ENV_VAR": "test_value"} + + return types.CustomTrainer( + func=lambda: print(func_name), + func_args={"param1": "value1"}, + packages_to_install=packages, + env=env, + ) + + +def create_mock_builtin_trainer() -> types.BuiltinTrainer: + """Create a mock BuiltinTrainer object for testing.""" + return types.BuiltinTrainer(config=types.TorchTuneConfig()) + + +def create_local_job( + name: str = "test-job", + status: str = constants.TRAINJOB_RUNNING, +) -> LocalJob: + """Create a mock LocalJob object for testing.""" + mock_job = Mock(spec=LocalJob) + mock_job.name = name + mock_job.status = status + mock_job.logs.return_value = ["log line 1", "log line 2"] + mock_job.cancel = Mock() + mock_job.join = Mock() + return mock_job + + +def create_local_backend_job( + name: str = "test-job", + runtime: Optional[types.Runtime] = None, + steps: Optional[list[LocalBackendStep]] = None, +) -> LocalBackendJobs: + """Create a mock 
LocalBackendJobs object for testing.""" + if runtime is None: + runtime = create_mock_runtime() + if steps is None: + mock_job = create_local_job() + steps = [LocalBackendStep(step_name="train", job=mock_job)] + + return LocalBackendJobs( + name=name, + runtime=runtime, + created=datetime.now(), + steps=steps, + ) + + +def create_train_job_type( + name: str = BASIC_TRAIN_JOB_NAME, + runtime: Optional[types.Runtime] = None, + status: str = constants.TRAINJOB_COMPLETE, +) -> types.TrainJob: + """Create a mock TrainJob object for testing.""" + if runtime is None: + runtime = create_mock_runtime() + + return types.TrainJob( + name=name, + creation_timestamp=datetime.now(), + runtime=runtime, + steps=[ + types.Step( + name="train", + status=status, + pod_name="train-pod", + device=constants.UNKNOWN, + device_count=constants.UNKNOWN, + ) + ], + num_nodes=1, + status=status, + ) + + +# -------------------------- +# Tests +# -------------------------- + +def test_init(): + """Test LocalProcessBackend initialization.""" + config = LocalProcessBackendConfig(cleanup_venv=False) + backend = LocalProcessBackend(cfg=config) + + assert backend.cfg == config + assert not backend.cfg.cleanup_venv + assert len(backend._LocalProcessBackend__local_jobs) == 0 + + +def test_list_runtimes(local_backend): + """Test list_runtimes method.""" + runtimes = local_backend.list_runtimes() + + assert isinstance(runtimes, list) + assert len(runtimes) == len(local_runtimes) + + # Check that all returned items are Runtime objects + for runtime in runtimes: + assert isinstance(runtime, types.Runtime) + assert isinstance(runtime.trainer, types.RuntimeTrainer) + + +@pytest.mark.parametrize( + "test_case", + [ + TestCase( + name="valid runtime name", + expected_status=SUCCESS, + config={"name": TORCH_RUNTIME}, + ), + TestCase( + name="invalid runtime name", + expected_status=FAILED, + config={"name": "invalid-runtime"}, + expected_error=ValueError, + ), + ], +) +def test_get_runtime(local_backend, test_case): + """Test get_runtime method with various scenarios.""" + print("Executing test:", test_case.name) + try: + runtime = local_backend.get_runtime(**test_case.config) + + assert test_case.expected_status == SUCCESS + assert isinstance(runtime, types.Runtime) + assert runtime.name == test_case.config["name"] + + except Exception as e: + assert test_case.expected_status == FAILED + assert type(e) is test_case.expected_error + if "invalid" in test_case.config.get("name", ""): + assert "not found" in str(e) + print("test execution complete") + + +@pytest.mark.parametrize( + "test_case", + [ + TestCase( + name="valid runtime packages", + expected_status=SUCCESS, + config={"runtime": create_mock_runtime()}, + ), + TestCase( + name="invalid runtime packages", + expected_status=FAILED, + config={ + "runtime": types.Runtime( + name="invalid-runtime", + trainer=types.RuntimeTrainer( + trainer_type=types.TrainerType.CUSTOM_TRAINER, + framework="invalid", + ), + ) + }, + expected_error=ValueError, + ), + ], +) +def test_get_runtime_packages(local_backend, test_case): + """Test get_runtime_packages method with various scenarios.""" + print("Executing test:", test_case.name) + try: + packages = local_backend.get_runtime_packages(**test_case.config) + + assert test_case.expected_status == SUCCESS + assert isinstance(packages, list) + assert "torch" in packages + + except Exception as e: + assert test_case.expected_status == FAILED + assert type(e) is test_case.expected_error + assert "not found" in str(e) + print("test execution complete") 
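+
+
+# Illustrative aside (not a test): several assertions in this module reach
+# backend-private state as ``backend._LocalProcessBackend__local_jobs``.
+# Python rewrites double-underscore attributes inside a class body to
+# ``_ClassName__name``, so external callers must use the mangled spelling.
+# The ``Example`` class below is purely hypothetical.
+def _demo_name_mangling() -> None:
+    class Example:
+        def __init__(self) -> None:
+            self.__items: list[str] = []  # stored as ``_Example__items``
+
+    assert Example()._Example__items == []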
+ + +@pytest.mark.parametrize( + "test_case", + [ + TestCase( + name="successful train with custom trainer", + expected_status=SUCCESS, + config={ + "runtime": create_mock_runtime(), + "trainer": create_mock_trainer(), + }, + ), + TestCase( + name="failed train with builtin trainer", + expected_status=FAILED, + config={ + "runtime": create_mock_runtime(), + "trainer": create_mock_builtin_trainer(), + }, + expected_error=ValueError, + ), + ], +) +@patch("kubeflow.trainer.backends.localprocess.backend.tempfile.mkdtemp") +@patch("kubeflow.trainer.backends.localprocess.backend.local_utils") +@patch("kubeflow.trainer.backends.localprocess.backend.LocalJob") +@patch("uuid.uuid4") +@patch("random.choice") +def test_train( + mock_random_choice, + mock_uuid, + mock_local_job_class, + mock_local_utils, + mock_mkdtemp, + local_backend, + test_case, +): + """Test train method with various scenarios.""" + print("Executing test:", test_case.name) + + # Setup mocks + mock_random_choice.return_value = "a" + mock_uuid.return_value.hex = "mock-uuid-hex" + mock_mkdtemp.return_value = TEST_VENV_DIR + + mock_local_job = create_local_job(name="amock-uuid-h-train") + mock_local_job_class.return_value = mock_local_job + + mock_local_utils.get_local_runtime_trainer.return_value = Mock() + mock_local_utils.get_local_train_job_script.return_value = ["python", "script.py"] + + try: + job_name = local_backend.train(**test_case.config) + + assert test_case.expected_status == SUCCESS + assert job_name == "amock-uuid-h" + assert len(local_backend._LocalProcessBackend__local_jobs) == 1 + + # Verify mock calls + mock_mkdtemp.assert_called_once() + mock_local_utils.get_local_runtime_trainer.assert_called_once() + mock_local_utils.get_local_train_job_script.assert_called_once() + mock_local_job.start.assert_called_once() + + except Exception as e: + assert test_case.expected_status == FAILED + assert type(e) is test_case.expected_error + assert "CustomTrainer must be set" in str(e) + + print("test execution complete") + + +@pytest.mark.parametrize( + "test_case", + [ + TestCase( + name="list jobs when empty", + expected_status=SUCCESS, + config={}, + expected_output=[], + ), + TestCase( + name="list jobs with existing jobs", + expected_status=SUCCESS, + config={"setup_jobs": True}, + ), + TestCase( + name="list jobs with runtime filter", + expected_status=SUCCESS, + config={"setup_jobs": True, "runtime": create_mock_runtime()}, + ), + ], +) +def test_list_jobs(local_backend, test_case): + """Test list_jobs method with various scenarios.""" + print("Executing test:", test_case.name) + + # Setup jobs if requested + if test_case.config.get("setup_jobs"): + backend_job = create_local_backend_job() + local_backend._LocalProcessBackend__local_jobs.append(backend_job) + + try: + runtime_filter = test_case.config.get("runtime") + jobs = local_backend.list_jobs(runtime=runtime_filter) + + assert test_case.expected_status == SUCCESS + assert isinstance(jobs, list) + + if test_case.config.get("setup_jobs"): + assert len(jobs) >= 1 + for job in jobs: + assert isinstance(job, types.TrainJob) + else: + assert jobs == test_case.expected_output + + except Exception as e: + assert test_case.expected_status == FAILED + assert type(e) is test_case.expected_error + + print("test execution complete") + + +@pytest.mark.parametrize( + "test_case", + [ + TestCase( + name="get existing job", + expected_status=SUCCESS, + config={"name": BASIC_TRAIN_JOB_NAME}, + ), + TestCase( + name="get non-existent job", + expected_status=FAILED, + config={"name": 
"non-existent-job"}, + expected_error=ValueError, + ), + ], +) +def test_get_job(local_backend, test_case): + """Test get_job method with various scenarios.""" + print("Executing test:", test_case.name) + + # Setup a job if testing success case + if test_case.expected_status == SUCCESS: + backend_job = create_local_backend_job(name=test_case.config["name"]) + local_backend._LocalProcessBackend__local_jobs.append(backend_job) + + try: + with patch.object( + local_backend, + "_LocalProcessBackend__get_job_status", + return_value=constants.TRAINJOB_COMPLETE, + ): + job = local_backend.get_job(**test_case.config) + + assert test_case.expected_status == SUCCESS + assert isinstance(job, types.TrainJob) + assert job.name == test_case.config["name"] + + except Exception as e: + assert test_case.expected_status == FAILED + assert type(e) is test_case.expected_error + assert "No TrainJob with name" in str(e) + + print("test execution complete") + + +@pytest.mark.parametrize( + "test_case", + [ + TestCase( + name="get logs for existing job", + expected_status=SUCCESS, + config={"name": BASIC_TRAIN_JOB_NAME}, + expected_output=["log line 1", "log line 2"], + ), + TestCase( + name="get logs with follow enabled", + expected_status=SUCCESS, + config={"name": BASIC_TRAIN_JOB_NAME, "follow": True}, + expected_output=["log line 1", "log line 2"], + ), + TestCase( + name="get logs for specific step", + expected_status=SUCCESS, + config={"name": BASIC_TRAIN_JOB_NAME, "step": "train"}, + expected_output=["log line 1", "log line 2"], + ), + TestCase( + name="get logs for non-existent job", + expected_status=FAILED, + config={"name": "non-existent-job"}, + expected_error=ValueError, + ), + ], +) +def test_get_job_logs(local_backend, test_case): + """Test get_job_logs method with various scenarios.""" + print("Executing test:", test_case.name) + + # Setup a job if testing success case + if test_case.expected_status == SUCCESS: + backend_job = create_local_backend_job(name=test_case.config["name"]) + local_backend._LocalProcessBackend__local_jobs.append(backend_job) + + try: + logs = list(local_backend.get_job_logs(**test_case.config)) + + assert test_case.expected_status == SUCCESS + assert logs == test_case.expected_output + + except Exception as e: + assert test_case.expected_status == FAILED + assert type(e) is test_case.expected_error + assert "No TrainJob with name" in str(e) + + print("test execution complete") + + +@pytest.mark.parametrize( + "test_case", + [ + TestCase( + name="wait for job with default status", + expected_status=SUCCESS, + config={"name": BASIC_TRAIN_JOB_NAME}, + ), + TestCase( + name="wait for job with custom status", + expected_status=SUCCESS, + config={ + "name": BASIC_TRAIN_JOB_NAME, + "status": {constants.TRAINJOB_RUNNING, constants.TRAINJOB_COMPLETE}, + "timeout": 300, + "polling_interval": 5, + }, + ), + TestCase( + name="wait for non-existent job", + expected_status=FAILED, + config={"name": "non-existent-job"}, + expected_error=ValueError, + ), + ], +) +def test_wait_for_job_status(local_backend, test_case): + """Test wait_for_job_status method with various scenarios.""" + print("Executing test:", test_case.name) + + # Setup a job if testing success case + if test_case.expected_status == SUCCESS: + mock_job = create_local_job(status=constants.TRAINJOB_RUNNING) + backend_job = create_local_backend_job( + name=test_case.config["name"], + steps=[LocalBackendStep(step_name="train", job=mock_job)], + ) + local_backend._LocalProcessBackend__local_jobs.append(backend_job) + + try: + 
with patch.object(local_backend, "get_job") as mock_get_job: + mock_train_job = create_train_job_type(name=test_case.config["name"]) + mock_get_job.return_value = mock_train_job + + result = local_backend.wait_for_job_status(**test_case.config) + + assert test_case.expected_status == SUCCESS + assert result == mock_train_job + mock_get_job.assert_called_once_with(test_case.config["name"]) + + except Exception as e: + assert test_case.expected_status == FAILED + assert type(e) is test_case.expected_error + assert "No TrainJob with name" in str(e) + + print("test execution complete") + + +@pytest.mark.parametrize( + "test_case", + [ + TestCase( + name="delete existing job", + expected_status=SUCCESS, + config={"name": BASIC_TRAIN_JOB_NAME}, + ), + TestCase( + name="delete non-existent job", + expected_status=FAILED, + config={"name": "non-existent-job"}, + expected_error=ValueError, + ), + ], +) +def test_delete_job(local_backend, test_case): + """Test delete_job method with various scenarios.""" + print("Executing test:", test_case.name) + + # Setup a job if testing success case + if test_case.expected_status == SUCCESS: + backend_job = create_local_backend_job(name=test_case.config["name"]) + local_backend._LocalProcessBackend__local_jobs.append(backend_job) + initial_count = len(local_backend._LocalProcessBackend__local_jobs) + + try: + local_backend.delete_job(**test_case.config) + + assert test_case.expected_status == SUCCESS + # Verify job was removed + assert len(local_backend._LocalProcessBackend__local_jobs) == initial_count - 1 + + except Exception as e: + assert test_case.expected_status == FAILED + assert type(e) is test_case.expected_error + assert "No TrainJob with name" in str(e) + + print("test execution complete") + + +@pytest.mark.parametrize( + "test_case", + [ + TestCase( + name="job status with failed step", + expected_status=SUCCESS, + config={"statuses": [constants.TRAINJOB_FAILED, constants.TRAINJOB_COMPLETE]}, + expected_output=constants.TRAINJOB_FAILED, + ), + TestCase( + name="job status with running step", + expected_status=SUCCESS, + config={"statuses": [constants.TRAINJOB_RUNNING, constants.TRAINJOB_COMPLETE]}, + expected_output=constants.TRAINJOB_RUNNING, + ), + TestCase( + name="job status with created step", + expected_status=SUCCESS, + config={"statuses": [constants.TRAINJOB_CREATED]}, + expected_output=constants.TRAINJOB_CREATED, + ), + TestCase( + name="job status with unknown step", + expected_status=SUCCESS, + config={"statuses": ["unknown_status"]}, + expected_output=constants.TRAINJOB_CREATED, + ), + ], +) +def test_get_job_status(local_backend, test_case): + """Test private __get_job_status method with various scenarios.""" + print("Executing test:", test_case.name) + + # Create mock steps with the specified statuses + steps = [] + for status in test_case.config["statuses"]: + mock_job = create_local_job(status=status) + steps.append(LocalBackendStep(step_name=f"step-{status}", job=mock_job)) + + backend_job = create_local_backend_job(steps=steps) + + try: + status = local_backend._LocalProcessBackend__get_job_status(backend_job) + + assert test_case.expected_status == SUCCESS + assert status == test_case.expected_output + + except Exception as e: + assert test_case.expected_status == FAILED + assert type(e) is test_case.expected_error + + print("test execution complete") + + +def test_register_job_scenarios(local_backend): + """Test __register_job method with various scenarios.""" + print("Testing job registration scenarios") + + mock_job1 = 
create_local_job(name="job1") + mock_job2 = create_local_job(name="job2") + runtime = create_mock_runtime() + + # Test new job registration + local_backend._LocalProcessBackend__register_job( + train_job_name="new-job", + step_name="train", + job=mock_job1, + runtime=runtime, + ) + + assert len(local_backend._LocalProcessBackend__local_jobs) == 1 + registered_job = local_backend._LocalProcessBackend__local_jobs[0] + assert registered_job.name == "new-job" + assert len(registered_job.steps) == 1 + assert registered_job.steps[0].step_name == "train" + + # Test adding step to existing job + local_backend._LocalProcessBackend__register_job( + train_job_name="new-job", + step_name="validate", + job=mock_job2, + runtime=runtime, + ) + + assert len(local_backend._LocalProcessBackend__local_jobs) == 1 + assert len(registered_job.steps) == 2 + + # Test duplicate step warning + with patch("kubeflow.trainer.backends.localprocess.backend.logger") as mock_logger: + local_backend._LocalProcessBackend__register_job( + train_job_name="new-job", + step_name="train", + job=mock_job1, + runtime=runtime, + ) + mock_logger.warning.assert_called_once_with("Step 'train' already registered.") + + print("Job registration tests complete") + + +def test_convert_local_runtime_to_runtime(local_backend): + """Test __convert_local_runtime_to_runtime method.""" + print("Testing runtime conversion") + + # Use the first local runtime from constants + local_runtime = local_runtimes[0] + + converted_runtime = local_backend._LocalProcessBackend__convert_local_runtime_to_runtime( + local_runtime + ) + + assert isinstance(converted_runtime, types.Runtime) + assert converted_runtime.name == local_runtime.name + assert converted_runtime.trainer.framework == local_runtime.trainer.framework + assert converted_runtime.trainer.num_nodes == local_runtime.trainer.num_nodes + assert converted_runtime.trainer.device == local_runtime.trainer.device + assert converted_runtime.trainer.device_count == local_runtime.trainer.device_count + assert converted_runtime.pretrained_model == local_runtime.pretrained_model + + print("Runtime conversion test complete") \ No newline at end of file From c4c7883ae6f4c79c3cbc4259a0bebe48ff90eb81 Mon Sep 17 00:00:00 2001 From: Saad Zaher Date: Mon, 15 Sep 2025 13:21:36 +0100 Subject: [PATCH 2/2] fix ruff formatting Signed-off-by: Saad Zaher --- .../backends/localprocess/backend_test.py | 132 +++++++++--------- 1 file changed, 66 insertions(+), 66 deletions(-) diff --git a/kubeflow/trainer/backends/localprocess/backend_test.py b/kubeflow/trainer/backends/localprocess/backend_test.py index e1fa22612..5ad38d936 100644 --- a/kubeflow/trainer/backends/localprocess/backend_test.py +++ b/kubeflow/trainer/backends/localprocess/backend_test.py @@ -19,13 +19,9 @@ across job creation, management, and lifecycle operations using local subprocess execution. 
""" -import random -import string -import tempfile -import uuid -from dataclasses import asdict, dataclass, field +from dataclasses import dataclass, field from datetime import datetime -from typing import Any, Optional, Set, Type +from typing import Any, Optional, Type from unittest.mock import Mock, patch import pytest @@ -45,6 +41,7 @@ @dataclass class TestCase: """Test case configuration for parametrized tests.""" + name: str expected_status: str config: dict[str, Any] = field(default_factory=dict) @@ -70,6 +67,7 @@ class TestCase: # Fixtures # -------------------------- + @pytest.fixture def local_backend(): """Provide a LocalProcessBackend instance for testing.""" @@ -81,6 +79,7 @@ def local_backend(): # Object Creators # -------------------------- + def create_mock_runtime( name: str = TORCH_RUNTIME, framework: str = "torch", @@ -110,7 +109,7 @@ def create_mock_trainer( packages = ["torch", "numpy"] if env is None: env = {"ENV_VAR": "test_value"} - + return types.CustomTrainer( func=lambda: print(func_name), func_args={"param1": "value1"}, @@ -149,7 +148,7 @@ def create_local_backend_job( if steps is None: mock_job = create_local_job() steps = [LocalBackendStep(step_name="train", job=mock_job)] - + return LocalBackendJobs( name=name, runtime=runtime, @@ -166,7 +165,7 @@ def create_train_job_type( """Create a mock TrainJob object for testing.""" if runtime is None: runtime = create_mock_runtime() - + return types.TrainJob( name=name, creation_timestamp=datetime.now(), @@ -189,6 +188,7 @@ def create_train_job_type( # Tests # -------------------------- + def test_init(): """Test LocalProcessBackend initialization.""" config = LocalProcessBackendConfig(cleanup_venv=False) @@ -233,11 +233,11 @@ def test_get_runtime(local_backend, test_case): print("Executing test:", test_case.name) try: runtime = local_backend.get_runtime(**test_case.config) - + assert test_case.expected_status == SUCCESS assert isinstance(runtime, types.Runtime) assert runtime.name == test_case.config["name"] - + except Exception as e: assert test_case.expected_status == FAILED assert type(e) is test_case.expected_error @@ -275,11 +275,11 @@ def test_get_runtime_packages(local_backend, test_case): print("Executing test:", test_case.name) try: packages = local_backend.get_runtime_packages(**test_case.config) - + assert test_case.expected_status == SUCCESS assert isinstance(packages, list) assert "torch" in packages - + except Exception as e: assert test_case.expected_status == FAILED assert type(e) is test_case.expected_error @@ -325,36 +325,36 @@ def test_train( ): """Test train method with various scenarios.""" print("Executing test:", test_case.name) - + # Setup mocks mock_random_choice.return_value = "a" mock_uuid.return_value.hex = "mock-uuid-hex" mock_mkdtemp.return_value = TEST_VENV_DIR - + mock_local_job = create_local_job(name="amock-uuid-h-train") mock_local_job_class.return_value = mock_local_job - + mock_local_utils.get_local_runtime_trainer.return_value = Mock() mock_local_utils.get_local_train_job_script.return_value = ["python", "script.py"] - + try: job_name = local_backend.train(**test_case.config) - + assert test_case.expected_status == SUCCESS assert job_name == "amock-uuid-h" assert len(local_backend._LocalProcessBackend__local_jobs) == 1 - + # Verify mock calls mock_mkdtemp.assert_called_once() mock_local_utils.get_local_runtime_trainer.assert_called_once() mock_local_utils.get_local_train_job_script.assert_called_once() mock_local_job.start.assert_called_once() - + except Exception as e: assert 
test_case.expected_status == FAILED assert type(e) is test_case.expected_error assert "CustomTrainer must be set" in str(e) - + print("test execution complete") @@ -382,30 +382,30 @@ def test_train( def test_list_jobs(local_backend, test_case): """Test list_jobs method with various scenarios.""" print("Executing test:", test_case.name) - + # Setup jobs if requested if test_case.config.get("setup_jobs"): backend_job = create_local_backend_job() local_backend._LocalProcessBackend__local_jobs.append(backend_job) - + try: runtime_filter = test_case.config.get("runtime") jobs = local_backend.list_jobs(runtime=runtime_filter) - + assert test_case.expected_status == SUCCESS assert isinstance(jobs, list) - + if test_case.config.get("setup_jobs"): assert len(jobs) >= 1 for job in jobs: assert isinstance(job, types.TrainJob) else: assert jobs == test_case.expected_output - + except Exception as e: assert test_case.expected_status == FAILED assert type(e) is test_case.expected_error - + print("test execution complete") @@ -428,12 +428,12 @@ def test_list_jobs(local_backend, test_case): def test_get_job(local_backend, test_case): """Test get_job method with various scenarios.""" print("Executing test:", test_case.name) - + # Setup a job if testing success case if test_case.expected_status == SUCCESS: backend_job = create_local_backend_job(name=test_case.config["name"]) local_backend._LocalProcessBackend__local_jobs.append(backend_job) - + try: with patch.object( local_backend, @@ -441,16 +441,16 @@ def test_get_job(local_backend, test_case): return_value=constants.TRAINJOB_COMPLETE, ): job = local_backend.get_job(**test_case.config) - + assert test_case.expected_status == SUCCESS assert isinstance(job, types.TrainJob) assert job.name == test_case.config["name"] - + except Exception as e: assert test_case.expected_status == FAILED assert type(e) is test_case.expected_error assert "No TrainJob with name" in str(e) - + print("test execution complete") @@ -486,23 +486,23 @@ def test_get_job(local_backend, test_case): def test_get_job_logs(local_backend, test_case): """Test get_job_logs method with various scenarios.""" print("Executing test:", test_case.name) - + # Setup a job if testing success case if test_case.expected_status == SUCCESS: backend_job = create_local_backend_job(name=test_case.config["name"]) local_backend._LocalProcessBackend__local_jobs.append(backend_job) - + try: logs = list(local_backend.get_job_logs(**test_case.config)) - + assert test_case.expected_status == SUCCESS assert logs == test_case.expected_output - + except Exception as e: assert test_case.expected_status == FAILED assert type(e) is test_case.expected_error assert "No TrainJob with name" in str(e) - + print("test execution complete") @@ -535,7 +535,7 @@ def test_get_job_logs(local_backend, test_case): def test_wait_for_job_status(local_backend, test_case): """Test wait_for_job_status method with various scenarios.""" print("Executing test:", test_case.name) - + # Setup a job if testing success case if test_case.expected_status == SUCCESS: mock_job = create_local_job(status=constants.TRAINJOB_RUNNING) @@ -544,23 +544,23 @@ def test_wait_for_job_status(local_backend, test_case): steps=[LocalBackendStep(step_name="train", job=mock_job)], ) local_backend._LocalProcessBackend__local_jobs.append(backend_job) - + try: with patch.object(local_backend, "get_job") as mock_get_job: mock_train_job = create_train_job_type(name=test_case.config["name"]) mock_get_job.return_value = mock_train_job - + result = 
local_backend.wait_for_job_status(**test_case.config) - + assert test_case.expected_status == SUCCESS assert result == mock_train_job mock_get_job.assert_called_once_with(test_case.config["name"]) - + except Exception as e: assert test_case.expected_status == FAILED assert type(e) is test_case.expected_error assert "No TrainJob with name" in str(e) - + print("test execution complete") @@ -583,25 +583,25 @@ def test_wait_for_job_status(local_backend, test_case): def test_delete_job(local_backend, test_case): """Test delete_job method with various scenarios.""" print("Executing test:", test_case.name) - + # Setup a job if testing success case if test_case.expected_status == SUCCESS: backend_job = create_local_backend_job(name=test_case.config["name"]) local_backend._LocalProcessBackend__local_jobs.append(backend_job) initial_count = len(local_backend._LocalProcessBackend__local_jobs) - + try: local_backend.delete_job(**test_case.config) - + assert test_case.expected_status == SUCCESS # Verify job was removed assert len(local_backend._LocalProcessBackend__local_jobs) == initial_count - 1 - + except Exception as e: assert test_case.expected_status == FAILED assert type(e) is test_case.expected_error assert "No TrainJob with name" in str(e) - + print("test execution complete") @@ -637,36 +637,36 @@ def test_delete_job(local_backend, test_case): def test_get_job_status(local_backend, test_case): """Test private __get_job_status method with various scenarios.""" print("Executing test:", test_case.name) - + # Create mock steps with the specified statuses steps = [] for status in test_case.config["statuses"]: mock_job = create_local_job(status=status) steps.append(LocalBackendStep(step_name=f"step-{status}", job=mock_job)) - + backend_job = create_local_backend_job(steps=steps) - + try: status = local_backend._LocalProcessBackend__get_job_status(backend_job) - + assert test_case.expected_status == SUCCESS assert status == test_case.expected_output - + except Exception as e: assert test_case.expected_status == FAILED assert type(e) is test_case.expected_error - + print("test execution complete") def test_register_job_scenarios(local_backend): """Test __register_job method with various scenarios.""" print("Testing job registration scenarios") - + mock_job1 = create_local_job(name="job1") mock_job2 = create_local_job(name="job2") runtime = create_mock_runtime() - + # Test new job registration local_backend._LocalProcessBackend__register_job( train_job_name="new-job", @@ -674,13 +674,13 @@ def test_register_job_scenarios(local_backend): job=mock_job1, runtime=runtime, ) - + assert len(local_backend._LocalProcessBackend__local_jobs) == 1 registered_job = local_backend._LocalProcessBackend__local_jobs[0] assert registered_job.name == "new-job" assert len(registered_job.steps) == 1 assert registered_job.steps[0].step_name == "train" - + # Test adding step to existing job local_backend._LocalProcessBackend__register_job( train_job_name="new-job", @@ -688,10 +688,10 @@ def test_register_job_scenarios(local_backend): job=mock_job2, runtime=runtime, ) - + assert len(local_backend._LocalProcessBackend__local_jobs) == 1 assert len(registered_job.steps) == 2 - + # Test duplicate step warning with patch("kubeflow.trainer.backends.localprocess.backend.logger") as mock_logger: local_backend._LocalProcessBackend__register_job( @@ -701,21 +701,21 @@ def test_register_job_scenarios(local_backend): runtime=runtime, ) mock_logger.warning.assert_called_once_with("Step 'train' already registered.") - + print("Job 
registration tests complete") def test_convert_local_runtime_to_runtime(local_backend): """Test __convert_local_runtime_to_runtime method.""" print("Testing runtime conversion") - + # Use the first local runtime from constants local_runtime = local_runtimes[0] - + converted_runtime = local_backend._LocalProcessBackend__convert_local_runtime_to_runtime( local_runtime ) - + assert isinstance(converted_runtime, types.Runtime) assert converted_runtime.name == local_runtime.name assert converted_runtime.trainer.framework == local_runtime.trainer.framework @@ -723,5 +723,5 @@ def test_convert_local_runtime_to_runtime(local_backend): assert converted_runtime.trainer.device == local_runtime.trainer.device assert converted_runtime.trainer.device_count == local_runtime.trainer.device_count assert converted_runtime.pretrained_model == local_runtime.pretrained_model - - print("Runtime conversion test complete") \ No newline at end of file + + print("Runtime conversion test complete")
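
As a companion sketch (Python, not part of either patch): the new Makefile target derives its coverage module list from the test files with a find/sed pipeline, and the same mapping can be reproduced in code. The helper name coverage_modules below is illustrative, not something the patch adds.

from pathlib import Path


def coverage_modules(root: str = "kubeflow") -> list[str]:
    """Mirror the Makefile pipeline: map each *_test.py to the module it covers."""
    modules = []
    for test_file in sorted(Path(root).rglob("*_test.py")):
        # backend_test.py -> backend.py, then path separators -> dots, e.g.
        # kubeflow/trainer/backends/localprocess/backend.py
        #   -> kubeflow.trainer.backends.localprocess.backend
        source = test_file.with_name(test_file.name.replace("_test.py", ".py"))
        modules.append(".".join(source.with_suffix("").parts))
    return modules


print(",".join(coverage_modules()))  # same string the Makefile passes to --source

With this series applied and run from the repository root, the output should include kubeflow.trainer.backends.localprocess.backend alongside the existing kubernetes backend and utils modules, matching the "Coverage sources" line echoed by make test-python.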