Skip to content

Commit 60410a7

Browse files
committed
Fix CI failures and add TF/Keras + register_model roundtrip tests
- Fix: guard pandas/numpy imports with pytest.importorskip in test_datasets.py and test_features.py (caused CI collection errors)
- Fix: add numpy/pandas to SDK unit test CI install step
- Fix: add fix/** branch trigger to test-python.yml
- Add TF/Keras detection tests to test_detect_framework.py
- Add TF serialization roundtrip test to test_serialize_model.py
- Add TF/Keras model registration test to test_models.py
- Add register_model roundtrip integration tests: sklearn, pytorch, tensorflow — verifies full pipeline (detect → serialize → codegen → exec train/infer) through the SDK abstraction layer
- Remove unnecessary _serialize_model mock from pytorch registration test (SimpleNet is now at module level, picklable by torch.save)

190 tests passing, 8 skipped.
1 parent 444db41 commit 60410a7

7 files changed

Lines changed: 249 additions & 14 deletions

File tree

.github/workflows/test-python.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@ name: Python SDK & Model Runner Tests
22

33
on:
44
push:
5-
branches: [main, "dev/**"]
5+
branches: [main, "dev/**", "fix/**"]
66
paths:
77
- "sdk/python/**"
88
- "model-runner/python/**"
@@ -44,7 +44,7 @@ jobs:
4444
- name: Install dependencies
4545
run: |
4646
pip install --upgrade pip
47-
pip install pytest pytest-cov pytest-mock pytest-timeout responses
47+
pip install pytest pytest-cov pytest-mock pytest-timeout responses numpy pandas
4848
pip install ./sdk/python
4949
5050
- name: Run SDK unit tests

tests/python/frameworks/test_detect_framework.py

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -31,6 +31,18 @@ def test_detect_pytorch(self):
3131
def test_detect_pytorch_custom_module(self, pytorch_model):
3232
assert _detect_framework(pytorch_model) == "pytorch"
3333

34+
def test_detect_tensorflow(self, tf_model):
35+
"""TensorFlow/Keras model detected as 'tensorflow'."""
36+
assert _detect_framework(tf_model) == "tensorflow"
37+
38+
def test_detect_keras_standalone(self):
39+
"""Standalone Keras 3+ model detected as 'tensorflow'."""
40+
keras = pytest.importorskip("keras")
41+
model = keras.Sequential([
42+
keras.layers.Dense(4, input_shape=(2,)),
43+
])
44+
assert _detect_framework(model) == "tensorflow"
45+
3446
@pytest.mark.parametrize("obj", ["hello", {"a": 1}, 42])
3547
def test_detect_unknown_raises(self, obj):
3648
with pytest.raises(TypeError, match="Cannot auto-detect framework"):

tests/python/frameworks/test_serialize_model.py

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -28,6 +28,25 @@ def test_serialize_pytorch(self, pytorch_model):
2828
restored = torch.load(buf, map_location="cpu", weights_only=False)
2929
assert isinstance(restored, torch.nn.Module)
3030

31+
def test_serialize_tensorflow(self, tf_model):
32+
"""TF/Keras model serialized to .keras bytes and loadable."""
33+
keras = pytest.importorskip("keras")
34+
import tempfile, os
35+
36+
data = _serialize_model(tf_model, "tensorflow")
37+
assert isinstance(data, bytes)
38+
assert len(data) > 0
39+
# Roundtrip: write to temp file and load back
40+
tmpfile = tempfile.mktemp(suffix=".keras")
41+
try:
42+
with open(tmpfile, "wb") as f:
43+
f.write(data)
44+
restored = keras.models.load_model(tmpfile)
45+
assert restored is not None
46+
finally:
47+
if os.path.exists(tmpfile):
48+
os.unlink(tmpfile)
49+
3150
def test_serialize_unsupported_raises(self):
3251
with pytest.raises(ValueError, match="Unsupported framework"):
3352
_serialize_model(object(), "unknown_framework")
Lines changed: 190 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,190 @@
1+
"""Integration test: register_model() with real model objects → verify generated code executes.
2+
3+
This is the critical test that verifies the SDK model abstraction works end-to-end:
4+
1. Pass a real model object to register_model()
5+
2. SDK auto-detects framework, serializes model, generates source code
6+
3. The generated source code is POSTed to the API
7+
4. We extract that source code and exec() it with MockModelContext
8+
5. Verify train(ctx) logs metrics and infer(ctx) produces predictions
9+
"""
10+
11+
import json
12+
import pytest
13+
import responses
14+
15+
from conftest import TEST_API_URL, TEST_PROJECT_ID, MockModelContext
16+
17+
18+
REGISTER_RESPONSE = {
19+
"model_id": "model-roundtrip-001",
20+
"name": "roundtrip-test",
21+
"version": 1,
22+
}
23+
24+
25+
class TestRegisterModelSklearnRoundtrip:
26+
"""register_model(model=sklearn_obj) → extract source → exec train/infer."""
27+
28+
def test_sklearn_register_and_train(self, client, mock_api, sklearn_model):
29+
"""Full pipeline: register sklearn model → exec generated train()."""
30+
mock_api.add(
31+
responses.POST,
32+
f"{TEST_API_URL}/sdk/register-model",
33+
json=REGISTER_RESPONSE,
34+
status=200,
35+
)
36+
client.register_model("test-sklearn", model=sklearn_model)
37+
38+
# Extract the source code that was POSTed
39+
body = json.loads(mock_api.calls[0].request.body)
40+
source_code = body["source_code"]
41+
assert body["framework"] == "sklearn"
42+
43+
# Execute the generated train() with MockModelContext
44+
ctx = MockModelContext(hyperparameters={"n_samples": 50, "n_features": 4})
45+
ns = {}
46+
exec(source_code, ns)
47+
ns["train"](ctx)
48+
49+
metric_names = [m[0] for m in ctx._logged_metrics]
50+
assert "accuracy" in metric_names
51+
assert "loss" in metric_names
52+
assert "progress" in metric_names
53+
# Progress should reach 100
54+
progress_values = [m[1] for m in ctx._logged_metrics if m[0] == "progress"]
55+
assert 100 in progress_values
56+
57+
def test_sklearn_register_and_infer(self, client, mock_api, sklearn_model):
58+
"""Full pipeline: register sklearn model → exec generated infer()."""
59+
mock_api.add(
60+
responses.POST,
61+
f"{TEST_API_URL}/sdk/register-model",
62+
json=REGISTER_RESPONSE,
63+
status=200,
64+
)
65+
client.register_model("test-sklearn", model=sklearn_model)
66+
67+
body = json.loads(mock_api.calls[0].request.body)
68+
source_code = body["source_code"]
69+
70+
ctx = MockModelContext(
71+
hyperparameters={"input_data": {"features": [[1.0, 2.0, 3.0, 4.0]]}}
72+
)
73+
ns = {}
74+
exec(source_code, ns)
75+
ns["infer"](ctx)
76+
77+
assert ctx._output is not None
78+
assert "predictions" in ctx._output
79+
assert isinstance(ctx._output["predictions"], list)
80+
81+
82+
class TestRegisterModelPytorchRoundtrip:
83+
"""register_model(model=pytorch_obj) → extract source → exec train/infer."""
84+
85+
pytestmark = pytest.mark.skipif(
86+
not pytest.importorskip("torch", reason="torch not installed"),
87+
reason="torch not installed",
88+
)
89+
90+
def test_pytorch_register_and_train(self, client, mock_api, pytorch_model):
91+
"""Full pipeline: register PyTorch model → exec generated train()."""
92+
mock_api.add(
93+
responses.POST,
94+
f"{TEST_API_URL}/sdk/register-model",
95+
json=REGISTER_RESPONSE,
96+
status=200,
97+
)
98+
client.register_model("test-pytorch", model=pytorch_model)
99+
100+
body = json.loads(mock_api.calls[0].request.body)
101+
source_code = body["source_code"]
102+
assert body["framework"] == "pytorch"
103+
104+
ctx = MockModelContext(hyperparameters={"epochs": 2, "batch_size": 4})
105+
ns = {}
106+
exec(source_code, ns)
107+
ns["train"](ctx)
108+
109+
metric_names = [m[0] for m in ctx._logged_metrics]
110+
assert "loss" in metric_names
111+
assert "accuracy" in metric_names
112+
assert "progress" in metric_names
113+
114+
def test_pytorch_register_and_infer(self, client, mock_api, pytorch_model):
115+
"""Full pipeline: register PyTorch model → exec generated infer()."""
116+
mock_api.add(
117+
responses.POST,
118+
f"{TEST_API_URL}/sdk/register-model",
119+
json=REGISTER_RESPONSE,
120+
status=200,
121+
)
122+
client.register_model("test-pytorch", model=pytorch_model)
123+
124+
body = json.loads(mock_api.calls[0].request.body)
125+
source_code = body["source_code"]
126+
127+
# SimpleNet has input_size=4
128+
ctx = MockModelContext(
129+
hyperparameters={"input_data": {"features": [[1.0, 2.0, 3.0, 4.0]]}}
130+
)
131+
ns = {}
132+
exec(source_code, ns)
133+
ns["infer"](ctx)
134+
135+
assert ctx._output is not None
136+
assert "predictions" in ctx._output
137+
preds = ctx._output["predictions"]
138+
assert isinstance(preds, list)
139+
assert len(preds) == 1 # one sample
140+
141+
142+
class TestRegisterModelTensorflowRoundtrip:
143+
"""register_model(model=keras_obj) → extract source → exec train/infer."""
144+
145+
def test_tensorflow_register_and_train(self, client, mock_api, tf_model):
146+
"""Full pipeline: register TF/Keras model → exec generated train()."""
147+
mock_api.add(
148+
responses.POST,
149+
f"{TEST_API_URL}/sdk/register-model",
150+
json=REGISTER_RESPONSE,
151+
status=200,
152+
)
153+
client.register_model("test-keras", model=tf_model)
154+
155+
body = json.loads(mock_api.calls[0].request.body)
156+
source_code = body["source_code"]
157+
assert body["framework"] == "tensorflow"
158+
159+
ctx = MockModelContext(hyperparameters={"epochs": 1, "n_samples": 20, "batch_size": 8})
160+
ns = {}
161+
exec(source_code, ns)
162+
ns["train"](ctx)
163+
164+
metric_names = [m[0] for m in ctx._logged_metrics]
165+
assert "loss" in metric_names
166+
assert "progress" in metric_names
167+
168+
def test_tensorflow_register_and_infer(self, client, mock_api, tf_model):
169+
"""Full pipeline: register TF/Keras model → exec generated infer()."""
170+
mock_api.add(
171+
responses.POST,
172+
f"{TEST_API_URL}/sdk/register-model",
173+
json=REGISTER_RESPONSE,
174+
status=200,
175+
)
176+
client.register_model("test-keras", model=tf_model)
177+
178+
body = json.loads(mock_api.calls[0].request.body)
179+
source_code = body["source_code"]
180+
181+
# tf_model has input_shape=(4,)
182+
ctx = MockModelContext(
183+
hyperparameters={"input_data": {"features": [[1.0, 2.0, 3.0, 4.0]]}}
184+
)
185+
ns = {}
186+
exec(source_code, ns)
187+
ns["infer"](ctx)
188+
189+
assert ctx._output is not None
190+
assert "predictions" in ctx._output

tests/python/sdk/test_datasets.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,8 @@
66
import os
77
import pytest
88
import responses
9-
import pandas as pd
9+
10+
pd = pytest.importorskip("pandas", reason="pandas not installed")
1011

1112
from openmodelstudio.client import Client
1213

tests/python/sdk/test_features.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,12 @@
11
"""Tests for Client.create_features() and Client.load_features()."""
22

33
import json
4-
import numpy as np
5-
import pandas as pd
64
import pytest
75
import responses
86

7+
np = pytest.importorskip("numpy", reason="numpy not installed")
8+
pd = pytest.importorskip("pandas", reason="pandas not installed")
9+
910
from openmodelstudio.client import Client
1011

1112
from conftest import TEST_API_URL, TEST_PROJECT_ID

tests/python/sdk/test_models.py

Lines changed: 21 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -124,26 +124,38 @@ def test_register_model_with_sklearn_object(self, client, mock_api, sklearn_mode
124124
reason="torch not available",
125125
)
126126
def test_register_model_with_pytorch_object(self, client, mock_api, pytorch_model):
127-
"""Auto-detects pytorch, serializes nn.Module, generates source with embedded blob.
128-
129-
Note: The pytorch_model fixture defines SimpleNet in a local scope,
130-
which torch.save cannot pickle. We mock _serialize_model to return
131-
dummy bytes so the rest of the registration flow can be tested.
132-
"""
127+
"""Auto-detects pytorch, serializes nn.Module, generates source with embedded blob."""
133128
mock_api.add(
134129
responses.POST,
135130
f"{TEST_API_URL}/sdk/register-model",
136131
json=REGISTER_RESPONSE,
137132
status=200,
138133
)
139-
dummy_bytes = b"fake-pytorch-model-bytes"
140-
with patch("openmodelstudio.client._serialize_model", return_value=dummy_bytes):
141-
handle = client.register_model("pytorch-net", model=pytorch_model)
134+
handle = client.register_model("pytorch-net", model=pytorch_model)
142135

143136
body = json.loads(mock_api.calls[0].request.body)
144137
assert body["framework"] == "pytorch"
145138
assert "_MODEL_B64" in body["source_code"]
146139
assert "import torch" in body["source_code"]
140+
assert "def train(ctx):" in body["source_code"]
141+
assert "def infer(ctx):" in body["source_code"]
142+
assert handle.model_id == REGISTER_RESPONSE["model_id"]
143+
144+
def test_register_model_with_tensorflow_object(self, client, mock_api, tf_model):
145+
"""Auto-detects tensorflow, serializes Keras model, generates source with embedded blob."""
146+
mock_api.add(
147+
responses.POST,
148+
f"{TEST_API_URL}/sdk/register-model",
149+
json=REGISTER_RESPONSE,
150+
status=200,
151+
)
152+
handle = client.register_model("keras-net", model=tf_model)
153+
154+
body = json.loads(mock_api.calls[0].request.body)
155+
assert body["framework"] == "tensorflow"
156+
assert "_MODEL_B64" in body["source_code"]
157+
assert "def train(ctx):" in body["source_code"]
158+
assert "def infer(ctx):" in body["source_code"]
147159
assert handle.model_id == REGISTER_RESPONSE["model_id"]
148160

149161

0 commit comments

Comments (0)