Skip to content

Commit 3a7574c

Browse files
arcticflyclaude and Claude Opus 4.6 authored
feat: add provenance tracking to training backends (#551)
* feat: add provenance tracking to LocalBackend and ServerlessBackend training

  Records the training technique ("local-rl" or "serverless-rl") in the W&B run
  config at the start of each train() call, enabling downstream consumers to
  understand how a model was trained and to detect technique changes over its
  lifecycle.

* chore: move test_provenance to tests/integration/

* fix: resolve type errors and formatting in test_provenance

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
1 parent 520aba6 commit 3a7574c

File tree

6 files changed

+129
-14
lines changed

6 files changed

+129
-14
lines changed

src/art/local/backend.py

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,7 @@
2424
get_output_dir_from_model_properties,
2525
get_step_checkpoint_dir,
2626
)
27+
from art.utils.record_provenance import record_provenance
2728
from art.utils.s3 import (
2829
ExcludableOption,
2930
pull_model_from_s3,
@@ -459,6 +460,11 @@ async def train( # type: ignore[override]
459460
"""
460461
groups_list = list(trajectory_groups)
461462

463+
# Record provenance in W&B
464+
wandb_run = model._get_wandb_run()
465+
if wandb_run is not None:
466+
record_provenance(wandb_run, "local-rl")
467+
462468
# Build config objects from explicit kwargs
463469
config = TrainConfig(learning_rate=learning_rate, beta=beta)
464470
dev_config: dev.TrainConfig = {

src/art/preprocessing/tokenize.py

Lines changed: 7 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,11 @@
1-
import math
2-
import random
31
from dataclasses import dataclass
42
from itertools import takewhile
3+
import math
4+
import random
55
from typing import Any, Generator, cast
66

7-
import torch
87
from PIL import Image
8+
import torch
99
from transformers.image_processing_utils import BaseImageProcessor
1010
from transformers.tokenization_utils_base import PreTrainedTokenizerBase
1111

@@ -167,8 +167,7 @@ def tokenize_trajectory(
167167
):
168168
last_assistant_index = i
169169
elif not isinstance(message, dict) and (
170-
message.logprobs
171-
or allow_training_without_logprobs # ty:ignore[possibly-missing-attribute]
170+
message.logprobs or allow_training_without_logprobs # ty:ignore[possibly-missing-attribute]
172171
):
173172
last_assistant_index = i
174173
# If there are no trainable assistant messages, return None
@@ -241,9 +240,7 @@ def tokenize_trajectory(
241240
continue
242241
if not allow_training_without_logprobs:
243242
continue
244-
elif (
245-
message.logprobs is None and not allow_training_without_logprobs
246-
): # ty:ignore[possibly-missing-attribute]
243+
elif message.logprobs is None and not allow_training_without_logprobs: # ty:ignore[possibly-missing-attribute]
247244
continue
248245
start = token_ids.index(sentinal_token_id)
249246
end = start + 1
@@ -268,16 +265,12 @@ def tokenize_trajectory(
268265
assistant_mask[start:end] = [1] * len(content_token_ids)
269266
else:
270267
choice = message
271-
assert (
272-
choice.logprobs or allow_training_without_logprobs
273-
), ( # ty:ignore[possibly-missing-attribute]
268+
assert choice.logprobs or allow_training_without_logprobs, ( # ty:ignore[possibly-missing-attribute]
274269
"Chat completion choices must have logprobs"
275270
)
276271
if not choice.logprobs: # ty:ignore[possibly-missing-attribute]
277272
continue
278-
token_logprobs = (
279-
choice.logprobs.content or choice.logprobs.refusal or []
280-
) # ty:ignore[possibly-missing-attribute]
273+
token_logprobs = choice.logprobs.content or choice.logprobs.refusal or [] # ty:ignore[possibly-missing-attribute]
281274
if (
282275
bytes(token_logprobs[0].bytes or []).decode("utf-8")
283276
== "<think>"

src/art/serverless/backend.py

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -11,6 +11,7 @@
1111
from ..backend import AnyTrainableModel, Backend
1212
from ..trajectories import TrajectoryGroup
1313
from ..types import ServerlessTrainResult, TrainConfig
14+
from ..utils.record_provenance import record_provenance
1415

1516
if TYPE_CHECKING:
1617
import wandb
@@ -209,6 +210,11 @@ async def train( # type: ignore[override]
209210
"""
210211
groups_list = list(trajectory_groups)
211212

213+
# Record provenance in W&B
214+
wandb_run = model._get_wandb_run()
215+
if wandb_run is not None:
216+
record_provenance(wandb_run, "serverless-rl")
217+
212218
# Build config objects from explicit kwargs
213219
config = TrainConfig(learning_rate=learning_rate, beta=beta)
214220
dev_config: dev.TrainConfig = {

src/art/utils/__init__.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4,10 +4,12 @@
44
from .iterate_dataset import iterate_dataset
55
from .limit_concurrency import limit_concurrency
66
from .log_http_errors import log_http_errors
7+
from .record_provenance import record_provenance
78
from .retry import retry
89

910
__all__ = [
1011
"format_message",
12+
"record_provenance",
1113
"retry",
1214
"iterate_dataset",
1315
"limit_concurrency",

src/art/utils/record_provenance.py

Lines changed: 17 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,17 @@
from __future__ import annotations

from typing import TYPE_CHECKING

if TYPE_CHECKING:
    import wandb


def record_provenance(run: wandb.Run, provenance: str) -> None:
    """Record a training technique in the run's ``provenance`` config list.

    Appends *provenance* to ``run.config["provenance"]`` so that the most
    recent technique is always the last element, while consecutive identical
    techniques are deduplicated (repeated ``train()`` calls with the same
    backend do not grow the list).

    Args:
        run: The active W&B run whose config is updated.
        provenance: Technique identifier, e.g. ``"local-rl"`` or
            ``"serverless-rl"``.
    """
    if "provenance" in run.config:
        existing = list(run.config["provenance"])
        # Guard against an empty stored list (previously raised IndexError on
        # existing[-1]); only write back when the technique actually changed.
        if not existing or existing[-1] != provenance:
            existing.append(provenance)
            run.config.update({"provenance": existing})
    else:
        run.config.update({"provenance": [provenance]})
tests/integration/test_provenance.py

Lines changed: 91 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,91 @@
1+
"""Integration test: verify provenance tracking in W&B run config via ServerlessBackend."""
2+
3+
import asyncio
4+
from datetime import datetime
5+
6+
from dotenv import load_dotenv
7+
8+
import art
9+
from art.serverless.backend import ServerlessBackend
10+
11+
load_dotenv()
12+
13+
14+
async def simple_rollout(model: art.TrainableModel) -> art.Trajectory:
    """Minimal rollout that produces a single turn with a reward."""
    trajectory = art.Trajectory(
        messages_and_choices=[
            {"role": "system", "content": "Reply with exactly 'hello'."},
        ],
        reward=0.0,
    )

    # Request one short completion from the model under test.
    response = await model.openai_client().chat.completions.create(
        model=model.get_inference_name(),
        messages=trajectory.messages(),
        max_completion_tokens=16,
        timeout=30,
    )
    choice = response.choices[0]
    trajectory.messages_and_choices.append(choice)

    # Reward 1.0 only for an exact (trimmed, case-insensitive) "hello".
    reply = (choice.message.content or "").strip().lower()
    trajectory.reward = 1.0 if reply == "hello" else 0.0
    return trajectory
37+
38+
39+
async def make_group(model: art.TrainableModel) -> art.TrajectoryGroup:
    """Build a trajectory group of four rollout coroutines for *model*."""
    rollouts = [simple_rollout(model) for _ in range(4)]
    return art.TrajectoryGroup(rollouts)
41+
42+
43+
async def main() -> None:
    """Run two train() calls against ServerlessBackend and assert the W&B
    run config records provenance exactly once, with no duplicate entry."""
    backend = ServerlessBackend()

    # Unique model name per invocation so repeated test runs don't collide.
    model = art.TrainableModel(
        name=f"provenance-test-{datetime.now().strftime('%Y%m%d-%H%M%S')}",
        project="provenance-test",
        base_model="OpenPipe/Qwen3-14B-Instruct",
    )
    await model.register(backend)

    # --- Step 1: first training call ---
    groups = await art.gather_trajectory_groups(make_group(model) for _ in range(1))
    result = await backend.train(model, groups)
    await model.log(groups, metrics=result.metrics, step=result.step, split="train")

    # Check provenance after first train call
    run = model._get_wandb_run()
    assert run is not None, "W&B run should exist"
    provenance = run.config.get("provenance")
    print(f"After step 1: provenance = {provenance}")
    assert provenance == ["serverless-rl"], (
        f"Expected ['serverless-rl'], got {provenance}"
    )

    # --- Step 2: second training call (same technique, should NOT duplicate) ---
    # Provenance is recorded at the start of train(), before the remote call,
    # so we can verify deduplication even if the server-side training fails.
    groups2 = await art.gather_trajectory_groups(make_group(model) for _ in range(1))
    try:
        result2 = await backend.train(model, groups2)
        await model.log(
            groups2, metrics=result2.metrics, step=result2.step, split="train"
        )
    except RuntimeError as e:
        # Best-effort: a transient server failure doesn't invalidate the check
        # below, since provenance was already written before the remote call.
        print(f"Step 2 training failed (transient server error, OK for this test): {e}")

    provenance = run.config.get("provenance")
    print(f"After step 2: provenance = {provenance}")
    assert provenance == ["serverless-rl"], (
        f"Expected ['serverless-rl'] (no duplicate), got {provenance}"
    )

    print("\nAll provenance checks passed!")

    await backend.close()
88+
89+
90+
# Allow running this integration test directly as a script.
if __name__ == "__main__":
    asyncio.run(main())

0 commit comments

Comments (0)