Expose attributes for metrics in log_metric. Add example notebook for trainer callback.

monoxgas · monoxgas · commit ad29db0cab3d · 2025-04-27T17:36:56.000-07:00
diff --git a/dreadnode/main.py b/dreadnode/main.py
@@ -48,6 +48,7 @@
 )
 from dreadnode.types import (
     AnyDict,
+    JsonDict,
     JsonValue,
 )
 from dreadnode.util import handle_internal_errors
@@ -759,6 +760,7 @@ def log_metric(
         origin: t.Any | None = None,
         timestamp: datetime | None = None,
         mode: MetricAggMode | None = None,
+        attributes: JsonDict | None = None,
         to: ToObject = "task-or-run",
     ) -> None:
         """
@@ -788,6 +790,7 @@ def log_metric(
                 - avg: the average of all reported values for this metric
                 - sum: the cumulative sum of all reported values for this metric
                 - count: increment every time this metric is logged - disregard value
+            attributes: A dictionary of additional attributes to attach to the metric.
             to: The target object to log the metric to. Can be "task-or-run" or "run".
                 Defaults to "task-or-run". If "task-or-run", the metric will be logged
                 to the current task or run, whichever is the nearest ancestor.
@@ -842,6 +845,7 @@ def log_metric(
         origin: t.Any | None = None,
         timestamp: datetime | None = None,
         mode: MetricAggMode | None = None,
+        attributes: JsonDict | None = None,
         to: ToObject = "task-or-run",
     ) -> None:
         task = current_task_span.get()
@@ -854,7 +858,9 @@ def log_metric(
         metric = (
             value
             if isinstance(value, Metric)
-            else Metric(float(value), step, timestamp or datetime.now(timezone.utc))
+            else Metric(
+                float(value), step, timestamp or datetime.now(timezone.utc), attributes or {}
+            )
         )
         target.log_metric(key, metric, origin=origin, mode=mode)
 
diff --git a/dreadnode/tracing/span.py b/dreadnode/tracing/span.py
@@ -527,6 +527,7 @@ def log_metric(
         origin: t.Any | None = None,
         timestamp: datetime | None = None,
         mode: MetricAggMode | None = None,
+        attributes: JsonDict | None = None,
     ) -> None: ...
 
     @t.overload
@@ -548,11 +549,14 @@ def log_metric(
         origin: t.Any | None = None,
         timestamp: datetime | None = None,
         mode: MetricAggMode | None = None,
+        attributes: JsonDict | None = None,
     ) -> None:
         metric = (
             value
             if isinstance(value, Metric)
-            else Metric(float(value), step, timestamp or datetime.now(timezone.utc))
+            else Metric(
+                float(value), step, timestamp or datetime.now(timezone.utc), attributes or {}
+            )
         )
 
         if origin is not None:
@@ -740,6 +744,7 @@ def log_metric(
         origin: t.Any | None = None,
         timestamp: datetime | None = None,
         mode: MetricAggMode | None = None,
+        attributes: JsonDict | None = None,
     ) -> None: ...
 
     @t.overload
@@ -761,11 +766,14 @@ def log_metric(
         origin: t.Any | None = None,
         timestamp: datetime | None = None,
         mode: MetricAggMode | None = None,
+        attributes: JsonDict | None = None,
     ) -> None:
         metric = (
             value
             if isinstance(value, Metric)
-            else Metric(float(value), step, timestamp or datetime.now(timezone.utc))
+            else Metric(
+                float(value), step, timestamp or datetime.now(timezone.utc), attributes or {}
+            )
         )
 
         if origin is not None:
diff --git a/examples/model_training.ipynb b/examples/model_training.ipynb
@@ -0,0 +1,118 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Model Training Callbacks\n",
+    "\n",
+    "You can use the library to log your model training progress to Strikes.\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import dreadnode as dn\n",
+    "\n",
+    "dn.configure(\n",
+    "    token=\"<YOUR API KEY>\", # Replace with your token\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from datasets import load_dataset\n",
+    "from transformers import AutoModelForSequenceClassification, AutoTokenizer\n",
+    "\n",
+    "# Load dataset\n",
+    "dataset = load_dataset(\"glue\", \"sst2\")\n",
+    "tokenizer = AutoTokenizer.from_pretrained(\"distilbert-base-uncased\")\n",
+    "\n",
+    "# Take a small portion of the dataset\n",
+    "dataset[\"train\"] = dataset[\"train\"].select(range(1000))\n",
+    "dataset[\"validation\"] = dataset[\"validation\"].select(range(1000))\n",
+    "\n",
+    "# Preprocessing function\n",
+    "def preprocess_function(examples):\n",
+    "    return tokenizer(examples[\"sentence\"], truncation=True, padding=\"max_length\")\n",
+    "\n",
+    "# Tokenize the dataset\n",
+    "tokenized_datasets = dataset.map(preprocess_function, batched=True)\n",
+    "\n",
+    "# Load model\n",
+    "model = AutoModelForSequenceClassification.from_pretrained(\"distilbert-base-uncased\", num_labels=2)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from transformers import Trainer, TrainingArguments\n",
+    "\n",
+    "from dreadnode.integrations.transformers import DreadnodeCallback\n",
+    "import dreadnode as dn\n",
+    "\n",
+    "# Define training arguments\n",
+    "training_args = TrainingArguments(\n",
+    "    output_dir=\"./results\",\n",
+    "    learning_rate=2e-5,\n",
+    "    per_device_train_batch_size=6,\n",
+    "    per_device_eval_batch_size=6,\n",
+    "    num_train_epochs=5,\n",
+    "    weight_decay=0.01,\n",
+    "    eval_strategy=\"steps\",\n",
+    "    eval_steps=5,\n",
+    "    load_best_model_at_end=False,\n",
+    "    push_to_hub=False,\n",
+    "    run_name=\"distilbert-sst2-demo\",\n",
+    ")\n",
+    "\n",
+    "# Initialize Trainer with DreadnodeCallback\n",
+    "trainer = Trainer(\n",
+    "    model=model,\n",
+    "    args=training_args,\n",
+    "    train_dataset=tokenized_datasets[\"train\"],\n",
+    "    eval_dataset=tokenized_datasets[\"validation\"],\n",
+    "    tokenizer=tokenizer,\n",
+    "    callbacks=[DreadnodeCallback(project=\"training\")],\n",
+    ")\n",
+    "\n",
+    "# Train the model\n",
+    "trainer.train()\n",
+    "\n",
+    "# Evaluate the model\n",
+    "trainer.evaluate()"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.14"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}