netboxlabs · arthanson · Apr 30, 2026 · Apr 23, 2026 · Apr 23, 2026 · Apr 23, 2026
diff --git a/netbox_custom_objects/migrations/0010_backfill_base_columns.py b/netbox_custom_objects/migrations/0010_backfill_base_columns.py
@@ -0,0 +1,116 @@
+"""
+Data migration: populate schema_document["base_columns"] for all existing
+CustomObjectType rows that were created before this snapshot feature existed.
+
+Strategy
+--------
+For each CustomObjectType whose schema_document does not yet contain a
+"base_columns" key:
+
+1. Introspect the actual DB table to get its current column names and
+   nullability (this reflects ground truth, not model assumptions).
+2. Subtract the names of user-defined fields (from CustomObjectTypeField) to
+   isolate the columns contributed by the CustomObject base class / mixins.
+3. Cross-reference with the live CustomObject abstract model to attach a
+   Django field_class name to each base column where possible.
+4. Write the result back to schema_document["base_columns"].
+
+The reverse migration is intentionally a no-op: rolling back would leave
+schema_document in a valid state (missing "base_columns" is the pre-feature
+default), and the forward migration is idempotent (skips rows that already
+have the key).
+
+Note: this migration intentionally imports from live plugin code (CustomObject)
+rather than using the historical ORM state.  CustomObject is an abstract base
+class, not a tracked Django model, so its field definitions are not available
+via apps.get_model().  Because CustomObject's base columns are intended to be
+stable across plugin versions, this is safe.
+"""
+
+import logging
+
+from django.conf import settings
+from django.db import migrations
+
+logger = logging.getLogger(__name__)
+
+
+def backfill_base_columns(apps, schema_editor):
+    from django.db import connection
+
+    # Import the live abstract base to get field metadata.
+    # See module docstring for rationale.
+    from netbox_custom_objects.models import CustomObject, USER_TABLE_DATABASE_NAME_PREFIX  # noqa: PLC0415
+
+    CustomObjectType = apps.get_model("netbox_custom_objects", "CustomObjectType")
+    CustomObjectTypeField = apps.get_model("netbox_custom_objects", "CustomObjectTypeField")
+
+    # Build a name → {field_class, null} map from CustomObject's abstract hierarchy.
+    # _meta.get_fields() on an abstract model returns fields declared on it and its
+    # abstract bases.  We filter to concrete fields (those with a "column" attribute).
+    base_field_info = {}
+    for f in CustomObject._meta.get_fields():
+        if hasattr(f, "column") and f.column:
+            base_field_info[f.name] = {
+                "field_class": f.__class__.__name__,
+                "null": getattr(f, "null", False),
+            }
+    # "id" comes from models.Model, which is a concrete base not tracked by
+    # CustomObject's abstract _meta; add it explicitly.  Derive the class name
+    # from DEFAULT_AUTO_FIELD so it matches whatever BigAutoField (or subclass)
+    # concrete models use — CustomObject._meta.pk is always None for abstract
+    # models, so we cannot read it from there.
+    pk_class = getattr(
+        settings, "DEFAULT_AUTO_FIELD", "django.db.models.BigAutoField"
+    ).rsplit(".", 1)[-1]
+    base_field_info.setdefault("id", {"field_class": pk_class, "null": False})
+
+    for cot in CustomObjectType.objects.all():
+        # Skip rows that already have the snapshot.
+        if cot.schema_document and "base_columns" in cot.schema_document:
+            continue
+
+        table_name = f"{USER_TABLE_DATABASE_NAME_PREFIX}{cot.id}"
+
+        user_field_names = set(
+            CustomObjectTypeField.objects.filter(custom_object_type=cot)
+            .values_list("name", flat=True)
+        )
+
+        try:
+            with connection.cursor() as cursor:
+                col_rows = connection.introspection.get_table_description(cursor, table_name)
+        except Exception as exc:
+            logger.warning(
+                "backfill_base_columns: could not introspect table %r for COT %s: %s",
+                table_name, cot.pk, exc,
+            )
+            continue
+
+        # col_rows is a list of FieldInfo namedtuples; .name and .null_ok are stable
+        # across supported Django/PostgreSQL versions.
+        base_columns = []
+        for col in sorted(col_rows, key=lambda c: c.name):
+            if col.name in user_field_names:
+                continue
+            entry = {
+                "name": col.name,
+                "field_class": base_field_info.get(col.name, {}).get("field_class", "UnknownField"),
+                "null": bool(col.null_ok),
+            }
+            base_columns.append(entry)
+
+        doc = cot.schema_document or {}
+        doc["base_columns"] = base_columns
+        CustomObjectType.objects.filter(pk=cot.pk).update(schema_document=doc)
+
+
+class Migration(migrations.Migration):
+
+    dependencies = [
+        ("netbox_custom_objects", "0009_alter_customobjecttype_version"),
+    ]
+
+    operations = [
+        migrations.RunPython(backfill_base_columns, migrations.RunPython.noop),
+    ]
diff --git a/netbox_custom_objects/models.py b/netbox_custom_objects/models.py
@@ -490,6 +490,50 @@ def _after_model_generation(self, attrs, model):
         # Store through models on the model for yielding in get_models()
         model._through_models = through_models
 
+    @staticmethod
+    def _collect_base_columns(model, user_field_names):
+        """
+        Return a list of dicts describing the concrete DB columns contributed by the
+        CustomObject base class (mixins), excluding any user-defined field names.
+
+        Each dict has keys:
+          "name"        – column/field name
+          "field_class" – Django field class name (e.g. "AutoField", "DateTimeField")
+          "null"        – whether the column is nullable (bool)
+
+        This snapshot is stored in schema_document["base_columns"] so that the
+        post_migrate auto-heal handler (issue #391, Phase 2) can detect drift when
+        NetBox upgrades add new columns to the mixin hierarchy.
+        """
+        return sorted(
+            [
+                {
+                    "name": f.name,
+                    "field_class": f.__class__.__name__,
+                    "null": f.null,
+                }
+                for f in model._meta.concrete_fields
+                if f.name not in user_field_names
+            ],
+            key=lambda e: e["name"],
+        )
+
+    def _store_base_column_snapshot(self, model):
+        """
+        Snapshot the current base columns into schema_document["base_columns"].
+
+        Called immediately after the DB table is created by create_model() so that
+        the snapshot reflects exactly what columns are present at birth.  Only the
+        "base_columns" key is written; any existing keys in schema_document
+        (e.g. "fields" written by the schema exporter) are preserved.
+        """
+        user_field_names = set(self.fields.values_list("name", flat=True))
+        base_columns = self._collect_base_columns(model, user_field_names)
+        doc = self.schema_document or {}
+        doc["base_columns"] = base_columns
+        CustomObjectType.objects.filter(pk=self.pk).update(schema_document=doc)
+        self.schema_document = doc
+
     def get_collision_safe_order_id_idx_name(self):
         return f"tbl_order_id_{self.id}_idx"
 
@@ -759,6 +803,8 @@ def create_model(self):
         with connection.schema_editor() as schema_editor:
             schema_editor.create_model(model)
 
+        self._store_base_column_snapshot(model)
+
         get_serializer_class(model)
         self.register_custom_object_search_index(model)
 

diff --git a/netbox_custom_objects/schema/executor.py b/netbox_custom_objects/schema/executor.py
@@ -501,7 +501,11 @@ def apply_diffs(
         # Finalise: persist schema_document and sync next_schema_id counters.
         for diff in ordered:
             cot = cot_map[diff.slug]
-            if diff.is_new or diff.has_changes or not cot.schema_document:
+            # Also update when schema_document exists but was set only by the
+            # base-column snapshot (lacks schema_version), so that the first
+            # apply always writes a proper executor-managed document.
+            has_executor_doc = "schema_version" in (cot.schema_document or {})
+            if diff.is_new or diff.has_changes or not has_executor_doc:
                 _update_schema_document(cot, type_defs_by_slug[diff.slug])
             _sync_next_schema_id(cot, diff)
 

diff --git a/netbox_custom_objects/tests/schema/test_format.py b/netbox_custom_objects/tests/schema/test_format.py
@@ -363,9 +363,17 @@ def test_idempotent(self):
 class SchemaDocumentFieldTestCase(CustomObjectsTestCase, TestCase):
     """schema_document and version fields on CustomObjectType."""
 
-    def test_schema_document_defaults_to_null(self):
+    def test_schema_document_populated_with_base_columns_on_creation(self):
+        # schema_document is no longer NULL after creation: create_model() writes
+        # the base_columns snapshot immediately.  Verify the expected structure.
         cot = self.create_custom_object_type(name='schemadoc', slug='schema-doc')
-        self.assertIsNone(cot.schema_document)
+        cot.refresh_from_db()
+        self.assertIsNotNone(cot.schema_document)
+        self.assertIn('base_columns', cot.schema_document)
+        names = {c['name'] for c in cot.schema_document['base_columns']}
+        self.assertIn('id', names)
+        self.assertIn('created', names)
+        self.assertIn('last_updated', names)
 
     def test_schema_document_can_store_json(self):
         cot = self.create_custom_object_type(name='schemadoc2', slug='schema-doc-2')