From 89cd5d2cd9efe3f2867b3d8c942fbeed5211bc7a Mon Sep 17 00:00:00 2001
From: misko <misko@meta.com>
Date: Tue, 23 Jun 2026 03:42:55 +0000
Subject: [PATCH] UMA: deprecate 1.0 checkpoints, back-fill model_id for 1.1

UMA checkpoint generations are inconsistently tagged: 1.0 has neither
`backbone.model_version` nor top-level `model_id`; 1.1 carries
`backbone.model_version="1.1"` but no `model_id`; 1.2 has
`model_id="UMA-S-1.2"` and no `model_version`. This change introduces
a single source of truth for UMA version identification and applies
in-place fixups at load time.

- New `fairchem.core.models.uma.compat` module exposes
  `get_uma_version()` (public classifier returning "1.0"/"1.1"/"1.2"/
  "unknown_uma"/"not_uma") and `apply_uma_compat_fixups()` (raises
  RuntimeError for 1.0, back-fills `model_id="UMA-1.1"` for 1.1).
- UMA 1.0 hard-fails with a path-specific RuntimeError pointing at
  `pip install 'fairchem-core<=2.21.0'`. Justification: the
  `eSCNMDMoeBackbone` composition-reduction `include_self` flag
  branches on `np.isclose(model_version, 1.0)`, so silent loads
  produce numerically different results.
- Fixup wired at three I/O boundaries (idempotent):
  `load_inference_model`, `MLIPPredictUnit.__init__` (before
  `maybe_update_settings_backend`), and
  `convert_train_checkpoint_to_inference_checkpoint`.
- Classifier prefers `backbone.model_version` over `model_id` so
  finetuned-from-1.1 checkpoints (which carry the back-filled
  `model_id` after the first load) are correctly re-classified as 1.1.
- Sub-size (S/M/L) is intentionally not encoded; back-fill is the bare
  "UMA-1.1".
- Tests: 22 unit tests in `tests/core/models/uma/test_compat.py`
  (DictConfig + struct-mode, registry short-name, empty/whitespace
  `model_id`, idempotency with S/M/L-suffixed forms, etc.) plus 3
  integration tests in `tests/core/units/mlip_unit/test_predict.py`
  (1.1 predict has model_id, finetune propagates the back-fill, 1.0
  raises).
- Docs/notebook sweep: retarget 10 `"uma-s-1"` references in the UMA
  tutorial + cattsunami DATASET.md to `"uma-s-1p2"`; add a
  compatibility section to `docs/core/uma_changelog.md`.
---
 docs/core/uma_changelog.md                    |  16 ++
 docs/uma_tutorials/uma_tutorial.ipynb         |  18 +-
 .../applications/cattsunami/DATASET.md        |   2 +-
 src/fairchem/core/models/uma/compat.py        | 269 ++++++++++++++++++
 .../core/units/mlip_unit/mlip_unit.py         |  19 +-
 src/fairchem/core/units/mlip_unit/predict.py  |   7 +
 src/fairchem/core/units/mlip_unit/utils.py    |   3 +
 tests/core/models/uma/test_compat.py          | 228 +++++++++++++++
 tests/core/units/mlip_unit/test_predict.py    |  42 +++
 9 files changed, 586 insertions(+), 18 deletions(-)
 create mode 100644 src/fairchem/core/models/uma/compat.py
 create mode 100644 tests/core/models/uma/test_compat.py

diff --git a/docs/core/uma_changelog.md b/docs/core/uma_changelog.md
index 64bad2b9b1..db0d378b78 100644
--- a/docs/core/uma_changelog.md
+++ b/docs/core/uma_changelog.md
@@ -17,6 +17,22 @@ This page documents the release history of UMA models, including new features, i
 
 ---
 
+## Library compatibility — UMA 1.0 deprecation
+
+UMA 1.0 checkpoints (e.g. `uma-s-1.pt`) are **no longer supported** in current `fairchem-core` releases. Loading a UMA 1.0 checkpoint raises a `RuntimeError` at load time, because UMA 1.0 has a known semantic divergence with later releases (the composition-reduction `include_self` flag in `eSCNMDMoeBackbone` branches on `np.isclose(self.model_version, 1.0)`) — silently running a UMA 1.0 checkpoint through current code would produce numerically different results than the original release.
+
+To use a UMA 1.0 checkpoint, install the last release that supports it:
+
+```bash
+pip install 'fairchem-core<=2.21.0'
+```
+
+Otherwise, switch to UMA 1.1 (`uma-s-1p1`, `uma-m-1p1`) or UMA 1.2 (`uma-s-1p2`).
+
+UMA 1.1 checkpoints ship without a top-level `model_id`. The compat shim back-fills `model_id = "UMA-1.1"` at load time so downstream consumers can dispatch on `HydraModel.model_id`. The back-fill persists into any subsequent finetune checkpoint.
+
+---
+
 ## UMA 1.2
 
 :::{admonition} Latest Release
diff --git a/docs/uma_tutorials/uma_tutorial.ipynb b/docs/uma_tutorials/uma_tutorial.ipynb
index faa65db274..43e1d17ae4 100644
--- a/docs/uma_tutorials/uma_tutorial.ipynb
+++ b/docs/uma_tutorials/uma_tutorial.ipynb
@@ -141,7 +141,7 @@
    "source": [
     "from fairchem.core import FAIRChemCalculator, pretrained_mlip\n",
     "\n",
-    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1\")"
+    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1p2\")"
    ]
   },
   {
@@ -191,7 +191,7 @@
     "from ase.optimize import LBFGS\n",
     "from fairchem.core import FAIRChemCalculator, pretrained_mlip\n",
     "\n",
-    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1\")\n",
+    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1p2\")\n",
     "calc = FAIRChemCalculator(predictor, task_name=\"oc20\")\n",
     "\n",
     "# Set up your system as an ASE atoms object\n",
@@ -227,7 +227,7 @@
     "from ase.optimize import FIRE\n",
     "from fairchem.core import FAIRChemCalculator, pretrained_mlip\n",
     "\n",
-    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1\")\n",
+    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1p2\")\n",
     "calc = FAIRChemCalculator(predictor, task_name=\"omat\")\n",
     "\n",
     "atoms = bulk(\"Fe\")\n",
@@ -262,7 +262,7 @@
     "from ase.md.langevin import Langevin\n",
     "from fairchem.core import FAIRChemCalculator, pretrained_mlip\n",
     "\n",
-    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1\")\n",
+    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1p2\")\n",
     "calc = FAIRChemCalculator(predictor, task_name=\"omol\")\n",
     "\n",
     "atoms = molecule(\"H2O\")\n",
@@ -332,7 +332,7 @@
     "from ase.optimize import BFGS\n",
     "from fairchem.core import FAIRChemCalculator, pretrained_mlip\n",
     "\n",
-    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1\")\n",
+    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1p2\")\n",
     "calc = FAIRChemCalculator(predictor, task_name=\"oc20\")"
    ]
   },
@@ -462,7 +462,7 @@
     "from ase import Atoms\n",
     "from ase.optimize import BFGS\n",
     "\n",
-    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1\")\n",
+    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1p2\")\n",
     "calc = FAIRChemCalculator(predictor, task_name=\"omol\")\n",
     "\n",
     "from ase.vibrations import Vibrations\n",
@@ -510,7 +510,7 @@
     "from ase.optimize import FIRE\n",
     "from fairchem.core import FAIRChemCalculator, pretrained_mlip\n",
     "\n",
-    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1\")\n",
+    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1p2\")\n",
     "\n",
     "cu = Atoms(\n",
     "    [Atom(\"Cu\", [0.000, 0.000, 0.000])],\n",
@@ -667,7 +667,7 @@
     "from ase.build import bulk\n",
     "from ase.phonons import Phonons\n",
     "\n",
-    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1\")\n",
+    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1p2\")\n",
     "calc = FAIRChemCalculator(predictor, task_name=\"omat\")\n",
     "\n",
     "# Setup crystal\n",
@@ -753,7 +753,7 @@
     "from ase.optimize import LBFGS\n",
     "from fairchem.core import FAIRChemCalculator, pretrained_mlip\n",
     "\n",
-    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1\")\n",
+    "predictor = pretrained_mlip.get_predict_unit(\"uma-s-1p2\")\n",
     "calc = FAIRChemCalculator(predictor, task_name=\"oc20\")\n",
     "\n",
     "# Set up your system as an ASE atoms object\n",
diff --git a/src/fairchem/applications/cattsunami/DATASET.md b/src/fairchem/applications/cattsunami/DATASET.md
index 588aa29e45..6564e06540 100644
--- a/src/fairchem/applications/cattsunami/DATASET.md
+++ b/src/fairchem/applications/cattsunami/DATASET.md
@@ -33,7 +33,7 @@ from ase.mep import DyNEB
 
 traj = read("desorption_id_83_2409_9_111-4_neb1.0.traj", ":")
 images = traj[0:10]
-predictor = pretrained_mlip.get_predict_unit("uma-s-1")
+predictor = pretrained_mlip.get_predict_unit("uma-s-1p2")
 
 neb = DyNEB(images, k=1)
 for image in images:
diff --git a/src/fairchem/core/models/uma/compat.py b/src/fairchem/core/models/uma/compat.py
new file mode 100644
index 0000000000..38a33bcd05
--- /dev/null
+++ b/src/fairchem/core/models/uma/compat.py
@@ -0,0 +1,269 @@
+"""UMA-specific checkpoint compatibility shim.
+
+This module classifies a loaded :class:`MLIPInferenceCheckpoint` by UMA
+generation and applies in-place fixups to the checkpoint's ``model_config``
+before the model is instantiated. Two concrete behaviors:
+
+* **UMA 1.0 is deprecated and raises.** UMA 1.0 has a known semantic
+  divergence with later releases (the ``include_self`` flag in the
+  composition reduction at ``escn_moe.py``'s ``set_MOLE_coefficients``
+  branches on ``np.isclose(self.model_version, 1.0)``). Silent loads
+  would produce numerically different results than UMA 1.1/1.2, so we
+  hard-fail rather than ship a deprecation cycle.
+* **UMA 1.1 gets ``model_id`` back-filled** to the constant ``"UMA-1.1"``
+  if missing. Shipped UMA 1.1 checkpoints carry ``backbone.model_version=1.1``
+  but no top-level ``model_id`` (only 1.2 does). Back-filling here makes
+  ``HydraModel.model_id`` reflect the generation for downstream consumers
+  (logging, serving, surgery scripts).
+
+Sub-size (S / M / L) is intentionally not encoded — inside a single major.minor
+release UMA variants are similar enough that downstream code does not need
+to dispatch on size. The back-fill is the bare ``"UMA-1.1"``.
+
+Call sites
+----------
+The fixup must run at every raw I/O boundary that loads a checkpoint:
+
+1. :func:`fairchem.core.units.mlip_unit.utils.load_inference_model` — the
+   generic Hydra loader (safety net for any direct caller).
+2. :class:`fairchem.core.units.mlip_unit.predict.MLIPPredictUnit` —
+   ``MLIPPredictUnit.__init__`` does its own ``torch.load`` and reads the
+   config before delegating to ``load_inference_model``. Hooking here means
+   UMA 1.0 raises before the ~1 GB tensor allocation, and downstream calls
+   see the patched config.
+3. :func:`fairchem.core.units.mlip_unit.mlip_unit.convert_train_checkpoint_to_inference_checkpoint`
+   — converts a DCP train checkpoint into a fresh inference checkpoint. The
+   fixup runs on the new ``MLIPInferenceCheckpoint`` before it is written to
+   disk, so finetune-derived inference checkpoints come out correctly tagged.
+
+:func:`apply_uma_compat_fixups` is idempotent — calling it from all three
+sites (and accidentally multiple times) is safe.
+
+Override-bypass policy
+----------------------
+The fixup runs *before* any caller-supplied ``overrides`` are merged into
+``model_config``. A user cannot bypass the UMA 1.0 gate by passing
+``overrides={"backbone": {"model_version": 1.1}}``. A user CAN, post-fixup,
+force a different ``model_id`` via ``overrides={"model_id": "MY-ID"}``.
+
+Known gaps
+----------
+* ``load_tasks`` (utils.py) does its own ``torch.load`` but only
+  instantiates tasks, not the model — out of scope for this gate.
+* ``MLIPTrainEvalUnit._execute_load_state`` resumes a DCP train run via
+  ``dcp.load`` directly into an already-instantiated model — also out of
+  scope. The first subsequent ``save_state`` routes through
+  ``convert_train_checkpoint_to_inference_checkpoint`` where the fixup
+  *does* fire, so the persisted inference checkpoint is still tagged.
+"""
+
+from __future__ import annotations
+
+import logging
+import re
+from typing import TYPE_CHECKING, Literal
+
+import numpy as np
+from omegaconf import DictConfig, OmegaConf, open_dict
+
+if TYPE_CHECKING:
+    from fairchem.core.units.mlip_unit.api.inference import MLIPInferenceCheckpoint
+
+
+UmaVersion = Literal["1.0", "1.1", "1.2", "unknown_uma", "not_uma"]
+
+UMA_1P1_MODEL_ID = "UMA-1.1"
+
+# Last fairchem-core release that supports UMA 1.0 (git describe --tags on
+# this repo: fairchem_core-2.21.0-2-g28c7f4ba6).
+_LAST_UMA_1P0_FAIRCHEM_VERSION = "2.21.0"
+
+# Accepts "UMA-1.X" or "UMA-S-1.X" / "UMA-M-1.X" / "UMA-L-1.X" historical forms.
+_UMA_MODEL_ID_RE = re.compile(r"^UMA(?:-[SML])?-1\.(\d+)$")
+
+# Hydra registry short-name for the UMA MoE backbone.
+_UMA_BACKBONE_SHORT_NAME = "escnmd_moe_backbone"
+# Suffix of the fully-qualified backbone class path used in shipped checkpoints.
+_UMA_BACKBONE_FQN_SUFFIX = "uma.escn_moe.eSCNMDMoeBackbone"
+
+
+def _is_uma_backbone(backbone_model: object) -> bool:
+    if not isinstance(backbone_model, str):
+        return False
+    if backbone_model == _UMA_BACKBONE_SHORT_NAME:
+        return True
+    if backbone_model.endswith(_UMA_BACKBONE_FQN_SUFFIX):
+        return True
+    # Defensive: resolve via the registry in case of subclasses.
+    try:
+        from fairchem.core.common.registry import registry
+        from fairchem.core.models.uma.escn_moe import eSCNMDMoeBackbone
+
+        cls = registry.get_model_class(backbone_model)
+    except Exception:
+        return False
+    return isinstance(cls, type) and issubclass(cls, eSCNMDMoeBackbone)
+
+
+def _match_version(value: object, target: float) -> bool:
+    """Return True iff ``value`` parses to a float ≈ ``target``."""
+    try:
+        return bool(np.isclose(float(value), target))
+    except (TypeError, ValueError):
+        return False
+
+
+def _normalize_model_id(value: object) -> str | None:
+    if value is None:
+        return None
+    if not isinstance(value, str):
+        return None
+    stripped = value.strip()
+    return stripped or None
+
+
+def get_uma_version(model_config: dict | DictConfig | None) -> UmaVersion:
+    """Classify a checkpoint's ``model_config`` by UMA generation.
+
+    Returns one of:
+
+    * ``"1.0"`` / ``"1.1"`` / ``"1.2"`` — a recognized UMA generation.
+    * ``"unknown_uma"`` — a UMA backbone with a ``model_id`` or
+      ``model_version`` that does not match any known generation
+      (e.g. a future UMA 1.3 release).
+    * ``"not_uma"`` — not a UMA checkpoint (esen, AllScAIP, ...), a
+      missing/corrupt ``model_config``, or no backbone declared.
+    """
+    if not isinstance(model_config, (dict, DictConfig)):
+        return "not_uma"
+
+    backbone = model_config.get("backbone", {})
+    if not isinstance(backbone, (dict, DictConfig)):
+        return "not_uma"
+
+    if not _is_uma_backbone(backbone.get("model")):
+        return "not_uma"
+
+    mid = _normalize_model_id(model_config.get("model_id"))
+    if mid is not None:
+        match = _UMA_MODEL_ID_RE.match(mid)
+        if match:
+            minor = int(match.group(1))
+            if minor == 1:
+                return "1.1"
+            if minor == 2:
+                return "1.2"
+            logging.warning(
+                f"Unknown UMA minor version in model_id={mid!r}; "
+                "treating as unknown_uma."
+            )
+            return "unknown_uma"
+        # A user-customized model_id is respected — we don't reclassify
+        # the checkpoint based on backbone.model_version in that case
+        # (the user has explicitly named their derivative).
+        return "unknown_uma"
+
+    mv = backbone.get("model_version")
+    if _match_version(mv, 1.1):
+        return "1.1"
+    if _match_version(mv, 1.2):
+        return "1.2"
+    if mv is None or _match_version(mv, 1.0):
+        return "1.0"
+    logging.warning(
+        f"Unknown UMA backbone.model_version={mv!r}; treating as unknown_uma."
+    )
+    return "unknown_uma"
+
+
+def _raise_uma_1p0(
+    model_config: dict | DictConfig,
+    checkpoint_location: str | None,
+) -> None:
+    mid = model_config.get("model_id") if isinstance(model_config, (dict, DictConfig)) else None
+    backbone = model_config.get("backbone", {}) if isinstance(model_config, (dict, DictConfig)) else {}
+    mv = backbone.get("model_version") if isinstance(backbone, (dict, DictConfig)) else None
+    path_str = checkpoint_location if checkpoint_location is not None else "<unknown path>"
+    raise RuntimeError(
+        f"UMA 1.0 checkpoints are no longer supported in this version of "
+        f"fairchem-core. Detected UMA 1.0 from checkpoint at {path_str!r} "
+        f"(model_id={mid!r}, backbone.model_version={mv!r}).\n"
+        f"\n"
+        f"UMA 1.0 has a known semantic divergence in "
+        f"`fairchem.core.models.uma.escn_moe.eSCNMDMoeBackbone` (the "
+        f"composition-reduction `include_self` flag branches on "
+        f"`np.isclose(self.model_version, 1.0)`). Loading 1.0 weights with "
+        f"the current code would produce numerically different results "
+        f"than the original release, so this is a hard failure.\n"
+        f"\n"
+        f"To use this checkpoint, install the last fairchem-core release "
+        f"that supported UMA 1.0:\n"
+        f"    pip install 'fairchem-core<={_LAST_UMA_1P0_FAIRCHEM_VERSION}'\n"
+        f"\n"
+        f"To use a current release, switch to UMA 1.1 or UMA 1.2 (see "
+        f"`facebook/UMA` on Hugging Face, or "
+        f"`fairchem.core.calculate.pretrained_mlip.available_models`)."
+    )
+
+
+def _backfill_uma_1p1_model_id(model_config: dict | DictConfig) -> bool:
+    """Set ``model_config['model_id'] = "UMA-1.1"`` if absent. Returns True if mutated."""
+    existing = _normalize_model_id(model_config.get("model_id"))
+    if existing is not None:
+        return False
+    if isinstance(model_config, DictConfig):
+        with open_dict(model_config):
+            OmegaConf.update(
+                model_config,
+                "model_id",
+                UMA_1P1_MODEL_ID,
+                merge=False,
+                force_add=True,
+            )
+    else:
+        model_config["model_id"] = UMA_1P1_MODEL_ID
+    return True
+
+
+def apply_uma_compat_fixups(
+    checkpoint: MLIPInferenceCheckpoint,
+    checkpoint_location: str | None = None,
+) -> None:
+    """Classify ``checkpoint`` and apply in-place UMA-generation fixups.
+
+    See module docstring for the full contract. Idempotent. Safe to call on
+    non-UMA checkpoints (no-op).
+    """
+    model_config = getattr(checkpoint, "model_config", None)
+    version = get_uma_version(model_config)
+
+    if version == "1.0":
+        _raise_uma_1p0(model_config, checkpoint_location)
+
+    if version == "1.1":
+        mutated = _backfill_uma_1p1_model_id(model_config)
+        if mutated:
+            logging.warning(
+                f"UMA 1.1 checkpoint at {checkpoint_location!r} had no "
+                f"model_id; back-filled model_id={UMA_1P1_MODEL_ID!r}. "
+                "This will be persisted to disk if the checkpoint is "
+                "subsequently saved (e.g. at the end of a finetune)."
+            )
+        return
+
+    if version == "1.2":
+        mid = model_config.get("model_id") if isinstance(model_config, (dict, DictConfig)) else None
+        logging.info(
+            f"Loaded UMA 1.2 checkpoint: model_id={mid!r}, "
+            f"path={checkpoint_location!r}"
+        )
+        return
+
+    if version == "unknown_uma":
+        logging.warning(
+            f"UMA checkpoint at {checkpoint_location!r} could not be classified "
+            "into a known generation (1.1 or 1.2); no fixups applied."
+        )
+        return
+
+    # not_uma: silent no-op.
diff --git a/src/fairchem/core/units/mlip_unit/mlip_unit.py b/src/fairchem/core/units/mlip_unit/mlip_unit.py
index 031ca5a35f..0fc62c8c72 100644
--- a/src/fairchem/core/units/mlip_unit/mlip_unit.py
+++ b/src/fairchem/core/units/mlip_unit/mlip_unit.py
@@ -57,6 +57,7 @@
 from fairchem.core.units.mlip_unit.api.inference import (
     MLIPInferenceCheckpoint,
 )
+from fairchem.core.models.uma.compat import apply_uma_compat_fixups
 from fairchem.core.units.mlip_unit.utils import load_inference_model
 
 if TYPE_CHECKING:
@@ -125,15 +126,17 @@ def convert_train_checkpoint_to_inference_checkpoint(
     )  # DCP model config
     train_eval_unit_state = inference_ckpt["config"]["runner"]["train_eval_unit"]
     unit_state = inference_ckpt["unit_state"]
-    torch.save(
-        MLIPInferenceCheckpoint(
-            model_state_dict=unit_state["model"],
-            ema_state_dict=unit_state["ema"],
-            model_config=train_eval_unit_state["model"],
-            tasks_config=train_eval_unit_state["tasks"],
-        ),
-        checkpoint_loc,
+    final_ckpt = MLIPInferenceCheckpoint(
+        model_state_dict=unit_state["model"],
+        ema_state_dict=unit_state["ema"],
+        model_config=train_eval_unit_state["model"],
+        tasks_config=train_eval_unit_state["tasks"],
     )
+    # Tag UMA generation (back-fill model_id for 1.1, hard-fail on 1.0)
+    # so the converted inference checkpoint is correctly identified by
+    # subsequent loads.
+    apply_uma_compat_fixups(final_ckpt, checkpoint_location=checkpoint_loc)
+    torch.save(final_ckpt, checkpoint_loc)
 
 
 def initialize_finetuning_model(
diff --git a/src/fairchem/core/units/mlip_unit/predict.py b/src/fairchem/core/units/mlip_unit/predict.py
index 4f5031142c..f9f0ccf1d9 100644
--- a/src/fairchem/core/units/mlip_unit/predict.py
+++ b/src/fairchem/core/units/mlip_unit/predict.py
@@ -37,6 +37,7 @@
 )
 from fairchem.core.components.batch_server import get_app_handle_with_retry
 from fairchem.core.datasets.atomic_data import AtomicData, warn_if_upcasting
+from fairchem.core.models.uma.compat import apply_uma_compat_fixups
 from fairchem.core.models.uma.nn.execution_backends import (
     maybe_update_settings_backend,
 )
@@ -129,6 +130,12 @@ def __init__(
             inference_model_path, map_location="cpu", weights_only=False
         )
 
+        # Classify UMA generation and apply in-place compat fixups (hard-fail
+        # for UMA 1.0, back-fill model_id for UMA 1.1). Runs before the calls
+        # below that read checkpoint.model_config so they see the patched
+        # config; also short-circuits the ~1 GB tensor allocation for 1.0.
+        apply_uma_compat_fixups(checkpoint, checkpoint_location=inference_model_path)
+
         # if the model is uma-s and the execution mode is not explicitly set, default to the optimized uma-s gpu execution mode
         self.inference_settings = maybe_update_settings_backend(
             self.inference_settings, checkpoint.model_config
diff --git a/src/fairchem/core/units/mlip_unit/utils.py b/src/fairchem/core/units/mlip_unit/utils.py
index ad91caf158..1fc2f534f8 100644
--- a/src/fairchem/core/units/mlip_unit/utils.py
+++ b/src/fairchem/core/units/mlip_unit/utils.py
@@ -17,6 +17,7 @@
 
 from fairchem.core.common.registry import registry
 from fairchem.core.common.utils import load_state_dict, match_state_dict
+from fairchem.core.models.uma.compat import apply_uma_compat_fixups
 
 if TYPE_CHECKING:
     from fairchem.core.units.mlip_unit.api.inference import MLIPInferenceCheckpoint
@@ -51,6 +52,8 @@ def load_inference_model(
             checkpoint_location, map_location="cpu", weights_only=False
         )
 
+    apply_uma_compat_fixups(checkpoint, checkpoint_location=checkpoint_location)
+
     if overrides is not None:
         checkpoint.model_config = update_configs(checkpoint.model_config, overrides)
 
diff --git a/tests/core/models/uma/test_compat.py b/tests/core/models/uma/test_compat.py
new file mode 100644
index 0000000000..3c8426ed07
--- /dev/null
+++ b/tests/core/models/uma/test_compat.py
@@ -0,0 +1,228 @@
+"""Tests for fairchem.core.models.uma.compat — UMA generation classifier
+and in-place ``model_id`` back-fill.
+"""
+
+from __future__ import annotations
+
+import logging
+import re
+
+import pytest
+from omegaconf import OmegaConf
+
+from fairchem.core.models.uma.compat import (
+    UMA_1P1_MODEL_ID,
+    apply_uma_compat_fixups,
+    get_uma_version,
+)
+from fairchem.core.units.mlip_unit.api.inference import MLIPInferenceCheckpoint
+
+UMA_BACKBONE_FQN = "fairchem.core.models.uma.escn_moe.eSCNMDMoeBackbone"
+UMA_BACKBONE_SHORT = "escnmd_moe_backbone"
+
+
+def make_fake_checkpoint(model_config) -> MLIPInferenceCheckpoint:
+    """Build a real ``MLIPInferenceCheckpoint`` with empty state for tests."""
+    return MLIPInferenceCheckpoint(
+        model_config=model_config,
+        model_state_dict={},
+        ema_state_dict={},
+        tasks_config={},
+    )
+
+
+def uma_cfg(*, model_version=None, model_id=None, backbone_model=UMA_BACKBONE_FQN):
+    cfg = {"backbone": {"model": backbone_model}}
+    if model_version is not None:
+        cfg["backbone"]["model_version"] = model_version
+    if model_id is not None:
+        cfg["model_id"] = model_id
+    return cfg
+
+
+# ---------------------------------------------------------------------------
+# UMA 1.0 — hard fail
+# ---------------------------------------------------------------------------
+
+
+def test_uma_1p0_raises():
+    cfg = uma_cfg()  # no model_id, no model_version
+    ckpt = make_fake_checkpoint(cfg)
+    with pytest.raises(RuntimeError) as exc_info:
+        apply_uma_compat_fixups(ckpt, checkpoint_location="/path/to/uma-s-1.pt")
+    msg = str(exc_info.value)
+    assert "UMA 1.0" in msg
+    assert "fairchem-core<=2.21.0" in msg
+    assert "/path/to/uma-s-1.pt" in msg
+
+
+def test_uma_1p0_raises_with_explicit_version_1p0():
+    cfg = uma_cfg(model_version=1.0)
+    ckpt = make_fake_checkpoint(cfg)
+    with pytest.raises(RuntimeError, match="UMA 1.0"):
+        apply_uma_compat_fixups(ckpt)
+
+
+def test_uma_1p0_raises_with_string_version_1p0():
+    cfg = uma_cfg(model_version="1.0")
+    ckpt = make_fake_checkpoint(cfg)
+    with pytest.raises(RuntimeError, match="UMA 1.0"):
+        apply_uma_compat_fixups(ckpt)
+
+
+# ---------------------------------------------------------------------------
+# UMA 1.1 — classification + back-fill
+# ---------------------------------------------------------------------------
+
+
+def test_uma_1p1_string_model_version_backfills(caplog):
+    cfg = uma_cfg(model_version="1.1")
+    ckpt = make_fake_checkpoint(cfg)
+    with caplog.at_level(logging.WARNING):
+        apply_uma_compat_fixups(ckpt, checkpoint_location="/p.pt")
+    assert ckpt.model_config["model_id"] == UMA_1P1_MODEL_ID
+    assert any("UMA 1.1" in r.getMessage() for r in caplog.records)
+
+
+def test_uma_1p1_float_model_version_backfills(caplog):
+    cfg = uma_cfg(model_version=1.1)
+    ckpt = make_fake_checkpoint(cfg)
+    with caplog.at_level(logging.WARNING):
+        apply_uma_compat_fixups(ckpt)
+    assert ckpt.model_config["model_id"] == UMA_1P1_MODEL_ID
+
+
+def test_uma_1p1_idempotent_bare(caplog):
+    cfg = uma_cfg(model_version="1.1", model_id=UMA_1P1_MODEL_ID)
+    ckpt = make_fake_checkpoint(cfg)
+    with caplog.at_level(logging.WARNING):
+        apply_uma_compat_fixups(ckpt)
+    assert ckpt.model_config["model_id"] == UMA_1P1_MODEL_ID
+    # No backfill warning on idempotent path.
+    assert not any("back-filled" in r.getMessage() for r in caplog.records)
+
+
+@pytest.mark.parametrize("subsize_id", ["UMA-S-1.1", "UMA-M-1.1", "UMA-L-1.1"])
+def test_uma_1p1_idempotent_with_subsize_suffix(subsize_id, caplog):
+    """Historical/external checkpoints may use the S/M/L-suffixed form."""
+    cfg = uma_cfg(model_version="1.1", model_id=subsize_id)
+    ckpt = make_fake_checkpoint(cfg)
+    assert get_uma_version(cfg) == "1.1"
+    with caplog.at_level(logging.WARNING):
+        apply_uma_compat_fixups(ckpt)
+    assert ckpt.model_config["model_id"] == subsize_id  # untouched
+    assert not any("back-filled" in r.getMessage() for r in caplog.records)
+
+
+# ---------------------------------------------------------------------------
+# UMA 1.2 — no-op
+# ---------------------------------------------------------------------------
+
+
+def test_uma_1p2_no_op():
+    cfg = uma_cfg(model_id="UMA-S-1.2")
+    ckpt = make_fake_checkpoint(cfg)
+    apply_uma_compat_fixups(ckpt)
+    assert ckpt.model_config["model_id"] == "UMA-S-1.2"
+
+
+def test_uma_1p2_bare_no_op():
+    cfg = uma_cfg(model_id="UMA-1.2")
+    ckpt = make_fake_checkpoint(cfg)
+    apply_uma_compat_fixups(ckpt)
+    assert ckpt.model_config["model_id"] == "UMA-1.2"
+
+
+# ---------------------------------------------------------------------------
+# Unknown / user-customized / non-UMA
+# ---------------------------------------------------------------------------
+
+
+def test_unknown_uma_id_warns_no_op(caplog):
+    """Future UMA 1.3 must not be silently treated as 1.2."""
+    cfg = uma_cfg(model_id="UMA-1.3")
+    ckpt = make_fake_checkpoint(cfg)
+    with caplog.at_level(logging.WARNING):
+        assert get_uma_version(cfg) == "unknown_uma"
+        apply_uma_compat_fixups(ckpt)
+    assert ckpt.model_config["model_id"] == "UMA-1.3"  # untouched
+
+
+def test_user_customized_model_id_preserved(caplog):
+    cfg = uma_cfg(model_version="1.1", model_id="my-cool-finetune")
+    ckpt = make_fake_checkpoint(cfg)
+    with caplog.at_level(logging.WARNING):
+        apply_uma_compat_fixups(ckpt)
+    assert ckpt.model_config["model_id"] == "my-cool-finetune"
+
+
+def test_non_uma_no_op(caplog):
+    cfg = {"backbone": {"model": "fairchem.core.models.esen.esen_backbone.ESEN"}}
+    ckpt = make_fake_checkpoint(cfg)
+    with caplog.at_level(logging.INFO):
+        assert get_uma_version(cfg) == "not_uma"
+        apply_uma_compat_fixups(ckpt)
+    assert "model_id" not in ckpt.model_config
+    assert not any("UMA" in r.getMessage() for r in caplog.records)
+
+
+def test_short_registry_name_backbone():
+    cfg = uma_cfg(model_version="1.1", backbone_model=UMA_BACKBONE_SHORT)
+    ckpt = make_fake_checkpoint(cfg)
+    assert get_uma_version(cfg) == "1.1"
+    apply_uma_compat_fixups(ckpt)
+    assert ckpt.model_config["model_id"] == UMA_1P1_MODEL_ID
+
+
+def test_none_model_config():
+    ckpt = make_fake_checkpoint(None)
+    assert get_uma_version(None) == "not_uma"
+    apply_uma_compat_fixups(ckpt)  # must not raise
+
+
+def test_empty_backbone_dict_treated_as_not_uma():
+    cfg = {"backbone": {}}
+    ckpt = make_fake_checkpoint(cfg)
+    assert get_uma_version(cfg) == "not_uma"
+    apply_uma_compat_fixups(ckpt)
+    assert "model_id" not in ckpt.model_config
+
+
+def test_empty_string_model_id_treated_as_absent():
+    cfg = uma_cfg(model_version="1.1", model_id="")
+    ckpt = make_fake_checkpoint(cfg)
+    apply_uma_compat_fixups(ckpt)
+    assert ckpt.model_config["model_id"] == UMA_1P1_MODEL_ID
+
+
+def test_whitespace_model_id_treated_as_absent():
+    cfg = uma_cfg(model_version="1.1", model_id="   ")
+    ckpt = make_fake_checkpoint(cfg)
+    apply_uma_compat_fixups(ckpt)
+    assert ckpt.model_config["model_id"] == UMA_1P1_MODEL_ID
+
+
+# ---------------------------------------------------------------------------
+# DictConfig + override-bypass policy
+# ---------------------------------------------------------------------------
+
+
+def test_dictconfig_backfill_under_struct_mode():
+    """OmegaConf struct mode must not block the back-fill (uses open_dict)."""
+    cfg = OmegaConf.create(uma_cfg(model_version="1.1"))
+    OmegaConf.set_struct(cfg, True)
+    ckpt = make_fake_checkpoint(cfg)
+    apply_uma_compat_fixups(ckpt)
+    assert ckpt.model_config["model_id"] == UMA_1P1_MODEL_ID
+
+
+def test_dictconfig_uma_1p2_classified():
+    cfg = OmegaConf.create(uma_cfg(model_id="UMA-S-1.2"))
+    assert get_uma_version(cfg) == "1.2"
+
+
+def test_dictconfig_uma_1p0_raises():
+    cfg = OmegaConf.create(uma_cfg())
+    ckpt = make_fake_checkpoint(cfg)
+    with pytest.raises(RuntimeError, match="UMA 1.0"):
+        apply_uma_compat_fixups(ckpt)
diff --git a/tests/core/units/mlip_unit/test_predict.py b/tests/core/units/mlip_unit/test_predict.py
index e384dafde0..2352ef8fdd 100644
--- a/tests/core/units/mlip_unit/test_predict.py
+++ b/tests/core/units/mlip_unit/test_predict.py
@@ -9,6 +9,7 @@
 
 import contextlib
 import logging
+import os
 from copy import deepcopy
 
 import numpy as np
@@ -25,8 +26,10 @@
 from fairchem.core.common import distutils
 from fairchem.core.datasets.atomic_data import AtomicData, atomicdata_list_to_batch
 from fairchem.core.datasets.common_structures import get_fcc_crystal_by_num_atoms
+from fairchem.core.models.uma.compat import UMA_1P1_MODEL_ID
 from fairchem.core.models.uma.nn.execution_backends import UMASFastGPUBackend
 from fairchem.core.units.mlip_unit import InferenceSettings, MLIPPredictUnit
+from fairchem.core.units.mlip_unit.mlip_unit import initialize_finetuning_model
 from fairchem.core.units.mlip_unit.predict import ParallelMLIPPredictUnit
 from fairchem.core.units.mlip_unit.single_atom_patch import (
     single_atom_prediction_from_lookup,
@@ -1773,3 +1776,42 @@ def test_execution_mode_not_set_when_conditions_not_met(model_name):
         f"Expected execution_mode to be None when activation_checkpointing=True, "
         f"got {predict_unit.inference_settings.execution_mode}"
     )
+
+
+# ---------------------------------------------------------------------------
+# UMA compat / model_id fixups (see fairchem.core.models.uma.compat)
+# ---------------------------------------------------------------------------
+
+
+def test_uma_1p1_predict_unit_has_model_id(uma_1p1_predict_unit):
+    """UMA 1.1 checkpoints have no `model_id` on disk; the compat fixup
+    back-fills it to `"UMA-1.1"` at load time."""
+    assert uma_1p1_predict_unit.model.module.model_id == UMA_1P1_MODEL_ID
+
+
+def test_uma_1p1_finetune_propagates_model_id():
+    """When finetuning starts from UMA 1.1, the back-filled `model_id` is
+    stashed onto `model.finetune_model_full_config` so a subsequent
+    `save_state` persists it into the new checkpoint."""
+    ckpt = pretrained_checkpoint_path_from_name("uma-s-1p1")
+    model = initialize_finetuning_model(ckpt, overrides=None, heads=None)
+    assert (
+        model.finetune_model_full_config["model_id"] == UMA_1P1_MODEL_ID
+    )
+
+
+def test_uma_1p0_predict_unit_raises():
+    """UMA 1.0 checkpoints must hard-fail with an actionable message.
+    Skips if no UMA 1.0 checkpoint is locally available."""
+    uma_1p0_path = os.environ.get("UMA_1P0_PATH")
+    if uma_1p0_path is None:
+        # Best-effort discovery in the local HF cache.
+        from pathlib import Path
+
+        cache_root = Path("~/.cache/fairchem/models--facebook--UMA/snapshots").expanduser()
+        candidates = sorted(cache_root.glob("*/checkpoints/uma-s-1.pt"))
+        uma_1p0_path = str(candidates[0]) if candidates else None
+    if uma_1p0_path is None or not os.path.exists(uma_1p0_path):
+        pytest.skip("No UMA 1.0 checkpoint available; set UMA_1P0_PATH to test.")
+    with pytest.raises(RuntimeError, match="UMA 1.0"):
+        MLIPPredictUnit(uma_1p0_path, device="cpu")