autogluon · LennartPurucker · Jun 20, 2025 · Jun 25, 2025 · Jun 25, 2025
diff --git a/setup.py b/setup.py
@@ -39,6 +39,10 @@
     "modernnca": [
         "category_encoders",
     ],
+    "perpetualboosting": [
+        # used version: 0.9.4
+        "perpetual",
+    ],
 }
 
 benchmark_requires = []

diff --git a/tabrepo/benchmark/models/ag/__init__.py b/tabrepo/benchmark/models/ag/__init__.py
@@ -8,6 +8,7 @@
 from tabrepo.benchmark.models.ag.tabm.tabm_model import TabMModel
 from tabrepo.benchmark.models.ag.tabpfnv2.tabpfnv2_client_model import TabPFNV2ClientModel
 from tabrepo.benchmark.models.ag.tabpfnv2.tabpfnv2_model import TabPFNV2Model
+from tabrepo.benchmark.models.ag.perpetual.perpetual_model import PerpetualBoostingModel
 
 __all__ = [
     "ExplainableBoostingMachineModel",
@@ -18,4 +19,5 @@
     "TabMModel",
     "TabPFNV2ClientModel",
     "TabPFNV2Model",
+    "PerpetualBoostingModel",
 ]
diff --git a/tabrepo/benchmark/models/ag/perpetual/__init__.py b/tabrepo/benchmark/models/ag/perpetual/__init__.py
diff --git a/tabrepo/benchmark/models/ag/perpetual/perpetual_model.py b/tabrepo/benchmark/models/ag/perpetual/perpetual_model.py
@@ -0,0 +1,146 @@
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+from autogluon.core.constants import BINARY, MULTICLASS, REGRESSION
+from autogluon.core.models import AbstractModel
+
+if TYPE_CHECKING:
+    import numpy as np
+    import pandas as pd
+    from autogluon.core.metrics import Scorer
+
+
+# TODO: memory limiting of the lib does not work correctly, can this be fixed?
+# TODO: requires memory estimation logic to become useful to switch to sequential fitting
+class PerpetualBoostingModel(AbstractModel):
+    ag_key = "PB"
+    ag_name = "PerpetualBoosting"
+
+    def __init__(self, **kwargs):
+        super().__init__(**kwargs)
+        self._category_features: list[str] = None
+
+    def _preprocess(self, X: pd.DataFrame, **kwargs) -> pd.DataFrame:
+        X = super()._preprocess(X, **kwargs)
+
+        if self._category_features is None:
+            self._category_features = X.select_dtypes(
+                include=["category"]
+            ).columns.tolist()
+
+        return X
+
+    # TODO: API does not support a random seed, but rust code does (mhm?)
+    # TODO: no GPU support (?), add warning.
+    # TODO: no support for passing validation data... needs to be added (as callback)
+    def _fit(
+        self,
+        X: pd.DataFrame,
+        y: pd.Series,
+        # X_val: pd.DataFrame | None = None,
+        # y_val: pd.Series | None = None,
+        time_limit: float | None = None,
+        num_cpus: int | str = "auto",
+        sample_weight: np.ndarray | None = None,
+        sample_weight_val: np.ndarray | None = None,
+        **kwargs,
+    ):
+        # Preprocess data.
+        X = self.preprocess(X, is_train=True)
+        paras = self._get_model_params()
+
+        from perpetual import PerpetualBooster
+
+        # ----- The below is hacky workaround to set the memory limit
+        # TODO: set this in the outer scope or automatically here
+        sequential_fitting = False
+        if sequential_fitting:
+            memory_limit = 32  # all memory for the job, in GB
+            # 1 if sequential fitting is used
+            # otherwise memory limit is not enforced across threads.
+            num_cpus = 1
+
+        else:
+            #  here we know it is one of 8 folds now.
+            # at this stage, num_cpus == 1 anyhow.
+            memory_limit = 4
+
+            # FIXME: does not work as env var is not set in ray job...
+            #   need to pass this to the model kwargs as well
+            #   future work... hard coding for now.
+            # memory_limit = ResourceManager().get_available_virtual_mem(format="GB") / 8
+
+        # ---- Additional bug
+        # FIXME: with a lot of categorical features, the memory limit is
+        #  not enforced correctly. No way to control this as far as I can tell.
+        # - Example: to make this code run on 363711 (MIC) I set the limit to 32 GB
+        #   but had to give it 64 GB to not OOM. If I set the limit to 64 GB, it uses
+        #   90ish GB and OOMs the job.
+        # memory_limit = 32
+        # Even then, it still hangs on prediction and runs out of time.
+
+        # safety as memory limit should be quicker than cgroups.
+        memory_limit = int(memory_limit * 0.95)
+        self.model = PerpetualBooster(
+            objective=get_metric_from_ag_metric(
+                metric=self.eval_metric, problem_type=self.problem_type
+            ),
+            num_threads=num_cpus,
+            memory_limit=memory_limit,  # TODO: limit per thread?
+            categorical_features=self._category_features,
+            # FIXME: time limit is also not strictly enforced, check when the
+            #  loop is stopped and if preprocessing counts towards the limit.
+            timeout=time_limit,
+            # stopping_rounds - no idea how to set this
+            **paras,
+        )
+
+        # FIXME: why does the out-of-budget message show up several times?
+        self.model.fit(X=X, y=y, sample_weight=sample_weight)
+
+    def _set_default_params(self):
+        default_params = {
+            "iteration_limit": 10_000,
+            # As we use a timeout this should be the max I guess.
+            #   2.0 is used a lot in examples, so I guess it is the max (?).
+            "budget": 2.0,
+        }
+        for param, val in default_params.items():
+            self._set_default_param_value(param, val)
+
+    def _get_default_auxiliary_params(self) -> dict:
+        default_auxiliary_params = super()._get_default_auxiliary_params()
+        extra_auxiliary_params = {
+            "valid_raw_types": ["int", "float", "category"],
+        }
+        default_auxiliary_params.update(extra_auxiliary_params)
+        return default_auxiliary_params
+
+    @classmethod
+    def supported_problem_types(cls) -> list[str] | None:
+        return ["binary", "multiclass", "regression"]
+
+    # TODO: support refit full
+    def _more_tags(self) -> dict:
+        return {"can_refit_full": False}
+
+
+def get_metric_from_ag_metric(*, metric: Scorer, problem_type: str):
+    """Map AutoGluon metric to EBM metric for early stopping."""
+    if problem_type in [BINARY, MULTICLASS]:
+        # Only supports log_loss for classification.
+        metric_map = {
+            "log_loss": "LogLoss",
+        }
+        metric_class = metric_map.get(metric.name, "LogLoss")
+    elif problem_type == REGRESSION:
+        metric_map = {
+            "mean_squared_error": "HuberLoss",  # seems to be a better match than RMSE.
+            "root_mean_squared_error": "SquaredLoss",
+        }
+        metric_class = metric_map.get(metric.name, "SquaredLoss")
+    else:
+        raise AssertionError(f"EBM does not support {problem_type} problem type.")
+
+    return metric_class
diff --git a/tabrepo/benchmark/models/model_register.py b/tabrepo/benchmark/models/model_register.py
@@ -7,6 +7,7 @@
 from tabrepo.benchmark.models.ag import (
     ExplainableBoostingMachineModel,
     ModernNCAModel,
+    PerpetualBoostingModel,
     RealMLPModel,
     TabDPTModel,
     TabICLModel,
@@ -26,6 +27,7 @@
     TabDPTModel,
     TabMModel,
     ModernNCAModel,
+    PerpetualBoostingModel,
 ]
 
 for _model_cls in _models_to_add:
@@ -43,7 +45,10 @@ def infer_model_cls(model_cls: str, model_register: ModelRegistry = None):
                 if real_model_cls.ag_name == model_cls:
                     model_cls = real_model_cls
                     break
-        elif model_cls in [str(real_model_cls.__name__) for real_model_cls in model_register.model_cls_list]:
+        elif model_cls in [
+            str(real_model_cls.__name__)
+            for real_model_cls in model_register.model_cls_list
+        ]:
             for real_model_cls in model_register.model_cls_list:
                 if model_cls == str(real_model_cls.__name__):
                     model_cls = real_model_cls

diff --git a/tabrepo/models/perpetual/__init__.py b/tabrepo/models/perpetual/__init__.py
diff --git a/tabrepo/models/perpetual/generate.py b/tabrepo/models/perpetual/generate.py
@@ -0,0 +1,13 @@
+from __future__ import annotations
+
+from tabrepo.benchmark.models.ag.perpetual.perpetual_model import PerpetualBoostingModel
+from tabrepo.utils.config_utils import ConfigGenerator
+
+# TODO: ask authors for search space / come up with something.
+search_space = {}
+
+gen_perpetual = ConfigGenerator(
+    model_cls=PerpetualBoostingModel,
+    search_space=search_space,
+    manual_configs=[{}],
+)
diff --git a/tabrepo/models/utils.py b/tabrepo/models/utils.py
@@ -46,6 +46,7 @@ def get_configs_generator_from_name(model_name: str):
         # "TabPFN": lambda: importlib.import_module("tabrepo.models.tabpfn.generate").gen_tabpfn, # not supported in TabArena
         "TabPFNv2": lambda: importlib.import_module("tabrepo.models.tabpfnv2.generate").gen_tabpfnv2,
         "XGBoost": lambda: importlib.import_module("tabrepo.models.xgboost.generate").gen_xgboost,
+        "PerpetualBoosting": lambda: importlib.import_module("tabrepo.models.perpetual.generate").gen_perpetual,
     }
 
     if model_name not in name_to_import_map:

diff --git a/tst/benchmark/models/test_perpetual.py b/tst/benchmark/models/test_perpetual.py
@@ -0,0 +1,25 @@
+from __future__ import annotations
+
+import pytest
+
+
+def test_perpetual():
+    model_hyperparameters = {"iteration_limit": 10, "budget": 0.1}
+
+    try:
+        from autogluon.tabular.testing import FitHelper
+        from tabrepo.benchmark.models.ag.perpetual.perpetual_model import (
+            PerpetualBoostingModel,
+        )
+
+        model_cls = PerpetualBoostingModel
+        FitHelper.verify_model(
+            model_cls=model_cls,
+            model_hyperparameters=model_hyperparameters,
+        )
+    except ImportError as err:
+        pytest.skip(
+            f"Import Error, skipping test... "
+            f"Ensure you have the proper dependencies installed to run this test:\n"
+            f"{err}"
+        )