mlr-org
diff --git a/‎DESCRIPTION‎
Lines changed: 2 additions & 0 deletions b/‎DESCRIPTION‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎R/BenchmarkResult.R‎
Lines changed: 5 additions & 8 deletions b/‎R/BenchmarkResult.R‎
Lines changed: 5 additions & 8 deletions
diff --git a/‎R/Measure.R‎
Lines changed: 50 additions & 11 deletions b/‎R/Measure.R‎
Lines changed: 50 additions & 11 deletions
diff --git a/‎R/MeasureSimple.R‎
Lines changed: 54 additions & 15 deletions b/‎R/MeasureSimple.R‎
Lines changed: 54 additions & 15 deletions
diff --git a/‎R/Prediction.R‎
Lines changed: 7 additions & 9 deletions b/‎R/Prediction.R‎
Lines changed: 7 additions & 9 deletions
diff --git a/‎R/ResampleResult.R‎
Lines changed: 7 additions & 10 deletions b/‎R/ResampleResult.R‎
Lines changed: 7 additions & 10 deletions
diff --git a/‎R/helper.R‎
Lines changed: 0 additions & 17 deletions b/‎R/helper.R‎
Lines changed: 0 additions & 17 deletions
diff --git a/‎R/mlr_reflections.R‎
Lines changed: 1 addition & 1 deletion b/‎R/mlr_reflections.R‎
Lines changed: 1 addition & 1 deletion
@@ -76,6 +76,8 @@ Suggests:
     RhpcBLASctl,
     rpart,
     testthat (>= 3.3.0)
+Remotes:
+    mlr-org/mlr3measures
 Encoding: UTF-8
 Config/testthat/edition: 3
 Config/testthat/parallel: false
 
@@ -224,14 +224,11 @@ BenchmarkResult = R6Class("BenchmarkResult",
     },
 
     #' @description
-    #' Calculates the observation-wise loss via the loss function set in the
-    #' [Measure]'s field `obs_loss`.
-    #' Returns a `data.table()` with the columns `row_ids`, `truth`, `response` and
-    #' one additional numeric column for each measure, named with the respective measure id.
-    #' If there is no observation-wise loss function for the measure, the column is filled with
-    #' `NA` values.
-    #' Note that some measures such as RMSE, do have an `$obs_loss`, but they require an
-    #' additional transformation after aggregation, in this example taking the square-root.
+    #' Calculates the observation-wise loss via the [Measure]'s `obs_loss` method.
+    #' Returns a `data.table()` with columns from the predictions (e.g., `row_ids`, `truth`, `response`, etc.), plus one numeric column for each measure, named with the respective measure id, and a `resample_result` column.
+    #' If there is no observation-wise loss function for the measure, the column is filled with `NA_real_` values.
+    #' Note that some measures, such as RMSE, do have an `$obs_loss`, but they require an additional transformation after aggregation; for RMSE, this is taking the square root.
+    #'
     #' @param predict_sets (`character()`)\cr
     #'   The predict sets.
     #' @examples
 
@@ -91,10 +91,6 @@ Measure = R6Class("Measure",
     #' @template field_param_set
     param_set = NULL,
 
-    #' @field obs_loss (`function()` | `NULL`)
-    #' Function to calculate the observation-wise loss.
-    obs_loss = NULL,
-
     #' @field trafo (`list()` | `NULL`)
     #' `NULL` or a list with two elements:
     #' * `trafo`: the transformation function applied after aggregating
@@ -138,11 +134,23 @@ Measure = R6Class("Measure",
     #' Creates a new instance of this [R6][R6::R6Class] class.
     #'
     #' Note that this object is typically constructed via a derived class, e.g. [MeasureClassif] or [MeasureRegr].
-    initialize = function(id, task_type = NA, param_set = ps(), range = c(-Inf, Inf), minimize = NA, average = "macro",
-      aggregator = NULL, obs_loss = NULL, properties = character(), predict_type = "response",
-      predict_sets = "test", task_properties = character(), packages = character(),
-      label = NA_character_, man = NA_character_, trafo = NULL) {
-
+    initialize = function(
+      id,
+      task_type = NA,
+      param_set = ps(),
+      range = c(-Inf, Inf),
+      minimize = NA,
+      average = "macro",
+      aggregator = NULL,
+      properties = character(),
+      predict_type = "response",
+      predict_sets = "test",
+      task_properties = character(),
+      packages = character(),
+      label = NA_character_,
+      man = NA_character_,
+      trafo = NULL
+    ) {
       self$id = assert_string(id, min.chars = 1L)
       self$label = assert_string(label, na.ok = TRUE)
       self$task_type = task_type
@@ -151,7 +159,6 @@ Measure = R6Class("Measure",
       self$minimize = assert_flag(minimize, na.ok = TRUE)
       self$average = average
       private$.aggregator = assert_function(aggregator, null.ok = TRUE)
-      self$obs_loss = assert_function(obs_loss, null.ok = TRUE)
       self$trafo = assert_list(trafo, len = 2L, types = "function", null.ok = TRUE)
       if (!is.null(self$trafo)) {
         assert_permutation(names(trafo), c("fn", "deriv"))
@@ -311,6 +318,35 @@ Measure = R6Class("Measure",
           private$.aggregator(rr)
         }
       )
+    },
+
+    #' @description
+    #' Computes the loss of each individual observation of a [Prediction].
+    #' The result is a `numeric()` with one element for each row in the [Prediction].
+    #' Measures without the `"obs_loss"` property yield a vector of `NA_real_` values.
+    #' An error is raised if the task type of the measure is set and differs from the task type of the prediction.
+    #'
+    #' @param prediction ([Prediction])\cr
+    #'   Prediction to calculate the observation-wise loss for.
+    #' @param task ([Task])\cr
+    #'   Passed on to the private `.obs_loss()` implementation of the measure.
+    #' @param learner ([Learner])\cr
+    #'   Currently not passed on to the private `.obs_loss()` implementation of the measure.
+    #'
+    #' @return `numeric()` with one element for each row in the [Prediction].
+    #' @examples
+    #' task = tsk("penguins")
+    #' learner = lrn("classif.rpart")
+    #' learner$train(task)
+    #' prediction = learner$predict(task)
+    #' msr("classif.ce")$obs_loss(prediction)
+    obs_loss = function(prediction, task = NULL, learner = NULL) {
+      measure_type = self$task_type
+      if (!is_scalar_na(measure_type) && measure_type != prediction$task_type) {
+        stopf("Measure '%s' incompatible with task type '%s'", self$id, prediction$task_type)
+      }
+
+      # measures without the "obs_loss" property report NA for every row of the prediction
+      if ("obs_loss" %in% self$properties) {
+        private$.obs_loss(prediction, task)
+      } else {
+        rep(NA_real_, length(prediction$row_ids))
+      }
     }
   ),
 
@@ -330,7 +366,7 @@ Measure = R6Class("Measure",
     hash = function(rhs) {
       assert_ro_binding(rhs)
       calculate_hash(class(self), self$id, self$param_set$values, private$.score,
-        private$.average, private$.aggregator, self$obs_loss, self$trafo,
+        private$.average, private$.aggregator, private$.obs_loss, self$trafo,
         self$predict_sets, mget(private$.extra_hash, envir = self), private$.use_weights)
     },
 
@@ -412,6 +448,9 @@ Measure = R6Class("Measure",
     .use_weights = NULL,
     .score = function(prediction, task, weights, ...) {
       stop("abstract method")
+    },
+    # Hook for the observation-wise loss: the public `obs_loss()` method calls it for measures that carry the
+    # "obs_loss" property. This base implementation only raises an error.
+    .obs_loss = function(prediction, task, ...) {
+      stop("abstract method")
     }
   )
 )
 
@@ -3,17 +3,24 @@ MeasureBinarySimple = R6Class("MeasureBinarySimple",
   inherit = MeasureClassif,
   public = list(
     fun = NULL,
+    fun_obs_loss = NULL,
     na_value = NaN,
     initialize = function(name, param_set = ps()) {
       info = mlr3measures::measures[[name]]
       weights = info$sample_weights
+      properties = if (weights) "weights" else character()
+
+      if (!is.na(info$obs_loss)) {
+        properties = c(properties, "obs_loss")
+        self$fun_obs_loss = get(info$obs_loss, envir = asNamespace("mlr3measures"), mode = "function")
+      }
 
       super$initialize(
         id = paste0("classif.", name),
         param_set = param_set,
         range = c(info$lower, info$upper),
         minimize = info$minimize,
-        properties = if (weights) "weights" else character(),
+        properties = properties,
         predict_type = info$predict_type,
         task_properties = "twoclass",
         packages = "mlr3measures",
@@ -22,9 +29,7 @@ MeasureBinarySimple = R6Class("MeasureBinarySimple",
       )
 
       self$fun = get(name, envir = asNamespace("mlr3measures"), mode = "function")
-      if (!is.na(info$obs_loss)) {
-        self$obs_loss = get(info$obs_loss, envir = asNamespace("mlr3measures"), mode = "function")
-      }
+
       if (test_list(info$trafo)) {
         self$trafo = info$trafo
       }
@@ -41,7 +46,18 @@ MeasureBinarySimple = R6Class("MeasureBinarySimple",
       )
     },
 
-    .extra_hash = c("fun", "na_value")
+    .extra_hash = c("fun", "fun_obs_loss", "na_value"),
+
+    # Observation-wise loss for binary measures: hands truth, response, the probability column of the
+    # positive class and the parameter values of the measure to `fun_obs_loss`.
+    .obs_loss = function(prediction, ...) {
+      labels = prediction$truth
+      # the first factor level of the truth is used as the positive class
+      pos_class = levels(labels)[1L]
+      pos_prob = prediction$prob[, pos_class]
+      invoke(self$fun_obs_loss, truth = labels, response = prediction$response, prob = pos_prob,
+        positive = pos_class, .args = self$param_set$get_values())
+    }
   )
 )
 
@@ -50,26 +66,29 @@ MeasureClassifSimple = R6Class("MeasureClassifSimple",
   inherit = MeasureClassif,
   public = list(
     fun = NULL,
+    fun_obs_loss = NULL,
     na_value = NaN,
     initialize = function(name, param_set = ps()) {
       info = mlr3measures::measures[[name]]
       weights = info$sample_weights
+      properties = if (weights) "weights" else character()
+      if (!is.na(info$obs_loss)) {
+        properties = c(properties, "obs_loss")
+        self$fun_obs_loss = get(info$obs_loss, envir = asNamespace("mlr3measures"), mode = "function")
+      }
 
       super$initialize(
         id = paste0("classif.", name),
         param_set = param_set,
         range = c(info$lower, info$upper),
         minimize = info$minimize,
-        properties = if (weights) "weights" else character(),
+        properties = properties,
         predict_type = info$predict_type,
         packages = "mlr3measures",
         label = info$title,
         man = paste0("mlr3::mlr_measures_classif.", name)
       )
       self$fun = get(name, envir = asNamespace("mlr3measures"), mode = "function")
-      if (!is.na(info$obs_loss)) {
-        self$obs_loss = get(info$obs_loss, envir = asNamespace("mlr3measures"), mode = "function")
-      }
       if (test_list(info$trafo)) {
         self$trafo = info$trafo
       }
@@ -82,7 +101,15 @@ MeasureClassifSimple = R6Class("MeasureClassifSimple",
         na_value = self$na_value, sample_weights = weights)
     },
 
-    .extra_hash = c("fun", "na_value")
+    .extra_hash = c("fun", "fun_obs_loss", "na_value"),
+
+    # Observation-wise loss for classification measures: hands truth, response, the full `prob` field of the
+    # prediction and the parameter values of the measure to `fun_obs_loss`.
+    .obs_loss = function(prediction, ...) {
+      hyperpars = self$param_set$get_values()
+      invoke(self$fun_obs_loss, truth = prediction$truth, response = prediction$response,
+        prob = prediction$prob, .args = hyperpars)
+    }
   )
 )
 
@@ -91,6 +118,7 @@ MeasureRegrSimple = R6Class("MeasureRegrSimple",
   inherit = MeasureRegr,
   public = list(
     fun = NULL,
+    fun_obs_loss = NULL,
     na_value = NaN,
     initialize = function(name, param_set = NULL) {
       if (is.null(param_set)) {
@@ -103,22 +131,25 @@ MeasureRegrSimple = R6Class("MeasureRegrSimple",
 
       info = mlr3measures::measures[[name]]
       weights = info$sample_weights
+      properties = if (weights) "weights" else character()
+      if (!is.na(info$obs_loss)) {
+        properties = c(properties, "obs_loss")
+        self$fun_obs_loss = get(info$obs_loss, envir = asNamespace("mlr3measures"), mode = "function")
+      }
 
       super$initialize(
         id = paste0("regr.", name),
         param_set = param_set$clone(),
         range = c(info$lower, info$upper),
         minimize = info$minimize,
-        properties = if (weights) "weights" else character(),
+        properties = properties,
         predict_type = info$predict_type,
         packages = "mlr3measures",
         label = info$title,
         man = paste0("mlr3::mlr_measures_regr.", name)
       )
       self$fun = get(name, envir = asNamespace("mlr3measures"), mode = "function")
-      if (!is.na(info$obs_loss)) {
-        self$obs_loss = get(info$obs_loss, envir = asNamespace("mlr3measures"), mode = "function")
-      }
+
       if (test_list(info$trafo)) {
         self$trafo = info$trafo
       }
@@ -131,7 +162,15 @@ MeasureRegrSimple = R6Class("MeasureRegrSimple",
         na_value = self$na_value, sample_weights = weights)
     },
 
-    .extra_hash = c("fun", "na_value")
+    .extra_hash = c("fun", "fun_obs_loss", "na_value"),
+
+    # Observation-wise loss for regression measures: hands truth, response, the `se` field of the
+    # prediction and the parameter values of the measure to `fun_obs_loss`.
+    .obs_loss = function(prediction, ...) {
+      hyperpars = self$param_set$get_values()
+      invoke(self$fun_obs_loss, truth = prediction$truth, response = prediction$response,
+        se = prediction$se, .args = hyperpars)
+    }
   )
 )
 
 
@@ -96,17 +96,15 @@ Prediction = R6Class("Prediction",
     },
 
     #' @description
-    #' Calculates the observation-wise loss via the loss function set in the
-    #' [Measure]'s field `obs_loss`.
-    #' Returns a `data.table()` with the columns `row_ids`, `truth`, `response` and
-    #' one additional numeric column for each measure, named with the respective measure id.
-    #' If there is no observation-wise loss function for the measure, the column is filled with
-    #' `NA` values.
-    #' Note that some measures such as RMSE, do have an `$obs_loss`, but they require an
-    #' additional transformation after aggregation, in this example taking the square-root.
+    #' Calculates the observation-wise loss via the [Measure]'s `obs_loss` method.
+    #' Returns a `data.table()` with the columns of this prediction (as given by `as.data.table()`) plus one additional numeric column for each measure, named with the respective measure id.
+    #' If there is no observation-wise loss function for the measure, the column is filled with `NA_real_` values.
+    #' Note that some measures, such as RMSE, do have an `$obs_loss`, but they require an additional transformation after aggregation; for RMSE, this is taking the square root.
     obs_loss = function(measures = NULL) {
       measures = assert_measures(as_measures(measures, task_type = self$task_type))
-      get_obs_loss(as.data.table(self), measures)
+      tab = as.data.table(self)
+      # write one column per measure into `tab`, named by the measure id and filled with the values
+      # returned by that measure's `$obs_loss()` for this prediction
+      walk(measures, function(m) set(tab, j = m$id, value = m$obs_loss(prediction = self)))
+      tab[]
     },
 
 
 
@@ -190,23 +190,20 @@ ResampleResult = R6Class("ResampleResult",
     },
 
     #' @description
-    #' Calculates the observation-wise loss via the loss function set in the
-    #' [Measure]'s field `obs_loss`.
-    #' Returns a `data.table()` with the columns of the matching [Prediction] object plus
-    #' one additional numeric column for each measure, named with the respective measure id.
-    #' If there is no observation-wise loss function for the measure, the column is filled with
-    #' `NA` values.
-    #' Note that some measures such as RMSE, do have an `$obs_loss`, but they require an
-    #' additional transformation after aggregation, in this example taking the square-root.
+    #' Calculates the observation-wise loss via the [Measure]'s `obs_loss` method.
+    #' Returns a `data.table()` with an `iteration` column, the columns of the matching [Prediction] objects, plus one numeric column for each measure, named with the respective measure id.
+    #' If there is no observation-wise loss function for the measure, the column is filled with `NA_real_` values.
+    #' Note that some measures, such as RMSE, do have an `$obs_loss`, but they require an additional transformation after aggregation; for RMSE, this is taking the square root.
     #'
     #' @param predict_sets (`character()`)\cr
     #'   The predict sets.
     #' @examples
     #' rr$obs_loss(msr("classif.acc"))
     obs_loss = function(measures = NULL, predict_sets = "test") {
       measures = assert_measures(as_measures(measures, task_type = self$task_type))
-      tab = map_dtr(self$predictions(predict_sets), as.data.table, .idcol = "iteration")
-      get_obs_loss(tab, measures)
+      # each prediction builds its own loss table via its `$obs_loss()` method; `map_dtr()` combines the
+      # per-prediction tables and identifies them in the `iteration` column
+      map_dtr(self$predictions(predict_sets), function(pred) {
+        pred$obs_loss(measures)
+      }, .idcol = "iteration")
     },
 
     #' @description
 
@@ -62,23 +62,6 @@ assert_validate = function(x) {
   assert_choice(x, c("predefined", "test"), null.ok = TRUE)
 }
 
-
-get_obs_loss = function(tab, measures) {
-  for (measure in measures) {
-    fun = measure$obs_loss
-    value = if (is.function(fun)) {
-      args = intersect(names(tab), names(formals(fun)))
-      do.call(fun, tab[, args, with = FALSE])
-    } else {
-      NA_real_
-    }
-
-    set(tab, j = measure$id, value = value)
-  }
-
-  tab[]
-}
-
 # Generalization of quantile(type = 7) for weighted data.
 
 quantile_weighted = function(x, probs, na.rm = FALSE, weights = NULL, digits = 7L, continuous = TRUE) {
 
@@ -147,7 +147,7 @@ local({
   mlr_reflections$resampling_properties = c("duplicated_ids", "weights")
 
   ### Measures
-  tmp = c("na_score", "requires_task", "requires_learner", "requires_model", "requires_train_set", "weights", "primary_iters", "requires_no_prediction")
+  tmp = c("na_score", "requires_task", "requires_learner", "requires_model", "requires_train_set", "weights", "primary_iters", "requires_no_prediction", "obs_loss")
   mlr_reflections$measure_properties = list(
     classif = tmp,
     regr = tmp