
Commit a690ff6 (merge of 2 parents: 09c4226 + bafd7e0)

Merge pull request #109 from ModelOriented/permshap

Add permshap()

24 files changed: +1343 -534 lines

.github/workflows/test-coverage.yaml

Lines changed: 2 additions & 0 deletions
@@ -35,6 +35,8 @@ jobs:
       function_exclusions = c(
         "kernelshap\\.Learner",
         "kernelshap\\.ranger",
+        "permshap\\.Learner",
+        "permshap\\.ranger",
         "mlr3_pred_fun"
       )
     )

DESCRIPTION

Lines changed: 7 additions & 7 deletions
@@ -7,13 +7,13 @@ Authors@R: c(
     person("Przemyslaw", "Biecek", , "przemyslaw.biecek@gmail.com", role = "ctb",
            comment = c(ORCID = "0000-0001-8423-1823"))
   )
-Description: Efficient implementation of Kernel SHAP, see Lundberg and Lee (2017),
-    and Covert and Lee (2021) <http://proceedings.mlr.press/v130/covert21a>.
-    For models with up to eight features, the results are exact regarding the
-    selected background data. Otherwise, an almost exact hybrid algorithm
-    involving iterative sampling is used. The package plays well together
-    with meta-learning packages like 'tidymodels', 'caret' or 'mlr3'.
-    Visualizations can be done using the R package 'shapviz'.
+Description: Efficient implementation of Kernel SHAP, see Lundberg and Lee
+    (2017), and Covert and Lee (2021)
+    <http://proceedings.mlr.press/v130/covert21a>. Furthermore, for up to
+    14 features, exact permutation SHAP values can be calculated. The
+    package plays well together with meta-learning packages like
+    'tidymodels', 'caret' or 'mlr3'. Visualizations can be done using the
+    R package 'shapviz'.
 License: GPL (>= 2)
 Depends:
     R (>= 3.2.0)
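
For context (not part of the diff): the basic workflow of the new function mirrors the examples added in R/permshap.R further down in this commit. A minimal sketch:

library(kernelshap)

# Linear regression on iris; explain two rows against a small background sample
fit <- lm(Sepal.Length ~ ., data = iris)
X_explain <- iris[1:2, -1]
set.seed(1)
bg_X <- iris[sample(nrow(iris), 100), ]

s <- permshap(fit, X_explain, bg_X = bg_X)  # exact permutation SHAP values
s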

NAMESPACE

Lines changed: 6 additions & 0 deletions
@@ -3,8 +3,14 @@
 S3method(kernelshap,Learner)
 S3method(kernelshap,default)
 S3method(kernelshap,ranger)
+S3method(permshap,Learner)
+S3method(permshap,default)
+S3method(permshap,ranger)
 S3method(print,kernelshap)
+S3method(print,permshap)
 S3method(summary,kernelshap)
 export(is.kernelshap)
+export(is.permshap)
 export(kernelshap)
+export(permshap)
 importFrom(foreach,"%dopar%")

NEWS.md

Lines changed: 1 addition & 0 deletions
@@ -2,6 +2,7 @@
 
 ## Major changes
 
+- Added `permshap()` to calculate exact permutation SHAP values. The function currently works for up to 14 features.
 - Factor-valued predictions are now supported. Each level is represented by its dummy variable.
 
 ## Other changes
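
Since exact Kernel SHAP (used for up to eight features) and the new exact permutation SHAP both compute exact Shapley values with respect to the same background data, one would expect their results to agree up to numerical error. An illustrative sanity check (not part of the commit):

fit <- lm(Sepal.Length ~ ., data = iris)
X_explain <- iris[1:2, -1]
bg_X <- iris[-1]  # all feature columns as background data

ks <- kernelshap(fit, X_explain, bg_X = bg_X)  # exact Kernel SHAP for p = 4 features
ps <- permshap(fit, X_explain, bg_X = bg_X)    # exact permutation SHAP

all.equal(ks$S, ps$S)  # expected TRUE (up to numerical tolerance)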

R/kernelshap.R

Lines changed: 10 additions & 29 deletions
@@ -68,7 +68,7 @@
 #' In cases with a natural "off" value (like MNIST digits),
 #' this can also be a single row with all values set to the off value.
 #' @param pred_fun Prediction function of the form `function(object, X, ...)`,
-#'   providing \eqn{K \ge 1} numeric predictions per row. Its first argument
+#'   providing \eqn{K \ge 1} predictions per row. Its first argument
 #'   represents the model `object`, its second argument a data structure like `X`.
 #'   Additional (named) arguments are passed via `...`.
 #'   The default, [stats::predict()], will work in most cases.
@@ -113,7 +113,7 @@
 #' @param max_iter If the stopping criterion (see `tol`) is not reached after
 #'   `max_iter` iterations, the algorithm stops. Ignored if `exact = TRUE`.
 #' @param parallel If `TRUE`, use parallel [foreach::foreach()] to loop over rows
-#'   to be explained. Must register backend beforehand, e.g., via {doFuture} package,
+#'   to be explained. Must register backend beforehand, e.g., via 'doFuture' package,
 #'   see README for an example. Parallelization automatically disables the progress bar.
 #' @param parallel_args Named list of arguments passed to [foreach::foreach()].
 #'   Ideally, this is `NULL` (default). Only relevant if `parallel = TRUE`.
@@ -191,19 +191,9 @@ kernelshap.default <- function(object, X, bg_X, pred_fun = stats::predict,
                                m = 2L * length(feature_names) * (1L + 3L * (hybrid_degree == 0L)),
                                tol = 0.005, max_iter = 100L, parallel = FALSE,
                                parallel_args = NULL, verbose = TRUE, ...) {
+  basic_checks(X = X, bg_X = bg_X, feature_names = feature_names, pred_fun = pred_fun)
+  p <- length(feature_names)
   stopifnot(
-    is.matrix(X) || is.data.frame(X),
-    is.matrix(bg_X) || is.data.frame(bg_X),
-    is.matrix(X) == is.matrix(bg_X),
-    dim(X) >= 1L,
-    dim(bg_X) >= 1L,
-    !is.null(colnames(X)),
-    !is.null(colnames(bg_X)),
-    (p <- length(feature_names)) >= 1L,
-    all(feature_names %in% colnames(X)),
-    all(feature_names %in% colnames(bg_X)),  # not necessary, but clearer
-    all(colnames(X) %in% colnames(bg_X)),
-    is.function(pred_fun),
     exact %in% c(TRUE, FALSE),
     p == 1L || exact || hybrid_degree %in% 0:(p / 2),
     paired_sampling %in% c(TRUE, FALSE),
@@ -212,27 +202,20 @@ kernelshap.default <- function(object, X, bg_X, pred_fun = stats::predict,
   n <- nrow(X)
   bg_n <- nrow(bg_X)
   if (!is.null(bg_w)) {
-    stopifnot(length(bg_w) == bg_n, all(bg_w >= 0), !all(bg_w == 0))
-    if (!is.double(bg_w)) {
-      bg_w <- as.double(bg_w)
-    }
-  }
-  if (is.matrix(X) && !identical(colnames(X), feature_names)) {
-    stop("If X is a matrix, feature_names must equal colnames(X)")
+    bg_w <- prep_w(bg_w, bg_n = bg_n)
   }
 
   # Calculate v1 and v0
   v1 <- align_pred(pred_fun(object, X, ...))  # Predictions on X: n x K
   bg_preds <- align_pred(pred_fun(object, bg_X[, colnames(X), drop = FALSE], ...))
-  v0 <- weighted_colMeans(bg_preds, bg_w)  # Average pred of bg data: 1 x K
+  v0 <- wcolMeans(bg_preds, bg_w)  # Average pred of bg data: 1 x K
 
   # For p = 1, exact Shapley values are returned
   if (p == 1L) {
-    return(
-      case_p1(
-        n = n, feature_names = feature_names, v0 = v0, v1 = v1, X = X, verbose = verbose
-      )
+    out <- case_p1(
+      n = n, feature_names = feature_names, v0 = v0, v1 = v1, X = X, verbose = verbose
     )
+    return(out)
   }
 
   # Drop unnecessary columns in bg_X. If X is matrix, also column order is relevant
@@ -266,9 +249,7 @@ kernelshap.default <- function(object, X, bg_X, pred_fun = stats::predict,
     message(txt)
   }
   if (max(m, m_exact) * bg_n > 2e5) {
-    warning("\nPredictions on large data sets with ", max(m, m_exact), "x", bg_n,
-            " observations are being done.\n",
-            "Consider reducing the computational burden (e.g. use smaller X_bg)")
+    warning_burden(max(m, m_exact), bg_n = bg_n)
  }
 
   # Apply Kernel SHAP to each row of X
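
The refactor above moves the inline input validation into small helpers (basic_checks(), prep_w()), renames weighted_colMeans() to wcolMeans(), and wraps the old warning text in warning_burden(); permshap() reuses the same helpers. Their definitions are not shown in this excerpt. The following sketch reconstructs two of them from the removed inline code; the actual implementations elsewhere in the commit may differ:

# Assumed helper sketches (hypothetical; the real code likely lives in R/utils.R)
basic_checks <- function(X, bg_X, feature_names, pred_fun) {
  stopifnot(
    is.matrix(X) || is.data.frame(X),
    is.matrix(bg_X) || is.data.frame(bg_X),
    is.matrix(X) == is.matrix(bg_X),
    dim(X) >= 1L,
    dim(bg_X) >= 1L,
    !is.null(colnames(X)),
    !is.null(colnames(bg_X)),
    length(feature_names) >= 1L,
    all(feature_names %in% colnames(X)),
    all(feature_names %in% colnames(bg_X)),
    all(colnames(X) %in% colnames(bg_X)),
    is.function(pred_fun)
  )
  if (is.matrix(X) && !identical(colnames(X), feature_names)) {
    stop("If X is a matrix, feature_names must equal colnames(X)")
  }
  invisible(TRUE)
}

prep_w <- function(w, bg_n) {
  # Validate and coerce background weights, as the removed inline code did
  stopifnot(length(w) == bg_n, all(w >= 0), !all(w == 0))
  if (!is.double(w)) as.double(w) else w
}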

R/methods.R

Lines changed: 24 additions & 1 deletion
@@ -18,6 +18,12 @@ print.kernelshap <- function(x, n = 2L, ...) {
   invisible(x)
 }
 
+#' @describeIn print.kernelshap Print method for "permshap" object
+#' @export
+print.permshap <- function(x, n = 2L, ...) {
+  print.kernelshap(x, n = n, ...)
+}
+
 #' Summary Method
 #'
 #' @param object An object of class "kernelshap".
@@ -76,11 +82,28 @@ summary.kernelshap <- function(object, compact = FALSE, n = 2L, ...) {
 #' @returns `TRUE` if `object` is of class "kernelshap", and `FALSE` otherwise.
 #' @export
 #' @examples
-#' fit <- stats::lm(Sepal.Length ~ ., data = iris)
+#' fit <- lm(Sepal.Length ~ ., data = iris)
 #' s <- kernelshap(fit, iris[1:2, -1], bg_X = iris[-1])
 #' is.kernelshap(s)
 #' is.kernelshap("a")
 #' @seealso [kernelshap()]
 is.kernelshap <- function(object){
   inherits(object, "kernelshap")
 }
+
+#' Check for permshap
+#'
+#' Is object of class "permshap"?
+#'
+#' @param object An R object.
+#' @returns `TRUE` if `object` is of class "permshap", and `FALSE` otherwise.
+#' @export
+#' @examples
+#' fit <- lm(Sepal.Length ~ ., data = iris)
+#' s <- permshap(fit, iris[1:2, -1], bg_X = iris[-1])
+#' is.permshap(s)
+#' is.permshap("a")
+#' @seealso [kernelshap()]
+is.permshap <- function(object){
+  inherits(object, "permshap")
+}
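
A quick illustration (not part of the commit) of the new methods: print() dispatches to print.permshap(), which simply reuses print.kernelshap(), and is.permshap() is the class check documented above.

fit <- lm(Sepal.Length ~ ., data = iris)
s <- permshap(fit, iris[1:3, -1], bg_X = iris[-1])
print(s, n = 3L)  # delegates to print.kernelshap()
is.permshap(s)    # TRUE
is.permshap("a")  # FALSE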

R/permshap.R

Lines changed: 181 additions & 0 deletions
@@ -0,0 +1,181 @@
+#' Permutation SHAP
+#'
+#' Exact permutation SHAP values with respect to a background dataset.
+#' The function is currently limited to maximum 14 features.
+#'
+#' @inheritParams kernelshap
+#' @returns
+#' An object of class "permshap" with the following components:
+#' - `S`: \eqn{(n \times p)} matrix with SHAP values or, if the model output has
+#'   dimension \eqn{K > 1}, a list of \eqn{K} such matrices.
+#' - `X`: Same as input argument `X`.
+#' - `baseline`: Vector of length K representing the average prediction on the
+#'   background data.
+#' - `m_exact`: Integer providing the effective number of exact on-off vectors used.
+#' - `exact`: Logical flag indicating whether calculations are exact or not
+#'   (currently `TRUE`).
+#' - `txt`: Summary text.
+#' - `predictions`: \eqn{(n \times K)} matrix with predictions of `X`.
+#' @export
+#' @examples
+#' # MODEL ONE: Linear regression
+#' fit <- lm(Sepal.Length ~ ., data = iris)
+#'
+#' # Select rows to explain (only feature columns)
+#' X_explain <- iris[1:2, -1]
+#'
+#' # Select small background dataset (could use all rows here because iris is small)
+#' set.seed(1)
+#' bg_X <- iris[sample(nrow(iris), 100), ]
+#'
+#' # Calculate SHAP values
+#' s <- permshap(fit, X_explain, bg_X = bg_X)
+#' s
+#'
+#' # MODEL TWO: Multi-response linear regression
+#' fit <- lm(as.matrix(iris[1:2]) ~ Petal.Length + Petal.Width + Species, data = iris)
+#' s <- permshap(fit, iris[1:4, 3:5], bg_X = bg_X)
+#' s
+#'
+#' # Non-feature columns can be dropped via 'feature_names'
+#' s <- permshap(
+#'   fit,
+#'   iris[1:4, ],
+#'   bg_X = bg_X,
+#'   feature_names = c("Petal.Length", "Petal.Width", "Species")
+#' )
+#' s
+permshap <- function(object, ...) {
+  UseMethod("permshap")
+}
+
+#' @describeIn permshap Default permutation SHAP method.
+#' @export
+permshap.default <- function(object, X, bg_X, pred_fun = stats::predict,
+                             feature_names = colnames(X), bg_w = NULL,
+                             parallel = FALSE, parallel_args = NULL,
+                             verbose = TRUE, ...) {
+  basic_checks(X = X, bg_X = bg_X, feature_names = feature_names, pred_fun = pred_fun)
+  p <- length(feature_names)
+  stopifnot("Permutation SHAP only supported for up to 14 features" = p <= 14L)
+  n <- nrow(X)
+  bg_n <- nrow(bg_X)
+  if (!is.null(bg_w)) {
+    bg_w <- prep_w(bg_w, bg_n = bg_n)
+  }
+  txt <- "Exact permutation SHAP"
+  if (verbose) {
+    message(txt)
+  }
+
+  # Baseline and predictions on explanation data (latter not required in algo)
+  bg_preds <- align_pred(pred_fun(object, bg_X[, colnames(X), drop = FALSE], ...))
+  v0 <- wcolMeans(bg_preds, bg_w)             # Average pred of bg data: 1 x K
+  v1 <- align_pred(pred_fun(object, X, ...))  # Predictions on X: n x K
+
+  # Drop unnecessary columns in bg_X. If X is matrix, also column order is relevant
+  # Predictions will never be applied directly to bg_X anymore
+  if (!identical(colnames(bg_X), feature_names)) {
+    bg_X <- bg_X[, feature_names, drop = FALSE]
+  }
+
+  # Precalculations that are identical for each row to be explained
+  Z <- exact_Z(p, feature_names = feature_names, keep_extremes = TRUE)
+  m_exact <- nrow(Z)
+  precalc <- list(
+    Z = Z,
+    Z_code = rowpaste(Z),
+    bg_X_rep = bg_X[rep(seq_len(bg_n), times = m_exact), , drop = FALSE]
+  )
+
+  if (m_exact * bg_n > 2e5) {
+    warning_burden(m_exact, bg_n = bg_n)
+  }
+
+  # Apply permutation SHAP to each row of X
+  if (isTRUE(parallel)) {
+    parallel_args <- c(list(i = seq_len(n)), parallel_args)
+    res <- do.call(foreach::foreach, parallel_args) %dopar% permshap_one(
+      x = X[i, , drop = FALSE],
+      object = object,
+      pred_fun = pred_fun,
+      bg_w = bg_w,
+      precalc = precalc,
+      ...
+    )
+  } else {
+    if (verbose && n >= 2L) {
+      pb <- utils::txtProgressBar(max = n, style = 3)
+    }
+    res <- vector("list", n)
+    for (i in seq_len(n)) {
+      res[[i]] <- permshap_one(
+        x = X[i, , drop = FALSE],
+        object = object,
+        pred_fun = pred_fun,
+        bg_w = bg_w,
+        precalc = precalc,
+        ...
+      )
+      if (verbose && n >= 2L) {
+        utils::setTxtProgressBar(pb, i)
+      }
+    }
+  }
+  out <- list(
+    S = reorganize_list(res),
+    X = X,
+    baseline = as.vector(v0),
+    m_exact = m_exact,
+    exact = TRUE,
+    txt = txt,
+    predictions = v1
+  )
+  class(out) <- "permshap"
+  out
+}
+
+#' @describeIn permshap Permutation SHAP method for "ranger" models, see Readme for an example.
+#' @export
+permshap.ranger <- function(object, X, bg_X,
+                            pred_fun = function(m, X, ...) stats::predict(m, X, ...)$predictions,
+                            feature_names = colnames(X),
+                            bg_w = NULL, parallel = FALSE, parallel_args = NULL,
+                            verbose = TRUE, ...) {
+  permshap.default(
+    object = object,
+    X = X,
+    bg_X = bg_X,
+    pred_fun = pred_fun,
+    feature_names = feature_names,
+    bg_w = bg_w,
+    parallel = parallel,
+    parallel_args = parallel_args,
+    verbose = verbose,
+    ...
+  )
+}
+
+#' @describeIn permshap Permutation SHAP method for "mlr3" models, see Readme for an example.
+#' @export
+permshap.Learner <- function(object, X, bg_X,
+                             pred_fun = NULL,
+                             feature_names = colnames(X),
+                             bg_w = NULL, parallel = FALSE, parallel_args = NULL,
+                             verbose = TRUE, ...) {
+  if (is.null(pred_fun)) {
+    pred_fun <- mlr3_pred_fun(object, X = X)
+  }
+  permshap.default(
+    object = object,
+    X = X,
+    bg_X = bg_X,
+    pred_fun = pred_fun,
+    feature_names = feature_names,
+    bg_w = bg_w,
+    parallel = parallel,
+    parallel_args = parallel_args,
+    verbose = verbose,
+    ...
+  )
+}
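
Why the 14-feature cap: the exact algorithm precalculates an on-off matrix Z via exact_Z() with keep_extremes = TRUE and evaluates the prediction function on the background data replicated once per row of Z. Assuming Z enumerates all subsets of the p features (including the empty and full subsets), m_exact grows as 2^p, which is why the burden warning fires quickly for larger p. A rough illustration under that assumption (not part of the commit):

# Hypothetical cost illustration (assumes m_exact = 2^p)
p <- c(8L, 10L, 12L, 14L)
bg_n <- 100L                 # background rows
m_exact <- 2^p               # on-off vectors evaluated per explained row
data.frame(p = p, m_exact = m_exact, preds_per_row = m_exact * bg_n)
# At p = 14 and bg_n = 100, each explained row needs 1,638,400 background
# predictions, well above the 2e5 threshold used by warning_burden().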
