tidyverse
diff --git a/DESCRIPTION b/DESCRIPTION
Lines changed: 2 additions & 1 deletion
diff --git a/NEWS.md b/NEWS.md
Lines changed: 2 additions & 0 deletions
diff --git a/R/case-match.R b/R/case-match.R
Lines changed: 84 additions & 45 deletions
diff --git a/_pkgdown.yml b/_pkgdown.yml
Lines changed: 1 addition & 1 deletion
@@ -25,7 +25,7 @@ Imports:
     cli (>= 3.6.2),
     generics,
     glue (>= 1.3.2),
-    lifecycle (>= 1.0.3),
+    lifecycle (>= 1.0.4.9000),
     magrittr (>= 1.5),
     methods,
     pillar (>= 1.9.0),
@@ -67,4 +67,5 @@ LazyData: true
 Roxygen: list(markdown = TRUE)
 RoxygenNote: 7.3.3
 Remotes:
+    r-lib/lifecycle,
     r-lib/vctrs
@@ -1,5 +1,7 @@
 # dplyr (development version)
 
+* `case_match()` is now superseded by `recode_values()` and `replace_values()`.
+
 * The superseded `recode()` now has updated documentation showing how to migrate to `recode_values()` and `replace_values()`.
 
 * `case_when()` is now part of a family of 4 related functions, 3 of which are new:
 
@@ -1,34 +1,19 @@
 #' A general vectorised `switch()`
 #'
 #' @description
+#' `r lifecycle::badge("superseded")`
+#'
+#' `case_match()` is superseded by [recode_values()] and [replace_values()],
+#' which are more powerful, have more intuitive names, and are safer to use.
+#' In addition to the familiar two-sided formula interface, these functions also
+#' have `from` and `to` arguments which allow you to incorporate a lookup table
+#' into the recoding process.
+#'
 #' This function allows you to vectorise multiple [switch()] statements. Each
 #' case is evaluated sequentially and the first match for each element
 #' determines the corresponding value in the output vector. If no cases match,
 #' the `.default` is used.
 #'
-#' `case_match()` is an R equivalent of the SQL "simple" `CASE WHEN` statement.
-#'
-#' ## Connection to `case_when()`
-#'
-#' While [case_when()] uses logical expressions on the left-hand side of the
-#' formula, `case_match()` uses values to match against `.x` with. The following
-#' two statements are roughly equivalent:
-#'
-#' ```
-#' case_when(
-#'   x %in% c("a", "b") ~ 1,
-#'   x %in% "c" ~ 2,
-#'   x %in% c("d", "e") ~ 3
-#' )
-#'
-#' case_match(
-#'   x,
-#'   c("a", "b") ~ 1,
-#'   "c" ~ 2,
-#'   c("d", "e") ~ 3
-#' )
-#' ```
-#'
 #' @param .x A vector to match against.
 #'
 #' @param ... <[`dynamic-dots`][rlang::dyn-dots]> A sequence of two-sided
@@ -58,61 +43,98 @@
 #' A vector with the same size as `.x` and the same type as the common type of
 #' the RHS inputs and `.default` (if not overridden by `.ptype`).
 #'
-#' @seealso [case_when()]
-#'
 #' @export
 #' @examples
+#' # `case_match()` has been superseded by `recode_values()` and
+#' # `replace_values()`
+#'
 #' x <- c("a", "b", "a", "d", "b", NA, "c", "e")
 #'
-#' # `case_match()` acts like a vectorized `switch()`.
-#' # Unmatched values "fall through" as a missing value.
+#' # `recode_values()` is a 1:1 replacement for `case_match()`
 #' case_match(
 #'   x,
 #'   "a" ~ 1,
 #'   "b" ~ 2,
 #'   "c" ~ 3,
 #'   "d" ~ 4
 #' )
-#'
-#' # Missing values can be matched exactly, and `.default` can be used to
-#' # control the value used for unmatched values of `.x`
-#' case_match(
+#' recode_values(
 #'   x,
 #'   "a" ~ 1,
 #'   "b" ~ 2,
 #'   "c" ~ 3,
-#'   "d" ~ 4,
-#'   NA ~ 0,
-#'   .default = 100
+#'   "d" ~ 4
 #' )
 #'
-#' # Input values can be grouped into the same expression to map them to the
-#' # same output value
-#' case_match(
+#' # `recode_values()` has an additional `unmatched` argument to help you catch
+#' # missed mappings
+#' try(recode_values(
 #'   x,
-#'   c("a", "b") ~ "low",
-#'   c("c", "d", "e") ~ "high"
+#'   "a" ~ 1,
+#'   "b" ~ 2,
+#'   "c" ~ 3,
+#'   "d" ~ 4,
+#'   unmatched = "error"
+#' ))
+#'
+#' # `recode_values()` also has additional `from` and `to` arguments, which are
+#' # useful when your lookup table is defined elsewhere (for example, it could
+#' # be read in from a CSV file). This is very difficult to do with
+#' # `case_match()`!
+#' lookup <- tribble(
+#'   ~from, ~to,
+#'   "a", 1,
+#'   "b", 2,
+#'   "c", 3,
+#'   "d", 4
 #' )
 #'
-#' # `case_match()` isn't limited to character input:
-#' y <- c(1, 2, 1, 3, 1, NA, 2, 4)
+#' recode_values(x, from = lookup$from, to = lookup$to)
+#'
+#' # Both `case_match()` and `recode_values()` work with more than just
+#' # character inputs:
+#' y <- as.integer(c(1, 2, 1, 3, 1, NA, 2, 4))
 #'
 #' case_match(
 #'   y,
 #'   c(1, 3) ~ "odd",
 #'   c(2, 4) ~ "even",
 #'   .default = "missing"
 #' )
+#' recode_values(
+#'   y,
+#'   c(1, 3) ~ "odd",
+#'   c(2, 4) ~ "even",
+#'   default = "missing"
+#' )
+#'
+#' # Or with a lookup table
+#' lookup <- tribble(
+#'   ~from,   ~to,
+#'   c(1, 3), "odd",
+#'   c(2, 4), "even"
+#' )
+#' recode_values(y, from = lookup$from, to = lookup$to, default = "missing")
 #'
-#' # Setting `.default` to the original vector is a useful way to replace
-#' # selected values, leaving everything else as is
+#' # `replace_values()` is a convenient way to replace selected values, leaving
+#' # everything else as is. It's similar to `case_match(y, .default = y)`.
+#' replace_values(y, NA ~ 0)
 #' case_match(y, NA ~ 0, .default = y)
 #'
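+#' # Notably, `replace_values()` is type stable, which means that `y` can't
+#' # change types out from under you, unlike with `case_match()`! Here `y` is
+#' # an integer vector and `0` is a double, so `case_match()` returns a double
+#' # while `replace_values()` still returns an integer.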
+#' typeof(y)
+#' typeof(replace_values(y, NA ~ 0))
+#' typeof(case_match(y, NA ~ 0, .default = y))
+#'
+#' # We believe that `replace_values()` better expresses intent when doing a
+#' # partial replacement. Compare these two `mutate()` calls, which share the
+#' # same two goals:
+#' # - Replace missing values in `hair_color`
+#' # - Replace some of the `species` values
 #' starwars |>
 #'   mutate(
-#'     # Replace missings, but leave everything else alone
 #'     hair_color = case_match(hair_color, NA ~ "unknown", .default = hair_color),
-#'     # Replace some, but not all, of the species
 #'     species = case_match(
 #'       species,
 #'       "Human" ~ "Humanoid",
@@ -122,7 +144,24 @@
 #'     ),
 #'     .keep = "used"
 #'   )
+#'
+#' updates <- tribble(
+#'   ~from,                ~to,
+#'   "Human",              "Humanoid",
+#'   "Droid",              "Robot",
+#'   c("Wookiee", "Ewok"), "Hairy"
+#' )
+#'
+#' starwars |>
+#'   mutate(
+#'     hair_color = replace_values(hair_color, NA ~ "unknown"),
+#'     species = replace_values(species, from = updates$from, to = updates$to),
+#'     .keep = "used"
+#'   )
 case_match <- function(.x, ..., .default = NULL, .ptype = NULL) {
+  # Superseded in dplyr 1.2.0
+  lifecycle::signal_stage("superseded", "case_match()", "recode_values()")
+
   # Matching historical behavior of `case_match()`, which was to work like
   # `case_when()` and not allow empty `...`. Newer `replace_when()` and
   # `replace_values()` are a no-op for this case, but we superseded
 
@@ -89,7 +89,6 @@ reference:
     not data frames.
   contents:
   - between
-  - case_match
   - case_when
   - recode_values
   - coalesce
@@ -137,6 +136,7 @@ reference:
   - vars
   - with_groups
   - recode
+  - case_match
 
 - title: Remote tables
   contents: