Skip to content

Augment fails in 0.1.6 with a character ID column #506

Closed
@cgoo4

Description

@cgoo4

`augment()` handled character ID columns in parsnip 0.1.5, but it errors in 0.1.6, as shown in this reprex:

# Reprex: augment() on a fitted workflow whose recipe carries a character
# column with the "id" role.
library(tidyverse)
library(tidymodels)
#> Registered S3 method overwritten by 'tune':
#>   method                   from   
#>   required_pkgs.model_spec parsnip

# Uncomment to install parsnip 0.1.5, the version in which augment() below
# was reported to work.
# devtools::install_version("parsnip", "0.1.5")

# Boosted-tree classification model using the xgboost engine.
mt_model <- boost_tree() %>%
  set_mode("classification") %>%
  set_engine("xgboost")

# Move the mtcars row names into a column (referenced below as `rowname`)
# and convert the outcome `vs` to a factor.
mtcars_tb <- as_tibble(mtcars %>% rownames_to_column()) %>% 
  mutate(vs = factor(vs))

# Assign roles: `vs` is the outcome, `rowname` is an id column, and every
# remaining column becomes a predictor.
mt_recipe <-
  mtcars_tb %>%
  recipe() %>%
  update_role(vs, new_role = "outcome") %>%
  update_role(rowname, new_role = "id") %>%
  update_role(-has_role("outcome"), -has_role("id"), new_role = "predictor")

# Bundle the recipe and the model specification into one workflow.
mt_wflow <- workflow() %>%
  add_recipe(mt_recipe) %>%
  add_model(mt_model)

# Fit on the first 25 rows; rows 26-32 are held back as new data.
mt_fit <- mt_wflow %>%
  fit(mtcars_tb[1:25, ])
#> [12:54:49] WARNING: amalgamation/../src/learner.cc:1095: Starting in XGBoost 1.3.0, the default evaluation metric used with the objective 'binary:logistic' was changed from 'error' to 'logloss'. Explicitly set eval_metric if you'd like to restore the old behavior.

# Fails for parsnip 0.1.6
# The error below shows character data reaching xgboost::xgb.DMatrix().
# NOTE(review): presumably the character `rowname` id column is not dropped
# before prediction -- confirm against the parsnip augment() implementation.
mt_results <- mt_fit %>% augment(new_data = mtcars_tb[26:32, ])
#> Error in xgboost::xgb.DMatrix(data = newdata, missing = NA): 'data' has class 'character' and length 77.
#>   'data' accepts either a numeric matrix or a single filename.

# Work-around for parsnip 0.1.6: call predict() on the fitted workflow
# directly instead of augment(), then bind the prediction columns onto the
# new data. Each prediction type is computed exactly once. The result has the
# original columns followed by .pred_class, .pred_0 and .pred_1.
mt_results <-
  mtcars_tb[26:32, ] %>%
  bind_cols(
    # `.` inside the nested predict() calls refers to the piped-in new data;
    # the pipe still passes that data as the first argument of bind_cols().
    predict(mt_fit, new_data = .),
    predict(mt_fit, new_data = ., type = "prob")
  )

Created on 2021-05-30 by the reprex package (v2.0.0)

Session info
# Print the R version, platform settings and package versions in use for
# this reprex.
sessioninfo::session_info()
#> ─ Session info ───────────────────────────────────────────────────────────────
#>  setting  value                       
#>  version  R version 4.1.0 (2021-05-18)
#>  os       macOS Big Sur 10.16         
#>  system   x86_64, darwin17.0          
#>  ui       X11                         
#>  language (EN)                        
#>  collate  en_GB.UTF-8                 
#>  ctype    en_GB.UTF-8                 
#>  tz       Europe/London               
#>  date     2021-05-30                  
#> 
#> ─ Packages ───────────────────────────────────────────────────────────────────
#>  package      * version    date       lib source                          
#>  assertthat     0.2.1      2019-03-21 [1] CRAN (R 4.1.0)                  
#>  backports      1.2.1      2020-12-09 [1] CRAN (R 4.1.0)                  
#>  broom        * 0.7.6      2021-04-05 [1] CRAN (R 4.1.0)                  
#>  cellranger     1.1.0      2016-07-27 [1] CRAN (R 4.1.0)                  
#>  class          7.3-19     2021-05-03 [1] CRAN (R 4.1.0)                  
#>  cli            2.5.0      2021-04-26 [1] CRAN (R 4.1.0)                  
#>  codetools      0.2-18     2020-11-04 [1] CRAN (R 4.1.0)                  
#>  colorspace     2.0-1      2021-05-04 [1] CRAN (R 4.1.0)                  
#>  crayon         1.4.1      2021-02-08 [1] CRAN (R 4.1.0)                  
#>  data.table     1.14.0     2021-02-21 [1] CRAN (R 4.1.0)                  
#>  DBI            1.1.1      2021-01-15 [1] CRAN (R 4.1.0)                  
#>  dbplyr         2.1.1      2021-04-06 [1] CRAN (R 4.1.0)                  
#>  dials        * 0.0.9      2020-09-16 [1] CRAN (R 4.1.0)                  
#>  DiceDesign     1.9        2021-02-13 [1] CRAN (R 4.1.0)                  
#>  digest         0.6.27     2020-10-24 [1] CRAN (R 4.1.0)                  
#>  dplyr        * 1.0.6      2021-05-05 [1] CRAN (R 4.1.0)                  
#>  ellipsis       0.3.2      2021-04-29 [1] CRAN (R 4.1.0)                  
#>  evaluate       0.14       2019-05-28 [1] CRAN (R 4.1.0)                  
#>  fansi          0.5.0      2021-05-25 [1] CRAN (R 4.1.0)                  
#>  forcats      * 0.5.1      2021-01-27 [1] CRAN (R 4.1.0)                  
#>  foreach        1.5.1      2020-10-15 [1] CRAN (R 4.1.0)                  
#>  fs             1.5.0      2020-07-31 [1] CRAN (R 4.1.0)                  
#>  furrr          0.2.2      2021-01-29 [1] CRAN (R 4.1.0)                  
#>  future         1.21.0     2020-12-10 [1] CRAN (R 4.1.0)                  
#>  generics       0.1.0      2020-10-31 [1] CRAN (R 4.1.0)                  
#>  ggplot2      * 3.3.3      2020-12-30 [1] CRAN (R 4.1.0)                  
#>  globals        0.14.0     2020-11-22 [1] CRAN (R 4.1.0)                  
#>  glue           1.4.2      2020-08-27 [1] CRAN (R 4.1.0)                  
#>  gower          0.2.2      2020-06-23 [1] CRAN (R 4.1.0)                  
#>  GPfit          1.0-8      2019-02-08 [1] CRAN (R 4.1.0)                  
#>  gtable         0.3.0      2019-03-25 [1] CRAN (R 4.1.0)                  
#>  hardhat        0.1.5      2020-11-09 [1] CRAN (R 4.1.0)                  
#>  haven          2.4.1      2021-04-23 [1] CRAN (R 4.1.0)                  
#>  highr          0.9        2021-04-16 [1] CRAN (R 4.1.0)                  
#>  hms            1.1.0      2021-05-17 [1] CRAN (R 4.1.0)                  
#>  htmltools      0.5.1.1    2021-01-22 [1] CRAN (R 4.1.0)                  
#>  httr           1.4.2      2020-07-20 [1] CRAN (R 4.1.0)                  
#>  infer        * 0.5.4      2021-01-13 [1] CRAN (R 4.1.0)                  
#>  ipred          0.9-11     2021-03-12 [1] CRAN (R 4.1.0)                  
#>  iterators      1.0.13     2020-10-15 [1] CRAN (R 4.1.0)                  
#>  jsonlite       1.7.2      2020-12-09 [1] CRAN (R 4.1.0)                  
#>  knitr          1.33       2021-04-24 [1] CRAN (R 4.1.0)                  
#>  lattice        0.20-44    2021-05-02 [1] CRAN (R 4.1.0)                  
#>  lava           1.6.9      2021-03-11 [1] CRAN (R 4.1.0)                  
#>  lhs            1.1.1      2020-10-05 [1] CRAN (R 4.1.0)                  
#>  lifecycle      1.0.0      2021-02-15 [1] CRAN (R 4.1.0)                  
#>  listenv        0.8.0      2019-12-05 [1] CRAN (R 4.1.0)                  
#>  lubridate      1.7.10     2021-02-26 [1] CRAN (R 4.1.0)                  
#>  magrittr       2.0.1      2020-11-17 [1] CRAN (R 4.1.0)                  
#>  MASS           7.3-54     2021-05-03 [1] CRAN (R 4.1.0)                  
#>  Matrix         1.3-3      2021-05-04 [1] CRAN (R 4.1.0)                  
#>  modeldata    * 0.1.0      2020-10-22 [1] CRAN (R 4.1.0)                  
#>  modelr         0.1.8      2020-05-19 [1] CRAN (R 4.1.0)                  
#>  munsell        0.5.0      2018-06-12 [1] CRAN (R 4.1.0)                  
#>  nnet           7.3-16     2021-05-03 [1] CRAN (R 4.1.0)                  
#>  parallelly     1.25.0     2021-04-30 [1] CRAN (R 4.1.0)                  
#>  parsnip      * 0.1.6      2021-05-27 [1] CRAN (R 4.1.0)                  
#>  pillar         1.6.1      2021-05-16 [1] CRAN (R 4.1.0)                  
#>  pkgconfig      2.0.3      2019-09-22 [1] CRAN (R 4.1.0)                  
#>  plyr           1.8.6      2020-03-03 [1] CRAN (R 4.1.0)                  
#>  pROC           1.17.0.1   2021-01-13 [1] CRAN (R 4.1.0)                  
#>  prodlim        2019.11.13 2019-11-17 [1] CRAN (R 4.1.0)                  
#>  purrr        * 0.3.4.9000 2021-05-22 [1] Github (tidyverse/purrr@5aca9df)
#>  R6             2.5.0      2020-10-28 [1] CRAN (R 4.1.0)                  
#>  Rcpp           1.0.6      2021-01-15 [1] CRAN (R 4.1.0)                  
#>  readr        * 1.4.0      2020-10-05 [1] CRAN (R 4.1.0)                  
#>  readxl         1.3.1      2019-03-13 [1] CRAN (R 4.1.0)                  
#>  recipes      * 0.1.16     2021-04-16 [1] CRAN (R 4.1.0)                  
#>  reprex         2.0.0      2021-04-02 [1] CRAN (R 4.1.0)                  
#>  rlang          0.4.11     2021-04-30 [1] CRAN (R 4.1.0)                  
#>  rmarkdown      2.8        2021-05-07 [1] CRAN (R 4.1.0)                  
#>  rpart          4.1-15     2019-04-12 [1] CRAN (R 4.1.0)                  
#>  rsample      * 0.1.0      2021-05-08 [1] CRAN (R 4.1.0)                  
#>  rstudioapi     0.13       2020-11-12 [1] CRAN (R 4.1.0)                  
#>  rvest          1.0.0      2021-03-09 [1] CRAN (R 4.1.0)                  
#>  scales       * 1.1.1      2020-05-11 [1] CRAN (R 4.1.0)                  
#>  sessioninfo    1.1.1      2018-11-05 [1] CRAN (R 4.1.0)                  
#>  stringi        1.6.2      2021-05-17 [1] CRAN (R 4.1.0)                  
#>  stringr      * 1.4.0      2019-02-10 [1] CRAN (R 4.1.0)                  
#>  styler         1.4.1      2021-03-30 [1] CRAN (R 4.1.0)                  
#>  survival       3.2-11     2021-04-26 [1] CRAN (R 4.1.0)                  
#>  tibble       * 3.1.2      2021-05-16 [1] CRAN (R 4.1.0)                  
#>  tidymodels   * 0.1.3      2021-04-19 [1] CRAN (R 4.1.0)                  
#>  tidyr        * 1.1.3      2021-03-03 [1] CRAN (R 4.1.0)                  
#>  tidyselect     1.1.1      2021-04-30 [1] CRAN (R 4.1.0)                  
#>  tidyverse    * 1.3.1      2021-04-15 [1] CRAN (R 4.1.0)                  
#>  timeDate       3043.102   2018-02-21 [1] CRAN (R 4.1.0)                  
#>  tune         * 0.1.5      2021-04-23 [1] CRAN (R 4.1.0)                  
#>  utf8           1.2.1      2021-03-12 [1] CRAN (R 4.1.0)                  
#>  vctrs          0.3.8      2021-04-29 [1] CRAN (R 4.1.0)                  
#>  withr          2.4.2      2021-04-18 [1] CRAN (R 4.1.0)                  
#>  workflows    * 0.2.2      2021-03-10 [1] CRAN (R 4.1.0)                  
#>  workflowsets * 0.0.2      2021-04-16 [1] CRAN (R 4.1.0)                  
#>  xfun           0.23       2021-05-15 [1] CRAN (R 4.1.0)                  
#>  xgboost        1.4.1.1    2021-04-22 [1] CRAN (R 4.1.0)                  
#>  xml2           1.3.2      2020-04-23 [1] CRAN (R 4.1.0)                  
#>  yaml           2.2.1      2020-02-01 [1] CRAN (R 4.1.0)                  
#>  yardstick    * 0.0.8      2021-03-28 [1] CRAN (R 4.1.0)                  
#> 
#> [1] /Library/Frameworks/R.framework/Versions/4.1/Resources/library

Metadata

Metadata

Assignees

No one assigned

    Labels

    bug: an unexpected problem or unintended behavior

    Type

    No type

    Projects

    No projects

    Milestone

    No milestone

    Relationships

    None yet

    Development

    No branches or pull requests

    Issue actions