facebookexperimental
diff --git a/‎R/DESCRIPTION‎
Lines changed: 1 addition & 1 deletion b/‎R/DESCRIPTION‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎R/R/allocator.R‎
Lines changed: 5 additions & 6 deletions b/‎R/R/allocator.R‎
Lines changed: 5 additions & 6 deletions
diff --git a/‎R/R/auxiliary.R‎
Lines changed: 10 additions & 5 deletions b/‎R/R/auxiliary.R‎
Lines changed: 10 additions & 5 deletions
diff --git a/‎R/R/checks.R‎
Lines changed: 3 additions & 2 deletions b/‎R/R/checks.R‎
Lines changed: 3 additions & 2 deletions
diff --git a/‎R/R/clusters.R‎
Lines changed: 3 additions & 1 deletion b/‎R/R/clusters.R‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎R/R/inputs.R‎
Lines changed: 22 additions & 12 deletions b/‎R/R/inputs.R‎
Lines changed: 22 additions & 12 deletions
diff --git a/‎R/R/json.R‎
Lines changed: 55 additions & 38 deletions b/‎R/R/json.R‎
Lines changed: 55 additions & 38 deletions
@@ -1,7 +1,7 @@
 Package: Robyn
 Type: Package
 Title: Semi-Automated Marketing Mix Modeling (MMM) from Meta Marketing Science 
-Version: 3.10.7.9000
+Version: 3.10.7.9001
 Authors@R: c(
     person("Gufeng", "Zhou", , "gufeng@meta.com", c("cre","aut")),
     person("Bernardo", "Lares", , "laresbernardo@gmail.com", c("aut")),
 
@@ -168,7 +168,7 @@ robyn_allocator <- function(robyn_object = NULL,
   if (is.null(channel_constr_up)) {
     channel_constr_up <- case_when(
       scenario == "max_response" ~ 2,
-      scenario == "target_efficiency" ~ Inf
+      scenario == "target_efficiency" ~ 10
     )
   }
   if (length(channel_constr_low) == 1) channel_constr_low <- rep(channel_constr_low, length(paid_media_spends))
@@ -271,8 +271,8 @@ robyn_allocator <- function(robyn_object = NULL,
       select_build = select_build,
       select_model = select_model,
       metric_name = mediaSpendSorted[i],
-      #metric_value = initSpendUnit[i] * simulation_period[i],
-      #date_range = date_range,
+      # metric_value = initSpendUnit[i] * simulation_period[i],
+      # date_range = date_range,
       dt_hyppar = OutputCollect$resultHypParam,
       dt_coef = OutputCollect$xDecompAgg,
       InputCollect = InputCollect,
@@ -478,14 +478,13 @@ robyn_allocator <- function(robyn_object = NULL,
 
   if (scenario == "target_efficiency") {
     ## bounded optimisation
-    total_response <- sum(OutputCollect$xDecompAgg$xDecompAgg)
     nlsMod <- nloptr::nloptr(
       x0 = x0,
       eval_f = eval_f,
       eval_g_eq = if (constr_mode == "eq") eval_g_eq_effi else NULL,
       eval_g_ineq = if (constr_mode == "ineq") eval_g_eq_effi else NULL,
       lb = lb,
-      ub = rep(total_response, length(ub)),
+      ub = x0 * channel_constr_up[1], # Large enough, but not infinite (customizable)
       opts = list(
         "algorithm" = "NLOPT_LD_AUGLAG",
         "xtol_rel" = 1.0e-10,
@@ -501,7 +500,7 @@ robyn_allocator <- function(robyn_object = NULL,
       eval_g_eq = if (constr_mode == "eq") eval_g_eq_effi else NULL,
       eval_g_ineq = if (constr_mode == "ineq") eval_g_eq_effi else NULL,
       lb = lb,
-      ub = rep(total_response, length(ub)),
+      ub = x0 * channel_constr_up[1], # Large enough, but not infinite (customizable)
       opts = list(
         "algorithm" = "NLOPT_LD_AUGLAG",
         "xtol_rel" = 1.0e-10,
 
@@ -77,15 +77,20 @@ baseline_vars <- function(InputCollect, baseline_level) {
   stopifnot(length(baseline_level) == 1)
   stopifnot(baseline_level %in% 0:5)
   x <- ""
-  if (baseline_level >= 1)
+  if (baseline_level >= 1) {
     x <- c(x, "(Intercept)", "intercept")
-  if (baseline_level >= 2)
+  }
+  if (baseline_level >= 2) {
     x <- c(x, "trend")
-  if (baseline_level >= 3)
+  }
+  if (baseline_level >= 3) {
     x <- unique(c(x, InputCollect$prophet_vars))
-  if (baseline_level >= 4)
+  }
+  if (baseline_level >= 4) {
     x <- c(x, InputCollect$context_vars)
-  if (baseline_level >= 5)
+  }
+  if (baseline_level >= 5) {
     x <- c(x, InputCollect$organic_vars)
+  }
   return(x)
 }
@@ -499,7 +499,8 @@ check_hyperparameters <- function(hyperparameters = NULL, adstock = NULL,
     # Adding penalty variations to the dictionary
     if (any(grepl("_penalty", paste0(get_hyp_names)))) {
       ref_hyp_name_penalties <- paste0(
-        c(paid_media_spends, organic_vars, prophet_vars, contextual_vars), "_penalty")
+        c(paid_media_spends, organic_vars, prophet_vars, contextual_vars), "_penalty"
+      )
       all_ref_names <- c(all_ref_names, ref_hyp_name_penalties)
     } else {
       ref_hyp_name_penalties <- NULL
@@ -928,7 +929,7 @@ check_metric_dates <- function(date_range = NULL, all_dates, dayInterval = NULL,
     #     dayInterval >= 30 & dayInterval <= 31 ~ 1,
     #   ))
     # }
-    date_range = "all"
+    date_range <- "all"
     if (!quiet) message(sprintf("Automatically picked date_range = '%s'", date_range))
   }
   if (grepl("last|all", date_range[1])) {
 
@@ -122,7 +122,9 @@ robyn_clusters <- function(input, dep_var_type,
       dim_red = dim_red, quiet = TRUE, seed = seed
     )
   )
-  cls$df <- group_by(cls$df, .data$cluster) %>% mutate(n = n()) %>% ungroup()
+  cls$df <- group_by(cls$df, .data$cluster) %>%
+    mutate(n = n()) %>%
+    ungroup()
 
   # Select top models by minimum (weighted) distance to zero
   all_paid <- setdiff(names(cls$df), c(ignore, "cluster"))
 
@@ -181,7 +181,7 @@ robyn_inputs <- function(dt_input = NULL,
     json <- robyn_read(json_file, step = 1, ...)
     if (is.null(dt_input)) {
       if ("raw_data" %in% names(json[["Extras"]])) {
-        dt_input <- json[["Extras"]]$raw_data
+        dt_input <- as_tibble(json[["Extras"]]$raw_data)
       } else {
         stop("Must provide 'dt_input' input; 'dt_holidays' input optional")
       }
@@ -204,7 +204,8 @@ robyn_inputs <- function(dt_input = NULL,
       dt_input, dt_holidays,
       dep_var, date_var,
       context_vars, paid_media_spends,
-      organic_vars)
+      organic_vars
+    )
 
     ## Check for NA and all negative values
     dt_input <- check_allneg(dt_input)
@@ -254,9 +255,7 @@ robyn_inputs <- function(dt_input = NULL,
 
     ## Check window_start & window_end (and transform parameters/data)
     windows <- check_windows(dt_input, date_var, all_media, window_start, window_end)
-
     if (TRUE) {
-      dt_input <- windows$dt_input
       window_start <- windows$window_start
       rollingWindowStartWhich <- windows$rollingWindowStartWhich
       refreshAddedStart <- windows$refreshAddedStart
@@ -283,9 +282,14 @@ robyn_inputs <- function(dt_input = NULL,
     check_novar(select(dt_input, -all_of(unused_vars)))
 
     # Calculate total media spend used to model
-    paid_media_total <- dt_input[
-      rollingWindowEndWhich:rollingWindowLength, ] %>%
-      select(paid_media_vars) %>% sum()
+    paid_media_total <- dt_input %>%
+      mutate(temp_date = dt_input[[date_var]]) %>%
+      filter(
+        .data$temp_date >= window_start,
+        .data$temp_date <= window_end
+      ) %>%
+      select(all_of(paid_media_spends)) %>%
+      sum()
 
     ## Collect input
     InputCollect <- list(
@@ -320,7 +324,7 @@ robyn_inputs <- function(dt_input = NULL,
       window_end = window_end,
       rollingWindowEndWhich = rollingWindowEndWhich,
       rollingWindowLength = rollingWindowLength,
-      totalObservations = nrow(dt_input),
+      totalObservations = nrow(windows$dt_input),
       refreshAddedStart = refreshAddedStart,
       adstock = adstock,
       hyperparameters = hyperparameters,
@@ -411,7 +415,7 @@ print.robyn_inputs <- function(x, ...) {
   mod_vars <- paste(setdiff(names(x$dt_mod), c("ds", "dep_var")), collapse = ", ")
   print(glued(
     "
-Total Observations: {nrow(x$dt_input)} ({x$intervalType}s)
+Total Observations: {x$totalObservations} ({x$intervalType}s)
 Input Table Columns ({ncol(x$dt_input)}):
   Date: {x$date_var}
   Dependent: {x$dep_var} [{x$dep_var_type}]
@@ -434,8 +438,10 @@ Adstock: {x$adstock}
     windows = paste(x$window_start, x$window_end, sep = ":"),
     custom_params = if (length(x$custom_params) > 0) paste("\n", flatten_hyps(x$custom_params)) else "None",
     prophet = if (length(x$prophet_vars) > 0) {
-      sprintf("%s on %s", paste(x$prophet_vars, collapse = ", "),
-              ifelse(!is.null(x$prophet_country), x$prophet_country, "data"))
+      sprintf(
+        "%s on %s", paste(x$prophet_vars, collapse = ", "),
+        ifelse(!is.null(x$prophet_country), x$prophet_country, "data")
+      )
     } else {
       "\033[0;31mDeactivated\033[0m"
     },
@@ -503,6 +509,7 @@ Adstock: {x$adstock}
 #' Accepts "geometric", "weibull_cdf" or "weibull_pdf"
 #' @param all_media Character vector. Default to \code{InputCollect$all_media}.
 #' Includes \code{InputCollect$paid_media_spends} and \code{InputCollect$organic_vars}.
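+#' @param all_vars Character vector of variable names. Default to \code{NULL}. When provided, a \code{"_penalty"}-suffixed name is added to the output for each variable; used to check the penalties inputs, especially for refreshing models.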
 #' @examples
 #' \donttest{
 #' media <- c("facebook_S", "print_S", "tv_S")
@@ -540,7 +547,7 @@ Adstock: {x$adstock}
 #' }
 #' @return Character vector. Names of hyper-parameters that should be defined.
 #' @export
-hyper_names <- function(adstock, all_media) {
+hyper_names <- function(adstock, all_media, all_vars = NULL) {
   adstock <- check_adstock(adstock)
   if (adstock == "geometric") {
     local_name <- sort(apply(expand.grid(all_media, HYPS_NAMES[
@@ -551,6 +558,9 @@ hyper_names <- function(adstock, all_media) {
       grepl("shapes|scales|alphas|gammas", HYPS_NAMES)
     ]), 1, paste, collapse = "_"))
   }
+  if (!is.null(all_vars)) {
+    local_name <- sort(c(local_name, paste0(all_vars, "_penalty")))
+  }
   return(local_name)
 }
 
 
@@ -61,7 +61,6 @@ robyn_write <- function(InputCollect,
 
   # ExportedModel JSON
   if (!is.null(OutputCollect)) {
-
     # Modeling associated data
     collect <- list()
     collect$ts_validation <- OutputCollect$OutputModels$ts_validation
@@ -71,7 +70,8 @@ robyn_write <- function(InputCollect,
     collect$outputs_time <- sprintf("%s min", attr(OutputCollect, "runTime"))
     collect$total_time <- sprintf(
       "%s min", attr(OutputCollect, "runTime") +
-        attr(OutputCollect$OutputModels, "runTime"))
+        attr(OutputCollect$OutputModels, "runTime")
+    )
     collect$total_iters <- OutputCollect$OutputModels$iterations *
       OutputCollect$OutputModels$trials
     collect$conv_msg <- gsub("\\:.*", "", OutputCollect$OutputModels$convergence$conv_msg)
@@ -94,11 +94,14 @@ robyn_write <- function(InputCollect,
       outputs$performance <- df %>%
         filter(.data$rn %in% InputCollect$paid_media_spends) %>%
         group_by(.data$solID) %>%
-        summarise(metric = perf_metric,
-                  performance = ifelse(
-                    perf_metric == "ROAS",
-                    sum(.data$xDecompAgg) / sum(.data$total_spend),
-                    sum(.data$total_spend) / sum(.data$xDecompAgg)), .groups = "drop")
+        summarise(
+          metric = perf_metric,
+          performance = ifelse(
+            perf_metric == "ROAS",
+            sum(.data$xDecompAgg) / sum(.data$total_spend),
+            sum(.data$total_spend) / sum(.data$xDecompAgg)
+          ), .groups = "drop"
+        )
       outputs$summary <- df %>%
         mutate(
           metric = perf_metric,
@@ -136,7 +139,7 @@ robyn_write <- function(InputCollect,
 
   extras <- list(...)
   if (isTRUE(add_data) & !"raw_data" %in% names(extras)) {
-    extras[["raw_data"]] <- InputCollect$dt_input
+    extras[["raw_data"]] <- as_tibble(InputCollect$dt_input)
   }
   if (length(extras) > 0) {
     ret[["Extras"]] <- extras
@@ -153,7 +156,8 @@ robyn_write <- function(InputCollect,
       if (!all(c("solID", "cluster") %in% names(pareto_df))) {
         warning(paste(
           "Input 'pareto_df' is not a valid data.frame;",
-          "must contain 'solID' and 'cluster' columns."))
+          "must contain 'solID' and 'cluster' columns."
+        ))
       } else {
         all_c <- unique(pareto_df$cluster)
         pareto_df <- lapply(all_c, function(x) {
@@ -192,7 +196,8 @@ print.robyn_write <- function(x, ...) {
     "\n\nModel's Performance and Errors:\n    {performance}{errors}",
     performance = ifelse("performance" %in% names(x$ExportedModel), sprintf(
       "Total Model %s = %s\n    ",
-      x$ExportedModel$performance$metric, signif(x$ExportedModel$performance$performance, 4)), ""),
+      x$ExportedModel$performance$metric, signif(x$ExportedModel$performance$performance, 4)
+    ), ""),
     errors = paste(
       sprintf(
         "Adj.R2 (train): %s",
@@ -204,34 +209,36 @@ print.robyn_write <- function(x, ...) {
     )
   ))
 
-  print(glued("\n\nSummary Values on Selected Model:"))
+  if ("ExportedModel" %in% names(x)) {
+    print(glued("\n\nSummary Values on Selected Model:"))
 
-  print(x$ExportedModel$summary %>%
-    select(-contains("boot"), -contains("ci_")) %>%
-    dplyr::rename_at("performance", list(~ ifelse(x$InputCollect$dep_var_type == "revenue", "ROAS", "CPA"))) %>%
-    mutate(decompPer = formatNum(100 * .data$decompPer, pos = "%")) %>%
-    dplyr::mutate_if(is.numeric, function(x) ifelse(!is.infinite(x), x, 0)) %>%
-    dplyr::mutate_if(is.numeric, function(x) formatNum(x, 4, abbr = TRUE)) %>%
-    replace(., . == "NA", "-") %>% as.data.frame())
+    print(x$ExportedModel$summary %>%
+      select(-contains("boot"), -contains("ci_")) %>%
+      dplyr::rename_at("performance", list(~ ifelse(x$InputCollect$dep_var_type == "revenue", "ROAS", "CPA"))) %>%
+      mutate(decompPer = formatNum(100 * .data$decompPer, pos = "%")) %>%
+      dplyr::mutate_if(is.numeric, function(x) ifelse(!is.infinite(x), x, 0)) %>%
+      dplyr::mutate_if(is.numeric, function(x) formatNum(x, 4, abbr = TRUE)) %>%
+      replace(., . == "NA", "-") %>% as.data.frame())
 
-  print(glued(
-    "\n\nHyper-parameters:\n    Adstock: {x$InputCollect$adstock}"
-  ))
+    print(glued(
+      "\n\nHyper-parameters:\n    Adstock: {x$InputCollect$adstock}"
+    ))
 
-  # Nice and tidy table format for hyper-parameters
-  HYPS_NAMES <- c(HYPS_NAMES, "penalty")
-  regex <- paste(paste0("_", HYPS_NAMES), collapse = "|")
-  hyper_df <- as.data.frame(x$ExportedModel$hyper_values) %>%
-    select(-contains("lambda"), -any_of(HYPS_OTHERS)) %>%
-    tidyr::gather() %>%
-    tidyr::separate(.data$key,
-      into = c("channel", "none"),
-      sep = regex, remove = FALSE
-    ) %>%
-    mutate(hyperparameter = gsub("^.*_", "", .data$key)) %>%
-    select(.data$channel, .data$hyperparameter, .data$value) %>%
-    tidyr::spread(key = "hyperparameter", value = "value")
-  print(hyper_df)
+    # Nice and tidy table format for hyper-parameters
+    HYPS_NAMES <- c(HYPS_NAMES, "penalty")
+    regex <- paste(paste0("_", HYPS_NAMES), collapse = "|")
+    hyper_df <- as.data.frame(x$ExportedModel$hyper_values) %>%
+      select(-contains("lambda"), -any_of(HYPS_OTHERS)) %>%
+      tidyr::gather() %>%
+      tidyr::separate(.data$key,
+        into = c("channel", "none"),
+        sep = regex, remove = FALSE
+      ) %>%
+      mutate(hyperparameter = gsub("^.*_", "", .data$key)) %>%
+      select(.data$channel, .data$hyperparameter, .data$value) %>%
+      tidyr::spread(key = "hyperparameter", value = "value")
+    print(hyper_df)
+  }
 }
 
 
@@ -342,7 +349,9 @@ robyn_recreate <- function(json_file, quiet = FALSE, ...) {
         quiet = quiet,
         ...
       )
-    } else OutputCollect <- NULL
+    } else {
+      OutputCollect <- NULL
+    }
   } else {
     # Use case: skip feature engineering when InputCollect is provided
     InputCollect <- args[["InputCollect"]]
@@ -373,7 +382,8 @@ robyn_chain <- function(json_file) {
     temp <- list.files(plot_folder)
     mods <- unique(temp[
       (startsWith(temp, "RobynModel") | grepl("\\.json+$", temp)) &
-        grepl("^[^_]*_[^_]*_[^_]*$", temp)])
+        grepl("^[^_]*_[^_]*_[^_]*$", temp)
+    ])
     avlb <- gsub("RobynModel-|\\.json", "", mods)
     if (length(ids) == length(mods)) {
       chain <- rep_len(chain, length(mods))
@@ -394,7 +404,14 @@ robyn_chain <- function(json_file) {
           filename <- mods[avlb == ids[i]]
           json_new <- robyn_read(filename, quiet = TRUE)
         } else {
-          message("Skipping chain. File can't be found: ", filename)
+          last_try <- gsub(chain[1], "", filename)
+          if (file.exists(last_try)) {
+            json_new <- robyn_read(last_try, quiet = TRUE)
+            message("Stored original model in new file: ", filename)
+            jsonlite::write_json(json_new, filename, pretty = TRUE)
+          } else {
+            message("Skipping chain. File can't be found: ", filename)
+          }
         }
       }
     }
Original file line number	Diff line number	Diff line change
`@@ -122,7 +122,9 @@ robyn_clusters <- function(input, dep_var_type,`
`122`	`122`	`dim_red = dim_red, quiet = TRUE, seed = seed`
`123`	`123`	`)`
`124`	`124`	`)`
`125`		`- cls$df <- group_by(cls$df, .data$cluster) %>% mutate(n = n()) %>% ungroup()`
	`125`	`+ cls$df <- group_by(cls$df, .data$cluster) %>%`
	`126`	`+ mutate(n = n()) %>%`
	`127`	`+ ungroup()`
`126`	`128`
`127`	`129`	`# Select top models by minimum (weighted) distance to zero`
`128`	`130`	`all_paid <- setdiff(names(cls$df), c(ignore, "cluster"))`