posit-dev
diff --git a/‎extensions/prototype-content-with-issues-table/app.R‎
Lines changed: 167 additions & 98 deletions b/‎extensions/prototype-content-with-issues-table/app.R‎
Lines changed: 167 additions & 98 deletions
diff --git a/‎extensions/prototype-content-with-issues-table/connect-extension.toml‎
Lines changed: 3 additions & 3 deletions b/‎extensions/prototype-content-with-issues-table/connect-extension.toml‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎extensions/prototype-content-with-issues-table/get_usage.R‎
Lines changed: 0 additions & 53 deletions b/‎extensions/prototype-content-with-issues-table/get_usage.R‎
Lines changed: 0 additions & 53 deletions
@@ -1,20 +1,24 @@
+library(shinyBS)
 library(shiny)
 library(bslib)
-library(DT)
+library(gt)
 library(connectapi)
 library(dplyr)
 library(purrr)
 library(lubridate)
 library(tidyr)
+library(shinyjs)
+library(shinycssloaders)
+library(shinybusy)
+
+source("./ui.R")
 
 # cache data to disk with a refresh every 8h, table renders in ~7m when cache
 # is expired, deleted, or on initial deploy
 shinyOptions(
   cache = cachem::cache_disk("./app_cache/cache/", max_age = 60 * 60 * 8)
 )
 
-source("get_usage.R")
-
 # Hacky function to get a list of Content class objects without making a request
 # for each item. These objects differ from the ones created by `content_item()`
 # because they also include the full owner info as returned by `get_content()`.
@@ -27,79 +31,97 @@ as_content_list <- function(content_df, client) {
   })
 }
 
-# checks to see if a content item has failed jobs within the last 30d, grabs 
-# usage data if it does, then compiles content, job, and usage data together 
-# into a tibble, returning it.
-get_failed_job_data <- function(item, usage) {
-  failed_jobs <- get_jobs(item) |>
-        # filter out successful and running jobs
-        filter(exit_code != 0 & status != 0 & !(is.na(end_time)))
-  
-  if (is.null(failed_jobs) || nrow(failed_jobs) == 0) {
+# The owner object attached to a content item carries no email address, so
+# look the user up by GUID through the API and return the `email` field.
+# TODO: memoise guid -> email so an owner with several failing items is only
+# requested once
+get_user_email <- function(client, guid) {
+  owner_record <- client$GET(paste0("v1/users/", guid))
+  owner_record$email
+}
+
+# Reduce a content item's jobs to the ones that failed.
+# `jobs` is a data frame; when it has rows it must provide the columns
+# `start_time`, `end_time`, `exit_code`, `status`, `tag` and `key`. Returns the
+# failed rows (`end_time`, `exit_code`, `tag`, `key`) plus `content_recovered`,
+# which is TRUE when the most recently started job is not one of the failures.
+# An input with no rows yields an empty data frame.
+filter_to_failed_jobs <- function(jobs) {
+  if (nrow(jobs) == 0) {
+    return(data.frame())
+  }
+  latest_job <- jobs %>%
+    slice_max(start_time, with_ties = FALSE)
+  failed_jobs <- jobs %>%
+    # a failure has finished (end_time set) with a non-zero exit code and
+    # status; comma-separated conditions are combined with AND
+    filter(!is.na(exit_code), exit_code != 0, status != 0, !is.na(end_time)) %>%
+    select(end_time, exit_code, tag, key)
+  # negating the membership test gives the flag directly (no ifelse() needed);
+  # mutate() recycles the single value over every failed row
+  failed_jobs %>%
+    mutate(content_recovered = !(latest_job$key %in% failed_jobs$key))
+}
+
+# Builds one row per failed job of `item`, adding the item's title, guid,
+# owner and URLs; returns an empty data frame when nothing failed.
+get_failed_job_data <- function(item, client) {
+  jobs <- tryCatch(get_jobs(item), error = function(e) {
+    # log only the guid: `item` is a whole Content object, so pasting it into
+    # the message is not meaningful and can itself raise an error
+    message("Error encountered with item: ", item$content$guid, " ",
+            conditionMessage(e))
+    data.frame() # treat an unreadable job list as "no jobs"
+  })
+  failed_jobs <- filter_to_failed_jobs(jobs)
+  all_failed_jobs <- if (nrow(failed_jobs) == 0) {
     # content item does not have failed jobs
-    return(NULL)
+    data.frame()
   } else {
-    last_visit <- usage %>%
-      filter(content_guid == item$content$guid) %>%
-      slice_max(timestamp) %>%
-      select(timestamp)
-    if (nrow(last_visit) == 0) { # display date 0 for content without visits
-      last_visit <- last_visit %>%
-        bind_rows(data.frame(timestamp = as.POSIXct(0)))
-    }
-    # return required information from https://github.com/posit-dev/connect/issues/30288
-    all_failed_jobs <- map_dfr(seq_len(nrow(failed_jobs)), ~
-                                 tibble(
-                                   "content_title" = item$content$title,
-                                   "content_guid" = item$content$guid,
-                                   "content_owner" = item$content$owner[[1]]$username,
-                                   "job_failed_at" = failed_jobs$end_time[.x],
-                                   "failed_job_type" = failed_jobs$tag[.x],
-                                   "failure_reason" = failed_jobs$exit_code[.x],
-                                   "last_deployed_time" = item$content$last_deployed_time,
-                                   "last_visited" = as.POSIXct(last_visit$timestamp)
-                                 )
-    )
-    all_failed_jobs
+    item_info <- item$content
+    # the owner's email is not on the item, so it costs one extra request
+    owner_email <- get_user_email(client, item_info$owner_guid)
+    failed_jobs %>%
+      mutate(
+        content_title = item_info$title,
+        content_guid = item_info$guid,
+        content_owner = item_info$owner[[1]]$username,
+        # link to this job's log: <dashboard_url>/logs?logKey=<job key>
+        log_url = paste0(item_info$dashboard_url, "/logs?logKey=", key),
+        owner_email = owner_email,
+        content_url = item_info$dashboard_url)
   }
+  all_failed_jobs
 }
 
 server <- function(input, output, session) {
   # initialize Connect API client
   client <- connect()
 
-  # TODO: use `v1/content/failed` when #30414 merges so we only list content we
-  # know has failed before, filter to deployed within last 60d for now
+  # TODO: use `v1/content/failed` to list only content whose last job failed;
+  # for now keep items deployed within the last year (%m-% rolls Feb 29 back)
   content_list <- reactive({
-    content <- get_content(client, limit = inf)
+    content <- get_content(client, limit = Inf)
     content <- content %>%
-      filter(last_deployed_time >= (Sys.time() - days(60)))
+      filter(last_deployed_time >= (Sys.time() %m-% years(1)))
     as_content_list(content, client)
   }) |> bindCache("static_key")
 
-  # cache last 30d of usage (Jobs.MaxCompleted is 30d), takes ~5m to build
-  usage <- reactive({
-    from = (Sys.time() - days(30))
-    to = Sys.time()
-    get_usage(client, from, to) # ~100 pages of results
-  }) |> bindCache("static_key")
-  
-  # cache failed jobs data, takes ~2m to build with content filtered to items 
-  # deployed within the last 60d
+  # cache failed jobs data, takes ~5m to build with content filtered to items 
+  # deployed within the last year
   bad_content_df <- reactive({
-    req(content_list(), usage())
-    map_dfr(content_list(), ~ get_failed_job_data(.x, usage()))
-  }) |> bindCache("static_key")
-  
-  # output the datatable of failed jobs
-  output$jobs <- renderDT({
-    datatable(bad_content_df() |>
-                # map job type to something more readable
-                mutate(failed_job_type = case_when(
-                  failed_job_type %in% c("build_report", "build_site", "build_jupyter") ~ "Building",
-                  failed_job_type %in% c("packrat_restore", "python_restore") ~ "Restoring environment",
-                  failed_job_type == "configure_report" ~ "Configuring report",
-                  failed_job_type %in% c("run_app", 
+    req(content_list()) 
+    bad_content <- map_dfr(content_list(), ~ get_failed_job_data(.x, client)) 
+    bad_content %>%
+      rename(job_failed_at = end_time,
+            failed_job_type = tag,
+            failure_reason = exit_code) %>%
+            # map job type to something more readable
+              mutate(failed_job_type = case_when(
+                    failed_job_type %in% c("build_report", "build_site", "build_jupyter") ~ "Building",
+                    failed_job_type %in% c("packrat_restore", "python_restore") ~ "Restoring environment",
+                    failed_job_type == "configure_report" ~ "Configuring report",
+                    failed_job_type %in% c("run_app", 
                                          "run_api", 
                                          "run_tensorflow", 
                                          "run_python_api",
@@ -110,45 +132,92 @@ server <- function(input, output, session) {
                                          "run_fastapi_app",
                                          "run_voila_app",
                                          "run_pyshiny_app") ~ "Running",
-                  failed_job_type == "render_shiny" ~ "Rendering",
-                  failed_job_type == "ctrl_extraction" ~ "Extracting parameters",
-                  TRUE ~ failed_job_type)) |>
-                # map exit codes to something more readable 
-                mutate(failure_reason = case_when(
-                  failure_reason %in% c(1, 2, 134) ~ "failed to run / error during running",
-                  failure_reason == 137 ~ "out of memory",
-                  failure_reason %in% c(255, 15, 130) ~ "process terminated by server",
-                  failure_reason %in% c(13, 127) ~ "configuration / permissions error",
-                  # treat any unmapped exit_code integers as characters 
-                  TRUE ~ as.character(failure_reason))) |>
-                mutate(content_title = replace_na(content_title, "")),
-              rownames = FALSE, 
-              escape = FALSE,
-              options = list( # non-interactive table for this prototype
-                paging = FALSE,
-                searching = FALSE,
-                ordering = FALSE, 
-                info = FALSE, 
-                dom = "t" 
-              )
+                    failed_job_type == "render_shiny" ~ "Rendering",
+                    failed_job_type == "ctrl_extraction" ~ "Extracting parameters",
+                    TRUE ~ failed_job_type),
+                    # map exit codes to something more readable 
+                    failure_reason = case_when(
+                    failure_reason %in% c(1, 2, 134) ~ "failed to run / error during running",
+                    failure_reason == 137 ~ "out of memory",
+                    failure_reason %in% c(255, 15, 130) ~ "process terminated by server",
+                    failure_reason %in% c(13, 127) ~ "configuration / permissions error",
+                    # treat any unmapped exit_code integers as characters 
+                    TRUE ~ as.character(failure_reason))) %>%
+              group_by(content_guid) %>%
+              mutate(content_guid = paste0('<a href="', 
+                                            first(content_url), 
+                                            '" target="_blank">', 
+                                            first(content_title), 
+                                            '</a>')) %>%
+              mutate(owner_email = paste0('<span style="font-size: 32px;">',
+                                          "<a href='mailto:",
+                                          owner_email,
+                                          "?subject=Problem%20with%20",
+                                          gsub("'", 
+                                              "%27", 
+                                              gsub('"',
+                                                  "%22",
+                                                  content_title)),
+                                          "&body=Please%20investigate:%0A",
+                                          log_url,
+                                          "'>",
+                                          "✉",
+                                          "</a></span>")) %>%
+              mutate(log_url = paste0('<a href="',
+                                     log_url,
+                                     '" target="_blank">',
+                                     '<span style="font-size: 32px;">🗒',
+                                     '</a></span>')) %>%
+              mutate(content_guid = ifelse(!content_recovered,
+                paste(content_guid, " <span style='color: red;'>⚠️</span>"),
+                content_guid)) %>%
+              select(-content_url, -content_title, -key)
+  }) |> bindCache("static_key")
+  
+  # Open a dismissible, medium-sized modal with the app's help text when the
+  # `show_help` input fires; `help_information` is defined outside this block.
+  observeEvent(input$show_help, {
+    showModal(
+      modalDialog(help_information,
+                  title = "Helpful info about this app",
+                  size = "m",
+                  easyClose = TRUE)
     )
   })
-}
-
-ui <- fluidPage(
-  fluidRow(
-    column(12, 
-           titlePanel("Content With Issues (table view)")
-    )
-  ),
+ 
+  # Fill the `owner_filter` select input with the distinct owner usernames
+  # found in the compiled failed-jobs data.
+  observe({
+    owner_names <- unique(bad_content_df()$content_owner)
+    updateSelectInput(session, "owner_filter", choices = owner_names)
+  })
 
-  fluidRow(
-    column(12,
-           titlePanel(tags$h6("All failed jobs on content deployed within 60d:")), 
-           DTOutput("jobs"),
-    )
-  )
-)
-
+  # Render the failed-jobs table with gt. Each filter only narrows the rows
+  # when its input is switched on or has a selection; otherwise all rows pass.
+  # TODO: better reflect current applied filters
+  output$jobs <- render_gt({
+    # job types kept when the `not_notified` input is on
+    not_notified_types <- c("Running", "Configuring report",
+                            "Restoring environment", "Extracting parameters")
+    shown_jobs <- bad_content_df() %>%
+      filter(
+        if (input$currently_failing) !content_recovered else TRUE,
+        if (input$not_notified) failed_job_type %in% not_notified_types else TRUE,
+        if (is.null(input$job_type)) TRUE else failed_job_type %in% input$job_type,
+        if (is.null(input$owner_filter)) TRUE else content_owner %in% input$owner_filter,
+        if (is.null(input$failure_reason)) TRUE else failure_reason %in% input$failure_reason
+      )
+    gt(shown_jobs) %>%
+      # log_url and owner_email hold HTML links, so render them as markup
+      fmt_markdown(columns = c(log_url, owner_email)) %>%
+      sub_missing(columns = everything(), missing_text = " ") %>%
+      cols_label(job_failed_at = "Date of Failure", failed_job_type = "Job Type",
+                 failure_reason = "Reason for Failure", content_owner = "Owner",
+                 owner_email = "Email Owner", log_url = "Open Logs") %>%
+      cols_hide(content_recovered) %>%
+      opt_interactive(use_page_size_select = TRUE, use_sorting = TRUE,
+                      use_search = TRUE)
+  })
+}
 
-shinyApp(ui, server)
+shinyApp(ui, server)
@@ -1,4 +1,4 @@
-name = "prototype-content-with-issues-table"
-title = "Content With Issues (table view)"
-description = "R Shiny prototype extension that displays a table of all failed content jobs."
+name = "prototype-content-with-issues-interactive-table"
+title = "Content With Issues (interactive table)"
+description = "R Shiny prototype extension that displays an interactive table of all failed content jobs for items deployed within the last year."
 access_type = "acl"