rstudio
diff --git a/‎.github/workflows/R-CMD-check.yaml‎
Lines changed: 5 additions & 6 deletions b/‎.github/workflows/R-CMD-check.yaml‎
Lines changed: 5 additions & 6 deletions
diff --git a/‎NAMESPACE‎
Lines changed: 1 addition & 0 deletions b/‎NAMESPACE‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎NEWS.md‎
Lines changed: 20 additions & 13 deletions b/‎NEWS.md‎
Lines changed: 20 additions & 13 deletions
diff --git a/‎R/install.R‎
Lines changed: 18 additions & 7 deletions b/‎R/install.R‎
Lines changed: 18 additions & 7 deletions
diff --git a/‎R/preprocessing.R‎
Lines changed: 164 additions & 0 deletions b/‎R/preprocessing.R‎
Lines changed: 164 additions & 0 deletions
@@ -39,6 +39,8 @@ jobs:
           # - {os: 'windows-latest', tf: 'release', r: 'release'}
           # - {os: 'macOS-latest'  , tf: 'release', r: 'release'}
 
+          - {os: 'ubuntu-20.04', tf: '2.7', r: 'release'}
+          - {os: 'ubuntu-20.04', tf: '2.6', r: 'release'}
           - {os: 'ubuntu-20.04', tf: '2.5', r: 'release'}
           - {os: 'ubuntu-20.04', tf: '2.4', r: 'release'}
           - {os: 'ubuntu-20.04', tf: '2.3', r: 'release'}
@@ -47,8 +49,8 @@ jobs:
 
           # these are allowed to fail
           # - {os: 'ubuntu-20.04', tf: 'default', r: 'devel'}
-          - {os: 'ubuntu-20.04', tf: '2.7.0rc1', r: 'release'}
-          # - {os: 'ubuntu-20.04', tf: 'nightly' , r: 'release'}
+          # - {os: 'ubuntu-20.04', tf: '2.7.0rc1', r: 'release'}
+          - {os: 'ubuntu-20.04', tf: 'nightly' , r: 'release'}
 
     runs-on: ${{ matrix.os }}
     continue-on-error: ${{ matrix.tf == 'nightly' || contains(matrix.tf, 'rc') || matrix.r == 'devel' }}
@@ -88,7 +90,7 @@ jobs:
         id: r-package-cache
         with:
           path: ${{ env.R_LIBS_USER }}
-          key: ${{ matrix.os }}-${{ steps.setup-r.outputs.installed-r-version }}-${{ steps.get-date.outputs.year-week }}
+          key: ${{ matrix.os }}-${{ steps.setup-r.outputs.installed-r-version }}-${{ steps.get-date.outputs.year-week }}-1
 
       - name: Install remotes
         if: steps.r-package-cache.outputs.cache-hit != 'true'
@@ -105,9 +107,6 @@ jobs:
             sudo $cmd
           done < <(Rscript -e "writeLines(remotes::system_requirements('$ID-$VERSION_ID'))")
 
-      - name: Use dev reticulate
-        run: remotes::install_github("t-kalinowski/reticulate")
-
       - name: Install Package + deps
         run: remotes::install_local(dependencies = TRUE, force = TRUE)
 
 
@@ -588,6 +588,7 @@ export(texts_to_matrix)
 export(texts_to_sequences)
 export(texts_to_sequences_generator)
 export(time_distributed)
+export(timeseries_dataset_from_array)
 export(timeseries_generator)
 export(to_categorical)
 export(train_on_batch)
 
@@ -1,5 +1,7 @@
 # keras (development version)
 
+- Default TensorFlow + Keras version is now 2.7.
+
 - New API for constructing RNN (Recurrent Neural Network) layers. This is a
   flexible interface that complements the existing RNN layers. It is primarily
   intended for advanced / research applications, e.g., prototyping novel
@@ -14,32 +16,35 @@
   To learn more, including how to make a custom cell layer, see the new vignette:
   "Working with RNNs".
 
-- New dataset loader `text_dataset_from_directory()`.
+- New dataset functions:
+  - `text_dataset_from_directory()`
+  - `timeseries_dataset_from_array()`
 
 - New layers:
-    - `layer_additive_attention()`
-    - `layer_conv_lstm_1d()`
-    - `layer_conv_lstm_3d()`
+  - `layer_additive_attention()`
+  - `layer_conv_lstm_1d()`
+  - `layer_conv_lstm_3d()`
 
 - `layer_cudnn_gru()` and `layer_cudnn_lstm()` are deprecated.
   `layer_gru()` and `layer_lstm()` will automatically use CuDNN if it is available.
 
 - `layer_lstm()` and `layer_gru()`:
-    default value for `recurrent_activation` changed
-    from `"hard_sigmoid"` to `"sigmoid"`.
+  default value for `recurrent_activation` changed
+  from `"hard_sigmoid"` to `"sigmoid"`.
 
 - `layer_gru()`: default value for `reset_after` changed from `FALSE` to `TRUE`.
 
 - New vignette: "Transfer learning and fine-tuning".
 
 - New applications:
-    - MobileNet V3: `application_mobilenet_v3_large()`, `application_mobilenet_v3_small()`
-    - ResNet: `application_resnet101()`, `application_resnet152()`, `resnet_preprocess_input()`
-    - ResNet V2:`application_resnet50_v2()`, `application_resnet101_v2()`,
-                `application_resnet152_v2()` and `resnet_v2_preprocess_input()`
-    - EfficientNet: `application_efficientnet_b{0,1,2,3,4,5,6,7}()`
-
-- Many existing `application_*()`'s gain argument `classifier_activation`, with default `'softmax'`.
+  - MobileNet V3: `application_mobilenet_v3_large()`, `application_mobilenet_v3_small()`
+  - ResNet: `application_resnet101()`, `application_resnet152()`, `resnet_preprocess_input()`
+  - ResNet V2:`application_resnet50_v2()`, `application_resnet101_v2()`,
+              `application_resnet152_v2()` and `resnet_v2_preprocess_input()`
+  - EfficientNet: `application_efficientnet_b{0,1,2,3,4,5,6,7}()`
+
+- Many existing `application_*()`'s gain argument `classifier_activation`,
+  with default `'softmax'`.
   Affected: `application_{xception, inception_resnet_v2, inception_v3, mobilenet, vgg16, vgg19}()`
 
 - New function `%<-active%`, an ergonomic wrapper around `makeActiveBinding()`
@@ -70,6 +75,8 @@
 
 - `k_random_uniform()` now automatically casts `minval` and `maxval` to the output dtype.
 
+- `install_keras()` gains argument `pip_ignore_installed`, with default `TRUE`.
+
 # keras 2.6.1
 
 - New family of *preprocessing* layers. These are the spiritual successor to the `tfdatasets::step_*` family of data transformers (to be deprecated in a future release).
 
@@ -4,7 +4,7 @@
 #' thin wrapper around [`tensorflow::install_tensorflow()`], with the only
 #' difference being that this includes by default additional extra packages that
 #' keras expects, and the default version of tensorflow installed by
-#' `install_keras()`  may at times be different from the default installed
+#' `install_keras()` may at times be different from the default installed
 #' by `install_tensorflow()`. The default version of tensorflow installed by
 #' `install_keras()` is "`r default_version`".
 #'
@@ -13,36 +13,41 @@
 #'   versions potentially constrained for compatibility with the
 #'   requested tensorflow version.
 #'
-#' @inherit tensorflow::install_tensorflow
+#' @inheritParams tensorflow::install_tensorflow
 #'
 #' @param tensorflow Synonym for `version`. Maintained for backwards compatibility.
 #'
-#' @seealso [tensorflow::install_tensorflow()]
+#' @seealso [`tensorflow::install_tensorflow()`]
 #' @export
 install_keras <- function(method = c("auto", "virtualenv", "conda"),
                           conda = "auto",
                           version = "default",
                           tensorflow = version,
                           extra_packages = NULL,
-                          ...) {
+                          ...,
+                          pip_ignore_installed = TRUE) {
   # Build the extra-package list, normalise the requested version string, then
   # delegate the actual installation to tensorflow::install_tensorflow().
   pkgs <- default_extra_packages(tensorflow) # note: receives the raw, not yet normalised, version string
   if(!is.null(extra_packages)) # user supplied package version constraints take precedence
     pkgs[gsub("[=<>~]{1,2}[0-9.]+$", "", extra_packages)] <- extra_packages # keyed by name with the trailing version specifier stripped
 
-  if(tensorflow == "default") # may be different from tensorflow
-    tensorflow <- default_version
+  if(tensorflow %in% c("cpu", "gpu")) # a bare "cpu"/"gpu" becomes "default-cpu"/"default-gpu"
+    tensorflow <- paste0("default-", tensorflow)
+  # swap a leading "default" for default_version, keeping any suffix after it
+  if(grepl("^default", tensorflow))
+    tensorflow <- sub("^default", as.character(default_version), tensorflow)
 
   tensorflow::install_tensorflow(
     method = match.arg(method), # validated against the choices listed in the signature
     conda = conda,
     version = tensorflow,
     extra_packages = pkgs,
+    pip_ignore_installed = pip_ignore_installed,
     ...
   )
 }
 
-default_version <- numeric_version("2.6")
+default_version <- numeric_version("2.7") # substituted for a leading "default" version string in install_keras()
 
 default_extra_packages <- function(tensorflow_version) {
   pkgs <- c("tensorflow-hub", "scipy", "requests", "pyyaml", "Pillow", "h5py", "pandas")
@@ -99,3 +104,9 @@ default_extra_packages <- function(tensorflow_version) {
   pkgs
 }
 
+
+#  @inheritSection tensorflow::install_tensorflow "Custom Installation" "Apple Silicon" "Additional Packages"
+#  @inherit tensorflow::install_tensorflow details
+# @inherit tensorflow::install_tensorflow params return references description details sections
+# ## everything except 'seealso' to avoid this warning
+# ## Warning: Link to unknown topic in inherited text: keras::install_keras
@@ -1147,3 +1147,167 @@ function(directory,
                             seed = as_nullable_integer))
   do.call(keras$preprocessing$text_dataset_from_directory, args)
 }
+
+
+#' Creates a dataset of sliding windows over a timeseries provided as array
+#'
+#' @details
+#' This function takes in a sequence of data-points gathered at
+#' equal intervals, along with time series parameters such as
+#' length of the sequences/windows, spacing between two sequence/windows, etc.,
+#' to produce batches of timeseries inputs and targets.
+#'
+#' @section Example 1:
+#'
+#' Consider indices `0:99`. With `sequence_length=10`, `sampling_rate=2`,
+#' `sequence_stride=3`, `shuffle=FALSE`, the dataset will yield batches of
+#' sequences composed of the following indices:
+#'
+#' ```
+#' First sequence:  0  2  4  6  8 10 12 14 16 18
+#' Second sequence: 3  5  7  9 11 13 15 17 19 21
+#' Third sequence:  6  8 10 12 14 16 18 20 22 24
+#' ...
+#' Last sequence:   78 80 82 84 86 88 90 92 94 96
+#' ```
+#'
+#' In this case the last 3 data points are discarded since no full sequence
+#' can be generated to include them (the next sequence would have started
+#' at index 81, and thus its last step would have gone over 99).
+#'
+#' @section Example 2: Temporal regression.
+#'
+#' Consider an array `data` of scalar values, of shape `(steps)`.
+#' To generate a dataset that uses the past 10
+#' timesteps to predict the next timestep, you would use:
+#'
+#' ``` R
+#' steps <- 100
+#' # data is integer seq with some noise
+#' data <- array(1:steps + abs(rnorm(steps, sd = .25)))
+#' inputs_data <- head(data, -10) # drop last 10
+#' targets <- tail(data, -10)    # drop first 10
+#' dataset <- timeseries_dataset_from_array(
+#'   inputs_data, targets, sequence_length=10)
+#' library(tfdatasets)
+#' dataset_iterator <- as_iterator(dataset)
+#' repeat {
+#'   batch <- iter_next(dataset_iterator)
+#'   if(is.null(batch)) break
+#'   c(input, target) %<-% batch
+#'   stopifnot(exprs = {
+#'     # First sequence: steps [1-10]
+#'     # Corresponding target: step 11
+#'     all.equal(as.array(input[1, ]), data[1:10])
+#'     all.equal(as.array(target[1]), data[11])
+#'
+#'     all.equal(as.array(input[2, ]), data[2:11])
+#'     all.equal(as.array(target[2]), data[12])
+#'
+#'     all.equal(as.array(input[3, ]), data[3:12])
+#'     all.equal(as.array(target[3]), data[13])
+#'   })
+#' }
+#' ```
+#'
+#' @section Example 3: Temporal regression for many-to-many architectures.
+#'
+#' Consider two arrays of scalar values `X` and `Y`,
+#' both of shape `(100)`. The resulting dataset should consist of samples with
+#' 20 timestamps each. The samples should not overlap.
+#' To generate a dataset that uses the current timestamp
+#' to predict the corresponding target timestep, you would use:
+#'
+#' ``` R
+#' X <- seq(100)
+#' Y <- X*2
+#'
+#' sample_length <- 20
+#' input_dataset <- timeseries_dataset_from_array(
+#'   X, NULL, sequence_length=sample_length, sequence_stride=sample_length)
+#' target_dataset <- timeseries_dataset_from_array(
+#'   Y, NULL, sequence_length=sample_length, sequence_stride=sample_length)
+#'
+#' library(tfdatasets)
+#' dataset_iterator <-
+#'   zip_datasets(input_dataset, target_dataset) %>%
+#'   as_array_iterator()
+#' while(!is.null(batch <- iter_next(dataset_iterator))) {
+#'   c(inputs, targets) %<-% batch
+#'   stopifnot(
+#'     all.equal(inputs[1,], X[1:sample_length]),
+#'     all.equal(targets[1,], Y[1:sample_length]),
+#'     # second sample covers timestamps 21-40
+#'     all.equal(inputs[2,], X[(1:sample_length) + sample_length]),
+#'     all.equal(targets[2,], Y[(1:sample_length) + sample_length])
+#'   )
+#' }
+#' ```
+#'
+#' @param data array or eager tensor
+#' containing consecutive data points (timesteps).
+#' The first axis is expected to be the time dimension.
+#'
+#' @param targets Targets corresponding to timesteps in `data`.
+#' `targets[i]` should be the target
+#' corresponding to the window that starts at index `i`
+#' (see example 2 below).
+#' Pass NULL if you don't have target data (in this case the dataset will
+#' only yield the input data).
+#'
+#' @param sequence_length Length of the output sequences (in number of timesteps).
+#'
+#' @param sequence_stride Period between successive output sequences.
+#' For stride `s`, output samples would
+#' start at index `data[i]`, `data[i + s]`, `data[i + (2 * s)]`, etc.
+#'
+#' @param sampling_rate Period between successive individual timesteps
+#' within sequences. For rate `r`, timesteps
+#' `data[i], data[i + r], ... data[i + sequence_length]`
+#' are used to create a sample sequence.
+#'
+#' @param batch_size Number of timeseries samples in each batch
+#' (except maybe the last one).
+#'
+#' @param shuffle Whether to shuffle output samples,
+#' or instead draw them in chronological order.
+#'
+#' @param seed Optional int; random seed for shuffling.
+#'
+#' @param start_index Optional int; data points earlier (exclusive)
+#' than `start_index` will not be used
+#' in the output sequences. This is useful to reserve part of the
+#' data for test or validation.
+#'
+#' @param end_index Optional int; data points later (exclusive) than `end_index`
+#' will not be used in the output sequences.
+#' This is useful to reserve part of the data for test or validation.
+#'
+#' @param ... For backwards and forwards compatibility, ignored presently.
+#'
+#' @seealso
+#'   +  <https://www.tensorflow.org/api_docs/python/tf/keras/utils/timeseries_dataset_from_array>
+#'
+#' @returns A `tf.data.Dataset` instance. If `targets` was passed, the
+#'   dataset yields batches of two items: `(batch_of_sequences,
+#'   batch_of_targets)`. If not, the dataset yields only
+#'   `batch_of_sequences`.
+#'
+#' @export
+timeseries_dataset_from_array <-
+function(data, targets, sequence_length, sequence_stride = 1L,
+         sampling_rate = 1L, batch_size = 128L, shuffle = FALSE, ...,
+         seed = NULL, start_index = NULL, end_index = NULL)
+{ # thin wrapper: collect the call's arguments and forward them to the Python function
+  require_tf_version("2.6", "timeseries_dataset_from_array") # helper defined elsewhere; presumably errors on TensorFlow < 2.6
+  args <- capture_args(match.call(), list( # list maps argument name -> converter; capture_args() (defined elsewhere) presumably applies them
+    sequence_length = as.integer,
+    sequence_stride = as.integer,
+    sampling_rate = as.integer,
+    batch_size = as.integer,
+    seed = as_nullable_integer, # presumably leaves NULL untouched -- TODO confirm against the helper
+    start_index = as_nullable_integer, # NOTE(review): forwarded as given; confirm whether Python's 0-based indexing applies
+    end_index = as_nullable_integer
+    ))
+  do.call(keras$preprocessing$timeseries_dataset_from_array, args) # result of the Python call is returned as-is
+}