|
1 | 1 | #include "data.table.h" |
2 | 2 |
|
| 3 | +#ifndef USE_GROWABLE_ALTREP |
| 4 | + |
3 | 5 | SEXP growable_allocate(SEXPTYPE type, R_xlen_t size, R_xlen_t max_size) { |
4 | 6 | SEXP ret = PROTECT(allocVector(type, max_size)); |
5 | 7 | SET_TRUELENGTH(ret, max_size); |
@@ -32,9 +34,243 @@ Rboolean is_growable(SEXP x) { |
32 | 34 | ; |
33 | 35 | } |
34 | 36 |
|
35 | | -// Assuming no ALTREP for now |
| 37 | +// Assuming no ALTREP columns |
36 | 38 | SEXP make_growable(SEXP x) { |
37 | 39 | if (TRUELENGTH(x) < XLENGTH(x)) SET_TRUELENGTH(x, XLENGTH(x)); |
38 | 40 | SET_GROWABLE_BIT(x); |
39 | 41 | return x; |
40 | 42 | } |
| 43 | + |
| 44 | +#else |
| 45 | + |
| 46 | +#include <R_ext/Altrep.h> |
| 47 | + |
| 48 | +static R_altrep_class_t dta_grow_string, dta_grow_integer, dta_grow_logical, dta_grow_real, dta_grow_complex, dta_grow_raw, dta_grow_list; |
| 49 | +static Rcomplex NA_COMPLEX = { 0, }; |
| 50 | + |
| 51 | +/* |
| 52 | +ALTREP class layout: |
| 53 | +data1 = underlying vector |
| 54 | +data2 = its current length stored as a length-1 REALSXP |
| 55 | +Unless we implement an Unserialize method, this can be changed any time. |
| 56 | +Classes have been released on CRAN with a Serialized_state/Unserialize pair will have to stay as they have been defined in order to keep *.rds files readable. |
| 57 | +*/ |
| 58 | + |
| 59 | +static R_xlen_t altall_Length(SEXP x) { |
| 60 | + return (R_xlen_t)REAL(R_altrep_data2(x))[0]; |
| 61 | +} |
| 62 | + |
| 63 | +#define make_inspect_method(classname) \ |
| 64 | + static Rboolean alt##classname##_Inspect( \ |
| 65 | + SEXP x, int pre, int deep, int pvec, \ |
| 66 | + void (*inspect_subtree)(SEXP x, int pre, int deep, int pvec) \ |
| 67 | + ) { \ |
| 68 | + (void)pre; (void)deep; (void)pvec; (void)inspect_subtree; \ |
| 69 | + Rprintf("data.table::growable" #classname "_v0(truelength=%g) ", (double)XLENGTH(R_altrep_data1(x))); \ |
| 70 | + return FALSE; \ |
| 71 | + } |
| 72 | +make_inspect_method(string) |
| 73 | +make_inspect_method(integer) |
| 74 | +make_inspect_method(logical) |
| 75 | +make_inspect_method(real) |
| 76 | +make_inspect_method(complex) |
| 77 | +make_inspect_method(raw) |
| 78 | +make_inspect_method(list) |
| 79 | +#undef make_inspect_method |
| 80 | + |
| 81 | +#define make_dataptr_method(class, accessor) \ |
| 82 | + static void * alt##class##_Dataptr(SEXP x, Rboolean writable) { \ |
| 83 | + (void)writable; \ |
| 84 | + return (void*)accessor(R_altrep_data1(x)); \ |
| 85 | + } |
| 86 | +make_dataptr_method(string, STRING_PTR_RO) |
| 87 | +make_dataptr_method(integer, INTEGER) |
| 88 | +make_dataptr_method(logical, LOGICAL) |
| 89 | +make_dataptr_method(real, REAL) |
| 90 | +make_dataptr_method(complex, COMPLEX) |
| 91 | +make_dataptr_method(raw, RAW) |
| 92 | +make_dataptr_method(list, DATAPTR_RO) // VECTOR_PTR_RO to appear in R-4.5 |
| 93 | +#undef make_dataptr_method |
| 94 | + |
| 95 | +static const void * altall_Dataptr_or_null(SEXP x) { return DATAPTR_RO(x); } |
| 96 | + |
| 97 | +// lots of boilerplate, but R calling *_ELT one by one would be far too slow |
| 98 | +#define make_extract_subset_method(class, type, accessor, NA) \ |
| 99 | + static SEXP alt##class##_Extract_subset(SEXP x, SEXP indx, SEXP call) { \ |
| 100 | + (void)call; \ |
| 101 | + indx = PROTECT(coerceVector(indx, REALSXP)); \ |
| 102 | + double * ii = REAL(indx); \ |
| 103 | + R_xlen_t rlen = XLENGTH(indx), mylen = XLENGTH(x); \ |
| 104 | + SEXP ret = PROTECT(allocVector(TYPEOF(x), rlen)); \ |
| 105 | + type *rdata = accessor(ret), *mydata = accessor(x); \ |
| 106 | + for (R_xlen_t i = 0; i < rlen; ++i) \ |
| 107 | + rdata[i] = (ii[i] >= 1 && ii[i] <= mylen) ? mydata[(R_xlen_t)ii[i]-1] : NA; \ |
| 108 | + UNPROTECT(2); \ |
| 109 | + return ret; \ |
| 110 | + } |
| 111 | +make_extract_subset_method(integer, int, INTEGER, NA_INTEGER) |
| 112 | +make_extract_subset_method(logical, int, LOGICAL, NA_LOGICAL) |
| 113 | +make_extract_subset_method(real, double, REAL, NA_REAL) |
| 114 | +make_extract_subset_method(complex, Rcomplex, COMPLEX, NA_COMPLEX) |
| 115 | +make_extract_subset_method(raw, Rbyte, RAW, 0) |
| 116 | +// not implementing the string and list methods because those do require the write barrier and are thus no better than calling *_ELT one by one |
| 117 | +#undef make_extract_subset_method |
| 118 | + |
| 119 | +#define make_elt_method(class, accessor) \ |
| 120 | + static SEXP alt##class##_Elt(SEXP x, R_xlen_t i) { \ |
| 121 | + return accessor(R_altrep_data1(x), i); \ |
| 122 | + } |
| 123 | +make_elt_method(string, STRING_ELT) |
| 124 | +make_elt_method(list, VECTOR_ELT) |
| 125 | +#undef make_elt_method |
| 126 | + |
| 127 | +#define make_set_elt_method(class, accessor) \ |
| 128 | + static void alt##class##_Set_elt(SEXP x, R_xlen_t i, SEXP v) { \ |
| 129 | + accessor(R_altrep_data1(x), i, v); \ |
| 130 | + } |
| 131 | +make_set_elt_method(string, SET_STRING_ELT) |
| 132 | +make_set_elt_method(list, SET_VECTOR_ELT) |
| 133 | +#undef make_set_elt_method |
| 134 | + |
| 135 | +// liked the Extract_subset methods? say hello to Get_region |
| 136 | +#define make_get_region_method(class, type, accessor) \ |
| 137 | + static R_xlen_t alt##class##_Get_region( \ |
| 138 | + SEXP x, R_xlen_t i, R_xlen_t n, type * buf \ |
| 139 | + ) { \ |
| 140 | + R_xlen_t j = 0, mylen = XLENGTH(x); \ |
| 141 | + type * data = accessor(x); \ |
| 142 | + for (; j < n && i < mylen; ++i, ++j) buf[j] = data[i]; \ |
| 143 | + return j; \ |
| 144 | + } |
| 145 | +make_get_region_method(integer, int, INTEGER) |
| 146 | +make_get_region_method(logical, int, LOGICAL) |
| 147 | +make_get_region_method(real, double, REAL) |
| 148 | +make_get_region_method(complex, Rcomplex, COMPLEX) |
| 149 | +make_get_region_method(raw, Rbyte, RAW) |
| 150 | +#undef make_get_region_method |
| 151 | + |
| 152 | +void register_altrep_classes(DllInfo * info) { |
| 153 | + // Used by the altcomplex_Extract_subset method |
| 154 | + NA_COMPLEX = (Rcomplex){ .r = NA_REAL, .i = NA_REAL }; |
| 155 | + |
| 156 | + dta_grow_string = R_make_altstring_class("growable_string_v0", "data.table", info); |
| 157 | + R_set_altrep_Length_method(dta_grow_string, altall_Length); |
| 158 | + R_set_altrep_Inspect_method(dta_grow_string, altstring_Inspect); |
| 159 | + R_set_altvec_Dataptr_method(dta_grow_string, altstring_Dataptr); |
| 160 | + R_set_altvec_Dataptr_or_null_method(dta_grow_string, altall_Dataptr_or_null); |
| 161 | + R_set_altstring_Elt_method(dta_grow_string, altstring_Elt); |
| 162 | + R_set_altstring_Set_elt_method(dta_grow_string, altstring_Set_elt); |
| 163 | + dta_grow_integer = R_make_altinteger_class("growable_integer_v0", "data.table", info); |
| 164 | + R_set_altrep_Length_method(dta_grow_integer, altall_Length); |
| 165 | + R_set_altrep_Inspect_method(dta_grow_integer, altinteger_Inspect); |
| 166 | + R_set_altvec_Dataptr_method(dta_grow_integer, altinteger_Dataptr); |
| 167 | + R_set_altvec_Dataptr_or_null_method(dta_grow_integer, altall_Dataptr_or_null); |
| 168 | + R_set_altvec_Extract_subset_method(dta_grow_integer, altinteger_Extract_subset); |
| 169 | + R_set_altinteger_Get_region_method(dta_grow_integer, altinteger_Get_region); |
| 170 | + dta_grow_logical = R_make_altlogical_class("growable_logical_v0", "data.table", info); |
| 171 | + R_set_altrep_Length_method(dta_grow_logical, altall_Length); |
| 172 | + R_set_altrep_Inspect_method(dta_grow_logical, altlogical_Inspect); |
| 173 | + R_set_altvec_Dataptr_method(dta_grow_logical, altlogical_Dataptr); |
| 174 | + R_set_altvec_Dataptr_or_null_method(dta_grow_logical, altall_Dataptr_or_null); |
| 175 | + R_set_altvec_Extract_subset_method(dta_grow_logical, altlogical_Extract_subset); |
| 176 | + R_set_altlogical_Get_region_method(dta_grow_logical, altlogical_Get_region); |
| 177 | + dta_grow_real = R_make_altreal_class("growable_real_v0", "data.table", info); |
| 178 | + R_set_altrep_Length_method(dta_grow_real, altall_Length); |
| 179 | + R_set_altrep_Inspect_method(dta_grow_real, altreal_Inspect); |
| 180 | + R_set_altvec_Dataptr_method(dta_grow_real, altreal_Dataptr); |
| 181 | + R_set_altvec_Dataptr_or_null_method(dta_grow_real, altall_Dataptr_or_null); |
| 182 | + R_set_altvec_Extract_subset_method(dta_grow_real, altreal_Extract_subset); |
| 183 | + R_set_altreal_Get_region_method(dta_grow_real, altreal_Get_region); |
| 184 | + dta_grow_complex = R_make_altcomplex_class("growable_complex_v0", "data.table", info); |
| 185 | + R_set_altrep_Length_method(dta_grow_complex, altall_Length); |
| 186 | + R_set_altrep_Inspect_method(dta_grow_complex, altcomplex_Inspect); |
| 187 | + R_set_altvec_Dataptr_method(dta_grow_complex, altcomplex_Dataptr); |
| 188 | + R_set_altvec_Dataptr_or_null_method(dta_grow_complex, altall_Dataptr_or_null); |
| 189 | + R_set_altvec_Extract_subset_method(dta_grow_complex, altcomplex_Extract_subset); |
| 190 | + R_set_altcomplex_Get_region_method(dta_grow_complex, altcomplex_Get_region); |
| 191 | + dta_grow_raw = R_make_altraw_class("growable_raw_v0", "data.table", info); |
| 192 | + R_set_altrep_Length_method(dta_grow_raw, altall_Length); |
| 193 | + R_set_altrep_Inspect_method(dta_grow_raw, altraw_Inspect); |
| 194 | + R_set_altvec_Dataptr_method(dta_grow_raw, altraw_Dataptr); |
| 195 | + R_set_altvec_Dataptr_or_null_method(dta_grow_raw, altall_Dataptr_or_null); |
| 196 | + R_set_altvec_Extract_subset_method(dta_grow_raw, altraw_Extract_subset); |
| 197 | + R_set_altraw_Get_region_method(dta_grow_raw, altraw_Get_region); |
| 198 | + dta_grow_list = R_make_altlist_class("growable_list_v0", "data.table", info); |
| 199 | + R_set_altrep_Length_method(dta_grow_list, altall_Length); |
| 200 | + R_set_altrep_Inspect_method(dta_grow_list, altlist_Inspect); |
| 201 | + R_set_altvec_Dataptr_method(dta_grow_list, altlist_Dataptr); |
| 202 | + R_set_altvec_Dataptr_or_null_method(dta_grow_list, altall_Dataptr_or_null); |
| 203 | + R_set_altlist_Elt_method(dta_grow_list, altlist_Elt); |
| 204 | + R_set_altlist_Set_elt_method(dta_grow_list, altlist_Set_elt); |
| 205 | +} |
| 206 | + |
| 207 | +static R_altrep_class_t dta_grow_string, dta_grow_integer, dta_grow_logical, dta_grow_real, dta_grow_complex, dta_grow_raw, dta_grow_list; |
| 208 | + |
| 209 | +static R_altrep_class_t type2class(SEXPTYPE type) { |
| 210 | + switch(type) { |
| 211 | + case STRSXP: |
| 212 | + return dta_grow_string; |
| 213 | + case INTSXP: |
| 214 | + return dta_grow_integer; |
| 215 | + case LGLSXP: |
| 216 | + return dta_grow_logical; |
| 217 | + case REALSXP: |
| 218 | + return dta_grow_real; |
| 219 | + case CPLXSXP: |
| 220 | + return dta_grow_complex; |
| 221 | + case RAWSXP: |
| 222 | + return dta_grow_raw; |
| 223 | + case VECSXP: |
| 224 | + case EXPRSXP: |
| 225 | + return dta_grow_list; |
| 226 | + default: |
| 227 | + internal_error(__func__, "Can't create a growable vector of type '%s'", type2char(type)); |
| 228 | + } |
| 229 | +} |
| 230 | + |
| 231 | +SEXP growable_allocate(SEXPTYPE type, R_xlen_t size, R_xlen_t max_size) { |
| 232 | + SEXP ret = PROTECT(R_new_altrep(type2class(type), R_NilValue, R_NilValue)); |
| 233 | + R_set_altrep_data1(ret, allocVector(type, max_size)); |
| 234 | + R_set_altrep_data2(ret, ScalarReal(size)); |
| 235 | + UNPROTECT(1); |
| 236 | + return ret; |
| 237 | +} |
| 238 | + |
| 239 | +R_xlen_t growable_max_size(SEXP x) { |
| 240 | + return XLENGTH(R_altrep_data1(x)); |
| 241 | +} |
| 242 | + |
| 243 | +void growable_resize(SEXP x, R_xlen_t newsize) { |
| 244 | + R_xlen_t max_size; |
| 245 | + if (newsize > (max_size = growable_max_size(x))) internal_error( |
| 246 | + __func__, "newsize=%g > max_size=%g", |
| 247 | + (double)newsize, (double)max_size |
| 248 | + ); |
| 249 | + REAL(R_altrep_data2(x))[0] = newsize; |
| 250 | +} |
| 251 | + |
| 252 | +Rboolean is_growable(SEXP x) { |
| 253 | + switch(TYPEOF(x)) { |
| 254 | + case STRSXP: |
| 255 | + case INTSXP: |
| 256 | + case LGLSXP: |
| 257 | + case REALSXP: |
| 258 | + case CPLXSXP: |
| 259 | + case RAWSXP: |
| 260 | + case VECSXP: |
| 261 | + return R_altrep_inherits(x, type2class(TYPEOF(x))); |
| 262 | + default: |
| 263 | + return FALSE; |
| 264 | + } |
| 265 | +} |
| 266 | + |
| 267 | +SEXP make_growable(SEXP x) { |
| 268 | + SEXP ret = PROTECT(R_new_altrep(type2class(TYPEOF(x)), R_NilValue, R_NilValue)); |
| 269 | + R_set_altrep_data1(ret, x); |
| 270 | + R_set_altrep_data2(ret, ScalarReal(XLENGTH(x))); |
| 271 | + SHALLOW_DUPLICATE_ATTRIB(ret, x); |
| 272 | + UNPROTECT(1); |
| 273 | + return ret; |
| 274 | +} |
| 275 | + |
| 276 | +#endif |
0 commit comments