Rdatatable · MichaelChirico · Jan 2, 2020 · Jan 2, 2020 · Jan 2, 2020 · Jan 3, 2020
@@ -56,6 +56,7 @@ export(nafill)
 export(setnafill)
 export(.Last.updated)
 export(fcoalesce)
+export(unnest)
 
 S3method("[", data.table)
 S3method("[<-", data.table)

@@ -356,8 +356,6 @@ CJ = function(..., sorted = TRUE, unique = FALSE)
       if (unique) l[[i]] = unique(y)
     }
   }
-  nrow = prod( vapply_1i(l, length) )  # lengths(l) will work from R 3.2.0
-  if (nrow > .Machine$integer.max) stop(gettextf("Cross product of elements provided to CJ() would result in %.0f rows which exceeds .Machine$integer.max == %d", nrow, .Machine$integer.max, domain='R-data.table'))
   l = .Call(Ccj, l)
   setDT(l)
   l = setalloccol(l)  # a tiny bit wasteful to over-allocate a fixed join table (column slots only), doing it anyway for consistency since

@@ -11,4 +11,6 @@ fcase   = function(..., default=NA) .Call(CfcaseR, default, parent.frame(), as.l
 colnamesInt = function(x, cols, check_dups=FALSE) .Call(CcolnamesInt, x, cols, check_dups)
 coerceFill = function(x) .Call(CcoerceFillR, x)
 
+unnest = function(x, cols = which(vapply_1b(x, is.list))) .Call(Cunnest, x, cols)
+
 testMsg = function(status=0L, nx=2L, nk=2L) .Call(CtestMsgR, as.integer(status)[1L], as.integer(nx)[1L], as.integer(nk)[1L])
@@ -1,96 +1,235 @@
 #include "data.table.h"
 
+// workhorse for cycling a vector in the correct pattern,
+//   essentially rep(x, m, each = n) for appropriate m,n at each j
+void cycle_vector(SEXP source, SEXP target, int j, int eachrep, int nrow) {
+  int thislen = LENGTH(source);
+  int blocklen = thislen*eachrep;
+  int ncopy = nrow/blocklen;
+  switch(TYPEOF(source)) {
+  case LGLSXP:
+  case INTSXP: {
+    const int *restrict sourceP = INTEGER(source);
+    int *restrict targetP = INTEGER(target);
+    #pragma omp parallel for num_threads(getDTthreads()) if (nrow >= OMP_MIN_VALUE)
+    // default static schedule so two threads won't write to same cache line in last column
+    // if they did write to same cache line (and will when last column's thislen is small) there's no correctness issue
+    for (int i=0; i<thislen; ++i) {
+      const int item = sourceP[i];
+      const int end = (i+1)*eachrep;
+      for (int j=i*eachrep; j<end; ++j)
+        targetP[j] = item;  // no div, mod or read ops inside loop; just rep a const contiguous write
+    }
+    #pragma omp parallel for num_threads(getDTthreads()) if (nrow >= OMP_MIN_VALUE)
+    for (int i=1; i<ncopy; ++i) {
+      memcpy(targetP + i*blocklen, targetP, blocklen*sizeof(int));
+    }
+  } break;
+  case REALSXP: {
+    const double *restrict sourceP = REAL(source);
+    double *restrict targetP = REAL(target);
+    #pragma omp parallel for num_threads(getDTthreads()) if (nrow >= OMP_MIN_VALUE)
+    for (int i=0; i<thislen; ++i) {
+      const double item = sourceP[i];
+      const int end=(i+1)*eachrep;
+      for (int j=i*eachrep; j<end; ++j) targetP[j] = item;
+    }
+    #pragma omp parallel for num_threads(getDTthreads()) if (nrow >= OMP_MIN_VALUE)
+    for (int i=1; i<ncopy; ++i) {
+      memcpy(targetP + i*blocklen, targetP, blocklen*sizeof(double));
+    }
+  } break;
+  case CPLXSXP: {
+    const Rcomplex *restrict sourceP = COMPLEX(source);
+    Rcomplex *restrict targetP = COMPLEX(target);
+    #pragma omp parallel for num_threads(getDTthreads()) if (nrow >= OMP_MIN_VALUE)
+    for (int i=0; i<thislen; ++i) {
+      const Rcomplex item = sourceP[i];
+      const int end=(i+1)*eachrep;
+      for (int j=i*eachrep; j<end; ++j) targetP[j] = item;
+    }
+    #pragma omp parallel for num_threads(getDTthreads()) if (nrow >= OMP_MIN_VALUE)
+    for (int i=1; i<ncopy; ++i) {
+      memcpy(targetP + i*blocklen, targetP, blocklen*sizeof(Rcomplex));
+    }
+  } break;
+  case STRSXP: {
+    const SEXP *sourceP = STRING_PTR(source);
+    int start = 0;
+    for (int i=0; i<ncopy; ++i) {
+      for (int j=0; j<thislen; ++j) {
+        const SEXP item = sourceP[j];
+        const int end = start+eachrep;
+        for (int k=start; k<end; ++k) SET_STRING_ELT(target, k, item);  // no div, mod, or read-API call to STRING_ELT
+        start = end;
+      }
+    }
+  } break;
+  case VECSXP: {
+    const SEXP *sourceP = VECTOR_PTR(source);
+    int start = 0;
+    for (int i=0; i<ncopy; ++i) {
+      for (int j=0; j<thislen; ++j) {
+        const SEXP item = sourceP[j];
+        const int end = start+eachrep;
+        for (int k=start; k<end; ++k) SET_VECTOR_ELT(target, k, item);
+        start = end;
+      }
+    }
+  } break;
+  default:
+    error(_("Type '%s' not supported by for cross-join."), type2char(TYPEOF(source)));
+  }
+}
+
 SEXP cj(SEXP base_list) {
   int ncol = LENGTH(base_list);
   SEXP out = PROTECT(allocVector(VECSXP, ncol));
-  int nrow = 1;
-  // already confirmed to be less than .Machine$integer.max at R level
-  for (int j=0; j<ncol; ++j) nrow *= length(VECTOR_ELT(base_list, j));
+  // start with double to allow overflow
+  double nrow_dbl=1;
+  int nrow;
+  for (int j=0; j<ncol; ++j) nrow_dbl *= length(VECTOR_ELT(base_list, j));
+  if (nrow_dbl > INT_MAX) {
+      error(_("Cross product of elements provided to CJ() would result in %.0f rows which exceeds .Machine$integer.max == %d"), nrow_dbl, INT_MAX);
+  } else {
+    nrow = (int) nrow_dbl;
+  }
   int eachrep = 1;
   for (int j=ncol-1; j>=0; --j) {
     SEXP source = VECTOR_ELT(base_list, j), target;
     SET_VECTOR_ELT(out, j, target=allocVector(TYPEOF(source), nrow));
     copyMostAttrib(source, target);  // includes levels of factors, integer64, custom classes, etc
     if (nrow==0) continue;  // one or more columns are empty so the result will be empty, #2511
-    int thislen = LENGTH(source);
-    int blocklen = thislen*eachrep;
-    int ncopy = nrow/blocklen;
-    switch(TYPEOF(source)) {
-    case LGLSXP:
-    case INTSXP: {
-      const int *restrict sourceP = INTEGER(source);
-      int *restrict targetP = INTEGER(target);
-      #pragma omp parallel for num_threads(getDTthreads())
-      // default static schedule so two threads won't write to same cache line in last column
-      // if they did write to same cache line (and will when last column's thislen is small) there's no correctness issue
-      for (int i=0; i<thislen; ++i) {
-        const int item = sourceP[i];
-        const int end = (i+1)*eachrep;
-        for (int j=i*eachrep; j<end; ++j) targetP[j] = item;  // no div, mod or read ops inside loop; just rep a const contiguous write
-      }
-      #pragma omp parallel for num_threads(getDTthreads())
-      for (int i=1; i<ncopy; ++i) {
-        memcpy(targetP + i*blocklen, targetP, blocklen*sizeof(int));
-      }
-    } break;
-    case REALSXP: {
-      const double *restrict sourceP = REAL(source);
-      double *restrict targetP = REAL(target);
-      #pragma omp parallel for num_threads(getDTthreads())
-      for (int i=0; i<thislen; ++i) {
-        const double item = sourceP[i];
-        const int end=(i+1)*eachrep;
-        for (int j=i*eachrep; j<end; ++j) targetP[j] = item;
-      }
-      #pragma omp parallel for num_threads(getDTthreads())
-      for (int i=1; i<ncopy; ++i) {
-        memcpy(targetP + i*blocklen, targetP, blocklen*sizeof(double));
-      }
-    } break;
-    case CPLXSXP: {
-      const Rcomplex *restrict sourceP = COMPLEX(source);
-      Rcomplex *restrict targetP = COMPLEX(target);
-      #pragma omp parallel for num_threads(getDTthreads())
-      for (int i=0; i<thislen; ++i) {
-        const Rcomplex item = sourceP[i];
-        const int end=(i+1)*eachrep;
-        for (int j=i*eachrep; j<end; ++j) targetP[j] = item;
-      }
-      #pragma omp parallel for num_threads(getDTthreads())
-      for (int i=1; i<ncopy; ++i) {
-        memcpy(targetP + i*blocklen, targetP, blocklen*sizeof(Rcomplex));
-      }
+    cycle_vector(source, target, j, eachrep, nrow);
+    eachrep *= LENGTH(source);
+  }
+  UNPROTECT(1);
+  return out;
+}
+
+SEXP unnest(SEXP x, SEXP cols) {
+  int k = LENGTH(cols);
+  // nothing to unnest -- need to go further, just be sure to copy
+  if (k == 0)
+    return (duplicate(x));
+  int n = LENGTH(VECTOR_ELT(x, 0));
+  int p = LENGTH(x);
+
+  if (TYPEOF(cols) != INTSXP)
+    error(_("cols must be an integer vector, got %s"), type2char(TYPEOF(cols)));
+  int *colp = INTEGER(cols);
+
+  // ignore non-VECSXP elements of cols; use lcols and lk (list-only versions)
+  int lcols[k], j;
+  int lk=0;
+  for (int i=0; i<k; i++) {
+    j = colp[i];
+    if (j < 1 || j > p)
+      error(_("cols to unnest must be in [1, ncol(x)=%d], but cols[%d]=%d"), p, i, j);
+    switch(TYPEOF(VECTOR_ELT(x, j-1))) {
+    case RAWSXP :
+    case LGLSXP :
+    case INTSXP :
+    case REALSXP :
+    case CPLXSXP :
+    case STRSXP : break;
+    case VECSXP : {
+      lcols[lk++] = j-1; // move to 0-based
     } break;
-    case STRSXP: {
-      const SEXP *sourceP = STRING_PTR(source);
-      int start = 0;
-      for (int i=0; i<ncopy; ++i) {
-        for (int j=0; j<thislen; ++j) {
-          const SEXP item = sourceP[j];
-          const int end = start+eachrep;
-          for (int k=start; k<end; ++k) SET_STRING_ELT(target, k, item);  // no div, mod, or read-API call to STRING_ELT
-          start = end;
+    default:
+      error(_("Unsupported type for unnesting: %s"), type2char(TYPEOF(VECTOR_ELT(x, j))));
+    }
+  }
+  if (lk == 0)
+    return (duplicate(x));
+
+  int row_counts[n];
+
+  SEXP cj_rowwise = PROTECT(allocVector(VECSXP, n));
+  for (int i=0; i<n; i++) {
+    SEXP nest_vals = PROTECT(allocVector(VECSXP, lk));
+    for (int j=0; j<lk; j++)
+      SET_VECTOR_ELT(nest_vals, j, VECTOR_ELT(VECTOR_ELT(x, lcols[j]), i));
+    SET_VECTOR_ELT(cj_rowwise, i, cj(nest_vals));
+    row_counts[i] = LENGTH(VECTOR_ELT(VECTOR_ELT(cj_rowwise, i), 0));
+    UNPROTECT(1);
+  }
+  SEXP unnest_lcols = rbindlist(cj_rowwise, ScalarLogical(FALSE), ScalarLogical(FALSE), R_NilValue);
+  UNPROTECT(1);
+  int out_rows = LENGTH(VECTOR_ELT(unnest_lcols, 0));
+
+  SEXP ans = PROTECT(allocVector(VECSXP, p));
+  copyMostAttrib(x, ans);
+  for (int j=0, lj=0; j<p; j++) {
+    if (lj < lk && j == lcols[lj]) { // vec col: apply unnesting
+      SET_VECTOR_ELT(ans, j, VECTOR_ELT(unnest_lcols, lj++));
+    } else { // non-vec col: simply copy
+      int outi=0;
+      SEXP xj = VECTOR_ELT(x, j), ansj;
+      SET_VECTOR_ELT(ans, j, ansj=allocVector(TYPEOF(xj), out_rows));
+      switch(TYPEOF(xj)) {
+      case RAWSXP: {
+        const Rbyte *source = RAW(xj);
+        Rbyte *target = RAW(ansj);
+        for (int i=0; i<n; i++) {
+          for(int repi=0; repi<row_counts[i]; repi++) {
+            memcpy(target + outi + repi, &source[i], sizeof(Rbyte));
+          }
+          outi += row_counts[i];
         }
-      }
-    } break;
-    case VECSXP: {
-      const SEXP *sourceP = VECTOR_PTR(source);
-      int start = 0;
-      for (int i=0; i<ncopy; ++i) {
-        for (int j=0; j<thislen; ++j) {
-          const SEXP item = sourceP[j];
-          const int end = start+eachrep;
-          for (int k=start; k<end; ++k) SET_VECTOR_ELT(target, k, item);
-          start = end;
+      } break;
+      case LGLSXP:
+      case INTSXP: {
+        const int *source = INTEGER(xj);
+        int *target = INTEGER(ansj);
+        for (int i=0; i<n; i++) {
+          for(int repi=0; repi<row_counts[i]; repi++) {
+            memcpy(target + outi + repi, &source[i], sizeof(int));
+          }
+          outi += row_counts[i];
+        }
+      } break;
+      case REALSXP: {
+        const double *source = REAL(xj);
+        double *target = REAL(ansj);
+        for (int i=0; i<n; i++) {
+          for(int repi=0; repi<row_counts[i]; repi++) {
+            memcpy(target + outi + repi, &source[i], sizeof(double));
+          }
+          outi += row_counts[i];
         }
+      } break;
+      case CPLXSXP: {
+        const Rcomplex *source = COMPLEX(xj);
+        Rcomplex *target = COMPLEX(ansj);
+        for (int i=0; i<n; i++) {
+          for(int repi=0; repi<row_counts[i]; repi++) {
+            memcpy(target + outi + repi, &source[i], sizeof(Rcomplex));
+          }
+          outi += row_counts[i];
+        }
+      } break;
+      case STRSXP: {
+        for (int i=0; i<n; i++) {
+          for(int repi=0; repi<row_counts[i]; repi++) {
+            SET_STRING_ELT(ansj, outi + repi, STRING_ELT(xj, i));
+          }
+          outi += row_counts[i];
+        }
+      } break;
+      default: error(_("Unsupported column type %s"), type2char(TYPEOF(xj)));
       }
-    } break;
-    default:
-      error(_("Type '%s' not supported by CJ."), type2char(TYPEOF(source)));
+      copyMostAttrib(xj, ansj);
     }
-    eachrep *= thislen;
   }
-  UNPROTECT(1);
-  return out;
-}
 
+  // copy names
+  SEXP ansNames;
+  SEXP xNames = PROTECT(getAttrib(x, R_NamesSymbol));
+  setAttrib(ans, R_NamesSymbol, ansNames=allocVector(STRSXP, p));
+  for (int j=0; j<p; j++) {
+    SET_STRING_ELT(ansNames, j, STRING_ELT(xNames, j));
+  }
+  UNPROTECT(2);
+  return ans;
+}
@@ -103,6 +103,10 @@ bool GetVerbose();
 
 // cj.c
 SEXP cj(SEXP base_list);
+SEXP unnest(SEXP x, SEXP cols);
+
+// rbindlist.c
+SEXP rbindlist(SEXP l, SEXP usenamesArg, SEXP fillArg, SEXP idcolArg);
 
 // dogroups.c
 SEXP keepattr(SEXP to, SEXP from);

@@ -119,6 +119,7 @@ SEXP lock();
 SEXP unlock();
 SEXP islockedR();
 SEXP allNAR();
+SEXP unnest();
 
 // .Externals
 SEXP fastmean();
@@ -211,6 +212,7 @@ R_CallMethodDef callMethods[] = {
 {"CfrollapplyR", (DL_FUNC) &frollapplyR, -1},
 {"CtestMsgR", (DL_FUNC) &testMsgR, -1},
 {"C_allNAR", (DL_FUNC) &allNAR, -1},
+{"Cunnest", (DL_FUNC) &unnest, -1},
 {NULL, NULL, 0}
 };
 

@@ -11,3 +11,4 @@
   #define omp_get_wtime()        0
 #endif
 
+#define OMP_MIN_VALUE 1024
@@ -1,6 +1,5 @@
 #include "data.table.h"
 #include <Rdefines.h>
-#include <ctype.h>   // for isdigit
 
 SEXP rbindlist(SEXP l, SEXP usenamesArg, SEXP fillArg, SEXP idcolArg)
 {
Original file line number	Diff line number	Diff line change
Expand Up		@@ -11,3 +11,4 @@
		#define omp_get_wtime() 0
		#endif

		#define OMP_MIN_VALUE 1024