LCOV - code coverage report
Current view: top level - gdk - gdk_project.c (source / functions) Hit Total Coverage
Test: coverage.info Lines: 394 714 55.2 %
Date: 2024-04-26 00:35:57 Functions: 21 22 95.5 %

          Line data    Source code
       1             : /*
       2             :  * SPDX-License-Identifier: MPL-2.0
       3             :  *
       4             :  * This Source Code Form is subject to the terms of the Mozilla Public
       5             :  * License, v. 2.0.  If a copy of the MPL was not distributed with this
       6             :  * file, You can obtain one at http://mozilla.org/MPL/2.0/.
       7             :  *
       8             :  * Copyright 2024 MonetDB Foundation;
       9             :  * Copyright August 2008 - 2023 MonetDB B.V.;
      10             :  * Copyright 1997 - July 2008 CWI.
      11             :  */
      12             : 
      13             : #include "monetdb_config.h"
      14             : #include "gdk.h"
      15             : #include "gdk_private.h"
      16             : 
      17             : /*
      18             :  * BATproject returns a BAT aligned with the left input whose values
      19             :  * are the values from the right input that were referred to by the
      20             :  * OIDs in the left input.
      21             :  *
      22             :  * BATproject2 is similar, except that instead of a single right input
      23             :  * there are two, where the second's hseqbase is equal to the first's
      24             :  * hseqbase + the first's batCount.
      25             :  */
      26             : /*
                     :  * project1_loop(TYPE) defines project1_TYPE(), the single-right-input
                     :  * copy loop: for every OID in the left input li, the TYPE value at
                     :  * that OID in r1i is copied to the same position in bn's tail.
                     :  *
                     :  *  bn       result BAT; values are written starting at Tloc(bn, 0)
                     :  *  li       left input (OIDs); either dense or an oid array at li->base
                     :  *  r1i      right input; its values are read as a TYPE array at r1i->base
                     :  *  qry_ctx  query context handed to the TIMEOUT_* macros
                     :  *
                     :  * Valid OIDs are those in [r1seq, r1end).  An OID outside that range
                     :  * reports "does not match always" and returns GDK_FAIL.  Nil OIDs are
                     :  * not tested for here; the visible callers only dispatch to this
                     :  * function when li->nonil is set.
                     :  *
                     :  * In the dense case li->tseq + li->count is one past the last OID
                     :  * used, so it may be equal to r1end; only a larger value is out of
                     :  * range.  (The check used to be ">=", which refused a dense left side
                     :  * ending exactly on the last element of r1 although the per-OID branch
                     :  * accepts that same OID.)
                     :  *
                     :  * On success the count of bn is set to the number of values copied
                     :  * and GDK_SUCCEED is returned.  TIMEOUT_CHECK presumably returns
                     :  * GDK_FAIL through TIMEOUT_HANDLER when the query timed out.
                     :  */
      27             : #define project1_loop(TYPE)                                             \
      28             : static gdk_return                                                       \
      29             : project1_##TYPE(BAT *restrict bn, BATiter *restrict li,                 \
      30             :                 BATiter *restrict r1i, QryCtx *qry_ctx)                 \
      31             : {                                                                       \
      32             :         BUN lo;                                                         \
      33             :         const TYPE *restrict r1t;                                       \
      34             :         TYPE *restrict bt;                                              \
      35             :         oid r1seq, r1end;                                               \
      36             :                                                                         \
      37             :         MT_thread_setalgorithm(__func__);                               \
      38             :         r1t = (const TYPE *) r1i->base;                                      \
      39             :         bt = (TYPE *) Tloc(bn, 0);                                      \
      40             :         r1seq = r1i->b->hseqbase;                                 \
      41             :         r1end = r1seq + r1i->count;                                  \
      42             :         if (BATtdensebi(li)) {                                          \
      43             :                 if (li->tseq < r1seq ||                                   \
      44             :                     (li->tseq + li->count) > r1end) {                  \
      45             :                         GDKerror("does not match always\n");          \
      46             :                         return GDK_FAIL;                                \
      47             :                 }                                                       \
      48             :                 oid off = li->tseq - r1seq;                          \
      49             :                 r1t += off;                                             \
      50             :                 TIMEOUT_LOOP_IDX(lo, li->count, qry_ctx)             \
      51             :                         bt[lo] = r1t[lo];                               \
      52             :         } else {                                                        \
      53             :                 assert(li->type);                                    \
      54             :                 const oid *restrict ot = (const oid *) li->base;     \
      55             :                 TIMEOUT_LOOP_IDX(lo, li->count, qry_ctx) {           \
      56             :                         oid o = ot[lo];                                 \
      57             :                         if (o < r1seq || o >= r1end) {                    \
      58             :                                 GDKerror("does not match always\n");  \
      59             :                                 return GDK_FAIL;                        \
      60             :                         }                                               \
      61             :                         bt[lo] = r1t[o - r1seq];                        \
      62             :                 }                                                       \
      63             :         }                                                               \
      64             :         TIMEOUT_CHECK(qry_ctx, TIMEOUT_HANDLER(GDK_FAIL, qry_ctx));     \
      65             :         BATsetcount(bn, lo);                                            \
      66             :         return GDK_SUCCEED;                                             \
      67             : }
      68             : 
      69             : /* project type switch: expand project1_loop once per element type, defining project1_bte(), project1_sht(), ... */
      70    64404516 : project1_loop(bte)
      71    31186992 : project1_loop(sht)
      72   619235492 : project1_loop(int)
      73        1554 : project1_loop(flt)
      74     1009263 : project1_loop(dbl)
      75   185065077 : project1_loop(lng)
      76             : #ifdef HAVE_HGE
      77    77180097 : project1_loop(hge)
      78             : #endif
      79         150 : project1_loop(uuid)
      80             : /*
                     :  * project_loop(TYPE) defines project_TYPE(), the general projection
                     :  * loop for TYPE values with one or two right inputs.
                     :  *
                     :  *  bn       result BAT; values are written starting at Tloc(bn, 0)
                     :  *  li       left input (OIDs)
                     :  *  ci       optional candidate iterator; when non-NULL the OIDs come
                     :  *           from canditer_next(ci) (ci->ncand of them) instead of li
                     :  *  r1i      first right input, read as a TYPE array at r1i->base
                     :  *  r2i      optional second right input (may be NULL)
                     :  *  qry_ctx  query context handed to the TIMEOUT_* macros
                     :  *
                     :  * When there is no r2i, the left side is nil-free and is either used
                     :  * without candidates or is dense with dense candidates, and r1i is a
                     :  * non-void, non-dense BAT, the work is delegated to project1_TYPE().
                     :  *
                     :  * Otherwise each OID o is taken from ci, from the dense sequence
                     :  * li->tseq + i, or from the oid array at li->base.  An OID below r1end
                     :  * is looked up in r1, any other OID in r2.  The range test is against
                     :  * [r1seq, r2end), which relies on r2 starting where r1 ends (see the
                     :  * description of BATproject2 at the top of this file); without r2i,
                     :  * r2seq and r2end are both set to r1end so the r2 range is empty.
                     :  * An OID outside the range reports "does not match always" and
                     :  * returns GDK_FAIL.  Only the oid-array branch tests for nil OIDs;
                     :  * those produce TYPE##_nil and set bn->tnil.
                     :  *
                     :  * On success the count of bn is set to the number of values written
                     :  * and GDK_SUCCEED is returned.  TIMEOUT_CHECK presumably returns
                     :  * GDK_FAIL through TIMEOUT_HANDLER when the query timed out.
                     :  */
      81             : #define project_loop(TYPE)                                              \
      82             : static gdk_return                                                       \
      83             : project_##TYPE(BAT *restrict bn, BATiter *restrict li,                  \
      84             :                struct canditer *restrict ci,                            \
      85             :                BATiter *restrict r1i, BATiter *restrict r2i,            \
      86             :                QryCtx *qry_ctx)                                         \
      87             : {                                                                       \
      88             :         BUN lo;                                                         \
      89             :         const TYPE *restrict r1t;                                       \
      90             :         const TYPE *restrict r2t;                                       \
      91             :         TYPE *restrict bt;                                              \
      92             :         TYPE v;                                                         \
      93             :         oid r1seq, r1end;                                               \
      94             :         oid r2seq, r2end;                                               \
      95             :                                                                         \
      96             :         if (r2i == NULL &&                                              \
      97             :             (ci == NULL || (ci->tpe == cand_dense && BATtdensebi(li))) && \
      98             :             li->nonil && r1i->type && !BATtdensebi(r1i))          \
      99             :                 return project1_##TYPE(bn, li, r1i, qry_ctx);           \
     100             :         MT_thread_setalgorithm(__func__);                               \
     101             :         r1t = (const TYPE *) r1i->base;                                      \
     102             :         bt = (TYPE *) Tloc(bn, 0);                                      \
     103             :         r1seq = r1i->b->hseqbase;                                 \
     104             :         r1end = r1seq + r1i->count;                                  \
     105             :         if (r2i) {                                                      \
     106             :                 r2t = (const TYPE *) r2i->base;                              \
     107             :                 r2seq = r2i->b->hseqbase;                         \
     108             :                 r2end = r2seq + r2i->count;                          \
     109             :         } else {                                                        \
     110             :                 r2t = NULL;                                             \
     111             :                 r2seq = r2end = r1end;                                  \
     112             :         }                                                               \
     113             :         if (ci) {                                                       \
     114             :                 TIMEOUT_LOOP_IDX(lo, ci->ncand, qry_ctx) {           \
     115             :                         oid o = canditer_next(ci);                      \
     116             :                         if (o < r1seq || o >= r2end) {                    \
     117             :                                 GDKerror("does not match always\n");  \
     118             :                                 return GDK_FAIL;                        \
     119             :                         }                                               \
     120             :                         if (o < r1end)                                       \
     121             :                                 v = r1t[o - r1seq];                     \
     122             :                         else                                            \
     123             :                                 v = r2t[o - r2seq];                     \
     124             :                         bt[lo] = v;                                     \
     125             :                 }                                                       \
     126             :         } else if (BATtdensebi(li)) {                                   \
     127             :                 TIMEOUT_LOOP_IDX(lo, li->count, qry_ctx) {           \
     128             :                         oid o = li->tseq + lo;                               \
     129             :                         if (o < r1seq || o >= r2end) {                    \
     130             :                                 GDKerror("does not match always\n");  \
     131             :                                 return GDK_FAIL;                        \
     132             :                         }                                               \
     133             :                         if (o < r1end)                                       \
     134             :                                 v = r1t[o - r1seq];                     \
     135             :                         else                                            \
     136             :                                 v = r2t[o - r2seq];                     \
     137             :                         bt[lo] = v;                                     \
     138             :                 }                                                       \
     139             :         } else {                                                        \
     140             :                 const oid *restrict ot = (const oid *) li->base;     \
     141             :                 TIMEOUT_LOOP_IDX(lo, li->count, qry_ctx) {           \
     142             :                         oid o = ot[lo];                                 \
     143             :                         if (is_oid_nil(o)) {                            \
     144             :                                 bt[lo] = v = TYPE##_nil;                \
     145             :                                 bn->tnil = true;                     \
     146             :                         } else if (o < r1seq || o >= r2end) {             \
     147             :                                 GDKerror("does not match always\n");  \
     148             :                                 return GDK_FAIL;                        \
     149             :                         } else if (o < r1end) {                              \
     150             :                                 v = r1t[o - r1seq];                     \
     151             :                                 bt[lo] = v;                             \
     152             :                         } else {                                        \
     153             :                                 v = r2t[o - r2seq];                     \
     154             :                                 bt[lo] = v;                             \
     155             :                         }                                               \
     156             :                 }                                                       \
     157             :         }                                                               \
     158             :         TIMEOUT_CHECK(qry_ctx, TIMEOUT_HANDLER(GDK_FAIL, qry_ctx));     \
     159             :         BATsetcount(bn, lo);                                            \
     160             :         return GDK_SUCCEED;                                             \
     161             : }
     162             : 
     163             : 
     164             : /* project type switch: expand project_loop once per element type, defining project_bte(), project_sht(), ... */
     165      201276 : project_loop(bte)
     166      429888 : project_loop(sht)
     167    19224979 : project_loop(int)
     168          89 : project_loop(flt)
     169        5312 : project_loop(dbl)
     170       24477 : project_loop(lng)
     171             : #ifdef HAVE_HGE
     172     1221816 : project_loop(hge)
     173             : #endif
     174          31 : project_loop(uuid)
     175             : /*
                     :  * project_oid: projection loop for oid-typed right inputs.
                     :  *
                     :  *  bn       result BAT; oids are written starting at Tloc(bn, 0)
                     :  *  li       left input (OIDs)
                     :  *  lci      optional candidate iterator for the left side; when
                     :  *           non-NULL the OIDs come from canditer_next(lci)
                     :  *  r1i      first right input
                     :  *  r2i      optional second right input (may be NULL)
                     :  *  qry_ctx  query context handed to the TIMEOUT_* macros
                     :  *
                     :  * For every OID o from the left side (lci when given, else the dense
                     :  * sequence li->tseq + i, else the oid array at li->base) one oid is
                     :  * written to position i of bn:
                     :  *  - o below r1end is looked up in r1, any other o in r2;
                     :  *  - the lookup uses canditer_idx() when the right BAT satisfies
                     :  *    complex_cand(), the oid array at ->base when the right BAT is
                     :  *    not dense, and the arithmetic o - seq + tseq when it is dense;
                     :  *  - a nil OID (only tested for in the oid-array branch) yields
                     :  *    oid_nil and flags bn as containing nils.
                     :  * The range test is against [r1seq, r2end), which relies on r2
                     :  * starting where r1 ends; without r2i the r2 range is empty.  An OID
                     :  * outside the range reports "does not match always" and returns
                     :  * GDK_FAIL.
                     :  *
                     :  * On success the count of bn is set to the number of values written
                     :  * and GDK_SUCCEED is returned.  TIMEOUT_CHECK presumably returns
                     :  * GDK_FAIL through TIMEOUT_HANDLER when the query timed out.
                     :  */
     176             : static gdk_return
     177       16161 : project_oid(BAT *restrict bn, BATiter *restrict li,
     178             :             struct canditer *restrict lci,
     179             :             BATiter *restrict r1i, BATiter *restrict r2i, QryCtx *qry_ctx)
     180             : {
     181       16161 :         BUN lo;
     182       16161 :         oid *restrict bt;
     183       16161 :         oid r1seq, r1end;
     184       16161 :         oid r2seq, r2end;
     185       16161 :         const oid *restrict r1t = NULL;
     186       16161 :         const oid *restrict r2t = NULL;
     187       16161 :         struct canditer r1ci = {0}, r2ci = {0}; /* zeroed; the loops below test .s to see whether each one is in use */
     188             : 
     189       16161 :         if ((!lci || (lci->tpe == cand_dense && BATtdensebi(li))) && r1i->type && !BATtdensebi(r1i) && !r2i && li->nonil) { /* single materialized right input, nil-free left: reuse the plain copy loop */
     190        7648 :                 if (sizeof(oid) == sizeof(lng)) /* choose the copy loop whose element size equals that of oid */
     191        7648 :                         return project1_lng(bn, li, r1i, qry_ctx);
     192             :                 else
     193             :                         return project1_int(bn, li, r1i, qry_ctx);
     194             :         }
     195        8513 :         MT_thread_setalgorithm(__func__);
     196        8525 :         if (complex_cand(r1i->b))
     197          28 :                 canditer_init(&r1ci, NULL, r1i->b);
     198        8497 :         else if (!BATtdensebi(r1i))
     199           1 :                 r1t = (const oid *) r1i->base;
     200        8525 :         r1seq = r1i->b->hseqbase;
     201        8525 :         r1end = r1seq + r1i->count;
     202        8525 :         if (r2i) {
     203           0 :                 if (complex_cand(r2i->b))
     204           0 :                         canditer_init(&r2ci, NULL, r2i->b);
     205           0 :                 else if (!BATtdensebi(r2i))
     206           0 :                         r2t = (const oid *) r2i->base;
     207           0 :                 r2seq = r2i->b->hseqbase;
     208           0 :                 r2end = r2seq + r2i->count;
     209             :         } else {
     210             :                 r2seq = r2end = r1end; /* no r2: empty range directly after r1, so every valid o is below r1end */
     211             :         }
     212        8525 :         bt = (oid *) Tloc(bn, 0);
     213        8525 :         if (lci) { /* left OIDs come from the candidate iterator */
     214          13 :                 TIMEOUT_LOOP_IDX(lo, lci->ncand, qry_ctx) {
     215           4 :                         oid o = canditer_next(lci);
     216           4 :                         if (o < r1seq || o >= r2end) {
     217           0 :                                 goto nomatch;
     218             :                         }
     219           4 :                         if (o < r1end) {
     220           4 :                                 if (r1ci.s)
     221           0 :                                         bt[lo] = canditer_idx(&r1ci, o - r1seq);
     222           4 :                                 else if (r1t)
     223           1 :                                         bt[lo] = r1t[o - r1seq];
     224             :                                 else
     225           3 :                                         bt[lo] = o - r1seq + r1i->tseq;
     226             :                         } else {
     227           0 :                                 if (r2ci.s)
     228           0 :                                         bt[lo] = canditer_idx(&r2ci, o - r2seq);
     229           0 :                                 else if (r2t)
     230           0 :                                         bt[lo] = r2t[o - r2seq];
     231             :                                 else
     232           0 :                                         bt[lo] = o - r2seq + r2i->tseq;
     233             :                         }
     234             :                 }
     235        8519 :         } else if (BATtdensebi(li)) { /* left OIDs are the dense sequence starting at li->tseq */
     236           0 :                 TIMEOUT_LOOP_IDX(lo, li->count, qry_ctx) {
     237           0 :                         oid o = li->tseq + lo;
     238           0 :                         if (o < r1seq || o >= r2end) {
     239           0 :                                 goto nomatch;
     240             :                         }
     241           0 :                         if (o < r1end) {
     242           0 :                                 if (r1ci.s)
     243           0 :                                         bt[lo] = canditer_idx(&r1ci, o - r1seq);
     244           0 :                                 else if (r1t)
     245           0 :                                         bt[lo] = r1t[o - r1seq];
     246             :                                 else
     247           0 :                                         bt[lo] = o - r1seq + r1i->tseq;
     248             :                         } else {
     249           0 :                                 if (r2ci.s)
     250           0 :                                         bt[lo] = canditer_idx(&r2ci, o - r2seq);
     251           0 :                                 else if (r2t)
     252           0 :                                         bt[lo] = r2t[o - r2seq];
     253             :                                 else
     254           0 :                                         bt[lo] = o - r2seq + r2i->tseq;
     255             :                         }
     256             :                 }
     257             :         } else { /* left OIDs are stored as an array; this is the only branch that tests for nil */
     258        8519 :                 const oid *ot = (const oid *) li->base;
     259   198181253 :                 TIMEOUT_LOOP_IDX(lo, li->count, qry_ctx) {
     260   198148973 :                         oid o = ot[lo];
     261   198148973 :                         if (is_oid_nil(o)) {
     262           0 :                                 bt[lo] = oid_nil;
     263           0 :                                 bn->tnonil = false;
     264           0 :                                 bn->tnil = true;
     265   198148973 :                         } else if (o < r1seq || o >= r2end) {
     266           0 :                                 goto nomatch;
     267   198148973 :                         } else if (o < r1end) {
     268   198148973 :                                 if (r1ci.s)
     269        7749 :                                         bt[lo] = canditer_idx(&r1ci, o - r1seq);
     270   198141224 :                                 else if (r1t)
     271           0 :                                         bt[lo] = r1t[o - r1seq];
     272             :                                 else
     273   198141224 :                                         bt[lo] = o - r1seq + r1i->tseq;
     274             :                         } else {
     275           0 :                                 if (r2ci.s)
     276           0 :                                         bt[lo] = canditer_idx(&r2ci, o - r2seq);
     277           0 :                                 else if (r2t)
     278           0 :                                         bt[lo] = r2t[o - r2seq];
     279             :                                 else
     280           0 :                                         bt[lo] = o - r2seq + r2i->tseq;
     281             :                         }
     282             :                 }
     283             :         }
     284        8541 :         TIMEOUT_CHECK(qry_ctx, TIMEOUT_HANDLER(GDK_FAIL, qry_ctx));
     285        8529 :         BATsetcount(bn, lo);
     286        8529 :         return GDK_SUCCEED;
     287           0 :   nomatch: /* shared error exit for an OID outside [r1seq, r2end) */
     288           0 :         GDKerror("does not match always\n");
     289           0 :         return GDK_FAIL;
     290             : }
     291             : /*
                     :  * project_any: type-generic projection loop.
                     :  *
                     :  *  bn       result BAT; values are inserted with tfastins_nocheck()
                     :  *  li       left input (OIDs)
                     :  *  ci       optional candidate iterator; when non-NULL the OIDs come
                     :  *           from canditer_next(ci) instead of li
                     :  *  r1i      first right input
                     :  *  r2i      optional second right input (may be NULL)
                     :  *  qry_ctx  query context handed to the TIMEOUT_* macros
                     :  *
                     :  * For every OID o from the left side (ci when given, else the dense
                     :  * sequence li->tseq + i, else the oid array at li->base) a value
                     :  * pointer is fetched with BUNtail() from r1 when o is below r1end and
                     :  * from r2 otherwise, and inserted at position i of bn.  Only the
                     :  * oid-array branch tests for nil OIDs; for those the nil value of
                     :  * r1i's type (ATOMnilptr) is inserted and bn->tnil is set.
                     :  *
                     :  * The range test is against [r1seq, r2end), which relies on r2
                     :  * starting where r1 ends; without r2i the r2 range is empty.  An OID
                     :  * outside the range reports "does not match always" and returns
                     :  * GDK_FAIL.  A failing tfastins_nocheck() also returns GDK_FAIL.
                     :  *
                     :  * On success the count of bn is set to the number of values inserted,
                     :  * bn's heap is marked dirty, and GDK_SUCCEED is returned.
                     :  * TIMEOUT_CHECK presumably returns GDK_FAIL through TIMEOUT_HANDLER
                     :  * when the query timed out.
                     :  */
     292             : static gdk_return
     293        1461 : project_any(BAT *restrict bn, BATiter *restrict li,
     294             :             struct canditer *restrict ci,
     295             :             BATiter *restrict r1i, BATiter *restrict r2i, QryCtx *qry_ctx)
     296             : {
     297        1461 :         BUN lo;
     298        1461 :         const void *nil = ATOMnilptr(r1i->type); /* value inserted for nil OIDs */
     299        1461 :         const void *v;
     300        1461 :         oid r1seq, r1end;
     301        1461 :         oid r2seq, r2end;
     302             : 
     303        1461 :         MT_thread_setalgorithm(__func__);
     304        1463 :         r1seq = r1i->b->hseqbase;
     305        1463 :         r1end = r1seq + r1i->count;
     306        1463 :         if (r2i) {
     307           0 :                 r2seq = r2i->b->hseqbase;
     308           0 :                 r2end = r2seq + r2i->count;
     309             :         } else {
     310             :                 r2seq = r2end = r1end; /* no r2: empty range directly after r1, so every valid o is below r1end */
     311             :         }
     312        1463 :         if (ci) { /* left OIDs come from the candidate iterator */
     313           6 :                 TIMEOUT_LOOP_IDX(lo, ci->ncand, qry_ctx) {
     314           0 :                         oid o = canditer_next(ci);
     315           0 :                         if (o < r1seq || o >= r2end) {
     316           0 :                                 GDKerror("does not match always\n");
     317           0 :                                 return GDK_FAIL;
     318             :                         }
     319           0 :                         if (o < r1end)
     320           0 :                                 v = BUNtail(*r1i, o - r1seq);
     321             :                         else
     322           0 :                                 v = BUNtail(*r2i, o - r2seq);
     323           0 :                         if (tfastins_nocheck(bn, lo, v) != GDK_SUCCEED) {
     324             :                                 return GDK_FAIL;
     325             :                         }
     326             :                 }
     327        1457 :         } else if (BATtdensebi(li)) { /* left OIDs are the dense sequence starting at li->tseq */
     328           0 :                 TIMEOUT_LOOP_IDX(lo, li->count, qry_ctx) {
     329           0 :                         oid o = li->tseq + lo;
     330           0 :                         if (o < r1seq || o >= r2end) {
     331           0 :                                 GDKerror("does not match always\n");
     332           0 :                                 return GDK_FAIL;
     333             :                         }
     334           0 :                         if (o < r1end)
     335           0 :                                 v = BUNtail(*r1i, o - r1seq);
     336             :                         else
     337           0 :                                 v = BUNtail(*r2i, o - r2seq);
     338           0 :                         if (tfastins_nocheck(bn, lo, v) != GDK_SUCCEED) {
     339             :                                 return GDK_FAIL;
     340             :                         }
     341             :                 }
     342             :         } else { /* left OIDs are stored as an array; this is the only branch that tests for nil */
     343        1457 :                 const oid *restrict ot = (const oid *) li->base;
     344             : 
     345      195762 :                 TIMEOUT_LOOP_IDX(lo, li->count, qry_ctx) {
     346      192839 :                         oid o = ot[lo];
     347      192839 :                         if (is_oid_nil(o)) {
     348           0 :                                 v = nil;
     349           0 :                                 bn->tnil = true;
     350      192839 :                         } else if (o < r1seq || o >= r2end) {
     351           0 :                                 GDKerror("does not match always\n");
     352           0 :                                 return GDK_FAIL;
     353      192839 :                         } else if (o < r1end) {
     354      192839 :                                 v = BUNtail(*r1i, o - r1seq);
     355             :                         } else {
     356           0 :                                 v = BUNtail(*r2i, o - r2seq);
     357             :                         }
     358      193080 :                         if (tfastins_nocheck(bn, lo, v) != GDK_SUCCEED) {
     359             :                                 return GDK_FAIL;
     360             :                         }
     361             :                 }
     362             :         }
     363        1477 :         TIMEOUT_CHECK(qry_ctx, TIMEOUT_HANDLER(GDK_FAIL, qry_ctx));
     364        1471 :         BATsetcount(bn, lo);
     365        1471 :         bn->theap->dirty = true;
     366        1471 :         return GDK_SUCCEED;
     367             : }
     368             : 
     369             : static BAT *
     370           0 : project_str(BATiter *restrict li, struct canditer *restrict ci, int tpe,
     371             :             BATiter *restrict r1i, BATiter *restrict r2i,
     372             :             QryCtx *qry_ctx, lng t0)
     373             : {
     374           0 :         BAT *bn;
     375           0 :         BUN lo;
     376           0 :         oid r1seq, r1end;
     377           0 :         oid r2seq, r2end;
     378           0 :         BUN h1off;
     379           0 :         BUN off;
     380           0 :         oid seq;
     381           0 :         var_t v;
     382           0 :         BATiter *ri;
     383             : 
     384           0 :         if ((bn = COLnew(li->b->hseqbase, tpe, ci ? ci->ncand : li->count,
     385             :                          TRANSIENT)) == NULL)
     386             :                 return NULL;
     387             : 
     388           0 :         v = (var_t) r1i->vhfree;
     389           0 :         if (r1i->vh == r2i->vh) {
     390           0 :                 h1off = 0;
     391           0 :                 assert(bn->tvheap->parentid == bn->batCacheid);
     392           0 :                 HEAPdecref(bn->tvheap, true);
     393           0 :                 HEAPincref(r1i->vh);
     394           0 :                 bn->tvheap = r1i->vh;
     395           0 :                 assert(bn->tvheap->parentid != bn->batCacheid);
     396           0 :                 BBPretain(bn->tvheap->parentid);
     397             :         } else {
     398           0 :                 v = (v + GDK_VARALIGN - 1) & ~(GDK_VARALIGN - 1);
     399           0 :                 h1off = (BUN) v;
     400           0 :                 v += ((var_t) r2i->vhfree + GDK_VARALIGN - 1) & ~(GDK_VARALIGN - 1);
     401           0 :                 if (HEAPextend(bn->tvheap, v, false) != GDK_SUCCEED) {
     402           0 :                         BBPreclaim(bn);
     403           0 :                         return NULL;
     404             :                 }
     405           0 :                 memcpy(bn->tvheap->base, r1i->vh->base, r1i->vhfree);
     406             : #ifndef NDEBUG
     407           0 :                 if (h1off > r1i->vhfree)
     408           0 :                         memset(bn->tvheap->base + r1i->vhfree, 0, h1off - r1i->vhfree);
     409             : #endif
     410           0 :                 memcpy(bn->tvheap->base + h1off, r2i->vh->base, r2i->vhfree);
     411           0 :                 bn->tvheap->free = h1off + r2i->vhfree;
     412           0 :                 bn->tvheap->dirty = true;
     413             :         }
     414             : 
     415           0 :         if (v >= ((var_t) 1 << (8 << bn->tshift)) &&
     416           0 :             GDKupgradevarheap(bn, v, false, 0) != GDK_SUCCEED) {
     417           0 :                 BBPreclaim(bn);
     418           0 :                 return NULL;
     419             :         }
     420             : 
     421           0 :         r1seq = r1i->b->hseqbase;
     422           0 :         r1end = r1seq + r1i->count;
     423           0 :         r2seq = r2i->b->hseqbase;
     424           0 :         r2end = r2seq + r2i->count;
     425           0 :         if (ci) {
     426           0 :                 TIMEOUT_LOOP_IDX(lo, ci->ncand, qry_ctx) {
     427           0 :                         oid o = canditer_next(ci);
     428           0 :                         if (o < r1seq || o >= r2end) {
     429           0 :                                 GDKerror("does not match always\n");
     430           0 :                                 BBPreclaim(bn);
     431           0 :                                 return NULL;
     432             :                         }
     433           0 :                         if (o < r1end) {
     434             :                                 ri = r1i;
     435             :                                 off = 0;
     436             :                                 seq = r1seq;
     437             :                         } else {
     438           0 :                                 ri = r2i;
     439           0 :                                 off = h1off;
     440           0 :                                 seq = r2seq;
     441             :                         }
     442           0 :                         switch (ri->width) {
     443           0 :                         case 1:
     444           0 :                                 v = (var_t) ((uint8_t *) ri->base)[o - seq] + GDK_VAROFFSET;
     445           0 :                                 break;
     446           0 :                         case 2:
     447           0 :                                 v = (var_t) ((uint16_t *) ri->base)[o - seq] + GDK_VAROFFSET;
     448           0 :                                 break;
     449           0 :                         case 4:
     450           0 :                                 v = (var_t) ((uint32_t *) ri->base)[o - seq];
     451           0 :                                 break;
     452           0 :                         case 8:
     453           0 :                                 v = (var_t) ((uint64_t *) ri->base)[o - seq];
     454           0 :                                 break;
     455             :                         }
     456           0 :                         v += off;
     457           0 :                         switch (bn->twidth) {
     458           0 :                         case 1:
     459           0 :                                 ((uint8_t *) bn->theap->base)[lo] = (uint8_t) (v - GDK_VAROFFSET);
     460           0 :                                 break;
     461           0 :                         case 2:
     462           0 :                                 ((uint16_t *) bn->theap->base)[lo] = (uint16_t) (v - GDK_VAROFFSET);
     463           0 :                                 break;
     464           0 :                         case 4:
     465           0 :                                 ((uint32_t *) bn->theap->base)[lo] = (uint32_t) v;
     466           0 :                                 break;
     467           0 :                         case 8:
     468           0 :                                 ((uint64_t *) bn->theap->base)[lo] = (uint64_t) v;
     469           0 :                                 break;
     470             :                         }
     471             :                 }
     472           0 :         } else if (BATtdensebi(li)) {
     473           0 :                 TIMEOUT_LOOP_IDX(lo, li->count, qry_ctx) {
     474           0 :                         oid o = li->tseq + lo;
     475           0 :                         if (o < r1seq || o >= r2end) {
     476           0 :                                 GDKerror("does not match always\n");
     477           0 :                                 BBPreclaim(bn);
     478           0 :                                 return NULL;
     479             :                         }
     480           0 :                         if (o < r1end) {
     481             :                                 ri = r1i;
     482             :                                 off = 0;
     483             :                                 seq = r1seq;
     484             :                         } else {
     485           0 :                                 ri = r2i;
     486           0 :                                 off = h1off;
     487           0 :                                 seq = r2seq;
     488             :                         }
     489           0 :                         switch (ri->width) {
     490           0 :                         case 1:
     491           0 :                                 v = (var_t) ((uint8_t *) ri->base)[o - seq] + GDK_VAROFFSET;
     492           0 :                                 break;
     493           0 :                         case 2:
     494           0 :                                 v = (var_t) ((uint16_t *) ri->base)[o - seq] + GDK_VAROFFSET;
     495           0 :                                 break;
     496           0 :                         case 4:
     497           0 :                                 v = (var_t) ((uint32_t *) ri->base)[o - seq];
     498           0 :                                 break;
     499           0 :                         case 8:
     500           0 :                                 v = (var_t) ((uint64_t *) ri->base)[o - seq];
     501           0 :                                 break;
     502             :                         }
     503           0 :                         v += off;
     504           0 :                         switch (bn->twidth) {
     505           0 :                         case 1:
     506           0 :                                 ((uint8_t *) bn->theap->base)[lo] = (uint8_t) (v - GDK_VAROFFSET);
     507           0 :                                 break;
     508           0 :                         case 2:
     509           0 :                                 ((uint16_t *) bn->theap->base)[lo] = (uint16_t) (v - GDK_VAROFFSET);
     510           0 :                                 break;
     511           0 :                         case 4:
     512           0 :                                 ((uint32_t *) bn->theap->base)[lo] = (uint32_t) v;
     513           0 :                                 break;
     514           0 :                         case 8:
     515           0 :                                 ((uint64_t *) bn->theap->base)[lo] = (uint64_t) v;
     516           0 :                                 break;
     517             :                         }
     518             :                 }
     519             :         } else {
     520           0 :                 const oid *restrict ot = (const oid *) li->base;
     521           0 :                 TIMEOUT_LOOP_IDX(lo, li->count, qry_ctx) {
     522           0 :                         oid o = ot[lo];
     523           0 :                         if (o < r1seq || o >= r2end) {
     524           0 :                                 GDKerror("does not match always\n");
     525           0 :                                 BBPreclaim(bn);
     526           0 :                                 return NULL;
     527             :                         }
     528           0 :                         if (o < r1end) {
     529             :                                 ri = r1i;
     530             :                                 off = 0;
     531             :                                 seq = r1seq;
     532             :                         } else {
     533           0 :                                 ri = r2i;
     534           0 :                                 off = h1off;
     535           0 :                                 seq = r2seq;
     536             :                         }
     537           0 :                         switch (ri->width) {
     538           0 :                         case 1:
     539           0 :                                 v = (var_t) ((uint8_t *) ri->base)[o - seq] + GDK_VAROFFSET;
     540           0 :                                 break;
     541           0 :                         case 2:
     542           0 :                                 v = (var_t) ((uint16_t *) ri->base)[o - seq] + GDK_VAROFFSET;
     543           0 :                                 break;
     544           0 :                         case 4:
     545           0 :                                 v = (var_t) ((uint32_t *) ri->base)[o - seq];
     546           0 :                                 break;
     547           0 :                         case 8:
     548           0 :                                 v = (var_t) ((uint64_t *) ri->base)[o - seq];
     549           0 :                                 break;
     550             :                         }
     551           0 :                         v += off;
     552           0 :                         switch (bn->twidth) {
     553           0 :                         case 1:
     554           0 :                                 ((uint8_t *) bn->theap->base)[lo] = (uint8_t) (v - GDK_VAROFFSET);
     555           0 :                                 break;
     556           0 :                         case 2:
     557           0 :                                 ((uint16_t *) bn->theap->base)[lo] = (uint16_t) (v - GDK_VAROFFSET);
     558           0 :                                 break;
     559           0 :                         case 4:
     560           0 :                                 ((uint32_t *) bn->theap->base)[lo] = (uint32_t) v;
     561           0 :                                 break;
     562           0 :                         case 8:
     563           0 :                                 ((uint64_t *) bn->theap->base)[lo] = (uint64_t) v;
     564           0 :                                 break;
     565             :                         }
     566             :                 }
     567             :         }
     568           0 :         TIMEOUT_CHECK(qry_ctx, GOTO_LABEL_TIMEOUT_HANDLER(bailout, qry_ctx));
     569           0 :         BATsetcount(bn, lo);
     570           0 :         bn->tsorted = bn->trevsorted = false;
     571           0 :         bn->tnil = false;
     572           0 :         bn->tnonil = r1i->nonil & r2i->nonil;
     573           0 :         bn->tkey = false;
     574           0 :         TRC_DEBUG(ALGO, "l=" ALGOBATFMT " r1=" ALGOBATFMT " r2=" ALGOBATFMT
     575             :                   " -> " ALGOBATFMT "%s " LLFMT "us\n",
     576             :                   ALGOBATPAR(li->b), ALGOBATPAR(r1i->b), ALGOBATPAR(r2i->b),
     577             :                   ALGOBATPAR(bn),
     578             :                   bn && bn->ttype == TYPE_str && bn->tvheap == r1i->vh ? " sharing string heap" : "",
     579             :                   GDKusec() - t0);
     580             :         return bn;
     581           0 :   bailout:
     582           0 :         BBPreclaim(bn);
     583           0 :         return NULL;
     584             : }
     585             : 
     586             : BAT *
     587     2198889 : BATproject2(BAT *restrict l, BAT *restrict r1, BAT *restrict r2)
     588             : {
     589     2198889 :         BAT *bn = NULL;
     590     2198889 :         BAT *or1 = r1, *or2 = r2, *ol = l;
     591     2198889 :         oid lo, hi;
     592     2198889 :         gdk_return res;
     593     2198889 :         int tpe = ATOMtype(r1->ttype), otpe = tpe;
     594     2198889 :         bool stringtrick = false;
     595     2198889 :         struct canditer ci, *lci = NULL;
     596     2198889 :         const char *msg = "";
     597     2198889 :         lng t0 = 0;
     598     2198889 :         BATiter li = bat_iterator(l);
     599     2208789 :         BATiter r1i = bat_iterator(r1);
     600     2210035 :         BATiter r2i = bat_iterator(r2);
     601     2206429 :         BUN lcount = li.count;
     602             : 
     603     2206429 :         TRC_DEBUG_IF(ALGO) t0 = GDKusec();
     604             : 
     605     2206429 :         assert(ATOMtype(li.type) == TYPE_oid || li.type == TYPE_msk);
     606     2206429 :         assert(r2 == NULL || tpe == ATOMtype(r2i.type));
     607           0 :         assert(r2 == NULL || r1->hseqbase + r1i.count == r2->hseqbase);
     608             : 
     609     2206429 :         QryCtx *qry_ctx = MT_thread_get_qry_ctx();
     610             : 
     611     2204336 :         if (r2 && r1i.count == 0) {
     612             :                 /* unlikely special case: r1 is empty, so we just have r2 */
     613           0 :                 r1 = r2;
     614           0 :                 r2 = NULL;
     615           0 :                 bat_iterator_end(&r1i);
     616           0 :                 r1i = r2i;
     617           0 :                 r2i = bat_iterator(NULL);
     618             :         }
     619             : 
     620     2204336 :         if (BATtdensebi(&li) && lcount > 0) {
     621      758364 :                 lo = l->tseqbase;
     622      758364 :                 hi = l->tseqbase + lcount;
     623      758364 :                 if (lo >= r1->hseqbase && hi <= r1->hseqbase + r1i.count) {
     624      758364 :                         bn = BATslice(r1, lo - r1->hseqbase, hi - r1->hseqbase);
     625      753356 :                         BAThseqbase(bn, l->hseqbase);
     626      751329 :                         msg = " (slice)";
     627      751329 :                         goto doreturn;
     628             :                 }
     629           0 :                 if (lo < r1->hseqbase || r2 == NULL || hi > r2->hseqbase + r2i.count) {
     630           0 :                         GDKerror("does not match always\n");
     631           0 :                         bat_iterator_end(&li);
     632           0 :                         bat_iterator_end(&r1i);
     633           0 :                         bat_iterator_end(&r2i);
     634           0 :                         return NULL;
     635             :                 }
     636           0 :                 if (lo >= r2->hseqbase) {
     637           0 :                         bn = BATslice(r2, lo - r2->hseqbase, hi - r2->hseqbase);
     638           0 :                         BAThseqbase(bn, l->hseqbase);
     639           0 :                         msg = " (slice2)";
     640           0 :                         goto doreturn;
     641             :                 }
     642             :         }
     643     1445972 :         if (complex_cand(l)) {
     644             :                 /* l is candidate list with exceptions or is a bitmask */
     645       14315 :                 assert(li.type == TYPE_msk || !is_oid_nil(l->tseqbase));
     646       14315 :                 canditer_init(&ci, NULL, l);
     647       14320 :                 lcount = ci.ncand;
     648       14320 :                 lci = &ci;
     649     1431657 :         } else if (li.type == TYPE_msk) {
     650           0 :                 l = BATunmask(l);
     651           0 :                 if (l == NULL)
     652           0 :                         goto doreturn;
     653           0 :                 if (complex_cand(l)) {
     654           0 :                         canditer_init(&ci, NULL, l);
     655           0 :                         lcount = ci.ncand;
     656           0 :                         lci = &ci;
     657             :                 }
     658             :         }
     659     1445977 :         if (lcount == 0 ||
     660       14315 :             (li.type == TYPE_void && is_oid_nil(l->tseqbase)) ||
     661      193063 :             (r1i.type == TYPE_void && is_oid_nil(r1->tseqbase) &&
     662           0 :              (r2 == NULL ||
     663           0 :               (r2i.type == TYPE_void && is_oid_nil(r2->tseqbase))))) {
     664             :                 /* trivial: all values are nil (includes no entries at all) */
     665     1252914 :                 const void *nil = r1i.type == TYPE_msk ? &oid_nil : ATOMnilptr(r1i.type);
     666             : 
     667     2496731 :                 bn = BATconstant(l->hseqbase, r1i.type == TYPE_oid || r1i.type == TYPE_msk ? TYPE_void : r1i.type,
     668             :                                  nil, lcount, TRANSIENT);
     669     1246540 :                 if (bn != NULL &&
     670     1246540 :                     ATOMtype(bn->ttype) == TYPE_oid &&
     671      120096 :                     BATcount(bn) == 0) {
     672      120341 :                         BATtseqbase(bn, 0);
     673             :                 }
     674     1246459 :                 msg = " (constant)";
     675     1246459 :                 goto doreturn;
     676             :         }
     677             : 
     678      193063 :         if (ATOMstorage(tpe) == TYPE_str) {
     679       23816 :                 if (li.nonil &&
     680       23815 :                     r2 == NULL &&
     681       23815 :                     (r1i.count == 0 ||
     682       23816 :                      lcount > (r1i.count >> 3) ||
     683        5594 :                      r1i.restricted == BAT_READ)) {
     684             :                         /* insert strings as ints, we need to copy the
     685             :                          * string heap whole sale; we can't do this if
     686             :                          * there are nils in the left column, and we
     687             :                          * won't do it if the left is much smaller than
     688             :                          * the right and the right is writable (meaning
     689             :                          * we have to actually copy the right string
     690             :                          * heap) */
     691       22360 :                         tpe = r1i.width == 1 ? TYPE_bte : (r1i.width == 2 ? TYPE_sht : (r1i.width == 4 ? TYPE_int : TYPE_lng));
     692             :                         stringtrick = true;
     693        1456 :                 } else if (li.nonil &&
     694           0 :                            r2 != NULL &&
     695           0 :                            (r1i.vh == r2i.vh ||
     696           0 :                             (!GDK_ELIMDOUBLES(r1i.vh) /* && size tests */))) {
     697             :                         /* r1 and r2 may explicitly share their vheap,
     698             :                          * if they do, the result will also share the
     699             :                          * vheap; this also means that for this case we
     700             :                          * don't care about duplicate elimination: it
     701             :                          * will remain the same */
     702           0 :                         bn = project_str(&li, lci, tpe, &r1i, &r2i, qry_ctx, t0);
     703           0 :                         bat_iterator_end(&li);
     704           0 :                         bat_iterator_end(&r1i);
     705           0 :                         bat_iterator_end(&r2i);
     706           0 :                         return bn;
     707             :                 }
     708      169247 :         } else if (ATOMvarsized(tpe) &&
     709         154 :                    li.nonil &&
     710         154 :                    r2 == NULL &&
     711         154 :                    (r1i.count == 0 ||
     712         154 :                     lcount > (r1i.count >> 3) ||
     713           0 :                     r1i.restricted == BAT_READ)) {
     714         154 :                 tpe = r1i.width == 4 ? TYPE_int : TYPE_lng;
     715             :                 stringtrick = true;
     716      169093 :         } else if (tpe == TYPE_msk || mask_cand(r1)) {
     717          10 :                 r1 = BATunmask(r1);
     718          10 :                 if (r1 == NULL)
     719           0 :                         goto doreturn;
     720          10 :                 if (r2) {
     721           0 :                         r2 = BATunmask(r2);
     722           0 :                         if (r2 == NULL)
     723           0 :                                 goto doreturn;
     724             :                 }
     725          10 :                 tpe = TYPE_oid;
     726          10 :                 bat_iterator_end(&r1i);
     727          10 :                 bat_iterator_end(&r2i);
     728          10 :                 r1i = bat_iterator(r1);
     729          10 :                 r2i = bat_iterator(r2);
     730             :         }
     731      377955 :         bn = COLnew2(l->hseqbase, ATOMtype(r1i.type), lcount, TRANSIENT, stringtrick ? r1i.width : 0);
     732      190922 :         if (bn == NULL) {
     733           0 :                 goto doreturn;
     734             :         }
     735      190922 :         bn->tnil = false;
     736      190922 :         if (r2) {
     737           0 :                 bn->tnonil = li.nonil & r1i.nonil & r2i.nonil;
     738           0 :                 bn->tsorted = li.count <= 1;
     739           0 :                 bn->trevsorted = li.count <= 1;
     740           0 :                 bn->tkey = li.count <= 1;
     741             :         } else {
     742      192656 :                 bn->tnonil = li.nonil & r1i.nonil;
     743      385312 :                 bn->tsorted = li.count <= 1
     744      191423 :                         || (li.sorted & r1i.sorted)
     745      133643 :                         || (li.revsorted & r1i.revsorted)
     746      324950 :                         || r1i.count <= 1;
     747      385312 :                 bn->trevsorted = li.count <= 1
     748      191744 :                         || (li.sorted & r1i.revsorted)
     749      173641 :                         || (li.revsorted & r1i.sorted)
     750      364710 :                         || r1i.count <= 1;
     751      218771 :                 bn->tkey = li.count <= 1 || (li.key & r1i.key);
     752             :         }
     753             : 
     754      190922 :         if (!stringtrick && tpe != TYPE_oid)
     755      153642 :                 tpe = ATOMbasetype(tpe);
     756      190922 :         switch (tpe) {
     757       13967 :         case TYPE_bte:
     758       13967 :                 res = project_bte(bn, &li, lci, &r1i, r2 ? &r2i : NULL, qry_ctx);
     759       13967 :                 break;
     760       17789 :         case TYPE_sht:
     761       17789 :                 res = project_sht(bn, &li, lci, &r1i, r2 ? &r2i : NULL, qry_ctx);
     762       17789 :                 break;
     763      127233 :         case TYPE_int:
     764      127233 :                 res = project_int(bn, &li, lci, &r1i, r2 ? &r2i : NULL, qry_ctx);
     765      127233 :                 break;
     766          89 :         case TYPE_flt:
     767          89 :                 res = project_flt(bn, &li, lci, &r1i, r2 ? &r2i : NULL, qry_ctx);
     768          89 :                 break;
     769        5224 :         case TYPE_dbl:
     770        5224 :                 res = project_dbl(bn, &li, lci, &r1i, r2 ? &r2i : NULL, qry_ctx);
     771        5224 :                 break;
     772        8446 :         case TYPE_lng:
     773        8446 :                 res = project_lng(bn, &li, lci, &r1i, r2 ? &r2i : NULL, qry_ctx);
     774        8446 :                 break;
     775             : #ifdef HAVE_HGE
     776         507 :         case TYPE_hge:
     777         507 :                 res = project_hge(bn, &li, lci, &r1i, r2 ? &r2i : NULL, qry_ctx);
     778         507 :                 break;
     779             : #endif
     780       16177 :         case TYPE_oid:
     781       16177 :                 res = project_oid(bn, &li, lci, &r1i, r2 ? &r2i : NULL, qry_ctx);
     782       16177 :                 break;
     783          25 :         case TYPE_uuid:
     784          25 :                 res = project_uuid(bn, &li, lci, &r1i, r2 ? &r2i : NULL, qry_ctx);
     785          25 :                 break;
     786        1465 :         default:
     787        1465 :                 res = project_any(bn, &li, lci, &r1i, r2 ? &r2i : NULL, qry_ctx);
     788        1465 :                 break;
     789             :         }
     790             : 
     791      192469 :         if (res != GDK_SUCCEED)
     792        1728 :                 goto bailout;
     793             : 
     794             :         /* handle string trick */
     795      190741 :         if (stringtrick) {
     796       22394 :                 assert(r1i.vh);
     797       22394 :                 if (r1i.restricted == BAT_READ || VIEWvtparent(r1)) {
     798             :                         /* really share string heap */
     799       19805 :                         assert(r1i.vh->parentid > 0);
     800             :                         /* there is no file, so we don't need to remove it */
     801       19805 :                         HEAPdecref(bn->tvheap, false);
     802       19912 :                         bn->tvheap = r1i.vh;
     803       19912 :                         HEAPincref(r1i.vh);
     804       19922 :                         assert(bn->tvheap->parentid != bn->batCacheid);
     805       19922 :                         BBPretain(bn->tvheap->parentid);
     806             :                 } else {
     807             :                         /* make copy of string heap */
     808        2589 :                         bn->tvheap->parentid = bn->batCacheid;
     809        2589 :                         bn->tvheap->farmid = BBPselectfarm(bn->batRole, otpe, varheap);
     810        2589 :                         strconcat_len(bn->tvheap->filename,
     811             :                                       sizeof(bn->tvheap->filename),
     812        2589 :                                       BBP_physical(bn->batCacheid), ".theap",
     813             :                                       NULL);
     814        2605 :                         if (HEAPcopy(bn->tvheap, r1i.vh, 0) != GDK_SUCCEED)
     815           0 :                                 goto bailout;
     816             :                 }
     817       22521 :                 bn->ttype = r1i.type;
     818       22521 :                 bn->twidth = r1i.width;
     819       22521 :                 bn->tshift = r1i.shift;
     820             :         }
     821             : 
     822      190868 :         if (!BATtdensebi(&r1i) || (r2 && !BATtdensebi(&r2i)))
     823      182372 :                 BATtseqbase(bn, oid_nil);
     824             : 
     825        8496 :   doreturn:
     826     2188018 :         TRC_DEBUG(ALGO, "l=" ALGOBATFMT " r1=" ALGOBATFMT " r2=" ALGOOPTBATFMT
     827             :                   " -> " ALGOOPTBATFMT "%s%s " LLFMT "us\n",
     828             :                   ALGOBATPAR(l), ALGOBATPAR(or1), ALGOOPTBATPAR(or2),
     829             :                   ALGOOPTBATPAR(bn),
     830             :                   bn && bn->ttype == TYPE_str && bn->tvheap == r1i.vh ? " sharing string heap" : "",
     831             :                   msg, GDKusec() - t0);
     832     2188018 :         bat_iterator_end(&li);
     833     2198819 :         bat_iterator_end(&r1i);
     834     2207749 :         bat_iterator_end(&r2i);
     835     2202320 :         if (l != ol)
     836           0 :                 BBPreclaim(l);
     837     2172328 :         if (r1 != or1)
     838          10 :                 BBPreclaim(r1);
     839     2179091 :         if (r2 != or2)
     840           0 :                 BBPreclaim(r2);
     841             :         return bn;
     842             : 
     843        1728 :   bailout:
     844        1728 :         BBPreclaim(bn);
     845           0 :         bn = NULL;
     846           0 :         goto doreturn;
     847             : }
     848             : 
     849             : BAT *
     850      616994 : BATproject(BAT *restrict l, BAT *restrict r)
     851             : {
     852      616994 :         return BATproject2(l, r, NULL);
     853             : }
     854             : 
     855             : /* Calculate a chain of BATproject calls.
     856             :  * The argument is a NULL-terminated array of BAT pointers.
     857             :  * This function is equivalent (apart from reference counting) to a
     858             :  * sequence of calls
     859             :  * bn = BATproject(bats[0], bats[1]);
     860             :  * bn = BATproject(bn, bats[2]);
     861             :  * ...
     862             :  * bn = BATproject(bn, bats[n-1]);
     863             :  * return bn;
     864             :  * where none of the intermediates are actually produced (and bats[n]==NULL).
     865             :  * Note that all BATs except the last must have type oid/void or msk.
     866             :  *
     867             :  * We assume that all but the last BAT in the chain is temporary and
     868             :  * therefore there is no chance that another thread will modify it while
     869             :  * we're busy.  This is not necessarily the case for that last BAT, so
     870             :  * it uses a BAT iterator.
     871             :  */
     872             : BAT *
     873      495288 : BATprojectchain(BAT **bats)
     874             : {
     875      495288 :         struct ba {
     876             :                 BAT *b;
     877             :                 oid hlo;
     878             :                 oid hhi;
     879             :                 BUN cnt;
     880             :                 oid *t;
     881             :                 struct canditer ci; /* used if .ci.s != NULL */
     882             :         } *ba;
     883      495288 :         BAT **tobedeleted = NULL;
     884      495288 :         int ndelete = 0;
     885      495288 :         int n, i;
     886      495288 :         BAT *b = NULL, *bn = NULL;
     887      495288 :         BATiter bi;
     888      495288 :         bool allnil = false;
     889      495288 :         bool issorted = true;
     890      495288 :         bool nonil = true;
     891      495288 :         bool stringtrick = false;
     892      495288 :         const void *nil;
     893      495288 :         int tpe;
     894      495288 :         lng t0 = 0;
     895             : 
     896      495288 :         TRC_DEBUG_IF(ALGO) t0 = GDKusec();
     897             : 
     898      495288 :         QryCtx *qry_ctx = MT_thread_get_qry_ctx();
     899             : 
     900             :         /* count number of participating BATs and allocate some
     901             :          * temporary work space */
     902     6527677 :         for (n = 0; bats[n]; n++) {
     903     5538278 :                 b = bats[n];
     904     5538278 :                 ndelete += (b->ttype == TYPE_msk || mask_cand(b));
     905     5538278 :                 TRC_DEBUG(ALGO, "arg %d: " ALGOBATFMT "\n",
     906             :                           n + 1, ALGOBATPAR(b));
     907             :         }
     908      494111 :         if (n == 0) {
     909           0 :                 GDKerror("must have BAT arguments\n");
     910           0 :                 return NULL;
     911             :         }
     912      494111 :         if (n == 1) {
     913           0 :                 bn = COLcopy(b, b->ttype, true, TRANSIENT);
     914           0 :                 TRC_DEBUG(ALGO, "single bat: copy -> " ALGOOPTBATFMT
     915             :                           " " LLFMT " usec\n",
     916             :                           ALGOOPTBATPAR(bn), GDKusec() - t0);
     917           0 :                 return bn;
     918             :         }
     919             : 
     920      494111 :         if (ndelete > 0 &&
     921       12751 :             (tobedeleted = GDKmalloc(sizeof(BAT *) * ndelete)) == NULL)
     922             :                 return NULL;
     923      494112 :         ba = GDKmalloc(sizeof(*ba) * n);
     924      495333 :         if (ba == NULL) {
     925           0 :                 GDKfree(tobedeleted);
     926           0 :                 return NULL;
     927             :         }
     928             : 
     929             :         ndelete = 0;
     930     5946452 :         for (n = 0, i = 0; bats[n]; n++) {
     931     5450490 :                 b = bats[n];
     932     5450490 :                 if (b->ttype == TYPE_msk || mask_cand(b)) {
     933        9153 :                         if ((b = BATunmask(b)) == NULL) {
     934           0 :                                 goto bunins_failed;
     935             :                         }
     936       12717 :                         tobedeleted[ndelete++] = b;
     937             :                 }
     938     5454054 :                 if (bats[n+1] && BATtdense(b) && b->hseqbase == b->tseqbase && b->tseqbase == bats[n+1]->hseqbase && BATcount(b) == BATcount(bats[n+1]))
     939     4481377 :                         continue; /* skip dense bat */
     940      972677 :                 ba[i] = (struct ba) {
     941             :                         .b = b,
     942      972677 :                         .hlo = b->hseqbase,
     943      972677 :                         .hhi = b->hseqbase + b->batCount,
     944             :                         .cnt = b->batCount,
     945      972677 :                         .t = (oid *) Tloc(b, 0),
     946             :                 };
     947      972677 :                 allnil |= b->ttype == TYPE_void && is_oid_nil(b->tseqbase);
     948      972677 :                 issorted &= b->tsorted;
     949      972677 :                 if (bats[n + 1])
     950      476447 :                         nonil &= b->tnonil;
     951      972677 :                 if (b->tnonil && b->tkey && b->tsorted &&
     952      509167 :                     ATOMtype(b->ttype) == TYPE_oid) {
     953      454959 :                         canditer_init(&ba[i].ci, NULL, b);
     954             :                 }
     955      969742 :                 i++;
     956             :         }
     957      495962 :         n = i;
     958      495962 :         if (i<=2) {
     959      445376 :                 if (i == 1) {
     960       61685 :                         bn = ba[0].b;
     961       61685 :                         BBPfix(bn->batCacheid);
     962             :                 } else {
     963      383691 :                         bn = BATproject(ba[0].b, ba[1].b);
     964             :                 }
     965      437785 :                 while (ndelete-- > 0)
     966         146 :                         BBPunfix(tobedeleted[ndelete]->batCacheid);
     967      437639 :                 GDKfree(tobedeleted);
     968      435665 :                 GDKfree(ba);
     969      435665 :                 return bn;
     970             :         }
     971             :         /* b is last BAT in bats array */
     972       50586 :         tpe = ATOMtype(b->ttype);
     973       50586 :         nil = ATOMnilptr(tpe);
     974       50586 :         if (allnil || ba[0].cnt == 0) {
     975       14108 :                 bn = BATconstant(ba[0].hlo, tpe == TYPE_oid ? TYPE_void : tpe,
     976             :                                  nil, ba[0].cnt, TRANSIENT);
     977       14108 :                 while (ndelete-- > 0)
     978       16719 :                         BBPreclaim(tobedeleted[ndelete]);
     979       14141 :                 GDKfree(tobedeleted);
     980       14113 :                 GDKfree(ba);
     981       14205 :                 TRC_DEBUG(ALGO, "with %d bats: nil/empty -> " ALGOOPTBATFMT
     982             :                           " " LLFMT " usec\n",
     983             :                           n, ALGOOPTBATPAR(bn), GDKusec() - t0);
     984       14205 :                 return bn;
     985             :         }
     986             : 
     987       36478 :         bi = bat_iterator(b);
     988       36434 :         if (nonil && ATOMstorage(tpe) == TYPE_str && bi.restricted == BAT_READ) {
     989        6680 :                 stringtrick = true;
     990        6680 :                 bn = COLnew2(ba[0].hlo, tpe, ba[0].cnt, TRANSIENT, bi.width);
     991        6669 :                 if (bn && bn->tvheap) {
     992             :                         /* no need to remove any files since they were
     993             :                          * never created for this bat */
     994        6672 :                         HEAPdecref(bn->tvheap, false);
     995        6684 :                         bn->tvheap = NULL;
     996             :                 }
     997        6681 :                 tpe = bi.width == 1 ? TYPE_bte : (bi.width == 2 ? TYPE_sht : (bi.width == 4 ? TYPE_int : TYPE_lng));
     998             :         } else {
     999       29754 :                 bn = COLnew(ba[0].hlo, tpe, ba[0].cnt, TRANSIENT);
    1000             :         }
    1001       36241 :         if (bn == NULL) {
    1002           0 :                 bat_iterator_end(&bi);
    1003           0 :                 goto bunins_failed;
    1004             :         }
    1005             : 
    1006       36241 :         assert(ba[n - 1].b == b);
    1007       36241 :         ba[n - 1].t = bi.base;
    1008       36241 :         if (ATOMtype(b->ttype) == TYPE_oid) {
    1009             :                 /* oid all the way */
    1010         810 :                 oid *d = (oid *) Tloc(bn, 0);
    1011         810 :                 assert(!stringtrick);
    1012    15726397 :                 TIMEOUT_LOOP_IDX_DECL(p, ba[0].cnt, qry_ctx) {
    1013    15722035 :                         oid o = ba[0].ci.s ? canditer_next(&ba[0].ci) : ba[0].t[p];
    1014    63781029 :                         for (int i = 1; i < n; i++) {
    1015    48058990 :                                 if (is_oid_nil(o)) {
    1016           0 :                                         bn->tnil = true;
    1017           0 :                                         break;
    1018             :                                 }
    1019    48058990 :                                 if (o < ba[i].hlo || o >= ba[i].hhi) {
    1020           0 :                                         GDKerror("does not match always\n");
    1021           0 :                                         bat_iterator_end(&bi);
    1022           0 :                                         goto bunins_failed;
    1023             :                                 }
    1024    48058990 :                                 o -= ba[i].hlo;
    1025    47956439 :                                 o = ba[i].ci.s ?
    1026    25043953 :                                     (ba[i].ci.tpe == cand_dense) ?
    1027    25043953 :                                         canditer_idx_dense(&ba[i].ci, o) :
    1028    71118751 :                                         canditer_idx(&ba[i].ci, o) : ba[i].t[o];
    1029             :                         }
    1030    15722039 :                         *d++ = o;
    1031             :                 }
    1032       35431 :         } else if (!ATOMvarsized(tpe)) {
    1033       35159 :                 const void *v;
    1034       35159 :                 char *d = Tloc(bn, 0);
    1035             : 
    1036       35159 :                 bn->tnil = false;
    1037       35159 :                 n--;    /* stop one before the end, also ba[n] is last */
    1038   100224795 :                 TIMEOUT_LOOP_IDX_DECL(p, ba[0].cnt, qry_ctx) {
    1039   100105906 :                         oid o = ba[0].ci.s ? canditer_next(&ba[0].ci) : ba[0].t[p];
    1040             : 
    1041   238467461 :                         for (int i = 1; i < n; i++) {
    1042   138342220 :                                 if (is_oid_nil(o)) {
    1043          15 :                                         bn->tnil = true;
    1044          15 :                                         break;
    1045             :                                 }
    1046   138342205 :                                 if (o < ba[i].hlo || o >= ba[i].hhi) {
    1047           0 :                                         GDKerror("does not match always\n");
    1048           0 :                                         bat_iterator_end(&bi);
    1049           0 :                                         goto bunins_failed;
    1050             :                                 }
    1051   138342205 :                                 o -= ba[i].hlo;
    1052   138915462 :                                 o = ba[i].ci.s ?
    1053    56316233 :                                     (ba[i].ci.tpe == cand_dense) ?
    1054    56316233 :                                         canditer_idx_dense(&ba[i].ci, o) :
    1055   184293071 :                                         canditer_idx(&ba[i].ci, o) : ba[i].t[o];
    1056             :                         }
    1057   100125256 :                         if (is_oid_nil(o)) {
    1058          15 :                                 assert(!stringtrick);
    1059          15 :                                 bn->tnil = true;
    1060          15 :                                 v = nil;
    1061   100125241 :                         } else if (o < ba[n].hlo || o >= ba[n].hhi) {
    1062           0 :                                 GDKerror("does not match always\n");
    1063           0 :                                 bat_iterator_end(&bi);
    1064           0 :                                 goto bunins_failed;
    1065             :                         } else {
    1066   100125241 :                                 o -= ba[n].hlo;
    1067   100125241 :                                 v = (const char *) bi.base + (o << bi.shift);
    1068             :                         }
    1069   100125256 :                         if (ATOMputFIX(tpe, d, v) != GDK_SUCCEED) {
    1070           0 :                                 bat_iterator_end(&bi);
    1071           0 :                                 goto bunins_failed;
    1072             :                         }
    1073   100106109 :                         d += bi.width;
    1074             :                 }
    1075       35353 :                 if (stringtrick) {
    1076        6684 :                         bn->tnil = false;
    1077        6684 :                         bn->tnonil = b->tnonil;
    1078        6684 :                         bn->tkey = false;
    1079        6684 :                         assert(bn->tvheap == NULL);
    1080        6684 :                         bn->tvheap = bi.vh;
    1081        6684 :                         HEAPincref(bi.vh);
    1082        6685 :                         assert(bn->tvheap->parentid != bn->batCacheid);
    1083        6685 :                         BBPretain(bn->tvheap->parentid);
    1084        6691 :                         assert(bn->ttype == b->ttype);
    1085        6692 :                         assert(bn->twidth == bi.width);
    1086        6692 :                         assert(bn->tshift == bi.shift);
    1087             :                 }
    1088             :                 n++;            /* undo for debug print */
    1089             :         } else {
    1090         272 :                 const void *v;
    1091             : 
    1092         272 :                 assert(!stringtrick);
    1093         272 :                 bn->tnil = false;
    1094         272 :                 n--;    /* stop one before the end, also ba[n] is last */
    1095      701042 :                 TIMEOUT_LOOP_IDX_DECL(p, ba[0].cnt, qry_ctx) {
    1096      700458 :                         oid o = ba[0].ci.s ? canditer_next(&ba[0].ci) : ba[0].t[p];
    1097     1415369 :                         for (int i = 1; i < n; i++) {
    1098      715029 :                                 if (is_oid_nil(o)) {
    1099           0 :                                         bn->tnil = true;
    1100           0 :                                         break;
    1101             :                                 }
    1102      715029 :                                 if (o < ba[i].hlo || o >= ba[i].hhi) {
    1103           0 :                                         GDKerror("does not match always\n");
    1104           0 :                                         bat_iterator_end(&bi);
    1105           0 :                                         goto bunins_failed;
    1106             :                                 }
    1107      715029 :                                 o -= ba[i].hlo;
    1108      715072 :                                 o = ba[i].ci.s ?
    1109       19618 :                                     (ba[i].ci.tpe == cand_dense) ?
    1110       19618 :                                         canditer_idx_dense(&ba[i].ci, o) :
    1111      731957 :                                         canditer_idx(&ba[i].ci, o) : ba[i].t[o];
    1112             :                         }
    1113      700340 :                         if (is_oid_nil(o)) {
    1114           0 :                                 bn->tnil = true;
    1115           0 :                                 v = nil;
    1116      700340 :                         } else if (o < ba[n].hlo || o >= ba[n].hhi) {
    1117           0 :                                 GDKerror("does not match always\n");
    1118           0 :                                 bat_iterator_end(&bi);
    1119           0 :                                 goto bunins_failed;
    1120             :                         } else {
    1121      700340 :                                 o -= ba[n].hlo;
    1122      700340 :                                 v = BUNtail(bi, o);
    1123             :                         }
    1124      700344 :                         if (bunfastapp(bn, v) != GDK_SUCCEED) {
    1125           0 :                                 bat_iterator_end(&bi);
    1126           0 :                                 goto bunins_failed;
    1127             :                         }
    1128             :                 }
    1129             :                 n++;            /* undo for debug print */
    1130             :         }
    1131       36448 :         bat_iterator_end(&bi);
    1132       36525 :         TIMEOUT_CHECK(qry_ctx, GOTO_LABEL_TIMEOUT_HANDLER(bunins_failed, qry_ctx));
    1133       36446 :         BATsetcount(bn, ba[0].cnt);
    1134       36521 :         bn->tsorted = (ba[0].cnt <= 1) | issorted;
    1135       36521 :         bn->trevsorted = ba[0].cnt <= 1;
    1136       36521 :         bn->tnonil = nonil & b->tnonil;
    1137       36521 :         bn->tseqbase = oid_nil;
    1138       36521 :         bn->tkey = (ba[0].cnt <= 1);
    1139             :         /* note, b may point to one of the bats in tobedeleted, so
    1140             :          * reclaim after the last use of b */
    1141       36521 :         while (ndelete-- > 0)
    1142       46405 :                 BBPreclaim(tobedeleted[ndelete]);
    1143       36384 :         GDKfree(tobedeleted);
    1144       36331 :         GDKfree(ba);
    1145       36559 :         TRC_DEBUG(ALGO, "with %d bats: " ALGOOPTBATFMT " " LLFMT " usec\n",
    1146             :                   n, ALGOOPTBATPAR(bn), GDKusec() - t0);
    1147             :         return bn;
    1148             : 
    1149           0 :   bunins_failed:
    1150           0 :         while (ndelete-- > 0)
    1151           0 :                 BBPreclaim(tobedeleted[ndelete]);
    1152           0 :         GDKfree(tobedeleted);
    1153           0 :         GDKfree(ba);
    1154           0 :         BBPreclaim(bn);
    1155           0 :         TRC_DEBUG(ALGO, "failed " LLFMT "usec\n", GDKusec() - t0);
    1156             :         return NULL;
    1157             : }

Generated by: LCOV version 1.14