LCOV - code coverage report
Current view: top level - monetdb5/modules/mal - mat.c (source / functions) Hit Total Coverage
Test: coverage.info Lines: 100 155 64.5 %
Date: 2024-11-13 22:44:48 Functions: 5 5 100.0 %

          Line data    Source code
       1             : /*
       2             :  * SPDX-License-Identifier: MPL-2.0
       3             :  *
       4             :  * This Source Code Form is subject to the terms of the Mozilla Public
       5             :  * License, v. 2.0.  If a copy of the MPL was not distributed with this
       6             :  * file, You can obtain one at http://mozilla.org/MPL/2.0/.
       7             :  *
       8             :  * Copyright 2024 MonetDB Foundation;
       9             :  * Copyright August 2008 - 2023 MonetDB B.V.;
      10             :  * Copyright 1997 - July 2008 CWI.
      11             :  */
      12             : 
      13             : /*
      14             :  * Martin Kersten
      15             :  * Multiple association tables
      16             :  * A MAT is a convenient way to deal represent horizontal fragmented
      17             :  * tables. It combines the definitions of several, type compatible
      18             :  * BATs under a single name.
      19             :  * It is produced by the mitosis optimizer and the operations
      20             :  * are the target of the mergetable optimizer.
      21             :  *
      22             :  * The MAT is materialized when the operations
      23             :  * can not deal with the components individually,
      24             :  * or the incremental operation is not supported.
      25             :  * Normally all mat.new() operations are removed by the
      26             :  * mergetable optimizer.
      27             :  * In case a mat.new() is retained in the code, then it will
      28             :  * behave as a mat.pack();
      29             :  *
      30             :  * The primitives below are chosen to accommodate the SQL
      31             :  * front-end to produce reasonable efficient code.
      32             :  */
      33             : #include "monetdb_config.h"
      34             : #include "mal_resolve.h"
      35             : #include "mal_exception.h"
      36             : #include "mal_interpreter.h"
      37             : 
      38             : /*
      39             :  * The pack is an ordinary multi BAT insert. Oid synchronistion
      40             :  * between pieces should be ensured by the code generators.
      41             :  * The pack operation could be quite expensive, because it
      42             :  * may create a really large BAT.
      43             :  * The slice over a mat helps to avoid constructing intermediates
      44             :  * that are subsequently reduced.
      45             :  * Contrary to most operations, NIL arguments are skipped and
      46             :  * do not produce RUNTIME_OBJECT_MISSING.
      47             :  */
      48             : static str
      49       98169 : MATpackInternal(Client cntxt, MalBlkPtr mb, MalStkPtr stk, InstrPtr p)
      50             : {
      51       98169 :         int i;
      52       98169 :         bat *ret = getArgReference_bat(stk, p, 0);
      53       98169 :         BAT *b, *bn = NULL;
      54       98169 :         BUN cap = 0;
      55       98169 :         int tt = TYPE_any;
      56       98169 :         int rt = getArgType(mb, p, 0), unmask = 0;
      57       98169 :         (void) cntxt;
      58             : 
      59      490505 :         for (i = 1; i < p->argc; i++) {
      60      392360 :                 bat bid = stk->stk[getArg(p, i)].val.bval;
      61      392360 :                 b = BBPquickdesc(bid);
      62      392336 :                 if (b) {
      63      392336 :                         if (tt == TYPE_any)
      64       98160 :                                 tt = b->ttype;
      65      392336 :                         if ((tt != TYPE_void && b->ttype != TYPE_void
      66      326690 :                                  && b->ttype != TYPE_msk) && tt != b->ttype)
      67           0 :                                 throw(MAL, "mat.pack", "incompatible arguments");
      68      392336 :                         cap += BATcount(b);
      69             :                 }
      70             :         }
      71       98145 :         if (tt == TYPE_any) {
      72           0 :                 *ret = bat_nil;
      73           0 :                 return MAL_SUCCEED;
      74             :         }
      75             : 
      76       98145 :         if (tt == TYPE_msk && rt == newBatType(TYPE_oid)) {
      77           0 :                 tt = TYPE_oid;
      78           0 :                 unmask = 1;
      79             :         }
      80       98145 :         bn = COLnew(0, tt, cap, TRANSIENT);
      81       98160 :         if (bn == NULL)
      82           0 :                 throw(MAL, "mat.pack", SQLSTATE(HY013) MAL_MALLOC_FAIL);
      83             : 
      84      490464 :         for (i = 1; i < p->argc; i++) {
      85      392307 :                 if (!(b = BATdescriptor(stk->stk[getArg(p, i)].val.ival))) {
      86           0 :                         BBPreclaim(bn);
      87           0 :                         throw(MAL, "mat.pack", SQLSTATE(HY002) RUNTIME_OBJECT_MISSING);
      88             :                 }
      89      392409 :                 if ((unmask && b->ttype == TYPE_msk) || mask_cand(b)) {
      90        5384 :                         BAT *ob = b;
      91        5384 :                         b = BATunmask(b);
      92        5384 :                         BBPunfix(ob->batCacheid);
      93        5384 :                         if (!b) {
      94           0 :                                 BBPreclaim(bn);
      95           0 :                                 throw(MAL, "mat.pack", GDK_EXCEPTION);
      96             :                         }
      97             :                 }
      98      392409 :                 if (BATcount(bn) == 0) {
      99       98879 :                         BAThseqbase(bn, b->hseqbase);
     100       98882 :                         BATtseqbase(bn, b->tseqbase);
     101             :                 }
     102      392411 :                 if (BATappend(bn, b, NULL, false) != GDK_SUCCEED) {
     103           0 :                         BBPreclaim(bn);
     104           0 :                         BBPunfix(b->batCacheid);
     105           0 :                         throw(MAL, "mat.pack", GDK_EXCEPTION);
     106             :                 }
     107      392362 :                 BBPunfix(b->batCacheid);
     108             :         }
     109       98157 :         if (bn->tnil && bn->tnonil) {
     110           0 :                 BBPreclaim(bn);
     111           0 :                 throw(MAL, "mat.pack",
     112             :                           "INTERNAL ERROR" "bn->tnil or  bn->tnonil fails ");
     113             :         }
     114       98157 :         *ret = bn->batCacheid;
     115       98157 :         BBPkeepref(bn);
     116       98157 :         return MAL_SUCCEED;
     117             : }
     118             : 
     119             : /*
     120             :  * Enable incremental packing. The SQL front-end requires
     121             :  * fixed oid sequences.
     122             :  */
     123             : static str
     124      564386 : MATpackIncrement(Client cntxt, MalBlkPtr mb, MalStkPtr stk, InstrPtr p)
     125             : {
     126      564386 :         bat *ret = getArgReference_bat(stk, p, 0);
     127      564386 :         int pieces;
     128      564386 :         BAT *b, *bb, *bn;
     129      564386 :         size_t newsize;
     130             : 
     131      564386 :         (void) cntxt;
     132      564386 :         b = BATdescriptor(stk->stk[getArg(p, 1)].val.ival);
     133      564361 :         if (b == NULL)
     134           0 :                 throw(MAL, "mat.pack", SQLSTATE(HY002) RUNTIME_OBJECT_MISSING);
     135             : 
     136      564361 :         if (getArgType(mb, p, 2) == TYPE_int) {
     137             :                 /* first step, estimate with some slack */
     138      145808 :                 pieces = stk->stk[getArg(p, 2)].val.ival;
     139      145808 :                 int tt = ATOMtype(b->ttype);
     140      145808 :                 if (b->ttype == TYPE_msk)
     141           0 :                         tt = TYPE_oid;
     142      145808 :                 bn = COLnew(b->hseqbase, tt, (BUN) (1.2 * BATcount(b) * pieces),
     143             :                                         TRANSIENT);
     144      145801 :                 if (bn == NULL) {
     145           0 :                         BBPunfix(b->batCacheid);
     146           0 :                         throw(MAL, "mat.pack", SQLSTATE(HY013) MAL_MALLOC_FAIL);
     147             :                 }
     148             :                 /* allocate enough space for the vheap, but not for strings,
     149             :                  * since BATappend does clever things for strings, and not for
     150             :                  * vheap views since they may well get shared */
     151      145801 :                 if (b->tvheap && b->tvheap->parentid == b->batCacheid && bn->tvheap
     152       56634 :                         && ATOMstorage(b->ttype) != TYPE_str) {
     153          46 :                         newsize = b->tvheap->size * pieces;
     154          46 :                         if (HEAPextend(bn->tvheap, newsize, true) != GDK_SUCCEED) {
     155           0 :                                 BBPunfix(b->batCacheid);
     156           0 :                                 BBPreclaim(bn);
     157           0 :                                 throw(MAL, "mat.pack", GDK_EXCEPTION);
     158             :                         }
     159             :                 }
     160      145801 :                 BATtseqbase(bn, b->tseqbase);
     161      145811 :                 if (b->ttype == TYPE_msk || mask_cand(b)) {
     162           0 :                         BAT *ob = b;
     163           0 :                         b = BATunmask(b);
     164           0 :                         BBPunfix(ob->batCacheid);
     165           0 :                         if (!b) {
     166           0 :                                 BBPreclaim(bn);
     167           0 :                                 throw(MAL, "mat.pack", GDK_EXCEPTION);
     168             :                         }
     169             :                 }
     170      145811 :                 if (BATappend(bn, b, NULL, false) != GDK_SUCCEED) {
     171           0 :                         BBPreclaim(bn);
     172           0 :                         BBPunfix(b->batCacheid);
     173           0 :                         throw(MAL, "mat.pack", GDK_EXCEPTION);
     174             :                 }
     175      145809 :                 bn->tunique_est = b->tunique_est;
     176      145809 :                 bn->unused = (pieces - 1);   /* misuse "unused" field */
     177      145809 :                 BBPunfix(b->batCacheid);
     178      145794 :                 if (bn->tnil && bn->tnonil) {
     179           0 :                         BBPreclaim(bn);
     180           0 :                         throw(MAL, "mat.pack",
     181           0 :                                   "INTERNAL ERROR" " bn->tnil %d bn->tnonil %d", bn->tnil,
     182           0 :                                   bn->tnonil);
     183             :                 }
     184      145794 :                 *ret = bn->batCacheid;
     185      145794 :                 BBPretain(bn->batCacheid);
     186      145797 :                 BBPunfix(bn->batCacheid);
     187             :         } else {
     188             :                 /* remaining steps */
     189      418553 :                 if (!(bb = BATdescriptor(stk->stk[getArg(p, 2)].val.ival))) {
     190           0 :                         BBPunfix(b->batCacheid);
     191           0 :                         throw(MAL, "mat.pack", SQLSTATE(HY002) RUNTIME_OBJECT_MISSING);
     192             :                 }
     193      418469 :                 if (bb->ttype == TYPE_msk || mask_cand(bb)) {
     194           0 :                         BAT *obb = bb;
     195           0 :                         bb = BATunmask(bb);
     196           0 :                         BBPunfix(obb->batCacheid);
     197           0 :                         if (!bb) {
     198           0 :                                 BBPunfix(b->batCacheid);
     199           0 :                                 throw(MAL, "mat.pack", GDK_EXCEPTION);
     200             :                         }
     201             :                 }
     202      418469 :                 if (BATcount(b) == 0) {
     203      247745 :                         BAThseqbase(b, bb->hseqbase);
     204      247799 :                         BATtseqbase(b, bb->tseqbase);
     205             :                 }
     206      418494 :                 if (BATappend(b, bb, NULL, false) != GDK_SUCCEED) {
     207           0 :                         BBPunfix(bb->batCacheid);
     208           0 :                         BBPunfix(b->batCacheid);
     209           0 :                         throw(MAL, "mat.pack", GDK_EXCEPTION);
     210             :                 }
     211      418560 :                 BBPunfix(bb->batCacheid);
     212      418385 :                 b->tunique_est += bb->tunique_est;
     213      418385 :                 b->unused--;
     214      418385 :                 if (b->unused == 0 && (b = BATsetaccess(b, BAT_READ)) == NULL)
     215           0 :                         throw(MAL, "mat.pack", GDK_EXCEPTION);
     216      418411 :                 if (b->tnil && b->tnonil) {
     217           0 :                         BBPunfix(b->batCacheid);
     218           0 :                         throw(MAL, "mat.pack",
     219             :                                   "INTERNAL ERROR" " b->tnil or  b->tnonil fails ");
     220             :                 }
     221      418411 :                 *ret = b->batCacheid;
     222      418411 :                 BBPretain(b->batCacheid);
     223      418519 :                 BBPunfix(b->batCacheid);
     224             :         }
     225             :         return MAL_SUCCEED;
     226             : }
     227             : 
     228             : static str
     229       98168 : MATpack(Client cntxt, MalBlkPtr mb, MalStkPtr stk, InstrPtr p)
     230             : {
     231       98168 :         return MATpackInternal(cntxt, mb, stk, p);
     232             : }
     233             : 
     234             : static str
     235      294871 : MATpackValues(Client cntxt, MalBlkPtr mb, MalStkPtr stk, InstrPtr p)
     236             : {
     237      294871 :         int i, type, first = 1;
     238      294871 :         bat *ret;
     239      294871 :         BAT *bn;
     240             : 
     241      294871 :         (void) cntxt;
     242      294871 :         type = getArgType(mb, p, first);
     243      294871 :         bn = COLnew(0, type, p->argc, TRANSIENT);
     244      294726 :         if (bn == NULL)
     245           0 :                 throw(MAL, "mat.pack", SQLSTATE(HY013) MAL_MALLOC_FAIL);
     246             : 
     247      294726 :         if (ATOMextern(type)) {
     248      888187 :                 for (i = first; i < p->argc; i++)
     249      712447 :                         if (BUNappend(bn, stk->stk[getArg(p, i)].val.pval, false) != GDK_SUCCEED)
     250           0 :                                 goto bailout;
     251             :         } else {
     252      604339 :                 for (i = first; i < p->argc; i++)
     253      485367 :                         if (BUNappend(bn, getArgReference(stk, p, i), false) != GDK_SUCCEED)
     254           0 :                                 goto bailout;
     255             :         }
     256      294712 :         ret = getArgReference_bat(stk, p, 0);
     257      294712 :         *ret = bn->batCacheid;
     258      294712 :         BBPkeepref(bn);
     259      294712 :         return MAL_SUCCEED;
     260           0 :   bailout:
     261           0 :         BBPreclaim(bn);
     262           0 :         throw(MAL, "mat.pack", GDK_EXCEPTION);
     263             : }
     264             : 
     265             : #include "mel.h"
     266             : mel_func mat_init_funcs[] = {
     267             :  pattern("mat", "new", MATpack, false, "Define a Merge Association Table (MAT). Fall back to the pack operation\nwhen this is called ", args(1,2, batargany("",1),batvarargany("b",1))),
     268             :  pattern("bat", "pack", MATpackValues, false, "Materialize the values into a BAT. Avoiding a clash with mat.pack() in mergetable", args(1,2, batargany("",1),varargany("",1))),
     269             :  pattern("mat", "pack", MATpackValues, false, "Materialize the MAT (of values) into a BAT", args(1,2, batargany("",1),varargany("",1))),
     270             :  pattern("mat", "pack", MATpack, false, "Materialize the MAT into a BAT", args(1,2, batargany("",1),batvarargany("b",1))),
     271             :  pattern("mat", "packIncrement", MATpackIncrement, false, "Prepare incremental mat pack", args(1,3, batargany("",1),batargany("b",1),arg("pieces",int))),
     272             :  pattern("mat", "packIncrement", MATpackIncrement, false, "Prepare incremental mat pack", args(1,3, batargany("",1),batargany("b",1),batargany("c",1))),
     273             :  { .imp=NULL }
     274             : };
     275             : #include "mal_import.h"
     276             : #ifdef _MSC_VER
     277             : #undef read
     278             : #pragma section(".CRT$XCU",read)
     279             : #endif
     280         308 : LIB_STARTUP_FUNC(init_mat_mal)
     281         308 : { mal_module("mat", NULL, mat_init_funcs); }

Generated by: LCOV version 1.14