Line data Source code
1 : /*
2 : * SPDX-License-Identifier: MPL-2.0
3 : *
4 : * This Source Code Form is subject to the terms of the Mozilla Public
5 : * License, v. 2.0. If a copy of the MPL was not distributed with this
6 : * file, You can obtain one at http://mozilla.org/MPL/2.0/.
7 : *
8 : * Copyright 2024 MonetDB Foundation;
9 : * Copyright August 2008 - 2023 MonetDB B.V.;
10 : * Copyright 1997 - July 2008 CWI.
11 : */
12 :
13 : /*
14 : * @a M. L. Kersten, P. Boncz, N. J. Nes
15 : * @* BAT Buffer Pool (BBP)
16 : * The BATs created and loaded are collected in a BAT buffer pool.
17 : * The Bat Buffer Pool has a number of functions:
18 : * @table @code
19 : *
20 : * @item administration and lookup
21 : * The BBP is a directory which contains status information about all
22 : * known BATs. This interface may be used very heavily, by
23 : * data-intensive applications. To eliminate all overhead, read-only
24 : * access to the BBP may be done by table-lookups. The integer index
25 : * type for these lookups is @emph{bat}, as retrieved by
26 : * @emph{b->batCacheid}. The @emph{bat} zero is reserved for the nil
27 : * bat.
28 : *
29 : * @item persistence
30 : * The BBP is made persistent by saving it to the dictionary file
31 : * called @emph{BBP.dir} in the database.
32 : *
33 : * When the number of BATs rises, having all files in one directory
34 : * becomes a bottleneck. The BBP therefore implements a scheme that
35 : * distributes all BATs in a growing directory tree with at most 64
36 : * BATs stored in one node.
37 : *
38 : * @item buffer management
39 : * The BBP is responsible for loading and saving of BATs to disk. It
40 : * also contains routines to unload BATs from memory when memory
41 : * resources get scarce. For this purpose, it administers BAT memory
42 : * reference counts (to know which BATs can be unloaded) and BAT usage
43 : * statistics (it unloads the least recently used BATs).
44 : *
45 : * @item recovery
46 : * When the database is closed or during a run-time syncpoint, the
47 : * system tables must be written to disk in a safe way, that is immune
48 : * for system failures (like disk full). To do so, the BBP implements
49 : * an atomic commit and recovery protocol: first all files to be
50 : * overwritten are moved to a BACKUP/ dir. If that succeeds, the
51 : * writes are done. If that also fully succeeds the BACKUP/ dir is
52 : * renamed to DELETE_ME/ and subsequently deleted. If not, all files
53 : * in BACKUP/ are moved back to their original location.
54 : *
55 : * @item unloading
56 : * Bats which have a logical reference (ie. a lrefs > 0) but no memory
57 : * reference (refcnt == 0) can be unloaded. Unloading dirty bats
58 : * means, moving the original (committed version) to the BACKUP/ dir
59 : * and saving the bat. This complicates the commit and recovery/abort
60 : * issues. The commit has to check if the bat is already moved. And
61 : * The recovery has to always move back the files from the BACKUP/
62 : * dir.
63 : *
64 : * @item reference counting
65 : * Bats use have two kinds of references: logical and physical
66 : * (pointer) ones. The logical references are administered by
67 : * BBPretain/BBPrelease, the physical ones by BBPfix/BBPunfix.
68 : */
69 :
70 : #include "monetdb_config.h"
71 : #include "gdk.h"
72 : #include "gdk_private.h"
73 : #include "mutils.h"
74 : #ifdef HAVE_FCNTL_H
75 : #include <fcntl.h>
76 : #endif
77 :
78 : #ifndef F_OK
79 : #define F_OK 0
80 : #endif
81 : #ifndef S_ISDIR
82 : #define S_ISDIR(mode) (((mode) & _S_IFMT) == _S_IFDIR)
83 : #endif
84 : #ifndef O_CLOEXEC
85 : #ifdef _O_NOINHERIT
86 : #define O_CLOEXEC _O_NOINHERIT /* Windows */
87 : #else
88 : #define O_CLOEXEC 0
89 : #endif
90 : #endif
91 : #ifndef O_BINARY
92 : #define O_BINARY 0
93 : #endif
94 :
95 : /*
96 : * The BBP has a fixed address, so re-allocation due to a growing BBP
97 : * caused by one thread does not disturb reads to the old entries by
98 : * another. This is implemented using anonymous virtual memory;
99 : * extensions on the same address are guaranteed because a large
100 : * non-committed VM area is requested initially. New slots in the BBP
101 : * are found in O(1) by keeping a freelist that uses the 'next' field
102 : * in the BBPrec records.
103 : */
104 : static BBPrec BBP0[BBPINIT];
105 : BBPrec *BBP[N_BBPINIT] = {[0] = BBP0}; /* fixed base VM address of BBP array */
106 : bat BBPlimit = BBPINIT; /* current committed VM BBP array */
107 : static ATOMIC_TYPE BBPsize = ATOMIC_VAR_INIT(0); /* current used size of BBP array */
108 :
109 : struct BBPfarm_t BBPfarms[MAXFARMS];
110 :
111 : #define KITTENNAP 1 /* used to suspend processing */
112 : #define BBPNONAME "." /* filler for no name in BBP.dir */
113 : /*
114 : * The hash index uses a bucket index (int array) of size mask that is
115 : * tuned for perfect hashing (1 lookup). The bucket chain uses the
116 : * 'next' field in the BBPrec records.
117 : */
118 : static MT_Lock BBPnameLock = MT_LOCK_INITIALIZER(BBPnameLock);
119 : #define BBP_mask 1023 /* number of buckets = & mask */
120 : static bat BBP_hash[BBP_mask+1]; /* BBP logical name hash buckets */
121 : static MT_Lock GDKcacheLock = MT_LOCK_INITIALIZER(GDKcacheLock);
122 : static bat BBP_free;
123 : static uint32_t BBP_nfree;
124 : #define BBP_FREE_LOWATER 10
125 : #define BBP_FREE_HIWATER 50
126 :
127 : static gdk_return BBPfree(BAT *b);
128 : static void BBPdestroy(BAT *b);
129 : static void BBPuncacheit(bat bid, bool unloaddesc);
130 : static gdk_return BBPprepare(bool subcommit);
131 : static BAT *getBBPdescriptor(bat i);
132 : static gdk_return BBPbackup(BAT *b, bool subcommit);
133 : static gdk_return BBPdir_init(void);
134 : static void BBPcallbacks(void);
135 :
136 : /* two lngs of extra info in BBP.dir */
137 : /* these two are atomic because of their use in log_new() */
138 : static ATOMIC_TYPE BBPlogno = ATOMIC_VAR_INIT(0);
139 :
140 : #define BBPtmpcheck(s) (strncmp(s, "tmp_", 4) == 0)
141 :
142 : #define BBPnamecheck(s) (BBPtmpcheck(s) ? strtol((s) + 4, NULL, 8) : 0)
143 :
144 : #define BATno_shared_heap(b) \
145 : (!VIEWtparent(b) && (ATOMIC_GET(&(b)->theap->refs) & HEAPREFS) == 1)
146 :
147 : #define BATshared(b) \
148 : ((!VIEWtparent(b) && (ATOMIC_GET(&(b)->theap->refs) & HEAPREFS) > 1) || \
149 : ((b)->tvheap && !VIEWvtparent(b) && (ATOMIC_GET(&(b)->tvheap->refs) & HEAPREFS) > 1))
150 :
151 : static void
152 25924 : BBP_insert(bat i)
153 : {
154 25924 : bat idx = (bat) (strHash(BBP_logical(i)) & BBP_mask);
155 :
156 25924 : BBP_next(i) = BBP_hash[idx];
157 25924 : BBP_hash[idx] = i;
158 25924 : }
159 :
160 : static void
161 14731 : BBP_delete(bat i)
162 : {
163 14731 : const char *s = BBP_logical(i);
164 14731 : bat idx = (bat) (strHash(s) & BBP_mask);
165 :
166 14731 : for (bat *h = &BBP_hash[idx]; (i = *h) != 0; h = &BBP_next(i)) {
167 14731 : if (strcmp(BBP_logical(i), s) == 0) {
168 14731 : *h = BBP_next(i);
169 14731 : break;
170 : }
171 : }
172 14731 : }
173 :
174 : bat
175 370568541 : getBBPsize(void)
176 : {
177 370568541 : return (bat) ATOMIC_GET(&BBPsize);
178 : }
179 :
180 : lng
181 341 : getBBPlogno(void)
182 : {
183 341 : return (lng) ATOMIC_GET(&BBPlogno);
184 : }
185 :
186 :
187 : /*
188 : * @+ BBP Consistency and Concurrency
189 : * While GDK provides the basic building blocks for an ACID system, in
190 : * itself it is not such a system, as we this would entail too much
191 : * overhead that is often not needed. Hence, some consistency control
192 : * is left to the user. The first important user constraint is that if
193 : * a user updates a BAT, (s)he himself must assure that no-one else
194 : * accesses this BAT.
195 : *
196 : * Concerning buffer management, the BBP carries out a swapping
197 : * policy. BATs are kept in memory till the memory is full. If the
198 : * memory is full, the malloc functions initiate BBP trim actions,
199 : * that unload the coldest BATs that have a zero reference count. The
200 : * second important user constraint is therefore that a user may only
201 : * manipulate live BAT data in memory if it is sure that there is at
202 : * least one reference count to that BAT.
203 : *
204 : * The main BBP array is protected by two locks:
205 : * @table @code
206 : * @item GDKcacheLock]
207 : * this lock guards the free slot management in the BBP array. The
208 : * BBP operations that allocate a new slot for a new BAT
209 : * (@emph{BBPinit},@emph{BBPcacheit}), delete the slot of a destroyed
210 : * BAT (@emph{BBPreclaim}), or rename a BAT (@emph{BBPrename}), hold
211 : * this lock. It also protects all BAT (re)naming actions include
212 : * (read and write) in the hash table with BAT names.
213 : * @item GDKswapLock
214 : * this lock guards the swap (loaded/unloaded) status of the
215 : * BATs. Hence, all BBP routines that influence the swapping policy,
216 : * or actually carry out the swapping policy itself, acquire this lock
217 : * (e.g. @emph{BBPfix},@emph{BBPunfix}). Note that this also means
218 : * that updates to the BBP_status indicator array must be protected by
219 : * GDKswapLock.
220 : *
221 : * To reduce contention GDKswapLock was split into multiple locks; it
222 : * is now an array of lock pointers which is accessed by
223 : * GDKswapLock(bat)
224 : * @end table
225 : *
226 : * Routines that need both locks should first acquire the locks in the
227 : * GDKswapLock array (in ascending order) and then GDKcacheLock (and
228 : * release them in reverse order).
229 : *
230 : * To obtain maximum speed, read operations to existing elements in
231 : * the BBP are unguarded. As said, it is the users responsibility that
232 : * the BAT that is being read is not being modified. BBP update
233 : * actions that modify the BBP data structure itself are locked by the
234 : * BBP functions themselves. Hence, multiple concurrent BBP read
235 : * operations may be ongoing while at the same time at most one BBP
236 : * write operation @strong{on a different BAT} is executing. This
237 : * holds for accesses to the public (quasi-) arrays @emph{BBPcache},
238 : * @emph{BBPstatus} and @emph{BBPrefs}.
239 : * These arrays are called quasi as now they are
240 : * actually stored together in one big BBPrec array called BBP, that
241 : * is allocated in anonymous VM space, so we can reallocate this
242 : * structure without changing the base address (a crucial feature if
243 : * read actions are to go on unlocked while other entries in the BBP
244 : * may be modified).
245 : */
246 : static volatile MT_Id locked_by = 0;
247 :
248 : /* use a lock instead of atomic instructions so that we wait for
249 : * BBPlock/BBPunlock */
250 : #define BBP_unload_inc() \
251 : do { \
252 : MT_lock_set(&GDKunloadLock); \
253 : BBPunloadCnt++; \
254 : MT_lock_unset(&GDKunloadLock); \
255 : } while (0)
256 :
257 : #define BBP_unload_dec() \
258 : do { \
259 : MT_lock_set(&GDKunloadLock); \
260 : --BBPunloadCnt; \
261 : assert(BBPunloadCnt >= 0); \
262 : MT_lock_unset(&GDKunloadLock); \
263 : } while (0)
264 :
265 : static int BBPunloadCnt = 0;
266 : static MT_Lock GDKunloadLock = MT_LOCK_INITIALIZER(GDKunloadLock);
267 :
268 : void
269 8 : BBPlock(void)
270 : {
271 8 : int i;
272 :
273 : /* wait for all pending unloads to finish */
274 8 : MT_lock_set(&GDKunloadLock);
275 8 : while (BBPunloadCnt > 0) {
276 0 : MT_lock_unset(&GDKunloadLock);
277 0 : MT_sleep_ms(1);
278 8 : MT_lock_set(&GDKunloadLock);
279 : }
280 :
281 8 : BBPtmlock();
282 8 : MT_lock_set(&GDKcacheLock);
283 65552 : for (i = 0; i <= BBP_BATMASK; i++)
284 65536 : MT_lock_set(&GDKswapLock(i));
285 8 : locked_by = MT_getpid();
286 :
287 8 : MT_lock_unset(&GDKunloadLock);
288 8 : }
289 :
290 : void
291 8 : BBPunlock(void)
292 : {
293 8 : int i;
294 :
295 65544 : for (i = BBP_BATMASK; i >= 0; i--)
296 65536 : MT_lock_unset(&GDKswapLock(i));
297 8 : MT_lock_unset(&GDKcacheLock);
298 8 : locked_by = 0;
299 8 : BBPtmunlock();
300 8 : }
301 :
302 : int
303 11443832 : BBPselectfarm(role_t role, int type, enum heaptype hptype)
304 : {
305 11443832 : int i;
306 :
307 11443832 : (void) type; /* may use in future */
308 11443832 : (void) hptype; /* may use in future */
309 :
310 11443832 : if (GDKinmemory(0))
311 : return 0;
312 :
313 22514759 : for (i = 0; i < MAXFARMS; i++)
314 22514759 : if (BBPfarms[i].roles & (1U << (int) role))
315 11424329 : return i;
316 : /* must be able to find farms for TRANSIENT and PERSISTENT */
317 0 : assert(role != TRANSIENT && role != PERSISTENT);
318 : return -1;
319 : }
320 :
321 : static gdk_return
322 315 : BBPextend(bat newsize)
323 : {
324 315 : if (newsize > N_BBPINIT * BBPINIT) {
325 0 : GDKerror("trying to extend BAT pool beyond the "
326 : "limit (%d)\n", N_BBPINIT * BBPINIT);
327 0 : return GDK_FAIL;
328 : }
329 :
330 : /* make sure the new size is at least BBPsize large */
331 315 : while (BBPlimit < newsize) {
332 0 : BUN limit = BBPlimit >> BBPINITLOG;
333 0 : assert(BBP[limit] == NULL);
334 0 : BBP[limit] = GDKzalloc(BBPINIT * sizeof(BBPrec));
335 0 : if (BBP[limit] == NULL) {
336 0 : GDKerror("failed to extend BAT pool\n");
337 0 : return GDK_FAIL;
338 : }
339 0 : for (BUN i = 0; i < BBPINIT; i++) {
340 0 : ATOMIC_INIT(&BBP[limit][i].status, 0);
341 0 : BBP[limit][i].pid = ~(MT_Id)0;
342 : }
343 0 : BBPlimit += BBPINIT;
344 : }
345 :
346 : return GDK_SUCCEED;
347 : }
348 :
349 : static gdk_return
350 89 : recover_dir(int farmid, bool direxists)
351 : {
352 89 : if (direxists) {
353 : /* just try; don't care about these non-vital files */
354 0 : if (GDKunlink(farmid, BATDIR, "BBP", "bak") != GDK_SUCCEED)
355 0 : GDKwarning("unlink of BBP.bak failed\n");
356 0 : if (GDKmove(farmid, BATDIR, "BBP", "dir", BATDIR, "BBP", "bak", false) != GDK_SUCCEED)
357 0 : GDKwarning("rename of BBP.dir to BBP.bak failed\n");
358 : }
359 89 : return GDKmove(farmid, BAKDIR, "BBP", "dir", BATDIR, "BBP", "dir", true);
360 : }
361 :
362 : static inline str
363 430996 : BBPsubdir_recursive(char *s, bat i)
364 : {
365 430996 : i >>= 6;
366 430996 : if (i >= 0100) {
367 60670 : s = BBPsubdir_recursive(s, i);
368 60670 : *s++ = DIR_SEP;
369 : }
370 430996 : i &= 077;
371 430996 : *s++ = '0' + (i >> 3);
372 430996 : *s++ = '0' + (i & 7);
373 430996 : return s;
374 : }
375 :
376 : static inline void
377 0 : BBPgetsubdir(char *s, bat i)
378 : {
379 0 : if (i >= 0100) {
380 0 : s = BBPsubdir_recursive(s, i);
381 : }
382 0 : *s = 0;
383 0 : }
384 :
385 : static inline void
386 390265 : BBPgetfilename(char *s, size_t len, bat i)
387 : {
388 390265 : if (i >= 0100) {
389 370360 : char *p = BBPsubdir_recursive(s, i);
390 370324 : *p++ = DIR_SEP;
391 370324 : len -= (p - s);
392 370324 : s = p;
393 : }
394 390229 : if (snprintf(s, len, "%o", i) >= (int) len)
395 0 : TRC_CRITICAL(BAT_, "impossible error\n");
396 390229 : }
397 :
398 : static gdk_return BBPrecover(int farmid);
399 : static gdk_return BBPrecover_subdir(void);
400 : static bool BBPdiskscan(const char *, size_t);
401 :
402 : static int
403 6562 : vheapinit(BAT *b, const char *buf, unsigned bbpversion, const char *filename, int lineno)
404 : {
405 6562 : int n = 0;
406 6562 : uint64_t free, size;
407 6562 : uint16_t storage;
408 :
409 6562 : (void) bbpversion; /* could be used to implement compatibility */
410 :
411 6562 : size = 0; /* for GDKLIBRARY_HSIZE case */
412 6562 : storage = STORE_INVALID; /* for GDKLIBRARY_HSIZE case */
413 13124 : if (bbpversion <= GDKLIBRARY_HSIZE ?
414 0 : sscanf(buf,
415 : " %" SCNu64 " %" SCNu64 " %" SCNu16
416 : "%n",
417 : &free, &size, &storage, &n) < 3 :
418 6562 : sscanf(buf,
419 : " %" SCNu64
420 : "%n",
421 : &free, &n) < 1) {
422 0 : TRC_CRITICAL(GDK, "invalid format for BBP.dir on line %d", lineno);
423 0 : return -1;
424 : }
425 6562 : if (b->batCount == 0)
426 1852 : free = 0;
427 6562 : if (b->ttype >= 0 &&
428 6448 : ATOMstorage(b->ttype) == TYPE_str &&
429 6418 : free < GDK_STRHASHTABLE * sizeof(stridx_t) + BATTINY * GDK_VARALIGN)
430 5529 : size = GDK_STRHASHTABLE * sizeof(stridx_t) + BATTINY * GDK_VARALIGN;
431 1033 : else if (free < 512)
432 68 : size = 512;
433 : else
434 965 : size = free;
435 13124 : *b->tvheap = (Heap) {
436 6562 : .free = (size_t) free,
437 6562 : .size = (size_t) size,
438 : .base = NULL,
439 : .storage = STORE_INVALID,
440 : .cleanhash = true,
441 : .newstorage = STORE_INVALID,
442 : .dirty = false,
443 6562 : .parentid = b->batCacheid,
444 6562 : .farmid = BBPselectfarm(PERSISTENT, b->ttype, varheap),
445 6562 : .hasfile = free > 0,
446 : };
447 6562 : strconcat_len(b->tvheap->filename, sizeof(b->tvheap->filename),
448 : filename, ".theap", NULL);
449 6562 : return n;
450 : }
451 :
452 : static int
453 24718 : heapinit(BAT *b, const char *buf,
454 : #ifdef GDKLIBRARY_HASHASH
455 : int *hashash,
456 : #endif
457 : unsigned bbpversion, const char *filename, int lineno)
458 : {
459 24718 : int t;
460 24718 : char type[33];
461 24718 : uint16_t width;
462 24718 : uint16_t var;
463 24718 : uint16_t properties;
464 24718 : uint64_t nokey0;
465 24718 : uint64_t nokey1;
466 24718 : uint64_t nosorted;
467 24718 : uint64_t norevsorted;
468 24718 : uint64_t base;
469 24718 : uint64_t free;
470 24718 : uint64_t size;
471 24718 : uint16_t storage;
472 24718 : uint64_t minpos, maxpos;
473 24718 : int n;
474 :
475 24718 : (void) bbpversion; /* could be used to implement compatibility */
476 :
477 24718 : size = 0; /* for GDKLIBRARY_HSIZE case */
478 24718 : storage = STORE_INVALID; /* for GDKLIBRARY_HSIZE case */
479 49436 : if (bbpversion <= GDKLIBRARY_HSIZE ?
480 0 : sscanf(buf,
481 : " %10s %" SCNu16 " %" SCNu16 " %" SCNu16 " %" SCNu64
482 : " %" SCNu64 " %" SCNu64 " %" SCNu64 " %" SCNu64
483 : " %" SCNu64 " %" SCNu64 " %" SCNu16 " %" SCNu64 " %" SCNu64
484 : "%n",
485 : type, &width, &var, &properties, &nokey0,
486 : &nokey1, &nosorted, &norevsorted, &base,
487 : &free, &size, &storage, &minpos, &maxpos,
488 : &n) < 14 :
489 24718 : sscanf(buf,
490 : " %10s %" SCNu16 " %" SCNu16 " %" SCNu16 " %" SCNu64
491 : " %" SCNu64 " %" SCNu64 " %" SCNu64 " %" SCNu64
492 : " %" SCNu64 " %" SCNu64 " %" SCNu64
493 : "%n",
494 : type, &width, &var, &properties, &nokey0,
495 : &nokey1, &nosorted, &norevsorted, &base,
496 : &free, &minpos, &maxpos,
497 : &n) < 12) {
498 0 : TRC_CRITICAL(GDK, "invalid format for BBP.dir on line %d", lineno);
499 0 : return -1;
500 : }
501 :
502 24718 : if (strcmp(type, "wkba") == 0)
503 0 : GDKwarning("type wkba (SQL name: GeometryA) is deprecated\n");
504 :
505 24718 : if (properties & ~0x1F81) {
506 0 : TRC_CRITICAL(GDK, "unknown properties are set: incompatible database on line %d of BBP.dir\n", lineno);
507 0 : return -1;
508 : }
509 : #ifdef GDKLIBRARY_HASHASH
510 24718 : *hashash = var & 2;
511 : #endif
512 24718 : var &= ~2;
513 24718 : if ((t = ATOMindex(type)) < 0) {
514 129 : if ((t = ATOMunknown_find(type)) == 0) {
515 0 : TRC_CRITICAL(GDK, "no space for atom %s", type);
516 0 : return -1;
517 : }
518 31037 : } else if (var != (t == TYPE_void || BATatoms[t].atomPut != NULL)) {
519 0 : TRC_CRITICAL(GDK, "inconsistent entry in BBP.dir: tvarsized mismatch for BAT %d on line %d\n", (int) b->batCacheid, lineno);
520 0 : return -1;
521 24589 : } else if (var && t != 0 ?
522 6448 : ATOMsize(t) < width ||
523 6448 : (width != 1 && width != 2 && width != 4
524 : #if SIZEOF_VAR_T == 8
525 30 : && width != 8
526 : #endif
527 : ) :
528 18141 : ATOMsize(t) != width) {
529 0 : TRC_CRITICAL(GDK, "inconsistent entry in BBP.dir: tsize mismatch for BAT %d on line %d\n", (int) b->batCacheid, lineno);
530 0 : return -1;
531 : }
532 24718 : b->ttype = t;
533 24718 : b->twidth = width;
534 24718 : b->tshift = ATOMelmshift(width);
535 24718 : assert_shift_width(b->tshift,b->twidth);
536 24718 : b->tnokey[0] = (BUN) nokey0;
537 24718 : b->tnokey[1] = (BUN) nokey1;
538 24718 : b->tsorted = (bit) ((properties & 0x0001) != 0);
539 24718 : b->trevsorted = (bit) ((properties & 0x0080) != 0);
540 24718 : b->tkey = (properties & 0x0100) != 0;
541 24718 : b->tnonil = (properties & 0x0400) != 0;
542 24718 : b->tnil = (properties & 0x0800) != 0;
543 24718 : b->tascii = (properties & 0x1000) != 0;
544 24718 : b->tnosorted = (BUN) nosorted;
545 24718 : b->tnorevsorted = (BUN) norevsorted;
546 24718 : b->tunique_est = 0.0;
547 : /* (properties & 0x0200) is the old tdense flag */
548 24718 : b->tseqbase = (properties & 0x0200) == 0 || base >= (uint64_t) oid_nil ? oid_nil : (oid) base;
549 24718 : b->theap->free = (size_t) free;
550 24718 : b->theap->hasfile = free > 0;
551 : /* set heap size to match capacity */
552 24718 : if (b->ttype == TYPE_msk) {
553 : /* round up capacity to multiple of 32 */
554 3829 : b->batCapacity = (b->batCapacity + 31) & ~((BUN) 31);
555 3829 : b->theap->size = b->batCapacity / 8;
556 : } else {
557 20889 : b->theap->size = (size_t) b->batCapacity << b->tshift;
558 : }
559 24718 : b->theap->base = NULL;
560 24718 : settailname(b->theap, filename, t, width);
561 24718 : b->theap->storage = STORE_INVALID;
562 24718 : b->theap->newstorage = STORE_INVALID;
563 24718 : b->theap->farmid = BBPselectfarm(PERSISTENT, b->ttype, offheap);
564 24718 : b->theap->dirty = false;
565 24718 : b->theap->parentid = b->batCacheid;
566 24718 : if (minpos < b->batCount)
567 9761 : b->tminpos = (BUN) minpos;
568 : else
569 14957 : b->tminpos = BUN_NONE;
570 24718 : if (maxpos < b->batCount)
571 9826 : b->tmaxpos = (BUN) maxpos;
572 : else
573 14892 : b->tmaxpos = BUN_NONE;
574 24718 : if (t && var) {
575 6562 : t = vheapinit(b, buf + n, bbpversion, filename, lineno);
576 6562 : if (t < 0)
577 : return t;
578 6562 : n += t;
579 : } else {
580 18156 : b->tvheap = NULL;
581 : }
582 24718 : return n;
583 : }
584 :
585 : /* read a single line from the BBP.dir file (file pointer fp) and fill
586 : * in the structure pointed to by bn and extra information through the
587 : * other pointers; this function does not allocate any memory; return 0
588 : * on end of file, 1 on success, and -1 on failure */
589 : /* set to true during initialization, else always false; if false, do
590 : * not return any options (set pointer to NULL as if there aren't any);
591 : * if true and there are options, return them in freshly allocated
592 : * memory through *options */
593 : static bool return_options = false;
594 : int
595 25037 : BBPreadBBPline(FILE *fp, unsigned bbpversion, int *lineno, BAT *bn,
596 : #ifdef GDKLIBRARY_HASHASH
597 : int *hashash,
598 : #endif
599 : char *batname, char *filename, char **options)
600 : {
601 25037 : char buf[4096];
602 25037 : uint64_t batid;
603 25037 : unsigned int properties;
604 25037 : int nread, n;
605 25037 : char *s;
606 25037 : uint64_t count, base = 0;
607 :
608 25037 : if (fgets(buf, sizeof(buf), fp) == NULL) {
609 319 : if (ferror(fp)) {
610 0 : TRC_CRITICAL(GDK, "error reading BBP.dir on line %d\n", *lineno);
611 0 : return -1;
612 : }
613 : return 0; /* end of file */
614 : }
615 24718 : (*lineno)++;
616 24718 : if ((s = strpbrk(buf, "\r\n")) != NULL) {
617 24718 : if (s[0] == '\r' && s[1] != '\n') {
618 0 : TRC_CRITICAL(GDK, "invalid format for BBP.dir on line %d", *lineno);
619 0 : return -1;
620 : }
621 : /* zap the newline */
622 24718 : *s = '\0';
623 : } else {
624 0 : TRC_CRITICAL(GDK, "invalid format for BBP.dir on line %d: line too long\n", *lineno);
625 0 : return -1;
626 : }
627 :
628 49436 : if (bbpversion <= GDKLIBRARY_HSIZE ?
629 0 : sscanf(buf,
630 : "%" SCNu64 " %*u %128s %*s %u %" SCNu64 " %*u %" SCNu64
631 : "%n",
632 : &batid, batname,
633 : &properties, &count, &base,
634 : &nread) < 5 :
635 : bbpversion <= GDKLIBRARY_STATUS ?
636 2534 : sscanf(buf,
637 : "%" SCNu64 " %*u %128s %*s %u %" SCNu64 " %" SCNu64
638 : "%n",
639 : &batid, batname,
640 : &properties, &count, &base,
641 : &nread) < 5 :
642 22184 : sscanf(buf,
643 : "%" SCNu64 " %128s %u %" SCNu64 " %" SCNu64
644 : "%n",
645 : &batid, batname,
646 : &properties, &count, &base,
647 : &nread) < 5) {
648 0 : TRC_CRITICAL(GDK, "invalid format for BBP.dir on line %d", *lineno);
649 0 : return -1;
650 : }
651 :
652 24718 : if (batid >= N_BBPINIT * BBPINIT) {
653 0 : TRC_CRITICAL(GDK, "bat ID (%" PRIu64 ") too large to accommodate (max %d), on line %d.", batid, N_BBPINIT * BBPINIT - 1, *lineno);
654 0 : return -1;
655 : }
656 :
657 24718 : BBPgetfilename(filename, sizeof(BBP_physical(0)), (bat) batid);
658 :
659 24718 : bn->batCacheid = (bat) batid;
660 24718 : bn->batTransient = false;
661 24718 : bn->batCopiedtodisk = true;
662 24718 : switch ((properties & 0x06) >> 1) {
663 524 : case 0:
664 524 : bn->batRestricted = BAT_WRITE;
665 524 : break;
666 24194 : case 1:
667 24194 : bn->batRestricted = BAT_READ;
668 24194 : break;
669 0 : case 2:
670 0 : bn->batRestricted = BAT_APPEND;
671 0 : break;
672 0 : default:
673 0 : TRC_CRITICAL(GDK, "incorrect batRestricted value");
674 0 : return -1;
675 : }
676 24718 : bn->batCount = (BUN) count;
677 24718 : bn->batInserted = bn->batCount;
678 : /* set capacity to at least count */
679 24718 : bn->batCapacity = (BUN) count <= BATTINY ? BATTINY : (BUN) count;
680 :
681 24718 : if (base > (uint64_t) GDK_oid_max) {
682 0 : TRC_CRITICAL(GDK, "head seqbase out of range (ID = %" PRIu64 ", seq = %" PRIu64 ") on line %d.", batid, base, *lineno);
683 0 : return -1;
684 : }
685 24718 : bn->hseqbase = (oid) base;
686 24718 : n = heapinit(bn, buf + nread,
687 : #ifdef GDKLIBRARY_HASHASH
688 : hashash,
689 : #endif
690 : bbpversion, filename, *lineno);
691 24718 : if (n < 0) {
692 : return -1;
693 : }
694 24718 : nread += n;
695 :
696 24718 : if (nread >= (int) sizeof(buf) || (buf[nread] != '\0' && buf[nread] != ' ')) {
697 0 : TRC_CRITICAL(GDK, "invalid format for BBP.dir on line %d", *lineno);
698 0 : return -1;
699 : }
700 24718 : if (options) {
701 24718 : if (return_options && buf[nread] == ' ') {
702 0 : if ((*options = GDKstrdup(buf + nread + 1)) == NULL) {
703 0 : TRC_CRITICAL(GDK, "GDKstrdup failed\n");
704 0 : return -1;
705 : }
706 : } else {
707 24718 : *options = NULL;
708 : }
709 : }
710 : return 1;
711 : }
712 :
713 : static gdk_return
714 314 : BBPreadEntries(FILE *fp, unsigned bbpversion, int lineno
715 : #ifdef GDKLIBRARY_HASHASH
716 : , bat **hashbats, bat *nhashbats
717 : #endif
718 : )
719 : {
720 : #ifdef GDKLIBRARY_HASHASH
721 314 : bat *hbats = NULL;
722 314 : bat nhbats = 0;
723 : #endif
724 :
725 : /* read the BBP.dir and insert the BATs into the BBP */
726 314 : return_options = true;
727 314 : MT_lock_set(&BBPnameLock);
728 23453 : for (;;) {
729 23767 : BAT b;
730 23767 : Heap h;
731 23767 : Heap vh;
732 23767 : vh = h = (Heap) {
733 : .free = 0,
734 : };
735 23767 : b = (BAT) {
736 : .theap = &h,
737 : .tvheap = &vh,
738 : };
739 23767 : char *options;
740 23767 : char headname[129];
741 23767 : char filename[sizeof(BBP_physical(0))];
742 23767 : char logical[1024];
743 : #ifdef GDKLIBRARY_HASHASH
744 23767 : int Thashash;
745 : #endif
746 :
747 23767 : switch (BBPreadBBPline(fp, bbpversion, &lineno, &b,
748 : #ifdef GDKLIBRARY_HASHASH
749 : &Thashash,
750 : #endif
751 : headname, filename, &options)) {
752 314 : case 0:
753 : /* end of file */
754 : #ifdef GDKLIBRARY_HASHASH
755 314 : *hashbats = hbats;
756 314 : *nhashbats = nhbats;
757 : #endif
758 314 : return_options = false;
759 314 : MT_lock_unset(&BBPnameLock);
760 314 : return GDK_SUCCEED;
761 : case 1:
762 : /* successfully read an entry */
763 23453 : break;
764 0 : default:
765 : /* error */
766 0 : goto bailout;
767 : }
768 :
769 23453 : if (b.batCacheid >= N_BBPINIT * BBPINIT) {
770 0 : GDKfree(options);
771 0 : TRC_CRITICAL(GDK, "bat ID (%d) too large to accommodate (max %d), on line %d.", b.batCacheid, N_BBPINIT * BBPINIT - 1, lineno);
772 0 : goto bailout;
773 : }
774 :
775 23453 : if (b.batCacheid >= (bat) ATOMIC_GET(&BBPsize)) {
776 0 : if ((bat) ATOMIC_GET(&BBPsize) + 1 >= BBPlimit &&
777 0 : BBPextend(b.batCacheid + 1) != GDK_SUCCEED) {
778 0 : GDKfree(options);
779 0 : goto bailout;
780 : }
781 0 : ATOMIC_SET(&BBPsize, b.batCacheid + 1);
782 : }
783 23453 : BAT *bn = BBP_desc(b.batCacheid);
784 23453 : if (bn->batCacheid != 0) {
785 0 : GDKfree(options);
786 0 : TRC_CRITICAL(GDK, "duplicate entry in BBP.dir (ID = "
787 : "%d) on line %d.", b.batCacheid, lineno);
788 0 : goto bailout;
789 : }
790 :
791 : #ifdef GDKLIBRARY_HASHASH
792 23453 : if (Thashash) {
793 0 : assert(bbpversion <= GDKLIBRARY_HASHASH);
794 0 : bat *sb = GDKrealloc(hbats, ++nhbats * sizeof(bat));
795 0 : if (sb == NULL) {
796 0 : GDKfree(options);
797 0 : goto bailout;
798 : }
799 0 : hbats = sb;
800 0 : hbats[nhbats - 1] = b.batCacheid;
801 : }
802 : #endif
803 :
804 23453 : Heap *hn;
805 23453 : if ((hn = GDKmalloc(sizeof(Heap))) == NULL) {
806 0 : GDKfree(options);
807 0 : TRC_CRITICAL(GDK, "cannot allocate memory for BAT.");
808 0 : goto bailout;
809 : }
810 23453 : *bn = b;
811 23453 : *hn = h;
812 23453 : bn->theap = hn;
813 23453 : if (b.tvheap) {
814 6222 : Heap *vhn;
815 6222 : assert(b.tvheap == &vh);
816 6222 : if ((vhn = GDKmalloc(sizeof(Heap))) == NULL) {
817 0 : GDKfree(hn);
818 0 : GDKfree(options);
819 0 : TRC_CRITICAL(GDK, "cannot allocate memory for BAT.");
820 0 : goto bailout;
821 : }
822 6222 : *vhn = vh;
823 6222 : bn->tvheap = vhn;
824 6222 : ATOMIC_INIT(&bn->tvheap->refs, 1);
825 : }
826 :
827 23453 : char name[MT_NAME_LEN];
828 23453 : snprintf(name, sizeof(name), "heaplock%d", bn->batCacheid); /* fits */
829 23453 : MT_lock_init(&bn->theaplock, name);
830 23453 : snprintf(name, sizeof(name), "BATlock%d", bn->batCacheid); /* fits */
831 23453 : MT_lock_init(&bn->batIdxLock, name);
832 23453 : snprintf(name, sizeof(name), "hashlock%d", bn->batCacheid); /* fits */
833 23453 : MT_rwlock_init(&bn->thashlock, name);
834 23453 : ATOMIC_INIT(&bn->theap->refs, 1);
835 :
836 23453 : if (snprintf(BBP_bak(b.batCacheid), sizeof(BBP_bak(b.batCacheid)), "tmp_%o", (unsigned) b.batCacheid) >= (int) sizeof(BBP_bak(b.batCacheid))) {
837 0 : BATdestroy(bn);
838 0 : GDKfree(options);
839 0 : TRC_CRITICAL(GDK, "BBP logical filename directory is too large, on line %d\n", lineno);
840 0 : goto bailout;
841 : }
842 23453 : char *s;
843 23453 : if ((s = strchr(headname, '~')) != NULL && s == headname) {
844 : /* sizeof(logical) > sizeof(BBP_bak(b.batCacheid)), so
845 : * this fits */
846 0 : strcpy(logical, BBP_bak(b.batCacheid));
847 : } else {
848 0 : if (s)
849 0 : *s = 0;
850 23453 : strcpy_len(logical, headname, sizeof(logical));
851 : }
852 23453 : if (strcmp(logical, BBP_bak(b.batCacheid)) == 0) {
853 22887 : BBP_logical(b.batCacheid) = BBP_bak(b.batCacheid);
854 : } else {
855 566 : BBP_logical(b.batCacheid) = GDKstrdup(logical);
856 566 : if (BBP_logical(b.batCacheid) == NULL) {
857 0 : BATdestroy(bn);
858 0 : GDKfree(options);
859 0 : TRC_CRITICAL(GDK, "GDKstrdup failed\n");
860 0 : goto bailout;
861 : }
862 : }
863 23453 : strcpy_len(BBP_physical(b.batCacheid), filename, sizeof(BBP_physical(b.batCacheid)));
864 : #ifdef __COVERITY__
865 : /* help coverity */
866 : BBP_physical(b.batCacheid)[sizeof(BBP_physical(b.batCacheid)) - 1] = 0;
867 : #endif
868 23453 : BBP_options(b.batCacheid) = options;
869 23453 : BBP_refs(b.batCacheid) = 0;
870 23453 : BBP_lrefs(b.batCacheid) = 1; /* any BAT we encounter here is persistent, so has a logical reference */
871 23453 : BBP_pid(b.batCacheid) = 0;
872 23453 : BBP_status_set(b.batCacheid, BBPEXISTING);
873 23453 : if (BBPnamecheck(BBP_logical(b.batCacheid)) == 0)
874 566 : BBP_insert(b.batCacheid);
875 : }
876 :
877 0 : bailout:
878 0 : MT_lock_unset(&BBPnameLock);
879 0 : return_options = false;
880 : #ifdef GDKLIBRARY_HASHASH
881 0 : GDKfree(hbats);
882 : #endif
883 0 : return GDK_FAIL;
884 : }
885 :
886 : /* check that the necessary files for all BATs exist and are large
887 : * enough */
888 : static gdk_return
889 315 : BBPcheckbats(unsigned bbpversion)
890 : {
891 315 : (void) bbpversion;
892 51299 : for (bat bid = 1, size = (bat) ATOMIC_GET(&BBPsize); bid < size; bid++) {
893 50984 : struct stat statb;
894 50984 : BAT *b;
895 50984 : char *path;
896 :
897 50984 : b = BBP_desc(bid);
898 50984 : if (b->batCacheid == 0 || b->ttype == TYPE_void) {
899 : /* no files needed */
900 27531 : continue;
901 : }
902 23453 : if (b->theap->free > 0) {
903 15463 : path = GDKfilepath(0, BATDIR, b->theap->filename, NULL);
904 15463 : if (path == NULL)
905 0 : return GDK_FAIL;
906 : /* first check string offset heap with width,
907 : * then without */
908 15463 : if (MT_stat(path, &statb) < 0) {
909 0 : GDKsyserror("cannot stat file %s (expected size %zu)\n",
910 : path, b->theap->free);
911 0 : GDKfree(path);
912 0 : return GDK_FAIL;
913 : }
914 15463 : if ((size_t) statb.st_size < b->theap->free) {
915 0 : GDKerror("file %s too small (expected %zu, actual %zu)\n", path, b->theap->free, (size_t) statb.st_size);
916 0 : GDKfree(path);
917 0 : return GDK_FAIL;
918 : }
919 15463 : size_t hfree = b->theap->free;
920 15463 : hfree = (hfree + GDK_mmap_pagesize - 1) & ~(GDK_mmap_pagesize - 1);
921 15463 : if (hfree == 0)
922 0 : hfree = GDK_mmap_pagesize;
923 15463 : if (statb.st_size > (off_t) hfree) {
924 9 : int fd;
925 9 : if ((fd = MT_open(path, O_RDWR | O_CLOEXEC | O_BINARY)) >= 0) {
926 9 : if (ftruncate(fd, hfree) == -1)
927 0 : perror("ftruncate");
928 9 : (void) close(fd);
929 : }
930 : }
931 15463 : GDKfree(path);
932 : }
933 23453 : if (b->tvheap != NULL && b->tvheap->free > 0) {
934 4475 : path = GDKfilepath(0, BATDIR, BBP_physical(b->batCacheid), "theap");
935 4475 : if (path == NULL)
936 : return GDK_FAIL;
937 4475 : if (MT_stat(path, &statb) < 0) {
938 0 : GDKsyserror("cannot stat file %s\n",
939 : path);
940 0 : GDKfree(path);
941 0 : return GDK_FAIL;
942 : }
943 4475 : if ((size_t) statb.st_size < b->tvheap->free) {
944 0 : GDKerror("file %s too small (expected %zu, actual %zu)\n", path, b->tvheap->free, (size_t) statb.st_size);
945 0 : GDKfree(path);
946 0 : return GDK_FAIL;
947 : }
948 4475 : size_t hfree = b->tvheap->free;
949 4475 : hfree = (hfree + GDK_mmap_pagesize - 1) & ~(GDK_mmap_pagesize - 1);
950 4475 : if (hfree == 0)
951 0 : hfree = GDK_mmap_pagesize;
952 4475 : if (statb.st_size > (off_t) hfree) {
953 0 : int fd;
954 0 : if ((fd = MT_open(path, O_RDWR | O_CLOEXEC | O_BINARY)) >= 0) {
955 0 : if (ftruncate(fd, hfree) == -1)
956 0 : perror("ftruncate");
957 0 : (void) close(fd);
958 : }
959 : }
960 4475 : GDKfree(path);
961 : }
962 : }
963 : return GDK_SUCCEED;
964 : }
965 :
966 : #ifdef HAVE_HGE
967 : #define SIZEOF_MAX_INT SIZEOF_HGE
968 : #else
969 : #define SIZEOF_MAX_INT SIZEOF_LNG
970 : #endif
971 :
972 : unsigned
973 319 : BBPheader(FILE *fp, int *lineno, bat *bbpsize, lng *logno, bool allow_hge_upgrade)
974 : {
975 319 : char buf[BUFSIZ];
976 319 : int sz, ptrsize, oidsize, intsize;
977 319 : unsigned bbpversion;
978 :
979 319 : if (fgets(buf, sizeof(buf), fp) == NULL) {
980 0 : TRC_CRITICAL(GDK, "BBP.dir is empty");
981 0 : return 0;
982 : }
983 319 : ++*lineno;
984 319 : if (sscanf(buf, "BBP.dir, GDKversion %u\n", &bbpversion) != 1) {
985 0 : GDKerror("old BBP without version number; "
986 : "dump the database using a compatible version, "
987 : "then restore into new database using this version.\n");
988 0 : return 0;
989 : }
990 319 : if (bbpversion != GDKLIBRARY &&
991 : bbpversion != GDKLIBRARY_STATUS &&
992 : bbpversion != GDKLIBRARY_JSON &&
993 319 : bbpversion != GDKLIBRARY_HSIZE &&
994 : bbpversion != GDKLIBRARY_HASHASH) {
995 0 : TRC_CRITICAL(GDK, "incompatible BBP version: expected 0%o, got 0%o. "
996 : "This database was probably created by a %s version of MonetDB.",
997 : GDKLIBRARY, bbpversion,
998 : bbpversion > GDKLIBRARY ? "newer" : "too old");
999 0 : return 0;
1000 : }
1001 319 : if (fgets(buf, sizeof(buf), fp) == NULL) {
1002 0 : TRC_CRITICAL(GDK, "short BBP");
1003 0 : return 0;
1004 : }
1005 319 : ++*lineno;
1006 319 : if (sscanf(buf, "%d %d %d", &ptrsize, &oidsize, &intsize) != 3) {
1007 0 : TRC_CRITICAL(GDK, "BBP.dir has incompatible format: pointer, OID, and max. integer sizes are missing on line %d", *lineno);
1008 0 : return 0;
1009 : }
1010 319 : if (ptrsize != SIZEOF_SIZE_T || oidsize != SIZEOF_OID) {
1011 0 : TRC_CRITICAL(GDK, "database created with incompatible server: "
1012 : "expected pointer size %d, got %d, expected OID size %d, got %d.",
1013 : SIZEOF_SIZE_T, ptrsize, SIZEOF_OID, oidsize);
1014 0 : return 0;
1015 : }
1016 319 : if (intsize > SIZEOF_MAX_INT) {
1017 0 : TRC_CRITICAL(GDK, "database created with incompatible server: "
1018 : "expected max. integer size %d, got %d.",
1019 : SIZEOF_MAX_INT, intsize);
1020 0 : return 0;
1021 : }
1022 319 : if (intsize < SIZEOF_MAX_INT && !allow_hge_upgrade) {
1023 0 : TRC_CRITICAL(GDK, "database created with incompatible server: "
1024 : "expected max. integer size %d, got %d; "
1025 : "use --set allow_hge_upgrade=yes to upgrade.",
1026 : SIZEOF_MAX_INT, intsize);
1027 0 : return 0;
1028 : }
1029 319 : if (fgets(buf, sizeof(buf), fp) == NULL) {
1030 0 : TRC_CRITICAL(GDK, "short BBP");
1031 0 : return 0;
1032 : }
1033 319 : ++*lineno;
1034 319 : if (sscanf(buf, "BBPsize=%d", &sz) != 1) {
1035 0 : TRC_CRITICAL(GDK, "no BBPsize value found\n");
1036 0 : return 0;
1037 : }
1038 319 : if (sz > *bbpsize)
1039 94 : *bbpsize = sz;
1040 319 : if (fgets(buf, sizeof(buf), fp) == NULL) {
1041 0 : TRC_CRITICAL(GDK, "short BBP");
1042 0 : return 0;
1043 : }
1044 638 : if (bbpversion <= GDKLIBRARY_STATUS ?
1045 8 : sscanf(buf, "BBPinfo=" LLSCN " %*d", logno) != 1 :
1046 311 : sscanf(buf, "BBPinfo=" LLSCN, logno) != 1) {
1047 0 : TRC_CRITICAL(GDK, "no info value found\n");
1048 0 : return 0;
1049 : }
1050 319 : return bbpversion;
1051 : }
1052 :
1053 : bool
1054 74216071 : GDKinmemory(int farmid)
1055 : {
1056 74216071 : if (farmid == NOFARM)
1057 : farmid = 0;
1058 72959081 : assert(farmid >= 0 && farmid < MAXFARMS);
1059 74216071 : return BBPfarms[farmid].dirname == NULL;
1060 : }
1061 :
1062 : /* all errors are fatal */
1063 : gdk_return
1064 939 : BBPaddfarm(const char *dirname, uint32_t rolemask, bool logerror)
1065 : {
1066 939 : struct stat st;
1067 939 : int i;
1068 :
1069 939 : if (dirname == NULL) {
1070 1 : assert(BBPfarms[0].dirname == NULL);
1071 1 : assert(rolemask & 1);
1072 1 : assert(BBPfarms[0].roles == 0);
1073 1 : BBPfarms[0].roles = rolemask;
1074 1 : return GDK_SUCCEED;
1075 : }
1076 938 : if (strchr(dirname, '\n') != NULL) {
1077 0 : if (logerror)
1078 0 : GDKerror("no newline allowed in directory name\n");
1079 0 : return GDK_FAIL;
1080 : }
1081 938 : if (rolemask == 0 || (rolemask & 1 && BBPfarms[0].roles != 0)) {
1082 0 : if (logerror)
1083 0 : GDKerror("bad rolemask\n");
1084 0 : return GDK_FAIL;
1085 : }
1086 938 : if (strcmp(dirname, "in-memory") == 0 ||
1087 937 : /* backward compatibility: */ strcmp(dirname, ":memory:") == 0) {
1088 : dirname = NULL;
1089 937 : } else if (MT_mkdir(dirname) < 0) {
1090 849 : if (errno == EEXIST) {
1091 849 : if (MT_stat(dirname, &st) == -1 || !S_ISDIR(st.st_mode)) {
1092 0 : if (logerror)
1093 0 : GDKerror("%s: not a directory\n", dirname);
1094 0 : return GDK_FAIL;
1095 : }
1096 : } else {
1097 0 : if (logerror)
1098 0 : GDKsyserror("%s: cannot create directory\n", dirname);
1099 0 : return GDK_FAIL;
1100 : }
1101 : }
1102 1865 : for (i = 0; i < MAXFARMS; i++) {
1103 1865 : if (BBPfarms[i].roles == 0) {
1104 938 : if (dirname) {
1105 937 : BBPfarms[i].dirname = GDKstrdup(dirname);
1106 937 : if (BBPfarms[i].dirname == NULL)
1107 : return GDK_FAIL;
1108 : }
1109 938 : BBPfarms[i].roles = rolemask;
1110 938 : if ((rolemask & 1) == 0 && dirname != NULL) {
1111 : char *bbpdir;
1112 : int j;
1113 :
1114 919 : for (j = 0; j < i; j++)
1115 770 : if (BBPfarms[j].dirname != NULL &&
1116 770 : strcmp(BBPfarms[i].dirname,
1117 : BBPfarms[j].dirname) == 0)
1118 : return GDK_SUCCEED;
1119 : /* if an extra farm, make sure we
1120 : * don't find a BBP.dir there that
1121 : * might belong to an existing
1122 : * database */
1123 149 : bbpdir = GDKfilepath(i, BATDIR, "BBP", "dir");
1124 149 : if (bbpdir == NULL) {
1125 : return GDK_FAIL;
1126 : }
1127 149 : if (MT_stat(bbpdir, &st) != -1 || errno != ENOENT) {
1128 0 : GDKfree(bbpdir);
1129 0 : if (logerror)
1130 0 : GDKerror("%s is a database\n", dirname);
1131 0 : return GDK_FAIL;
1132 : }
1133 149 : GDKfree(bbpdir);
1134 149 : bbpdir = GDKfilepath(i, BAKDIR, "BBP", "dir");
1135 149 : if (bbpdir == NULL) {
1136 : return GDK_FAIL;
1137 : }
1138 149 : if (MT_stat(bbpdir, &st) != -1 || errno != ENOENT) {
1139 0 : GDKfree(bbpdir);
1140 0 : if (logerror)
1141 0 : GDKerror("%s is a database\n", dirname);
1142 0 : return GDK_FAIL;
1143 : }
1144 149 : GDKfree(bbpdir);
1145 : }
1146 466 : return GDK_SUCCEED;
1147 : }
1148 : }
1149 0 : if (logerror)
1150 0 : GDKerror("too many farms\n");
1151 : return GDK_FAIL;
1152 : }
1153 :
1154 : gdk_return
1155 317 : BBPchkfarms(void)
1156 : {
1157 317 : const char *dir = NULL;
1158 317 : uint32_t rolemask = 0;
1159 317 : if ((BBPfarms[0].roles & 1) == 0) {
1160 0 : GDKerror("Must call BBPaddfarms at least once for persistent data\n");
1161 0 : return GDK_FAIL;
1162 : }
1163 10461 : for (int i = 0; i < MAXFARMS; i++) {
1164 10144 : if (BBPfarms[i].roles != 0) {
1165 622 : dir = BBPfarms[i].dirname;
1166 622 : rolemask |= BBPfarms[i].roles;
1167 : }
1168 : }
1169 317 : if (dir == NULL)
1170 1 : dir = "in-memory";
1171 317 : if ((rolemask & (1U << TRANSIENT)) == 0) {
1172 0 : gdk_return rc = BBPaddfarm(dir, 1U << TRANSIENT, true);
1173 0 : if (rc != GDK_SUCCEED)
1174 : return rc;
1175 : }
1176 317 : if ((rolemask & (1U << SYSTRANS)) == 0) {
1177 317 : gdk_return rc = BBPaddfarm(dir, 1U << SYSTRANS, true);
1178 317 : if (rc != GDK_SUCCEED)
1179 : return rc;
1180 : }
1181 : return GDK_SUCCEED;
1182 : }
1183 :
1184 : #ifdef GDKLIBRARY_HASHASH
1185 : static gdk_return
1186 0 : fixhashashbat(BAT *b)
1187 : {
1188 0 : const char *nme = BBP_physical(b->batCacheid);
1189 0 : char *srcdir = GDKfilepath(NOFARM, BATDIR, nme, NULL);
1190 0 : if (srcdir == NULL) {
1191 0 : TRC_CRITICAL(GDK, "GDKfilepath failed\n");
1192 0 : return GDK_FAIL;
1193 : }
1194 0 : char *s;
1195 0 : if ((s = strrchr(srcdir, DIR_SEP)) != NULL)
1196 0 : *s = 0;
1197 0 : const char *bnme;
1198 0 : if ((bnme = strrchr(nme, DIR_SEP)) != NULL)
1199 0 : bnme++;
1200 : else
1201 : bnme = nme;
1202 0 : long_str filename;
1203 0 : snprintf(filename, sizeof(filename), "BACKUP%c%s", DIR_SEP, bnme);
1204 :
1205 : /* we don't maintain index structures */
1206 0 : HASHdestroy(b);
1207 0 : OIDXdestroy(b);
1208 0 : PROPdestroy(b);
1209 0 : STRMPdestroy(b);
1210 0 : RTREEdestroy(b);
1211 :
1212 : /* make backup of heaps */
1213 0 : const char *t;
1214 0 : if (GDKmove(b->theap->farmid, srcdir, bnme, "tail1",
1215 : BAKDIR, bnme, "tail1", false) == GDK_SUCCEED)
1216 : t = "tail1";
1217 0 : else if (GDKmove(b->theap->farmid, srcdir, bnme, "tail2",
1218 : BAKDIR, bnme, "tail2", false) == GDK_SUCCEED)
1219 : t = "tail2";
1220 : #if SIZEOF_VAR_T == 8
1221 0 : else if (GDKmove(b->theap->farmid, srcdir, bnme, "tail4",
1222 : BAKDIR, bnme, "tail4", false) == GDK_SUCCEED)
1223 : t = "tail4";
1224 : #endif
1225 0 : else if (GDKmove(b->theap->farmid, srcdir, bnme, "tail",
1226 : BAKDIR, bnme, "tail", true) == GDK_SUCCEED)
1227 : t = "tail";
1228 : else {
1229 0 : GDKfree(srcdir);
1230 0 : TRC_CRITICAL(GDK, "cannot make backup of %s.tail\n", nme);
1231 0 : return GDK_FAIL;
1232 : }
1233 0 : GDKclrerr();
1234 0 : if (GDKmove(b->theap->farmid, srcdir, bnme, "theap",
1235 : BAKDIR, bnme, "theap", true) != GDK_SUCCEED) {
1236 0 : GDKfree(srcdir);
1237 0 : TRC_CRITICAL(GDK, "cannot make backup of %s.theap\n", nme);
1238 0 : return GDK_FAIL;
1239 : }
1240 : /* load old heaps */
1241 0 : Heap h1 = *b->theap; /* old heap */
1242 0 : h1.base = NULL;
1243 0 : h1.dirty = false;
1244 0 : strconcat_len(h1.filename, sizeof(h1.filename), filename, ".", t, NULL);
1245 0 : if (HEAPload(&h1, filename, t, false) != GDK_SUCCEED) {
1246 0 : GDKfree(srcdir);
1247 0 : TRC_CRITICAL(GDK, "loading old tail heap "
1248 : "for BAT %d failed\n", b->batCacheid);
1249 0 : return GDK_FAIL;
1250 : }
1251 0 : Heap vh1 = *b->tvheap; /* old heap */
1252 0 : vh1.base = NULL;
1253 0 : vh1.dirty = false;
1254 0 : strconcat_len(vh1.filename, sizeof(vh1.filename), filename, ".theap", NULL);
1255 0 : if (HEAPload(&vh1, filename, "theap", false) != GDK_SUCCEED) {
1256 0 : GDKfree(srcdir);
1257 0 : HEAPfree(&h1, false);
1258 0 : TRC_CRITICAL(GDK, "loading old string heap "
1259 : "for BAT %d failed\n", b->batCacheid);
1260 0 : return GDK_FAIL;
1261 : }
1262 :
1263 : /* create new heaps */
1264 0 : Heap *h2 = GDKmalloc(sizeof(Heap));
1265 0 : Heap *vh2 = GDKmalloc(sizeof(Heap));
1266 0 : if (h2 == NULL || vh2 == NULL) {
1267 0 : GDKfree(h2);
1268 0 : GDKfree(vh2);
1269 0 : GDKfree(srcdir);
1270 0 : HEAPfree(&h1, false);
1271 0 : HEAPfree(&vh1, false);
1272 0 : TRC_CRITICAL(GDK, "allocating new heaps "
1273 : "for BAT %d failed\n", b->batCacheid);
1274 0 : return GDK_FAIL;
1275 : }
1276 0 : *h2 = *b->theap;
1277 0 : h2->base = NULL;
1278 0 : if (HEAPalloc(h2, b->batCapacity, b->twidth) != GDK_SUCCEED) {
1279 0 : GDKfree(h2);
1280 0 : GDKfree(vh2);
1281 0 : GDKfree(srcdir);
1282 0 : HEAPfree(&h1, false);
1283 0 : HEAPfree(&vh1, false);
1284 0 : TRC_CRITICAL(GDK, "allocating new tail heap "
1285 : "for BAT %d failed\n", b->batCacheid);
1286 0 : return GDK_FAIL;
1287 : }
1288 0 : h2->dirty = true;
1289 0 : h2->free = h1.free;
1290 :
1291 0 : *vh2 = *b->tvheap;
1292 0 : strconcat_len(vh2->filename, sizeof(vh2->filename), nme, ".theap", NULL);
1293 0 : strHeap(vh2, b->batCapacity);
1294 0 : if (vh2->base == NULL) {
1295 0 : GDKfree(srcdir);
1296 0 : HEAPfree(&h1, false);
1297 0 : HEAPfree(&vh1, false);
1298 0 : HEAPfree(h2, false);
1299 0 : GDKfree(h2);
1300 0 : GDKfree(vh2);
1301 0 : TRC_CRITICAL(GDK, "allocating new string heap "
1302 : "for BAT %d failed\n", b->batCacheid);
1303 0 : return GDK_FAIL;
1304 : }
1305 0 : vh2->dirty = true;
1306 0 : ATOMIC_INIT(&h2->refs, 1);
1307 0 : ATOMIC_INIT(&vh2->refs, 1);
1308 0 : Heap *ovh = b->tvheap;
1309 0 : b->tvheap = vh2;
1310 0 : vh2 = NULL; /* no longer needed */
1311 0 : for (BUN i = 0; i < b->batCount; i++) {
1312 0 : var_t o;
1313 0 : switch (b->twidth) {
1314 0 : case 1:
1315 0 : o = (var_t) ((uint8_t *) h1.base)[i] + GDK_VAROFFSET;
1316 0 : break;
1317 0 : case 2:
1318 0 : o = (var_t) ((uint16_t *) h1.base)[i] + GDK_VAROFFSET;
1319 0 : break;
1320 : #if SIZEOF_VAR_T == 8
1321 0 : case 4:
1322 0 : o = (var_t) ((uint32_t *) h1.base)[i];
1323 0 : break;
1324 : #endif
1325 0 : default:
1326 0 : o = ((var_t *) h1.base)[i];
1327 0 : break;
1328 : }
1329 0 : const char *s = vh1.base + o;
1330 0 : var_t no = strPut(b, &o, s);
1331 0 : if (no == 0) {
1332 0 : HEAPfree(&h1, false);
1333 0 : HEAPfree(&vh1, false);
1334 0 : HEAPdecref(h2, false);
1335 0 : HEAPdecref(b->tvheap, false);
1336 0 : b->tvheap = ovh;
1337 0 : GDKfree(srcdir);
1338 0 : TRC_CRITICAL(GDK, "storing string value "
1339 : "for BAT %d failed\n", b->batCacheid);
1340 0 : return GDK_FAIL;
1341 : }
1342 0 : assert(no >= GDK_VAROFFSET);
1343 0 : switch (b->twidth) {
1344 0 : case 1:
1345 0 : no -= GDK_VAROFFSET;
1346 0 : assert(no <= 0xFF);
1347 0 : ((uint8_t *) h2->base)[i] = (uint8_t) no;
1348 0 : break;
1349 0 : case 2:
1350 0 : no -= GDK_VAROFFSET;
1351 0 : assert(no <= 0xFFFF);
1352 0 : ((uint16_t *) h2->base)[i] = (uint16_t) no;
1353 0 : break;
1354 : #if SIZEOF_VAR_T == 8
1355 0 : case 4:
1356 0 : assert(no <= 0xFFFFFFFF);
1357 0 : ((uint32_t *) h2->base)[i] = (uint32_t) no;
1358 0 : break;
1359 : #endif
1360 0 : default:
1361 0 : ((var_t *) h2->base)[i] = no;
1362 0 : break;
1363 : }
1364 : }
1365 :
1366 : /* cleanup */
1367 0 : HEAPfree(&h1, false);
1368 0 : HEAPfree(&vh1, false);
1369 0 : if (HEAPsave(h2, nme, BATtailname(b), true, h2->free, NULL) != GDK_SUCCEED) {
1370 0 : HEAPdecref(h2, false);
1371 0 : HEAPdecref(b->tvheap, false);
1372 0 : b->tvheap = ovh;
1373 0 : GDKfree(srcdir);
1374 0 : TRC_CRITICAL(GDK, "saving heap failed\n");
1375 0 : return GDK_FAIL;
1376 : }
1377 0 : if (HEAPsave(b->tvheap, nme, "theap", true, b->tvheap->free, &b->theaplock) != GDK_SUCCEED) {
1378 0 : HEAPfree(b->tvheap, false);
1379 0 : b->tvheap = ovh;
1380 0 : GDKfree(srcdir);
1381 0 : TRC_CRITICAL(GDK, "saving string heap failed\n");
1382 0 : return GDK_FAIL;
1383 : }
1384 0 : HEAPdecref(b->theap, false);
1385 0 : b->theap = h2;
1386 0 : HEAPfree(h2, false);
1387 0 : HEAPdecref(ovh, false);
1388 0 : HEAPfree(b->tvheap, false);
1389 0 : GDKfree(srcdir);
1390 0 : return GDK_SUCCEED;
1391 : }
1392 :
1393 : static gdk_return
1394 0 : fixhashash(bat *hashbats, bat nhashbats)
1395 : {
1396 0 : for (bat i = 0; i < nhashbats; i++) {
1397 0 : bat bid = hashbats[i];
1398 0 : BAT *b = BBP_desc(bid);
1399 0 : if (b->batCacheid == 0) {
1400 : /* not a valid BAT (shouldn't happen) */
1401 0 : continue;
1402 : }
1403 0 : if (fixhashashbat(b) != GDK_SUCCEED)
1404 : return GDK_FAIL;
1405 : }
1406 : return GDK_SUCCEED;
1407 : }
1408 : #endif
1409 :
1410 : #ifdef GDKLIBRARY_JSON
1411 : static gdk_return
1412 0 : jsonupgradebat(BAT *b, json_storage_conversion fixJSONStorage)
1413 : {
1414 0 : const char *nme = BBP_physical(b->batCacheid);
1415 0 : char *srcdir = GDKfilepath(NOFARM, BATDIR, nme, NULL);
1416 :
1417 0 : if (srcdir == NULL) {
1418 0 : TRC_CRITICAL(GDK, "GDKfilepath failed\n");
1419 0 : return GDK_FAIL;
1420 : }
1421 :
1422 0 : char *s;
1423 0 : if ((s = strrchr(srcdir, DIR_SEP)) != NULL)
1424 0 : *s = 0;
1425 0 : const char *bnme;
1426 0 : if ((bnme = strrchr(nme, DIR_SEP)) != NULL) {
1427 0 : bnme++;
1428 : } else {
1429 : bnme = nme;
1430 : }
1431 :
1432 0 : long_str filename;
1433 0 : snprintf(filename, sizeof(filename), "BACKUP%c%s", DIR_SEP, bnme);
1434 :
1435 : /* A json column should not normally have any index structures */
1436 0 : HASHdestroy(b);
1437 0 : OIDXdestroy(b);
1438 0 : PROPdestroy(b);
1439 0 : STRMPdestroy(b);
1440 0 : RTREEdestroy(b);
1441 :
1442 : /* backup the current heaps */
1443 0 : if (GDKmove(b->theap->farmid, srcdir, bnme, "tail",
1444 : BAKDIR, bnme, "tail", false) != GDK_SUCCEED) {
1445 0 : GDKfree(srcdir);
1446 0 : TRC_CRITICAL(GDK, "cannot make backup of %s.tail\n", nme);
1447 0 : return GDK_FAIL;
1448 : }
1449 0 : if (GDKmove(b->theap->farmid, srcdir, bnme, "theap",
1450 : BAKDIR, bnme, "theap", true) != GDK_SUCCEED) {
1451 0 : GDKfree(srcdir);
1452 0 : TRC_CRITICAL(GDK, "cannot make backup of %s.theap\n", nme);
1453 0 : return GDK_FAIL;
1454 : }
1455 :
1456 : /* load the old heaps */
1457 0 : Heap h1 = *b->theap;
1458 0 : h1.base = NULL;
1459 0 : h1.dirty = false;
1460 0 : strconcat_len(h1.filename, sizeof(h1.filename), filename, ".tail", NULL);
1461 0 : if (HEAPload(&h1, filename, "tail", false) != GDK_SUCCEED) {
1462 0 : GDKfree(srcdir);
1463 0 : TRC_CRITICAL(GDK, "loading old tail heap "
1464 : "for BAT %d failed\n", b->batCacheid);
1465 0 : return GDK_FAIL;
1466 : }
1467 :
1468 0 : Heap vh1 = *b->tvheap;
1469 0 : vh1.base = NULL;
1470 0 : vh1.dirty = false;
1471 0 : strconcat_len(vh1.filename, sizeof(vh1.filename), filename, ".theap", NULL);
1472 0 : if (HEAPload(&vh1, filename, "theap", false) != GDK_SUCCEED) {
1473 0 : GDKfree(srcdir);
1474 0 : HEAPfree(&h1, false);
1475 0 : TRC_CRITICAL(GDK, "loading old string heap "
1476 : "for BAT %d failed\n", b->batCacheid);
1477 0 : return GDK_FAIL;
1478 : }
1479 :
1480 : /* create the new heaps */
1481 0 : Heap *h2 = GDKmalloc(sizeof(Heap));
1482 0 : Heap *vh2 = GDKmalloc(sizeof(Heap));
1483 0 : if (h2 == NULL || vh2 == NULL) {
1484 0 : GDKfree(h2);
1485 0 : GDKfree(vh2);
1486 0 : GDKfree(srcdir);
1487 0 : HEAPfree(&h1, false);
1488 0 : HEAPfree(&vh1, false);
1489 0 : TRC_CRITICAL(GDK, "allocating new heaps "
1490 : "for BAT %d failed\n", b->batCacheid);
1491 0 : return GDK_FAIL;
1492 : }
1493 0 : *h2 = *b->theap;
1494 0 : h2->base = NULL;
1495 0 : if (HEAPalloc(h2, b->batCapacity, b->twidth) != GDK_SUCCEED) {
1496 0 : GDKfree(h2);
1497 0 : GDKfree(vh2);
1498 0 : GDKfree(srcdir);
1499 0 : HEAPfree(&h1, false);
1500 0 : HEAPfree(&vh1, false);
1501 0 : TRC_CRITICAL(GDK, "allocating new tail heap "
1502 : "for BAT %d failed\n", b->batCacheid);
1503 0 : return GDK_FAIL;
1504 :
1505 : }
1506 0 : h2->dirty = true;
1507 0 : h2->free = h1.free;
1508 :
1509 0 : *vh2 = *b->tvheap;
1510 0 : strconcat_len(vh2->filename, sizeof(vh2->filename), nme, ".theap", NULL);
1511 0 : strHeap(vh2, b->batCapacity);
1512 0 : if (vh2->base == NULL) {
1513 0 : GDKfree(srcdir);
1514 0 : HEAPfree(&h1, false);
1515 0 : HEAPfree(&vh1, false);
1516 0 : HEAPfree(h2, false);
1517 0 : GDKfree(h2);
1518 0 : GDKfree(vh2);
1519 0 : TRC_CRITICAL(GDK, "allocating new string heap "
1520 : "for BAT %d failed\n", b->batCacheid);
1521 0 : return GDK_FAIL;
1522 : }
1523 0 : vh2->dirty = true;
1524 0 : ATOMIC_INIT(&h2->refs, 1);
1525 0 : ATOMIC_INIT(&vh2->refs, 1);
1526 0 : Heap *ovh = b->tvheap;
1527 0 : b->tvheap = vh2;
1528 0 : vh2 = NULL;
1529 :
1530 0 : for (BUN i = 0; i < b->batCount; i++) {
1531 0 : var_t o = ((var_t *) h1.base)[i];
1532 0 : const char *s = vh1.base + o;
1533 0 : char *ns;
1534 0 : if (fixJSONStorage(&ns, &s) != GDK_SUCCEED) {
1535 0 : GDKfree(srcdir);
1536 0 : HEAPfree(&h1, false);
1537 0 : HEAPfree(&vh1, false);
1538 0 : HEAPdecref(h2, false);
1539 0 : HEAPdecref(b->tvheap, false);
1540 0 : b->tvheap = ovh;
1541 0 : TRC_CRITICAL(GDK, "converting value "
1542 : "in BAT %d failed\n", b->batCacheid);
1543 0 : return GDK_FAIL;
1544 : }
1545 0 : var_t no = strPut(b, &o, ns);
1546 0 : GDKfree(ns);
1547 0 : if (no == 0) {
1548 0 : GDKfree(srcdir);
1549 0 : HEAPfree(&h1, false);
1550 0 : HEAPfree(&vh1, false);
1551 0 : HEAPdecref(h2, false);
1552 0 : HEAPdecref(b->tvheap, false);
1553 0 : b->tvheap = ovh;
1554 0 : TRC_CRITICAL(GDK, "storing new value "
1555 : "in BAT %d failed\n", b->batCacheid);
1556 0 : return GDK_FAIL;
1557 :
1558 : }
1559 0 : ((var_t *)h2->base)[i] = no;
1560 : }
1561 :
1562 : /* cleanup */
1563 0 : HEAPfree(&h1, false);
1564 0 : HEAPfree(&vh1, false);
1565 0 : if (HEAPsave(h2, nme, BATtailname(b), true, h2->free, NULL) !=
1566 : GDK_SUCCEED) {
1567 0 : HEAPdecref(h2, false);
1568 0 : HEAPdecref(b->tvheap, false);
1569 0 : b->tvheap = ovh;
1570 0 : GDKfree(srcdir);
1571 0 : TRC_CRITICAL(GDK, "saving heap failed\n");
1572 0 : return GDK_FAIL;
1573 : }
1574 :
1575 0 : if (HEAPsave(b->tvheap, nme, "theap", true, b->tvheap->free,
1576 : &b->theaplock) != GDK_SUCCEED) {
1577 0 : HEAPfree(b->tvheap, false);
1578 0 : b->tvheap = ovh;
1579 0 : GDKfree(srcdir);
1580 0 : TRC_CRITICAL(GDK, "saving string failed\n");
1581 0 : return GDK_FAIL;
1582 : }
1583 :
1584 0 : HEAPdecref(b->theap, false);
1585 0 : b->theap = h2;
1586 0 : HEAPfree(h2, false);
1587 0 : HEAPdecref(ovh, false);
1588 0 : HEAPfree(b->tvheap, false);
1589 0 : GDKfree(srcdir);
1590 :
1591 0 : return GDK_SUCCEED;
1592 : }
1593 :
1594 : gdk_return
1595 0 : BBPjson_upgrade(json_storage_conversion fixJSONStorage)
1596 : {
1597 0 : bat bid;
1598 0 : int JSON_type = ATOMindex("json");
1599 0 : bat nbat = (bat) ATOMIC_GET(&BBPsize);
1600 0 : bat *upd = GDKmalloc(sizeof(bat) * (size_t) nbat);
1601 0 : int nupd = 0;
1602 :
1603 0 : if (upd == NULL) {
1604 0 : TRC_CRITICAL(GDK, "could not create bat\n");
1605 0 : return GDK_FAIL;
1606 : }
1607 0 : upd[nupd++] = 0; /* first entry unused */
1608 :
1609 0 : BBPlock();
1610 :
1611 0 : for (bid = 1; bid < nbat; bid++) {
1612 0 : BAT *b = BBP_desc(bid);
1613 0 : if (b->batCacheid == 0) {
1614 : /* not a valid BAT */
1615 0 : continue;
1616 : }
1617 :
1618 0 : if (b->ttype < 0) {
1619 0 : const char *nme;
1620 :
1621 0 : nme = ATOMunknown_name(b->ttype);
1622 0 : int tt = ATOMindex(nme);
1623 0 : if (tt >= 0)
1624 0 : b->ttype = tt;
1625 0 : if (strcmp(nme, "json") != 0)
1626 0 : continue;
1627 0 : } else if (b->ttype != JSON_type) {
1628 0 : continue;
1629 : }
1630 0 : fprintf(stderr, "Upgrading json bat %d\n", bid);
1631 0 : if (jsonupgradebat(b, fixJSONStorage) != GDK_SUCCEED) {
1632 0 : BBPunlock();
1633 0 : GDKfree(upd);
1634 0 : return GDK_FAIL;
1635 : }
1636 0 : upd[nupd++] = bid;
1637 : }
1638 0 : BBPunlock();
1639 0 : if (nupd > 1 &&
1640 0 : TMsubcommit_list(upd, NULL, nupd, -1) != GDK_SUCCEED) {
1641 0 : TRC_CRITICAL(GDK, "failed to commit changes\n");
1642 0 : GDKfree(upd);
1643 0 : return GDK_FAIL;
1644 : }
1645 0 : GDKfree(upd);
1646 0 : return GDK_SUCCEED;
1647 : }
1648 : #endif
1649 :
1650 : static bool
1651 100 : BBPtrim(bool aggressive, bat nbat)
1652 : {
1653 100 : int n = 0;
1654 100 : int waitctr = 0;
1655 100 : bool changed = false;
1656 100 : unsigned flag = BBPUNLOADING | BBPSYNCING | BBPSAVING;
1657 100 : if (!aggressive)
1658 100 : flag |= BBPHOT;
1659 100 : lng t0 = GDKusec();
1660 138840 : for (bat bid = 1; bid < nbat && !GDKexiting(); bid++) {
1661 : /* quick check to see if we might possibly have to do
1662 : * work (includes free bats) */
1663 138740 : if ((BBP_status(bid) & BBPLOADED) == 0)
1664 36668 : continue;
1665 : /* don't do this during a (sub)commit */
1666 102072 : BBPtmlock();
1667 102072 : MT_lock_set(&GDKswapLock(bid));
1668 102072 : BAT *b = NULL;
1669 102072 : bool swap = false;
1670 102072 : if ((BBP_status(bid) & (flag | BBPLOADED)) == BBPLOADED &&
1671 18836 : BBP_refs(bid) == 0 &&
1672 18836 : BBP_lrefs(bid) != 0 &&
1673 18836 : (b = BBP_desc(bid))->batCacheid != 0) {
1674 18836 : MT_lock_set(&b->theaplock);
1675 18836 : if (!BATshared(b) &&
1676 18782 : !isVIEW(b) &&
1677 18599 : (!BATdirty(b) ||
1678 0 : (aggressive &&
1679 0 : b->theap->storage == STORE_MMAP &&
1680 0 : (b->tvheap == NULL ||
1681 0 : b->tvheap->storage == STORE_MMAP)) ||
1682 15099 : (b->batRole == PERSISTENT &&
1683 14741 : BBP_lrefs(bid) <= 2))) {
1684 12182 : BBP_status_on(bid, BBPUNLOADING);
1685 12182 : swap = true;
1686 20864 : waitctr += BATdirty(b) ? 9 : 1;
1687 : }
1688 18836 : MT_lock_unset(&b->theaplock);
1689 : }
1690 102072 : MT_lock_unset(&GDKswapLock(bid));
1691 102072 : if (swap) {
1692 12182 : TRC_DEBUG(BAT_, "unload and free bat %d\n", bid);
1693 12182 : if (BBPfree(b) != GDK_SUCCEED)
1694 0 : GDKerror("unload failed for bat %d", bid);
1695 12182 : n++;
1696 12182 : changed = true;
1697 : }
1698 102072 : BBPtmunlock();
1699 : /* every once in a while, give others a chance */
1700 102072 : if (++waitctr >= 1000) {
1701 153 : waitctr = 0;
1702 153 : MT_sleep_ms(2);
1703 : }
1704 : }
1705 100 : if (n > 0)
1706 37 : TRC_INFO(BAT_, "unloaded %d bats in "LLFMT" usec%s\n", n, GDKusec() - t0, aggressive ? " (also hot)" : "");
1707 100 : return changed;
1708 : }
1709 :
1710 : static void
1711 314 : BBPmanager(void *dummy)
1712 : {
1713 314 : (void) dummy;
1714 314 : bool changed = true;
1715 :
1716 414 : for (;;) {
1717 414 : int n = 0;
1718 414 : bat nbat = (bat) ATOMIC_GET(&BBPsize);
1719 414 : MT_thread_setworking("clearing HOT bits");
1720 317028 : for (bat bid = 1; bid < nbat; bid++) {
1721 316614 : MT_lock_set(&GDKswapLock(bid));
1722 316614 : if (BBP_refs(bid) == 0 && BBP_lrefs(bid) != 0) {
1723 108965 : n += (BBP_status(bid) & BBPHOT) != 0;
1724 108965 : BBP_status_off(bid, BBPHOT);
1725 : }
1726 316614 : MT_lock_unset(&GDKswapLock(bid));
1727 : }
1728 414 : TRC_DEBUG(BAT_, "cleared HOT bit from %d bats\n", n);
1729 414 : size_t cur = GDKvm_cursize();
1730 414 : MT_thread_setworking("sleeping");
1731 18282 : for (int i = 0, n = changed && cur > GDK_vm_maxsize / 2 ? 1 : cur > GDK_vm_maxsize / 4 ? 10 : 100; i < n; i++) {
1732 17768 : MT_sleep_ms(100);
1733 17750 : if (GDKexiting())
1734 : return;
1735 : }
1736 100 : MT_thread_setworking("BBPtrim");
1737 100 : changed = BBPtrim(false, nbat);
1738 100 : MT_thread_setworking("BBPcallbacks");
1739 100 : BBPcallbacks();
1740 100 : if (GDKexiting())
1741 : return;
1742 : }
1743 : }
1744 :
1745 : static MT_Id manager;
1746 :
1747 : gdk_return
1748 315 : BBPinit(bool allow_hge_upgrade, bool no_manager)
1749 : {
1750 315 : FILE *fp = NULL;
1751 315 : struct stat st;
1752 315 : unsigned bbpversion = 0;
1753 315 : int i;
1754 315 : int lineno = 0;
1755 : #ifdef GDKLIBRARY_HASHASH
1756 315 : bat *hashbats = NULL;
1757 315 : bat nhashbats = 0;
1758 315 : gdk_return res = GDK_SUCCEED;
1759 : #endif
1760 315 : ATOMIC_BASE_TYPE dbg = ATOMIC_GET(&GDKdebug);
1761 :
1762 315 : ATOMIC_AND(&GDKdebug, ~TAILCHKMASK);
1763 :
1764 : /* the maximum number of BATs allowed in the system and the
1765 : * size of the "physical" array are linked in a complicated
1766 : * manner. The expression below shows the relationship */
1767 315 : static_assert((uint64_t) N_BBPINIT * BBPINIT < (UINT64_C(1) << (3 * ((sizeof(BBP[0][0].physical) + 2) * 2 / 5))), "\"physical\" array in BBPrec is too small");
1768 : /* similarly, the maximum number of BATs allowed also has a
1769 : * (somewhat simpler) relation with the size of the "bak"
1770 : * array */
1771 315 : static_assert((uint64_t) N_BBPINIT * BBPINIT < (UINT64_C(1) << (3 * (sizeof(BBP[0][0].bak) - 5))), "\"bak\" array in BBPrec is too small");
1772 :
1773 315 : if (!GDKinmemory(0)) {
1774 314 : str bbpdirstr, backupbbpdirstr;
1775 :
1776 314 : BBPtmlock();
1777 :
1778 314 : if ((bbpdirstr = GDKfilepath(0, BATDIR, "BBP", "dir")) == NULL) {
1779 0 : TRC_CRITICAL(GDK, "GDKmalloc failed\n");
1780 0 : BBPtmunlock();
1781 0 : ATOMIC_SET(&GDKdebug, dbg);
1782 0 : return GDK_FAIL;
1783 : }
1784 :
1785 314 : if ((backupbbpdirstr = GDKfilepath(0, BAKDIR, "BBP", "dir")) == NULL) {
1786 0 : GDKfree(bbpdirstr);
1787 0 : TRC_CRITICAL(GDK, "GDKmalloc failed\n");
1788 0 : BBPtmunlock();
1789 0 : ATOMIC_SET(&GDKdebug, dbg);
1790 0 : return GDK_FAIL;
1791 : }
1792 :
1793 314 : if (GDKremovedir(0, TEMPDIR) != GDK_SUCCEED) {
1794 0 : GDKfree(bbpdirstr);
1795 0 : GDKfree(backupbbpdirstr);
1796 0 : TRC_CRITICAL(GDK, "cannot remove directory %s\n", TEMPDIR);
1797 0 : BBPtmunlock();
1798 0 : ATOMIC_SET(&GDKdebug, dbg);
1799 0 : return GDK_FAIL;
1800 : }
1801 :
1802 314 : if (GDKremovedir(0, DELDIR) != GDK_SUCCEED) {
1803 0 : GDKfree(bbpdirstr);
1804 0 : GDKfree(backupbbpdirstr);
1805 0 : TRC_CRITICAL(GDK, "cannot remove directory %s\n", DELDIR);
1806 0 : BBPtmunlock();
1807 0 : ATOMIC_SET(&GDKdebug, dbg);
1808 0 : return GDK_FAIL;
1809 : }
1810 :
1811 : /* first move everything from SUBDIR to BAKDIR (its parent) */
1812 314 : if (BBPrecover_subdir() != GDK_SUCCEED) {
1813 0 : GDKfree(bbpdirstr);
1814 0 : GDKfree(backupbbpdirstr);
1815 0 : TRC_CRITICAL(GDK, "cannot properly recover_subdir process %s.", SUBDIR);
1816 0 : BBPtmunlock();
1817 0 : ATOMIC_SET(&GDKdebug, dbg);
1818 0 : return GDK_FAIL;
1819 : }
1820 :
1821 : /* try to obtain a BBP.dir from bakdir */
1822 314 : if (MT_stat(backupbbpdirstr, &st) == 0) {
1823 : /* backup exists; *must* use it */
1824 89 : if (recover_dir(0, MT_stat(bbpdirstr, &st) == 0) != GDK_SUCCEED) {
1825 0 : GDKfree(bbpdirstr);
1826 0 : GDKfree(backupbbpdirstr);
1827 0 : BBPtmunlock();
1828 0 : goto bailout;
1829 : }
1830 89 : if ((fp = GDKfilelocate(0, "BBP", "r", "dir")) == NULL) {
1831 0 : GDKfree(bbpdirstr);
1832 0 : GDKfree(backupbbpdirstr);
1833 0 : TRC_CRITICAL(GDK, "cannot open recovered BBP.dir.");
1834 0 : BBPtmunlock();
1835 0 : ATOMIC_SET(&GDKdebug, dbg);
1836 0 : return GDK_FAIL;
1837 : }
1838 225 : } else if ((fp = GDKfilelocate(0, "BBP", "r", "dir")) == NULL) {
1839 : /* there was no BBP.dir either. Panic! try to use a
1840 : * BBP.bak */
1841 225 : if (MT_stat(backupbbpdirstr, &st) < 0) {
1842 : /* no BBP.bak (nor BBP.dir or BACKUP/BBP.dir):
1843 : * create a new one */
1844 225 : TRC_DEBUG(IO_, "initializing BBP.\n");
1845 225 : if (BBPdir_init() != GDK_SUCCEED) {
1846 0 : GDKfree(bbpdirstr);
1847 0 : GDKfree(backupbbpdirstr);
1848 0 : BBPtmunlock();
1849 0 : goto bailout;
1850 : }
1851 0 : } else if (GDKmove(0, BATDIR, "BBP", "bak", BATDIR, "BBP", "dir", true) == GDK_SUCCEED)
1852 0 : TRC_DEBUG(IO_, "reverting to dir saved in BBP.bak.\n");
1853 :
1854 225 : if ((fp = GDKfilelocate(0, "BBP", "r", "dir")) == NULL) {
1855 0 : GDKsyserror("cannot open BBP.dir");
1856 0 : GDKfree(bbpdirstr);
1857 0 : GDKfree(backupbbpdirstr);
1858 0 : BBPtmunlock();
1859 0 : goto bailout;
1860 : }
1861 : }
1862 : assert(fp != NULL);
1863 314 : GDKfree(bbpdirstr);
1864 314 : GDKfree(backupbbpdirstr);
1865 314 : BBPtmunlock();
1866 : }
1867 :
1868 : /* scan the BBP.dir to obtain current size */
1869 315 : BBPlimit = BBPINIT;
1870 315 : memset(BBP0, 0, sizeof(BBP0));
1871 315 : memset(BBP, 0, sizeof(BBP));
1872 315 : BBP[0] = BBP0;
1873 :
1874 315 : bat bbpsize;
1875 315 : bbpsize = 1;
1876 315 : if (GDKinmemory(0)) {
1877 : bbpversion = GDKLIBRARY;
1878 : } else {
1879 314 : lng logno;
1880 314 : bbpversion = BBPheader(fp, &lineno, &bbpsize, &logno, allow_hge_upgrade);
1881 314 : if (bbpversion == 0) {
1882 0 : ATOMIC_SET(&GDKdebug, dbg);
1883 0 : return GDK_FAIL;
1884 : }
1885 314 : ATOMIC_SET(&BBPlogno, logno);
1886 : }
1887 :
1888 : /* allocate BBP records */
1889 315 : if (BBPextend(bbpsize) != GDK_SUCCEED) {
1890 0 : ATOMIC_SET(&GDKdebug, dbg);
1891 0 : return GDK_FAIL;
1892 : }
1893 315 : ATOMIC_SET(&BBPsize, bbpsize);
1894 :
1895 315 : if (!GDKinmemory(0)) {
1896 314 : if (BBPreadEntries(fp, bbpversion, lineno
1897 : #ifdef GDKLIBRARY_HASHASH
1898 : , &hashbats, &nhashbats
1899 : #endif
1900 : ) != GDK_SUCCEED) {
1901 0 : ATOMIC_SET(&GDKdebug, dbg);
1902 0 : return GDK_FAIL;
1903 : }
1904 314 : fclose(fp);
1905 : }
1906 :
1907 : /* remove trailing free bats from potential free list (they will
1908 : * get added when needed) */
1909 14837 : for (bat i = (bat) ATOMIC_GET(&BBPsize) - 1; i > 0; i--) {
1910 14611 : if (BBP_desc(i)->batCacheid != 0)
1911 : break;
1912 14522 : bbpsize--;
1913 : }
1914 315 : ATOMIC_SET(&BBPsize, bbpsize);
1915 :
1916 : /* add free bats to free list in such a way that low numbered
1917 : * ones are at the head of the list */
1918 51299 : for (bat i = (bat) ATOMIC_GET(&BBPsize) - 1; i > 0; i--) {
1919 50984 : if (BBP_desc(i)->batCacheid == 0) {
1920 27531 : BBP_next(i) = BBP_free;
1921 27531 : BBP_free = i;
1922 27531 : BBP_nfree++;
1923 : }
1924 : }
1925 :
1926 : /* will call BBPrecover if needed */
1927 315 : if (!GDKinmemory(0)) {
1928 314 : BBPtmlock();
1929 314 : gdk_return rc = BBPprepare(false);
1930 314 : BBPtmunlock();
1931 314 : if (rc != GDK_SUCCEED) {
1932 : #ifdef GDKLIBRARY_HASHASH
1933 0 : GDKfree(hashbats);
1934 : #endif
1935 0 : TRC_CRITICAL(GDK, "cannot properly prepare process %s.", BAKDIR);
1936 0 : ATOMIC_SET(&GDKdebug, dbg);
1937 0 : return rc;
1938 : }
1939 : }
1940 :
1941 315 : if (BBPcheckbats(bbpversion) != GDK_SUCCEED) {
1942 : #ifdef GDKLIBRARY_HASHASH
1943 0 : GDKfree(hashbats);
1944 : #endif
1945 0 : ATOMIC_SET(&GDKdebug, dbg);
1946 0 : return GDK_FAIL;
1947 : }
1948 :
1949 : #ifdef GDKLIBRARY_HASHASH
1950 315 : if (nhashbats > 0)
1951 0 : res = fixhashash(hashbats, nhashbats);
1952 315 : GDKfree(hashbats);
1953 315 : if (res != GDK_SUCCEED)
1954 : return res;
1955 : #endif
1956 :
1957 : #ifdef GDKLIBRARY_JSON
1958 315 : if (bbpversion <= GDKLIBRARY_JSON) {
1959 0 : char *jsonupgradestr;
1960 0 : if (GDKinmemory(0)) {
1961 315 : jsonupgradestr = NULL;
1962 : } else {
1963 0 : if ((jsonupgradestr = GDKfilepath(0, BATDIR, "jsonupgradeneeded", NULL)) == NULL) {
1964 0 : TRC_CRITICAL(GDK, "GDKfilepath failed\n");
1965 0 : ATOMIC_SET(&GDKdebug, dbg);
1966 0 : return GDK_FAIL;
1967 : }
1968 :
1969 : /* create signal file that we need to upgrade
1970 : * stored json strings. This will be performed
1971 : * by an upgrade function in the GDK that will
1972 : * be called at the end of the json module
1973 : * initialization with a callback that actually
1974 : * knows how to perform the upgrade. */
1975 0 : int fd = MT_open(jsonupgradestr, O_WRONLY | O_CREAT);
1976 0 : GDKfree(jsonupgradestr);
1977 0 : if (fd < 0) {
1978 0 : TRC_CRITICAL(GDK, "cannot create signal file jsonupgradeneeded");
1979 0 : ATOMIC_SET(&GDKdebug, dbg);
1980 0 : return GDK_FAIL;
1981 : }
1982 :
1983 0 : close(fd);
1984 : }
1985 : }
1986 : #endif
1987 :
1988 315 : if (bbpversion < GDKLIBRARY && TMcommit() != GDK_SUCCEED) {
1989 0 : TRC_CRITICAL(GDK, "TMcommit failed\n");
1990 0 : ATOMIC_SET(&GDKdebug, dbg);
1991 0 : return GDK_FAIL;
1992 : }
1993 :
1994 315 : ATOMIC_SET(&GDKdebug, dbg);
1995 :
1996 : /* cleanup any leftovers (must be done after BBPrecover) */
1997 1246 : for (i = 0; i < MAXFARMS && BBPfarms[i].dirname != NULL; i++) {
1998 : int j;
1999 1229 : for (j = 0; j < i; j++) {
2000 : /* don't clean a directory twice */
2001 766 : if (BBPfarms[j].dirname &&
2002 766 : strcmp(BBPfarms[i].dirname,
2003 : BBPfarms[j].dirname) == 0)
2004 : break;
2005 : }
2006 931 : if (j == i) {
2007 463 : char *d = GDKfilepath(i, NULL, BATDIR, NULL);
2008 463 : if (d == NULL) {
2009 : return GDK_FAIL;
2010 : }
2011 463 : BBPdiskscan(d, strlen(d) - strlen(BATDIR));
2012 463 : GDKfree(d);
2013 : }
2014 : }
2015 :
2016 315 : if (!GDKinmemory(0) && !no_manager && MT_create_thread(&manager, BBPmanager, NULL, MT_THR_DETACHED, "BBPmanager") < 0) {
2017 0 : TRC_CRITICAL(GDK, "Could not start BBPmanager thread.");
2018 0 : return GDK_FAIL;
2019 : }
2020 : return GDK_SUCCEED;
2021 :
2022 0 : bailout:
2023 : /* now it is time for real panic */
2024 0 : TRC_CRITICAL(GDK, "could not write %s%cBBP.dir.", BATDIR, DIR_SEP);
2025 0 : return GDK_FAIL;
2026 : }
2027 :
2028 : /*
2029 : * During the exit phase all non-persistent BATs are removed. Upon
2030 : * exit the status of the BBP tables is saved on disk. This function
2031 : * is called once and during the shutdown of the server. Since
2032 : * shutdown may be issued from any thread (dangerous) it may lead to
2033 : * interference in a parallel session.
2034 : */
2035 :
2036 : static int backup_files = 0, backup_dir = 0, backup_subdir = 0;
2037 : static char *lockfile = NULL;
2038 :
2039 : void
2040 297 : BBPexit(void)
2041 : {
2042 297 : bat i;
2043 297 : bool skipped;
2044 :
2045 : //BBPlock(); /* stop all threads ever touching more descriptors */
2046 :
2047 : /* free all memory (just for leak-checking in Purify) */
2048 297 : do {
2049 297 : skipped = false;
2050 384641 : for (i = 0; i < (bat) ATOMIC_GET(&BBPsize); i++) {
2051 384344 : if (BBPvalid(i)) {
2052 272121 : BAT *b = BBP_desc(i);
2053 :
2054 272121 : if (b->batCacheid != 0) {
2055 272121 : if (BATshared(b)) {
2056 0 : skipped = true;
2057 0 : continue;
2058 : }
2059 272121 : MT_lock_set(&b->theaplock);
2060 272121 : bat tp = VIEWtparent(b);
2061 0 : if (tp != 0) {
2062 0 : --BBP_lrefs(tp);
2063 0 : HEAPdecref(b->theap, false);
2064 0 : b->theap = NULL;
2065 : }
2066 272121 : tp = VIEWvtparent(b);
2067 0 : if (tp != 0) {
2068 0 : --BBP_lrefs(tp);
2069 0 : HEAPdecref(b->tvheap, false);
2070 0 : b->tvheap = NULL;
2071 : }
2072 272121 : if (b->oldtail) {
2073 7 : Heap *h = b->oldtail;
2074 7 : b->oldtail = NULL;
2075 7 : ATOMIC_AND(&h->refs, ~DELAYEDREMOVE);
2076 7 : HEAPdecref(h, false);
2077 : }
2078 272121 : PROPdestroy_nolock(b);
2079 272121 : MT_lock_unset(&b->theaplock);
2080 272121 : BATfree(b);
2081 : }
2082 272121 : BBP_pid(i) = 0;
2083 272121 : BBPuncacheit(i, true);
2084 272121 : if (BBP_logical(i) != BBP_bak(i))
2085 10464 : GDKfree(BBP_logical(i));
2086 272121 : BBP_logical(i) = NULL;
2087 : }
2088 : }
2089 297 : } while (skipped);
2090 : /* these need to be NULL, otherwise no new ones get created */
2091 297 : memset(BBP_hash, 0, sizeof(BBP_hash));
2092 297 : backup_files = 0;
2093 297 : backup_dir = 0;
2094 297 : backup_subdir = 0;
2095 297 : if (lockfile) {
2096 296 : GDKfree(lockfile);
2097 296 : lockfile = NULL;
2098 : }
2099 297 : }
2100 :
2101 : /*
2102 : * The routine BBPdir creates the BAT pool dictionary file. It
2103 : * includes some information about the current state of affair in the
2104 : * pool. The location in the buffer pool is saved for later use as
2105 : * well. This is merely done for ease of debugging and of no
2106 : * importance to front-ends. The tail of non-used entries is
2107 : * reclaimed as well.
2108 : */
2109 : static inline int
2110 1792878 : heap_entry(FILE *fp, BATiter *bi, BUN size)
2111 : {
2112 1792878 : size_t free = bi->hfree;
2113 1792878 : if (size < BUN_NONE) {
2114 1792878 : if ((bi->type >= 0 && ATOMstorage(bi->type) == TYPE_msk))
2115 281657 : free = ((size + 31) / 32) * 4;
2116 1511221 : else if (bi->width > 0)
2117 1511221 : free = size << bi->shift;
2118 : else
2119 : free = 0;
2120 : }
2121 :
2122 5711096 : return fprintf(fp, " %s %d %d %d " BUNFMT " " BUNFMT " " BUNFMT " "
2123 : BUNFMT " " OIDFMT " %zu %" PRIu64" %" PRIu64,
2124 1792878 : bi->type >= 0 ? BATatoms[bi->type].name : ATOMunknown_name(bi->type),
2125 1792878 : bi->width,
2126 1792878 : bi->type == TYPE_void || bi->vh != NULL,
2127 1792878 : (unsigned short) bi->sorted |
2128 1792878 : ((unsigned short) bi->revsorted << 7) |
2129 3585756 : ((unsigned short) bi->key << 8) |
2130 1792878 : ((unsigned short) BATtdensebi(bi) << 9) |
2131 1792878 : ((unsigned short) bi->nonil << 10) |
2132 1792878 : ((unsigned short) bi->nil << 11) |
2133 1792878 : ((unsigned short) bi->ascii << 12),
2134 1090055 : bi->nokey[0] >= size || bi->nokey[1] >= size ? 0 : bi->nokey[0],
2135 1792878 : bi->nokey[0] >= size || bi->nokey[1] >= size ? 0 : bi->nokey[1],
2136 1792878 : bi->nosorted >= size ? 0 : bi->nosorted,
2137 1792878 : bi->norevsorted >= size ? 0 : bi->norevsorted,
2138 : bi->tseq,
2139 : free,
2140 1792878 : bi->minpos < size ? (uint64_t) bi->minpos : (uint64_t) oid_nil,
2141 1792878 : bi->maxpos < size ? (uint64_t) bi->maxpos : (uint64_t) oid_nil);
2142 : }
2143 :
2144 : static inline int
2145 1792878 : vheap_entry(FILE *fp, BATiter *bi, BUN size)
2146 : {
2147 1792878 : (void) size;
2148 1792878 : if (bi->vh == NULL)
2149 : return 0;
2150 412682 : return fprintf(fp, " %zu", size == 0 ? 0 : bi->vhfree);
2151 : }
2152 :
2153 : static gdk_return
2154 1792878 : new_bbpentry(FILE *fp, bat i, BUN size, BATiter *bi)
2155 : {
2156 : #ifndef NDEBUG
2157 1792878 : assert(i > 0);
2158 1792878 : assert(i < (bat) ATOMIC_GET(&BBPsize));
2159 1792878 : assert(bi->b);
2160 1792878 : assert(bi->b->batCacheid == i);
2161 1792878 : assert(bi->b->batRole == PERSISTENT);
2162 1792878 : assert(0 <= bi->h->farmid && bi->h->farmid < MAXFARMS);
2163 1792878 : assert(BBPfarms[bi->h->farmid].roles & (1U << PERSISTENT));
2164 1792878 : if (bi->vh) {
2165 412682 : assert(0 <= bi->vh->farmid && bi->vh->farmid < MAXFARMS);
2166 412682 : assert(BBPfarms[bi->vh->farmid].roles & (1U << PERSISTENT));
2167 : }
2168 1792878 : assert(size <= bi->count || size == BUN_NONE);
2169 1792878 : assert(BBP_options(i) == NULL || strpbrk(BBP_options(i), "\r\n") == NULL);
2170 : #endif
2171 :
2172 1792878 : if (BBP_options(i) != NULL && strpbrk(BBP_options(i), "\r\n") != NULL) {
2173 0 : GDKerror("options for bat %d contains a newline\n", i);
2174 0 : return GDK_FAIL;
2175 : }
2176 1792878 : if (size > bi->count)
2177 : size = bi->count;
2178 1792878 : if (fprintf(fp, "%d %s %d " BUNFMT " " OIDFMT,
2179 : /* BAT info */
2180 : (int) i,
2181 : BBP_logical(i),
2182 1792878 : (unsigned) bi->restricted << 1,
2183 : size,
2184 1792878 : bi->b->hseqbase) < 0 ||
2185 3585756 : heap_entry(fp, bi, size) < 0 ||
2186 1792878 : vheap_entry(fp, bi, size) < 0 ||
2187 3585756 : (BBP_options(i) && fprintf(fp, " %s", BBP_options(i)) < 0) ||
2188 1792878 : fprintf(fp, "\n") < 0) {
2189 0 : GDKsyserror("new_bbpentry: Writing BBP.dir entry failed\n");
2190 0 : return GDK_FAIL;
2191 : }
2192 :
2193 : return GDK_SUCCEED;
2194 : }
2195 :
2196 : static gdk_return
2197 13112 : BBPdir_header(FILE *f, int n, lng logno)
2198 : {
2199 13112 : if (fprintf(f, "BBP.dir, GDKversion %u\n%d %d %d\nBBPsize=%d\nBBPinfo=" LLFMT "\n",
2200 : GDKLIBRARY, SIZEOF_SIZE_T, SIZEOF_OID,
2201 : #ifdef HAVE_HGE
2202 : SIZEOF_HGE
2203 : #else
2204 : SIZEOF_LNG
2205 : #endif
2206 13112 : , n, logno) < 0 ||
2207 13112 : ferror(f)) {
2208 0 : GDKsyserror("Writing BBP.dir header failed\n");
2209 0 : return GDK_FAIL;
2210 : }
2211 : return GDK_SUCCEED;
2212 : }
2213 :
2214 : static gdk_return
2215 13112 : BBPdir_first(bool subcommit, lng logno, FILE **obbpfp, FILE **nbbpfp)
2216 : {
2217 13112 : FILE *obbpf = NULL, *nbbpf = NULL;
2218 13112 : int n = 0;
2219 13112 : lng ologno;
2220 :
2221 13112 : if (obbpfp)
2222 12887 : *obbpfp = NULL;
2223 13112 : *nbbpfp = NULL;
2224 :
2225 13112 : if ((nbbpf = GDKfilelocate(0, "BBP", "w", "dir")) == NULL) {
2226 : return GDK_FAIL;
2227 : }
2228 :
2229 13112 : if (subcommit) {
2230 12879 : char buf[512];
2231 :
2232 12879 : assert(obbpfp != NULL);
2233 : /* we need to copy the backup BBP.dir to the new, but
2234 : * replacing the entries for the subcommitted bats */
2235 12879 : if ((obbpf = GDKfileopen(0, SUBDIR, "BBP", "dir", "r")) == NULL &&
2236 0 : (obbpf = GDKfileopen(0, BAKDIR, "BBP", "dir", "r")) == NULL) {
2237 0 : GDKsyserror("subcommit attempted without backup BBP.dir");
2238 0 : goto bailout;
2239 : }
2240 : /* read first three lines */
2241 25758 : if (fgets(buf, sizeof(buf), obbpf) == NULL || /* BBP.dir, GDKversion %d */
2242 25758 : fgets(buf, sizeof(buf), obbpf) == NULL || /* SIZEOF_SIZE_T SIZEOF_OID SIZEOF_MAX_INT */
2243 12879 : fgets(buf, sizeof(buf), obbpf) == NULL) { /* BBPsize=%d */
2244 0 : GDKerror("subcommit attempted with invalid backup BBP.dir.");
2245 0 : goto bailout;
2246 : }
2247 : /* third line contains BBPsize */
2248 12879 : if (sscanf(buf, "BBPsize=%d", &n) != 1) {
2249 0 : GDKerror("cannot read BBPsize in backup BBP.dir.");
2250 0 : goto bailout;
2251 : }
2252 : /* fourth line contains BBPinfo */
2253 12879 : if (fgets(buf, sizeof(buf), obbpf) == NULL ||
2254 12879 : sscanf(buf, "BBPinfo=" LLSCN, &ologno) != 1) {
2255 0 : GDKerror("cannot read BBPinfo in backup BBP.dir.");
2256 0 : goto bailout;
2257 : }
2258 : }
2259 :
2260 13112 : if (n < (bat) ATOMIC_GET(&BBPsize))
2261 2653 : n = (bat) ATOMIC_GET(&BBPsize);
2262 :
2263 13112 : TRC_DEBUG(IO_, "writing BBP.dir (%d bats).\n", n);
2264 :
2265 13112 : if (BBPdir_header(nbbpf, n, logno) != GDK_SUCCEED) {
2266 0 : goto bailout;
2267 : }
2268 :
2269 13112 : if (obbpfp)
2270 12887 : *obbpfp = obbpf;
2271 13112 : *nbbpfp = nbbpf;
2272 :
2273 13112 : return GDK_SUCCEED;
2274 :
2275 0 : bailout:
2276 0 : if (obbpf != NULL)
2277 0 : fclose(obbpf);
2278 0 : if (nbbpf != NULL)
2279 0 : fclose(nbbpf);
2280 0 : return GDK_FAIL;
2281 : }
2282 :
2283 : static bat
2284 1986614 : BBPdir_step(bat bid, BUN size, int n, char *buf, size_t bufsize,
2285 : FILE **obbpfp, FILE *nbbpf, BATiter *bi)
2286 : {
2287 1986614 : if (n < -1) /* safety catch */
2288 : return n;
2289 5291551 : while (n >= 0 && n < bid) {
2290 3304937 : if (n > 0) {
2291 1572318 : if (fputs(buf, nbbpf) == EOF) {
2292 0 : GDKerror("Writing BBP.dir file failed.\n");
2293 0 : goto bailout;
2294 : }
2295 : }
2296 3304937 : if (fgets(buf, (int) bufsize, *obbpfp) == NULL) {
2297 3221 : if (ferror(*obbpfp)) {
2298 0 : GDKerror("error reading backup BBP.dir.");
2299 0 : goto bailout;
2300 : }
2301 3221 : n = -1;
2302 3221 : if (fclose(*obbpfp) == EOF) {
2303 0 : GDKsyserror("Closing backup BBP.dir file failed\n");
2304 0 : GDKclrerr(); /* ignore error */
2305 : }
2306 3221 : *obbpfp = NULL;
2307 : } else {
2308 3301716 : if (sscanf(buf, "%d", &n) != 1 || n <= 0 || n >= N_BBPINIT * BBPINIT) {
2309 0 : GDKerror("subcommit attempted with invalid backup BBP.dir.");
2310 0 : goto bailout;
2311 : }
2312 : }
2313 : }
2314 1986614 : if (bi) {
2315 1792878 : assert(BBP_status(bid) & BBPPERSISTENT);
2316 1792878 : if (new_bbpentry(nbbpf, bid, size, bi) != GDK_SUCCEED)
2317 0 : goto bailout;
2318 : }
2319 1986614 : return n == -1 ? -1 : n == bid ? 0 : n;
2320 :
2321 0 : bailout:
2322 0 : if (*obbpfp)
2323 0 : fclose(*obbpfp);
2324 0 : fclose(nbbpf);
2325 0 : return -2;
2326 : }
2327 :
2328 : static gdk_return
2329 13112 : BBPdir_last(int n, char *buf, size_t bufsize, FILE *obbpf, FILE *nbbpf)
2330 : {
2331 13112 : if (n > 0 && fputs(buf, nbbpf) == EOF) {
2332 0 : GDKerror("Writing BBP.dir file failed.\n");
2333 0 : goto bailout;
2334 : }
2335 315406 : while (obbpf) {
2336 311952 : if (fgets(buf, (int) bufsize, obbpf) == NULL) {
2337 9658 : if (ferror(obbpf)) {
2338 0 : GDKerror("error reading backup BBP.dir.");
2339 0 : goto bailout;
2340 : }
2341 9658 : if (fclose(obbpf) == EOF) {
2342 0 : GDKsyserror("Closing backup BBP.dir file failed\n");
2343 0 : GDKclrerr(); /* ignore error */
2344 : }
2345 : obbpf = NULL;
2346 : } else {
2347 302294 : if (fputs(buf, nbbpf) == EOF) {
2348 0 : GDKerror("Writing BBP.dir file failed.\n");
2349 0 : goto bailout;
2350 : }
2351 : }
2352 : }
2353 13112 : if (fflush(nbbpf) == EOF ||
2354 13112 : (!(ATOMIC_GET(&GDKdebug) & NOSYNCMASK)
2355 : #if defined(NATIVE_WIN32)
2356 : && _commit(_fileno(nbbpf)) < 0
2357 : #elif defined(HAVE_FDATASYNC)
2358 11 : && fdatasync(fileno(nbbpf)) < 0
2359 : #elif defined(HAVE_FSYNC)
2360 : && fsync(fileno(nbbpf)) < 0
2361 : #endif
2362 : )) {
2363 0 : GDKsyserror("Syncing BBP.dir file failed\n");
2364 0 : goto bailout;
2365 : }
2366 13112 : if (fclose(nbbpf) == EOF) {
2367 0 : GDKsyserror("Closing BBP.dir file failed\n");
2368 0 : nbbpf = NULL; /* can't close again */
2369 0 : goto bailout;
2370 : }
2371 :
2372 13112 : TRC_DEBUG(IO_, "end\n");
2373 :
2374 : return GDK_SUCCEED;
2375 :
2376 0 : bailout:
2377 0 : if (obbpf != NULL)
2378 0 : fclose(obbpf);
2379 0 : if (nbbpf != NULL)
2380 0 : fclose(nbbpf);
2381 : return GDK_FAIL;
2382 : }
2383 :
2384 : gdk_return
2385 225 : BBPdir_init(void)
2386 : {
2387 225 : FILE *fp;
2388 225 : gdk_return rc;
2389 :
2390 225 : rc = BBPdir_first(false, 0, NULL, &fp);
2391 225 : if (rc == GDK_SUCCEED)
2392 225 : rc = BBPdir_last(-1, NULL, 0, NULL, fp);
2393 225 : return rc;
2394 : }
2395 :
2396 : /* function used for debugging */
2397 : void
2398 0 : BBPdump(void)
2399 : {
2400 0 : size_t mem = 0, vm = 0;
2401 0 : int n = 0;
2402 :
2403 0 : for (bat i = 0; i < (bat) ATOMIC_GET(&BBPsize); i++) {
2404 0 : if (BBP_refs(i) == 0 && BBP_lrefs(i) == 0)
2405 0 : continue;
2406 0 : BAT *b = BBP_desc(i);
2407 0 : unsigned status = BBP_status(i);
2408 0 : printf("# %d: " ALGOOPTBATFMT " refs=%d lrefs=%d status=%u%s",
2409 : i,
2410 0 : ALGOOPTBATPAR(b),
2411 : BBP_refs(i),
2412 0 : BBP_lrefs(i),
2413 : status,
2414 0 : status & BBPLOADED ? "" : " not cached");
2415 0 : if (b->batCacheid == 0) {
2416 0 : printf(", no descriptor\n");
2417 0 : continue;
2418 : }
2419 0 : if (b->theap) {
2420 0 : if (b->theap->parentid != b->batCacheid) {
2421 0 : printf(" Theap -> %d", b->theap->parentid);
2422 : } else {
2423 0 : printf(" Theap=[%zu,%zu,f=%d]%s%s",
2424 : b->theap->free,
2425 : b->theap->size,
2426 0 : b->theap->farmid,
2427 0 : b->theap->base == NULL ? "X" : b->theap->storage == STORE_MMAP ? "M" : "",
2428 0 : status & BBPSWAPPED ? "(Swapped)" : b->theap->dirty ? "(Dirty)" : "");
2429 0 : mem += HEAPmemsize(b->theap);
2430 0 : vm += HEAPvmsize(b->theap);
2431 0 : n++;
2432 : }
2433 : }
2434 0 : if (b->tvheap) {
2435 0 : if (b->tvheap->parentid != b->batCacheid) {
2436 0 : printf(" Tvheap -> %d",
2437 : b->tvheap->parentid);
2438 : } else {
2439 0 : printf(" Tvheap=[%zu,%zu,f=%d]%s%s",
2440 : b->tvheap->free,
2441 : b->tvheap->size,
2442 0 : b->tvheap->farmid,
2443 0 : b->tvheap->base == NULL ? "X" : b->tvheap->storage == STORE_MMAP ? "M" : "",
2444 0 : b->tvheap->dirty ? "(Dirty)" : "");
2445 0 : mem += HEAPmemsize(b->tvheap);
2446 0 : vm += HEAPvmsize(b->tvheap);
2447 : }
2448 : }
2449 0 : if (MT_rwlock_rdtry(&b->thashlock)) {
2450 0 : if (b->thash && b->thash != (Hash *) 1) {
2451 0 : size_t m = HEAPmemsize(&b->thash->heaplink) + HEAPmemsize(&b->thash->heapbckt);
2452 0 : size_t v = HEAPvmsize(&b->thash->heaplink) + HEAPvmsize(&b->thash->heapbckt);
2453 0 : printf(" Thash=[%zu,%zu,f=%d/%d]", m, v,
2454 0 : b->thash->heaplink.farmid,
2455 0 : b->thash->heapbckt.farmid);
2456 0 : mem += m;
2457 0 : vm += v;
2458 : }
2459 0 : MT_rwlock_rdunlock(&b->thashlock);
2460 : }
2461 0 : printf(" role: %s\n",
2462 0 : b->batRole == PERSISTENT ? "persistent" : "transient");
2463 : }
2464 0 : printf("# %d bats: mem=%zu, vm=%zu\n", n, mem, vm);
2465 0 : fflush(stdout);
2466 0 : }
2467 :
2468 : /*
2469 : * @+ BBP Readonly Interface
2470 : *
2471 : * These interface functions do not change the BBP tables. If they
2472 : * only access one specific BAT, the caller must have ensured that no
2473 : * other thread is modifying that BAT, therefore such functions do not
2474 : * need locking.
2475 : *
2476 : * BBP index lookup by BAT name:
2477 : */
2478 : static inline bat
2479 40128 : BBP_find(const char *nme, bool lock)
2480 : {
2481 40128 : bat i = BBPnamecheck(nme);
2482 :
2483 13533 : if (i != 0) {
2484 : /* for tmp_X BATs, we already know X */
2485 13533 : const char *s;
2486 :
2487 13533 : if (i >= (bat) ATOMIC_GET(&BBPsize) || (s = BBP_logical(i)) == NULL || strcmp(s, nme)) {
2488 13533 : i = 0;
2489 : }
2490 26595 : } else if (*nme != '.') {
2491 : /* must lock since hash-lookup traverses other BATs */
2492 26595 : if (lock)
2493 1236 : MT_lock_set(&BBPnameLock);
2494 26922 : for (i = BBP_hash[strHash(nme) & BBP_mask]; i; i = BBP_next(i)) {
2495 954 : if (strcmp(BBP_logical(i), nme) == 0)
2496 : break;
2497 : }
2498 26595 : if (lock)
2499 1236 : MT_lock_unset(&BBPnameLock);
2500 : }
2501 40128 : return i;
2502 : }
2503 :
2504 : bat
2505 1236 : BBPindex(const char *nme)
2506 : {
2507 1236 : return BBP_find(nme, true);
2508 : }
2509 :
2510 : /*
2511 : * @+ BBP Update Interface
2512 : * Operations to insert, delete, clear, and modify BBP entries.
2513 : * Our policy for the BBP is to provide unlocked BBP access for
2514 : * speed, but still write operations have to be locked.
2515 : * #ifdef DEBUG_THREADLOCAL_BATS
2516 : * Create the shadow version (reversed) of a bat.
2517 : *
2518 : * An existing BAT is inserted into the BBP
2519 : */
2520 :
2521 : /* The free list is empty. We create a new entry by either just
2522 : * increasing BBPsize (up to BBPlimit) or extending the BBP (which
2523 : * increases BBPlimit).
2524 : *
2525 : * Note that this is the only place in normal, multi-threaded operation
2526 : * where BBPsize is assigned a value (never decreasing) and that the
2527 : * assignment happens after any necessary memory was allocated and
2528 : * initialized. */
2529 : static gdk_return
2530 35523 : maybeextend(void)
2531 : {
2532 35523 : bat size = (bat) ATOMIC_GET(&BBPsize);
2533 35523 : if (size + BBP_FREE_LOWATER > BBPlimit &&
2534 0 : BBPextend(size + BBP_FREE_LOWATER) != GDK_SUCCEED) {
2535 : /* nothing available */
2536 : return GDK_FAIL;
2537 : }
2538 35523 : ATOMIC_SET(&BBPsize, size + BBP_FREE_LOWATER);
2539 35523 : assert(BBP_free == 0);
2540 35523 : BBP_free = size;
2541 355230 : for (int i = 1; i < BBP_FREE_LOWATER; i++) {
2542 319707 : bat sz = size;
2543 319707 : BBP_next(sz) = ++size;
2544 : }
2545 35523 : BBP_next(size) = 0;
2546 35523 : BBP_nfree += BBP_FREE_LOWATER;
2547 35523 : return GDK_SUCCEED;
2548 : }
2549 :
2550 : /* return new BAT id (> 0); return 0 on failure */
2551 : bat
2552 18060781 : BBPallocbat(int tt)
2553 : {
2554 18060781 : MT_Id pid = MT_getpid();
2555 18058617 : bool lock = locked_by == 0 || locked_by != pid;
2556 18058617 : bat i;
2557 18058617 : int len = 0;
2558 18058617 : struct freebats *t = MT_thread_getfreebats();
2559 :
2560 18056981 : if (t->freebats == 0) {
2561 : /* critical section: get a new BBP entry */
2562 185370 : assert(t->nfreebats == 0);
2563 185370 : if (lock) {
2564 185370 : MT_lock_set(&GDKcacheLock);
2565 : }
2566 :
2567 : /* get a global bat, perhaps extend */
2568 185373 : if (BBP_free <= 0) {
2569 : /* we need to extend the BBP */
2570 35523 : gdk_return r;
2571 35523 : r = maybeextend();
2572 35523 : if (r != GDK_SUCCEED) {
2573 0 : if (lock) {
2574 0 : MT_lock_unset(&GDKcacheLock);
2575 : }
2576 : /* failed */
2577 0 : return 0;
2578 : }
2579 : }
2580 185373 : t->freebats = i = BBP_free;
2581 185373 : bat l = 0;
2582 2011995 : for (int x = 0; x < BBP_FREE_LOWATER && i; x++) {
2583 1826622 : assert(BBP_next(i) == 0 || BBP_next(i) > i);
2584 1826622 : t->nfreebats++;
2585 1826622 : BBP_nfree--;
2586 1826622 : l = i;
2587 1826622 : i = BBP_next(i);
2588 : }
2589 185373 : BBP_next(l) = 0;
2590 185373 : BBP_free = i;
2591 :
2592 185373 : if (lock) {
2593 185373 : MT_lock_unset(&GDKcacheLock);
2594 : }
2595 : /* rest of the work outside the lock */
2596 : }
2597 18056984 : if (t->nfreebats > 0) {
2598 18056984 : assert(t->freebats > 0);
2599 18056984 : i = t->freebats;
2600 18056984 : t->freebats = BBP_next(i);
2601 18056984 : assert(t->freebats == 0 || t->freebats > i);
2602 18056984 : BBP_next(i) = 0;
2603 18056984 : t->nfreebats--;
2604 : } else {
2605 0 : assert(t->nfreebats == 0);
2606 0 : assert(t->freebats == 0);
2607 : return 0;
2608 : }
2609 :
2610 : /* fill in basic BBP fields for the new bat */
2611 :
2612 18056984 : MT_lock_set(&GDKswapLock(i));
2613 18051666 : BBP_status_set(i, BBPDELETING|BBPHOT);
2614 18051666 : BBP_refs(i) = 1; /* new bats have 1 pin */
2615 18051666 : BBP_lrefs(i) = 0; /* ie. no logical refs */
2616 18051666 : BBP_pid(i) = pid;
2617 18051666 : MT_lock_unset(&GDKswapLock(i));
2618 :
2619 18060705 : if (*BBP_bak(i) == 0)
2620 365929 : len = snprintf(BBP_bak(i), sizeof(BBP_bak(i)), "tmp_%o", (unsigned) i);
2621 18060705 : if (len == -1 || len >= FILENAME_MAX) {
2622 0 : GDKerror("impossible error\n");
2623 0 : return 0;
2624 : }
2625 18060705 : BBP_logical(i) = BBP_bak(i);
2626 :
2627 : /* Keep the physical location around forever */
2628 18060705 : if (!GDKinmemory(0) && *BBP_physical(i) == 0) {
2629 365531 : BBPgetfilename(BBP_physical(i), sizeof(BBP_physical(i)), i);
2630 365573 : TRC_DEBUG(BAT_, "%d = new %s(%s)\n", (int) i, BBP_logical(i), ATOMname(tt));
2631 : }
2632 :
2633 : return i;
2634 : }
2635 :
2636 : gdk_return
2637 18073065 : BBPcacheit(BAT *bn, bool lock)
2638 : {
2639 18073065 : bat i = bn->batCacheid;
2640 18073065 : unsigned mode;
2641 :
2642 18073065 : if (lock)
2643 36112886 : lock = locked_by == 0 || locked_by != MT_getpid();
2644 :
2645 18073065 : assert(i > 0);
2646 :
2647 18073065 : if (lock)
2648 18056870 : MT_lock_set(&GDKswapLock(i));
2649 18067363 : mode = (BBP_status(i) | BBPLOADED) & ~(BBPLOADING | BBPDELETING | BBPSWAPPED);
2650 :
2651 : /* cache it! */
2652 18067363 : BBP_status_set(i, mode);
2653 :
2654 18067363 : if (lock)
2655 18058221 : MT_lock_unset(&GDKswapLock(i));
2656 18066117 : return GDK_SUCCEED;
2657 : }
2658 :
2659 : /*
2660 : * BBPuncacheit changes the BBP status to swapped out. Currently only
2661 : * used in BBPfree (bat swapped out) and BBPclear (bat destroyed
2662 : * forever).
2663 : */
2664 :
2665 : static void
2666 18093471 : BBPuncacheit(bat i, bool unloaddesc)
2667 : {
2668 18093471 : if (i < 0)
2669 : i = -i;
2670 18093471 : if (BBPcheck(i)) {
2671 18091847 : BAT *b = BBP_desc(i);
2672 :
2673 18091847 : assert(unloaddesc || BBP_refs(i) == 0);
2674 :
2675 18091847 : if (BBP_status(i) & BBPLOADED) {
2676 18068029 : TRC_DEBUG(BAT_, "uncache %d (%s)\n", (int) i, BBP_logical(i));
2677 :
2678 : /* clearing bits can be done without the lock */
2679 18068029 : BBP_status_off(i, BBPLOADED);
2680 : }
2681 18091847 : if (unloaddesc) {
2682 18078399 : BATdestroy(b);
2683 : }
2684 : }
2685 18094012 : }
2686 :
2687 : /*
2688 : * @- BBPclear
2689 : * BBPclear removes a BAT from the BBP directory forever.
2690 : */
2691 : static inline void
2692 69905 : BBPhandover(struct freebats *t, uint32_t n)
2693 : {
2694 69905 : bat *p, bid;
2695 : /* take one bat from our private free list and hand it over to
2696 : * the global free list */
2697 69905 : if (n >= t->nfreebats) {
2698 44566 : bid = t->freebats;
2699 44566 : t->freebats = 0;
2700 44566 : BBP_nfree += t->nfreebats;
2701 44566 : t->nfreebats = 0;
2702 : } else {
2703 25339 : p = &t->freebats;
2704 278729 : for (uint32_t i = n; i < t->nfreebats; i++)
2705 253390 : p = &BBP_next(*p);
2706 25339 : bid = *p;
2707 25339 : *p = 0;
2708 25339 : BBP_nfree += n;
2709 25339 : t->nfreebats -= n;
2710 : }
2711 : p = &BBP_free;
2712 1636144 : while (bid != 0) {
2713 12652427 : while (*p && *p < bid)
2714 11086188 : p = &BBP_next(*p);
2715 1566239 : bat i = BBP_next(bid);
2716 1566239 : BBP_next(bid) = *p;
2717 1566239 : *p = bid;
2718 1566239 : bid = i;
2719 : }
2720 69905 : }
2721 :
2722 : #ifndef NDEBUG
2723 : extern void printlist(bat bid) __attribute__((__cold__));
2724 : /* print a bat free list, pass start of free list as argument
2725 : * to be used from the debugger */
2726 : void
2727 0 : printlist(bat bid)
2728 : {
2729 0 : int n = 0;
2730 0 : while (bid) {
2731 0 : printf("%d ", bid);
2732 0 : bid = BBP_next(bid);
2733 0 : n++;
2734 : }
2735 0 : printf("(%d)\n", n);
2736 0 : }
2737 : #endif
2738 :
2739 : static inline void
2740 17803224 : bbpclear(bat i, bool lock)
2741 : {
2742 17803224 : struct freebats *t = MT_thread_getfreebats();
2743 :
2744 17802042 : TRC_DEBUG(BAT_, "clear %d (%s)\n", (int) i, BBP_logical(i));
2745 17802042 : BBPuncacheit(i, true);
2746 17812542 : TRC_DEBUG(BAT_, "set to unloading %d\n", i);
2747 17812542 : if (lock) {
2748 17808460 : MT_lock_set(&GDKswapLock(i));
2749 : }
2750 :
2751 17806551 : BBP_status_set(i, BBPUNLOADING);
2752 17806551 : BBP_refs(i) = 0;
2753 17806551 : BBP_lrefs(i) = 0;
2754 17806551 : if (lock)
2755 17806380 : MT_lock_unset(&GDKswapLock(i));
2756 17807330 : if (!BBPtmpcheck(BBP_logical(i))) {
2757 1198 : MT_lock_set(&BBPnameLock);
2758 1198 : BBP_delete(i);
2759 1198 : MT_lock_unset(&BBPnameLock);
2760 : }
2761 17807330 : if (BBP_logical(i) != BBP_bak(i))
2762 1198 : GDKfree(BBP_logical(i));
2763 17808074 : BBP_status_set(i, 0);
2764 17808074 : BBP_logical(i) = NULL;
2765 17808074 : bat *p;
2766 52410104 : for (p = &t->freebats; *p && *p < i; p = &BBP_next(*p))
2767 : ;
2768 17808074 : BBP_next(i) = *p;
2769 17808074 : *p = i;
2770 17808074 : t->nfreebats++;
2771 17808074 : BBP_pid(i) = ~(MT_Id)0; /* not zero, not a valid thread id */
2772 17808074 : if (t->nfreebats > BBP_FREE_HIWATER) {
2773 25338 : if (lock)
2774 25338 : MT_lock_set(&GDKcacheLock);
2775 25339 : BBPhandover(t, t->nfreebats - BBP_FREE_LOWATER);
2776 25339 : if (lock)
2777 25339 : MT_lock_unset(&GDKcacheLock);
2778 : }
2779 17808075 : }
2780 :
2781 : void
2782 17805999 : BBPclear(bat i)
2783 : {
2784 17805999 : if (BBPcheck(i)) {
2785 17803273 : bool lock = locked_by == 0 || locked_by != MT_getpid();
2786 17803273 : bbpclear(i, lock);
2787 : }
2788 17805272 : }
2789 :
2790 : void
2791 48895 : BBPrelinquishbats(void)
2792 : {
2793 48895 : struct freebats *t = MT_thread_getfreebats();
2794 48895 : if (t == NULL || t->nfreebats == 0)
2795 : return;
2796 44566 : MT_lock_set(&GDKcacheLock);
2797 89132 : while (t->nfreebats > 0) {
2798 44566 : BBPhandover(t, t->nfreebats);
2799 : }
2800 44566 : MT_lock_unset(&GDKcacheLock);
2801 : }
2802 :
2803 : /*
2804 : * @- BBP rename
2805 : *
2806 : * Each BAT has a logical name that is globally unique.
2807 : * The batId is the same as the logical BAT name.
2808 : *
2809 : * The default logical name of a BAT is tmp_X, where X is the
2810 : * batCacheid. Apart from being globally unique, new logical bat
2811 : * names cannot be of the form tmp_X, unless X is the batCacheid.
2812 : *
2813 : * Physical names consist of a directory name followed by a logical
2814 : * name suffix. The directory name is derived from the batCacheid,
2815 : * and is currently organized in a hierarchy that puts max 64 bats in
2816 : * each directory (see BBPgetsubdir).
2817 : *
2818 : * Concerning the physical suffix: it is almost always bat_X. This
2819 : * saves us a whole lot of trouble, as bat_X is always unique and no
2820 : * conflicts can occur. Other suffixes are only supported in order
2821 : * just for backward compatibility with old repositories (you won't
2822 : * see them anymore in new repositories).
2823 : */
2824 : int
2825 38892 : BBPrename(BAT *b, const char *nme)
2826 : {
2827 38892 : if (b == NULL)
2828 : return 0;
2829 :
2830 38892 : bat bid = b->batCacheid;
2831 38892 : bat tmpid = 0, i;
2832 :
2833 38892 : if (nme == NULL) {
2834 13533 : if (BBP_bak(bid)[0] == 0 &&
2835 0 : snprintf(BBP_bak(bid), sizeof(BBP_bak(bid)), "tmp_%o", (unsigned) bid) >= (int) sizeof(BBP_bak(bid))) {
2836 : /* cannot happen */
2837 0 : TRC_CRITICAL(GDK, "BBP default filename too long\n");
2838 0 : return BBPRENAME_LONG;
2839 : }
2840 13533 : nme = BBP_bak(bid);
2841 : }
2842 :
2843 : /* If name stays same, do nothing */
2844 38892 : if (BBP_logical(bid) && strcmp(BBP_logical(bid), nme) == 0)
2845 : return 0;
2846 :
2847 38892 : if ((tmpid = BBPnamecheck(nme)) && tmpid != bid) {
2848 0 : GDKerror("illegal temporary name: '%s'\n", nme);
2849 0 : return BBPRENAME_ILLEGAL;
2850 : }
2851 38892 : if (strLen(nme) >= IDLENGTH) {
2852 0 : GDKerror("illegal temporary name: '%s'\n", nme);
2853 0 : return BBPRENAME_LONG;
2854 : }
2855 :
2856 38892 : MT_lock_set(&BBPnameLock);
2857 38892 : i = BBP_find(nme, false);
2858 38892 : if (i != 0) {
2859 1 : MT_lock_unset(&BBPnameLock);
2860 1 : GDKerror("name is in use: '%s'.\n", nme);
2861 1 : return BBPRENAME_ALREADY;
2862 : }
2863 :
2864 38891 : char *nnme;
2865 38891 : if (nme == BBP_bak(bid) || strcmp(nme, BBP_bak(bid)) == 0) {
2866 38891 : nnme = BBP_bak(bid);
2867 : } else {
2868 25358 : nnme = GDKstrdup(nme);
2869 25358 : if (nnme == NULL) {
2870 0 : MT_lock_unset(&BBPnameLock);
2871 0 : return BBPRENAME_MEMORY;
2872 : }
2873 : }
2874 :
2875 : /* carry through the name change */
2876 38891 : if (BBP_logical(bid) && !BBPtmpcheck(BBP_logical(bid))) {
2877 13533 : BBP_delete(bid);
2878 : }
2879 38891 : if (BBP_logical(bid) != BBP_bak(bid))
2880 13533 : GDKfree(BBP_logical(bid));
2881 38891 : BBP_logical(bid) = nnme;
2882 38891 : if (tmpid == 0) {
2883 25358 : BBP_insert(bid);
2884 : }
2885 38891 : MT_lock_set(&b->theaplock);
2886 38891 : bool transient = b->batTransient;
2887 38891 : MT_lock_unset(&b->theaplock);
2888 38891 : if (!transient) {
2889 9759 : bool lock = locked_by == 0 || locked_by != MT_getpid();
2890 :
2891 9759 : if (lock)
2892 9759 : MT_lock_set(&GDKswapLock(i));
2893 9759 : BBP_status_on(bid, BBPRENAMED);
2894 9759 : if (lock)
2895 9759 : MT_lock_unset(&GDKswapLock(i));
2896 : }
2897 38891 : MT_lock_unset(&BBPnameLock);
2898 38891 : return 0;
2899 : }
2900 :
2901 : /*
2902 : * @+ BBP swapping Policy
2903 : * The BAT can be moved back to disk using the routine BBPfree. It
2904 : * frees the storage for other BATs. After this call BAT* references
2905 : * maintained for the BAT are wrong. We should keep track of dirty
2906 : * unloaded BATs. They may have to be committed later on, which may
2907 : * include reading them in again.
2908 : *
2909 : * BBPswappable: may this bat be unloaded? Only real bats without
2910 : * memory references can be unloaded.
2911 : */
2912 : static inline void
2913 3218702 : BBPspin(bat i, const char *s, unsigned event)
2914 : {
2915 3218702 : if (BBPcheck(i) && (BBP_status(i) & event)) {
2916 : lng spin = LL_CONSTANT(0);
2917 :
2918 1833 : do {
2919 1833 : MT_sleep_ms(KITTENNAP);
2920 1833 : spin++;
2921 1833 : } while (BBP_status(i) & event);
2922 24 : TRC_DEBUG(BAT_, "%d,%s,%u: " LLFMT " loops\n", (int) i, s, event, spin);
2923 : }
2924 3218521 : }
2925 :
2926 : void
2927 6660137 : BBPcold(bat i)
2928 : {
2929 6660137 : if (!is_bat_nil(i)) {
2930 6660462 : BAT *b = BBP_desc(i);
2931 6660462 : if (b->batRole == PERSISTENT)
2932 701 : BBP_status_off(i, BBPHOT);
2933 : }
2934 6660137 : }
2935 :
2936 : /* This function can fail if the input parameter (i) is incorrect
2937 : * (unlikely). */
2938 : static inline int
2939 110138773 : incref(bat i, bool logical, bool lock)
2940 : {
2941 110138773 : int refs;
2942 110138773 : BAT *b;
2943 :
2944 110138773 : if (!BBPcheck(i))
2945 : return 0;
2946 :
2947 110066642 : if (lock) {
2948 33866348 : for (;;) {
2949 33866348 : MT_lock_set(&GDKswapLock(i));
2950 33981820 : if (!(BBP_status(i) & (BBPUNSTABLE|BBPLOADING)))
2951 : break;
2952 : /* the BATs is "unstable", try again */
2953 0 : MT_lock_unset(&GDKswapLock(i));
2954 0 : BBPspin(i, __func__, BBPUNSTABLE|BBPLOADING);
2955 : }
2956 : }
2957 : /* we have the lock */
2958 :
2959 110182114 : b = BBP_desc(i);
2960 110182114 : if (b->batCacheid == 0) {
2961 : /* should not have happened */
2962 0 : if (lock)
2963 0 : MT_lock_unset(&GDKswapLock(i));
2964 0 : return 0;
2965 : }
2966 :
2967 110182114 : assert(BBP_refs(i) + BBP_lrefs(i) ||
2968 : BBP_status(i) & (BBPDELETED | BBPSWAPPED));
2969 110182114 : if (logical) {
2970 33869700 : refs = ++BBP_lrefs(i);
2971 33869700 : BBP_pid(i) = 0;
2972 : } else {
2973 76312414 : refs = ++BBP_refs(i);
2974 76312414 : BBP_status_on(i, BBPHOT);
2975 : }
2976 110182114 : if (lock)
2977 33866974 : MT_lock_unset(&GDKswapLock(i));
2978 :
2979 : return refs;
2980 : }
2981 :
2982 : /* increment the physical reference counter for the given bat
2983 : * returns the new reference count
2984 : * also increments the physical reference count of the parent bat(s) (if
2985 : * any) */
2986 : int
2987 57833 : BBPfix(bat i)
2988 : {
2989 57833 : return BATdescriptor(i) ? 1 : 0;
2990 : }
2991 :
2992 : /* increment the logical reference count for the given bat
2993 : * returns the new reference count */
2994 : int
2995 28822329 : BBPretain(bat i)
2996 : {
2997 28822329 : bool lock = locked_by == 0 || locked_by != MT_getpid();
2998 :
2999 28822329 : return incref(i, true, lock);
3000 : }
3001 :
3002 : static inline int
3003 135421198 : decref(bat i, bool logical, bool lock, const char *func)
3004 : {
3005 135421198 : int refs = 0, lrefs;
3006 135421198 : bool swap = false;
3007 135421198 : bool locked = false;
3008 135421198 : int farmid = 0;
3009 135421198 : BAT *b;
3010 :
3011 135421198 : if (is_bat_nil(i))
3012 : return -1;
3013 127636546 : assert(i > 0);
3014 127636546 : if (BBPcheck(i) == 0)
3015 : return -1;
3016 :
3017 127510157 : if (lock)
3018 127497142 : MT_lock_set(&GDKswapLock(i));
3019 :
3020 127514458 : while (BBP_status(i) & BBPUNLOADING) {
3021 0 : if (lock)
3022 0 : MT_lock_unset(&GDKswapLock(i));
3023 0 : BBPspin(i, func, BBPUNLOADING);
3024 0 : if (lock)
3025 127514458 : MT_lock_set(&GDKswapLock(i));
3026 : }
3027 :
3028 127615913 : b = (BBP_status(i) & BBPLOADED) ? BBP_desc(i) : NULL;
3029 :
3030 : /* decrement references by one */
3031 127615913 : if (logical) {
3032 33791484 : if (BBP_lrefs(i) == 0) {
3033 0 : GDKerror("%s: %s does not have logical references.\n", func, BBP_logical(i));
3034 0 : assert(0);
3035 : } else {
3036 33791484 : refs = --BBP_lrefs(i);
3037 : }
3038 : /* cannot release last logical ref if still shared */
3039 : // but we could still have a bat iterator on it
3040 : //assert(!BATshared(BBP_desc(i)) || refs > 0);
3041 : } else {
3042 93824429 : if (BBP_refs(i) == 0) {
3043 0 : GDKerror("%s: %s does not have pointer fixes.\n", func, BBP_logical(i));
3044 0 : assert(0);
3045 : } else {
3046 93824429 : refs = --BBP_refs(i);
3047 93824429 : if (b && refs == 0) {
3048 78138538 : MT_lock_set(&b->theaplock);
3049 78168386 : locked = true;
3050 78168386 : if (VIEWtparent(b) || VIEWvtparent(b))
3051 13340013 : BBP_status_on(i, BBPHOT);
3052 : }
3053 : }
3054 : }
3055 127645761 : if (b) {
3056 127394813 : if (!locked) {
3057 49489359 : MT_lock_set(&b->theaplock);
3058 49503266 : locked = true;
3059 : }
3060 : #if 0
3061 : if (b->batCount > b->batInserted && !isVIEW(b)) {
3062 : /* if batCount is larger than batInserted and
3063 : * the dirty bits are off, it may be that a
3064 : * (sub)commit happened in parallel to an
3065 : * update; we must undo the turning off of the
3066 : * dirty bits */
3067 : if (b->theap && b->theap->parentid == i)
3068 : b->theap->dirty = true;
3069 : if (b->tvheap && b->tvheap->parentid == i)
3070 : b->tvheap->dirty = true;
3071 : }
3072 : #endif
3073 127379252 : if (b->theap)
3074 127379252 : farmid = b->theap->farmid;
3075 : }
3076 :
3077 : /* we destroy transients asap and unload persistent bats only
3078 : * if they have been made cold or are not dirty */
3079 127630200 : unsigned chkflag = BBPSYNCING;
3080 127630200 : bool swapdirty = false;
3081 127630200 : if (b) {
3082 127386271 : size_t cursize;
3083 127386271 : if ((cursize = GDKvm_cursize()) < (size_t) (GDK_vm_maxsize * 0.75)) {
3084 127387055 : if (!locked) {
3085 0 : MT_lock_set(&b->theaplock);
3086 0 : locked = true;
3087 : }
3088 127387055 : if (((b->theap ? b->theap->size : 0) + (b->tvheap ? b->tvheap->size : 0)) < (GDK_vm_maxsize - cursize) / 32)
3089 127396874 : chkflag |= BBPHOT;
3090 0 : } else if (cursize > (size_t) (GDK_vm_maxsize * 0.85))
3091 127630984 : swapdirty = true;
3092 : }
3093 : /* only consider unloading if refs is 0; if, in addition, lrefs
3094 : * is 0, we can definitely unload, else only if some more
3095 : * conditions are met */
3096 220463074 : if (BBP_refs(i) == 0 &&
3097 110630886 : (BBP_lrefs(i) == 0 ||
3098 92807662 : (b != NULL && b->theap != NULL
3099 92810840 : ? ((swapdirty || !BATdirty(b)) &&
3100 10693397 : !(BBP_status(i) & chkflag) &&
3101 16192 : (BBP_status(i) & BBPPERSISTENT) &&
3102 : /* cannot unload in-memory data */
3103 7912 : !GDKinmemory(farmid) &&
3104 : /* do not unload views or parents of views */
3105 7912 : !BATshared(b) &&
3106 92814698 : b->batCacheid == b->theap->parentid &&
3107 7036 : (b->tvheap == NULL || b->batCacheid == b->tvheap->parentid))
3108 24428 : : (BBP_status(i) & BBPTMP)))) {
3109 : /* bat will be unloaded now. set the UNLOADING bit
3110 : * while locked so no other thread thinks it's
3111 : * available anymore */
3112 17810494 : assert((BBP_status(i) & BBPUNLOADING) == 0);
3113 17810494 : TRC_DEBUG(BAT_, "%s set to unloading BAT %d (status %u, lrefs %d)\n", func, i, BBP_status(i), BBP_lrefs(i));
3114 17810494 : BBP_status_on(i, BBPUNLOADING);
3115 17810494 : swap = true;
3116 : } /* else: bat cannot be swapped out */
3117 127630984 : lrefs = BBP_lrefs(i);
3118 127630984 : if (locked)
3119 127435145 : MT_lock_unset(&b->theaplock);
3120 :
3121 : /* unlock before re-locking in unload; as saving a dirty
3122 : * persistent bat may take a long time */
3123 127730217 : if (lock)
3124 127555428 : MT_lock_unset(&GDKswapLock(i));
3125 :
3126 127668482 : if (swap) {
3127 17810976 : if (b != NULL) {
3128 17793584 : if (lrefs == 0 && (BBP_status(i) & BBPDELETED) == 0) {
3129 : /* free memory (if loaded) and delete from
3130 : * disk (if transient but saved) */
3131 17785530 : BBPdestroy(b);
3132 : } else {
3133 8054 : TRC_DEBUG(BAT_, "%s unload and free bat %d\n", func, i);
3134 : /* free memory of transient */
3135 8054 : if (BBPfree(b) != GDK_SUCCEED)
3136 : return -1; /* indicate failure */
3137 : }
3138 17392 : } else if (lrefs == 0 && (BBP_status(i) & BBPDELETED) == 0) {
3139 12730 : BATdelete(BBP_desc(i));
3140 12730 : BBPclear(i);
3141 : } else {
3142 4662 : BBP_status_off(i, BBPUNLOADING);
3143 : }
3144 : }
3145 : return refs;
3146 : }
3147 :
3148 : int
3149 90086090 : BBPunfix(bat i)
3150 : {
3151 90086090 : return decref(i, false, true, __func__);
3152 : }
3153 :
3154 : int
3155 41570400 : BBPrelease(bat i)
3156 : {
3157 41570400 : return decref(i, true, true, __func__);
3158 : }
3159 :
3160 : void
3161 5064109 : BBPkeepref(BAT *b)
3162 : {
3163 5064109 : assert(b != NULL);
3164 5064109 : bool lock = locked_by == 0 || locked_by != MT_getpid();
3165 5064109 : int i = b->batCacheid;
3166 5064109 : int refs = incref(i, true, lock);
3167 5071137 : if (refs == 1) {
3168 4851074 : MT_lock_set(&b->theaplock);
3169 4843519 : BATsettrivprop(b);
3170 4841581 : MT_lock_unset(&b->theaplock);
3171 : }
3172 5063998 : if (ATOMIC_GET(&GDKdebug) & CHECKMASK)
3173 5022496 : BATassertProps(b);
3174 5069854 : if (BATsetaccess(b, BAT_READ) == NULL)
3175 : return; /* already decreffed */
3176 :
3177 3861383 : refs = decref(i, false, lock, __func__);
3178 3858755 : (void) refs;
3179 3858755 : assert(refs >= 0);
3180 : }
3181 :
3182 : BAT *
3183 76480630 : BATdescriptor(bat i)
3184 : {
3185 76480630 : BAT *b = NULL;
3186 :
3187 76480630 : if (BBPcheck(i)) {
3188 76425977 : bool lock = locked_by == 0 || locked_by != MT_getpid();
3189 : if (lock) {
3190 76425981 : for (;;) {
3191 76425979 : MT_lock_set(&GDKswapLock(i));
3192 76334688 : if (!(BBP_status(i) & (BBPUNSTABLE|BBPLOADING)))
3193 : break;
3194 : /* the BATs is "unstable", try again */
3195 2 : MT_lock_unset(&GDKswapLock(i));
3196 2 : BBPspin(i, __func__, BBPUNSTABLE|BBPLOADING);
3197 : }
3198 : }
3199 76334686 : if (incref(i, false, false) > 0) {
3200 76479572 : if ((BBP_status(i) & BBPLOADED) == 0) {
3201 16129 : b = getBBPdescriptor(i);
3202 16129 : if (b == NULL) {
3203 : /* if loading failed, we need to
3204 : * compensate for the incref */
3205 0 : decref(i, false, false, __func__);
3206 : }
3207 : } else {
3208 76463443 : b = BBP_desc(i);
3209 : }
3210 : }
3211 76479572 : if (lock)
3212 76481622 : MT_lock_unset(&GDKswapLock(i));
3213 : }
3214 76448617 : return b;
3215 : }
3216 :
3217 : /*
3218 : * BBPdescriptor checks whether BAT needs loading and does so if
3219 : * necessary. You must have at least one fix on the BAT before calling
3220 : * this.
3221 : */
3222 : static BAT *
3223 16129 : getBBPdescriptor(bat i)
3224 : {
3225 16129 : bool load = false;
3226 16129 : BAT *b = NULL;
3227 :
3228 16129 : assert(i > 0);
3229 16129 : if (!BBPcheck(i)) {
3230 0 : GDKerror("BBPcheck failed for bat id %d\n", i);
3231 0 : return NULL;
3232 : }
3233 16129 : assert(BBP_refs(i));
3234 16129 : unsigned status = BBP_status(i);
3235 16129 : b = BBP_desc(i);
3236 16129 : if ((status & BBPLOADED) == 0 || status & BBPWAITING) {
3237 16129 : while (BBP_status(i) & BBPWAITING) { /* wait for bat to be loaded by other thread */
3238 0 : MT_lock_unset(&GDKswapLock(i));
3239 0 : BBPspin(i, __func__, BBPWAITING);
3240 16129 : MT_lock_set(&GDKswapLock(i));
3241 : }
3242 16129 : if (BBPvalid(i)) {
3243 16129 : if ((BBP_status(i) & BBPLOADED) == 0) {
3244 16129 : load = true;
3245 16129 : TRC_DEBUG(BAT_, "set to loading BAT %d\n", i);
3246 16129 : BBP_status_on(i, BBPLOADING);
3247 : }
3248 : }
3249 : }
3250 16129 : if (load) {
3251 16129 : TRC_DEBUG(IO_, "load %s\n", BBP_logical(i));
3252 :
3253 16129 : b = BATload_intern(i, false);
3254 :
3255 16129 : BBP_status_off(i, BBPLOADING);
3256 16129 : CHECKDEBUG if (b != NULL)
3257 12987 : BATassertProps(b);
3258 : }
3259 : return b;
3260 : }
3261 :
3262 : /*
3263 : * In BBPsave executes unlocked; it just marks the BBP_status of the
3264 : * BAT to BBPsaving, so others that want to save or unload this BAT
3265 : * must spin lock on the BBP_status field.
3266 : */
3267 : gdk_return
3268 19360 : BBPsave(BAT *b)
3269 : {
3270 19360 : bool lock = locked_by == 0 || locked_by != MT_getpid();
3271 19360 : bat bid = b->batCacheid;
3272 19360 : gdk_return ret = GDK_SUCCEED;
3273 :
3274 19360 : MT_lock_set(&b->theaplock);
3275 19360 : if (BBP_lrefs(bid) == 0 || isVIEW(b) || !BATdirty(b)) {
3276 : /* do nothing */
3277 10678 : MT_lock_unset(&b->theaplock);
3278 10678 : MT_rwlock_rdlock(&b->thashlock);
3279 10678 : if (b->thash && b->thash != (Hash *) 1 &&
3280 224 : (b->thash->heaplink.dirty || b->thash->heapbckt.dirty))
3281 124 : BAThashsave(b, (BBP_status(bid) & BBPPERSISTENT) != 0);
3282 10678 : MT_rwlock_rdunlock(&b->thashlock);
3283 10678 : return GDK_SUCCEED;
3284 : }
3285 8682 : MT_lock_unset(&b->theaplock);
3286 8682 : if (lock)
3287 8682 : MT_lock_set(&GDKswapLock(bid));
3288 :
3289 8682 : if (BBP_status(bid) & BBPSAVING) {
3290 : /* wait until save in other thread completes */
3291 0 : if (lock)
3292 0 : MT_lock_unset(&GDKswapLock(bid));
3293 0 : BBPspin(bid, __func__, BBPSAVING);
3294 : } else {
3295 : /* save it */
3296 8682 : unsigned flags = BBPSAVING;
3297 :
3298 8682 : MT_lock_set(&b->theaplock);
3299 8682 : if (DELTAdirty(b)) {
3300 441 : flags |= BBPSWAPPED;
3301 : }
3302 8682 : if (b->batTransient) {
3303 8677 : flags |= BBPTMP;
3304 : }
3305 8682 : MT_lock_unset(&b->theaplock);
3306 8682 : BBP_status_on(bid, flags);
3307 8682 : if (lock)
3308 8682 : MT_lock_unset(&GDKswapLock(bid));
3309 :
3310 8682 : TRC_DEBUG(IO_, "save " ALGOBATFMT "\n", ALGOBATPAR(b));
3311 :
3312 : /* do the time-consuming work unlocked */
3313 8682 : if (BBP_status(bid) & BBPEXISTING && b->batInserted > 0)
3314 2 : ret = BBPbackup(b, false);
3315 2 : if (ret == GDK_SUCCEED) {
3316 8682 : ret = BATsave(b);
3317 : }
3318 : /* clearing bits can be done without the lock */
3319 8682 : BBP_status_off(bid, BBPSAVING);
3320 : }
3321 : return ret;
3322 : }
3323 :
3324 : /*
3325 : * TODO merge BBPfree with BATfree? Its function is to prepare a BAT
3326 : * for being unloaded (or even destroyed, if the BAT is not
3327 : * persistent).
3328 : */
3329 : static void
3330 17786652 : BBPdestroy(BAT *b)
3331 : {
3332 17786652 : bat tp = VIEWtparent(b);
3333 17786652 : bat vtp = VIEWvtparent(b);
3334 :
3335 17786652 : if (b->theap) {
3336 17786915 : HEAPdecref(b->theap, tp == 0);
3337 17793705 : b->theap = NULL;
3338 17793705 : if (tp != 0)
3339 9135345 : BBPrelease(tp);
3340 : }
3341 17792862 : if (b->tvheap) {
3342 2726201 : HEAPdecref(b->tvheap, vtp == 0);
3343 2726258 : b->tvheap = NULL;
3344 2726258 : if (vtp != 0)
3345 2030261 : BBPrelease(vtp);
3346 : }
3347 17792857 : if (b->oldtail) {
3348 2 : ATOMIC_AND(&b->oldtail->refs, ~DELAYEDREMOVE);
3349 2 : HEAPdecref(b->oldtail, true);
3350 2 : b->oldtail = NULL;
3351 : }
3352 17792857 : BATdelete(b);
3353 :
3354 17793178 : BBPclear(b->batCacheid); /* if destroyed; de-register from BBP */
3355 17792427 : }
3356 :
3357 : static gdk_return
3358 19360 : BBPfree(BAT *b)
3359 : {
3360 19360 : bat bid = b->batCacheid;
3361 19360 : gdk_return ret;
3362 :
3363 19360 : assert(bid > 0);
3364 19360 : assert(BBPswappable(b));
3365 19360 : assert(!isVIEW(b));
3366 :
3367 19360 : BBP_unload_inc();
3368 : /* write dirty BATs before unloading */
3369 19360 : ret = BBPsave(b);
3370 19360 : if (ret == GDK_SUCCEED) {
3371 19360 : if (BBP_status(bid) & BBPLOADED)
3372 19360 : BATfree(b); /* free memory */
3373 19360 : BBPuncacheit(bid, false);
3374 : }
3375 19360 : TRC_DEBUG(BAT_, "turn off unloading %d\n", bid);
3376 19360 : BBP_status_off(bid, BBPUNLOADING);
3377 19360 : BBP_unload_dec();
3378 19360 : return ret;
3379 : }
3380 :
3381 : /*
3382 : * BBPquickdesc loads a BAT descriptor without loading the entire BAT,
3383 : * of which the result be used only for a *limited* number of
3384 : * purposes. Specifically, during the global sync/commit, we do not
3385 : * want to load any BATs that are not already loaded, both because
3386 : * this costs performance, and because getting into memory shortage
3387 : * during a commit is extremely dangerous. Loading a BAT tends not to
3388 : * be required, since the commit actions mostly involve moving some
3389 : * pointers in the BAT descriptor.
3390 : */
3391 : BAT *
3392 1241016 : BBPquickdesc(bat bid)
3393 : {
3394 1241016 : BAT *b;
3395 :
3396 1241016 : if (!BBPcheck(bid)) {
3397 163 : if (!is_bat_nil(bid)) {
3398 0 : GDKerror("called with invalid batid.\n");
3399 0 : assert(0);
3400 : }
3401 : return NULL;
3402 : }
3403 1240664 : BBPspin(bid, __func__, BBPWAITING);
3404 1240469 : b = BBP_desc(bid);
3405 1240469 : if (b->ttype < 0) {
3406 129 : const char *aname = ATOMunknown_name(b->ttype);
3407 129 : int tt = ATOMindex(aname);
3408 129 : if (tt < 0) {
3409 0 : GDKwarning("atom '%s' unknown in bat '%s'.\n",
3410 : aname, BBP_physical(bid));
3411 : } else {
3412 129 : b->ttype = tt;
3413 : }
3414 : }
3415 : return b;
3416 : }
3417 :
3418 : /*
3419 : * @+ Global Commit
3420 : */
3421 : static BAT *
3422 1986614 : dirty_bat(bat *i, bool subcommit)
3423 : {
3424 1986614 : if (BBPvalid(*i)) {
3425 1978089 : BAT *b;
3426 1978089 : BBPspin(*i, __func__, BBPSAVING);
3427 1978089 : if (BBP_status(*i) & BBPLOADED) {
3428 1868679 : b = BBP_desc(*i);
3429 1868679 : MT_lock_set(&b->theaplock);
3430 1990773 : if ((BBP_status(*i) & BBPNEW) &&
3431 122094 : BATcheckmodes(b, false) != GDK_SUCCEED) /* check mmap modes */
3432 0 : *i = -*i; /* error */
3433 1868679 : else if ((BBP_status(*i) & BBPPERSISTENT) &&
3434 0 : (subcommit || BATdirty(b))) {
3435 1688265 : MT_lock_unset(&b->theaplock);
3436 1688265 : return b; /* the bat is loaded, persistent and dirty */
3437 : }
3438 180414 : MT_lock_unset(&b->theaplock);
3439 109410 : } else if (subcommit)
3440 106876 : return BBP_desc(*i);
3441 : }
3442 : return NULL;
3443 : }
3444 :
3445 : /*
3446 : * @- backup-bat
3447 : * Backup-bat moves all files of a BAT to a backup directory. Only
3448 : * after this succeeds, it may be saved. If some failure occurs
3449 : * halfway saving, we can thus always roll back.
3450 : */
3451 : static gdk_return
3452 222818 : file_move(int farmid, const char *srcdir, const char *dstdir, const char *name, const char *ext)
3453 : {
3454 222818 : if (GDKmove(farmid, srcdir, name, ext, dstdir, name, ext, false) == GDK_SUCCEED) {
3455 : return GDK_SUCCEED;
3456 : } else {
3457 0 : char *path;
3458 0 : struct stat st;
3459 :
3460 0 : path = GDKfilepath(farmid, srcdir, name, ext);
3461 0 : if (path == NULL)
3462 0 : return GDK_FAIL;
3463 0 : if (MT_stat(path, &st)) {
3464 : /* source file does not exist; the best
3465 : * recovery is to give an error but continue
3466 : * by considering the BAT as not saved; making
3467 : * sure that this time it does get saved.
3468 : */
3469 0 : GDKsyserror("file_move: cannot stat %s\n", path);
3470 0 : GDKfree(path);
3471 0 : return GDK_FAIL; /* fishy, but not fatal */
3472 : }
3473 0 : GDKfree(path);
3474 : }
3475 0 : return GDK_FAIL;
3476 : }
3477 :
3478 : /* returns true if the file exists */
3479 : static bool
3480 3176228 : file_exists(int farmid, const char *dir, const char *name, const char *ext)
3481 : {
3482 3176228 : char *path;
3483 3176228 : struct stat st;
3484 3176228 : int ret = -1;
3485 :
3486 3176228 : path = GDKfilepath(farmid, dir, name, ext);
3487 3176228 : if (path) {
3488 3176228 : ret = MT_stat(path, &st);
3489 3176228 : TRC_DEBUG(IO_, "stat(%s) = %d\n", path, ret);
3490 3176228 : GDKfree(path);
3491 : }
3492 3176228 : return (ret == 0);
3493 : }
3494 :
3495 : static gdk_return
3496 222818 : heap_move(Heap *hp, const char *srcdir, const char *dstdir, const char *nme, const char *ext)
3497 : {
3498 : /* see doc at BATsetaccess()/gdk_bat.c for an expose on mmap
3499 : * heap modes */
3500 222818 : if (file_exists(hp->farmid, dstdir, nme, ext)) {
3501 : /* dont overwrite heap with the committed state
3502 : * already in dstdir */
3503 : return GDK_SUCCEED;
3504 222818 : } else if (hp->newstorage == STORE_PRIV &&
3505 0 : !file_exists(hp->farmid, srcdir, nme, ext)) {
3506 :
3507 : /* In order to prevent half-saved X.new files
3508 : * surviving a recover we create a dummy file in the
3509 : * BACKUP(dstdir) whose presence will trigger
3510 : * BBPrecover to remove them. Thus, X will prevail
3511 : * where it otherwise wouldn't have. If X already has
3512 : * a saved X.new, that one is backed up as normal.
3513 : */
3514 :
3515 0 : FILE *fp;
3516 0 : long_str kill_ext;
3517 0 : char *path;
3518 :
3519 0 : strconcat_len(kill_ext, sizeof(kill_ext), ext, ".kill", NULL);
3520 0 : path = GDKfilepath(hp->farmid, dstdir, nme, kill_ext);
3521 0 : if (path == NULL)
3522 : return GDK_FAIL;
3523 0 : fp = MT_fopen(path, "w");
3524 0 : if (fp == NULL)
3525 0 : GDKsyserror("heap_move: cannot open file %s\n", path);
3526 0 : TRC_DEBUG(IO_, "open %s = %d\n", path, fp ? 0 : -1);
3527 0 : GDKfree(path);
3528 :
3529 0 : if (fp != NULL) {
3530 0 : fclose(fp);
3531 0 : return GDK_SUCCEED;
3532 : } else {
3533 : return GDK_FAIL;
3534 : }
3535 : }
3536 222818 : return file_move(hp->farmid, srcdir, dstdir, nme, ext);
3537 : }
3538 :
3539 : /*
3540 : * @- BBPprepare
3541 : *
3542 : * this routine makes sure there is a BAKDIR/, and initiates one if
3543 : * not. For subcommits, it does the same with SUBDIR.
3544 : *
3545 : * It is now locked, to get proper file counters, and also to prevent
3546 : * concurrent BBPrecovers, etc.
3547 : *
3548 : * backup_dir == 0 => no backup BBP.dir
3549 : * backup_dir == 1 => BBP.dir saved in BACKUP/
3550 : * backup_dir == 2 => BBP.dir saved in SUBCOMMIT/
3551 : */
3552 :
3553 : static gdk_return
3554 26088 : BBPprepare(bool subcommit)
3555 : {
3556 26088 : bool start_subcommit;
3557 26088 : int set = 1 + subcommit;
3558 26088 : gdk_return ret = GDK_SUCCEED;
3559 :
3560 26088 : start_subcommit = (subcommit && backup_subdir == 0);
3561 12879 : if (start_subcommit) {
3562 : /* starting a subcommit. Make sure SUBDIR and DELDIR
3563 : * are clean */
3564 12879 : ret = BBPrecover_subdir();
3565 12879 : if (ret != GDK_SUCCEED)
3566 : return ret;
3567 : }
3568 26088 : if (backup_files == 0) {
3569 322 : backup_dir = 0;
3570 322 : ret = BBPrecover(0);
3571 322 : if (ret != GDK_SUCCEED)
3572 : return ret;
3573 322 : str bakdirpath = GDKfilepath(0, NULL, BAKDIR, NULL);
3574 322 : if (bakdirpath == NULL) {
3575 : return GDK_FAIL;
3576 : }
3577 :
3578 322 : if (MT_mkdir(bakdirpath) < 0 && errno != EEXIST) {
3579 0 : GDKsyserror("cannot create directory %s\n", bakdirpath);
3580 0 : GDKfree(bakdirpath);
3581 0 : return GDK_FAIL;
3582 : }
3583 : /* if BAKDIR already exists, don't signal error */
3584 322 : TRC_DEBUG(IO_, "mkdir %s = %d\n", bakdirpath, (int) ret);
3585 322 : GDKfree(bakdirpath);
3586 : }
3587 26088 : if (start_subcommit) {
3588 : /* make a new SUBDIR (subdir of BAKDIR) */
3589 12879 : str subdirpath = GDKfilepath(0, NULL, SUBDIR, NULL);
3590 12879 : if (subdirpath == NULL) {
3591 : return GDK_FAIL;
3592 : }
3593 :
3594 12879 : if (MT_mkdir(subdirpath) < 0) {
3595 0 : GDKsyserror("cannot create directory %s\n", subdirpath);
3596 0 : GDKfree(subdirpath);
3597 0 : return GDK_FAIL;
3598 : }
3599 12879 : TRC_DEBUG(IO_, "mkdir %s\n", subdirpath);
3600 12879 : GDKfree(subdirpath);
3601 : }
3602 26088 : if (backup_dir != set) {
3603 : /* a valid backup dir *must* at least contain BBP.dir */
3604 52482 : if ((ret = GDKmove(0, backup_dir ? BAKDIR : BATDIR, "BBP", "dir", subcommit ? SUBDIR : BAKDIR, "BBP", "dir", true)) != GDK_SUCCEED)
3605 : return ret;
3606 26080 : backup_dir = set;
3607 : }
3608 : /* increase counters */
3609 26088 : backup_subdir += subcommit;
3610 26088 : backup_files++;
3611 :
3612 26088 : return ret;
3613 : }
3614 :
3615 : static gdk_return
3616 1263921 : do_backup(Heap *h, bool dirty, bool subcommit)
3617 : {
3618 1263921 : gdk_return ret = GDK_SUCCEED;
3619 1263921 : char extnew[16];
3620 :
3621 1263921 : if (h->wasempty) {
3622 : return GDK_SUCCEED;
3623 : }
3624 :
3625 : /* direct mmap is unprotected (readonly usage, or has WAL
3626 : * protection) */
3627 1263921 : if (h->storage != STORE_MMAP) {
3628 : /* STORE_PRIV saves into X.new files. Two cases could
3629 : * happen. The first is when a valid X.new exists
3630 : * because of an access change or a previous
3631 : * commit. This X.new should be backed up as
3632 : * usual. The second case is when X.new doesn't
3633 : * exist. In that case we could have half written
3634 : * X.new files (after a crash). To protect against
3635 : * these we write X.new.kill files in the backup
3636 : * directory (see heap_move). */
3637 1253887 : gdk_return mvret = GDK_SUCCEED;
3638 :
3639 1253887 : char *srcdir = GDKfilepath(NOFARM, BATDIR, h->filename, NULL);
3640 1253887 : if (srcdir == NULL)
3641 : return GDK_FAIL;
3642 1253887 : char *nme = strrchr(srcdir, DIR_SEP);
3643 1253887 : assert(nme != NULL);
3644 1253887 : *nme++ = '\0';
3645 1253887 : char *ext = strchr(nme, '.');
3646 1253887 : assert(ext != NULL);
3647 1253887 : *ext++ = '\0';
3648 :
3649 1253887 : strconcat_len(extnew, sizeof(extnew), ext, ".new", NULL);
3650 1476705 : if (dirty &&
3651 445636 : !file_exists(h->farmid, BAKDIR, nme, extnew) &&
3652 222818 : !file_exists(h->farmid, BAKDIR, nme, ext)) {
3653 : /* if the heap is dirty and there is no heap
3654 : * file (with or without .new extension) in
3655 : * the BAKDIR, move the heap (preferably with
3656 : * .new extension) to the correct backup
3657 : * directory */
3658 222818 : if (file_exists(h->farmid, srcdir, nme, extnew)) {
3659 0 : mvret = heap_move(h, srcdir,
3660 : subcommit ? SUBDIR : BAKDIR,
3661 : nme, extnew);
3662 222818 : } else if (file_exists(h->farmid, srcdir, nme, ext)) {
3663 222820 : mvret = heap_move(h, srcdir,
3664 : subcommit ? SUBDIR : BAKDIR,
3665 : nme, ext);
3666 222818 : if (mvret == GDK_SUCCEED) {
3667 : /* file no longer in "standard"
3668 : * location */
3669 222818 : h->hasfile = false;
3670 : }
3671 : }
3672 1031069 : } else if (subcommit) {
3673 : /* if subcommit, we may need to move an
3674 : * already made backup from BAKDIR to
3675 : * SUBDIR */
3676 1031069 : if (file_exists(h->farmid, BAKDIR, nme, extnew))
3677 0 : mvret = file_move(h->farmid, BAKDIR, SUBDIR, nme, extnew);
3678 1031069 : else if (file_exists(h->farmid, BAKDIR, nme, ext))
3679 0 : mvret = file_move(h->farmid, BAKDIR, SUBDIR, nme, ext);
3680 : }
3681 : /* there is a situation where the move may fail,
3682 : * namely if this heap was not supposed to be existing
3683 : * before, i.e. after a BATmaterialize on a persistent
3684 : * bat; as a workaround, do not complain about move
3685 : * failure if the source file is nonexistent
3686 : */
3687 222818 : if (mvret != GDK_SUCCEED && file_exists(h->farmid, srcdir, nme, ext)) {
3688 1253887 : ret = GDK_FAIL;
3689 : }
3690 1253887 : if (subcommit &&
3691 1253885 : (h->storage == STORE_PRIV || h->newstorage == STORE_PRIV)) {
3692 0 : long_str kill_ext;
3693 :
3694 0 : strconcat_len(kill_ext, sizeof(kill_ext),
3695 : ext, ".new.kill", NULL);
3696 0 : if (file_exists(h->farmid, BAKDIR, nme, kill_ext) &&
3697 0 : file_move(h->farmid, BAKDIR, SUBDIR, nme, kill_ext) != GDK_SUCCEED) {
3698 0 : ret = GDK_FAIL;
3699 : }
3700 : }
3701 1253887 : GDKfree(srcdir);
3702 : }
3703 : return ret;
3704 : }
3705 :
3706 : static gdk_return
3707 998496 : BBPbackup(BAT *b, bool subcommit)
3708 : {
3709 998496 : gdk_return rc = GDK_SUCCEED;
3710 :
3711 998496 : MT_lock_set(&b->theaplock);
3712 998496 : BATiter bi = bat_iterator_nolock(b);
3713 998496 : if (!bi.copiedtodisk || bi.transient) {
3714 1 : MT_lock_unset(&b->theaplock);
3715 1 : return GDK_SUCCEED;
3716 : }
3717 998495 : assert(b->theap->parentid == b->batCacheid);
3718 998495 : if (b->oldtail && b->oldtail != (Heap *) 1) {
3719 1710 : bi.h = b->oldtail;
3720 1710 : bi.hdirty = b->oldtail->dirty;
3721 : }
3722 998495 : bat_iterator_incref(&bi);
3723 998495 : MT_lock_unset(&b->theaplock);
3724 :
3725 : /* determine location dir and physical suffix */
3726 998495 : if (bi.type != TYPE_void) {
3727 998495 : rc = do_backup(bi.h, bi.hdirty, subcommit);
3728 998495 : if (rc == GDK_SUCCEED && bi.vh != NULL)
3729 265426 : rc = do_backup(bi.vh, bi.vhdirty, subcommit);
3730 : }
3731 998495 : bat_iterator_end(&bi);
3732 998495 : return rc;
3733 : }
3734 :
3735 : static inline void
3736 0 : BBPcheckHeap(Heap *h)
3737 : {
3738 0 : struct stat statb;
3739 0 : char *path;
3740 :
3741 0 : char *s = strrchr(h->filename, DIR_SEP);
3742 0 : if (s)
3743 0 : s++;
3744 : else
3745 : s = h->filename;
3746 0 : path = GDKfilepath(0, BAKDIR, s, NULL);
3747 0 : if (path == NULL)
3748 0 : return;
3749 0 : if (MT_stat(path, &statb) < 0) {
3750 0 : GDKfree(path);
3751 0 : path = GDKfilepath(0, BATDIR, h->filename, NULL);
3752 0 : if (path == NULL)
3753 : return;
3754 0 : if (MT_stat(path, &statb) < 0) {
3755 0 : GDKsyserror("cannot stat file %s (expected size %zu)\n",
3756 : path, h->free);
3757 0 : assert(0);
3758 : GDKfree(path);
3759 : return;
3760 : }
3761 : }
3762 0 : assert((statb.st_mode & S_IFMT) == S_IFREG);
3763 0 : assert((size_t) statb.st_size >= h->free);
3764 0 : if ((size_t) statb.st_size < h->free) {
3765 : GDKerror("file %s too small (expected %zu, actual %zu)\n", path, h->free, (size_t) statb.st_size);
3766 : GDKfree(path);
3767 : return;
3768 : }
3769 0 : GDKfree(path);
3770 : }
3771 :
3772 : static void
3773 0 : BBPcheckBBPdir(void)
3774 : {
3775 0 : FILE *fp;
3776 0 : int lineno = 0;
3777 0 : bat bbpsize = 0;
3778 0 : unsigned bbpversion;
3779 0 : lng logno;
3780 :
3781 0 : fp = GDKfileopen(0, BAKDIR, "BBP", "dir", "r");
3782 0 : assert(fp != NULL);
3783 0 : if (fp == NULL) {
3784 : fp = GDKfileopen(0, BATDIR, "BBP", "dir", "r");
3785 : assert(fp != NULL);
3786 : if (fp == NULL)
3787 : return;
3788 : }
3789 0 : bbpversion = BBPheader(fp, &lineno, &bbpsize, &logno, false);
3790 0 : if (bbpversion == 0) {
3791 0 : fclose(fp);
3792 0 : return; /* error reading file */
3793 : }
3794 0 : assert(bbpversion == GDKLIBRARY);
3795 :
3796 0 : for (;;) {
3797 0 : BAT b;
3798 0 : Heap h;
3799 0 : Heap vh;
3800 0 : vh = h = (Heap) {
3801 : .free = 0,
3802 : };
3803 0 : b = (BAT) {
3804 : .theap = &h,
3805 : .tvheap = &vh,
3806 : };
3807 0 : char filename[sizeof(BBP_physical(0))];
3808 0 : char batname[129];
3809 : #ifdef GDKLIBRARY_HASHASH
3810 0 : int hashash;
3811 : #endif
3812 :
3813 0 : switch (BBPreadBBPline(fp, bbpversion, &lineno, &b,
3814 : #ifdef GDKLIBRARY_HASHASH
3815 : &hashash,
3816 : #endif
3817 : batname, filename, NULL)) {
3818 0 : case 0:
3819 : /* end of file */
3820 0 : fclose(fp);
3821 : /* don't leak errors, this is just debug code */
3822 0 : GDKclrerr();
3823 0 : return;
3824 : case 1:
3825 : /* successfully read an entry */
3826 0 : break;
3827 0 : default:
3828 : /* error */
3829 0 : fclose(fp);
3830 0 : return;
3831 : }
3832 : #ifdef GDKLIBRARY_HASHASH
3833 0 : assert(hashash == 0);
3834 : #endif
3835 0 : assert(b.batCacheid < (bat) ATOMIC_GET(&BBPsize));
3836 0 : assert(b.hseqbase <= GDK_oid_max);
3837 0 : if (b.ttype == TYPE_void) {
3838 : /* no files needed */
3839 0 : continue;
3840 : }
3841 0 : if (b.theap->free > 0)
3842 0 : BBPcheckHeap(b.theap);
3843 0 : if (b.tvheap != NULL && b.tvheap->free > 0)
3844 0 : BBPcheckHeap(b.tvheap);
3845 : }
3846 : }
3847 :
3848 : /*
3849 : * @+ Atomic Write
3850 : * The atomic BBPsync() function first safeguards the old images of
3851 : * all files to be written in BAKDIR. It then saves all files. If that
3852 : * succeeds fully, BAKDIR is renamed to DELDIR. The rename is
3853 : * considered an atomic action. If it succeeds, the DELDIR is removed.
3854 : * If something fails, the pre-sync status can be obtained by moving
3855 : * back all backed up files; this is done by BBPrecover().
3856 : *
3857 : * The BBP.dir is also moved into the BAKDIR.
3858 : */
3859 : gdk_return
3860 12887 : BBPsync(int cnt, bat *restrict subcommit, BUN *restrict sizes, lng logno)
3861 : {
3862 12887 : gdk_return ret = GDK_SUCCEED;
3863 12887 : lng t0 = 0, t1 = 0;
3864 12887 : str bakdir, deldir;
3865 12887 : const bool lock = locked_by == 0 || locked_by != MT_getpid();
3866 12887 : char buf[3000];
3867 12887 : int n = subcommit ? 0 : -1;
3868 8 : FILE *obbpf, *nbbpf;
3869 :
3870 12887 : if ((bakdir = GDKfilepath(0, NULL, subcommit ? SUBDIR : BAKDIR, NULL)) == NULL)
3871 : return GDK_FAIL;
3872 12887 : if ((deldir = GDKfilepath(0, NULL, DELDIR, NULL)) == NULL) {
3873 0 : GDKfree(bakdir);
3874 0 : return GDK_FAIL;
3875 : }
3876 :
3877 12887 : TRC_DEBUG_IF(PERF) t0 = t1 = GDKusec();
3878 :
3879 12887 : if ((ATOMIC_GET(&GDKdebug) & TAILCHKMASK) && !GDKinmemory(0))
3880 0 : BBPcheckBBPdir();
3881 :
3882 12887 : ret = BBPprepare(subcommit != NULL);
3883 :
3884 12887 : if (ret == GDK_SUCCEED) {
3885 12887 : ret = BBPdir_first(subcommit != NULL, logno, &obbpf, &nbbpf);
3886 : }
3887 :
3888 1999501 : for (int idx = 1; ret == GDK_SUCCEED && idx < cnt; idx++) {
3889 1986614 : bat i = subcommit ? subcommit[idx] : idx;
3890 1986614 : BUN size = sizes ? sizes[idx] : BUN_NONE;
3891 1986614 : BATiter bi, *bip;
3892 :
3893 1986614 : const bat bid = i;
3894 1986614 : if (lock)
3895 1975555 : MT_lock_set(&GDKswapLock(bid));
3896 : /* set flag that we're syncing, i.e. that we'll
3897 : * be between moving heap to backup dir and
3898 : * saving the new version, in other words, the
3899 : * heap may not exist in the usual location */
3900 1986614 : BBP_status_on(bid, BBPSYNCING);
3901 : /* wait until unloading is finished before
3902 : * attempting to make a backup */
3903 1986614 : while (BBP_status(bid) & BBPUNLOADING) {
3904 0 : if (lock)
3905 0 : MT_lock_unset(&GDKswapLock(bid));
3906 0 : BBPspin(bid, __func__, BBPUNLOADING);
3907 0 : if (lock)
3908 1986614 : MT_lock_set(&GDKswapLock(bid));
3909 : }
3910 1986614 : BAT *b = BBP_desc(bid);
3911 1986614 : if (subcommit && b->ttype != TYPE_void) {
3912 : /* move any tail/theap files we find for this bat that
3913 : * are in the BACKUP directory to the SUBCOMMIT
3914 : * directory */
3915 1975555 : assert(b->ttype > 0); /* no unknown types allowed */
3916 1975555 : char fname[16]; /* plenty big enough */
3917 1975555 : if (snprintf(fname, sizeof(fname), "%o", (unsigned) bid) < 16) {
3918 : /* the snprintf never fails, any of the
3919 : * below may fail */
3920 1975555 : uint8_t stpe = ATOMstorage(b->ttype);
3921 3536344 : if ((b->ttype != TYPE_str || b->twidth >= 8) &&
3922 1560789 : GDKmove(0, BAKDIR, fname, "tail", SUBDIR, fname, "tail", false) == GDK_SUCCEED)
3923 2 : TRC_DEBUG(IO_, "moved %s.tail from %s to %s\n",
3924 : fname, BAKDIR, SUBDIR);
3925 2390638 : if (stpe == TYPE_str &&
3926 415083 : GDKmove(0, BAKDIR, fname, "tail1", SUBDIR, fname, "tail1", false) == GDK_SUCCEED)
3927 0 : TRC_DEBUG(IO_, "moved %s.tail1 from %s to %s\n",
3928 : fname, BAKDIR, SUBDIR);
3929 525385 : if (stpe == TYPE_str && b->twidth >= 2 &&
3930 110302 : GDKmove(0, BAKDIR, fname, "tail2", SUBDIR, fname, "tail2", false) == GDK_SUCCEED)
3931 0 : TRC_DEBUG(IO_, "moved %s.tail2 from %s to %s\n",
3932 : fname, BAKDIR, SUBDIR);
3933 : #if SIZEOF_VAR_T == 8
3934 432791 : if (stpe == TYPE_str && b->twidth >= 4 &&
3935 17708 : GDKmove(0, BAKDIR, fname, "tail4", SUBDIR, fname, "tail4", false) == GDK_SUCCEED)
3936 0 : TRC_DEBUG(IO_, "moved %s.tail4 from %s to %s\n",
3937 : fname, BAKDIR, SUBDIR);
3938 : #endif
3939 2391501 : if (ATOMvarsized(b->ttype) &&
3940 415946 : GDKmove(0, BAKDIR, fname, "theap", SUBDIR, fname, "theap", false) == GDK_SUCCEED)
3941 1975555 : TRC_DEBUG(IO_, "moved %s.theap from %s to %s\n",
3942 : fname, BAKDIR, SUBDIR);
3943 : }
3944 : }
3945 1986614 : b = dirty_bat(&i, subcommit != NULL);
3946 1986614 : if (i <= 0)
3947 : ret = GDK_FAIL;
3948 1986614 : else if (BBP_status(bid) & BBPEXISTING &&
3949 1667772 : b != NULL &&
3950 1667772 : b->batInserted > 0)
3951 998494 : ret = BBPbackup(b, subcommit != NULL);
3952 :
3953 1986614 : if (lock)
3954 1975555 : MT_lock_unset(&GDKswapLock(bid));
3955 :
3956 1986614 : if (ret != GDK_SUCCEED)
3957 : break;
3958 :
3959 1986614 : if (BBP_status(i) & BBPPERSISTENT) {
3960 1792878 : MT_lock_set(&BBP_desc(i)->theaplock);
3961 1792878 : bi = bat_iterator_nolock(BBP_desc(i));
3962 1792878 : bat_iterator_incref(&bi);
3963 1792878 : assert(sizes == NULL || size <= bi.count);
3964 1789380 : assert(sizes == NULL || bi.width == 0 || (bi.type == TYPE_msk ? ((size + 31) / 32) * 4 : size << bi.shift) <= bi.hfree);
3965 1792878 : if (size > bi.count) /* includes sizes==NULL */
3966 : size = bi.count;
3967 1792878 : bi.b->batInserted = size;
3968 1792878 : if (bi.b->ttype >= 0 && ATOMvarsized(bi.b->ttype)) {
3969 : /* see epilogue() for other part of this */
3970 : /* remember the tail we're saving */
3971 412632 : if (BATsetprop_nolock(bi.b, (enum prop_t) 20, TYPE_ptr, &bi.h) == NULL) {
3972 0 : GDKerror("setprop failed\n");
3973 0 : ret = GDK_FAIL;
3974 : } else {
3975 412632 : if (bi.b->oldtail == NULL)
3976 410601 : bi.b->oldtail = (Heap *) 1;
3977 412632 : HEAPincref(bi.h);
3978 : }
3979 : }
3980 1792878 : MT_lock_unset(&bi.b->theaplock);
3981 1792878 : if (ret == GDK_SUCCEED && b && size != 0) {
3982 : /* wait for BBPSAVING so that we
3983 : * can set it, wait for
3984 : * BBPUNLOADING before
3985 : * attempting to save */
3986 1088225 : for (;;) {
3987 1088225 : if (lock)
3988 1088225 : MT_lock_set(&GDKswapLock(i));
3989 1088225 : if (!(BBP_status(i) & (BBPSAVING|BBPUNLOADING)))
3990 : break;
3991 0 : if (lock)
3992 0 : MT_lock_unset(&GDKswapLock(i));
3993 0 : BBPspin(i, __func__, BBPSAVING|BBPUNLOADING);
3994 : }
3995 1088225 : BBP_status_on(i, BBPSAVING);
3996 1088225 : if (lock)
3997 1088225 : MT_lock_unset(&GDKswapLock(i));
3998 1088225 : ret = BATsave_iter(b, &bi, size);
3999 1088225 : BBP_status_off(i, BBPSAVING);
4000 : }
4001 : bip = &bi;
4002 : } else {
4003 : bip = NULL;
4004 : }
4005 1986614 : if (ret == GDK_SUCCEED) {
4006 1986614 : n = BBPdir_step(i, size, n, buf, sizeof(buf), &obbpf, nbbpf, bip);
4007 1986614 : if (n < -1)
4008 0 : ret = GDK_FAIL;
4009 : }
4010 1986614 : if (bip)
4011 1792878 : bat_iterator_end(bip);
4012 : /* we once again have a saved heap */
4013 : }
4014 :
4015 12887 : TRC_DEBUG(PERF, "write time "LLFMT" usec\n", (t0 = GDKusec()) - t1);
4016 :
4017 12887 : if (ret == GDK_SUCCEED) {
4018 12887 : ret = BBPdir_last(n, buf, sizeof(buf), obbpf, nbbpf);
4019 : }
4020 :
4021 12887 : TRC_DEBUG(PERF, "dir time "LLFMT" usec, %d bats\n", (t1 = GDKusec()) - t0, (bat) ATOMIC_GET(&BBPsize));
4022 :
4023 12887 : if (ret == GDK_SUCCEED) {
4024 : /* atomic switchover */
4025 : /* this is the big one: this call determines
4026 : * whether the operation of this function
4027 : * succeeded, so no changing of ret after this
4028 : * call anymore */
4029 :
4030 12887 : if (MT_rename(bakdir, deldir) < 0 &&
4031 : /* maybe there was an old deldir, so remove and try again */
4032 0 : (GDKremovedir(0, DELDIR) != GDK_SUCCEED ||
4033 0 : MT_rename(bakdir, deldir) < 0))
4034 0 : ret = GDK_FAIL;
4035 0 : if (ret != GDK_SUCCEED)
4036 0 : GDKsyserror("rename(%s,%s) failed\n", bakdir, deldir);
4037 12887 : TRC_DEBUG(IO_, "rename %s %s = %d\n", bakdir, deldir, (int) ret);
4038 : }
4039 :
4040 : /* AFTERMATH */
4041 12887 : if (ret == GDK_SUCCEED) {
4042 12887 : ATOMIC_SET(&BBPlogno, logno); /* the new value */
4043 12887 : backup_files = subcommit ? (backup_files - backup_subdir) : 0;
4044 12887 : backup_dir = backup_subdir = 0;
4045 12887 : if (GDKremovedir(0, DELDIR) != GDK_SUCCEED)
4046 0 : fprintf(stderr, "#BBPsync: cannot remove directory %s\n", DELDIR);
4047 12887 : (void) BBPprepare(false); /* (try to) remove DELDIR and set up new BAKDIR */
4048 12887 : if (backup_files > 1) {
4049 12879 : TRC_DEBUG(PERF, "backup_files %d > 1\n", backup_files);
4050 12879 : backup_files = 1;
4051 : }
4052 : }
4053 12887 : TRC_DEBUG(PERF, "%s (ready time "LLFMT" usec)\n",
4054 : ret == GDK_SUCCEED ? "" : " failed",
4055 : (t0 = GDKusec()) - t1);
4056 :
4057 12887 : if (ret != GDK_SUCCEED) {
4058 : /* clean up extra refs we created */
4059 0 : for (int idx = 1; idx < cnt; idx++) {
4060 0 : bat i = subcommit ? subcommit[idx] : idx;
4061 0 : BAT *b = BBP_desc(i);
4062 0 : if (ATOMvarsized(b->ttype)) {
4063 0 : MT_lock_set(&b->theaplock);
4064 0 : ValPtr p = BATgetprop_nolock(b, (enum prop_t) 20);
4065 0 : if (p != NULL) {
4066 0 : HEAPdecref(p->val.pval, false);
4067 0 : BATrmprop_nolock(b, (enum prop_t) 20);
4068 : }
4069 0 : MT_lock_unset(&b->theaplock);
4070 : }
4071 : }
4072 : }
4073 :
4074 : /* turn off the BBPSYNCING bits for all bats, even when things
4075 : * didn't go according to plan (i.e., don't check for ret ==
4076 : * GDK_SUCCEED) */
4077 1999501 : for (int idx = 1; idx < cnt; idx++) {
4078 1986614 : bat i = subcommit ? subcommit[idx] : idx;
4079 1986614 : BBP_status_off(i, BBPSYNCING);
4080 : }
4081 :
4082 12887 : GDKfree(bakdir);
4083 12887 : GDKfree(deldir);
4084 12887 : return ret;
4085 : }
4086 :
4087 : /*
4088 : * Recovery just moves all files back to their original location. this
4089 : * is an incremental process: if something fails, just stop with still
4090 : * files left for moving in BACKUP/. The recovery process can resume
4091 : * later with the left over files.
4092 : */
4093 : static gdk_return
4094 0 : force_move(int farmid, const char *srcdir, const char *dstdir, const char *name)
4095 : {
4096 0 : const char *p;
4097 0 : char *dstpath, *killfile;
4098 0 : gdk_return ret = GDK_SUCCEED;
4099 :
4100 0 : if ((p = strrchr(name, '.')) != NULL && strcmp(p, ".kill") == 0) {
4101 : /* Found a X.new.kill file, ie remove the X.new file */
4102 0 : ptrdiff_t len = p - name;
4103 0 : long_str srcpath;
4104 :
4105 0 : strncpy(srcpath, name, len);
4106 0 : srcpath[len] = '\0';
4107 0 : if ((dstpath = GDKfilepath(farmid, dstdir, srcpath, NULL)) == NULL) {
4108 : return GDK_FAIL;
4109 : }
4110 :
4111 : /* step 1: remove the X.new file that is going to be
4112 : * overridden by X */
4113 0 : if (MT_remove(dstpath) != 0 && errno != ENOENT) {
4114 : /* if it exists and cannot be removed, all
4115 : * this is going to fail */
4116 0 : GDKsyserror("force_move: remove(%s)\n", dstpath);
4117 0 : GDKfree(dstpath);
4118 0 : return GDK_FAIL;
4119 : }
4120 0 : GDKfree(dstpath);
4121 :
4122 : /* step 2: now remove the .kill file. This one is
4123 : * crucial, otherwise we'll never finish recovering */
4124 0 : if ((killfile = GDKfilepath(farmid, srcdir, name, NULL)) == NULL) {
4125 : return GDK_FAIL;
4126 : }
4127 0 : if (MT_remove(killfile) != 0) {
4128 0 : ret = GDK_FAIL;
4129 0 : GDKsyserror("force_move: remove(%s)\n", killfile);
4130 : }
4131 0 : GDKfree(killfile);
4132 0 : return ret;
4133 : }
4134 : /* try to rename it */
4135 0 : ret = GDKmove(farmid, srcdir, name, NULL, dstdir, name, NULL, false);
4136 :
4137 0 : if (ret != GDK_SUCCEED) {
4138 0 : char *srcpath;
4139 :
4140 0 : GDKclrerr();
4141 : /* two legal possible causes: file exists or dir
4142 : * doesn't exist */
4143 0 : if ((dstpath = GDKfilepath(farmid, dstdir, name, NULL)) == NULL)
4144 : return GDK_FAIL;
4145 0 : if ((srcpath = GDKfilepath(farmid, srcdir, name, NULL)) == NULL) {
4146 0 : GDKfree(dstpath);
4147 0 : return GDK_FAIL;
4148 : }
4149 0 : if (MT_remove(dstpath) != 0) /* clear destination */
4150 0 : ret = GDK_FAIL;
4151 0 : TRC_DEBUG(IO_, "remove %s = %d\n", dstpath, (int) ret);
4152 :
4153 0 : (void) GDKcreatedir(dstdir); /* if fails, move will fail */
4154 0 : ret = GDKmove(farmid, srcdir, name, NULL, dstdir, name, NULL, true);
4155 0 : TRC_DEBUG(IO_, "link %s %s = %d\n", srcpath, dstpath, (int) ret);
4156 0 : GDKfree(dstpath);
4157 0 : GDKfree(srcpath);
4158 : }
4159 : return ret;
4160 : }
4161 :
4162 : gdk_return
4163 322 : BBPrecover(int farmid)
4164 : {
4165 322 : str bakdirpath;
4166 322 : str leftdirpath;
4167 322 : DIR *dirp;
4168 322 : struct dirent *dent;
4169 322 : long_str path, dstpath;
4170 322 : bat i;
4171 322 : size_t j = strlen(BATDIR);
4172 322 : gdk_return ret = GDK_SUCCEED;
4173 322 : bool dirseen = false;
4174 322 : str dstdir;
4175 :
4176 322 : bakdirpath = GDKfilepath(farmid, NULL, BAKDIR, NULL);
4177 322 : leftdirpath = GDKfilepath(farmid, NULL, LEFTDIR, NULL);
4178 322 : if (bakdirpath == NULL || leftdirpath == NULL) {
4179 0 : GDKfree(bakdirpath);
4180 0 : GDKfree(leftdirpath);
4181 0 : return GDK_FAIL;
4182 : }
4183 322 : dirp = opendir(bakdirpath);
4184 322 : if (dirp == NULL) {
4185 233 : if (errno != ENOENT)
4186 0 : GDKsyserror("cannot open directory %s\n", bakdirpath);
4187 233 : GDKfree(bakdirpath);
4188 233 : GDKfree(leftdirpath);
4189 233 : return GDK_SUCCEED; /* nothing to do */
4190 : }
4191 89 : memcpy(dstpath, BATDIR, j);
4192 89 : dstpath[j] = DIR_SEP;
4193 89 : dstpath[++j] = 0;
4194 89 : dstdir = dstpath + j;
4195 89 : TRC_DEBUG(IO_, "start\n");
4196 :
4197 89 : if (MT_mkdir(leftdirpath) < 0 && errno != EEXIST) {
4198 0 : GDKsyserror("cannot create directory %s\n", leftdirpath);
4199 0 : closedir(dirp);
4200 0 : GDKfree(bakdirpath);
4201 0 : GDKfree(leftdirpath);
4202 0 : return GDK_FAIL;
4203 : }
4204 :
4205 : /* move back all files */
4206 267 : while ((dent = readdir(dirp)) != NULL) {
4207 178 : const char *q = strchr(dent->d_name, '.');
4208 :
4209 178 : if (q == dent->d_name) {
4210 178 : char *fn;
4211 :
4212 178 : if (strcmp(dent->d_name, ".") == 0 ||
4213 89 : strcmp(dent->d_name, "..") == 0)
4214 178 : continue;
4215 0 : fn = GDKfilepath(farmid, BAKDIR, dent->d_name, NULL);
4216 0 : if (fn) {
4217 0 : int uret = MT_remove(fn);
4218 0 : TRC_DEBUG(IO_, "remove %s = %d\n",
4219 : fn, uret);
4220 0 : GDKfree(fn);
4221 : }
4222 0 : continue;
4223 0 : } else if (strcmp(dent->d_name, "BBP.dir") == 0) {
4224 0 : dirseen = true;
4225 0 : continue;
4226 : }
4227 0 : if (q == NULL)
4228 0 : q = dent->d_name + strlen(dent->d_name);
4229 0 : if ((j = q - dent->d_name) + 1 > sizeof(path)) {
4230 : /* name too long: ignore */
4231 0 : continue;
4232 : }
4233 0 : strncpy(path, dent->d_name, j);
4234 0 : path[j] = 0;
4235 0 : if (GDKisdigit(*path)) {
4236 0 : i = strtol(path, NULL, 8);
4237 : } else {
4238 0 : i = BBP_find(path, false);
4239 0 : if (i < 0)
4240 0 : i = -i;
4241 : }
4242 0 : if (i == 0 || i >= (bat) ATOMIC_GET(&BBPsize) || !BBPvalid(i)) {
4243 0 : force_move(farmid, BAKDIR, LEFTDIR, dent->d_name);
4244 : } else {
4245 0 : BBPgetsubdir(dstdir, i);
4246 0 : if (force_move(farmid, BAKDIR, dstpath, dent->d_name) != GDK_SUCCEED) {
4247 : ret = GDK_FAIL;
4248 : break;
4249 : }
4250 : /* don't trust index files after recovery */
4251 0 : GDKunlink(farmid, dstpath, path, "thashl");
4252 0 : GDKunlink(farmid, dstpath, path, "thashb");
4253 0 : GDKunlink(farmid, dstpath, path, "torderidx");
4254 0 : GDKunlink(farmid, dstpath, path, "tstrimps");
4255 : }
4256 : }
4257 89 : closedir(dirp);
4258 89 : if (dirseen && ret == GDK_SUCCEED) { /* we have a saved BBP.dir; it should be moved back!! */
4259 0 : struct stat st;
4260 0 : char *fn;
4261 :
4262 0 : fn = GDKfilepath(farmid, BATDIR, "BBP", "dir");
4263 0 : if (fn == NULL) {
4264 : ret = GDK_FAIL;
4265 : } else {
4266 0 : ret = recover_dir(farmid, MT_stat(fn, &st) == 0);
4267 0 : GDKfree(fn);
4268 : }
4269 : }
4270 :
4271 89 : if (ret == GDK_SUCCEED) {
4272 89 : if (MT_rmdir(bakdirpath) < 0) {
4273 0 : GDKsyserror("cannot remove directory %s\n", bakdirpath);
4274 0 : ret = GDK_FAIL;
4275 : }
4276 89 : TRC_DEBUG(IO_, "rmdir %s = %d\n", bakdirpath, (int) ret);
4277 : }
4278 89 : if (ret != GDK_SUCCEED)
4279 0 : GDKerror("recovery failed.\n");
4280 :
4281 89 : TRC_DEBUG(IO_, "end\n");
4282 89 : GDKfree(bakdirpath);
4283 89 : GDKfree(leftdirpath);
4284 89 : return ret;
4285 : }
4286 :
4287 : /*
4288 : * SUBDIR recovery is quite mindlessly moving all files back to the
4289 : * parent (BAKDIR). We do recognize moving back BBP.dir and set
4290 : * backed_up_subdir accordingly.
4291 : */
4292 : gdk_return
4293 13193 : BBPrecover_subdir(void)
4294 : {
4295 13193 : str subdirpath;
4296 13193 : DIR *dirp;
4297 13193 : struct dirent *dent;
4298 13193 : gdk_return ret = GDK_SUCCEED;
4299 :
4300 13193 : subdirpath = GDKfilepath(0, NULL, SUBDIR, NULL);
4301 13193 : if (subdirpath == NULL)
4302 : return GDK_FAIL;
4303 13193 : dirp = opendir(subdirpath);
4304 13193 : if (dirp == NULL && errno != ENOENT)
4305 0 : GDKsyserror("cannot open directory %s\n", subdirpath);
4306 13193 : GDKfree(subdirpath);
4307 13193 : if (dirp == NULL) {
4308 : return GDK_SUCCEED; /* nothing to do */
4309 : }
4310 0 : TRC_DEBUG(IO_, "start\n");
4311 :
4312 : /* move back all files */
4313 0 : while ((dent = readdir(dirp)) != NULL) {
4314 0 : if (dent->d_name[0] == '.')
4315 0 : continue;
4316 0 : ret = GDKmove(0, SUBDIR, dent->d_name, NULL, BAKDIR, dent->d_name, NULL, true);
4317 0 : if (ret != GDK_SUCCEED)
4318 : break;
4319 0 : if (strcmp(dent->d_name, "BBP.dir") == 0)
4320 0 : backup_dir = 1;
4321 : }
4322 0 : closedir(dirp);
4323 :
4324 : /* delete the directory */
4325 0 : if (ret == GDK_SUCCEED) {
4326 0 : ret = GDKremovedir(0, SUBDIR);
4327 0 : if (backup_dir == 2) {
4328 0 : TRC_DEBUG(IO_, "%s%cBBP.dir had disappeared!\n", SUBDIR, DIR_SEP);
4329 0 : backup_dir = 0;
4330 : }
4331 : }
4332 0 : TRC_DEBUG(IO_, "end = %d\n", (int) ret);
4333 :
4334 0 : if (ret != GDK_SUCCEED)
4335 0 : GDKerror("recovery failed.\n");
4336 : return ret;
4337 : }
4338 :
4339 : /*
4340 : * @- The diskscan
4341 : * The BBPdiskscan routine walks through the BAT dir, cleans up
4342 : * leftovers, and measures disk occupancy. Leftovers are files that
4343 : * cannot belong to a BAT. in order to establish this for [ht]heap
4344 : * files, the BAT descriptor is loaded in order to determine whether
4345 : * these files are still required.
4346 : *
4347 : * The routine gathers all bat sizes in a bat that contains bat-ids
4348 : * and bytesizes. The return value is the number of bytes of space
4349 : * freed.
4350 : */
4351 : static bool
4352 20703 : persistent_bat(bat bid)
4353 : {
4354 20703 : if (bid >= 0 && bid < (bat) ATOMIC_GET(&BBPsize) && BBPvalid(bid)) {
4355 20703 : BAT *b = BBP_desc(bid);
4356 20703 : if ((BBP_status(bid) & BBPLOADED) == 0 || b->batCopiedtodisk) {
4357 : return true;
4358 : }
4359 : }
4360 : return false;
4361 : }
4362 :
4363 : static BAT *
4364 20703 : getdesc(bat bid)
4365 : {
4366 20703 : BAT *b = NULL;
4367 :
4368 20703 : if (is_bat_nil(bid))
4369 : return NULL;
4370 20703 : assert(bid > 0);
4371 20703 : if (bid < (bat) ATOMIC_GET(&BBPsize) && BBP_logical(bid))
4372 20703 : b = BBP_desc(bid);
4373 20703 : if (b == NULL)
4374 0 : BBPclear(bid);
4375 : return b;
4376 : }
4377 :
4378 : static bool
4379 1465 : BBPdiskscan(const char *parent, size_t baseoff)
4380 : {
4381 1465 : DIR *dirp = opendir(parent);
4382 1465 : struct dirent *dent;
4383 1465 : char fullname[FILENAME_MAX];
4384 1465 : str dst;
4385 1465 : size_t dstlen;
4386 1465 : const char *src = parent;
4387 :
4388 1465 : if (dirp == NULL) {
4389 149 : if (errno != ENOENT)
4390 0 : GDKsyserror("cannot open directory %s\n", parent);
4391 149 : return true; /* nothing to do */
4392 : }
4393 :
4394 1316 : dst = stpcpy(fullname, src);
4395 1316 : if (dst > fullname && dst[-1] != DIR_SEP)
4396 1316 : *dst++ = DIR_SEP;
4397 1316 : dstlen = sizeof(fullname) - (dst - fullname);
4398 :
4399 27283 : while ((dent = readdir(dirp)) != NULL) {
4400 24651 : const char *p;
4401 24651 : bat bid;
4402 24651 : bool ok, delete;
4403 :
4404 24651 : if (dent->d_name[0] == '.')
4405 2632 : continue; /* ignore .dot files and directories (. ..) */
4406 :
4407 : #ifdef GDKLIBRARY_JSON
4408 22019 : if (strcmp(dent->d_name, "jsonupgradeneeded") == 0) {
4409 0 : continue; /* ignore json upgrade signal file */
4410 : }
4411 : #endif
4412 :
4413 22019 : if (strncmp(dent->d_name, "BBP.", 4) == 0 &&
4414 314 : (strcmp(parent + baseoff, BATDIR) == 0 ||
4415 314 : strncmp(parent + baseoff, BAKDIR, strlen(BAKDIR)) == 0 ||
4416 0 : strncmp(parent + baseoff, SUBDIR, strlen(SUBDIR)) == 0))
4417 314 : continue;
4418 :
4419 21705 : p = strchr(dent->d_name, '.');
4420 :
4421 21705 : if (strlen(dent->d_name) >= dstlen) {
4422 : /* found a file with too long a name
4423 : (i.e. unknown); stop pruning in this
4424 : subdir */
4425 0 : fprintf(stderr, "unexpected file %s, leaving %s.\n", dent->d_name, parent);
4426 0 : break;
4427 : }
4428 21705 : strncpy(dst, dent->d_name, dstlen);
4429 21705 : fullname[sizeof(fullname) - 1] = 0;
4430 :
4431 21705 : if (p == NULL && !BBPdiskscan(fullname, baseoff)) {
4432 : /* it was a directory */
4433 1002 : continue;
4434 : }
4435 :
4436 20703 : if (p && strcmp(p + 1, "tmp") == 0) {
4437 : delete = true;
4438 : ok = true;
4439 20703 : bid = 0;
4440 : } else {
4441 20703 : bid = strtol(dent->d_name, NULL, 8);
4442 20703 : ok = p && bid;
4443 20703 : delete = false;
4444 :
4445 20703 : if (!ok || !persistent_bat(bid)) {
4446 : delete = true;
4447 20703 : } else if (strncmp(p + 1, "tail", 4) == 0) {
4448 15463 : BAT *b = getdesc(bid);
4449 15463 : delete = (b == NULL || !b->ttype || !b->batCopiedtodisk || b->batCount == 0);
4450 15463 : assert(b == NULL || b->batCount > 0 || b->theap->free == 0);
4451 15463 : if (!delete) {
4452 15463 : if (b->ttype == TYPE_str) {
4453 4331 : switch (b->twidth) {
4454 2638 : case 1:
4455 2638 : delete = strcmp(p + 1, "tail1") != 0;
4456 2638 : break;
4457 1413 : case 2:
4458 1413 : delete = strcmp(p + 1, "tail2") != 0;
4459 1413 : break;
4460 : #if SIZEOF_VAR_T == 8
4461 280 : case 4:
4462 280 : delete = strcmp(p + 1, "tail4") != 0;
4463 280 : break;
4464 : #endif
4465 0 : default:
4466 0 : delete = strcmp(p + 1, "tail") != 0;
4467 0 : break;
4468 : }
4469 : } else {
4470 11132 : delete = strcmp(p + 1, "tail") != 0;
4471 : }
4472 : }
4473 5240 : } else if (strncmp(p + 1, "theap", 5) == 0) {
4474 4475 : BAT *b = getdesc(bid);
4475 4475 : delete = (b == NULL || !b->tvheap || !b->batCopiedtodisk || b->tvheap->free == 0);
4476 765 : } else if (strncmp(p + 1, "thashl", 6) == 0 ||
4477 383 : strncmp(p + 1, "thashb", 6) == 0) {
4478 764 : BAT *b = getdesc(bid);
4479 764 : delete = b == NULL;
4480 764 : if (!delete)
4481 764 : b->thash = (Hash *) 1;
4482 1 : } else if (strncmp(p + 1, "thash", 5) == 0) {
4483 : /* older versions used .thash which we
4484 : * can simply ignore */
4485 : delete = true;
4486 1 : } else if (strncmp(p + 1, "thsh", 4) == 0) {
4487 : /* temporary hash files which we can
4488 : * simply ignore */
4489 : delete = true;
4490 1 : } else if (strncmp(p + 1, "timprints", 9) == 0) {
4491 : /* imprints have been removed */
4492 : delete = true;
4493 1 : } else if (strncmp(p + 1, "torderidx", 9) == 0) {
4494 0 : BAT *b = getdesc(bid);
4495 0 : delete = b == NULL;
4496 0 : if (!delete)
4497 0 : b->torderidx = (Heap *) 1;
4498 1 : } else if (strncmp(p + 1, "tstrimps", 8) == 0) {
4499 1 : BAT *b = getdesc(bid);
4500 1 : delete = b == NULL;
4501 1 : if (!delete)
4502 1 : b->tstrimps = (Strimps *)1;
4503 0 : } else if (strncmp(p + 1, "new", 3) != 0) {
4504 20703 : ok = false;
4505 : }
4506 : }
4507 20703 : if (!ok) {
4508 : /* found an unknown file; stop pruning in this
4509 : * subdir */
4510 0 : fprintf(stderr, "unexpected file %s, leaving %s.\n", dent->d_name, parent);
4511 0 : break;
4512 : }
4513 20703 : if (delete) {
4514 0 : if (MT_remove(fullname) != 0 && errno != ENOENT) {
4515 0 : GDKsyserror("remove(%s)", fullname);
4516 0 : continue;
4517 : }
4518 25967 : TRC_DEBUG(IO_, "remove(%s) = 0\n", fullname);
4519 : }
4520 : }
4521 1316 : closedir(dirp);
4522 1316 : return false;
4523 : }
4524 :
4525 : void
4526 297 : gdk_bbp_reset(void)
4527 : {
4528 297 : int i;
4529 :
4530 297 : BBP_free = 0;
4531 297 : BBP_nfree = 0;
4532 297 : while (BBPlimit > BBPINIT) {
4533 0 : BBPlimit -= BBPINIT;
4534 0 : assert(BBPlimit >= 0);
4535 0 : GDKfree(BBP[BBPlimit >> BBPINITLOG]);
4536 0 : BBP[BBPlimit >> BBPINITLOG] = NULL;
4537 : }
4538 297 : ATOMIC_SET(&BBPsize, 0);
4539 297 : memset(BBP0, 0, sizeof(BBP0));
4540 9801 : for (i = 0; i < MAXFARMS; i++)
4541 9504 : GDKfree((void *) BBPfarms[i].dirname); /* loose "const" */
4542 297 : memset(BBPfarms, 0, sizeof(BBPfarms));
4543 297 : memset(BBP_hash, 0, sizeof(BBP_hash));
4544 :
4545 297 : locked_by = 0;
4546 297 : BBPunloadCnt = 0;
4547 297 : backup_files = 0;
4548 297 : backup_dir = 0;
4549 297 : backup_subdir = 0;
4550 297 : }
4551 :
4552 : static MT_Lock GDKCallbackListLock = MT_LOCK_INITIALIZER(GDKCallbackListLock);
4553 :
4554 : static struct {
4555 : int cnt;
4556 : gdk_callback *head;
4557 : } callback_list = {
4558 : .cnt = 0,
4559 : .head = NULL,
4560 : };
4561 :
4562 : /*
4563 : * @- Add a callback
4564 : * Adds new callback to the callback list.
4565 : */
4566 : gdk_return
4567 0 : gdk_add_callback(char *name, gdk_callback_func *f, int argc, void *argv[], int
4568 : interval)
4569 : {
4570 :
4571 0 : gdk_callback *callback = NULL;
4572 :
4573 0 : if (!(callback = GDKmalloc(sizeof(gdk_callback) + sizeof(void *) * argc))) {
4574 0 : TRC_CRITICAL(GDK, "Failed to allocate memory!");
4575 0 : return GDK_FAIL;
4576 : }
4577 :
4578 0 : *callback = (gdk_callback) {
4579 : .name = name,
4580 : .argc = argc,
4581 : .interval = interval,
4582 : .func = f,
4583 : };
4584 :
4585 0 : for (int i=0; i < argc; i++) {
4586 0 : callback->argv[i] = argv[i];
4587 : }
4588 :
4589 0 : MT_lock_set(&GDKCallbackListLock);
4590 0 : gdk_callback *p = callback_list.head;
4591 0 : if (p) {
4592 : int cnt = 1;
4593 0 : do {
4594 : /* check if already added */
4595 0 : if (strcmp(callback->name, p->name) == 0) {
4596 0 : MT_lock_unset(&GDKCallbackListLock);
4597 0 : GDKfree(callback);
4598 0 : return GDK_FAIL;
4599 : }
4600 0 : if (p->next == NULL) {
4601 0 : p->next = callback;
4602 0 : p = callback->next;
4603 : } else {
4604 : p = p->next;
4605 : }
4606 0 : cnt += 1;
4607 0 : } while(p);
4608 0 : callback_list.cnt = cnt;
4609 : } else {
4610 0 : callback_list.cnt = 1;
4611 0 : callback_list.head = callback;
4612 : }
4613 0 : MT_lock_unset(&GDKCallbackListLock);
4614 0 : return GDK_SUCCEED;
4615 : }
4616 :
4617 : /*
4618 : * @- Remove a callback
4619 : * Removes a callback from the callback list with a given name as an argument.
4620 : */
4621 : gdk_return
4622 0 : gdk_remove_callback(char *cb_name, gdk_callback_func *argsfree)
4623 : {
4624 0 : gdk_callback *prev = NULL;
4625 0 : gdk_return res = GDK_FAIL;
4626 :
4627 0 : MT_lock_set(&GDKCallbackListLock);
4628 0 : gdk_callback *curr = callback_list.head;
4629 0 : while(curr) {
4630 0 : if (strcmp(cb_name, curr->name) == 0) {
4631 0 : if (curr == callback_list.head && prev == NULL) {
4632 0 : callback_list.head = curr->next;
4633 : } else {
4634 0 : prev->next = curr->next;
4635 : }
4636 0 : if (argsfree)
4637 0 : argsfree(curr->argc, curr->argv);
4638 0 : GDKfree(curr);
4639 0 : curr = NULL;
4640 0 : callback_list.cnt -=1;
4641 0 : res = GDK_SUCCEED;
4642 : } else {
4643 0 : prev = curr;
4644 0 : curr = curr->next;
4645 : }
4646 : }
4647 0 : MT_lock_unset(&GDKCallbackListLock);
4648 0 : return res;
4649 : }
4650 :
4651 : static gdk_return
4652 0 : do_callback(gdk_callback *cb)
4653 : {
4654 0 : cb->last_called = GDKusec();
4655 0 : return cb->func(cb->argc, cb->argv);
4656 : }
4657 :
4658 : static bool
4659 0 : should_call(gdk_callback *cb)
4660 : {
4661 0 : if (cb->last_called && cb->interval) {
4662 0 : return (cb->last_called + cb->interval * 1000 * 1000) <
4663 0 : GDKusec();
4664 : }
4665 : return true;
4666 : }
4667 :
4668 : static void
4669 100 : BBPcallbacks(void)
4670 : {
4671 100 : MT_lock_set(&GDKCallbackListLock);
4672 100 : gdk_callback *next = callback_list.head;
4673 :
4674 100 : while (next) {
4675 0 : if(should_call(next))
4676 0 : do_callback(next);
4677 0 : next = next->next;
4678 : }
4679 100 : MT_lock_unset(&GDKCallbackListLock);
4680 100 : }
4681 :
4682 : /* GDKtmLock protects all accesses and changes to BAKDIR and SUBDIR.
4683 : * MUST use BBPtmlock()/BBPtmunlock() to set/unset the lock.
4684 : *
4685 : * This is at the end of the file on purpose: we don't want people to
4686 : * accidentally use GDKtmLock directly. */
4687 : static MT_Lock GDKtmLock = MT_LOCK_INITIALIZER(GDKtmLock);
4688 : static int lockfd;
4689 :
4690 : static void
4691 115708 : BBPtmlockFinish(void)
4692 : {
4693 115708 : if (!GDKinmemory(0) &&
4694 : /* also use an external lock file to synchronize with
4695 : * external programs */
4696 115708 : (lockfile != NULL ||
4697 314 : (lockfile = GDKfilepath(0, NULL, ".tm_lock", NULL)) != NULL)) {
4698 115708 : lockfd = MT_lockf(lockfile, F_LOCK);
4699 : }
4700 115708 : }
4701 :
4702 : void
4703 115592 : BBPtmlock(void)
4704 : {
4705 115592 : MT_lock_set(&GDKtmLock);
4706 115592 : BBPtmlockFinish();
4707 115592 : }
4708 :
4709 : static bool
4710 116 : BBPtrytmlock(int ms)
4711 : {
4712 116 : if (!MT_lock_trytime(&GDKtmLock, ms))
4713 0 : return false;
4714 116 : BBPtmlockFinish();
4715 116 : return true;
4716 : }
4717 :
4718 : void
4719 115708 : BBPtmunlock(void)
4720 : {
4721 115708 : if (lockfile && lockfd >= 0) {
4722 115708 : assert(!GDKinmemory(0));
4723 115708 : MT_lockf(lockfile, F_ULOCK);
4724 115708 : close(lockfd);
4725 115708 : lockfd = -1;
4726 : }
4727 115708 : MT_lock_unset(&GDKtmLock);
4728 115708 : }
4729 :
4730 : void
4731 116 : BBPprintinfo(void)
4732 : {
4733 : /* 32 categories for the bats, not all are expected to be filled */
4734 116 : struct counters {
4735 : size_t sz;
4736 : size_t vmsz;
4737 : int nr;
4738 116 : } bats[2][2][2][2][2] = {0};
4739 116 : int nbats = 0;
4740 116 : int nskip = 0;
4741 :
4742 116 : if (!BBPtrytmlock(1000)) {
4743 0 : printf("BBP is currently locked, so no BAT information\n");
4744 0 : return;
4745 : }
4746 116 : bat sz = (bat) ATOMIC_GET(&BBPsize);
4747 234826 : for (bat i = 1; i < sz; i++) {
4748 234710 : if (!MT_lock_trytime(&GDKswapLock(i), 1000)) {
4749 0 : nskip++;
4750 0 : continue;
4751 : }
4752 234710 : int r;
4753 234710 : if ((r = BBP_refs(i)) > 0 || BBP_lrefs(i) > 0) {
4754 193930 : BAT *b = BBP_desc(i);
4755 193930 : if (!MT_lock_trytime(&b->theaplock, 1000)) {
4756 0 : nskip++;
4757 0 : b = NULL;
4758 : }
4759 0 : if (b != NULL) {
4760 193930 : nbats++;
4761 193930 : ATOMIC_BASE_TYPE status = BBP_status(i);
4762 193930 : struct counters *bt = &bats[r > 0][BATdirty(b)][(status & BBPPERSISTENT) != 0][(status & BBPLOADED) != 0][(status & BBPHOT) != 0];
4763 193930 : bt->nr++;
4764 193930 : if (b->theap && b->batCacheid == b->theap->parentid) {
4765 193930 : bt->sz += HEAPmemsize(b->theap);
4766 193930 : bt->vmsz += HEAPvmsize(b->theap);
4767 : }
4768 193930 : if (b->tvheap && b->batCacheid == b->tvheap->parentid) {
4769 11401 : bt->sz += HEAPmemsize(b->tvheap);
4770 11401 : bt->vmsz += HEAPvmsize(b->tvheap);
4771 : }
4772 193930 : MT_lock_unset(&b->theaplock);
4773 : }
4774 : }
4775 234710 : MT_lock_unset(&GDKswapLock(i));
4776 : }
4777 116 : uint32_t nfree = BBP_nfree;
4778 116 : BBPtmunlock();
4779 116 : printf("BATs:\n");
4780 116 : if (bats[1][1][1][1][1].nr > 0)
4781 116 : printf("fix, dirty, persistent, loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[1][1][1][1][1].nr, bats[1][1][1][1][1].vmsz, bats[1][1][1][1][1].sz);
4782 116 : if (bats[1][1][1][1][0].nr > 0)
4783 0 : printf("fix, dirty, persistent, not loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[1][1][1][1][0].nr, bats[1][1][1][1][0].vmsz, bats[1][1][1][1][0].sz);
4784 116 : if (bats[1][1][1][0][1].nr > 0)
4785 0 : printf("fix, dirty, persistent, loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[1][1][1][0][1].nr, bats[1][1][1][0][1].vmsz, bats[1][1][1][0][1].sz);
4786 116 : if (bats[1][1][1][0][0].nr > 0)
4787 0 : printf("fix, dirty, persistent, not loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[1][1][1][0][0].nr, bats[1][1][1][0][0].vmsz, bats[1][1][1][0][0].sz);
4788 116 : if (bats[1][1][0][1][1].nr > 0)
4789 116 : printf("fix, dirty, transient, loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[1][1][0][1][1].nr, bats[1][1][0][1][1].vmsz, bats[1][1][0][1][1].sz);
4790 116 : if (bats[1][1][0][1][0].nr > 0)
4791 1 : printf("fix, dirty, transient, not loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[1][1][0][1][0].nr, bats[1][1][0][1][0].vmsz, bats[1][1][0][1][0].sz);
4792 116 : if (bats[1][1][0][0][1].nr > 0)
4793 0 : printf("fix, dirty, transient, loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[1][1][0][0][1].nr, bats[1][1][0][0][1].vmsz, bats[1][1][0][0][1].sz);
4794 116 : if (bats[1][1][0][0][0].nr > 0)
4795 0 : printf("fix, dirty, transient, not loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[1][1][0][0][0].nr, bats[1][1][0][0][0].vmsz, bats[1][1][0][0][0].sz);
4796 116 : if (bats[1][0][1][1][1].nr > 0)
4797 105 : printf("fix, clean, persistent, loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[1][0][1][1][1].nr, bats[1][0][1][1][1].vmsz, bats[1][0][1][1][1].sz);
4798 116 : if (bats[1][0][1][1][0].nr > 0)
4799 0 : printf("fix, clean, persistent, not loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[1][0][1][1][0].nr, bats[1][0][1][1][0].vmsz, bats[1][0][1][1][0].sz);
4800 116 : if (bats[1][0][1][0][1].nr > 0)
4801 0 : printf("fix, clean, persistent, loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[1][0][1][0][1].nr, bats[1][0][1][0][1].vmsz, bats[1][0][1][0][1].sz);
4802 116 : if (bats[1][0][1][0][0].nr > 0)
4803 0 : printf("fix, clean, persistent, not loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[1][0][1][0][0].nr, bats[1][0][1][0][0].vmsz, bats[1][0][1][0][0].sz);
4804 116 : if (bats[1][0][0][1][1].nr > 0)
4805 0 : printf("fix, clean, transient, loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[1][0][0][1][1].nr, bats[1][0][0][1][1].vmsz, bats[1][0][0][1][1].sz);
4806 116 : if (bats[1][0][0][1][0].nr > 0)
4807 0 : printf("fix, clean, transient, not loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[1][0][0][1][0].nr, bats[1][0][0][1][0].vmsz, bats[1][0][0][1][0].sz);
4808 116 : if (bats[1][0][0][0][1].nr > 0)
4809 0 : printf("fix, clean, transient, loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[1][0][0][0][1].nr, bats[1][0][0][0][1].vmsz, bats[1][0][0][0][1].sz);
4810 116 : if (bats[1][0][0][0][0].nr > 0)
4811 0 : printf("fix, clean, transient, not loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[1][0][0][0][0].nr, bats[1][0][0][0][0].vmsz, bats[1][0][0][0][0].sz);
4812 116 : if (bats[0][1][1][1][1].nr > 0)
4813 112 : printf("no fix, dirty, persistent, loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[0][1][1][1][1].nr, bats[0][1][1][1][1].vmsz, bats[0][1][1][1][1].sz);
4814 116 : if (bats[0][1][1][1][0].nr > 0)
4815 29 : printf("no fix, dirty, persistent, not loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[0][1][1][1][0].nr, bats[0][1][1][1][0].vmsz, bats[0][1][1][1][0].sz);
4816 116 : if (bats[0][1][1][0][1].nr > 0)
4817 0 : printf("no fix, dirty, persistent, loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[0][1][1][0][1].nr, bats[0][1][1][0][1].vmsz, bats[0][1][1][0][1].sz);
4818 116 : if (bats[0][1][1][0][0].nr > 0)
4819 1 : printf("no fix, dirty, persistent, not loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[0][1][1][0][0].nr, bats[0][1][1][0][0].vmsz, bats[0][1][1][0][0].sz);
4820 116 : if (bats[0][1][0][1][1].nr > 0)
4821 97 : printf("no fix, dirty, transient, loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[0][1][0][1][1].nr, bats[0][1][0][1][1].vmsz, bats[0][1][0][1][1].sz);
4822 116 : if (bats[0][1][0][1][0].nr > 0)
4823 16 : printf("no fix, dirty, transient, not loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[0][1][0][1][0].nr, bats[0][1][0][1][0].vmsz, bats[0][1][0][1][0].sz);
4824 116 : if (bats[0][1][0][0][1].nr > 0)
4825 0 : printf("no fix, dirty, transient, loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[0][1][0][0][1].nr, bats[0][1][0][0][1].vmsz, bats[0][1][0][0][1].sz);
4826 116 : if (bats[0][1][0][0][0].nr > 0)
4827 17 : printf("no fix, dirty, transient, not loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[0][1][0][0][0].nr, bats[0][1][0][0][0].vmsz, bats[0][1][0][0][0].sz);
4828 116 : if (bats[0][0][1][1][1].nr > 0)
4829 114 : printf("no fix, clean, persistent, loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[0][0][1][1][1].nr, bats[0][0][1][1][1].vmsz, bats[0][0][1][1][1].sz);
4830 116 : if (bats[0][0][1][1][0].nr > 0)
4831 20 : printf("no fix, clean, persistent, not loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[0][0][1][1][0].nr, bats[0][0][1][1][0].vmsz, bats[0][0][1][1][0].sz);
4832 116 : if (bats[0][0][1][0][1].nr > 0)
4833 0 : printf("no fix, clean, persistent, loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[0][0][1][0][1].nr, bats[0][0][1][0][1].vmsz, bats[0][0][1][0][1].sz);
4834 116 : if (bats[0][0][1][0][0].nr > 0)
4835 18 : printf("no fix, clean, persistent, not loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[0][0][1][0][0].nr, bats[0][0][1][0][0].vmsz, bats[0][0][1][0][0].sz);
4836 116 : if (bats[0][0][0][1][1].nr > 0)
4837 4 : printf("no fix, clean, transient, loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[0][0][0][1][1].nr, bats[0][0][0][1][1].vmsz, bats[0][0][0][1][1].sz);
4838 116 : if (bats[0][0][0][1][0].nr > 0)
4839 0 : printf("no fix, clean, transient, not loaded, hot: %d bats, %zu virtual, %zu malloc\n", bats[0][0][0][1][0].nr, bats[0][0][0][1][0].vmsz, bats[0][0][0][1][0].sz);
4840 116 : if (bats[0][0][0][0][1].nr > 0)
4841 0 : printf("no fix, clean, transient, loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[0][0][0][0][1].nr, bats[0][0][0][0][1].vmsz, bats[0][0][0][0][1].sz);
4842 116 : if (bats[0][0][0][0][0].nr > 0)
4843 0 : printf("no fix, clean, transient, not loaded, cold: %d bats, %zu virtual, %zu malloc\n", bats[0][0][0][0][0].nr, bats[0][0][0][0][0].vmsz, bats[0][0][0][0][0].sz);
4844 :
4845 116 : printf("%d bats total, %d in use, %"PRIu32" free bats in common shared list\n",
4846 : sz - 1, nbats, nfree);
4847 116 : if (nskip > 0)
4848 0 : printf("%d bat slots unaccounted for because of locking\n", nskip);
4849 : }
|