Line data Source code
1 : /*
2 : * SPDX-License-Identifier: MPL-2.0
3 : *
4 : * This Source Code Form is subject to the terms of the Mozilla Public
5 : * License, v. 2.0. If a copy of the MPL was not distributed with this
6 : * file, You can obtain one at http://mozilla.org/MPL/2.0/.
7 : *
8 : * Copyright 2024 MonetDB Foundation;
9 : * Copyright August 2008 - 2023 MonetDB B.V.;
10 : * Copyright 1997 - July 2008 CWI.
11 : */
12 :
13 : /*
14 : * (author) M. Kersten
15 : *
16 : * Search the first definition of the operator in the current module
17 : * and check the parameter types.
18 : * For a polymorphic MAL function we make a fully instantiated clone.
19 : * It will be prepended to the symbol list as it is more restrictive.
20 : * This effectively overloads the MAL procedure.
21 : */
22 : #include "monetdb_config.h"
23 : #include "mal_resolve.h"
24 : #include "mal_namespace.h"
25 : #include "mal_private.h"
26 : #include "mal_linker.h"
27 :
28 : #define MAXTYPEVAR 4
29 :
30 : static malType getPolyType(malType t, int *polytype);
31 : static int updateTypeMap(int formal, int actual, int polytype[MAXTYPEVAR]);
32 : static bool typeResolved(MalBlkPtr mb, InstrPtr p, int i);
33 :
34 : int
35 329904944 : resolvedType(int dsttype, int srctype)
36 : {
37 329904944 : if (dsttype == srctype || dsttype == TYPE_any || srctype == TYPE_any)
38 : return 0;
39 :
40 227984707 : if (getOptBat(dsttype) && isaBatType(srctype)) {
41 2412 : int t1 = getBatType(dsttype);
42 2412 : int t2 = getBatType(srctype);
43 2412 : if (t1 == t2 || t1 == TYPE_any || t2 == TYPE_any)
44 : return 0;
45 : }
46 12245 : if (getOptBat(dsttype) && !isaBatType(srctype)) {
47 10312 : int t1 = getBatType(dsttype);
48 10312 : int t2 = srctype;
49 10312 : if (t1 == t2 || t1 == TYPE_any || t2 == TYPE_any)
50 : return 0;
51 : }
52 :
53 227984074 : if (isaBatType(dsttype) && isaBatType(srctype)) {
54 160645993 : int t1 = getBatType(dsttype);
55 160645993 : int t2 = getBatType(srctype);
56 160645993 : if (t1 == t2 || t1 == TYPE_any || t2 == TYPE_any)
57 94670808 : return 0;
58 : }
59 : return -1;
60 : }
61 :
62 : static int
63 71606894 : resolveType(int *rtype, int dsttype, int srctype)
64 : {
65 71606894 : if (dsttype == srctype) {
66 34082104 : *rtype = dsttype;
67 34082104 : return 0;
68 : }
69 37524790 : if (dsttype == TYPE_any) {
70 3704619 : *rtype = srctype;
71 3704619 : return 0;
72 : }
73 33820171 : if (srctype == TYPE_any) {
74 20294664 : *rtype = dsttype;
75 20294664 : return 0;
76 : }
77 : /*
78 : * A bat reference can be coerced to bat type.
79 : */
80 13525507 : if (isaBatType(dsttype) && isaBatType(srctype)) {
81 13495358 : int t1, t2, t3;
82 13495358 : t1 = getBatType(dsttype);
83 13495358 : t2 = getBatType(srctype);
84 13495358 : if (t1 == t2)
85 : t3 = t1;
86 13495355 : else if (t1 == TYPE_any)
87 : t3 = t2;
88 190543 : else if (t2 == TYPE_any)
89 : t3 = t1;
90 : else {
91 : return -1;
92 : }
93 13304821 : *rtype = newBatType(t3);
94 13304821 : return 0;
95 : }
96 : return -1;
97 : }
98 :
99 :
100 : /*
101 : * Since we now know the storage type of the receiving variable, we can
102 : * set the garbage collection flag.
103 : */
104 : #define prepostProcess(tp, p, b, mb) \
105 : do { \
106 : if( isaBatType(tp) || \
107 : ATOMtype(tp) == TYPE_str || \
108 : (!isPolyType(tp) && tp < TYPE_any && \
109 : tp >= 0 && ATOMextern(tp))) { \
110 : getInstrPtr(mb, 0)->gc = true; \
111 : setVarCleanup(mb, getArg(p, b)); \
112 : p->gc = true; \
113 : } \
114 : } while (0)
115 :
116 : static malType
117 493600991 : getFormalArgType( Symbol s, int arg)
118 : {
119 493600991 : if (s->kind == FUNCTIONsymbol)
120 41616 : return getArgType(s->def, getSignature(s), arg);
121 493559375 : mel_arg *a = s->func->args+arg;
122 493559375 : malType tpe = TYPE_any;
123 493559375 : if (a->nr || !a->type[0]) {
124 195985689 : if (a->isbat)
125 : tpe = newBatType(TYPE_any);
126 : else
127 23531420 : tpe = a->typeid;
128 195985689 : setTypeIndex(tpe, a->nr);
129 : } else {
130 297573686 : if (a->isbat)
131 123878859 : tpe = newBatType(a->typeid);
132 : else
133 173694827 : tpe = a->typeid;
134 : }
135 493559375 : if (a->opt == 1)
136 30360 : setOptBat(tpe);
137 : return tpe;
138 : }
139 :
140 : static malType
141 74551681 : findFunctionType(Module scope, MalBlkPtr mb, InstrPtr p, int idx, int silent)
142 : {
143 74551681 : Module m;
144 74551681 : Symbol s;
145 74551681 : int i, k, unmatched = 0, s1;
146 74551681 : int polytype[MAXTYPEVAR];
147 74551681 : int returns[256];
148 74551681 : int *returntype = NULL;
149 : /*
150 : * Within a module find the element in its list
151 : * of symbols. A skiplist is used to speed up the search for the
152 : * definition of the function.
153 : *
154 : * For the implementation we should be aware that over 90% of the
155 : * functions in the kernel have just a few arguments and a single
156 : * return value.
157 : * A point of concern is that polymorphic arithmetic operations
158 : * lead to an explosion in the symbol table. This increase the
159 : * loop to find a candidate.
160 : *
161 : * Consider to collect the argument type into a separate structure, because
162 : * it will be looked up multiple types to resolve the instruction.[todo]
163 : * Simplify polytype using a map into the concrete argument table.
164 : */
165 :
166 74551681 : m = scope;
167 74551681 : s = m->space[(int) (getSymbolIndex(getFunctionId(p)))];
168 74551681 : if (s == 0)
169 : return -1;
170 :
171 74551461 : if (p->retc < 256) {
172 154150187 : for (i = 0; i < p->retc; i++)
173 79598766 : returns[i] = 0;
174 74551461 : returntype = returns;
175 : } else {
176 40 : returntype = (int *) GDKzalloc(p->retc * sizeof(int));
177 40 : if (returntype == 0)
178 : return -1;
179 : }
180 :
181 531864496 : while (s != NULL) { /* single scope element check */
182 531863240 : if (getFunctionId(p) != s->name) {
183 127888089 : s = s->skip;
184 127888089 : continue;
185 : }
186 : /*
187 : * Perform a strong type-check on the actual arguments. If it
188 : * turns out to be a polymorphic MAL function, we have to
189 : * clone it. Provided the actual/formal parameters are
190 : * compliant throughout the function call.
191 : *
192 : * Also look out for variable argument lists. This means that
193 : * we have to keep two iterators, one for the caller (i) and
194 : * one for the callee (k). Since a variable argument only
195 : * occurs as the last one, we simple avoid an increment when
196 : * running out of formal arguments.
197 : *
198 : * A call of the form (X1,..., Xi) := f(Y1,....,Yn) can be
199 : * matched against the function signature (B1,...,Bk):=
200 : * f(A1,...,Am) where i==k , n<=m and
201 : * type(Ai)=type(Yi). Furthermore, the variables Xi obtain
202 : * their type from Bi (or type(Bi)==type(Xi)).
203 : */
204 403975151 : int argc = 0, argcc = 0, retc = 0, varargs = 0, varrets = 0, unsafe = 0, inlineprop = 0, polymorphic = 0;
205 403975151 : if (s->kind == FUNCTIONsymbol) {
206 10468 : InstrPtr sig = getSignature(s);
207 10468 : retc = sig->retc;
208 10468 : argc = sig->argc;
209 10468 : varargs = (sig->varargs & (VARARGS | VARRETS));
210 10468 : varrets = (sig->varargs & VARRETS);
211 10468 : unsafe = s->def->unsafeProp;
212 10468 : inlineprop = s->def->inlineProp;
213 10468 : polymorphic = sig->polymorphic;
214 10468 : argcc = argc;
215 : } else {
216 403964683 : retc = s->func->retc;
217 403964683 : argc = s->func->argc;
218 403964683 : varargs = /*retc == 0 ||*/ s->func->vargs || s->func->vrets;
219 403964683 : varrets = retc == 0 || s->func->vrets;
220 403964683 : unsafe = s->func->unsafe;
221 403964683 : inlineprop = 0;
222 403964683 : polymorphic = s->func->poly;
223 403964683 : if (!retc && !polymorphic)
224 2324666 : polymorphic = 1;
225 403964683 : argcc = argc + ((retc == 0)?1:0);
226 : }
227 403975151 : unmatched = 0;
228 :
229 : /*
230 : * The simple case could be taken care of separately to
231 : * speedup processing
232 : * However, it turned out not to make a big difference. The
233 : * first time we encounter a polymorphic argument in the
234 : * signature.
235 : * Subsequently, the polymorphic arguments update this table
236 : * and check for any type mismatches that might occur. There
237 : * are at most 2 type variables involved per argument due to
238 : * the limited type nesting permitted. Note, each function
239 : * returns at least one value.
240 : */
241 403975151 : if (polymorphic) {
242 92322755 : int limit = polymorphic;
243 92322755 : if (!(argcc == p->argc || (argc < p->argc && varargs))) {
244 37078932 : s = s->peer;
245 37078932 : continue;
246 : }
247 55243823 : if (retc != p->retc && !varrets) {
248 437720 : s = s->peer;
249 437720 : continue;
250 : }
251 :
252 156091687 : for (k = 0; k < limit; k++)
253 101285584 : polytype[k] = TYPE_any;
254 : /*
255 : * Most polymorphic functions don't have a variable argument
256 : * list. So we save some instructions factoring this caise out.
257 : * Be careful, the variable number of return arguments should
258 : * be considered as well.
259 : */
260 : i = p->retc;
261 : /* first handle the variable argument list */
262 295238851 : for (k = retc; i < p->argc; k++, i++) {
263 243990321 : int actual = getArgType(mb, p, i);
264 243990321 : int formal = getFormalArgType(s, k);
265 243990321 : if (k == argc - 1 && varargs)
266 100714790 : k--;
267 : /*
268 : * Take care of variable argument lists.
269 : * They are allowed as the last in the signature only.
270 : * Furthermore, for patterns if the formal type is
271 : * 'any' then all remaining arguments are acceptable
272 : * and detailed type analysis becomes part of the
273 : * pattern implementation.
274 : * In all other cases the type should apply to all
275 : * remaining arguments.
276 : */
277 243990321 : if (getOptBat(formal) && !isAnyExpression(formal) && getBatType(actual) == getBatType(formal))
278 243990321 : formal = actual;
279 243990321 : if (formal == actual)
280 89482153 : continue;
281 154508168 : if (updateTypeMap(formal, actual, polytype)) {
282 : unmatched = i;
283 : break;
284 : }
285 152357085 : formal = getPolyType(formal, polytype);
286 : /*
287 : * Collect the polymorphic types and resolve them.
288 : * If it fails, we know this isn't the function we are
289 : * looking for.
290 : */
291 152357085 : if (resolvedType(formal, actual) < 0) {
292 : unmatched = i;
293 : break;
294 : }
295 : }
296 : /*
297 : * The last argument/result type could be a polymorphic
298 : * variable list. It should only be allowed for patterns,
299 : * where it can deal with the stack. If the type is
300 : * specified as :any then any mix of arguments is allowed.
301 : * If the type is a new numbered type variable then the
302 : * first element in the list determines the required type
303 : * of all.
304 : */
305 54791865 : if (varargs) {
306 9739469 : if (s->kind != PATTERNsymbol && retc)
307 : unmatched = i;
308 : else {
309 : /* resolve the arguments */
310 9743080 : for (; i < p->argc; i++) {
311 : /* the type of the last one has already been set */
312 1506495 : int actual = getArgType(mb, p, i);
313 1506495 : int formal = getFormalArgType(s, k);
314 1506495 : if (k == argc - 1 && varargs)
315 0 : k--;
316 :
317 1506495 : formal = getPolyType(formal, polytype);
318 1506495 : if (getOptBat(formal) && !isAnyExpression(formal) && getBatType(actual) == getBatType(formal))
319 1506495 : formal = actual;
320 1506495 : if (formal == actual || formal == TYPE_any)
321 1020 : continue;
322 1505475 : if (resolvedType(formal, actual) < 0) {
323 : unmatched = i;
324 : break;
325 : }
326 : }
327 : }
328 : }
329 : } else {
330 : /*
331 : * We have to check the argument types to determine a
332 : * possible match for the non-polymorphic case.
333 : */
334 311652396 : if (argc != p->argc || retc != p->retc) {
335 157740247 : s = s->peer;
336 157740247 : continue;
337 : }
338 :
339 :
340 199648005 : for (i = p->retc; i < p->argc; i++) {
341 176141223 : int actual = getArgType(mb, p, i);
342 176141223 : int formal = getFormalArgType(s, i);
343 176141223 : if (resolvedType(formal, actual) < 0) {
344 : unmatched = i;
345 : break;
346 : }
347 : }
348 : }
349 : /*
350 : * It is possible that you may have to coerce the value to
351 : * another type. We assume that coercions are explicit at the
352 : * MAL level. (e.g. var2:= var0:int). This avoids repeated
353 : * type analysis just before you execute a function.
354 : * An optimizer may at a later stage automatically insert such
355 : * coercion requests.
356 : */
357 :
358 208704910 : if (unmatched) {
359 133947366 : s = s->peer;
360 133947366 : continue;
361 : }
362 : /*
363 : * At this stage we know all arguments are type compatible
364 : * with the signature.
365 : * We should assure that also the target variables have the
366 : * proper types or can inherit them from the signature. The
367 : * result type vector should be build separately first,
368 : * because we may encounter an error later on.
369 : *
370 : * If any of the arguments refer to a constraint type, any_x,
371 : * then the resulting type can not be determined.
372 : */
373 74757544 : s1 = 0;
374 74757544 : if (polymorphic) {
375 99712816 : for (k = i = 0; i < p->retc && k < retc; k++, i++) {
376 48458705 : int actual = getArgType(mb, p, i);
377 48458705 : int formal = getFormalArgType(s, k);
378 :
379 48458705 : if (k == retc - 1 && varrets)
380 363673 : k--;
381 :
382 48458705 : s1 = getPolyType(formal, polytype);
383 :
384 48458705 : if (getOptBat(formal) && !isAnyExpression(formal) && getBatType(actual) == getBatType(formal))
385 48458705 : s1 = actual;
386 48458705 : if (resolveType(returntype+i, s1, actual) < 0) {
387 : s1 = -1;
388 : break;
389 : }
390 : }
391 : } else {
392 : /* check for non-polymorphic return */
393 47216761 : for (k = i = 0; i < p->retc; i++) {
394 23915956 : int actual = getArgType(mb, p, i);
395 23915956 : int formal = getFormalArgType(s, i);
396 :
397 23915956 : if (k == retc - 1 && varrets)
398 : k--;
399 :
400 23915956 : if (actual == formal) {
401 8669531 : returntype[i] = actual;
402 : } else {
403 15246425 : if (resolveType(returntype+i, formal, actual) < 0) {
404 : s1 = -1;
405 : break;
406 : }
407 : }
408 : }
409 : }
410 74775597 : if (s1 < 0) {
411 220681 : s = s->peer;
412 220681 : continue;
413 : }
414 : /*
415 : * If the return types are correct, copy them in place.
416 : * Beware that signatures should be left untouched, which
417 : * means that we may not overwrite any formal argument.
418 : * Using the knowledge dat the arguments occupy the header
419 : * of the symbol stack, it is easy to filter such errors.
420 : * Also mark all variables that are subject to garbage control.
421 : * Beware, this is not yet effectuated in the interpreter.
422 : */
423 :
424 74554916 : p->typeresolved = true;
425 74554916 : p->inlineProp = inlineprop;
426 74554916 : p->unsafeProp = unsafe;
427 154163861 : for (i = 0; i < p->retc; i++) {
428 79608945 : int ts = returntype[i];
429 79608945 : if (isVarConstant(mb, getArg(p, i))) {
430 0 : if (!silent) {
431 0 : mb->errors = createMalException(mb, idx, TYPE,
432 : "Assignment to constant");
433 : }
434 0 : p->typeresolved = false;
435 0 : goto wrapup;
436 : }
437 79608945 : if (!isVarFixed(mb, getArg(p, i)) && ts >= 0) {
438 41355519 : setVarType(mb, getArg(p, i), ts);
439 41355519 : setVarFixed(mb, getArg(p, i));
440 : }
441 79608945 : prepostProcess(ts, p, i, mb);
442 : }
443 : /*
444 : * Also the arguments may contain constants
445 : * to be garbage collected.
446 : */
447 343401422 : for (i = p->retc; i < p->argc; i++)
448 268846506 : if (ATOMtype(getArgType(mb, p, i)) == TYPE_str ||
449 222364625 : isaBatType(getArgType(mb, p, i)) ||
450 57193390 : (!isPolyType(getArgType(mb, p, i)) &&
451 57193378 : getArgType(mb, p, i) < TYPE_any &&
452 57193378 : getArgType(mb, p, i) >= 0 &&
453 57193378 : ATOMstorage(getArgType(mb, p, i)) == TYPE_str)) {
454 211656602 : getInstrPtr(mb, 0)->gc = true;
455 211656602 : p->gc = true;
456 : }
457 : /*
458 : * It may happen that an argument was still untyped and as a
459 : * result of the polymorphism matching became strongly
460 : * typed. This should be reflected in the symbol table.
461 : */
462 74554916 : s1 = returntype[0]; /* for those interested */
463 : /*
464 : * If the call refers to a polymorphic function, we clone it
465 : * to arrive at a bounded instance. Polymorphic patterns and
466 : * commands are responsible for type resolution themselves.
467 : * Note that cloning pre-supposes that the function being
468 : * cloned does not contain errors detected earlier in the
469 : * process, nor does it contain polymorphic actual arguments.
470 : */
471 74554916 : if (polymorphic) {
472 : int cnt = 0;
473 288319579 : for (k = i = p->retc; i < p->argc; i++) {
474 237052323 : int actual = getArgType(mb, p, i);
475 237052323 : if (isAnyExpression(actual))
476 10 : cnt++;
477 : }
478 51267256 : if (cnt == 0 && s->kind != COMMANDsymbol
479 27143609 : && s->kind != PATTERNsymbol) {
480 11 : assert(s->kind == FUNCTIONsymbol);
481 11 : s = cloneFunction(scope, s, mb, p);
482 11 : if (mb->errors)
483 3 : goto wrapup;
484 : }
485 : }
486 : /* Any previously found error in the block
487 : * turns the complete block into erroneous.
488 : if (mb->errors) {
489 : p->typeresolved = false;
490 : goto wrapup;
491 : }
492 : */
493 :
494 : /*
495 : * We found the proper function. Copy some properties. In
496 : * particular, determine the calling strategy, i.e. FCNcall,
497 : * CMDcall, PATcall Beware that polymorphic functions
498 : * may produce type-incorrect clones. This piece of code may be
499 : * shared by the separate binder
500 : */
501 74554913 : if (p->token == ASSIGNsymbol) {
502 74567533 : switch (s->kind) {
503 24959945 : case COMMANDsymbol:
504 24959945 : p->token = CMDcall;
505 24959945 : p->fcn = s->func->imp; /* C implementation mandatory */
506 24959945 : if (p->fcn == NULL) {
507 1 : if (!silent)
508 1 : mb->errors = createMalException(mb, idx, TYPE,
509 : "object code for command %s.%s missing",
510 : p->modname, p->fcnname);
511 1 : p->typeresolved = false;
512 1 : goto wrapup;
513 : }
514 : break;
515 49597156 : case PATTERNsymbol:
516 49597156 : p->token = PATcall;
517 49597156 : p->fcn = s->func->imp; /* C implementation optional */
518 49597156 : break;
519 10432 : case FUNCTIONsymbol:
520 10432 : p->token = FCNcall;
521 10432 : if (getSignature(s)->fcn)
522 0 : p->fcn = getSignature(s)->fcn; /* C implementation optional */
523 : break;
524 0 : default:
525 0 : if (!silent)
526 0 : mb->errors = createMalException(mb, idx, MAL,
527 : "MALresolve: unexpected token type");
528 0 : goto wrapup;
529 : }
530 74567532 : p->blk = s->def;
531 : }
532 :
533 74554912 : if (returntype != returns)
534 40 : GDKfree(returntype);
535 : return s1;
536 : } /* while */
537 : /*
538 : * We haven't found the correct function. To ease debugging, we
539 : * may reveal that we found an instruction with the proper
540 : * arguments, but that clashes with one of the target variables.
541 : */
542 1256 : wrapup:
543 1260 : if (returntype != returns)
544 0 : GDKfree(returntype);
545 : return -3;
546 : }
547 :
548 : /*
549 : * We try to clear the type check flag by looking up the
550 : * functions. Errors are simply ignored at this point of the game,
551 : * because they may be resolved as part of the calling sequence.
552 : */
553 : static void
554 5 : typeMismatch(MalBlkPtr mb, InstrPtr p, int idx, int lhs, int rhs, int silent)
555 : {
556 5 : str n1;
557 5 : str n2;
558 :
559 5 : if (!silent) {
560 5 : n1 = getTypeName(lhs);
561 5 : n2 = getTypeName(rhs);
562 5 : mb->errors = createMalException(mb, idx, TYPE, "type mismatch %s := %s", n1,
563 : n2);
564 5 : GDKfree(n1);
565 5 : GDKfree(n2);
566 : }
567 5 : p->typeresolved = false;
568 5 : }
569 :
570 : /*
571 : * A function search should inspect all modules unless a specific module
572 : * is given. Preference is given to the lower scopes.
573 : * The type check is set to TYPE_UNKNOWN first to enforce a proper
574 : * analysis. This way it forms a cheap mechanism to resolve
575 : * the type after a change by an optimizer.
576 : * If we can not find the function, the type check returns unsuccessfully.
577 : * In this case we should issue an error message to the user.
578 : *
579 : * A re-check after the optimizer call should reset the token
580 : * to assignment.
581 : */
582 : void
583 86309469 : typeChecker(Module scope, MalBlkPtr mb, InstrPtr p, int idx, int silent)
584 : {
585 86309469 : int s1 = -1, i, k;
586 86309469 : Module m = 0;
587 :
588 86309469 : p->typeresolved = false;
589 86309469 : if ((p->fcn || p->blk) && p->token >= FCNcall && p->token <= PATcall) {
590 60243155 : p->token = ASSIGNsymbol;
591 60243155 : p->fcn = NULL;
592 60243155 : p->blk = NULL;
593 : }
594 :
595 86309469 : if (isaSignature(p)) {
596 4442327 : for (k = 0; k < p->argc; k++)
597 2225561 : setVarFixed(mb, getArg(p, k));
598 2219870 : for (k = p->retc; k < p->argc; k++) {
599 3104 : prepostProcess(getArgType(mb, p, k), p, k, mb);
600 : }
601 2216766 : p->typeresolved = true;
602 4439281 : for (k = 0; k < p->retc; k++)
603 2222515 : p->typeresolved &= typeResolved(mb, p, 0);
604 76774632 : return;
605 : }
606 84092703 : if (getFunctionId(p) && getModuleId(p)) {
607 74540471 : m = findModule(scope, getModuleId(p));
608 :
609 74554257 : if (!m || strcmp(m->name, getModuleId(p)) != 0) {
610 194 : if (!silent)
611 2 : mb->errors = createMalException(mb, idx, TYPE, "'%s%s%s' undefined",
612 : (getModuleId(p) ? getModuleId(p) : ""),
613 1 : (getModuleId(p) ? "." : ""),
614 : getFunctionId(p));
615 194 : return;
616 : }
617 74554063 : s1 = findFunctionType(m, mb, p, idx, silent);
618 :
619 74557584 : if (s1 >= 0)
620 : return;
621 : /*
622 : * Could not find a function that satisfies the constraints.
623 : * If the instruction is just a function header we may
624 : * continue. Likewise, the function and module may refer to
625 : * string variables known only at runtime.
626 : *
627 : * In all other cases we should generate a message, but only
628 : * if we know that the error was not caused by checking the
629 : * definition of a polymorphic function or the module or
630 : * function name are variables, In those cases, the detailed
631 : * analysis is performed upon an actual call.
632 : */
633 1480 : if (!isaSignature(p) && !getInstrPtr(mb, 0)->polymorphic) {
634 1469 : if (!silent) {
635 28 : char *errsig = NULL;
636 28 : if (!malLibraryEnabled(p->modname)) {
637 0 : mb->errors = createMalException(mb, idx, TYPE,
638 : "'%s%s%s' library error in: %s",
639 : (getModuleId(p) ?
640 : getModuleId(p) : ""),
641 0 : (getModuleId(p) ? "." : ""),
642 : getFunctionId(p),
643 : malLibraryHowToEnable(p->
644 : modname));
645 : } else {
646 28 : bool free_errsig = false, special_undefined = false;
647 28 : errsig = malLibraryHowToEnable(p->modname);
648 28 : if (!strcmp(errsig, "")) {
649 28 : errsig = instruction2str(mb, 0, p,
650 : (LIST_MAL_NAME | LIST_MAL_TYPE
651 : | LIST_MAL_VALUE));
652 28 : free_errsig = true;
653 : } else {
654 : special_undefined = true;
655 : }
656 84 : mb->errors = createMalException(mb, idx, TYPE,
657 : "'%s%s%s' undefined%s: %s",
658 : (getModuleId(p) ?
659 : getModuleId(p) : ""),
660 28 : (getModuleId(p) ? "." : ""),
661 : getFunctionId(p),
662 : special_undefined ? "" :
663 : " in",
664 : errsig ? errsig :
665 : "failed instruction2str()");
666 28 : if (free_errsig)
667 28 : GDKfree(errsig);
668 : }
669 : }
670 1469 : p->typeresolved = false;
671 : } else
672 11 : p->typeresolved = true;
673 1480 : return;
674 : }
675 : /*
676 : * When we arrive here the operator is an assignment.
677 : * The language should also recognize (a,b):=(1,2);
678 : * This is achieved by propagation of the rhs types to the lhs
679 : * variables.
680 : */
681 9552232 : if (getFunctionId(p)) {
682 : return;
683 : }
684 9552149 : if (p->retc >= 1 && p->argc > p->retc && p->argc != 2 * p->retc) {
685 7 : if (!silent) {
686 7 : mb->errors = createMalException(mb, idx, TYPE,
687 : "Multiple assignment mismatch");
688 : }
689 7 : p->typeresolved = true;
690 : } else
691 9552142 : p->typeresolved = true;
692 17448428 : for (k = 0, i = p->retc; k < p->retc && i < p->argc; i++, k++) {
693 7893947 : int rhs = getArgType(mb, p, i);
694 7893947 : int lhs = getArgType(mb, p, k);
695 :
696 7893947 : if (rhs != TYPE_void) {
697 7893796 : if (resolveType(&s1, lhs, rhs) < 0) {
698 5 : typeMismatch(mb, p, idx, lhs, rhs, silent);
699 5 : return;
700 : }
701 : } else {
702 : /*
703 : * The language permits assignment of 'nil' to any variable,
704 : * using the target type.
705 : */
706 151 : if (lhs != TYPE_void && lhs != TYPE_any) {
707 3 : ValRecord cst = { .vtype = TYPE_void, .val.oval = void_nil, .bat = isaBatType(lhs) };
708 3 : int k;
709 :
710 3 : k = defConstant(mb, lhs, &cst);
711 3 : if (k >= 0)
712 3 : p->argv[i] = k;
713 3 : rhs = lhs;
714 : }
715 : }
716 :
717 7896279 : if (!isVarFixed(mb, getArg(p, k))) {
718 3519538 : setVarType(mb, getArg(p, k), rhs);
719 3519538 : setVarFixed(mb, getArg(p, k));
720 : }
721 7896279 : prepostProcess(s1, p, i, mb);
722 7896279 : prepostProcess(s1, p, k, mb);
723 : }
724 : /* the case where we have no rhs */
725 9554481 : if (p->barrier && p->retc == p->argc)
726 545366 : for (k = 0; k < p->retc; k++) {
727 276817 : int tpe = getArgType(mb, p, k);
728 276817 : if (isaBatType(tpe) ||
729 267164 : ATOMtype(tpe) == TYPE_str ||
730 267164 : (!isPolyType(tpe) && tpe < MAXATOMS && ATOMextern(tpe)))
731 9659 : setVarCleanup(mb, getArg(p, k));
732 : }
733 : }
734 :
735 : /*
736 : * After the parser finishes, we have to look for semantic errors,
737 : * such as flow of control problems and possible typeing conflicts.
738 : * The nesting of BARRIER and CATCH statements with their associated
739 : * flow of control primitives LEAVE and RETRY should form a valid
740 : * hierarchy. Failure to comply is considered a structural error
741 : * and leads to flagging the function as erroneous.
742 : * Also check general conformaty of the ML block structure.
743 : * It should start with a signature and finish with and ENDsymbol
744 : *
745 : * Type checking a program is limited to those instructions that are
746 : * not resolved yet. Once the program is completely checked, further calls
747 : * should be ignored. This should be separately administered for the flow
748 : * as well, because a dynamically typed instruction should later on not
749 : * lead to a re-check when it was already fully analyzed.
750 : */
751 : str
752 3007439 : chkTypes(Module s, MalBlkPtr mb, int silent)
753 : {
754 3007439 : InstrPtr p = 0;
755 3007439 : int i;
756 3007439 : str msg = MAL_SUCCEED;
757 :
758 200497930 : for (i = 0; mb->errors == NULL && i < mb->stop; i++) {
759 197488677 : p = getInstrPtr(mb, i);
760 197488677 : assert(p != NULL);
761 197488677 : if (!p->typeresolved)
762 84693330 : typeChecker(s, mb, p, i, silent);
763 : }
764 3009253 : if (mb->errors) {
765 41 : msg = mb->errors;
766 41 : mb->errors = NULL;
767 : }
768 3009253 : return msg;
769 : }
770 :
771 : /*
772 : * Type checking an individual instruction is dangerous,
773 : * because it ignores data flow and variable declarations.
774 : */
775 : int
776 23 : chkInstruction(Module s, MalBlkPtr mb, InstrPtr p)
777 : {
778 23 : if (mb->errors == MAL_SUCCEED) {
779 23 : p->typeresolved = false;
780 23 : typeChecker(s, mb, p, getPC(mb, p), TRUE);
781 : }
782 23 : return mb->errors != MAL_SUCCEED;
783 : }
784 :
785 : /*
786 : * Perform silent check on the program, merely setting the error flag.
787 : */
788 : str
789 577452 : chkProgram(Module s, MalBlkPtr mb)
790 : {
791 577452 : str msg;
792 : /* it is not ready yet, too fragile
793 : mb->typefixed = mb->stop == chk; ignored END */
794 : /* if( mb->flowfixed == 0)*/
795 :
796 577452 : if (mb->errors) {
797 23 : msg = mb->errors;
798 23 : mb->errors = NULL;
799 23 : return msg;
800 : }
801 577429 : msg = chkTypes(s, mb, FALSE);
802 578790 : if (msg == MAL_SUCCEED)
803 578773 : msg = chkFlow(mb);
804 577694 : if (msg == MAL_SUCCEED)
805 577854 : msg = chkDeclarations(mb);
806 : return msg;
807 : }
808 :
809 : /*
810 : * Polymorphic type analysis
811 : * MAL provides for type variables of the form any$N. This feature
812 : * supports polymorphic types, but also complicates the subsequent
813 : * analysis. A variable typed with any$N not occurring in the function
814 : * header leads to a dynamic typed statement. In principle we have
815 : * to type check the function upon each call.
816 : */
817 : static bool
818 2222515 : typeResolved(MalBlkPtr mb, InstrPtr p, int i)
819 : {
820 2222515 : malType t = getArgType(mb, p, i);
821 2222515 : if (t == TYPE_any || isAnyExpression(t)) {
822 558679 : return false;
823 : }
824 : return true;
825 : }
826 :
827 : /*
828 : * For a polymorphic commands we do not generate a cloned version.
829 : * It suffices to determine the actual return value taking into
830 : * account the type variable constraints.
831 : */
832 : static malType
833 202322156 : getPolyType(malType t, int *polytype)
834 : {
835 202322156 : int ti;
836 202322156 : malType tail;
837 :
838 202322156 : ti = getTypeIndex(t);
839 202322156 : if (!isaBatType(t) && ti > 0) {
840 17642128 : tail = polytype[ti];
841 17642128 : if (getOptBat(t))
842 385 : setOptBat(tail);
843 17642128 : return tail;
844 : }
845 :
846 184680028 : tail = ti == 0 ? getBatType(t) : polytype[ti];
847 184680028 : if (isaBatType(t)) {
848 181668975 : tail = newBatType(tail);
849 : }
850 184680028 : if (getOptBat(t))
851 12366 : setOptBat(tail);
852 : return tail;
853 : }
854 :
855 : /*
856 : * Each argument is checked for binding of polymorphic arguments.
857 : * This routine assumes that the type index is indeed smaller than maxarg.
858 : * (The parser currently enforces a single digit from 1-2 )
859 : * The polymorphic type 'any', i.e. any_0, does never constraint an operation
860 : * it can match with all polymorphic types.
861 : * The routine returns the instantiated formal type for subsequent
862 : * type resolution.
863 : */
864 : static int
865 154524334 : updateTypeMap(int formal, int actual, int polytype[MAXTYPEVAR])
866 : {
867 154524334 : int h, t, ret = 0;
868 :
869 154524334 : if (!isAnyExpression(formal) && isaBatType(formal) && isaBatType(actual))
870 : return 0;
871 :
872 63558881 : if ((h = getTypeIndex(formal))) {
873 61143484 : if (isaBatType(actual) && !isaBatType(formal) && !getOptBat(formal) &&
874 6081580 : (polytype[h] == TYPE_any || polytype[h] == actual)) {
875 5341985 : polytype[h] = actual;
876 5341985 : return 0;
877 : }
878 55801499 : t = getBatType(actual);
879 55801499 : if (t != polytype[h]) {
880 33648653 : if (isaBatType(polytype[h]) && isaBatType(actual))
881 : ret = 0;
882 33647305 : else if (polytype[h] == TYPE_any)
883 33186241 : polytype[h] = t;
884 : else {
885 : return -1;
886 : }
887 : }
888 : }
889 57755832 : if (isaBatType(formal)) {
890 44123118 : if (!isaBatType(actual))
891 : return -1;
892 : }
893 : return ret;
894 : }
|