gdk_join.c source code [MonetDB/gdk/gdk_join.c]

1	/*
2	* This Source Code Form is subject to the terms of the Mozilla Public
3	* License, v. 2.0. If a copy of the MPL was not distributed with this
4	* file, You can obtain one at http://mozilla.org/MPL/2.0/.
5	*
6	* Copyright 1997 - July 2008 CWI, August 2008 - 2019 MonetDB B.V.
7	*/
8
9	#include "monetdb_config.h"
10	#include "gdk.h"
11	#include "gdk_private.h"
12	#include "gdk_calc_private.h"
13
14	/*
15	* All join variants produce some sort of join on two input BATs,
16	* optionally subject to up to two candidate lists. Only values in
17	* the input BATs that are mentioned in the associated candidate list
18	* (if provided) are eligible. They all return two output BATs in the
19	* first two arguments. The join operations differ in the way in
20	* which tuples from the two inputs are matched.
21	*
22	* The outputs consist of two aligned BATs (i.e. same length and same
23	* hseqbase (0@0)) that contain the OIDs of the input BATs that match.
24	* The candidate lists, if given, contain the OIDs of the associated
25	* input BAT which must be considered for matching. The input BATs
26	* must have the same type.
27	*
28	* All functions also have a parameter nil_matches which indicates
29	* whether NIL must be considered an ordinary value that can match, or
30	* whether NIL must be considered to never match.
31	*
32	* The join functions that are provided here are:
33	* BATjoin
34	* normal equi-join
35	* BATleftjoin
36	* normal equi-join, but the left output is sorted
37	* BATouterjoin
38	* equi-join, but the left output is sorted, and if there is no
39	* match for a value in the left input, there is still an output
40	* with NIL in the right output
41	* BATsemijoin
42	* equi-join, but the left output is sorted, and if there are
43	* multiple matches, only one is returned (i.e., the left output
44	* is also key)
45	* BATthetajoin
46	* theta-join: an extra operator must be provided encoded as an
47	* integer (macros JOIN_EQ, JOIN_NE, JOIN_LT, JOIN_LE, JOIN_GT,
48	* JOIN_GE); values match if the left input has the given
49	* relationship with the right input; order of the outputs is not
50	* guaranteed
51	* BATbandjoin
52	* band-join: two extra input values (c1, c2) must be provided as
53	* well as Booleans (li, hi) that indicate whether the value
54	* ranges are inclusive or not; values in the left and right
55	* inputs match if right - c1 <[=] left <[=] right + c2; if c1 or
56	* c2 is NIL, there are no matches
57	* BATrangejoin
58	* range-join: the right input consists of two aligned BATs,
59	* values match if the left value is between two corresponding
60	* right values; two extra Boolean parameters, li and hi,
61	* indicate whether equal values match
62	*
63	* In addition to these functions, there are two more functions that
64	* are closely related:
65	* BATintersect
66	* intersection: return a candidate list with OIDs of tuples in
67	* the left input whose value occurs in the right input
68	* BATdiff
69	* difference: return a candidate list with OIDs of tuples in the
70	* left input whose value does not occur in the right input
71	*/
72
73	/ Perform a bunch of sanity checks on the inputs to a join. /
74	static gdk_return
75	joinparamcheck(BAT l, BAT r1, BAT r2, BAT sl, BAT sr, const* char *func)
76	{
77	if (ATOMtype(l->ttype) != ATOMtype(r1->ttype) \|\|
78	(r2 && ATOMtype(l->ttype) != ATOMtype(r2->ttype))) {
79	GDKerror("%s: inputs not compatible.\n", func);
80	return GDK_FAIL;
81	}
82	if (r2 &&
83	(BATcount(r1) != BATcount(r2) \|\| r1->hseqbase != r2->hseqbase)) {
84	GDKerror("%s: right inputs not aligned.\n", func);
85	return GDK_FAIL;
86	}
87	if ((sl && ATOMtype(sl->ttype) != TYPE_oid) \|\|
88	(sr && ATOMtype(sr->ttype) != TYPE_oid)) {
89	GDKerror("%s: candidate lists must have type OID.\n", func);
90	return GDK_FAIL;
91	}
92	if ((sl && !BATtordered(sl)) \|\|
93	(sr && !BATtordered(sr))) {
94	GDKerror("%s: candidate lists must be sorted.\n", func);
95	return GDK_FAIL;
96	}
97	if ((sl && !BATtkey(sl)) \|\|
98	(sr && !BATtkey(sr))) {
99	GDKerror("%s: candidate lists must be unique.\n", func);
100	return GDK_FAIL;
101	}
102	return GDK_SUCCEED;
103	}
104
105	/ Create the result bats for a join, returns the absolute maximum*
106	* number of outputs that could possibly be generated. */
107	static BUN
108	joininitresults(BAT r1p, BAT r2p, BUN lcnt, BUN rcnt, bool lkey, bool rkey,
109	bool semi, bool nil_on_miss, bool only_misses, BUN estimate)
110	{
111	BAT r1, r2;
112	BUN maxsize, size;
113
114	/ if nil_on_miss is set, we really need a right output /
115	assert(!nil_on_miss \|\| r2p != NULL);
116
117	lkey \|= lcnt <= `1`;
118	rkey \|= rcnt <= `1`;
119
120	*r1p = NULL;
121	if (r2p)
122	*r2p = NULL;
123	if (lcnt == `0`) {
124	/ there is nothing to match /
125	maxsize = `0`;
126	} else if (!only_misses && !nil_on_miss && rcnt == `0`) {
127	/ if right is empty, we have no hits, so if we don't*
128	* want misses, the result is empty */
129	maxsize = `0`;
130	} else if (rkey \| semi \| only_misses) {
131	/ each entry left matches at most one on right, in*
132	* case nil_on_miss is also set, each entry matches
133	* exactly one (see below) */
134	maxsize = lcnt;
135	} else if (lkey) {
136	/ each entry on right is matched at most once /
137	if (nil_on_miss) {
138	/ one entry left could match all right, and*
139	* all other entries left match nil */
140	maxsize = lcnt + rcnt - `1`;
141	} else {
142	maxsize = rcnt;
143	}
144	} else if (rcnt == `0`) {
145	/ nil_on_miss must be true due to previous checks, so*
146	* all values on left miss */
147	maxsize = lcnt;
148	} else if (BUN_MAX / lcnt >= rcnt) {
149	/ in the worst case we have a full cross product /
150	maxsize = lcnt * rcnt;
151	} else {
152	/ a BAT cannot grow larger than BUN_MAX /
153	maxsize = BUN_MAX;
154	}
155	size = estimate == BUN_NONE ? lcnt < rcnt ? lcnt : rcnt : estimate;
156	if (size < `1024`)
157	size = `1024`;
158	if (size > maxsize)
159	size = maxsize;
160	if ((rkey \| semi \| only_misses) & nil_on_miss) {
161	/ see comment above: each entry left matches exactly*
162	* once */
163	size = maxsize;
164	}
165
166	if (maxsize == `0`) {
167	r1 = BATdense(`0`, `0`, `0`);
168	if (r1 == NULL) {
169	return BUN_NONE;
170	}
171	if (r2p) {
172	r2 = BATdense(`0`, `0`, `0`);
173	if (r2 == NULL) {
174	BBPreclaim(r1);
175	return BUN_NONE;
176	}
177	*r2p = r2;
178	}
179	*r1p = r1;
180	return `0`;
181	}
182
183	r1 = COLnew(`0`, TYPE_oid, size, TRANSIENT);
184	if (r1 == NULL) {
185	return BUN_NONE;
186	}
187	r1->tnil = false;
188	r1->tnonil = true;
189	r1->tkey = true;
190	r1->tsorted = true;
191	r1->trevsorted = true;
192	r1->tseqbase = `0`;
193	*r1p = r1;
194	if (r2p) {
195	r2 = COLnew(`0`, TYPE_oid, size, TRANSIENT);
196	if (r2 == NULL) {
197	BBPreclaim(r1);
198	return BUN_NONE;
199	}
200	r2->tnil = false;
201	r2->tnonil = true;
202	r2->tkey = true;
203	r2->tsorted = true;
204	r2->trevsorted = true;
205	r2->tseqbase = `0`;
206	*r2p = r2;
207	}
208	return maxsize;
209	}
210
211	#define VALUE(s, x) (s##vars ? \
212	s##vars + VarHeapVal(s##vals, (x), s##width) : \
213	s##vals ? (const char ) s##vals + ((x) s##width) : \
214	(s##val = BUNtoid(s, (x)), (const char *) &s##val))
215	#define FVALUE(s, x) ((const char ) s##vals + ((x) s##width))
216
217	#define APPEND(b, o) (((oid *) b->theap.base)[b->batCount++] = (o))
218
219	#define MAYBEEXTEND_PROGRESS(CNT, LCUR, LCNT) \
220	do { \
221	BUN N = (CNT); \
222	if (BATcount(r1) + N > BATcapacity(r1)) { \
223	/* make some extra space by extrapolating how */ \
224	/* much more we need (fraction of l we've seen */ \
225	/* so far is used as the fraction of the */ \
226	/* expected result size we've produced so */ \
227	/* far) */ \
228	BUN newcap = (BUN) ((double) (LCNT) / (LCUR) * (BATcount(r1) + N) * 1.5); \
229	if (newcap < N + BATcount(r1)) \
230	newcap = N + BATcount(r1) + 1024; \
231	if (newcap > maxsize) \
232	newcap = maxsize; \
233	/* make sure heap.free is set properly before \
234	* extending */ \
235	BATsetcount(r1, BATcount(r1)); \
236	if (BATextend(r1, newcap) != GDK_SUCCEED) \
237	goto bailout; \
238	if (r2) { \
239	BATsetcount(r2, BATcount(r2)); \
240	if (BATextend(r2, newcap) != GDK_SUCCEED) \
241	goto bailout; \
242	assert(BATcapacity(r1) == BATcapacity(r2)); \
243	} \
244	} \
245	} while (0)
246
247	#define MAYBEEXTEND(CNT, CI) MAYBEEXTEND_PROGRESS(CNT, (CI)->next, (CI)->ncand)
248	#define MAYBEEXTEND_NO_CAND(CNT) MAYBEEXTEND_PROGRESS(CNT, lstart, lend)
249
250	/ Return BATs through r1p and r2p for the case that there is no*
251	* match between l and r, taking all flags into consideration.
252	*
253	* This means, if nil_on_miss is set or only_misses is set, *r1p is a
254	* copy of the left candidate list or a dense list of all "head"
255	* values of l, and *r2p (if r2p is not NULL) is all nil. If neither
256	* of those flags is set, the result is two empty BATs. */
257	static gdk_return
258	nomatch(BAT r1p, BAT r2p, BAT l, BAT r, struct canditer *restrict lci,
259	bool nil_on_miss, bool only_misses, const char *func, lng t0)
260	{
261	BAT r1, r2 = NULL;
262
263	if (lci->ncand == `0` \|\| !(nil_on_miss \| only_misses)) {
264	/ return empty BATs /
265	if ((r1 = BATdense(`0`, `0`, `0`)) == NULL)
266	return GDK_FAIL;
267	if (r2p) {
268	if ((r2 = BATdense(`0`, `0`, `0`)) == NULL) {
269	BBPreclaim(r1);
270	return GDK_FAIL;
271	}
272	*r2p = r2;
273	}
274	*r1p = r1;
275	ALGODEBUG fprintf(stderr,
276	"#%s(l=%s,r=%s)=(" ALGOBATFMT "," ALGOOPTBATFMT ") " LLFMT "us -- nomatch\n",
277	func, BATgetId(l), BATgetId(r),
278	ALGOBATPAR(r1), ALGOOPTBATPAR(r2),
279	GDKusec() - t0);
280	return GDK_SUCCEED;
281	}
282
283	r1 = canditer_slice(lci, `0`, lci->ncand);
284	if (r2p) {
285	if ((r2 = BATconstant(`0`, TYPE_void, &oid_nil, lci->ncand, TRANSIENT)) == NULL) {
286	BBPreclaim(r1);
287	return GDK_FAIL;
288	}
289	*r2p = r2;
290	}
291	*r1p = r1;
292	ALGODEBUG fprintf(stderr,
293	"#%s(l=%s,r=%s)=(" ALGOBATFMT "," ALGOOPTBATFMT ") " LLFMT "us -- nomatch\n",
294	func, BATgetId(l), BATgetId(r),
295	ALGOBATPAR(r1), ALGOOPTBATPAR(r2),
296	GDKusec() - t0);
297	return GDK_SUCCEED;
298	}
299
300	/ Implementation of join where there is a single value (possibly*
301	* repeated multiple times) on the left. This means we can use a
302	* point select to find matches in the right column. */
303	static gdk_return
304	selectjoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr,
305	struct canditer *restrict lci, bool nil_matches, lng t0,
306	bool swapped, const char *reason)
307	{
308	BATiter li = bat_iterator(l);
309	const void *v;
310	BAT *bn = NULL;
311
312	assert(lci->ncand > `0`);
313	assert(lci->ncand == `1` \|\| (l->tsorted && l->trevsorted));
314
315	oid o = canditer_next(lci);
316	v = BUNtail(li, o - l->hseqbase);
317
318	if (!nil_matches &&
319	(*ATOMcompare(l->ttype))(v, ATOMnilptr(l->ttype)) == `0`) {
320	/ NIL doesn't match anything /
321	return nomatch(r1p, r2p, l, r, lci, false, false,
322	"selectjoin", t0);
323	}
324
325	bn = BATselect(r, sr, v, NULL, true, true, false);
326	if (bn == NULL) {
327	return GDK_FAIL;
328	}
329	if (BATcount(bn) == `0`) {
330	BBPunfix(bn->batCacheid);
331	return nomatch(r1p, r2p, l, r, lci, false, false,
332	"selectjoin", t0);
333	}
334	BAT r1 = COLnew(`0`, TYPE_oid, lci->ncand BATcount(bn), TRANSIENT);
335	if (r1 == NULL) {
336	BBPunfix(bn->batCacheid);
337	return GDK_FAIL;
338	}
339	BAT *r2 = NULL;
340	if (r2p) {
341	r2 = COLnew(`0`, TYPE_oid, lci->ncand * BATcount(bn), TRANSIENT);
342	if (r2 == NULL) {
343	BBPunfix(bn->batCacheid);
344	BBPreclaim(r1);
345	return GDK_FAIL;
346	}
347	}
348
349	r1->tsorted = true;
350	r1->trevsorted = lci->ncand == `1`;
351	r1->tseqbase = BATcount(bn) == `1` && lci->tpe == cand_dense ? o : oid_nil;
352	r1->tkey = BATcount(bn) == `1`;
353	r1->tnil = false;
354	r1->tnonil = true;
355	if (r2) {
356	r2->tsorted = lci->ncand == `1` \|\| BATcount(bn) == `1`;
357	r2->trevsorted = BATcount(bn) == `1`;
358	r2->tseqbase = lci->ncand == `1` && BATtdense(bn) ? bn->tseqbase : oid_nil;
359	r2->tkey = lci->ncand == `1`;
360	r2->tnil = false;
361	r2->tnonil = true;
362	}
363	if (BATtdense(bn)) {
364	oid o1p = (oid ) Tloc(r1, `0`);
365	oid o2p = r2 ? (oid ) Tloc(r2, `0`) : NULL;
366	oid bno = bn->tseqbase;
367	BUN p, q = BATcount(bn);
368
369	do {
370	for (p = `0`; p < q; p++) {
371	*o1p++ = o;
372	}
373	if (o2p) {
374	for (p = `0`; p < q; p++) {
375	*o2p++ = bno + p;
376	}
377	}
378	o = canditer_next(lci);
379	} while (!is_oid_nil(o));
380	} else {
381	oid o1p = (oid ) Tloc(r1, `0`);
382	oid o2p = r2 ? (oid ) Tloc(r2, `0`) : NULL;
383	const oid bnp = (const* oid *) Tloc(bn, `0`);
384	BUN p, q = BATcount(bn);
385
386	do {
387	for (p = `0`; p < q; p++) {
388	*o1p++ = o;
389	}
390	if (o2p) {
391	for (p = `0`; p < q; p++) {
392	*o2p++ = bnp[p];
393	}
394	}
395	o = canditer_next(lci);
396	} while (!is_oid_nil(o));
397	}
398	BATsetcount(r1, lci->ncand * BATcount(bn));
399	*r1p = r1;
400	if (r2p) {
401	BATsetcount(r2, lci->ncand * BATcount(bn));
402	*r2p = r2;
403	}
404	BBPunfix(bn->batCacheid);
405	ALGODEBUG fprintf(stderr, "#%s: %s(l=" ALGOBATFMT ","
406	"r=" ALGOBATFMT ",sl=" ALGOOPTBATFMT ","
407	"sr=" ALGOOPTBATFMT ",nil_matches=%d)%s %s "
408	"-> (" ALGOBATFMT "," ALGOOPTBATFMT ") " LLFMT "us\n",
409	MT_thread_getname(), __func__,
410	ALGOBATPAR(l), ALGOBATPAR(r),
411	ALGOOPTBATPAR(sl), ALGOOPTBATPAR(sr),
412	nil_matches,
413	swapped ? " swapped" : "", reason,
414	ALGOBATPAR(r1), ALGOOPTBATPAR(r2),
415	GDKusec() - t0);
416
417	return GDK_SUCCEED;
418	}
419
420	#if SIZEOF_OID == SIZEOF_INT
421	#define binsearch_oid(indir, offset, vals, lo, hi, v, ordering, last) binsearch_int(indir, offset, (const int *) vals, lo, hi, (int) (v), ordering, last)
422	#endif
423	#if SIZEOF_OID == SIZEOF_LNG
424	#define binsearch_oid(indir, offset, vals, lo, hi, v, ordering, last) binsearch_lng(indir, offset, (const lng *) vals, lo, hi, (lng) (v), ordering, last)
425	#endif
426
427	/ Implementation of join where the right-hand side is dense, and if*
428	* there is a right candidate list, it too is dense. In case
429	* nil_on_miss is not set, we use a range select (BATselect) to find
430	* the matching values in the left column and then calculate the
431	* corresponding matches from the right. If nil_on_miss is set, we
432	* need to do some more work. */
433	static gdk_return
434	mergejoin_void(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr,
435	struct canditer *restrict lci, struct canditer *restrict rci,
436	bool nil_on_miss, bool only_misses, lng t0, bool swapped,
437	const char *reason)
438	{
439	oid lo, hi;
440	BUN i;
441	oid o, o1p = NULL, o2p = NULL;
442	BAT r1 = NULL, r2 = NULL;
443	const oid *lvals = NULL;
444
445	/ r is dense, and if there is a candidate list, it too is*
446	* dense. This means we don't have to do any searches, we
447	* only need to compare ranges to know whether a value from l
448	* has a match in r */
449	assert(ATOMtype(l->ttype) == ATOMtype(r->ttype));
450	assert(r->tsorted \|\| r->trevsorted);
451	assert(BATcount(l) > `0`);
452	assert(rci->tpe == cand_dense);
453	assert(BATcount(r) > `0`);
454
455	/ figure out range [lo..hi) of values in r that we need to match /
456	lo = r->tseqbase;
457	hi = lo + BATcount(r);
458	/ restrict [lo..hi) range further using candidate list /
459	if (rci->seq > r->hseqbase)
460	lo += rci->seq - r->hseqbase;
461	if (rci->seq + rci->ncand < r->hseqbase + BATcount(r))
462	hi -= r->hseqbase + BATcount(r) - rci->seq - rci->ncand;
463
464	/ at this point, the matchable values in r are [lo..hi) /
465	if (!nil_on_miss) {
466	r1 = BATselect(l, sl, &lo, &hi, true, false, only_misses);
467	if (r1 == NULL)
468	return GDK_FAIL;
469	if (only_misses && !l->tnonil) {
470	/ also look for NILs /
471	r2 = BATselect(l, sl, &oid_nil, NULL, true, false, false);
472	if (r2 == NULL) {
473	BBPreclaim(r1);
474	return GDK_FAIL;
475	}
476	if (BATcount(r2) > `0`) {
477	BAT *mg = BATmergecand(r1, r2);
478	BBPunfix(r1->batCacheid);
479	BBPunfix(r2->batCacheid);
480	r1 = mg;
481	if (r1 == NULL)
482	return GDK_FAIL;
483	} else {
484	BBPunfix(r2->batCacheid);
485	}
486	r2 = NULL;
487	}
488	*r1p = r1;
489	if (r2p == NULL)
490	goto doreturn2;
491	if (BATcount(r1) == `0`) {
492	r2 = BATdense(`0`, `0`, `0`);
493	if (r2 == NULL) {
494	BBPreclaim(r1);
495	return GDK_FAIL;
496	}
497	} else if (BATtdense(r1) && BATtdense(l)) {
498	r2 = BATdense(`0`, l->tseqbase + r1->tseqbase - l->hseqbase + r->hseqbase - r->tseqbase, BATcount(r1));
499	if (r2 == NULL) {
500	BBPreclaim(r1);
501	return GDK_FAIL;
502	}
503	} else {
504	r2 = COLnew(`0`, TYPE_oid, BATcount(r1), TRANSIENT);
505	if (r2 == NULL) {
506	BBPreclaim(r1);
507	return GDK_FAIL;
508	}
509	const oid lp = (const* oid *) Tloc(l, `0`);
510	const oid o1p = (const* oid *) Tloc(r1, `0`);
511	oid o2p = (oid ) Tloc(r2, `0`);
512	hi = BATcount(r1);
513	if (l->ttype == TYPE_void && l->tvheap != NULL) {
514	/ this is actually generic code /
515	for (o = `0`; o < hi; o++)
516	o2p[o] = BUNtoid(l, BUNtoid(r1, o) - l->hseqbase) - r->tseqbase + r->hseqbase;
517	} else if (BATtdense(r1)) {
518	lo = r1->tseqbase - l->hseqbase;
519	if (r->tseqbase == r->hseqbase) {
520	memcpy(o2p, lp + lo, hi * SIZEOF_OID);
521	} else {
522	hi += lo;
523	for (o = `0`; lo < hi; o++, lo++) {
524	o2p[o] = lp[lo] - r->tseqbase + r->hseqbase;
525	}
526	}
527	} else if (BATtdense(l)) {
528	for (o = `0`; o < hi; o++) {
529	o2p[o] = o1p[o] - l->hseqbase + l->tseqbase - r->tseqbase + r->hseqbase;
530	}
531	} else {
532	for (o = `0`; o < hi; o++) {
533	o2p[o] = lp[o1p[o] - l->hseqbase] - r->tseqbase + r->hseqbase;
534	}
535	}
536	r2->tkey = l->tkey;
537	r2->tsorted = l->tsorted;
538	r2->trevsorted = l->trevsorted;
539	r2->tnil = false;
540	r2->tnonil = true;
541	BATsetcount(r2, BATcount(r1));
542	}
543	*r2p = r2;
544	goto doreturn2;
545	}
546	/ nil_on_miss is set, this means we must have a second output /
547	assert(r2p);
548	if (BATtdense(l)) {
549	/ if l is dense, we can further restrict the [lo..hi)*
550	* range to values in l that match with values in r */
551	o = lo;
552	i = lci->seq - l->hseqbase;
553	if (l->tseqbase + i > lo)
554	lo = l->tseqbase + i;
555	i = canditer_last(lci) + `1` - l->hseqbase;
556	if (l->tseqbase + i < hi)
557	hi = l->tseqbase + i;
558	if (lci->tpe == cand_dense) {
559	/ l is dense, and so is the left candidate*
560	* list (if it exists); this means we don't
561	* have to actually look at any values in l:
562	* we can just do some arithmetic; it also
563	* means that r1 will be dense, and if
564	* nil_on_miss is not set, or if all values in
565	* l match, r2 will too */
566	if (hi <= lo) {
567	return nomatch(r1p, r2p, l, r, lci,
568	nil_on_miss, only_misses,
569	"mergejoin_void", t0);
570	}
571
572	/ at this point, the matched values in l and*
573	* r (taking candidate lists into account) are
574	* [lo..hi) which we can translate back to the
575	* respective OID values that we can store in
576	* r1 and r2; note that r1 will be dense since
577	* all values in l will match something (even
578	* if nil since nil_on_miss is set) */
579	*r1p = r1 = BATdense(`0`, lci->seq, lci->ncand);
580	if (r1 == NULL)
581	return GDK_FAIL;
582	if (hi - lo < lci->ncand) {
583	/ we need to fill in nils in r2 for*
584	* missing values */
585	*r2p = r2 = COLnew(`0`, TYPE_oid, lci->ncand, TRANSIENT);
586	if (r2 == NULL) {
587	BBPreclaim(*r1p);
588	return GDK_FAIL;
589	}
590	o2p = (oid *) Tloc(r2, `0`);
591	i = l->tseqbase + lci->seq - l->hseqbase;
592	lo -= i;
593	hi -= i;
594	i += r->hseqbase - r->tseqbase;
595	for (o = `0`; o < lo; o++)
596	*o2p++ = oid_nil;
597	for (o = lo; o < hi; o++)
598	*o2p++ = o + i;
599	for (o = hi; o < lci->ncand; o++)
600	*o2p++ = oid_nil;
601	r2->tnonil = false;
602	r2->tnil = true;
603	/ sorted of no nils at end /
604	r2->tsorted = hi == lci->ncand;
605	/ reverse sorted if single non-nil at start /
606	r2->trevsorted = lo == `0` && hi == `1`;
607	r2->tseqbase = oid_nil;
608	/ (hi - lo) different OIDs in r2,*
609	* plus one for nil */
610	r2->tkey = hi - lo + `1` == lci->ncand;
611	BATsetcount(r2, lci->ncand);
612	} else {
613	/ no missing values /
614	*r2p = r2 = BATdense(`0`, r->hseqbase + lo - r->tseqbase, lci->ncand);
615	if (r2 == NULL) {
616	BBPreclaim(*r1p);
617	return GDK_FAIL;
618	}
619	}
620	goto doreturn;
621	}
622	/ l is dense, but the candidate list exists and is*
623	* not dense; we can, by manipulating the range
624	* [lo..hi), just look at the candidate list values */
625
626	/ translate lo and hi to l's OID values that now need*
627	* to match */
628	lo = lo - l->tseqbase + l->hseqbase;
629	hi = hi - l->tseqbase + l->hseqbase;
630
631	*r1p = r1 = COLnew(`0`, TYPE_oid, lci->ncand, TRANSIENT);
632	*r2p = r2 = COLnew(`0`, TYPE_oid, lci->ncand, TRANSIENT);
633	if (r1 == NULL \|\| r2 == NULL) {
634	BBPreclaim(r1);
635	BBPreclaim(r2);
636	return GDK_FAIL;
637	}
638	o1p = (oid *) Tloc(r1, `0`);
639	o2p = (oid *) Tloc(r2, `0`);
640	r2->tnil = false;
641	r2->tnonil = true;
642	r2->tkey = true;
643	r2->tsorted = true;
644	o = canditer_next(lci);
645	for (i = `0`; i < lci->ncand && o < lo; i++) {
646	*o1p++ = o;
647	*o2p++ = oid_nil;
648	o = canditer_next(lci);
649	}
650	if (i > `0`) {
651	r2->tnil = true;
652	r2->tnonil = false;
653	r2->tkey = i == `1`;
654	}
655	for (; i < lci->ncand && o < hi; i++) {
656	*o1p++ = o;
657	*o2p++ = o - l->hseqbase + l->tseqbase - r->tseqbase + r->hseqbase;
658	o = canditer_next(lci);
659	}
660	if (i < lci->ncand) {
661	r2->tkey = !r2->tnil && lci->ncand - i == `1`;
662	r2->tnil = true;
663	r2->tnonil = false;
664	r2->tsorted = false;
665	for (; i < lci->ncand; i++) {
666	*o1p++ = o;
667	*o2p++ = oid_nil;
668	o = canditer_next(lci);
669	}
670	}
671	BATsetcount(r1, lci->ncand);
672	r1->tseqbase = BATcount(r1) == `1` ? (oid)Tloc(r1, `0`) : oid_nil;
673	r1->tsorted = true;
674	r1->trevsorted = BATcount(r1) <= `1`;
675	r1->tnil = false;
676	r1->tnonil = true;
677	r1->tkey = true;
678	BATsetcount(r2, BATcount(r1));
679	r2->tseqbase = r2->tnil \|\| BATcount(r2) > `1` ? oid_nil : BATcount(r2) == `1` ? (oid)Tloc(r2, `0`) : `0`;
680	r2->trevsorted = BATcount(r2) <= `1`;
681	goto doreturn;
682	}
683	/ l is not dense, so we need to look at the values and check*
684	* whether they are in the range [lo..hi) */
685	lvals = (const oid *) Tloc(l, `0`);
686
687	/ do indirection through the candidate list to look at the*
688	* value */
689
690	*r1p = r1 = COLnew(`0`, TYPE_oid, lci->ncand, TRANSIENT);
691	*r2p = r2 = COLnew(`0`, TYPE_oid, lci->ncand, TRANSIENT);
692	if (r1 == NULL \|\| r2 == NULL) {
693	BBPreclaim(r1);
694	BBPreclaim(r2);
695	return GDK_FAIL;
696	}
697	o1p = (oid *) Tloc(r1, `0`);
698	o2p = (oid *) Tloc(r2, `0`);
699	r2->tnil = false;
700	r2->tnonil = true;
701	if (l->ttype == TYPE_void && l->tvheap != NULL) {
702	for (i = `0`; i < lci->ncand; i++) {
703	oid c = canditer_next(lci);
704
705	o = BUNtoid(l, c - l->hseqbase);
706	*o1p++ = c;
707	if (o >= lo && o < hi) {
708	*o2p++ = o - r->tseqbase + r->hseqbase;
709	} else {
710	*o2p++ = oid_nil;
711	r2->tnil = true;
712	r2->tnonil = false;
713	}
714	}
715	} else {
716	for (i = `0`; i < lci->ncand; i++) {
717	oid c = canditer_next(lci);
718
719	o = lvals[c - l->hseqbase];
720	*o1p++ = c;
721	if (o >= lo && o < hi) {
722	*o2p++ = o - r->tseqbase + r->hseqbase;
723	} else {
724	*o2p++ = oid_nil;
725	r2->tnil = true;
726	r2->tnonil = false;
727	}
728	}
729	}
730	r1->tsorted = true;
731	r1->trevsorted = BATcount(r1) <= `1`;
732	r1->tkey = true;
733	r1->tseqbase = oid_nil;
734	r1->tnil = false;
735	r1->tnonil = true;
736	BATsetcount(r1, lci->ncand);
737	BATsetcount(r2, lci->ncand);
738	r2->tsorted = l->tsorted \|\| BATcount(r2) <= `1`;
739	r2->trevsorted = l->trevsorted \|\| BATcount(r2) <= `1`;
740	r2->tkey = l->tkey \|\| BATcount(r2) <= `1`;
741	r2->tseqbase = oid_nil;
742
743	doreturn:
744	if (r1->tkey)
745	virtualize(r1);
746	if (r2->tkey && r2->tsorted)
747	virtualize(r2);
748	doreturn2:
749	ALGODEBUG fprintf(stderr, "#%s: %s(l=" ALGOBATFMT ","
750	"r=" ALGOBATFMT ",sl=" ALGOOPTBATFMT ","
751	"sr=" ALGOOPTBATFMT ","
752	"nil_on_miss=%d,only_misses=%d)%s %s "
753	"-> (" ALGOBATFMT "," ALGOOPTBATFMT ") " LLFMT "us\n",
754	MT_thread_getname(), __func__,
755	ALGOBATPAR(l), ALGOBATPAR(r),
756	ALGOOPTBATPAR(sl), ALGOOPTBATPAR(sr),
757	nil_on_miss, only_misses,
758	swapped ? " swapped" : "", reason,
759	ALGOBATPAR(r1), ALGOOPTBATPAR(r2),
760	GDKusec() - t0);
761
762	return GDK_SUCCEED;
763	}
764
765	/ Implementation of mergejoin (see below) for the special case that*
766	* the values are of type int, and some more conditions are met. */
767	static gdk_return
768	mergejoin_int(BAT r1p, BAT r2p, BAT l, BAT r,
769	bool nil_matches, BUN estimate, lng t0, bool swapped,
770	const char *reason)
771	{
772	BAT r1, r2;
773	BUN lstart, lend, lcnt;
774	BUN rstart, rend;
775	BUN lscan, rscan; / opportunistic scan window /
776	BUN maxsize;
777	const int lvals, rvals;
778	int v;
779	BUN nl, nr;
780	oid lv;
781	BUN i;
782
783	assert(ATOMtype(l->ttype) == ATOMtype(r->ttype));
784	assert(r->tsorted \|\| r->trevsorted);
785
786	lstart = rstart = `0`;
787	lend = BATcount(l);
788	lcnt = lend - lstart;
789	rend = BATcount(r);
790	lvals = (const int *) Tloc(l, `0`);
791	rvals = (const int *) Tloc(r, `0`);
792	assert(!r->tvarsized \|\| !r->ttype);
793
794	/ basic properties will be adjusted if necessary later on,*
795	* they were initially set by joininitresults() */
796
797	if (lend == `0` \|\| rend == `0`) {
798	/ there are no matches /
799	return nomatch(r1p, r2p, l, r,
800	&(struct canditer) {.tpe = cand_dense, .ncand = lcnt,},
801	false, false, __func__, t0);
802	}
803
804	if ((maxsize = joininitresults(r1p, r2p, BATcount(l), BATcount(r),
805	l->tkey, r->tkey, false, false,
806	false, estimate)) == BUN_NONE)
807	return GDK_FAIL;
808	r1 = *r1p;
809	r2 = r2p ? *r2p : NULL;
810
811	/ determine opportunistic scan window for l and r /
812	for (nl = lend - lstart, lscan = `4`; nl > `0`; lscan++)
813	nl >>= `1`;
814	for (nr = rend - rstart, rscan = `4`; nr > `0`; rscan++)
815	nr >>= `1`;
816
817	if (!nil_matches) {
818	/ skip over nils at the start of the columns /
819	if (lscan < lend - lstart && is_int_nil(lvals[lstart + lscan])) {
820	lstart = binsearch_int(NULL, `0`, lvals, lstart + lscan,
821	lend - `1`, int_nil, `1`, `1`);
822	} else {
823	while (is_int_nil(lvals[lstart]))
824	lstart++;
825	}
826	if (rscan < rend - rstart && is_int_nil(rvals[rstart + rscan])) {
827	rstart = binsearch_int(NULL, `0`, rvals, rstart + rscan,
828	rend - `1`, int_nil, `1`, `1`);
829	} else {
830	while (is_int_nil(rvals[rstart]))
831	rstart++;
832	}
833	}
834	/ from here on we don't have to worry about nil values /
835
836	while (lstart < lend && rstart < rend) {
837	v = rvals[rstart];
838
839	if (lscan < lend - lstart && lvals[lstart + lscan] < v) {
840	lstart = binsearch_int(NULL, `0`, lvals, lstart + lscan,
841	lend - `1`, v, `1`, `0`);
842	} else {
843	/ scan l for v /
844	while (lstart < lend && lvals[lstart] < v)
845	lstart++;
846	}
847	if (lstart >= lend) {
848	/ nothing found /
849	break;
850	}
851
852	/ Here we determine the next value in l that we are*
853	* going to try to match in r. We will also count the
854	* number of occurrences in l of that value.
855	* Afterwards, v points to the value and nl is the
856	* number of times it occurs. Also, lstart will
857	* point to the next value to be considered (ready for
858	* the next iteration).
859	* If there are many equal values in l (more than
860	* lscan), we will use binary search to find the end
861	* of the sequence. Obviously, we can do this only if
862	* l is actually sorted (lscan > 0). */
863	nl = `1`; / we'll match (at least) one in l /
864	nr = `0`; / maybe we won't match anything in r /
865	v = lvals[lstart];
866	if (l->tkey) {
867	/ if l is key, there is a single value /
868	lstart++;
869	} else if (lscan < lend - lstart &&
870	v == lvals[lstart + lscan]) {
871	/ lots of equal values: use binary search to*
872	* find end */
873	nl = binsearch_int(NULL, `0`, lvals, lstart + lscan,
874	lend - `1`, v, `1`, `1`);
875	nl -= lstart;
876	lstart += nl;
877	} else {
878	/ just scan /
879	while (++lstart < lend && v == lvals[lstart])
880	nl++;
881	}
882	/ lstart points one beyond the value we're*
883	* going to match: ready for the next iteration. */
884
885	/ First we find the first value in r that is at*
886	* least as large as v, then we find the first
887	* value in r that is larger than v. The difference
888	* is the number of values equal to v and is stored in
889	* nr.
890	* We will use binary search on r to find both ends of
891	* the sequence of values that are equal to v in case
892	* the position is "too far" (more than rscan
893	* away). */
894
895	/ first find the location of the first value in r*
896	* that is >= v, then find the location of the first
897	* value in r that is > v; the difference is the
898	* number of values equal to v */
899
900	/ look ahead a little (rscan) in r to see whether*
901	* we're better off doing a binary search */
902	if (rscan < rend - rstart && rvals[rstart + rscan] < v) {
903	/ value too far away in r: use binary*
904	* search */
905	rstart = binsearch_int(NULL, `0`, rvals, rstart + rscan,
906	rend - `1`, v, `1`, `0`);
907	} else {
908	/ scan r for v /
909	while (rstart < rend && rvals[rstart] < v)
910	rstart++;
911	}
912	if (rstart == rend) {
913	/ nothing found /
914	break;
915	}
916
917	/ now find the end of the sequence of equal values v /
918
919	/ if r is key, there is zero or one match, otherwise*
920	* look ahead a little (rscan) in r to see whether
921	* we're better off doing a binary search */
922	if (r->tkey) {
923	if (rstart < rend && v == rvals[rstart]) {
924	nr = `1`;
925	rstart++;
926	}
927	} else if (rscan < rend - rstart &&
928	v == rvals[rstart + rscan]) {
929	/ range too large: use binary search /
930	nr = binsearch_int(NULL, `0`, rvals, rstart + rscan,
931	rend - `1`, v, `1`, `1`);
932	nr -= rstart;
933	rstart += nr;
934	} else {
935	/ scan r for end of range /
936	while (rstart < rend && v == rvals[rstart]) {
937	nr++;
938	rstart++;
939	}
940	}
941	/ rstart points to first value > v or end of*
942	* r, and nr is the number of values in r that
943	* are equal to v */
944	if (nr == `0`) {
945	/ no entries in r found /
946	continue;
947	}
948	/ make space: nl values in l match nr values in r, so*
949	* we need to add nl * nr values in the results */
950	MAYBEEXTEND_NO_CAND(nl * nr);
951
952	/ maintain properties /
953	if (nl > `1`) {
954	/ value occurs multiple times in l, so entry*
955	* in r will be repeated multiple times: hence
956	* r2 is not key and not dense */
957	if (r2) {
958	r2->tkey = false;
959	r2->tseqbase = oid_nil;
960	}
961	/ multiple different values will be inserted*
962	* in r1 (always in order), so not reverse
963	* ordered anymore */
964	r1->trevsorted = false;
965	}
966	if (nr > `1`) {
967	/ value occurs multiple times in r, so entry*
968	* in l will be repeated multiple times: hence
969	* r1 is not key and not dense */
970	r1->tkey = false;
971	r1->tseqbase = oid_nil;
972	/ multiple different values will be inserted*
973	* in r2 (in order), so not reverse ordered
974	* anymore */
975	if (r2) {
976	r2->trevsorted = false;
977	if (nl > `1`) {
978	/ multiple values in l match*
979	* multiple values in r, so an
980	* ordered sequence will be
981	* inserted multiple times in
982	* r2, so r2 is not ordered
983	* anymore */
984	r2->tsorted = false;
985	}
986	}
987	}
988	if (BATcount(r1) > `0`) {
989	/ a new, higher value will be inserted into*
990	* r1, so r1 is not reverse ordered anymore */
991	r1->trevsorted = false;
992	/ a new higher value will be added to r2 /
993	if (r2) {
994	r2->trevsorted = false;
995	}
996	if (BATtdense(r1) &&
997	((oid *) r1->theap.base)[r1->batCount - `1`] + `1` != l->hseqbase + lstart - nl) {
998	r1->tseqbase = oid_nil;
999	}
1000	}
1001
1002	if (r2 &&
1003	BATcount(r2) > `0` &&
1004	BATtdense(r2) &&
1005	((oid *) r2->theap.base)[r2->batCount - `1`] + `1` != r->hseqbase + rstart - nr) {
1006	r2->tseqbase = oid_nil;
1007	}
1008
1009	/ insert values /
1010	lv = l->hseqbase + lstart - nl;
1011	for (i = `0`; i < nl; i++) {
1012	BUN j;
1013
1014	for (j = `0`; j < nr; j++) {
1015	APPEND(r1, lv);
1016	}
1017	if (r2) {
1018	oid rv = r->hseqbase + rstart - nr;
1019
1020	for (j = `0`; j < nr; j++) {
1021	APPEND(r2, rv);
1022	rv++;
1023	}
1024	}
1025	lv++;
1026	}
1027	}
1028	/ also set other bits of heap to correct value to indicate size /
1029	BATsetcount(r1, BATcount(r1));
1030	if (r2) {
1031	BATsetcount(r2, BATcount(r2));
1032	assert(BATcount(r1) == BATcount(r2));
1033	}
1034	if (BATcount(r1) > `0`) {
1035	if (BATtdense(r1))
1036	r1->tseqbase = ((oid *) r1->theap.base)[`0`];
1037	if (r2 && BATtdense(r2))
1038	r2->tseqbase = ((oid *) r2->theap.base)[`0`];
1039	} else {
1040	r1->tseqbase = `0`;
1041	if (r2) {
1042	r2->tseqbase = `0`;
1043	}
1044	}
1045	ALGODEBUG fprintf(stderr, "#%s: %s(l=" ALGOBATFMT ","
1046	"r=" ALGOBATFMT ","
1047	"nil_matches=%d)%s %s "
1048	"-> (" ALGOBATFMT "," ALGOOPTBATFMT ") " LLFMT "us\n",
1049	MT_thread_getname(), __func__,
1050	ALGOBATPAR(l), ALGOBATPAR(r),
1051	nil_matches,
1052	swapped ? " swapped" : "", reason,
1053	ALGOBATPAR(r1), ALGOOPTBATPAR(r2),
1054	GDKusec() - t0);
1055
1056	return GDK_SUCCEED;
1057
1058	bailout:
1059	BBPreclaim(r1);
1060	BBPreclaim(r2);
1061	return GDK_FAIL;
1062	}
1063
1064	/ Implementation of mergejoin (see below) for the special case that*
1065	* the values are of type lng, and some more conditions are met. */
1066	static gdk_return
1067	mergejoin_lng(BAT r1p, BAT r2p, BAT l, BAT r,
1068	bool nil_matches, BUN estimate, lng t0, bool swapped,
1069	const char *reason)
1070	{
1071	BAT r1, r2;
1072	BUN lstart, lend, lcnt;
1073	BUN rstart, rend;
1074	BUN lscan, rscan; / opportunistic scan window /
1075	BUN maxsize;
1076	const lng lvals, rvals;
1077	lng v;
1078	BUN nl, nr;
1079	oid lv;
1080	BUN i;
1081
1082	assert(ATOMtype(l->ttype) == ATOMtype(r->ttype));
1083	assert(r->tsorted \|\| r->trevsorted);
1084
1085	lstart = rstart = `0`;
1086	lend = BATcount(l);
1087	lcnt = lend - lstart;
1088	rend = BATcount(r);
1089	lvals = (const lng *) Tloc(l, `0`);
1090	rvals = (const lng *) Tloc(r, `0`);
1091	assert(!r->tvarsized \|\| !r->ttype);
1092
1093	/ basic properties will be adjusted if necessary later on,*
1094	* they were initially set by joininitresults() */
1095
1096	if (lend == `0` \|\| rend == `0`) {
1097	/ there are no matches /
1098	return nomatch(r1p, r2p, l, r,
1099	&(struct canditer) {.tpe = cand_dense, .ncand = lcnt,},
1100	false, false, __func__, t0);
1101	}
1102
1103	if ((maxsize = joininitresults(r1p, r2p, BATcount(l), BATcount(r),
1104	l->tkey, r->tkey, false, false,
1105	false, estimate)) == BUN_NONE)
1106	return GDK_FAIL;
1107	r1 = *r1p;
1108	r2 = r2p ? *r2p : NULL;
1109
1110	/ determine opportunistic scan window for l and r /
1111	for (nl = lend - lstart, lscan = `4`; nl > `0`; lscan++)
1112	nl >>= `1`;
1113	for (nr = rend - rstart, rscan = `4`; nr > `0`; rscan++)
1114	nr >>= `1`;
1115
1116	if (!nil_matches) {
1117	/ skip over nils at the start of the columns /
1118	if (lscan < lend - lstart && is_lng_nil(lvals[lstart + lscan])) {
1119	lstart = binsearch_lng(NULL, `0`, lvals, lstart + lscan,
1120	lend - `1`, lng_nil, `1`, `1`);
1121	} else {
1122	while (is_lng_nil(lvals[lstart]))
1123	lstart++;
1124	}
1125	if (rscan < rend - rstart && is_lng_nil(rvals[rstart + rscan])) {
1126	rstart = binsearch_lng(NULL, `0`, rvals, rstart + rscan,
1127	rend - `1`, lng_nil, `1`, `1`);
1128	} else {
1129	while (is_lng_nil(rvals[rstart]))
1130	rstart++;
1131	}
1132	}
1133	/ from here on we don't have to worry about nil values /
1134
1135	while (lstart < lend && rstart < rend) {
1136	v = rvals[rstart];
1137
1138	if (lscan < lend - lstart && lvals[lstart + lscan] < v) {
1139	lstart = binsearch_lng(NULL, `0`, lvals, lstart + lscan,
1140	lend - `1`, v, `1`, `0`);
1141	} else {
1142	/ scan l for v /
1143	while (lstart < lend && lvals[lstart] < v)
1144	lstart++;
1145	}
1146	if (lstart >= lend) {
1147	/ nothing found /
1148	break;
1149	}
1150
1151	/ Here we determine the next value in l that we are*
1152	* going to try to match in r. We will also count the
1153	* number of occurrences in l of that value.
1154	* Afterwards, v points to the value and nl is the
1155	* number of times it occurs. Also, lstart will
1156	* point to the next value to be considered (ready for
1157	* the next iteration).
1158	* If there are many equal values in l (more than
1159	* lscan), we will use binary search to find the end
1160	* of the sequence. Obviously, we can do this only if
1161	* l is actually sorted (lscan > 0). */
1162	nl = `1`; / we'll match (at least) one in l /
1163	nr = `0`; / maybe we won't match anything in r /
1164	v = lvals[lstart];
1165	if (l->tkey) {
1166	/ if l is key, there is a single value /
1167	lstart++;
1168	} else if (lscan < lend - lstart &&
1169	v == lvals[lstart + lscan]) {
1170	/ lots of equal values: use binary search to*
1171	* find end */
1172	nl = binsearch_lng(NULL, `0`, lvals, lstart + lscan,
1173	lend - `1`, v, `1`, `1`);
1174	nl -= lstart;
1175	lstart += nl;
1176	} else {
1177	/ just scan /
1178	while (++lstart < lend && v == lvals[lstart])
1179	nl++;
1180	}
1181	/ lstart points one beyond the value we're*
1182	* going to match: ready for the next iteration. */
1183
1184	/ First we find the first value in r that is at*
1185	* least as large as v, then we find the first
1186	* value in r that is larger than v. The difference
1187	* is the number of values equal to v and is stored in
1188	* nr.
1189	* We will use binary search on r to find both ends of
1190	* the sequence of values that are equal to v in case
1191	* the position is "too far" (more than rscan
1192	* away). */
1193
1194	/ first find the location of the first value in r*
1195	* that is >= v, then find the location of the first
1196	* value in r that is > v; the difference is the
1197	* number of values equal to v */
1198
1199	/ look ahead a little (rscan) in r to see whether*
1200	* we're better off doing a binary search */
1201	if (rscan < rend - rstart && rvals[rstart + rscan] < v) {
1202	/ value too far away in r: use binary*
1203	* search */
1204	rstart = binsearch_lng(NULL, `0`, rvals, rstart + rscan,
1205	rend - `1`, v, `1`, `0`);
1206	} else {
1207	/ scan r for v /
1208	while (rstart < rend && rvals[rstart] < v)
1209	rstart++;
1210	}
1211	if (rstart == rend) {
1212	/ nothing found /
1213	break;
1214	}
1215
1216	/ now find the end of the sequence of equal values v /
1217
1218	/ if r is key, there is zero or one match, otherwise*
1219	* look ahead a little (rscan) in r to see whether
1220	* we're better off doing a binary search */
1221	if (r->tkey) {
1222	if (rstart < rend && v == rvals[rstart]) {
1223	nr = `1`;
1224	rstart++;
1225	}
1226	} else if (rscan < rend - rstart &&
1227	v == rvals[rstart + rscan]) {
1228	/ range too large: use binary search /
1229	nr = binsearch_lng(NULL, `0`, rvals, rstart + rscan,
1230	rend - `1`, v, `1`, `1`);
1231	nr -= rstart;
1232	rstart += nr;
1233	} else {
1234	/ scan r for end of range /
1235	while (rstart < rend && v == rvals[rstart]) {
1236	nr++;
1237	rstart++;
1238	}
1239	}
1240	/ rstart points to first value > v or end of*
1241	* r, and nr is the number of values in r that
1242	* are equal to v */
1243	if (nr == `0`) {
1244	/ no entries in r found /
1245	continue;
1246	}
1247	/ make space: nl values in l match nr values in r, so*
1248	* we need to add nl * nr values in the results */
1249	MAYBEEXTEND_NO_CAND(nl * nr);
1250
1251	/ maintain properties /
1252	if (nl > `1`) {
1253	/ value occurs multiple times in l, so entry*
1254	* in r will be repeated multiple times: hence
1255	* r2 is not key and not dense */
1256	if (r2) {
1257	r2->tkey = false;
1258	r2->tseqbase = oid_nil;
1259	}
1260	/ multiple different values will be inserted*
1261	* in r1 (always in order), so not reverse
1262	* ordered anymore */
1263	r1->trevsorted = false;
1264	}
1265	if (nr > `1`) {
1266	/ value occurs multiple times in r, so entry*
1267	* in l will be repeated multiple times: hence
1268	* r1 is not key and not dense */
1269	r1->tkey = false;
1270	r1->tseqbase = oid_nil;
1271	/ multiple different values will be inserted*
1272	* in r2 (in order), so not reverse ordered
1273	* anymore */
1274	if (r2) {
1275	r2->trevsorted = false;
1276	if (nl > `1`) {
1277	/ multiple values in l match*
1278	* multiple values in r, so an
1279	* ordered sequence will be
1280	* inserted multiple times in
1281	* r2, so r2 is not ordered
1282	* anymore */
1283	r2->tsorted = false;
1284	}
1285	}
1286	}
1287	if (BATcount(r1) > `0`) {
1288	/ a new, higher value will be inserted into*
1289	* r1, so r1 is not reverse ordered anymore */
1290	r1->trevsorted = false;
1291	/ a new higher value will be added to r2 /
1292	if (r2) {
1293	r2->trevsorted = false;
1294	}
1295	if (BATtdense(r1) &&
1296	((oid *) r1->theap.base)[r1->batCount - `1`] + `1` != l->hseqbase + lstart - nl) {
1297	r1->tseqbase = oid_nil;
1298	}
1299	}
1300
1301	if (r2 &&
1302	BATcount(r2) > `0` &&
1303	BATtdense(r2) &&
1304	((oid *) r2->theap.base)[r2->batCount - `1`] + `1` != r->hseqbase + rstart - nr) {
1305	r2->tseqbase = oid_nil;
1306	}
1307
1308	/ insert values /
1309	lv = l->hseqbase + lstart - nl;
1310	for (i = `0`; i < nl; i++) {
1311	BUN j;
1312
1313	for (j = `0`; j < nr; j++) {
1314	APPEND(r1, lv);
1315	}
1316	if (r2) {
1317	oid rv = r->hseqbase + rstart - nr;
1318
1319	for (j = `0`; j < nr; j++) {
1320	APPEND(r2, rv);
1321	rv++;
1322	}
1323	}
1324	lv++;
1325	}
1326	}
1327	/ also set other bits of heap to correct value to indicate size /
1328	BATsetcount(r1, BATcount(r1));
1329	if (r2) {
1330	BATsetcount(r2, BATcount(r2));
1331	assert(BATcount(r1) == BATcount(r2));
1332	}
1333	if (BATcount(r1) > `0`) {
1334	if (BATtdense(r1))
1335	r1->tseqbase = ((oid *) r1->theap.base)[`0`];
1336	if (r2 && BATtdense(r2))
1337	r2->tseqbase = ((oid *) r2->theap.base)[`0`];
1338	} else {
1339	r1->tseqbase = `0`;
1340	if (r2) {
1341	r2->tseqbase = `0`;
1342	}
1343	}
1344	ALGODEBUG fprintf(stderr, "#%s: %s(l=" ALGOBATFMT ","
1345	"r=" ALGOBATFMT ","
1346	"nil_matches=%d)%s %s "
1347	"-> (" ALGOBATFMT "," ALGOOPTBATFMT ") " LLFMT "us\n",
1348	MT_thread_getname(), __func__,
1349	ALGOBATPAR(l), ALGOBATPAR(r),
1350	nil_matches,
1351	swapped ? " swapped" : "", reason,
1352	ALGOBATPAR(r1), ALGOOPTBATPAR(r2),
1353	GDKusec() - t0);
1354
1355	return GDK_SUCCEED;
1356
1357	bailout:
1358	BBPreclaim(r1);
1359	BBPreclaim(r2);
1360	return GDK_FAIL;
1361	}
1362
1363	/ Implementation of mergejoin (see below) for the special case that*
1364	* the values are of type oid, and the right-hand side is a candidate
1365	* list with exception, and some more conditions are met. */
1366	static gdk_return
1367	mergejoin_cand(BAT r1p, BAT r2p, BAT l, BAT r,
1368	bool nil_matches, BUN estimate, lng t0, bool swapped,
1369	const char *reason)
1370	{
1371	BAT r1, r2;
1372	BUN lstart, lend, lcnt;
1373	struct canditer lci, rci;
1374	BUN lscan; / opportunistic scan window /
1375	BUN maxsize;
1376	const oid *lvals;
1377	oid v;
1378	BUN nl, nr;
1379	oid lv;
1380	BUN i;
1381
1382	assert(ATOMtype(l->ttype) == ATOMtype(r->ttype));
1383
1384	lstart = `0`;
1385	lend = BATcount(l);
1386	lcnt = lend - lstart;
1387	if (l->ttype == TYPE_void) {
1388	assert(!is_oid_nil(l->tseqbase));
1389	lcnt = canditer_init(&lci, NULL, l);
1390	lvals = NULL;
1391	} else {
1392	lci = (struct canditer) {.tpe = cand_dense}; / not used /
1393	lvals = (const oid *) Tloc(l, `0`);
1394	assert(lvals != NULL);
1395	}
1396
1397	assert(r->ttype == TYPE_void && r->tvheap != NULL);
1398	canditer_init(&rci, NULL, r);
1399
1400	/ basic properties will be adjusted if necessary later on,*
1401	* they were initially set by joininitresults() */
1402
1403	if (lend == `0` \|\| rci.ncand == `0`) {
1404	/ there are no matches /
1405	return nomatch(r1p, r2p, l, r,
1406	&(struct canditer) {.tpe = cand_dense, .ncand = lcnt,},
1407	false, false, __func__, t0);
1408	}
1409
1410	if ((maxsize = joininitresults(r1p, r2p, BATcount(l), BATcount(r),
1411	l->tkey, r->tkey, false, false,
1412	false, estimate)) == BUN_NONE)
1413	return GDK_FAIL;
1414	r1 = *r1p;
1415	r2 = r2p ? *r2p : NULL;
1416
1417	/ determine opportunistic scan window for l and r /
1418	for (nl = lend - lstart, lscan = `4`; nl > `0`; lscan++)
1419	nl >>= `1`;
1420
1421	if (!nil_matches) {
1422	/ skip over nils at the start of the columns /
1423	if (lscan < lend - lstart && lvals && is_oid_nil(lvals[lstart + lscan])) {
1424	lstart = binsearch_oid(NULL, `0`, lvals, lstart + lscan,
1425	lend - `1`, oid_nil, `1`, `1`);
1426	} else if (lvals) {
1427	while (is_oid_nil(lvals[lstart]))
1428	lstart++;
1429	} / else l is candidate list: no nils /
1430	}
1431	/ from here on we don't have to worry about nil values /
1432
1433	while (lstart < lend && rci.next < rci.ncand) {
1434	v = canditer_peek(&rci);
1435
1436	if (lvals) {
1437	if (lscan < lend - lstart &&
1438	lvals[lstart + lscan] < v) {
1439	lstart = binsearch_oid(NULL, `0`, lvals,
1440	lstart + lscan,
1441	lend - `1`, v, `1`, `0`);
1442	} else {
1443	/ scan l for v /
1444	while (lstart < lend && lvals[lstart] < v)
1445	lstart++;
1446	}
1447	} else {
1448	lstart = canditer_search(&lci, v, true);
1449	canditer_setidx(&lci, lstart);
1450	}
1451	if (lstart >= lend) {
1452	/ nothing found /
1453	break;
1454	}
1455
1456	/ Here we determine the next value in l that we are*
1457	* going to try to match in r. We will also count the
1458	* number of occurrences in l of that value.
1459	* Afterwards, v points to the value and nl is the
1460	* number of times it occurs. Also, lstart will
1461	* point to the next value to be considered (ready for
1462	* the next iteration).
1463	* If there are many equal values in l (more than
1464	* lscan), we will use binary search to find the end
1465	* of the sequence. Obviously, we can do this only if
1466	* l is actually sorted (lscan > 0). */
1467	nl = `1`; / we'll match (at least) one in l /
1468	nr = `0`; / maybe we won't match anything in r /
1469	v = lvals ? lvals[lstart] : canditer_next(&lci);
1470	if (l->tkey \|\| lvals == NULL) {
1471	/ if l is key, there is a single value /
1472	lstart++;
1473	} else if (lscan < lend - lstart &&
1474	v == lvals[lstart + lscan]) {
1475	/ lots of equal values: use binary search to*
1476	* find end */
1477	nl = binsearch_oid(NULL, `0`, lvals, lstart + lscan,
1478	lend - `1`, v, `1`, `1`);
1479	nl -= lstart;
1480	lstart += nl;
1481	} else {
1482	/ just scan /
1483	while (++lstart < lend && v == lvals[lstart])
1484	nl++;
1485	}
1486	/ lstart points one beyond the value we're*
1487	* going to match: ready for the next iteration. */
1488
1489	/ First we find the first value in r that is at*
1490	* least as large as v, then we find the first
1491	* value in r that is larger than v. The difference
1492	* is the number of values equal to v and is stored in
1493	* nr.
1494	* We will use binary search on r to find both ends of
1495	* the sequence of values that are equal to v in case
1496	* the position is "too far" (more than rscan
1497	* away). */
1498
1499	/ first find the location of the first value in r*
1500	* that is >= v, then find the location of the first
1501	* value in r that is > v; the difference is the
1502	* number of values equal to v */
1503	nr = canditer_search(&rci, v, true);
1504	canditer_setidx(&rci, nr);
1505	if (nr == rci.ncand) {
1506	/ nothing found /
1507	break;
1508	}
1509
1510	/ now find the end of the sequence of equal values v /
1511
1512	/ if r is key, there is zero or one match, otherwise*
1513	* look ahead a little (rscan) in r to see whether
1514	* we're better off doing a binary search */
1515	if (canditer_peek(&rci) == v) {
1516	nr = `1`;
1517	canditer_next(&rci);
1518	} else {
1519	/ rci points to first value > v or end of*
1520	* r, and nr is the number of values in r that
1521	* are equal to v */
1522	/ no entries in r found /
1523	continue;
1524	}
1525	/ make space: nl values in l match nr values in r, so*
1526	* we need to add nl * nr values in the results */
1527	MAYBEEXTEND_NO_CAND(nl * nr);
1528
1529	/ maintain properties /
1530	if (nl > `1`) {
1531	/ value occurs multiple times in l, so entry*
1532	* in r will be repeated multiple times: hence
1533	* r2 is not key and not dense */
1534	if (r2) {
1535	r2->tkey = false;
1536	r2->tseqbase = oid_nil;
1537	}
1538	/ multiple different values will be inserted*
1539	* in r1 (always in order), so not reverse
1540	* ordered anymore */
1541	r1->trevsorted = false;
1542	}
1543	if (nr > `1`) {
1544	/ value occurs multiple times in r, so entry*
1545	* in l will be repeated multiple times: hence
1546	* r1 is not key and not dense */
1547	r1->tkey = false;
1548	r1->tseqbase = oid_nil;
1549	/ multiple different values will be inserted*
1550	* in r2 (in order), so not reverse ordered
1551	* anymore */
1552	if (r2) {
1553	r2->trevsorted = false;
1554	if (nl > `1`) {
1555	/ multiple values in l match*
1556	* multiple values in r, so an
1557	* ordered sequence will be
1558	* inserted multiple times in
1559	* r2, so r2 is not ordered
1560	* anymore */
1561	r2->tsorted = false;
1562	}
1563	}
1564	}
1565	if (BATcount(r1) > `0`) {
1566	/ a new, higher value will be inserted into*
1567	* r1, so r1 is not reverse ordered anymore */
1568	r1->trevsorted = false;
1569	/ a new higher value will be added to r2 /
1570	if (r2) {
1571	r2->trevsorted = false;
1572	}
1573	if (BATtdense(r1) &&
1574	((oid *) r1->theap.base)[r1->batCount - `1`] + `1` != l->hseqbase + lstart - nl) {
1575	r1->tseqbase = oid_nil;
1576	}
1577	}
1578
1579	if (r2 &&
1580	BATcount(r2) > `0` &&
1581	BATtdense(r2) &&
1582	((oid *) r2->theap.base)[r2->batCount - `1`] + `1` != r->hseqbase + rci.next - nr) {
1583	r2->tseqbase = oid_nil;
1584	}
1585
1586	/ insert values /
1587	lv = l->hseqbase + lstart - nl;
1588	for (i = `0`; i < nl; i++) {
1589	BUN j;
1590
1591	for (j = `0`; j < nr; j++) {
1592	APPEND(r1, lv);
1593	}
1594	if (r2) {
1595	oid rv = r->hseqbase + rci.next - nr;
1596
1597	for (j = `0`; j < nr; j++) {
1598	APPEND(r2, rv);
1599	rv++;
1600	}
1601	}
1602	lv++;
1603	}
1604	}
1605	/ also set other bits of heap to correct value to indicate size /
1606	BATsetcount(r1, BATcount(r1));
1607	if (r2) {
1608	BATsetcount(r2, BATcount(r2));
1609	assert(BATcount(r1) == BATcount(r2));
1610	}
1611	if (BATcount(r1) > `0`) {
1612	if (BATtdense(r1))
1613	r1->tseqbase = ((oid *) r1->theap.base)[`0`];
1614	if (r2 && BATtdense(r2))
1615	r2->tseqbase = ((oid *) r2->theap.base)[`0`];
1616	} else {
1617	r1->tseqbase = `0`;
1618	if (r2) {
1619	r2->tseqbase = `0`;
1620	}
1621	}
1622	ALGODEBUG fprintf(stderr, "#%s: %s(l=" ALGOBATFMT ","
1623	"r=" ALGOBATFMT ","
1624	"nil_matches=%d)%s %s "
1625	"-> (" ALGOBATFMT "," ALGOOPTBATFMT ") " LLFMT "us\n",
1626	MT_thread_getname(), __func__,
1627	ALGOBATPAR(l), ALGOBATPAR(r),
1628	nil_matches,
1629	swapped ? " swapped" : "", reason,
1630	ALGOBATPAR(r1), ALGOOPTBATPAR(r2),
1631	GDKusec() - t0);
1632
1633	return GDK_SUCCEED;
1634
1635	bailout:
1636	BBPreclaim(r1);
1637	BBPreclaim(r2);
1638	return GDK_FAIL;
1639	}
1640
1641	/ Perform a "merge" join on l and r (if both are sorted) with*
1642	* optional candidate lists, or join using binary search on r if l is
1643	* not sorted. The return BATs have already been created by the
1644	* caller.
1645	*
1646	* If nil_matches is set, nil values are treated as ordinary values
1647	* that can match; otherwise nil values never match.
1648	*
1649	* If nil_on_miss is set, a nil value is returned in r2 if there is no
1650	* match in r for a particular value in l (left outer join).
1651	*
1652	* If semi is set, only a single set of values in r1/r2 is returned if
1653	* there is a match of l in r, no matter how many matches there are in
1654	* r; otherwise all matches are returned.
1655	*
1656	* t0 and swapped are only for debugging (ALGOMASK set in GDKdebug).
1657	*/
1658	static gdk_return
1659	mergejoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr,
1660	struct canditer *restrict lci, struct canditer *restrict rci,
1661	bool nil_matches, bool nil_on_miss, bool semi, bool only_misses,
1662	bool not_in, BUN estimate, lng t0, bool swapped, const char *reason)
1663	{
1664	/ [lr]scan determine how far we look ahead in l/r in order to*
1665	* decide whether we want to do a binary search or a scan */
1666	BUN lscan, rscan;
1667	const void lvals, rvals; / the values of l/r (NULL if dense) /
1668	const char lvars, rvars; / the indirect values (NULL if fixed size) /
1669	int lwidth, rwidth; / width of the values /
1670	const void *nil = ATOMnilptr(l->ttype);
1671	int (cmp)(const* void , const* void *) = ATOMcompare(l->ttype);
1672	const void v; /* points to value under consideration /
1673	const void *prev = NULL;
1674	BUN nl, nr;
1675	bool insert_nil;
1676	/ equal_order is set if we can scan both BATs in the same*
1677	* order, so when both are sorted or both are reverse sorted
1678	* -- important to know in order to skip over values; if l is
1679	* not sorted, this must be set to true and we will always do a
1680	* binary search on all of r */
1681	bool equal_order;
1682	/ [lr]ordering is either 1 or -1 depending on the order of*
1683	* l/r: it determines the comparison function used */
1684	int lordering, rordering;
1685	oid lv;
1686	BUN i, j; / counters /
1687	bool lskipped = false; / whether we skipped values in l /
1688	oid lval = oid_nil, rval = oid_nil; / temporary space to point v to /
1689	struct canditer llci, rrci;
1690
1691	if (sl == NULL && sr == NULL && !nil_on_miss &&
1692	!semi && !only_misses && !not_in &&
1693	l->tsorted && r->tsorted) {
1694	/ special cases with far fewer options /
1695	if (r->ttype == TYPE_void && r->tvheap)
1696	return mergejoin_cand(r1p, r2p, l, r, nil_matches,
1697	estimate, t0, swapped, __func__);
1698	switch (ATOMbasetype(l->ttype)) {
1699	case TYPE_int:
1700	return mergejoin_int(r1p, r2p, l, r, nil_matches,
1701	estimate, t0, swapped, __func__);
1702	case TYPE_lng:
1703	return mergejoin_lng(r1p, r2p, l, r, nil_matches,
1704	estimate, t0, swapped, __func__);
1705	}
1706	}
1707
1708	assert(ATOMtype(l->ttype) == ATOMtype(r->ttype));
1709	assert(r->tsorted \|\| r->trevsorted);
1710	assert(sl == NULL \|\| sl->tsorted);
1711	assert(sr == NULL \|\| sr->tsorted);
1712
1713	if (BATtvoid(l)) {
1714	/ l->ttype == TYPE_void && is_oid_nil(l->tseqbase) is*
1715	* handled by selectjoin */
1716	assert(!is_oid_nil(l->tseqbase));
1717	canditer_init(&llci, NULL, l);
1718	lvals = NULL;
1719	} else {
1720	lvals = Tloc(l, `0`);
1721	llci = (struct canditer) {.tpe = cand_dense}; / not used /
1722	}
1723	rrci = (struct canditer) {.tpe = cand_dense};
1724	if (BATtvoid(r)) {
1725	if (!is_oid_nil(r->tseqbase))
1726	canditer_init(&rrci, NULL, r);
1727	rvals = NULL;
1728	} else {
1729	rvals = Tloc(r, `0`);
1730	}
1731	if (l->tvarsized && l->ttype) {
1732	assert(r->tvarsized && r->ttype);
1733	lvars = l->tvheap->base;
1734	rvars = r->tvheap->base;
1735	} else {
1736	assert(!r->tvarsized \|\| !r->ttype);
1737	lvars = rvars = NULL;
1738	}
1739	lwidth = l->twidth;
1740	rwidth = r->twidth;
1741
1742	/ basic properties will be adjusted if necessary later on,*
1743	* they were initially set by joininitresults() */
1744
1745	if (not_in && rci->ncand > `0` && !r->tnonil &&
1746	((BATtvoid(l) && l->tseqbase == oid_nil) \|\|
1747	(BATtvoid(r) && r->tseqbase == oid_nil) \|\|
1748	(rvals && cmp(nil, VALUE(r, (r->tsorted ? rci->seq : canditer_last(rci)) - r->hseqbase)) == `0`)))
1749	return nomatch(r1p, r2p, l, r, lci, false, false,
1750	"mergejoin", t0);
1751
1752	if (lci->ncand == `0` \|\|
1753	rci->ncand == `0` \|\|
1754	(!nil_matches &&
1755	((l->ttype == TYPE_void && is_oid_nil(l->tseqbase)) \|\|
1756	(r->ttype == TYPE_void && is_oid_nil(r->tseqbase)))) \|\|
1757	(l->ttype == TYPE_void && is_oid_nil(l->tseqbase) &&
1758	(r->tnonil \|\|
1759	(r->ttype == TYPE_void && !is_oid_nil(r->tseqbase)))) \|\|
1760	(r->ttype == TYPE_void && is_oid_nil(r->tseqbase) &&
1761	(l->tnonil \|\|
1762	(l->ttype == TYPE_void && !is_oid_nil(l->tseqbase))))) {
1763	/ there are no matches /
1764	return nomatch(r1p, r2p, l, r, lci, nil_on_miss, only_misses,
1765	"mergejoin", t0);
1766	}
1767
1768	BUN maxsize = joininitresults(r1p, r2p, lci->ncand, rci->ncand,
1769	l->tkey, r->tkey, semi, nil_on_miss,
1770	only_misses, estimate);
1771	if (maxsize == BUN_NONE)
1772	return GDK_FAIL;
1773	BAT r1 = r1p;
1774	BAT r2 = r2p ? r2p : NULL;
1775
1776	if (l->tsorted \|\| l->trevsorted) {
1777	/ determine opportunistic scan window for l /
1778	for (nl = lci->ncand, lscan = `4`; nl > `0`; lscan++)
1779	nl >>= `1`;
1780	equal_order = (l->tsorted && r->tsorted) \|\|
1781	(l->trevsorted && r->trevsorted &&
1782	!BATtvoid(l) && !BATtvoid(r));
1783	lordering = l->tsorted && (r->tsorted \|\| !equal_order) ? `1` : -`1`;
1784	rordering = equal_order ? lordering : -lordering;
1785	} else {
1786	/ if l not sorted, we will always use binary search*
1787	* on r */
1788	assert(!BATtvoid(l)); / void is always sorted /
1789	lscan = `0`;
1790	equal_order = true;
1791	lordering = `1`;
1792	rordering = r->tsorted ? `1` : -`1`;
1793	}
1794	/ determine opportunistic scan window for r; if l is not*
1795	* sorted this is only used to find range of equal values */
1796	for (nl = rci->ncand, rscan = `4`; nl > `0`; rscan++)
1797	nl >>= `1`;
1798
1799	if (!equal_order) {
1800	/ we go through r backwards /
1801	canditer_setidx(rci, rci->ncand);
1802	}
1803	/ At this point the various variables that help us through*
1804	* the algorithm have been set. The table explains them. The
1805	* first two columns are the inputs, the next three columns
1806	* are the variables, the final two columns indicate how the
1807	* variables can be used.
1808	*
1809	* l/r sl/sr \| vals cand off \| result value being matched
1810	* -------------+-----------------+----------------------------------
1811	* dense NULL \| NULL NULL set \| i off==nil?nil:i+off
1812	* dense dense \| NULL NULL set \| i off==nil?nil:i+off
1813	* dense set \| NULL set set \| cand[i] off==nil?nil:cand[i]+off
1814	* set NULL \| set NULL 0 \| i vals[i]
1815	* set dense \| set NULL 0 \| i vals[i]
1816	* set set \| set set 0 \| cand[i] vals[cand[i]]
1817	*
1818	* If {l,r}off is lng_nil, all values in the corresponding bat
1819	* are oid_nil because the bat has type VOID and the tseqbase
1820	* is nil.
1821	*/
1822
1823	/ Before we start adding values to r1 and r2, the properties*
1824	* are as follows:
1825	* tseqbase - 0
1826	* tkey - true
1827	* tsorted - true
1828	* trevsorted - true
1829	* tnil - false
1830	* tnonil - true
1831	* We will modify these as we go along.
1832	*/
1833	while (lci->next < lci->ncand) {
1834	if (lscan == `0`) {
1835	/ always search r completely /
1836	assert(equal_order);
1837	canditer_reset(rci);
1838	} else {
1839	/ If l is sorted (lscan > 0), we look at the*
1840	* next value in r to see whether we can jump
1841	* over a large section of l using binary
1842	* search. We do this by looking ahead in l
1843	* (lscan far, to be precise) and seeing if
1844	* the value there is still too "small"
1845	* (definition depends on sort order of l).
1846	* If it is, we use binary search on l,
1847	* otherwise we scan l for the next position
1848	* with a value greater than or equal to the
1849	* value in r.
1850	* The next value to match in r is the first
1851	* if equal_order is set, the last
1852	* otherwise.
1853	* When skipping over values in l, we count
1854	* how many we skip in nlx. We need this in
1855	* case only_misses or nil_on_miss is set, and
1856	* to properly set the dense property in the
1857	* first output BAT. */
1858	BUN nlx = `0`; / number of non-matching values in l /
1859
1860	if (equal_order) {
1861	if (rci->next == rci->ncand)
1862	v = NULL; / no more values /
1863	else
1864	v = VALUE(r, canditer_peek(rci) - r->hseqbase);
1865	} else {
1866	if (rci->next == `0`)
1867	v = NULL; / no more values /
1868	else
1869	v = VALUE(r, canditer_peekprev(rci) - r->hseqbase);
1870	}
1871	/ here, v points to next value in r, or if*
1872	* we're at the end of r, v is NULL */
1873	if (v == NULL) {
1874	nlx = lci->ncand - lci->next;
1875	} else {
1876	if (lscan < lci->ncand - lci->next) {
1877	lv = canditer_idx(lci, lci->next + lscan);
1878	lv -= l->hseqbase;
1879	if (lvals) {
1880	if (lordering * cmp(VALUE(l, lv), v) < `0`) {
1881	nlx = binsearch(NULL, `0`, l->ttype, lvals, lvars, lwidth, lv, BATcount(l), v, lordering, `0`);
1882	nlx = canditer_search(lci, nlx + l->hseqbase, true);
1883	nlx -= lci->next;
1884	}
1885	} else {
1886	assert(lordering == `1`);
1887	if (canditer_idx(&llci, lv) < (const* oid *)v) {
1888	nlx = canditer_search(&llci, (const* oid *)v, true);
1889	nlx = canditer_search(lci, nlx + l->hseqbase, true);
1890	nlx -= lci->next;
1891	}
1892	}
1893	if (lci->next + nlx == lci->ncand)
1894	v = NULL;
1895	}
1896	}
1897	if (nlx > `0`) {
1898	if (only_misses) {
1899	MAYBEEXTEND(nlx, lci);
1900	lskipped \|= nlx > `1` && lci->tpe != cand_dense;
1901	while (nlx > `0`) {
1902	APPEND(r1, canditer_next(lci));
1903	nlx--;
1904	}
1905	if (lskipped)
1906	r1->tseqbase = oid_nil;
1907	if (r1->trevsorted && BATcount(r1) > `1`)
1908	r1->trevsorted = false;
1909	} else if (nil_on_miss) {
1910	if (r2->tnonil) {
1911	r2->tnil = true;
1912	r2->tnonil = false;
1913	r2->tseqbase = oid_nil;
1914	r2->tsorted = false;
1915	r2->trevsorted = false;
1916	r2->tkey = false;
1917	}
1918	MAYBEEXTEND(nlx, lci);
1919	lskipped \|= nlx > `1` && lci->tpe != cand_dense;
1920	while (nlx > `0`) {
1921	APPEND(r1, canditer_next(lci));
1922	APPEND(r2, oid_nil);
1923	nlx--;
1924	}
1925	if (lskipped)
1926	r1->tseqbase = oid_nil;
1927	if (r1->trevsorted && BATcount(r1) > `1`)
1928	r1->trevsorted = false;
1929	} else {
1930	lskipped = BATcount(r1) > `0`;
1931	canditer_setidx(lci, lci->next + nlx);
1932	}
1933	}
1934	if (v == NULL) {
1935	/ we have exhausted the inputs /
1936	break;
1937	}
1938	}
1939
1940	/ Here we determine the next value in l that we are*
1941	* going to try to match in r. We will also count the
1942	* number of occurrences in l of that value.
1943	* Afterwards, v points to the value and nl is the
1944	* number of times it occurs. Also, lci will point to
1945	* the next value to be considered (ready for the next
1946	* iteration).
1947	* If there are many equal values in l (more than
1948	* lscan), we will use binary search to find the end
1949	* of the sequence. Obviously, we can do this only if
1950	* l is actually sorted (lscan > 0). */
1951	nl = `1`; / we'll match (at least) one in l /
1952	nr = `0`; / maybe we won't match anything in r /
1953	v = VALUE(l, canditer_peek(lci) - l->hseqbase);
1954	if (l->tkey) {
1955	/ if l is key, there is a single value /
1956	} else if (lscan > `0` &&
1957	lscan < lci->ncand - lci->next &&
1958	cmp(v, VALUE(l, canditer_idx(lci, lci->next + lscan) - l->hseqbase)) == `0`) {
1959	/ lots of equal values: use binary search to*
1960	* find end */
1961	assert(lvals != NULL);
1962	nl = binsearch(NULL, `0`,
1963	l->ttype, lvals, lvars,
1964	lwidth, lci->next + lscan,
1965	BATcount(l),
1966	v, lordering, `1`);
1967	nl = canditer_search(lci, nl + l->hseqbase, true);
1968	nl -= lci->next;
1969	} else {
1970	struct canditer ci = lci; /* work on copy /
1971	nl = `0`; / it will be incremented again /
1972	do {
1973	canditer_next(&ci);
1974	nl++;
1975	} while (ci.next < ci.ncand &&
1976	cmp(v, VALUE(l, canditer_peek(&ci) - l->hseqbase)) == `0`);
1977	}
1978	/ lci->next + nl is the position for the next iteration /
1979
1980	if ((!nil_matches \|\| not_in) && !l->tnonil && cmp(v, nil) == `0`) {
1981	if (not_in) {
1982	/ just skip the whole thing: nils*
1983	* don't cause any output */
1984	canditer_setidx(lci, lci->next + nl);
1985	continue;
1986	}
1987	/ v is nil and nils don't match anything, set*
1988	* to NULL to indicate nil */
1989	v = NULL;
1990	}
1991
1992	/ First we find the "first" value in r that is "at*
1993	* least as large" as v, then we find the "first"
1994	* value in r that is "larger" than v. The difference
1995	* is the number of values equal to v and is stored in
1996	* nr. The definitions of "larger" and "first" depend
1997	* on the orderings of l and r. If equal_order is
1998	* set, we go through r from low to high (this
1999	* includes the case that l is not sorted); otherwise
2000	* we go through r from high to low.
2001	* In either case, we will use binary search on r to
2002	* find both ends of the sequence of values that are
2003	* equal to v in case the position is "too far" (more
2004	* than rscan away). */
2005	if (v == NULL) {
2006	nr = `0`; / nils don't match anything /
2007	} else if (r->ttype == TYPE_void && is_oid_nil(r->tseqbase)) {
2008	if (is_oid_nil((const* oid *) v)) {
2009	/ all values in r match /
2010	nr = rci->ncand;
2011	} else {
2012	/ no value in r matches /
2013	nr = `0`;
2014	}
2015	/ in either case, we're done after this /
2016	canditer_setidx(rci, equal_order ? rci->ncand : `0`);
2017	} else if (equal_order) {
2018	/ first find the location of the first value*
2019	* in r that is >= v, then find the location
2020	* of the first value in r that is > v; the
2021	* difference is the number of values equal
2022	* v; we change rci */
2023
2024	/ look ahead a little (rscan) in r to*
2025	* see whether we're better off doing
2026	* a binary search */
2027	if (rvals) {
2028	if (rscan < rci->ncand - rci->next &&
2029	rordering * cmp(v, VALUE(r, canditer_idx(rci, rci->next + rscan) - r->hseqbase)) > `0`) {
2030	/ value too far away in r:*
2031	* use binary search */
2032	lv = binsearch(NULL, `0`, r->ttype, rvals, rvars, rwidth, rci->next + rscan, BATcount(r), v, rordering, `0`);
2033	lv = canditer_search(rci, lv + r->hseqbase, true);
2034	canditer_setidx(rci, lv);
2035	} else {
2036	/ scan r for v /
2037	while (rci->next < rci->ncand) {
2038	if (rordering * cmp(v, VALUE(r, canditer_peek(rci) - r->hseqbase)) <= `0`)
2039	break;
2040	canditer_next(rci);
2041	}
2042	}
2043	if (rci->next < rci->ncand &&
2044	cmp(v, VALUE(r, canditer_peek(rci) - r->hseqbase)) == `0`) {
2045	/ if we found an equal value,*
2046	* look for the last equal
2047	* value */
2048	if (r->tkey) {
2049	/ r is key, there can*
2050	* only be a single
2051	* equal value */
2052	nr = `1`;
2053	canditer_next(rci);
2054	} else if (rscan < rci->ncand - rci->next &&
2055	cmp(v, VALUE(r, canditer_idx(rci, rci->next + rscan) - r->hseqbase)) == `0`) {
2056	/ many equal values:*
2057	* use binary search
2058	* to find the end */
2059	nr = binsearch(NULL, `0`, r->ttype, rvals, rvars, rwidth, rci->next + rscan, BATcount(r), v, rordering, `1`);
2060	nr = canditer_search(rci, nr + r->hseqbase, true);
2061	nr -= rci->next;
2062	canditer_setidx(rci, rci->next + nr);
2063	} else {
2064	/ scan r for end of*
2065	* range */
2066	do {
2067	nr++;
2068	canditer_next(rci);
2069	} while (rci->next < rci->ncand &&
2070	cmp(v, VALUE(r, canditer_peek(rci) - r->hseqbase)) == `0`);
2071	}
2072	}
2073	} else {
2074	assert(rordering == `1`);
2075	rval = canditer_search(&rrci, (const* oid*)v, true) + r->hseqbase;
2076	lv = canditer_search(rci, rval, true);
2077	canditer_setidx(rci, lv);
2078	nr = (canditer_idx(&rrci, canditer_peek(rci) - r->hseqbase) == (oid)v);
2079	if (nr == `1`)
2080	canditer_next(rci);
2081	}
2082	/ rci points to first value > v or end of r,*
2083	* and nr is the number of values in r that
2084	* are equal to v */
2085	} else {
2086	/ first find the location of the first value*
2087	* in r that is > v, then find the location
2088	* of the first value in r that is >= v; the
2089	* difference is the number of values equal
2090	* v; we change rci */
2091
2092	/ look back from the end a little*
2093	* (rscan) in r to see whether we're
2094	* better off doing a binary search */
2095	if (rvals) {
2096	if (rci->next > rscan &&
2097	rordering * cmp(v, VALUE(r, canditer_idx(rci, rci->next - rscan) - r->hseqbase)) < `0`) {
2098	/ value too far away*
2099	* in r: use binary
2100	* search */
2101	lv = binsearch(NULL, `0`, r->ttype, rvals, rvars, rwidth, `0`, rci->next - rscan, v, rordering, `1`);
2102	lv = canditer_search(rci, lv + r->hseqbase, true);
2103	canditer_setidx(rci, lv);
2104	} else {
2105	/ scan r for v /
2106	while (rci->next > `0` &&
2107	rordering * cmp(v, VALUE(r, canditer_peekprev(rci) - r->hseqbase)) < `0`)
2108	canditer_prev(rci);
2109	}
2110	if (rci->next > `0` &&
2111	cmp(v, VALUE(r, canditer_peekprev(rci) - r->hseqbase)) == `0`) {
2112	/ if we found an equal value,*
2113	* look for the last equal
2114	* value */
2115	if (r->tkey) {
2116	/ r is key, there can only be a single equal value /
2117	nr = `1`;
2118	canditer_prev(rci);
2119	} else if (rci->next > rscan &&
2120	cmp(v, VALUE(r, canditer_idx(rci, rci->next - rscan) - r->hseqbase)) == `0`) {
2121	/ use binary search to find the start /
2122	nr = binsearch(NULL, `0`, r->ttype, rvals, rvars, rwidth, `0`, rci->next - rscan, v, rordering, `0`);
2123	nr = canditer_search(rci, nr + r->hseqbase, true);
2124	nr = rci->next - nr;
2125	canditer_setidx(rci, rci->next - nr);
2126	} else {
2127	/ scan r for start of range /
2128	do {
2129	canditer_prev(rci);
2130	nr++;
2131	} while (rci->next > `0` &&
2132	cmp(v, VALUE(r, canditer_peekprev(rci) - r->hseqbase)) == `0`);
2133	}
2134	}
2135	} else {
2136	lv = canditer_search(&rrci, (const* oid *)v, true);
2137	lv = canditer_search(rci, lv + r->hseqbase, true);
2138	nr = (canditer_idx(rci, lv) == (const* oid*)v);
2139	canditer_setidx(rci, lv);
2140	}
2141	/ rci points to first value > v*
2142	* or end of r, and nr is the number of values
2143	* in r that are equal to v */
2144	}
2145
2146	if (nr == `0`) {
2147	/ no entries in r found /
2148	if (!(nil_on_miss \| only_misses)) {
2149	if (lscan > `0` &&
2150	(equal_order ? rci->next == rci->ncand : rci->next == `0`)) {
2151	/ nothing more left to match*
2152	* in r */
2153	break;
2154	}
2155	lskipped = BATcount(r1) > `0`;
2156	canditer_setidx(lci, lci->next + nl);
2157	continue;
2158	}
2159	/ insert a nil to indicate a non-match /
2160	insert_nil = true;
2161	nr = `1`;
2162	if (r2) {
2163	r2->tnil = true;
2164	r2->tnonil = false;
2165	r2->tsorted = false;
2166	r2->trevsorted = false;
2167	r2->tseqbase = oid_nil;
2168	r2->tkey = false;
2169	}
2170	} else if (only_misses) {
2171	/ we had a match, so we're not interested /
2172	lskipped = BATcount(r1) > `0`;
2173	canditer_setidx(lci, lci->next + nl);
2174	continue;
2175	} else {
2176	insert_nil = false;
2177	if (semi) {
2178	/ for semi-join, only insert single*
2179	* value */
2180	nr = `1`;
2181	}
2182	}
2183	if (canditer_idx(lci, lci->next + nl - `1`) - canditer_idx(lci, lci->next) != nl - `1`) {
2184	/ not all values in the range are*
2185	* candidates */
2186	lskipped = true;
2187	}
2188	/ make space: nl values in l match nr values in r, so*
2189	* we need to add nl * nr values in the results */
2190	MAYBEEXTEND(nl * nr, lci);
2191
2192	/ maintain properties /
2193	if (nl > `1`) {
2194	if (r2) {
2195	/ value occurs multiple times in l,*
2196	* so entry in r will be repeated
2197	* multiple times: hence r2 is not key
2198	* and not dense */
2199	r2->tkey = false;
2200	r2->tseqbase = oid_nil;
2201	}
2202	/ multiple different values will be inserted*
2203	* in r1 (always in order), so not reverse
2204	* ordered anymore */
2205	r1->trevsorted = false;
2206	}
2207	if (nr > `1`) {
2208	/ value occurs multiple times in r, so entry*
2209	* in l will be repeated multiple times: hence
2210	* r1 is not key and not dense */
2211	r1->tkey = false;
2212	r1->tseqbase = oid_nil;
2213	if (r2) {
2214	/ multiple different values will be*
2215	* inserted in r2 (in order), so not
2216	* reverse ordered anymore */
2217	r2->trevsorted = false;
2218	if (nl > `1`) {
2219	/ multiple values in l match*
2220	* multiple values in r, so an
2221	* ordered sequence will be
2222	* inserted multiple times in
2223	* r2, so r2 is not ordered
2224	* anymore */
2225	r2->tsorted = false;
2226	}
2227	}
2228	}
2229	if (lscan == `0`) {
2230	/ deduce relative positions of r matches for*
2231	* this and previous value in v */
2232	if (prev && r2) {
2233	/ keyness or r2 can only be assured*
2234	* as long as matched values are
2235	* ordered */
2236	int ord = rordering * cmp(prev, v);
2237	if (ord < `0`) {
2238	/ previous value in l was*
2239	* less than current */
2240	r2->trevsorted = false;
2241	r2->tkey &= r2->tsorted;
2242	} else if (ord > `0`) {
2243	/ previous value was*
2244	* greater */
2245	r2->tsorted = false;
2246	r2->tkey &= r2->trevsorted;
2247	} else {
2248	/ value can be equal if*
2249	* intervening values in l
2250	* didn't match anything; if
2251	* multiple values match in r,
2252	* r2 won't be sorted */
2253	r2->tkey = false;
2254	if (nr > `1`) {
2255	r2->tsorted = false;
2256	r2->trevsorted = false;
2257	}
2258	}
2259	}
2260	prev = v;
2261	}
2262	if (BATcount(r1) > `0`) {
2263	/ a new, higher value will be inserted into*
2264	* r1, so r1 is not reverse ordered anymore */
2265	r1->trevsorted = false;
2266	if (r2) {
2267	/ depending on whether l and r are*
2268	* ordered the same or not, a new
2269	* higher or lower value will be added
2270	* to r2 */
2271	if (equal_order)
2272	r2->trevsorted = false;
2273	else {
2274	r2->tsorted = false;
2275	r2->tseqbase = oid_nil;
2276	}
2277	}
2278	/ if there is a left candidate list, it may*
2279	* be that the next value added isn't
2280	* consecutive with the last one */
2281	if (lskipped \|\|
2282	((oid *) r1->theap.base)[r1->batCount - `1`] + `1` != canditer_peek(lci))
2283	r1->tseqbase = oid_nil;
2284	}
2285
2286	/ insert values: first the left output /
2287	for (i = `0`; i < nl; i++) {
2288	lv = canditer_next(lci);
2289	for (j = `0`; j < nr; j++)
2290	APPEND(r1, lv);
2291	}
2292	/ then the right output, various different ways of*
2293	* doing it */
2294	if (r2 == NULL) {
2295	/ nothing to do /
2296	} else if (insert_nil) {
2297	do {
2298	for (i = `0`; i < nr; i++) {
2299	APPEND(r2, oid_nil);
2300	}
2301	} while (--nl > `0`);
2302	} else if (equal_order) {
2303	struct canditer ci = rci; /* work on copy /
2304	if (r2->batCount > `0` &&
2305	BATtdense(r2) &&
2306	((oid *) r2->theap.base)[r2->batCount - `1`] + `1` != canditer_idx(&ci, ci.next - nr))
2307	r2->tseqbase = oid_nil;
2308	do {
2309	canditer_setidx(&ci, ci.next - nr);
2310	for (i = `0`; i < nr; i++) {
2311	APPEND(r2, canditer_next(&ci));
2312	}
2313	} while (--nl > `0`);
2314	} else {
2315	if (r2->batCount > `0` &&
2316	BATtdense(r2) &&
2317	((oid *) r2->theap.base)[r2->batCount - `1`] + `1` != canditer_peek(rci))
2318	r2->tseqbase = oid_nil;
2319	do {
2320	struct canditer ci = rci; /* work on copy /
2321	for (i = `0`; i < nr; i++) {
2322	APPEND(r2, canditer_next(&ci));
2323	}
2324	} while (--nl > `0`);
2325	}
2326	}
2327	/ also set other bits of heap to correct value to indicate size /
2328	BATsetcount(r1, BATcount(r1));
2329	r1->tseqbase = oid_nil;
2330	if (r2) {
2331	BATsetcount(r2, BATcount(r2));
2332	assert(BATcount(r1) == BATcount(r2));
2333	r2->tseqbase = oid_nil;
2334	}
2335	if (BATcount(r1) > `0`) {
2336	if (BATtdense(r1))
2337	r1->tseqbase = ((oid *) r1->theap.base)[`0`];
2338	if (r2 && BATtdense(r2))
2339	r2->tseqbase = ((oid *) r2->theap.base)[`0`];
2340	} else {
2341	r1->tseqbase = `0`;
2342	if (r2) {
2343	r2->tseqbase = `0`;
2344	}
2345	}
2346	ALGODEBUG fprintf(stderr, "#%s: %s(l=" ALGOBATFMT ","
2347	"r=" ALGOBATFMT ",sl=" ALGOOPTBATFMT ","
2348	"sr=" ALGOOPTBATFMT ",nil_matches=%d,"
2349	"nil_on_miss=%d,semi=%d,only_misses=%d,"
2350	"not_in=%d)%s %s "
2351	"-> (" ALGOBATFMT "," ALGOOPTBATFMT ") " LLFMT "us\n",
2352	MT_thread_getname(), __func__,
2353	ALGOBATPAR(l), ALGOBATPAR(r),
2354	ALGOOPTBATPAR(sl), ALGOOPTBATPAR(sr),
2355	nil_matches, nil_on_miss, semi, only_misses, not_in,
2356	swapped ? " swapped" : "", reason,
2357	ALGOBATPAR(r1), ALGOOPTBATPAR(r2),
2358	GDKusec() - t0);
2359
2360	return GDK_SUCCEED;
2361
2362	bailout:
2363	BBPreclaim(r1);
2364	BBPreclaim(r2);
2365	return GDK_FAIL;
2366	}
2367
2368	#define HASHLOOPBODY() \
2369	do { \
2370	MAYBEEXTEND(1, lci); \
2371	APPEND(r1, lo); \
2372	if (r2) \
2373	APPEND(r2, ro); \
2374	nr++; \
2375	} while (false)
2376
2377	#define HASHloop_bound_TYPE(vals, h, hb, v, lo, hi, TYPE) \
2378	for (hb = HASHget(h, hash_##TYPE(h, &v)); \
2379	hb != HASHnil(h); \
2380	hb = HASHgetlink(h,hb)) \
2381	if (hb >= (lo) && hb < (hi) && \
2382	v == vals[hb])
2383
2384	#define HASHloop_bound(bi, h, hb, v, lo, hi) \
2385	for (hb = HASHget(h, HASHprobe((h), v)); \
2386	hb != HASHnil(h); \
2387	hb = HASHgetlink(h,hb)) \
2388	if (hb >= (lo) && hb < (hi) && \
2389	(cmp == NULL \|\| \
2390	(*cmp)(v, BUNtail(bi, hb)) == 0))
2391
2392	#define HASHJOIN(TYPE) \
2393	do { \
2394	TYPE *rvals = Tloc(r, 0); \
2395	TYPE *lvals = Tloc(l, 0); \
2396	TYPE v; \
2397	while (lci->next < lci->ncand) { \
2398	lo = canditer_next(lci); \
2399	v = lvals[lo - l->hseqbase]; \
2400	nr = 0; \
2401	if ((!nil_matches \|\| not_in) && is_##TYPE##_nil(v)) { \
2402	/* no match */ \
2403	if (not_in) \
2404	continue; \
2405	} else if (sr) { \
2406	for (rb = HASHget(hsh, hash_##TYPE(hsh, &v)); \
2407	rb != HASHnil(hsh); \
2408	rb = HASHgetlink(hsh, rb)) { \
2409	ro = BUNtoid(sr, rb); \
2410	if (v != rvals[ro - r->hseqbase]) \
2411	continue; \
2412	if (only_misses) { \
2413	nr++; \
2414	break; \
2415	} \
2416	HASHLOOPBODY(); \
2417	if (semi) \
2418	break; \
2419	} \
2420	} else { \
2421	HASHloop_bound_TYPE(rvals, hsh, rb, v, rl, rh, TYPE) { \
2422	ro = (oid) (rb - rl + rseq); \
2423	if (only_misses) { \
2424	nr++; \
2425	break; \
2426	} \
2427	HASHLOOPBODY(); \
2428	if (semi) \
2429	break; \
2430	} \
2431	} \
2432	if (nr == 0) { \
2433	if (only_misses) { \
2434	nr = 1; \
2435	MAYBEEXTEND(1, lci); \
2436	APPEND(r1, lo); \
2437	if (lskipped) \
2438	r1->tseqbase = oid_nil; \
2439	} else if (nil_on_miss) { \
2440	nr = 1; \
2441	r2->tnil = true; \
2442	r2->tnonil = false; \
2443	r2->tkey = false; \
2444	MAYBEEXTEND(1, lci); \
2445	APPEND(r1, lo); \
2446	APPEND(r2, oid_nil); \
2447	} else { \
2448	lskipped = BATcount(r1) > 0; \
2449	} \
2450	} else if (only_misses) { \
2451	lskipped = BATcount(r1) > 0; \
2452	} else { \
2453	if (lskipped) { \
2454	/* note, we only get here in an \
2455	* iteration after lskipped was \
2456	* first set to true, i.e. we did \
2457	* indeed skip values in l */ \
2458	r1->tseqbase = oid_nil; \
2459	} \
2460	if (nr > 1) { \
2461	r1->tkey = false; \
2462	r1->tseqbase = oid_nil; \
2463	} \
2464	} \
2465	if (nr > 0 && BATcount(r1) > nr) \
2466	r1->trevsorted = false; \
2467	} \
2468	} while (0)
2469
2470	/ Implementation of join using a hash lookup of values in the right*
2471	* column. */
2472	static gdk_return
2473	hashjoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr,
2474	struct canditer *restrict lci, struct canditer *restrict rci,
2475	bool nil_matches, bool nil_on_miss, bool semi, bool only_misses,
2476	bool not_in,
2477	BUN estimate, lng t0, bool swapped, bool phash, const char *reason)
2478	{
2479	oid lo, ro;
2480	BATiter ri;
2481	BUN rb;
2482	BUN rl, rh;
2483	oid rseq;
2484	BUN nr;
2485	const char *lvals;
2486	const char *lvars;
2487	int lwidth;
2488	const void *nil = ATOMnilptr(l->ttype);
2489	int (cmp)(const* void , const* void *) = ATOMcompare(l->ttype);
2490	oid lval = oid_nil; / hold value if l is dense /
2491	const char v = (const* char *) &lval;
2492	bool lskipped = false; / whether we skipped values in l /
2493	Hash *restrict hsh;
2494
2495	assert(!BATtvoid(r));
2496	assert(ATOMtype(l->ttype) == ATOMtype(r->ttype));
2497	assert(sl == NULL \|\| sl->tsorted);
2498	assert(sr == NULL \|\| sr->tsorted);
2499
2500	int t = ATOMbasetype(r->ttype);
2501	if (r->ttype == TYPE_void \|\| l->ttype == TYPE_void)
2502	t = TYPE_void;
2503
2504	lwidth = l->twidth;
2505	lvals = (const char *) Tloc(l, `0`);
2506	if (l->tvarsized && l->ttype) {
2507	assert(r->tvarsized && r->ttype);
2508	lvars = l->tvheap->base;
2509	} else {
2510	assert(!r->tvarsized \|\| !r->ttype);
2511	lvars = NULL;
2512	}
2513	/ offset to convert BUN to OID for value in right column /
2514	rseq = r->hseqbase;
2515
2516	if (lci->ncand == `0` \|\| rci->ncand== `0`)
2517	return nomatch(r1p, r2p, l, r, lci,
2518	nil_on_miss, only_misses, "hashjoin", t0);
2519
2520	BUN maxsize = joininitresults(r1p, r2p, lci->ncand, rci->ncand,
2521	l->tkey, r->tkey, semi, nil_on_miss,
2522	only_misses, estimate);
2523	if (maxsize == BUN_NONE)
2524	return GDK_FAIL;
2525
2526	BAT r1 = r1p;
2527	BAT r2 = r2p ? r2p : NULL;
2528
2529	rl = rci->seq - r->hseqbase;
2530	rh = canditer_last(rci) + `1` - r->hseqbase;
2531	if (phash) {
2532	BAT *b = BBPdescriptor(VIEWtparent(r));
2533	assert(sr == NULL);
2534	ALGODEBUG fprintf(stderr, "#%s: %s(%s): using "
2535	"parent(" ALGOBATFMT ") for hash\n",
2536	MT_thread_getname(), __func__,
2537	BATgetId(r), ALGOBATPAR(b));
2538	rl += (BUN) ((r->theap.base - b->theap.base) >> r->tshift);
2539	rh += rl;
2540	r = b;
2541	}
2542
2543	if (sr) {
2544	if (BATtdense(sr) &&
2545	BATcheckhash(r) &&
2546	BATcount(r) / ((size_t ) r->thash->heap.base)[`5`] lci->ncand < lci->ncand + rci->ncand) {
2547	ALGODEBUG fprintf(stderr, "#%s: %s(%s): using "
2548	"existing hash with candidate list\n",
2549	MT_thread_getname(), __func__,
2550	BATgetId(r));
2551	hsh = r->thash;
2552	sr = NULL;
2553	} else {
2554	int len;
2555	char ext[`32`];
2556	assert(!phash);
2557	ALGODEBUG fprintf(stderr, "#%s: %s(%s): creating "
2558	"hash for candidate list\n",
2559	MT_thread_getname(), __func__,
2560	BATgetId(r));
2561	len = snprintf(ext, sizeof(ext), "thash%x", sr->batCacheid);
2562	if (len == -`1` \|\| len >= (int) sizeof(ext))
2563	goto bailout;
2564	if ((hsh = BAThash_impl(r, sr, ext)) == NULL) {
2565	goto bailout;
2566	}
2567	}
2568	} else {
2569	if (BAThash(r) != GDK_SUCCEED) {
2570	hsh = NULL;
2571	goto bailout;
2572	}
2573	hsh = r->thash;
2574	}
2575	ri = bat_iterator(r);
2576
2577	if (not_in && !r->tnonil) {
2578	/ check whether there is a nil on the right, since if*
2579	* so, we should return an empty result */
2580	if (sr) {
2581	for (rb = HASHget(hsh, HASHprobe(hsh, nil));
2582	rb != HASHnil(hsh);
2583	rb = HASHgetlink(hsh, rb)) {
2584	ro = BUNtoid(sr, rb);
2585	if ((*cmp)(v, BUNtail(ri, ro - r->hseqbase)) != `0`) {
2586	HEAPfree(&hsh->heap, true);
2587	GDKfree(hsh);
2588	return nomatch(r1p, r2p, l, r, lci,
2589	false, false, "hashjoin", t0);
2590	}
2591	}
2592	} else {
2593	HASHloop_bound(ri, hsh, rb, nil, rl, rh) {
2594	return nomatch(r1p, r2p, l, r, lci,
2595	false, false, "hashjoin", t0);
2596	}
2597	}
2598	}
2599
2600	/ basic properties will be adjusted if necessary later on,*
2601	* they were initially set by joininitresults() */
2602
2603	if (r2) {
2604	r2->tkey = l->tkey;
2605	/ r2 is not likely to be sorted (although it is*
2606	* certainly possible) */
2607	r2->tsorted = false;
2608	r2->trevsorted = false;
2609	r2->tseqbase = oid_nil;
2610	}
2611
2612	if (sl && !BATtdense(sl))
2613	r1->tseqbase = oid_nil;
2614
2615	switch (t) {
2616	case TYPE_int:
2617	HASHJOIN(int);
2618	break;
2619	case TYPE_lng:
2620	HASHJOIN(lng);
2621	break;
2622	default:
2623	while (lci->next < lci->ncand) {
2624	lo = canditer_next(lci);
2625	if (BATtvoid(l)) {
2626	if (BATtdense(l))
2627	lval = lo - l->hseqbase + l->tseqbase;
2628	} else {
2629	v = VALUE(l, lo - l->hseqbase);
2630	}
2631	nr = `0`;
2632	if ((!nil_matches \|\| not_in) && cmp(v, nil) == `0`) {
2633	/ no match /
2634	if (not_in)
2635	continue;
2636	} else if (sr) {
2637	for (rb = HASHget(hsh, HASHprobe(hsh, v));
2638	rb != HASHnil(hsh);
2639	rb = HASHgetlink(hsh, rb)) {
2640	ro = BUNtoid(sr, rb);
2641	if ((*cmp)(v, BUNtail(ri, ro - r->hseqbase)) != `0`)
2642	continue;
2643	if (only_misses) {
2644	nr++;
2645	break;
2646	}
2647	HASHLOOPBODY();
2648	if (semi)
2649	break;
2650	}
2651	} else {
2652	HASHloop_bound(ri, hsh, rb, v, rl, rh) {
2653	ro = (oid) (rb - rl + rseq);
2654	if (only_misses) {
2655	nr++;
2656	break;
2657	}
2658	HASHLOOPBODY();
2659	if (semi)
2660	break;
2661	}
2662	}
2663	if (nr == `0`) {
2664	if (only_misses) {
2665	nr = `1`;
2666	MAYBEEXTEND(`1`, lci);
2667	APPEND(r1, lo);
2668	if (lskipped)
2669	r1->tseqbase = oid_nil;
2670	} else if (nil_on_miss) {
2671	nr = `1`;
2672	r2->tnil = true;
2673	r2->tnonil = false;
2674	r2->tkey = false;
2675	MAYBEEXTEND(`1`, lci);
2676	APPEND(r1, lo);
2677	APPEND(r2, oid_nil);
2678	} else {
2679	lskipped = BATcount(r1) > `0`;
2680	}
2681	} else if (only_misses) {
2682	lskipped = BATcount(r1) > `0`;
2683	} else {
2684	if (lskipped) {
2685	/ note, we only get here in an*
2686	* iteration after lskipped was
2687	* first set to true, i.e. we did
2688	* indeed skip values in l */
2689	r1->tseqbase = oid_nil;
2690	}
2691	if (nr > `1`) {
2692	r1->tkey = false;
2693	r1->tseqbase = oid_nil;
2694	}
2695	}
2696	if (nr > `0` && BATcount(r1) > nr)
2697	r1->trevsorted = false;
2698	}
2699	break;
2700	}
2701	if (sr) {
2702	HEAPfree(&hsh->heap, true);
2703	GDKfree(hsh);
2704	}
2705	/ also set other bits of heap to correct value to indicate size /
2706	BATsetcount(r1, BATcount(r1));
2707	if (BATcount(r1) <= `1`) {
2708	r1->tsorted = true;
2709	r1->trevsorted = true;
2710	r1->tkey = true;
2711	r1->tseqbase = `0`;
2712	}
2713	if (r2) {
2714	BATsetcount(r2, BATcount(r2));
2715	assert(BATcount(r1) == BATcount(r2));
2716	if (BATcount(r2) <= `1`) {
2717	r2->tsorted = true;
2718	r2->trevsorted = true;
2719	r2->tkey = true;
2720	r2->tseqbase = `0`;
2721	}
2722	}
2723	if (BATcount(r1) > `0`) {
2724	if (BATtdense(r1))
2725	r1->tseqbase = ((oid *) r1->theap.base)[`0`];
2726	if (r2 && BATtdense(r2))
2727	r2->tseqbase = ((oid *) r2->theap.base)[`0`];
2728	} else {
2729	r1->tseqbase = `0`;
2730	if (r2) {
2731	r2->tseqbase = `0`;
2732	}
2733	}
2734	ALGODEBUG fprintf(stderr, "#%s: %s(l=" ALGOBATFMT ","
2735	"r=" ALGOBATFMT ",sl=" ALGOOPTBATFMT ","
2736	"sr=" ALGOOPTBATFMT ",nil_matches=%d,"
2737	"nil_on_miss=%d,semi=%d,only_misses=%d,"
2738	"not_in=%d)%s %s "
2739	"-> (" ALGOBATFMT "," ALGOOPTBATFMT ") " LLFMT "us\n",
2740	MT_thread_getname(), __func__,
2741	ALGOBATPAR(l), ALGOBATPAR(r),
2742	ALGOOPTBATPAR(sl), ALGOOPTBATPAR(sr),
2743	nil_matches, nil_on_miss, semi, only_misses, not_in,
2744	swapped ? " swapped" : "", reason,
2745	ALGOBATPAR(r1), ALGOOPTBATPAR(r2),
2746	GDKusec() - t0);
2747
2748	return GDK_SUCCEED;
2749
2750	bailout:
2751	if (sr && hsh) {
2752	HEAPfree(&hsh->heap, true);
2753	GDKfree(hsh);
2754	}
2755	BBPreclaim(r1);
2756	BBPreclaim(r2);
2757	return GDK_FAIL;
2758	}
2759
2760	#define MASK_EQ 1
2761	#define MASK_LT 2
2762	#define MASK_GT 4
2763	#define MASK_LE (MASK_EQ \| MASK_LT)
2764	#define MASK_GE (MASK_EQ \| MASK_GT)
2765	#define MASK_NE (MASK_LT \| MASK_GT)
2766
2767	static gdk_return
2768	thetajoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr, int opcode, BUN estimate, lng t0)
2769	{
2770	struct canditer lci, rci;
2771	BUN lcnt, rcnt;
2772	const char lvals, rvals;
2773	const char lvars, rvars;
2774	int lwidth, rwidth;
2775	const void *nil = ATOMnilptr(l->ttype);
2776	int (cmp)(const* void , const* void *) = ATOMcompare(l->ttype);
2777	const void vl, vr;
2778	oid lastr = `0`; / last value inserted into r2 /
2779	BUN nr;
2780	oid lo, ro;
2781	int c;
2782	bool lskipped = false; / whether we skipped values in l /
2783	lng loff = `0`, roff = `0`;
2784	oid lval = oid_nil, rval = oid_nil;
2785
2786	ALGODEBUG fprintf(stderr, "#thetajoin(l=" ALGOBATFMT ","
2787	"r=" ALGOBATFMT ",sl=" ALGOOPTBATFMT ","
2788	"sr=" ALGOOPTBATFMT ",op=%s%s%s)\n",
2789	ALGOBATPAR(l), ALGOBATPAR(r), ALGOOPTBATPAR(sl), ALGOOPTBATPAR(sr),
2790	opcode & MASK_LT ? "<" : "",
2791	opcode & MASK_GT ? ">" : "",
2792	opcode & MASK_EQ ? "=" : "");
2793
2794	assert(ATOMtype(l->ttype) == ATOMtype(r->ttype));
2795	assert(sl == NULL \|\| sl->tsorted);
2796	assert(sr == NULL \|\| sr->tsorted);
2797	assert((opcode & (MASK_EQ \| MASK_LT \| MASK_GT)) != `0`);
2798
2799	lcnt = canditer_init(&lci, l, sl);
2800	rcnt = canditer_init(&rci, r, sr);
2801
2802	lvals = BATtvoid(l) ? NULL : (const char *) Tloc(l, `0`);
2803	rvals = BATtvoid(r) ? NULL : (const char *) Tloc(r, `0`);
2804	if (l->tvarsized && l->ttype) {
2805	assert(r->tvarsized && r->ttype);
2806	lvars = l->tvheap->base;
2807	rvars = r->tvheap->base;
2808	} else {
2809	assert(!r->tvarsized \|\| !r->ttype);
2810	lvars = rvars = NULL;
2811	}
2812	lwidth = l->twidth;
2813	rwidth = r->twidth;
2814
2815	if (BATtvoid(l)) {
2816	if (!BATtdense(l)) {
2817	/ trivial: nils don't match anything /
2818	return nomatch(r1p, r2p, l, r, &lci,
2819	false, false, "thetajoin", t0);
2820	}
2821	loff = (lng) l->tseqbase - (lng) l->hseqbase;
2822	}
2823	if (BATtvoid(r)) {
2824	if (!BATtdense(r)) {
2825	/ trivial: nils don't match anything /
2826	return nomatch(r1p, r2p, l, r, &lci,
2827	false, false, "thetajoin", t0);
2828	}
2829	roff = (lng) r->tseqbase - (lng) r->hseqbase;
2830	}
2831
2832	BUN maxsize = joininitresults(r1p, r2p, lcnt, rcnt, false, false,
2833	false, false, false, estimate);
2834	if (maxsize == BUN_NONE)
2835	return GDK_FAIL;
2836	BAT r1 = r1p;
2837	BAT r2 = r2p ? r2p : NULL;
2838
2839	r1->tkey = true;
2840	r1->tsorted = true;
2841	r1->trevsorted = true;
2842	if (r2) {
2843	r2->tkey = true;
2844	r2->tsorted = true;
2845	r2->trevsorted = true;
2846	}
2847
2848	/ nested loop implementation for theta join /
2849	vl = &lval;
2850	vr = &rval;
2851	for (BUN li = `0`; li < lci.ncand; li++) {
2852	lo = canditer_next(&lci);
2853	if (lvals)
2854	vl = VALUE(l, lo - l->hseqbase);
2855	else
2856	lval = (oid) ((lng) lo + loff);
2857	nr = `0`;
2858	if (cmp(vl, nil) != `0`) {
2859	canditer_reset(&rci);
2860	for (BUN ri = `0`; ri < rci.ncand; ri++) {
2861	ro = canditer_next(&rci);
2862	if (rvals)
2863	vr = VALUE(r, ro - r->hseqbase);
2864	else
2865	rval = (oid) ((lng) ro + roff);
2866	if (cmp(vr, nil) == `0`)
2867	continue;
2868	c = cmp(vl, vr);
2869	if (!((opcode & MASK_LT && c < `0`) \|\|
2870	(opcode & MASK_GT && c > `0`) \|\|
2871	(opcode & MASK_EQ && c == `0`)))
2872	continue;
2873	MAYBEEXTEND(`1`, &lci);
2874	if (BATcount(r1) > `0`) {
2875	if (r2 && lastr + `1` != ro)
2876	r2->tseqbase = oid_nil;
2877	if (nr == `0`) {
2878	r1->trevsorted = false;
2879	if (r2 == NULL) {
2880	/ nothing /
2881	} else if (lastr > ro) {
2882	r2->tsorted = false;
2883	r2->tkey = false;
2884	} else if (lastr < ro) {
2885	r2->trevsorted = false;
2886	} else {
2887	r2->tkey = false;
2888	}
2889	}
2890	}
2891	APPEND(r1, lo);
2892	if (r2) {
2893	APPEND(r2, ro);
2894	}
2895	lastr = ro;
2896	nr++;
2897	}
2898	}
2899	if (nr > `1`) {
2900	r1->tkey = false;
2901	r1->tseqbase = oid_nil;
2902	if (r2) {
2903	r2->trevsorted = false;
2904	}
2905	} else if (nr == `0`) {
2906	lskipped = BATcount(r1) > `0`;
2907	} else if (lskipped) {
2908	r1->tseqbase = oid_nil;
2909	}
2910	}
2911	/ also set other bits of heap to correct value to indicate size /
2912	BATsetcount(r1, BATcount(r1));
2913	if (r2) {
2914	BATsetcount(r2, BATcount(r2));
2915	assert(BATcount(r1) == BATcount(r2));
2916	}
2917	if (BATcount(r1) > `0`) {
2918	if (BATtdense(r1))
2919	r1->tseqbase = ((oid *) r1->theap.base)[`0`];
2920	if (r2 && BATtdense(r2))
2921	r2->tseqbase = ((oid *) r2->theap.base)[`0`];
2922	} else {
2923	r1->tseqbase = `0`;
2924	if (r2) {
2925	r2->tseqbase = `0`;
2926	}
2927	}
2928	ALGODEBUG fprintf(stderr, "#thetajoin(l=%s,r=%s)=(" ALGOBATFMT "," ALGOOPTBATFMT ") " LLFMT "us\n",
2929	BATgetId(l), BATgetId(r),
2930	ALGOBATPAR(r1), ALGOOPTBATPAR(r2),
2931	GDKusec() - t0);
2932	return GDK_SUCCEED;
2933
2934	bailout:
2935	BBPreclaim(r1);
2936	BBPreclaim(r2);
2937	return GDK_FAIL;
2938	}
2939
2940	static gdk_return
2941	bandjoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr,
2942	const void c1, const* void *c2, bool li, bool hi, BUN estimate,
2943	lng t0)
2944	{
2945	BUN lcnt, rcnt;
2946	struct canditer lci, rci;
2947	const char lvals, rvals;
2948	int lwidth, rwidth;
2949	int t;
2950	const void *nil = ATOMnilptr(l->ttype);
2951	int (cmp)(const* void , const* void *) = ATOMcompare(l->ttype);
2952	const char vl, vr;
2953	oid lastr = `0`; / last value inserted into r2 /
2954	BUN nr;
2955	oid lo, ro;
2956	bool lskipped = false; / whether we skipped values in l /
2957	BUN nils = `0`; / needed for XXX_WITH_CHECK macros /
2958
2959	assert(ATOMtype(l->ttype) == ATOMtype(r->ttype));
2960	assert(sl == NULL \|\| sl->tsorted);
2961	assert(sr == NULL \|\| sr->tsorted);
2962
2963	t = ATOMtype(l->ttype);
2964	t = ATOMbasetype(t);
2965
2966	lcnt = canditer_init(&lci, l, sl);
2967	rcnt = canditer_init(&rci, r, sr);
2968
2969	if (lcnt == `0` \|\| rcnt == `0`)
2970	return nomatch(r1p, r2p, l, r, &lci,
2971	false, false, "bandjoin", t0);
2972
2973	switch (t) {
2974	case TYPE_bte:
2975	if (is_bte_nil((const* bte *)c1) \|\|
2976	is_bte_nil((const* bte *)c2) \|\|
2977	-(const* bte )c1 > (const bte *)c2 \|\|
2978	((!hi \|\| !li) && -(const* bte )c1 == (const bte *)c2))
2979	return nomatch(r1p, r2p, l, r, &lci,
2980	false, false, "bandjoin", t0);
2981	break;
2982	case TYPE_sht:
2983	if (is_sht_nil((const* sht *)c1) \|\|
2984	is_sht_nil((const* sht *)c2) \|\|
2985	-(const* sht )c1 > (const sht *)c2 \|\|
2986	((!hi \|\| !li) && -(const* sht )c1 == (const sht *)c2))
2987	return nomatch(r1p, r2p, l, r, &lci,
2988	false, false, "bandjoin", t0);
2989	break;
2990	case TYPE_int:
2991	if (is_int_nil((const* int *)c1) \|\|
2992	is_int_nil((const* int *)c2) \|\|
2993	-(const* int )c1 > (const int *)c2 \|\|
2994	((!hi \|\| !li) && -(const* int )c1 == (const int *)c2))
2995	return nomatch(r1p, r2p, l, r, &lci,
2996	false, false, "bandjoin", t0);
2997	break;
2998	case TYPE_lng:
2999	if (is_lng_nil((const* lng *)c1) \|\|
3000	is_lng_nil((const* lng *)c2) \|\|
3001	-(const* lng )c1 > (const lng *)c2 \|\|
3002	((!hi \|\| !li) && -(const* lng )c1 == (const lng *)c2))
3003	return nomatch(r1p, r2p, l, r, &lci,
3004	false, false, "bandjoin", t0);
3005	break;
3006	#ifdef HAVE_HGE
3007	case TYPE_hge:
3008	if (is_hge_nil((const* hge *)c1) \|\|
3009	is_hge_nil((const* hge *)c2) \|\|
3010	-(const* hge )c1 > (const hge *)c2 \|\|
3011	((!hi \|\| !li) && -(const* hge )c1 == (const hge *)c2))
3012	return nomatch(r1p, r2p, l, r, &lci,
3013	false, false, "bandjoin", t0);
3014	break;
3015	#endif
3016	case TYPE_flt:
3017	if (is_flt_nil((const* flt *)c1) \|\|
3018	is_flt_nil((const* flt *)c2) \|\|
3019	-(const* flt )c1 > (const flt *)c2 \|\|
3020	((!hi \|\| !li) && -(const* flt )c1 == (const flt *)c2))
3021	return nomatch(r1p, r2p, l, r, &lci,
3022	false, false, "bandjoin", t0);
3023	break;
3024	case TYPE_dbl:
3025	if (is_dbl_nil((const* dbl *)c1) \|\|
3026	is_dbl_nil((const* dbl *)c2) \|\|
3027	-(const* dbl )c1 > (const dbl *)c2 \|\|
3028	((!hi \|\| !li) && -(const* dbl )c1 == (const dbl *)c2))
3029	return nomatch(r1p, r2p, l, r, &lci,
3030	false, false, "bandjoin", t0);
3031	break;
3032	default:
3033	GDKerror("BATbandjoin: unsupported type\n");
3034	return GDK_FAIL;
3035	}
3036
3037	BUN maxsize = joininitresults(r1p, r2p, lcnt, rcnt, false, false,
3038	false, false, false, estimate);
3039	if (maxsize == BUN_NONE)
3040	return GDK_FAIL;
3041	BAT r1 = r1p;
3042	BAT r2 = r2p ? r2p : NULL;
3043
3044	lvals = (const char *) Tloc(l, `0`);
3045	rvals = (const char *) Tloc(r, `0`);
3046	assert(!r->tvarsized);
3047	lwidth = l->twidth;
3048	rwidth = r->twidth;
3049
3050	assert(lvals != NULL);
3051	assert(rvals != NULL);
3052
3053	r1->tkey = true;
3054	r1->tsorted = true;
3055	r1->trevsorted = true;
3056	if (r2) {
3057	r2->tkey = true;
3058	r2->tsorted = true;
3059	r2->trevsorted = true;
3060	}
3061
3062	/ nested loop implementation for band join /
3063	for (BUN li = `0`; li < lcnt; li++) {
3064	lo = canditer_next(&lci);
3065	vl = FVALUE(l, lo - l->hseqbase);
3066	if (cmp(vl, nil) == `0`)
3067	continue;
3068	nr = `0`;
3069	canditer_reset(&rci);
3070	for (BUN ri = `0`; ri < rcnt; ri++) {
3071	ro = canditer_next(&rci);
3072	vr = FVALUE(r, ro - r->hseqbase);
3073	switch (ATOMtype(l->ttype)) {
3074	case TYPE_bte: {
3075	if (is_bte_nil((const* bte *) vr))
3076	continue;
3077	sht v1 = (sht) (const* bte *) vr, v2;
3078	v2 = v1;
3079	v1 -= (const* bte *)c1;
3080	if ((const* bte *)vl <= v1 &&
3081	(!li \|\| (const* bte *)vl != v1))
3082	continue;
3083	v2 += (const* bte *)c2;
3084	if ((const* bte *)vl >= v2 &&
3085	(!hi \|\| (const* bte *)vl != v2))
3086	continue;
3087	break;
3088	}
3089	case TYPE_sht: {
3090	if (is_sht_nil((const* sht *) vr))
3091	continue;
3092	int v1 = (int) (const* sht *) vr, v2;
3093	v2 = v1;
3094	v1 -= (const* sht *)c1;
3095	if ((const* sht *)vl <= v1 &&
3096	(!li \|\| (const* sht *)vl != v1))
3097	continue;
3098	v2 += (const* sht *)c2;
3099	if ((const* sht *)vl >= v2 &&
3100	(!hi \|\| (const* sht *)vl != v2))
3101	continue;
3102	break;
3103	}
3104	case TYPE_int: {
3105	if (is_int_nil((const* int *) vr))
3106	continue;
3107	lng v1 = (lng) (const* int *) vr, v2;
3108	v2 = v1;
3109	v1 -= (const* int *)c1;
3110	if ((const* int *)vl <= v1 &&
3111	(!li \|\| (const* int *)vl != v1))
3112	continue;
3113	v2 += (const* int *)c2;
3114	if ((const* int *)vl >= v2 &&
3115	(!hi \|\| (const* int *)vl != v2))
3116	continue;
3117	break;
3118	}
3119	#ifdef HAVE_HGE
3120	case TYPE_lng: {
3121	if (is_lng_nil((const* lng *) vr))
3122	continue;
3123	hge v1 = (hge) (const* lng *) vr, v2;
3124	v2 = v1;
3125	v1 -= (const* lng *)c1;
3126	if ((const* lng *)vl <= v1 &&
3127	(!li \|\| (const* lng *)vl != v1))
3128	continue;
3129	v2 += (const* lng *)c2;
3130	if ((const* lng *)vl >= v2 &&
3131	(!hi \|\| (const* lng *)vl != v2))
3132	continue;
3133	break;
3134	}
3135	#else
3136	#ifdef HAVE___INT128
3137	case TYPE_lng: {
3138	if (is_lng_nil((const* lng *) vr))
3139	continue;
3140	__int128 v1 = (__int128) (const* lng *) vr, v2;
3141	v2 = v1;
3142	v1 -= (const* lng *)c1;
3143	if ((const* lng *)vl <= v1 &&
3144	(!li \|\| (const* lng *)vl != v1))
3145	continue;
3146	v2 += (const* lng *)c2;
3147	if ((const* lng *)vl >= v2 &&
3148	(!hi \|\| (const* lng *)vl != v2))
3149	continue;
3150	break;
3151	}
3152	#else
3153	case TYPE_lng: {
3154	if (is_lng_nil((const* lng *) vr))
3155	continue;
3156	lng v1, v2;
3157	bool abort_on_error = true;
3158	SUB_WITH_CHECK((const* lng *)vr,
3159	(const* lng *)c1,
3160	lng, v1,
3161	GDK_lng_max,
3162	do{if((const* lng)c1<`0`)goto* nolmatch;else goto lmatch1;}while(false));
3163	if ((const* lng *)vl <= v1 &&
3164	(!li \|\| (const* lng *)vl != v1))
3165	continue;
3166	lmatch1:
3167	ADD_WITH_CHECK((const* lng *)vr,
3168	(const* lng *)c2,
3169	lng, v2,
3170	GDK_lng_max,
3171	do{if((const* lng)c2>`0`)goto* nolmatch;else goto lmatch2;}while(false));
3172	if ((const* lng *)vl >= v2 &&
3173	(!hi \|\| (const* lng *)vl != v2))
3174	continue;
3175	lmatch2:
3176	break;
3177	nolmatch:
3178	continue;
3179	}
3180	#endif
3181	#endif
3182	#ifdef HAVE_HGE
3183	case TYPE_hge: {
3184	if (is_hge_nil((const* hge *) vr))
3185	continue;
3186	hge v1, v2;
3187	bool abort_on_error = true;
3188	SUB_WITH_CHECK((const* hge *)vr,
3189	(const* hge *)c1,
3190	hge, v1,
3191	GDK_hge_max,
3192	do{if((const* hge)c1<`0`)goto* nohmatch;else goto hmatch1;}while(false));
3193	if ((const* hge *)vl <= v1 &&
3194	(!li \|\| (const* hge *)vl != v1))
3195	continue;
3196	hmatch1:
3197	ADD_WITH_CHECK((const* hge *)vr,
3198	(const* hge *)c2,
3199	hge, v2,
3200	GDK_hge_max,
3201	do{if((const* hge)c2>`0`)goto* nohmatch;else goto hmatch2;}while(false));
3202	if ((const* hge *)vl >= v2 &&
3203	(!hi \|\| (const* hge *)vl != v2))
3204	continue;
3205	hmatch2:
3206	break;
3207	nohmatch:
3208	continue;
3209	}
3210	#endif
3211	case TYPE_flt: {
3212	if (is_flt_nil((const* flt *) vr))
3213	continue;
3214	dbl v1 = (dbl) (const* flt *) vr, v2;
3215	v2 = v1;
3216	v1 -= (const* flt *)c1;
3217	if ((const* flt *)vl <= v1 &&
3218	(!li \|\| (const* flt *)vl != v1))
3219	continue;
3220	v2 += (const* flt *)c2;
3221	if ((const* flt *)vl >= v2 &&
3222	(!hi \|\| (const* flt *)vl != v2))
3223	continue;
3224	break;
3225	}
3226	case TYPE_dbl: {
3227	if (is_dbl_nil((const* dbl *) vr))
3228	continue;
3229	dbl v1, v2;
3230	bool abort_on_error = true;
3231	SUB_WITH_CHECK((const* dbl *)vr,
3232	(const* dbl *)c1,
3233	dbl, v1,
3234	GDK_dbl_max,
3235	do{if((const* dbl)c1<`0`)goto* nodmatch;else goto dmatch1;}while(false));
3236	if ((const* dbl *)vl <= v1 &&
3237	(!li \|\| (const* dbl *)vl != v1))
3238	continue;
3239	dmatch1:
3240	ADD_WITH_CHECK((const* dbl *)vr,
3241	(const* dbl *)c2,
3242	dbl, v2,
3243	GDK_dbl_max,
3244	do{if((const* dbl)c2>`0`)goto* nodmatch;else goto dmatch2;}while(false));
3245	if ((const* dbl *)vl >= v2 &&
3246	(!hi \|\| (const* dbl *)vl != v2))
3247	continue;
3248	dmatch2:
3249	break;
3250	nodmatch:
3251	continue;
3252	}
3253	}
3254	MAYBEEXTEND(`1`, &lci);
3255	if (BATcount(r1) > `0`) {
3256	if (r2 && lastr + `1` != ro)
3257	r2->tseqbase = oid_nil;
3258	if (nr == `0`) {
3259	r1->trevsorted = false;
3260	if (r2 == NULL) {
3261	/ nothing /
3262	} else if (lastr > ro) {
3263	r2->tsorted = false;
3264	r2->tkey = false;
3265	} else if (lastr < ro) {
3266	r2->trevsorted = false;
3267	} else {
3268	r2->tkey = false;
3269	}
3270	}
3271	}
3272	APPEND(r1, lo);
3273	if (r2) {
3274	APPEND(r2, ro);
3275	}
3276	lastr = ro;
3277	nr++;
3278	}
3279	if (nr > `1`) {
3280	r1->tkey = false;
3281	r1->tseqbase = oid_nil;
3282	if (r2) {
3283	r2->trevsorted = false;
3284	}
3285	} else if (nr == `0`) {
3286	lskipped = BATcount(r1) > `0`;
3287	} else if (lskipped) {
3288	r1->tseqbase = oid_nil;
3289	}
3290	}
3291	/ also set other bits of heap to correct value to indicate size /
3292	BATsetcount(r1, BATcount(r1));
3293	if (r2) {
3294	BATsetcount(r2, BATcount(r2));
3295	assert(BATcount(r1) == BATcount(r2));
3296	}
3297	if (BATcount(r1) > `0`) {
3298	if (BATtdense(r1))
3299	r1->tseqbase = ((oid *) r1->theap.base)[`0`];
3300	if (r2 && BATtdense(r2))
3301	r2->tseqbase = ((oid *) r2->theap.base)[`0`];
3302	} else {
3303	r1->tseqbase = `0`;
3304	if (r2) {
3305	r2->tseqbase = `0`;
3306	}
3307	}
3308	ALGODEBUG fprintf(stderr, "#BATbandjoin(l=%s,r=%s)=(" ALGOBATFMT "," ALGOOPTBATFMT ") " LLFMT "us\n",
3309	BATgetId(l), BATgetId(r),
3310	ALGOBATPAR(r1), ALGOOPTBATPAR(r2),
3311	GDKusec() - t0);
3312	return GDK_SUCCEED;
3313
3314	bailout:
3315	BBPreclaim(r1);
3316	BBPreclaim(r2);
3317	return GDK_FAIL;
3318	}
3319
3320	/ small ordered right, dense left, oid's only, do fetches /
3321	static gdk_return
3322	fetchjoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr,
3323	struct canditer *restrict lci, struct canditer *restrict rci,
3324	const char *reason, lng t0)
3325	{
3326	oid lo = lci->seq - l->hseqbase + l->tseqbase, hi = lo + lci->ncand;
3327	BUN b, e, p;
3328	BAT r1, r2 = NULL;
3329
3330	if (r->tsorted) {
3331	b = SORTfndfirst(r, &lo);
3332	e = SORTfndfirst(r, &hi);
3333	} else {
3334	assert(r->trevsorted);
3335	b = SORTfndlast(r, &hi);
3336	e = SORTfndlast(r, &lo);
3337	}
3338	if (b < rci->seq - r->hseqbase)
3339	b = rci->seq - r->hseqbase;
3340	if (e > rci->seq + rci->ncand - r->hseqbase)
3341	e = rci->seq + rci->ncand - r->hseqbase;
3342	if (e == b) {
3343	return nomatch(r1p, r2p, l, r, lci,
3344	false, false, "fetchjoin", t0);
3345	}
3346	r1 = COLnew(`0`, TYPE_oid, e - b, TRANSIENT);
3347	if (r1 == NULL)
3348	return GDK_FAIL;
3349	if (r2p) {
3350	if ((r2 = BATdense(`0`, r->hseqbase + b, e - b)) == NULL) {
3351	BBPreclaim(r1);
3352	return GDK_FAIL;
3353	}
3354	*r2p = r2;
3355	}
3356	*r1p = r1;
3357	oid op = (oid ) Tloc(r1, `0`);
3358	const oid rp = (const* oid *) Tloc(r, `0`);
3359	for (p = b; p < e; p++) {
3360	*op++ = rp[p] + l->hseqbase - l->tseqbase;
3361	}
3362	BATsetcount(r1, e - b);
3363	r1->tkey = r->tkey;
3364	r1->tsorted = r->tsorted \|\| e - b <= `1`;
3365	r1->trevsorted = r->trevsorted \|\| e - b <= `1`;
3366	r1->tseqbase = e == b ? `0` : e - b == `1` ? (const* oid *)Tloc(r1, `0`) : oid_nil;
3367	ALGODEBUG fprintf(stderr, "#%s: %s(l=" ALGOBATFMT ","
3368	"r=" ALGOBATFMT ",sl=" ALGOOPTBATFMT ","
3369	"sr=" ALGOOPTBATFMT ") %s "
3370	"-> (" ALGOBATFMT "," ALGOOPTBATFMT ") " LLFMT "us\n",
3371	MT_thread_getname(), __func__,
3372	ALGOBATPAR(l), ALGOBATPAR(r),
3373	ALGOOPTBATPAR(sl), ALGOOPTBATPAR(sr),
3374	reason,
3375	ALGOBATPAR(r1), ALGOOPTBATPAR(r2),
3376	GDKusec() - t0);
3377
3378	return GDK_SUCCEED;
3379	}
3380
3381
3382	/ Make the implementation choices for various left joins. /
3383	static gdk_return
3384	leftjoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr,
3385	bool nil_matches, bool nil_on_miss, bool semi, bool only_misses,
3386	bool not_in, BUN estimate, const char *func, lng t0)
3387	{
3388	BUN lcnt, rcnt;
3389	struct canditer lci, rci;
3390	bool phash = false;
3391
3392	/ only_misses implies left output only /
3393	assert(!only_misses \|\| r2p == NULL);
3394	/ if nil_on_miss is set, we really need a right output /
3395	assert(!nil_on_miss \|\| r2p != NULL);
3396	/ if not_in is set, then so is only_misses /
3397	assert(!not_in \|\| only_misses);
3398	*r1p = NULL;
3399	if (r2p)
3400	*r2p = NULL;
3401	if (joinparamcheck(l, r, NULL, sl, sr, func) != GDK_SUCCEED)
3402	return GDK_FAIL;
3403
3404	lcnt = canditer_init(&lci, l, sl);
3405	rcnt = canditer_init(&rci, r, sr);
3406
3407	if (lcnt == `0` \|\| (!only_misses && !nil_on_miss && rcnt == `0`)) {
3408	ALGODEBUG fprintf(stderr, "#%s(l=" ALGOBATFMT ","
3409	"r=" ALGOBATFMT ",sl=" ALGOOPTBATFMT ","
3410	"sr=" ALGOOPTBATFMT ",nil_matches=%d,"
3411	"nil_on_miss=%d,semi=%d,only_misses=%d,"
3412	"not_in=%d)\n",
3413	func,
3414	ALGOBATPAR(l), ALGOBATPAR(r),
3415	ALGOOPTBATPAR(sl), ALGOOPTBATPAR(sr),
3416	nil_matches, nil_on_miss, semi, only_misses,
3417	not_in);
3418	return nomatch(r1p, r2p, l, r, &lci,
3419	nil_on_miss, only_misses, func, t0);
3420	}
3421
3422	if (!nil_on_miss && !semi && !only_misses && !not_in &&
3423	(lcnt == `1` \|\| (BATordered(l) && BATordered_rev(l)) \|\|
3424	(l->ttype == TYPE_void && is_oid_nil(l->tseqbase)))) {
3425	/ single value to join, use select /
3426	return selectjoin(r1p, r2p, l, r, sl, sr,
3427	&lci, nil_matches, t0, false, func);
3428	} else if (BATtdense(r) && rci.tpe == cand_dense &&
3429	lcnt > `0` && rcnt > `0`) {
3430	/ use special implementation for dense right-hand side /
3431	return mergejoin_void(r1p, r2p, l, r, sl, sr, &lci, &rci,
3432	nil_on_miss, only_misses, t0, false,
3433	func);
3434	} else if (BATtdense(l)
3435	&& lci.tpe == cand_dense
3436	&& rci.tpe == cand_dense
3437	&& !semi
3438	&& !nil_matches
3439	&& !only_misses
3440	&& !not_in
3441	/ && (rcnt * 1024) < lcnt /
3442	&& (BATordered(r) \|\| BATordered_rev(r))) {
3443	assert(ATOMtype(l->ttype) == TYPE_oid); / tdense /
3444	return fetchjoin(r1p, r2p, l, r, sl, sr, &lci, &rci, func, t0);
3445	} else if ((BATordered(r) \|\| BATordered_rev(r))
3446	&& (BATordered(l)
3447	\|\| BATordered_rev(l)
3448	\|\| BATtdense(r)
3449	\|\| lcnt < `1024`
3450	\|\| BATcount(r) * (Tsize(r) + (r->tvheap ? r->tvheap->size : `0`) + `2` * sizeof(BUN)) > GDK_mem_maxsize / (GDKnr_threads ? GDKnr_threads : `1`))) {
3451	return mergejoin(r1p, r2p, l, r, sl, sr, &lci, &rci,
3452	nil_matches, nil_on_miss, semi, only_misses,
3453	not_in, estimate, t0, false, func);
3454	}
3455	phash = sr == NULL &&
3456	VIEWtparent(r) != `0` &&
3457	BATcount(BBPquickdesc(VIEWtparent(r), false)) == BATcount(r);
3458	return hashjoin(r1p, r2p, l, r, sl, sr, &lci, &rci,
3459	nil_matches, nil_on_miss, semi, only_misses,
3460	not_in, estimate, t0, false, phash, func);
3461	}
3462
3463	/ Perform an equi-join over l and r. Returns two new, aligned, bats*
3464	* with the oids of matching tuples. The result is in the same order
3465	* as l (i.e. r1 is sorted). */
3466	gdk_return
3467	BATleftjoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr, bool nil_matches, BUN estimate)
3468	{
3469	return leftjoin(r1p, r2p, l, r, sl, sr, nil_matches,
3470	false, false, false, false, estimate, "BATleftjoin",
3471	GDKdebug & ALGOMASK ? GDKusec() : `0`);
3472	}
3473
3474	/ Performs a left outer join over l and r. Returns two new, aligned,*
3475	* bats with the oids of matching tuples, or the oid in the first
3476	* output bat and nil in the second output bat if the value in l does
3477	* not occur in r. The result is in the same order as l (i.e. r1 is
3478	* sorted). */
3479	gdk_return
3480	BATouterjoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr, bool nil_matches, BUN estimate)
3481	{
3482	return leftjoin(r1p, r2p, l, r, sl, sr, nil_matches,
3483	true, false, false, false, estimate, "BATouterjoin",
3484	GDKdebug & ALGOMASK ? GDKusec() : `0`);
3485	}
3486
3487	/ Perform a semi-join over l and r. Returns one or two new, bats*
3488	* with the oids of matching tuples. The result is in the same order
3489	* as l (i.e. r1 is sorted). If a single bat is returned, it is a
3490	* candidate list. */
3491	gdk_return
3492	BATsemijoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr, bool nil_matches, BUN estimate)
3493	{
3494	return leftjoin(r1p, r2p, l, r, sl, sr, nil_matches,
3495	false, true, false, false, estimate, "BATsemijoin",
3496	GDKdebug & ALGOMASK ? GDKusec() : `0`);
3497	}
3498
3499	/ Return a candidate list with the list of rows in l whose value also*
3500	* occurs in r. This is just the left output of a semi-join. */
3501	BAT *
3502	BATintersect(BAT l, BAT r, BAT sl, BAT sr, bool nil_matches, BUN estimate)
3503	{
3504	BAT *bn;
3505
3506	if (leftjoin(&bn, NULL, l, r, sl, sr, nil_matches,
3507	false, true, false, false, estimate, "BATintersect",
3508	GDKdebug & ALGOMASK ? GDKusec() : `0`) == GDK_SUCCEED)
3509	return virtualize(bn);
3510	return NULL;
3511	}
3512
3513	/ Return the difference of l and r. The result is a BAT with the*
3514	* oids of those values in l that do not occur in r. This is what you
3515	* might call an anti-semi-join. The result is a candidate list. */
3516	BAT *
3517	BATdiff(BAT l, BAT r, BAT sl, BAT sr, bool nil_matches, bool not_in,
3518	BUN estimate)
3519	{
3520	BAT *bn;
3521
3522	if (leftjoin(&bn, NULL, l, r, sl, sr, nil_matches,
3523	false, false, true, not_in, estimate, "BATdiff",
3524	GDKdebug & ALGOMASK ? GDKusec() : `0`) == GDK_SUCCEED)
3525	return virtualize(bn);
3526	return NULL;
3527	}
3528
3529	gdk_return
3530	BATthetajoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr, int op, bool nil_matches, BUN estimate)
3531	{
3532	int opcode = `0`;
3533	lng t0 = `0`;
3534
3535	/ encode operator as a bit mask into opcode /
3536	switch (op) {
3537	case JOIN_EQ:
3538	return BATjoin(r1p, r2p, l, r, sl, sr, nil_matches, estimate);
3539	case JOIN_NE:
3540	opcode = MASK_NE;
3541	break;
3542	case JOIN_LT:
3543	opcode = MASK_LT;
3544	break;
3545	case JOIN_LE:
3546	opcode = MASK_LE;
3547	break;
3548	case JOIN_GT:
3549	opcode = MASK_GT;
3550	break;
3551	case JOIN_GE:
3552	opcode = MASK_GE;
3553	break;
3554	default:
3555	GDKerror("BATthetajoin: unknown operator %d.\n", op);
3556	return GDK_FAIL;
3557	}
3558
3559	ALGODEBUG t0 = GDKusec();
3560	*r1p = NULL;
3561	if (r2p) {
3562	*r2p = NULL;
3563	}
3564	if (joinparamcheck(l, r, NULL, sl, sr, "BATthetajoin") != GDK_SUCCEED)
3565	return GDK_FAIL;
3566
3567	return thetajoin(r1p, r2p, l, r, sl, sr, opcode, estimate, t0);
3568	}
3569
3570	gdk_return
3571	BATjoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr, bool nil_matches, BUN estimate)
3572	{
3573	struct canditer lci, rci;
3574	BUN lcnt, rcnt;
3575	BUN lsize, rsize;
3576	bool lhash = false, rhash = false;
3577	bool plhash = false, prhash = false;
3578	BUN lslots = `0`, rslots = `0`;
3579	bool swap;
3580	bat parent;
3581	size_t mem_size;
3582	lng t0 = `0`;
3583	const char *reason = "";
3584
3585	ALGODEBUG t0 = GDKusec();
3586
3587	if ((parent = VIEWtparent(l)) != `0`) {
3588	BAT *b = BBPdescriptor(parent);
3589	if (l->hseqbase == b->hseqbase &&
3590	BATcount(l) == BATcount(b))
3591	l = b;
3592	}
3593	if ((parent = VIEWtparent(r)) != `0`) {
3594	BAT *b = BBPdescriptor(parent);
3595	if (r->hseqbase == b->hseqbase &&
3596	BATcount(r) == BATcount(b))
3597	r = b;
3598	}
3599
3600	lcnt = canditer_init(&lci, l, sl);
3601	rcnt = canditer_init(&rci, r, sr);
3602
3603	*r1p = NULL;
3604	if (r2p) {
3605	*r2p = NULL;
3606	}
3607	if (joinparamcheck(l, r, NULL, sl, sr, "BATjoin") != GDK_SUCCEED)
3608	return GDK_FAIL;
3609
3610	if (lcnt == `0` \|\| rcnt == `0`) {
3611	ALGODEBUG fprintf(stderr, "#BATjoin(l=" ALGOBATFMT ","
3612	"r=" ALGOBATFMT ",sl=" ALGOOPTBATFMT ","
3613	"sr=" ALGOOPTBATFMT ",nil_matches=%d)\n",
3614	ALGOBATPAR(l), ALGOBATPAR(r),
3615	ALGOOPTBATPAR(sl), ALGOOPTBATPAR(sr),
3616	nil_matches);
3617	return nomatch(r1p, r2p, l, r, &lci,
3618	false, false, "BATjoin", t0);
3619	}
3620
3621	swap = false;
3622
3623	/ some statistics to help us decide /
3624	lsize = (BUN) (BATcount(l) * (Tsize(l)) + (l->tvheap ? l->tvheap->size : `0`) + `2` * sizeof(BUN));
3625	rsize = (BUN) (BATcount(r) * (Tsize(r)) + (r->tvheap ? r->tvheap->size : `0`) + `2` * sizeof(BUN));
3626	mem_size = GDK_mem_maxsize / (GDKnr_threads ? GDKnr_threads : `1`);
3627
3628	if (lcnt == `1` \|\| (BATordered(l) && BATordered_rev(l)) \|\| (l->ttype == TYPE_void && is_oid_nil(l->tseqbase))) {
3629	/ single value to join, use select /
3630	return selectjoin(r1p, r2p, l, r, sl, sr,
3631	&lci, nil_matches, t0, false, __func__);
3632	} else if (r2p != NULL && (rcnt == `1` \|\| (BATordered(r) && BATordered_rev(r)) \|\| (r->ttype == TYPE_void && is_oid_nil(r->tseqbase)))) {
3633	/ single value to join, use select /
3634	return selectjoin(r2p, r1p, r, l, sr, sl,
3635	&rci, nil_matches, t0, true, __func__);
3636	} else if (BATtdense(r) && rci.tpe == cand_dense) {
3637	/ use special implementation for dense right-hand side /
3638	return mergejoin_void(r1p, r2p, l, r, sl, sr, &lci, &rci,
3639	false, false, t0, false, __func__);
3640	} else if (r2p && BATtdense(l) && lci.tpe == cand_dense) {
3641	/ use special implementation for dense right-hand side /
3642	return mergejoin_void(r2p, r1p, r, l, sr, sl, &rci, &lci,
3643	false, false, t0, true, __func__);
3644	} else if ((BATordered(l) \|\| BATordered_rev(l)) &&
3645	(BATordered(r) \|\| BATordered_rev(r))) {
3646	/ both sorted /
3647	return mergejoin(r1p, r2p, l, r, sl, sr, &lci, &rci,
3648	nil_matches, false, false, false, false,
3649	estimate, t0, false, __func__);
3650	}
3651	if (sl == NULL) {
3652	lhash = BATcheckhash(l);
3653	if (lhash) {
3654	lslots = ((size_t *) l->thash->heap.base)[`5`];
3655	} else if ((parent = VIEWtparent(l)) != `0`) {
3656	BAT *b = BBPdescriptor(parent);
3657	/ use hash on parent if the average chain*
3658	* length times the number of required probes
3659	* is less than the cost for creating and
3660	* probing a new hash on the view */
3661	if (BATcheckhash(b)) {
3662	lslots = ((size_t *) b->thash->heap.base)[`5`];
3663	lhash = (BATcount(b) == BATcount(l) \|\|
3664	BATcount(b) / lslots * rcnt < lcnt + rcnt);
3665	}
3666	plhash = lhash;
3667	}
3668	} else if (BATtdense(sl) && BATcheckhash(l)) {
3669	lslots = ((size_t *) l->thash->heap.base)[`5`];
3670	lhash = BATcount(l) / lslots * rcnt < lcnt + rcnt;
3671	}
3672	if (sr == NULL) {
3673	rhash = BATcheckhash(r);
3674	if (rhash) {
3675	rslots = ((size_t *) r->thash->heap.base)[`5`];
3676	} else if ((parent = VIEWtparent(r)) != `0`) {
3677	BAT *b = BBPdescriptor(parent);
3678	/ use hash on parent if the average chain*
3679	* length times the number of required probes
3680	* is less than the cost for creating and
3681	* probing a new hash on the view */
3682	if (BATcheckhash(b)) {
3683	rslots = ((size_t *) b->thash->heap.base)[`5`];
3684	rhash = (BATcount(b) == BATcount(r) \|\|
3685	BATcount(b) / rslots * lcnt < lcnt + rcnt);
3686	}
3687	prhash = rhash;
3688	}
3689	} else if (BATtdense(sr) && BATcheckhash(r)) {
3690	rslots = ((size_t *) r->thash->heap.base)[`5`];
3691	rhash = BATcount(r) / rslots * rcnt < lcnt + rcnt;
3692	}
3693	if (lhash && rhash) {
3694	if (lcnt == lslots && rcnt == rslots) {
3695	/ both perfect hashes, smallest on right /
3696	swap = r2p && lcnt < rcnt;
3697	} else if (r2p && lcnt == lslots) {
3698	/ left is perfect (right isn't): swap /
3699	swap = true;
3700	} else if (rcnt != rslots) {
3701	/ neither is perfect, shortest chains on right /
3702	swap = r2p && lcnt / lslots < rcnt / rslots;
3703	} / else: right is perfect /
3704	reason = "both have hash";
3705	} else if (r2p && lhash) {
3706	/ only left has hash, swap /
3707	swap = true;
3708	reason = "left has hash";
3709	} else if (rhash) {
3710	/ only right has hash, don't swap /
3711	swap = false;
3712	reason = "right has hash";
3713	} else if (r2p &&
3714	(BATordered(l) \|\| BATordered_rev(l)) &&
3715	(BATtvoid(l) \|\| rcnt < `1024` \|\| MIN(lsize, rsize) > mem_size)) {
3716	/ only left is sorted, swap; but only if right is*
3717	* "large" and the smaller of the two isn't too large
3718	* (i.e. prefer hash over binary search, but only if
3719	* the hash table doesn't cause thrashing) */
3720	return mergejoin(r2p, r1p, r, l, sr, sl, &rci, &lci,
3721	nil_matches, false, false, false, false,
3722	estimate, t0, true, __func__);
3723	} else if ((BATordered(r) \|\| BATordered_rev(r)) &&
3724	(BATtvoid(r) \|\| lcnt < `1024` \|\| MIN(lsize, rsize) > mem_size)) {
3725	/ only right is sorted, don't swap; but only if left*
3726	* is "large" and the smaller of the two isn't too
3727	* large (i.e. prefer hash over binary search, but
3728	* only if the hash table doesn't cause thrashing) */
3729	return mergejoin(r1p, r2p, l, r, sl, sr, &lci, &rci,
3730	nil_matches, false, false, false, false,
3731	estimate, t0, false, __func__);
3732	} else if (r2p && !l->batTransient && r->batTransient) {
3733	/ l is persistent and r is not, create hash on l*
3734	* since it may be reused */
3735	swap = true;
3736	reason = "left is persistent";
3737	} else if (l->batTransient && !r->batTransient) {
3738	/ l is not persistent but r is, create hash on r*
3739	* since it may be reused */
3740	/ nothing /;
3741	reason = "right is persistent";
3742	} else if (r2p && lcnt < rcnt) {
3743	/ no hashes, not sorted, create hash on smallest BAT /
3744	swap = true;
3745	reason = "left is smaller";
3746	}
3747	if (swap) {
3748	assert(r2p);
3749	return hashjoin(r2p, r1p, r, l, sr, sl, &rci, &lci,
3750	nil_matches, false, false, false, false,
3751	estimate, t0, true, plhash, reason);
3752	} else {
3753	return hashjoin(r1p, r2p, l, r, sl, sr, &lci, &rci,
3754	nil_matches, false, false, false, false,
3755	estimate, t0, false, prhash, reason);
3756	}
3757	}
3758
3759	gdk_return
3760	BATbandjoin(BAT r1p, BAT r2p, BAT l, BAT r, BAT sl, BAT sr,
3761	const void c1, const* void *c2, bool li, bool hi, BUN estimate)
3762	{
3763	lng t0 = `0`;
3764
3765	ALGODEBUG t0 = GDKusec();
3766
3767	ALGODEBUG fprintf(stderr, "#BATbandjoin("
3768	"l=" ALGOBATFMT ",r=" ALGOBATFMT ","
3769	"sl=" ALGOOPTBATFMT ",sr=" ALGOOPTBATFMT ")\n",
3770	ALGOBATPAR(l), ALGOBATPAR(r),
3771	ALGOOPTBATPAR(sl), ALGOOPTBATPAR(sr));
3772
3773	*r1p = NULL;
3774	if (r2p) {
3775	*r2p = NULL;
3776	}
3777	if (joinparamcheck(l, r, NULL, sl, sr, "BATbandjoin") != GDK_SUCCEED)
3778	return GDK_FAIL;
3779	return bandjoin(r1p, r2p, l, r, sl, sr, c1, c2, li, hi, estimate, t0);
3780	}
3781
3782	gdk_return
3783	BATrangejoin(BAT r1p, BAT r2p, BAT l, BAT rl, BAT *rh,
3784	BAT sl, BAT sr, bool li, bool hi, bool anti, bool symmetric,
3785	BUN estimate)
3786	{
3787	struct canditer lci, rci;
3788	BAT r1, r2;
3789	BUN maxsize;
3790	lng t0 = `0`;
3791
3792	ALGODEBUG t0 = GDKusec();
3793	*r1p = NULL;
3794	if (r2p) {
3795	*r2p = NULL;
3796	}
3797	if (joinparamcheck(l, rl, rh, sl, sr, "BATrangejoin") != GDK_SUCCEED)
3798	return GDK_FAIL;
3799	if (canditer_init(&lci, l, sl) == `0` \|\|
3800	canditer_init(&rci, rl, sr) == `0` \|\|
3801	(l->ttype == TYPE_void && is_oid_nil(l->tseqbase)) \|\|
3802	((rl->ttype == TYPE_void && is_oid_nil(rl->tseqbase)) &&
3803	(rh->ttype == TYPE_void && is_oid_nil(rh->tseqbase)))) {
3804	/ trivial: empty input /
3805	return nomatch(r1p, r2p, l, rl, &lci, false, false,
3806	__func__, t0);
3807	}
3808	if (rl->ttype == TYPE_void && is_oid_nil(rl->tseqbase)) {
3809	if (!anti)
3810	return nomatch(r1p, r2p, l, rl, &lci, false, false,
3811	__func__, t0);
3812	return thetajoin(r1p, r2p, l, rh, sl, sr, MASK_GT, estimate, t0);
3813	}
3814	if (rh->ttype == TYPE_void && is_oid_nil(rh->tseqbase)) {
3815	if (!anti)
3816	return nomatch(r1p, r2p, l, rl, &lci, false, false,
3817	__func__, t0);
3818	return thetajoin(r1p, r2p, l, rl, sl, sr, MASK_LT, estimate, t0);
3819	}
3820
3821	if ((maxsize = joininitresults(&r1, r2p ? &r2 : NULL, sl ? BATcount(sl) : BATcount(l), sr ? BATcount(sr) : BATcount(rl), false, false, false, false, false, estimate)) == BUN_NONE)
3822	return GDK_FAIL;
3823	*r1p = r1;
3824	if (r2p) {
3825	*r2p = r2;
3826	}
3827	if (maxsize == `0`)
3828	return GDK_SUCCEED;
3829
3830	/ note, the rangejoin implementation is in gdk_select.c since*
3831	* it uses the imprints code there */
3832	return rangejoin(r1, r2, l, rl, rh, &lci, &rci, li, hi, anti, symmetric, maxsize);
3833	}
3834

Browse the source code of MonetDB/gdk/gdk_join.c