| 1 | /*------------------------------------------------------------------------- | 
|---|
| 2 | * | 
|---|
| 3 | * nodeSamplescan.c | 
|---|
| 4 | *	  Support routines for sample scans of relations (table sampling). | 
|---|
| 5 | * | 
|---|
| 6 | * Portions Copyright (c) 1996-2019, PostgreSQL Global Development Group | 
|---|
| 7 | * Portions Copyright (c) 1994, Regents of the University of California | 
|---|
| 8 | * | 
|---|
| 9 | * | 
|---|
| 10 | * IDENTIFICATION | 
|---|
| 11 | *	  src/backend/executor/nodeSamplescan.c | 
|---|
| 12 | * | 
|---|
| 13 | *------------------------------------------------------------------------- | 
|---|
| 14 | */ | 
|---|
| 15 | #include "postgres.h" | 
|---|
| 16 |  | 
|---|
| 17 | #include "access/relscan.h" | 
|---|
| 18 | #include "access/tableam.h" | 
|---|
| 19 | #include "access/tsmapi.h" | 
|---|
| 20 | #include "executor/executor.h" | 
|---|
| 21 | #include "executor/nodeSamplescan.h" | 
|---|
| 22 | #include "miscadmin.h" | 
|---|
| 23 | #include "pgstat.h" | 
|---|
| 24 | #include "storage/bufmgr.h" | 
|---|
| 25 | #include "storage/predicate.h" | 
|---|
| 26 | #include "utils/builtins.h" | 
|---|
| 27 | #include "utils/rel.h" | 
|---|
| 28 |  | 
|---|
| 29 | static TupleTableSlot *SampleNext(SampleScanState *node); | 
|---|
| 30 | static void tablesample_init(SampleScanState *scanstate); | 
|---|
| 31 | static TupleTableSlot *tablesample_getnext(SampleScanState *scanstate); | 
|---|
| 32 |  | 
|---|
| 33 | /* ---------------------------------------------------------------- | 
|---|
| 34 | *						Scan Support | 
|---|
| 35 | * ---------------------------------------------------------------- | 
|---|
| 36 | */ | 
|---|
| 37 |  | 
|---|
| 38 | /* ---------------------------------------------------------------- | 
|---|
| 39 | *		SampleNext | 
|---|
| 40 | * | 
|---|
| 41 | *		This is a workhorse for ExecSampleScan | 
|---|
| 42 | * ---------------------------------------------------------------- | 
|---|
| 43 | */ | 
|---|
| 44 | static TupleTableSlot * | 
|---|
| 45 | SampleNext(SampleScanState *node) | 
|---|
| 46 | { | 
|---|
| 47 | /* | 
|---|
| 48 | * if this is first call within a scan, initialize | 
|---|
| 49 | */ | 
|---|
| 50 | if (!node->begun) | 
|---|
| 51 | tablesample_init(node); | 
|---|
| 52 |  | 
|---|
| 53 | /* | 
|---|
| 54 | * get the next tuple, and store it in our result slot | 
|---|
| 55 | */ | 
|---|
| 56 | return tablesample_getnext(node); | 
|---|
| 57 | } | 
|---|
| 58 |  | 
|---|
| 59 | /* | 
|---|
| 60 | * SampleRecheck -- access method routine to recheck a tuple in EvalPlanQual | 
|---|
| 61 | */ | 
|---|
| 62 | static bool | 
|---|
| 63 | SampleRecheck(SampleScanState *node, TupleTableSlot *slot) | 
|---|
| 64 | { | 
|---|
| 65 | /* | 
|---|
| 66 | * No need to recheck for SampleScan, since like SeqScan we don't pass any | 
|---|
| 67 | * checkable keys to heap_beginscan. | 
|---|
| 68 | */ | 
|---|
| 69 | return true; | 
|---|
| 70 | } | 
|---|
| 71 |  | 
|---|
| 72 | /* ---------------------------------------------------------------- | 
|---|
| 73 | *		ExecSampleScan(node) | 
|---|
| 74 | * | 
|---|
| 75 | *		Scans the relation using the sampling method and returns | 
|---|
| 76 | *		the next qualifying tuple. | 
|---|
| 77 | *		We call the ExecScan() routine and pass it the appropriate | 
|---|
| 78 | *		access method functions. | 
|---|
| 79 | * ---------------------------------------------------------------- | 
|---|
| 80 | */ | 
|---|
| 81 | static TupleTableSlot * | 
|---|
| 82 | ExecSampleScan(PlanState *pstate) | 
|---|
| 83 | { | 
|---|
| 84 | SampleScanState *node = castNode(SampleScanState, pstate); | 
|---|
| 85 |  | 
|---|
| 86 | return ExecScan(&node->ss, | 
|---|
| 87 | (ExecScanAccessMtd) SampleNext, | 
|---|
| 88 | (ExecScanRecheckMtd) SampleRecheck); | 
|---|
| 89 | } | 
|---|
| 90 |  | 
|---|
| 91 | /* ---------------------------------------------------------------- | 
|---|
| 92 | *		ExecInitSampleScan | 
|---|
| 93 | * ---------------------------------------------------------------- | 
|---|
| 94 | */ | 
|---|
| 95 | SampleScanState * | 
|---|
| 96 | ExecInitSampleScan(SampleScan *node, EState *estate, int eflags) | 
|---|
| 97 | { | 
|---|
| 98 | SampleScanState *scanstate; | 
|---|
| 99 | TableSampleClause *tsc = node->tablesample; | 
|---|
| 100 | TsmRoutine *tsm; | 
|---|
| 101 |  | 
|---|
| 102 | Assert(outerPlan(node) == NULL); | 
|---|
| 103 | Assert(innerPlan(node) == NULL); | 
|---|
| 104 |  | 
|---|
| 105 | /* | 
|---|
| 106 | * create state structure | 
|---|
| 107 | */ | 
|---|
| 108 | scanstate = makeNode(SampleScanState); | 
|---|
| 109 | scanstate->ss.ps.plan = (Plan *) node; | 
|---|
| 110 | scanstate->ss.ps.state = estate; | 
|---|
| 111 | scanstate->ss.ps.ExecProcNode = ExecSampleScan; | 
|---|
| 112 |  | 
|---|
| 113 | /* | 
|---|
| 114 | * Miscellaneous initialization | 
|---|
| 115 | * | 
|---|
| 116 | * create expression context for node | 
|---|
| 117 | */ | 
|---|
| 118 | ExecAssignExprContext(estate, &scanstate->ss.ps); | 
|---|
| 119 |  | 
|---|
| 120 | /* | 
|---|
| 121 | * open the scan relation | 
|---|
| 122 | */ | 
|---|
| 123 | scanstate->ss.ss_currentRelation = | 
|---|
| 124 | ExecOpenScanRelation(estate, | 
|---|
| 125 | node->scan.scanrelid, | 
|---|
| 126 | eflags); | 
|---|
| 127 |  | 
|---|
| 128 | /* we won't set up the HeapScanDesc till later */ | 
|---|
| 129 | scanstate->ss.ss_currentScanDesc = NULL; | 
|---|
| 130 |  | 
|---|
| 131 | /* and create slot with appropriate rowtype */ | 
|---|
| 132 | ExecInitScanTupleSlot(estate, &scanstate->ss, | 
|---|
| 133 | RelationGetDescr(scanstate->ss.ss_currentRelation), | 
|---|
| 134 | table_slot_callbacks(scanstate->ss.ss_currentRelation)); | 
|---|
| 135 |  | 
|---|
| 136 | /* | 
|---|
| 137 | * Initialize result type and projection. | 
|---|
| 138 | */ | 
|---|
| 139 | ExecInitResultTypeTL(&scanstate->ss.ps); | 
|---|
| 140 | ExecAssignScanProjectionInfo(&scanstate->ss); | 
|---|
| 141 |  | 
|---|
| 142 | /* | 
|---|
| 143 | * initialize child expressions | 
|---|
| 144 | */ | 
|---|
| 145 | scanstate->ss.ps.qual = | 
|---|
| 146 | ExecInitQual(node->scan.plan.qual, (PlanState *) scanstate); | 
|---|
| 147 |  | 
|---|
| 148 | scanstate->args = ExecInitExprList(tsc->args, (PlanState *) scanstate); | 
|---|
| 149 | scanstate->repeatable = | 
|---|
| 150 | ExecInitExpr(tsc->repeatable, (PlanState *) scanstate); | 
|---|
| 151 |  | 
|---|
| 152 | /* | 
|---|
| 153 | * If we don't have a REPEATABLE clause, select a random seed.  We want to | 
|---|
| 154 | * do this just once, since the seed shouldn't change over rescans. | 
|---|
| 155 | */ | 
|---|
| 156 | if (tsc->repeatable == NULL) | 
|---|
| 157 | scanstate->seed = random(); | 
|---|
| 158 |  | 
|---|
| 159 | /* | 
|---|
| 160 | * Finally, initialize the TABLESAMPLE method handler. | 
|---|
| 161 | */ | 
|---|
| 162 | tsm = GetTsmRoutine(tsc->tsmhandler); | 
|---|
| 163 | scanstate->tsmroutine = tsm; | 
|---|
| 164 | scanstate->tsm_state = NULL; | 
|---|
| 165 |  | 
|---|
| 166 | if (tsm->InitSampleScan) | 
|---|
| 167 | tsm->InitSampleScan(scanstate, eflags); | 
|---|
| 168 |  | 
|---|
| 169 | /* We'll do BeginSampleScan later; we can't evaluate params yet */ | 
|---|
| 170 | scanstate->begun = false; | 
|---|
| 171 |  | 
|---|
| 172 | return scanstate; | 
|---|
| 173 | } | 
|---|
| 174 |  | 
|---|
| 175 | /* ---------------------------------------------------------------- | 
|---|
| 176 | *		ExecEndSampleScan | 
|---|
| 177 | * | 
|---|
| 178 | *		frees any storage allocated through C routines. | 
|---|
| 179 | * ---------------------------------------------------------------- | 
|---|
| 180 | */ | 
|---|
| 181 | void | 
|---|
| 182 | ExecEndSampleScan(SampleScanState *node) | 
|---|
| 183 | { | 
|---|
| 184 | /* | 
|---|
| 185 | * Tell sampling function that we finished the scan. | 
|---|
| 186 | */ | 
|---|
| 187 | if (node->tsmroutine->EndSampleScan) | 
|---|
| 188 | node->tsmroutine->EndSampleScan(node); | 
|---|
| 189 |  | 
|---|
| 190 | /* | 
|---|
| 191 | * Free the exprcontext | 
|---|
| 192 | */ | 
|---|
| 193 | ExecFreeExprContext(&node->ss.ps); | 
|---|
| 194 |  | 
|---|
| 195 | /* | 
|---|
| 196 | * clean out the tuple table | 
|---|
| 197 | */ | 
|---|
| 198 | if (node->ss.ps.ps_ResultTupleSlot) | 
|---|
| 199 | ExecClearTuple(node->ss.ps.ps_ResultTupleSlot); | 
|---|
| 200 | ExecClearTuple(node->ss.ss_ScanTupleSlot); | 
|---|
| 201 |  | 
|---|
| 202 | /* | 
|---|
| 203 | * close heap scan | 
|---|
| 204 | */ | 
|---|
| 205 | if (node->ss.ss_currentScanDesc) | 
|---|
| 206 | table_endscan(node->ss.ss_currentScanDesc); | 
|---|
| 207 | } | 
|---|
| 208 |  | 
|---|
| 209 | /* ---------------------------------------------------------------- | 
|---|
| 210 | *		ExecReScanSampleScan | 
|---|
| 211 | * | 
|---|
| 212 | *		Rescans the relation. | 
|---|
| 213 | * | 
|---|
| 214 | * ---------------------------------------------------------------- | 
|---|
| 215 | */ | 
|---|
| 216 | void | 
|---|
| 217 | ExecReScanSampleScan(SampleScanState *node) | 
|---|
| 218 | { | 
|---|
| 219 | /* Remember we need to do BeginSampleScan again (if we did it at all) */ | 
|---|
| 220 | node->begun = false; | 
|---|
| 221 | node->done = false; | 
|---|
| 222 | node->haveblock = false; | 
|---|
| 223 | node->donetuples = 0; | 
|---|
| 224 |  | 
|---|
| 225 | ExecScanReScan(&node->ss); | 
|---|
| 226 | } | 
|---|
| 227 |  | 
|---|
| 228 |  | 
|---|
| 229 | /* | 
|---|
| 230 | * Initialize the TABLESAMPLE method: evaluate params and call BeginSampleScan. | 
|---|
| 231 | */ | 
|---|
| 232 | static void | 
|---|
| 233 | tablesample_init(SampleScanState *scanstate) | 
|---|
| 234 | { | 
|---|
| 235 | TsmRoutine *tsm = scanstate->tsmroutine; | 
|---|
| 236 | ExprContext *econtext = scanstate->ss.ps.ps_ExprContext; | 
|---|
| 237 | Datum	   *params; | 
|---|
| 238 | Datum		datum; | 
|---|
| 239 | bool		isnull; | 
|---|
| 240 | uint32		seed; | 
|---|
| 241 | bool		allow_sync; | 
|---|
| 242 | int			i; | 
|---|
| 243 | ListCell   *arg; | 
|---|
| 244 |  | 
|---|
| 245 | scanstate->donetuples = 0; | 
|---|
| 246 | params = (Datum *) palloc(list_length(scanstate->args) * sizeof(Datum)); | 
|---|
| 247 |  | 
|---|
| 248 | i = 0; | 
|---|
| 249 | foreach(arg, scanstate->args) | 
|---|
| 250 | { | 
|---|
| 251 | ExprState  *argstate = (ExprState *) lfirst(arg); | 
|---|
| 252 |  | 
|---|
| 253 | params[i] = ExecEvalExprSwitchContext(argstate, | 
|---|
| 254 | econtext, | 
|---|
| 255 | &isnull); | 
|---|
| 256 | if (isnull) | 
|---|
| 257 | ereport(ERROR, | 
|---|
| 258 | (errcode(ERRCODE_INVALID_TABLESAMPLE_ARGUMENT), | 
|---|
| 259 | errmsg( "TABLESAMPLE parameter cannot be null"))); | 
|---|
| 260 | i++; | 
|---|
| 261 | } | 
|---|
| 262 |  | 
|---|
| 263 | if (scanstate->repeatable) | 
|---|
| 264 | { | 
|---|
| 265 | datum = ExecEvalExprSwitchContext(scanstate->repeatable, | 
|---|
| 266 | econtext, | 
|---|
| 267 | &isnull); | 
|---|
| 268 | if (isnull) | 
|---|
| 269 | ereport(ERROR, | 
|---|
| 270 | (errcode(ERRCODE_INVALID_TABLESAMPLE_REPEAT), | 
|---|
| 271 | errmsg( "TABLESAMPLE REPEATABLE parameter cannot be null"))); | 
|---|
| 272 |  | 
|---|
| 273 | /* | 
|---|
| 274 | * The REPEATABLE parameter has been coerced to float8 by the parser. | 
|---|
| 275 | * The reason for using float8 at the SQL level is that it will | 
|---|
| 276 | * produce unsurprising results both for users used to databases that | 
|---|
| 277 | * accept only integers in the REPEATABLE clause and for those who | 
|---|
| 278 | * might expect that REPEATABLE works like setseed() (a float in the | 
|---|
| 279 | * range from -1 to 1). | 
|---|
| 280 | * | 
|---|
| 281 | * We use hashfloat8() to convert the supplied value into a suitable | 
|---|
| 282 | * seed.  For regression-testing purposes, that has the convenient | 
|---|
| 283 | * property that REPEATABLE(0) gives a machine-independent result. | 
|---|
| 284 | */ | 
|---|
| 285 | seed = DatumGetUInt32(DirectFunctionCall1(hashfloat8, datum)); | 
|---|
| 286 | } | 
|---|
| 287 | else | 
|---|
| 288 | { | 
|---|
| 289 | /* Use the seed selected by ExecInitSampleScan */ | 
|---|
| 290 | seed = scanstate->seed; | 
|---|
| 291 | } | 
|---|
| 292 |  | 
|---|
| 293 | /* Set default values for params that BeginSampleScan can adjust */ | 
|---|
| 294 | scanstate->use_bulkread = true; | 
|---|
| 295 | scanstate->use_pagemode = true; | 
|---|
| 296 |  | 
|---|
| 297 | /* Let tablesample method do its thing */ | 
|---|
| 298 | tsm->BeginSampleScan(scanstate, | 
|---|
| 299 | params, | 
|---|
| 300 | list_length(scanstate->args), | 
|---|
| 301 | seed); | 
|---|
| 302 |  | 
|---|
| 303 | /* We'll use syncscan if there's no NextSampleBlock function */ | 
|---|
| 304 | allow_sync = (tsm->NextSampleBlock == NULL); | 
|---|
| 305 |  | 
|---|
| 306 | /* Now we can create or reset the HeapScanDesc */ | 
|---|
| 307 | if (scanstate->ss.ss_currentScanDesc == NULL) | 
|---|
| 308 | { | 
|---|
| 309 | scanstate->ss.ss_currentScanDesc = | 
|---|
| 310 | table_beginscan_sampling(scanstate->ss.ss_currentRelation, | 
|---|
| 311 | scanstate->ss.ps.state->es_snapshot, | 
|---|
| 312 | 0, NULL, | 
|---|
| 313 | scanstate->use_bulkread, | 
|---|
| 314 | allow_sync, | 
|---|
| 315 | scanstate->use_pagemode); | 
|---|
| 316 | } | 
|---|
| 317 | else | 
|---|
| 318 | { | 
|---|
| 319 | table_rescan_set_params(scanstate->ss.ss_currentScanDesc, NULL, | 
|---|
| 320 | scanstate->use_bulkread, | 
|---|
| 321 | allow_sync, | 
|---|
| 322 | scanstate->use_pagemode); | 
|---|
| 323 | } | 
|---|
| 324 |  | 
|---|
| 325 | pfree(params); | 
|---|
| 326 |  | 
|---|
| 327 | /* And we're initialized. */ | 
|---|
| 328 | scanstate->begun = true; | 
|---|
| 329 | } | 
|---|
| 330 |  | 
|---|
| 331 | /* | 
|---|
| 332 | * Get next tuple from TABLESAMPLE method. | 
|---|
| 333 | */ | 
|---|
| 334 | static TupleTableSlot * | 
|---|
| 335 | tablesample_getnext(SampleScanState *scanstate) | 
|---|
| 336 | { | 
|---|
| 337 | TableScanDesc scan = scanstate->ss.ss_currentScanDesc; | 
|---|
| 338 | TupleTableSlot *slot = scanstate->ss.ss_ScanTupleSlot; | 
|---|
| 339 |  | 
|---|
| 340 | ExecClearTuple(slot); | 
|---|
| 341 |  | 
|---|
| 342 | if (scanstate->done) | 
|---|
| 343 | return NULL; | 
|---|
| 344 |  | 
|---|
| 345 | for (;;) | 
|---|
| 346 | { | 
|---|
| 347 | if (!scanstate->haveblock) | 
|---|
| 348 | { | 
|---|
| 349 | if (!table_scan_sample_next_block(scan, scanstate)) | 
|---|
| 350 | { | 
|---|
| 351 | scanstate->haveblock = false; | 
|---|
| 352 | scanstate->done = true; | 
|---|
| 353 |  | 
|---|
| 354 | /* exhausted relation */ | 
|---|
| 355 | return NULL; | 
|---|
| 356 | } | 
|---|
| 357 |  | 
|---|
| 358 | scanstate->haveblock = true; | 
|---|
| 359 | } | 
|---|
| 360 |  | 
|---|
| 361 | if (!table_scan_sample_next_tuple(scan, scanstate, slot)) | 
|---|
| 362 | { | 
|---|
| 363 | /* | 
|---|
| 364 | * If we get here, it means we've exhausted the items on this page | 
|---|
| 365 | * and it's time to move to the next. | 
|---|
| 366 | */ | 
|---|
| 367 | scanstate->haveblock = false; | 
|---|
| 368 | continue; | 
|---|
| 369 | } | 
|---|
| 370 |  | 
|---|
| 371 | /* Found visible tuple, return it. */ | 
|---|
| 372 | break; | 
|---|
| 373 | } | 
|---|
| 374 |  | 
|---|
| 375 | scanstate->donetuples++; | 
|---|
| 376 |  | 
|---|
| 377 | return slot; | 
|---|
| 378 | } | 
|---|
| 379 |  | 
|---|