mirror of
https://github.com/zebrajr/postgres.git
synced 2025-12-07 12:20:31 +01:00
Add a TABLESAMPLE clause to SELECT statements that allows the user to specify random BERNOULLI sampling or block-level SYSTEM sampling. The implementation allows extensible sampling functions to be written using a standard API. The basic version follows the SQL standard exactly. Usable concrete use cases for the sampling API follow in later commits. Petr Jelinek. Reviewed by Michael Paquier and Simon Riggs.
56 lines
1.7 KiB
C
56 lines
1.7 KiB
C
/*-------------------------------------------------------------------------
 *
 * sampling.h
 *	  definitions for sampling functions
 *
 * Portions Copyright (c) 1996-2014, PostgreSQL Global Development Group
 * Portions Copyright (c) 1994, Regents of the University of California
 *
 * src/include/utils/sampling.h
 *
 *-------------------------------------------------------------------------
 */
|
|
#ifndef SAMPLING_H
|
|
#define SAMPLING_H
|
|
|
|
#include "storage/bufmgr.h"
|
|
|
|
/* Random generator for sampling code */
|
|
/*
 * State of the random generator used by the sampling code: an array of
 * three unsigned shorts.
 *
 * Because this is an array type, a SamplerRandomState function argument
 * decays to a pointer to its first element.  The functions below therefore
 * operate on the caller's own state object even though no '*' appears in
 * their signatures.
 *
 * NOTE(review): three unsigned shorts is the shape of the state argument
 * taken by the erand48() family -- confirm against the implementation.
 */
typedef unsigned short SamplerRandomState[3];

/*
 * Set up randstate from the given seed.
 *
 * NOTE(review): how the seed is expanded into the three state words is not
 * visible in this header -- see the implementation.
 */
extern void sampler_random_init_state(long seed,
									  SamplerRandomState randstate);

/*
 * Produce the next random double from randstate.
 *
 * NOTE(review): the name suggests a fraction; the exact range (open or
 * closed at 0 and 1) is not visible here -- confirm before relying on it.
 */
extern double sampler_random_fract(SamplerRandomState randstate);
|
|
|
|
/* Block sampling methods */
|
|
/* Data structure for Algorithm S from Knuth 3.4.2 */
|
|
typedef struct
|
|
{
|
|
BlockNumber N; /* number of blocks, known in advance */
|
|
int n; /* desired sample size */
|
|
BlockNumber t; /* current block number */
|
|
int m; /* blocks selected so far */
|
|
SamplerRandomState randstate; /* random generator state */
|
|
} BlockSamplerData;
|
|
|
|
typedef BlockSamplerData *BlockSampler;
|
|
|
|
/*
 * Prepare the sampler state pointed to by bs.
 *
 * NOTE(review): presumably nblocks is the total number of blocks,
 * samplesize the desired number of sampled blocks, and randseed the seed
 * for the sampler's random generator -- confirm against the implementation.
 */
extern void BlockSampler_Init(BlockSampler bs, BlockNumber nblocks,
							  int samplesize, long randseed);

/*
 * Report whether the sampler has more blocks to hand out.
 *
 * NOTE(review): inferred from the name and bool return type; the exact
 * termination condition is not visible in this header.
 */
extern bool BlockSampler_HasMore(BlockSampler bs);

/*
 * Return a block number chosen by the sampler.
 *
 * NOTE(review): presumably must only be called while BlockSampler_HasMore()
 * is true -- confirm against the implementation.
 */
extern BlockNumber BlockSampler_Next(BlockSampler bs);
|
|
|
|
/* Reservoir sampling methods */
|
|
typedef struct
|
|
{
|
|
double W;
|
|
SamplerRandomState randstate; /* random generator state */
|
|
} ReservoirStateData;
|
|
|
|
typedef ReservoirStateData *ReservoirState;
|
|
|
|
/*
 * Initialize the reservoir sampling state pointed to by rs.
 *
 * NOTE(review): n is presumably the reservoir (sample) size -- confirm
 * against the implementation.
 */
extern void reservoir_init_selection_state(ReservoirState rs, int n);

/*
 * Compute the next "S" value for the reservoir sampler.
 *
 * NOTE(review): presumably t is the count of items seen so far, n the
 * reservoir size, and the result the number of items to skip before the
 * next one is taken -- none of this is visible in this header, so confirm
 * against the implementation.
 */
extern double reservoir_get_next_S(ReservoirState rs, double t, int n);
|
|
|
|
#endif /* SAMPLING_H */
|