add lib

yuuuxt · yuuuxt · commit f642a78691d8 · 2020-10-17T17:19:54.000+08:00
diff --git a/lib/sequential-uuids/.gitignore b/lib/sequential-uuids/.gitignore
@@ -0,0 +1,2 @@
+*.o
+*.so
diff --git a/lib/sequential-uuids/LICENSE b/lib/sequential-uuids/LICENSE
@@ -0,0 +1,21 @@
+MIT License
+
+Copyright (c) 2018 Tomas Vondra
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
diff --git a/lib/sequential-uuids/META.json b/lib/sequential-uuids/META.json
@@ -0,0 +1,35 @@
+{
+   "name": "sequential_uuids",
+   "abstract": "UUID generators with sequential patterns, which helps to reduce random I/O patterns associated with regular entirely-random UUID.",
+   "description": "Regular random UUIDs are distributed uniformly over the whole range of possible values. This results in poor locality when inserting data into indexes - all index leaf pages are equally likely to be hit, forcing the whole index into memory. With small indexes that's fine, but once the index size exceeds shared buffers (or RAM), the cache hit ratio quickly deteriorates. The main goal of the two generators implemented by this extension is generating UUIDs in a more sequential pattern, but without reducing the randomness too much (which could increase the probability of collision and predictability of the generated UUIDs). This idea is not new; it is commonly known as COMB (combined-time GUID).",
+   "version": "1.0.1",
+   "maintainer": "Tomas Vondra <tomas@pgaddict.com>",
+   "license": "bsd",
+   "prereqs": {
+      "runtime": {
+         "requires": {
+            "PostgreSQL": "10.0.0"
+         }
+      }
+   },
+   "provides": {
+     "sequential_uuids": {
+       "file": "sequential_uuids--1.0.1.sql",
+       "docfile" : "README.md",
+       "version": "1.0.1"
+     }
+   },
+   "resources": {
+      "repository": {
+        "url":  "https://github.com/tvondra/sequential-uuids.git",
+        "web":  "http://github.com/tvondra/sequential-uuids",
+        "type": "git"
+      }
+   },
+   "tags" : ["UUID", "generator"],
+   "meta-spec": {
+      "version": "1.0.0",
+      "url": "http://pgxn.org/meta/spec.txt"
+   },
+   "release_status" : "stable"
+}
diff --git a/lib/sequential-uuids/Makefile b/lib/sequential-uuids/Makefile
@@ -0,0 +1,19 @@
+# sequential_uuids/Makefile
+#
+# Copyright (c) 2014 Citus Data, Inc.
+#
+
+MODULE_big = sequential_uuids
+
+OBJS = sequential_uuids.o
+
+EXTENSION = sequential_uuids
+DATA = sequential_uuids--1.0.1.sql
+
+PG_CONFIG = pg_config
+PGXS := $(shell $(PG_CONFIG) --pgxs)
+include $(PGXS)
+
+ifndef MAJORVERSION
+    MAJORVERSION := $(basename $(VERSION))
+endif
diff --git a/lib/sequential-uuids/README.md b/lib/sequential-uuids/README.md
@@ -0,0 +1,105 @@
+Sequential UUID generators
+==========================
+
+This PostgreSQL extension implements two UUID generators with sequential
+patterns, which helps to reduce random I/O patterns associated with
+regular entirely-random UUID.
+
+Regular random UUIDs are distributed uniformly over the whole range of
+possible values.  This results in poor locality when inserting data into
+indexes - all index leaf pages are equally likely to be hit, forcing
+the whole index into memory.  With small indexes that's fine, but once
+the index size exceeds shared buffers (or RAM), the cache hit ratio
+quickly deteriorates.
+
+Compare this to sequences and timestamps, which have a more sequential
+pattern and the new data almost always end up in the right-most part of
+the index (new sequence value is larger than all preceding values, same
+for timestamp).  This results in a nicer and cache-friendlier behavior,
+but the values are predictable and may easily collide across machines.
+
+The main goal of the two generators implemented by this extension is
+generating UUIDs in a more sequential pattern, but without reducing the
+randomness too much (which could increase the probability of collision
+and predictability of the generated UUIDs).
+
+This idea is not new - it is pretty much what the UUID Wikipedia
+article [1] calls COMB (combined-time GUID), and it is more thoroughly
+explained in [2].
+
+
+Generators
+----------
+
+The extension provides two functions generating sequential UUIDs using
+either a sequence or timestamp.
+
+* `uuid_sequence_nextval(sequence regclass, block_size int default 65536, block_count int default 65536) RETURNS uuid`
+
+* `uuid_time_nextval(interval_length int default 60, interval_count int default 65536) RETURNS uuid`
+
+The default values for parameters are selected to work well for a range
+of workloads.  See the next section explaining the design for additional
+information about the meaning of those parameters.
+
+
+Design
+------
+
+The easiest way to make UUIDs more sequential is to use some sequential
+value as a prefix. For example, we might take a sequence or a timestamp
+and add random data until we have 16B in total.  The resulting values
+would be almost perfectly sequential, but there are two issues with it:
+
+* reduction of randomness - E.g. with a sequence producing bigint values
+  this would reduce the randomness from 16B to 8B.  Timestamps do reduce
+  the randomness in a similar way, depending on the accuracy.  This
+  increases both the collision probability and predictability (e.g. it
+  allows determining which UUIDs were generated close to each other, and
+  perhaps the exact timestamp).
+
+* bloat - If the values only grow, this may result in bloat in indexes
+  after deleting historical data.  This is a well-known issue e.g. with
+  indexes on timestamps in log tables.
+
+To address both of these issues, the implemented generators are designed
+to wrap around regularly, either after generating a certain number of UUIDs
+or after some amount of time.  In both cases, the UUIDs are generated in
+blocks and have the form of
+
+    (block ID; random data)
+
+The size of the block ID depends on the number of blocks and is fixed
+(depends on generator parameters).  For example with the default 64k
+blocks we need 2 bytes to store it.  The block ID increments regularly,
+and eventually wraps around.
+
+For sequence-based generators the block size is determined by number of
+UUIDs generated.  For example we may use blocks of 256 values, in which
+case the two-byte block ID may be computed like this:
+
+    (nextval('s') / 256) % 65536
+
+So the generator wraps-around every ~16M UUIDs (because 256 * 65536).
+
+For timestamp-based generators, the block size is defined as interval
+length, with the default value 60 seconds.  As the default number of
+blocks is 64k (same as for sequence-based generators), the block ID may
+be computed like this:
+
+    (timestamp / 60) % 65536
+
+Which means the generator wraps around every ~45 days.
+
+
+Supported Releases
+------------------
+
+Currently, this extension works only on releases since PostgreSQL 10. It
+can be made working on older releases with some minor code tweaks if
+someone wants to spend a bit of time on that.
+
+
+[1] https://en.wikipedia.org/wiki/Universally_unique_identifier
+
+[2] http://www.informit.com/articles/article.aspx?p=25862
diff --git a/lib/sequential-uuids/sequential_uuids--1.0--1.0.1.sql b/lib/sequential-uuids/sequential_uuids--1.0--1.0.1.sql
diff --git a/lib/sequential-uuids/sequential_uuids--1.0.1.sql b/lib/sequential-uuids/sequential_uuids--1.0.1.sql
@@ -0,0 +1,12 @@
+/* sequential_uuids.sql */
+
+-- complain if script is sourced in psql, rather than via CREATE EXTENSION
+\echo Use "CREATE EXTENSION sequential_uuids" to load this file. \quit
+
+CREATE FUNCTION uuid_sequence_nextval(regclass, block_size int default 65536, block_count int default 65536) RETURNS uuid
+AS 'MODULE_PATHNAME', 'uuid_sequence_nextval'
+LANGUAGE C STRICT PARALLEL UNSAFE; -- calls nextval(), which is not allowed during parallel operation
+
+CREATE FUNCTION uuid_time_nextval(interval_length int DEFAULT 60, interval_count int DEFAULT 65536)
+RETURNS uuid LANGUAGE C STRICT PARALLEL SAFE -- timestamp-based generator implemented in the C module
+AS 'MODULE_PATHNAME', 'uuid_time_nextval';
diff --git a/lib/sequential-uuids/sequential_uuids.c b/lib/sequential-uuids/sequential_uuids.c
@@ -0,0 +1,199 @@
+/*-------------------------------------------------------------------------
+ *
+ * sequential_uuids.c
+ *	  generators of sequential UUID values based on sequence/timestamp
+ *
+ *
+ * Currently, this only works on PostgreSQL 10. Adding support for older
+ * releases is possible, but it would require solving a couple issues:
+ *
+ * 1) pg_uuid_t hidden in uuid.c (can be solved by local struct definition)
+ *
+ * 2) pg_strong_random not available (can fallback to random, probably)
+ *
+ * 3) functions defined as PARALLEL SAFE, which fails on pre-9.6 releases
+ *
+ *-------------------------------------------------------------------------
+ */
+#include <sys/time.h>
+#include <sys/types.h>
+#include <unistd.h>
+
+#include "postgres.h"
+
+#include "catalog/namespace.h"
+#include "commands/sequence.h"
+#include "utils/uuid.h"
+
+PG_MODULE_MAGIC;
+
+PG_FUNCTION_INFO_V1(uuid_sequence_nextval);
+PG_FUNCTION_INFO_V1(uuid_time_nextval);
+
+/*
+ * uuid_sequence_nextval
+ *	generate sequential UUID using a sequence
+ *
+ * Arguments are the sequence (regclass), block_size and block_count; the
+ * result is a UUID made of a block-ID prefix followed by random bytes.
+ *
+ * The block_size (65536 by default) determines the number of UUIDs with
+ * the same prefix, and block_count (65536 by default) determines the
+ * number of blocks before wrapping around to 0 (in whole prefix bytes).
+ * With the default values, the generator wraps around every ~4B UUIDs.
+ *
+ * Both parameters must be positive (an error is raised otherwise). E.g.
+ * lowering the block size to 256 makes the cycle interval only 16M values.
+ */
+Datum
+uuid_sequence_nextval(PG_FUNCTION_ARGS)
+{
+	int				i;
+	int64			val;
+	Oid				relid = PG_GETARG_OID(0);
+	int32			block_size = PG_GETARG_INT32(1);
+	int32			block_count = PG_GETARG_INT32(2);
+	int				prefix_bytes;
+	pg_uuid_t	   *uuid;
+
+	/* sanity checks; zero is rejected too, block_size is a divisor below */
+	if (block_size < 1)
+		ereport(ERROR,
+				(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
+				 errmsg("block size must be a positive integer")));
+
+	if (block_count < 1)
+		ereport(ERROR,
+				(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
+				 errmsg("number of blocks must be a positive integer")));
+
+	/* count the number of bytes to keep from the sequence value */
+	prefix_bytes = 0;
+	while (block_count > 1)
+	{
+		block_count /= 256;
+		prefix_bytes++;
+	}
+
+	/*
+	 * Read the next value from the sequence and turn it into a block
+	 * number (all values within one block share the same prefix).
+	 */
+	val = nextval_internal(relid, true);
+	val /= block_size;
+
+	uuid = palloc(sizeof(pg_uuid_t));
+
+	/*
+	 * Copy the desired number of (least significant) bytes as prefix, most
+	 * significant byte first. Shifts are used instead of reading the bytes
+	 * of val through a pointer, so the result is the same on any byte order.
+	 */
+	for (i = 0; i < prefix_bytes; i++)
+		uuid->data[i] = (unsigned char) (((uint64) val) >> (8 * (prefix_bytes - 1 - i)));
+
+	/* generate the remaining bytes as random (use strong generator) */
+	if (!pg_strong_random(uuid->data + prefix_bytes, UUID_LEN - prefix_bytes))
+		ereport(ERROR,
+				(errcode(ERRCODE_INTERNAL_ERROR),
+				 errmsg("could not generate random values")));
+
+	/*
+	 * Set the UUID version flags according to "version 4" (pseudorandom)
+	 * UUID, see http://tools.ietf.org/html/rfc4122#section-4.4
+	 *
+	 * This does reduce the randomness a bit, because it determines the
+	 * value of certain bits, but that should be negligible (certainly
+	 * compared to the reduction due to prefix).
+	 *
+	 * UUID v4 is probably the safest choice here. There is v1 which is
+	 * time-based, but it includes MAC address (which we don't use) and
+	 * works with very special timestamp (starting at 1582 etc.). So we
+	 * just use v4 and claim this is pseudorandom.
+	 */
+	uuid->data[6] = (uuid->data[6] & 0x0f) | 0x40;	/* time_hi_and_version */
+	uuid->data[8] = (uuid->data[8] & 0x3f) | 0x80;	/* clock_seq_hi_and_reserved */
+
+	PG_RETURN_UUID_P(uuid);
+}
+
+/*
+ * uuid_time_nextval
+ *	generate sequential UUID using current time
+ *
+ * The timestamp-based sequential UUID generator defines the group size
+ * and group count based on data extracted from the current timestamp.
+ *
+ * The interval_length (60 seconds by default) is the number of seconds
+ * during which UUIDs share the same prefix. The prefix length follows
+ * from the number of intervals (65536 by default, i.e. 2 bytes). With the
+ * defaults the generator wraps around every ~45 days. Both must be >= 1.
+ */
+Datum
+uuid_time_nextval(PG_FUNCTION_ARGS)
+{
+	int				i;
+	struct timeval	tv;
+	int64			val;
+	pg_uuid_t	   *uuid;
+	int32			interval_length = PG_GETARG_INT32(0);
+	int32			interval_count = PG_GETARG_INT32(1);
+	int				prefix_bytes;
+
+	/* some basic sanity checks */
+	if (interval_length < 1)
+		ereport(ERROR,
+				(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
+				 errmsg("length of interval must be a positive integer")));
+
+	if (interval_count < 1)
+		ereport(ERROR,
+				(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
+				 errmsg("number of intervals must be a positive integer")));
+
+	if (gettimeofday(&tv, NULL) != 0)
+		elog(ERROR, "gettimeofday call failed");
+
+	val = (tv.tv_sec / interval_length);
+
+	/* count the number of bytes to keep from the timestamp */
+	prefix_bytes = 0;
+	while (interval_count > 1)
+	{
+		interval_count /= 256;
+		prefix_bytes++;
+	}
+
+	uuid = palloc(sizeof(pg_uuid_t));
+
+	/*
+	 * Copy the desired number of (least significant) bytes as prefix, most
+	 * significant first; shifts make this independent of host byte order.
+	 */
+	for (i = 0; i < prefix_bytes; i++)
+		uuid->data[i] = (unsigned char) (((uint64) val) >> (8 * (prefix_bytes - 1 - i)));
+
+	/* generate the remaining bytes as random (use strong generator) */
+	if (!pg_strong_random(uuid->data + prefix_bytes, UUID_LEN - prefix_bytes))
+		ereport(ERROR,
+				(errcode(ERRCODE_INTERNAL_ERROR),
+				 errmsg("could not generate random values")));
+
+	/*
+	 * Set the UUID version flags according to "version 4" (pseudorandom)
+	 * UUID, see http://tools.ietf.org/html/rfc4122#section-4.4
+	 *
+	 * This does reduce the randomness a bit, because it determines the
+	 * value of certain bits, but that should be negligible (certainly
+	 * compared to the reduction due to prefix).
+	 *
+	 * UUID v4 is probably the safest choice here. There is v1 which is
+	 * time-based, but it includes MAC address (which we don't use) and
+	 * works with very special timestamp (starting at 1582 etc.). So we
+	 * just use v4 and claim this is pseudorandom.
+	 */
+	uuid->data[6] = (uuid->data[6] & 0x0f) | 0x40;	/* time_hi_and_version */
+	uuid->data[8] = (uuid->data[8] & 0x3f) | 0x80;	/* clock_seq_hi_and_reserved */
+
+	PG_RETURN_UUID_P(uuid);
+}
diff --git a/lib/sequential-uuids/sequential_uuids.control b/lib/sequential-uuids/sequential_uuids.control