postgrespro
diff --git a/‎contrib/pg_pathman/.gitignore
Lines changed: 2 additions & 0 deletions b/‎contrib/pg_pathman/.gitignore
Lines changed: 2 additions & 0 deletions
diff --git a/‎contrib/pg_pathman/.travis.yml
Lines changed: 2 additions & 0 deletions b/‎contrib/pg_pathman/.travis.yml
Lines changed: 2 additions & 0 deletions
diff --git a/‎contrib/pg_pathman/Makefile
Lines changed: 15 additions & 8 deletions b/‎contrib/pg_pathman/Makefile
Lines changed: 15 additions & 8 deletions
diff --git a/‎contrib/pg_pathman/README.md
Lines changed: 121 additions & 50 deletions b/‎contrib/pg_pathman/README.md
Lines changed: 121 additions & 50 deletions
@@ -1,7 +1,9 @@
 .deps
+isolation_output
 results/pg_pathman.out
 regression.diffs
 regression.out
 *.o
 *.so
+*.pyc
 pg_pathman--*.sql
@@ -14,6 +14,8 @@ before_install:
   - sudo sh ./travis/apt.postgresql.org.sh
 
 env:
+  - PGVERSION=9.6 CHECK_CODE=true
+  - PGVERSION=9.6 CHECK_CODE=false
   - PGVERSION=9.5 CHECK_CODE=true
   - PGVERSION=9.5 CHECK_CODE=false
 
 
@@ -1,15 +1,22 @@
 # contrib/pg_pathman/Makefile
 
 MODULE_big = pg_pathman
-OBJS = src/init.o src/utils.o src/runtimeappend.o src/runtime_merge_append.o src/pg_pathman.o src/dsm_array.o \
-	src/rangeset.o src/pl_funcs.o src/worker.o src/hooks.o src/nodes_common.o $(WIN32RES)
+OBJS = src/init.o src/relation_info.o src/utils.o src/partition_filter.o \
+	src/runtimeappend.o src/runtime_merge_append.o src/pg_pathman.o src/rangeset.o \
+	src/pl_funcs.o src/pl_range_funcs.o src/pl_hash_funcs.o src/pathman_workers.o \
+	src/hooks.o src/nodes_common.o src/xact_handling.o src/copy_stmt_hooking.o \
+	src/pg_compat.o $(WIN32RES)
 
 EXTENSION = pg_pathman
-EXTVERSION = 0.1
+EXTVERSION = 1.0
 DATA_built = $(EXTENSION)--$(EXTVERSION).sql
 PGFILEDESC = "pg_pathman - partitioning tool"
 
-REGRESS = pg_pathman
+REGRESS = pathman_basic \
+		  pathman_runtime_nodes \
+		  pathman_callbacks \
+		  pathman_domains \
+		  pathman_foreign_keys
 EXTRA_REGRESS_OPTS=--temp-config=$(top_srcdir)/$(subdir)/conf.add
 EXTRA_CLEAN = $(EXTENSION)--$(EXTVERSION).sql ./isolation_output
 
@@ -27,14 +34,14 @@ endif
 $(EXTENSION)--$(EXTVERSION).sql: init.sql hash.sql range.sql
 	cat $^ > $@
 
-ISOLATIONCHECKS=insert_trigger rollback_on_create_partitions
+ISOLATIONCHECKS=insert_nodes for_update rollback_on_create_partitions
 
 submake-isolation:
 	$(MAKE) -C $(top_builddir)/src/test/isolation all
 
 isolationcheck: | submake-isolation
 	$(MKDIR_P) isolation_output
 	$(pg_isolation_regress_check) \
-	    --temp-config=$(top_srcdir)/$(subdir)/conf.add \
-	    --outputdir=./isolation_output \
-	    $(ISOLATIONCHECKS)
+		--temp-config=$(top_srcdir)/$(subdir)/conf.add \
+		--outputdir=./isolation_output \
+		$(ISOLATIONCHECKS)
@@ -1,9 +1,12 @@
 [![Build Status](https://travis-ci.org/postgrespro/pg_pathman.svg?branch=master)](https://travis-ci.org/postgrespro/pg_pathman)
+[![PGXN version](https://badge.fury.io/pg/pg_pathman.svg)](https://badge.fury.io/pg/pg_pathman)
 
 # pg_pathman
 
 The `pg_pathman` module provides optimized partitioning mechanism and functions to manage partitions.
 
+The extension is compatible with PostgreSQL 9.5 (9.6 support is coming soon).
+
 ## Overview
 **Partitioning** means splitting one large table into smaller pieces. Each row in such table is moved to a single partition according to the partitioning key. PostgreSQL supports partitioning via table inheritance: each partition must be created as a child table with CHECK CONSTRAINT. For example:
 
@@ -29,16 +32,15 @@ WHERE id = 150
 Based on the partitioning type and condition's operator, `pg_pathman` searches for the corresponding partitions and builds the plan. Currently `pg_pathman` supports two partitioning schemes:
 
 * **RANGE** - maps rows to partitions using partitioning key ranges assigned to each partition. Optimization is achieved by using the binary search algorithm;
-* **HASH** - maps rows to partitions using a generic hash function (only *integer* attributes are supported at the moment).
+* **HASH** - maps rows to partitions using a generic hash function.
 
 More interesting features are yet to come. Stay tuned!
 
 ## Roadmap
- * Replace INSERT triggers with a custom node (aka **PartitionFilter**)
- * Implement [concurrent partitioning](https://github.com/postgrespro/pg_pathman/tree/concurrent_part) (much more responsive)
- * Implement HASH partitioning for non-integer attributes
- * Optimize hash join (both tables are partitioned by join key)
- * Implement LIST partitioning scheme
+
+ * Provide a way to create user-defined partition creation/destruction callbacks (issue [#22](https://github.com/postgrespro/pg_pathman/issues/22));
+ * Implement LIST partitioning scheme;
+ * Optimize hash join (both tables are partitioned by join key).
 
 ## Installation guide
 To install `pg_pathman`, execute this in the module's directory:
@@ -62,77 +64,99 @@ Done! Now it's time to setup your partitioning schemes.
 
 ### Partition creation
 ```plpgsql
-create_hash_partitions(relation         TEXT,
+create_hash_partitions(relation         REGCLASS,
                        attribute        TEXT,
-                       partitions_count INTEGER)
+                       partitions_count INTEGER,
+                       partition_data   BOOLEAN DEFAULT true)
 ```
-Performs HASH partitioning for `relation` by integer key `attribute`. Creates `partitions_count` partitions and trigger on INSERT. All the data will be automatically copied from the parent to partitions.
+Performs HASH partitioning for `relation` by integer key `attribute`. The `partitions_count` parameter specifies the number of partitions to create; it cannot be changed afterwards. If `partition_data` is `true` then all the data will be automatically copied from the parent table to partitions. Note that data migration may take a while to finish and the table will be locked until the transaction commits. See `partition_table_concurrently()` for a lock-free way to migrate data.
+
+```plpgsql
+create_range_partitions(relation       REGCLASS,
+                        attribute      TEXT,
+                        start_value    ANYELEMENT,
+                        interval       ANYELEMENT,
+                        count          INTEGER DEFAULT NULL,
+                        partition_data BOOLEAN DEFAULT true)
+
+create_range_partitions(relation       REGCLASS,
+                        attribute      TEXT,
+                        start_value    ANYELEMENT,
+                        interval       INTERVAL,
+                        count          INTEGER DEFAULT NULL,
+                        partition_data BOOLEAN DEFAULT true)
+```
+Performs RANGE partitioning for `relation` by partitioning key `attribute`. `start_value` argument specifies initial value, `interval` sets the range of values in a single partition, `count` is the number of premade partitions (if not set then pathman tries to determine it based on attribute values).
 
 ```plpgsql
-create_range_partitions(relation    TEXT,
-                        attribute   TEXT,
-                        start_value ANYELEMENT,
-                        interval    ANYELEMENT,
-                        premake     INTEGER DEFAULT NULL)
+create_partitions_from_range(relation       REGCLASS,
+                             attribute      TEXT,
+                             start_value    ANYELEMENT,
+                             end_value      ANYELEMENT,
+                             interval       ANYELEMENT,
+                             partition_data BOOLEAN DEFAULT true)
 
-create_range_partitions(relation    TEXT,
-                        attribute   TEXT,
-                        start_value ANYELEMENT,
-                        interval    INTERVAL,
-                        premake     INTEGER DEFAULT NULL)
+create_partitions_from_range(relation       REGCLASS,
+                             attribute      TEXT,
+                             start_value    ANYELEMENT,
+                             end_value      ANYELEMENT,
+                             interval       INTERVAL,
+                             partition_data BOOLEAN DEFAULT true)
 ```
-Performs RANGE partitioning for `relation` by partitioning key `attribute`. `start_value` argument specifies initial value, `interval` sets the range of values in a single partition, `premake` is the number of premade partitions (if not set then pathman tries to determine it based on attribute values). All the data will be automatically copied from the parent to partitions.
+Performs RANGE-partitioning from specified range for `relation` by partitioning key `attribute`.
+
+### Data migration
 
 ```plpgsql
-create_partitions_from_range(relation    TEXT,
-                             attribute   TEXT,
-                             start_value ANYELEMENT,
-                             end_value   ANYELEMENT,
-                             interval    ANYELEMENT)
+partition_table_concurrently(relation REGCLASS)
+```
+Starts a background worker to move data from parent table to partitions. The worker utilizes short transactions to copy small batches of data (up to 10K rows per transaction) and thus doesn't significantly interfere with user's activity.
 
-create_partitions_from_range(relation    TEXT,
-                             attribute   TEXT,
-                             start_value ANYELEMENT,
-                             end_value   ANYELEMENT,
-                             interval    INTERVAL)
+```plpgsql
+stop_concurrent_part_task(relation REGCLASS)
 ```
-Performs RANGE-partitioning from specified range for `relation` by partitioning key `attribute`. Data will be copied to partitions as well.
+Stops a background worker performing a concurrent partitioning task. Note: the worker will exit after it finishes relocating the current batch.
 
 ### Triggers
 ```plpgsql
-create_hash_update_trigger(parent TEXT)
+create_hash_update_trigger(parent REGCLASS)
 ```
 Creates the trigger on UPDATE for HASH partitions. The UPDATE trigger isn't created by default because of the overhead. It's useful in cases when the key attribute might change.
 ```plpgsql
-create_range_update_trigger(parent TEXT)
+create_range_update_trigger(parent REGCLASS)
 ```
 Same as above, but for a RANGE-partitioned table.
 
 ### Post-creation partition management
 ```plpgsql
-split_range_partition(partition TEXT, value ANYELEMENT)
+split_range_partition(partition      REGCLASS,
+                      value          ANYELEMENT,
+                      partition_name TEXT DEFAULT NULL)
 ```
 Split RANGE `partition` in two by `value`.
 
 ```plpgsql
-merge_range_partitions(partition1 TEXT, partition2 TEXT)
+merge_range_partitions(partition1 REGCLASS, partition2 REGCLASS)
 ```
 Merge two adjacent RANGE partitions. First, data from `partition2` is copied to `partition1`, then `partition2` is removed.
 
 ```plpgsql
-append_range_partition(p_relation TEXT)
+append_range_partition(p_relation     REGCLASS,
+                       partition_name TEXT DEFAULT NULL)
 ```
-Append new RANGE partition.
+Append new RANGE partition with `pathman_config.range_interval` as interval.
 
 ```plpgsql
-prepend_range_partition(p_relation TEXT)
+prepend_range_partition(p_relation     REGCLASS,
+                        partition_name TEXT DEFAULT NULL)
 ```
-Prepend new RANGE partition.
+Prepend new RANGE partition with `pathman_config.range_interval` as interval.
 
 ```plpgsql
-add_range_partition(relation    TEXT,
-                    start_value ANYELEMENT,
-                    end_value   ANYELEMENT)
+add_range_partition(relation       REGCLASS,
+                    start_value    ANYELEMENT,
+                    end_value      ANYELEMENT,
+                    partition_name TEXT DEFAULT NULL)
 ```
 Create new RANGE partition for `relation` with specified range bounds.
 
@@ -142,28 +166,65 @@ drop_range_partition(partition TEXT)
 Drop RANGE partition and all its data.
 
 ```plpgsql
-attach_range_partition(relation    TEXT,
-                       partition   TEXT,
+attach_range_partition(relation    REGCLASS,
+                       partition   REGCLASS,
                        start_value ANYELEMENT,
                        end_value   ANYELEMENT)
 ```
 Attach partition to the existing RANGE-partitioned relation. The attached table must have exactly the same structure as the parent table, including the dropped columns.
 
 ```plpgsql
-detach_range_partition(partition TEXT)
+detach_range_partition(partition REGCLASS)
 ```
 Detach partition from the existing RANGE-partitioned relation.
 
 ```plpgsql
-disable_partitioning(relation TEXT)
+disable_pathman_for(relation TEXT)
 ```
 Permanently disable `pg_pathman` partitioning mechanism for the specified parent table and remove the insert trigger if it exists. All partitions and data remain unchanged.
 
+```plpgsql
+drop_partitions(parent      REGCLASS,
+                delete_data BOOLEAN DEFAULT FALSE)
+```
+Drop partitions of the `parent` table. If `delete_data` is `false` then the data is copied to the parent table first. Default is `false`.
+
+
+### Additional parameters
+
+```plpgsql
+enable_parent(relation  REGCLASS)
+disable_parent(relation REGCLASS)
+```
+Include/exclude parent table into/from query plan. In the original PostgreSQL planner the parent table is always included in the query plan even if it's empty, which can lead to additional overhead. You can use `disable_parent()` if you are never going to use the parent table as storage. The default value depends on the `partition_data` parameter that was specified during initial partitioning in the `create_range_partitions()` or `create_partitions_from_range()` functions. If the `partition_data` parameter was `true`, then all data has already been migrated to partitions and the parent table is disabled. Otherwise it is enabled.
+
+```plpgsql
+enable_auto(relation  REGCLASS)
+disable_auto(relation REGCLASS)
+```
+Enable/disable auto partition propagation (only for RANGE partitioning). It is enabled by default.
+
 ## Custom plan nodes
 `pg_pathman` provides a couple of [custom plan nodes](https://wiki.postgresql.org/wiki/CustomScanAPI) which aim to reduce execution time, namely:
 
 - `RuntimeAppend` (overrides `Append` plan node)
 - `RuntimeMergeAppend` (overrides `MergeAppend` plan node)
+- `PartitionFilter` (drop-in replacement for INSERT triggers)
+
+`PartitionFilter` acts as a *proxy node* for INSERT's child scan, which means it can redirect output tuples to the corresponding partition:
+
+```
+EXPLAIN (COSTS OFF)
+INSERT INTO partitioned_table
+SELECT generate_series(1, 10), random();
+               QUERY PLAN
+-----------------------------------------
+ Insert on partitioned_table
+   ->  Custom Scan (PartitionFilter)
+         ->  Subquery Scan on "*SELECT*"
+               ->  Result
+(4 rows)
+```
 
 `RuntimeAppend` and `RuntimeMergeAppend` have much in common: they come in handy in a case when WHERE condition takes form of:
 ```
@@ -290,6 +351,15 @@ SELECT tableoid::regclass AS partition, * FROM partitioned_table;
 
 - Though indices on a parent table aren't particularly useful (since it's empty), they act as prototypes for indices on partitions. For each index on the parent table, `pg_pathman` will create a similar index on every partition.
 
+- All running concurrent partitioning tasks can be listed using the `pathman_concurrent_part_tasks` view:
+```plpgsql
+SELECT * FROM pathman_concurrent_part_tasks;
+ userid | pid  | dbid  | relid | processed | status  
+--------+------+-------+-------+-----------+---------
+ dmitry | 7367 | 16384 | test  |    472000 | working
+(1 row)
+```
+
 ### HASH partitioning
 Consider an example of HASH partitioning. First create a table with some integer column:
 ```
@@ -419,17 +489,18 @@ There are several user-accessible [GUC](https://www.postgresql.org/docs/9.5/stat
  - `pg_pathman.enable` --- disable (or enable) `pg_pathman` completely
  - `pg_pathman.enable_runtimeappend` --- toggle `RuntimeAppend` custom node on\off
  - `pg_pathman.enable_runtimemergeappend` --- toggle `RuntimeMergeAppend` custom node on\off
+ - `pg_pathman.enable_partitionfilter` --- toggle `PartitionFilter` custom node on\off
 
 To **permanently** disable `pg_pathman` for some previously partitioned table, use the `disable_partitioning()` function:
 ```
-SELECT disable_partitioning('range_rel');
+SELECT disable_pathman_for('range_rel');
 ```
 All sections and data will remain unchanged and will be handled by the standard PostgreSQL inheritance mechanism.
 
 ##Feedback
 Do not hesitate to post your issues, questions and new ideas at the [issues](https://github.com/postgrespro/pg_pathman/issues) page.
 
 ## Authors
-Ildar Musin <i.musin@postgrespro.ru> Postgres Professional Ltd., Russia     
-Alexander Korotkov <a.korotkov@postgrespro.ru> Postgres Professional Ltd., Russia       
-Dmitry Ivanov <d.ivanov@postgrespro.ru> Postgres Professional Ltd., Russia      
+Ildar Musin <i.musin@postgrespro.ru> Postgres Professional Ltd., Russia		
+Alexander Korotkov <a.korotkov@postgrespro.ru> Postgres Professional Ltd., Russia		
+Dmitry Ivanov <d.ivanov@postgrespro.ru> Postgres Professional Ltd., Russia