Merge branch 'master' of https://github.com/postgrespro/postgres_cluster

knizhnik · knizhnik · commit e195a0cb70da · 2016-04-19T18:13:07.000+03:00
diff --git a/contrib/mmts/README.md b/contrib/mmts/README.md
@@ -1,117 +1,53 @@
-# pg_dtm
-
-### Design
-
-This repo implements distributed transaction manager using Snapshot Sharing mechanism. General concepts and alternative approaches described in postgres wiki https://wiki.postgresql.org/wiki/DTM.
-
-Backend-DTM protocol description can be found in [dtmd/README](dtmd/README).
-
-### Installation
-
-* Patch postgres using xtm.patch. After that build and install postgres in usual way.
-```bash
-cd ~/code/postgres
-patch -p1 < ~/code/pg_dtm/xtm.patch
-```
-* Install pg_dtm extension.
-```bash
-export PATH=/path/to/pgsql/bin/:$PATH
-cd ~/code/pg_dtm
-make && make install
-```
-* Run dtmd.
-```bash
-cd ~/code/pg_dtm/dtmd
-make
-mkdir /tmp/clog
-./bin/dtmd &
-```
-* To run something meaningful you need at leat two postgres instances. Also pg_dtm requires presense in ```shared_preload_libraries```.
-```bash
-initdb -D ./install/data1
-initdb -D ./install/data2
-echo "port = 5433" >> ./install/data2/postgresql.conf
-echo "shared_preload_libraries = 'pg_dtm'" >> ./install/data1/postgresql.conf
-echo "shared_preload_libraries = 'pg_dtm'" >> ./install/data2/postgresql.conf
-pg_ctl -D ./install/data1 -l ./install/data1/log start
-pg_ctl -D ./install/data2 -l ./install/data2/log start
-```
-
-#### Automatic provisioning
-
-For a cluster-wide deploy we use ansible, more details in tests/deploy_layouts. (Ansible instructions will be later)
-
-### Usage
-
-Now cluster is running and you can use global tx between two nodes. Let's connect to postgres instances at different ports:
-
-```sql
-create extension pg_dtm; -- node1
-create table accounts(user_id int, amount int); -- node1
-insert into accounts (select 2*generate_series(1,100)-1, 0); -- node1, odd user_id's
-    create extension pg_dtm; -- node2
-    create table accounts(user_id int, amount int); -- node2
-    insert into accounts (select 2*generate_series(1,100), 0); -- node2, even user_id's
-select dtm_begin_transaction(); -- node1, returns global xid, e.g. 42
-	select dtm_join_transaction(42); -- node2, join global tx
-begin; -- node1
-	begin; -- node2
-update accounts set amount=amount-100 where user_id=1; -- node1, transfer money from user#1
-	update accounts set amount=amount+100 where user_id=2; -- node2, to user#2
-commit; -- node1, blocks until second commit happend
-	commit; -- node2
-```
-
-### Consistency testing
-
-To ensure consistency we use simple bank test: perform a lot of simultaneous transfers between accounts on different servers, while constantly checking total amount of money on all accounts. This test can be found in tests/perf.
-
-```bash
-> go run ./tests/perf/*
-  -C value
-    	Connection string (repeat for multiple connections)
-  -a int
-    	The number of bank accounts (default 100000)
-  -b string
-    	Backend to use. Possible optinos: transfers, fdw, pgshard, readers. (default "transfers")
-  -g	Use DTM to keep global consistency
-  -i	Init database
-  -l	Use 'repeatable read' isolation level instead of 'read committed'
-  -n int
-    	The number updates each writer (reader in case of Reades backend) performs (default 10000)
-  -p	Use parallel execs
-  -r int
-    	The number of readers (default 1)
-  -s int
-    	StartID. Script will update rows starting from this value
-  -v	Show progress and other stuff for mortals
-  -w int
-    	The number of writers (default 8)
-```
-
-So previous installation can be initialized with:
-```
-go run ./tests/perf/*.go  \
--C "dbname=postgres port=5432" \
--C "dbname=postgres port=5433" \
--g -i
-```
-and tested with:
-```
-go run ./tests/perf/*.go  \
--C "dbname=postgres port=5432" \
--C "dbname=postgres port=5433" \
--g
-```
-
-### Using with postres_fdw.
-
-We also provide a patch, that enables support of global transactions with postres_fdw. After patching and installing postres_fdw it is possible to run same test via fdw usig key ```-b fdw```.
-
-### Using with pg_shard
-
-Citus Data have branch in their pg_shard repo, that interacts with transaction manager. https://github.com/citusdata/pg_shard/tree/transaction_manager_integration
-To use this feature one should have following line in postgresql.conf (or set it via GUC)
-```
-pg_shard.use_dtm_transactions = 1
-```
+# Postgres Multimaster
+
+## Testing
+
+The testing process involves multiple modules that perform different tasks. The
+modules and their APIs are listed below.
+
+### Modules
+
+#### `combineaux`
+
+Governs the whole testing process. Runs different workloads during different
+troubles.
+
+#### `stresseaux`
+
+Puts workloads against the database. Writes logs that are later used by
+`valideaux`.
+
+* `start(id, workload, cluster)` - starts a `workload` against the `cluster`
+and calls it `id`.
+* `stop(id)` - stops a previously started workload called `id`.
+
+#### `starteaux`
+
+Manages the database nodes.
+
+* `deploy(driver, ...)` - deploys a cluster using the specified `driver` and
+other parameters specific to that driver. Returns a `cluster` instance that is
+used in other methods.
+* `cluster->up(id)` - adds a node named `id` to the `cluster`.
+* `cluster->down(id)` - removes a node named `id` from the `cluster`.
+* `cluster->drop(src, dst, ratio)` - drops `ratio` packets flowing from node
+`src` to node `dst`.
+* `cluster->delay(src, dst, msec)` - delays packets flowing from node `src` to
+node `dst` by `msec` milliseconds.
+
+#### `troubleaux`
+
+This is the troublemaker that messes with the network, nodes and time.
+
+* `cause(cluster, trouble, ...)` - causes the specified `trouble` in the
+specified `cluster` with some trouble-specific parameters.
+* `fix(cluster)` - fixes all troubles caused in the `cluster`.
+
+#### `valideaux`
+
+Validates the logs of stresseaux.
+
+#### `reporteaux`
+
+Generates reports on the test results. This is usually a table with
+`trouble` vs `workload` axes.
diff --git a/contrib/mmts/Testeaux.pm b/contrib/mmts/Testeaux.pm
@@ -0,0 +1,85 @@
+package Testeaux;
+
+package combineaux
+{
+	# Deploys an 'lxc' cluster, then for every (workload, trouble) pair starts
+	# the workload, causes the trouble, stops the workload and fixes the cluster.
+	sub combine
+	{
+		my ($workloads, $troubles) = @_;    # both are array references
+		my $cluster = starteaux->deploy('lxc');
+		my $id = 'hello';    # FIXME: generate proper id instead of 'hello'
+		for my $wl (@{$workloads})
+		{
+			for my $tr (@{$troubles})
+			{
+				print("run workload $wl during trouble $tr\n");
+				stresseaux::start($id, $wl, $cluster);
+				# FIXME: add a time gap here
+				troubleaux::cause($cluster, $tr);
+				# FIXME: add a time gap here
+				stresseaux::stop($id);
+				troubleaux::fix($cluster);
+			}
+		}
+	}
+}
+
+package stresseaux
+{
+	# start($id, $workload, $cluster): currently only prints the start notice.
+	sub start
+	{
+		my ($id, $workload, $cluster) = @_[0 .. 2];
+		print("start stress $id: workload $workload, cluster $cluster\n");    # fixme: implement
+	}
+
+	# stop($id): currently only prints the stop notice for workload $id.
+	sub stop
+	{
+		my ($id) = @_;
+		print("stop stress $id\n");    # FIXME: implement
+	}
+}
+
+package starteaux
+{
+	# Class method deploy($driver, @args): prints the deployment notice and
+	# returns a new cluster object; @args are accepted but not used yet.
+	sub deploy
+	{
+		my ($class, $driver, @args) = @_;
+		print("deploy cluster using driver $driver\n");    # fixme: implement
+		return bless {}, ref($class) || $class;    # invocant's class, so subclasses work
+	}
+
+	# up($id): currently only prints that node $id goes up.
+	sub up
+	{
+		my ($self, $id) = @_;
+		print("up node $id\n");    # FIXME: implement
+	}
+
+	# down($id): currently only prints that node $id goes down.
+	sub down
+	{
+		my ($self, $id) = @_;    # closing parenthesis was missing here (syntax error)
+		print("down node $id\n");    # FIXME: implement
+	}
+
+	# drop($src, $dst, $ratio): currently only prints the requested packet drop.
+	sub drop
+	{
+		my ($self, $src, $dst, $ratio) = @_;
+		print("drop $ratio packets from $src to $dst\n");    # FIXME: implement
+	}
+
+	# delay($src, $dst, $msec): currently only prints the requested packet delay.
+	sub delay
+	{
+		my ($self, $src, $dst, $msec) = @_;
+		print("delay packets from $src to $dst by $msec msec\n");    # FIXME: implement
+	}
+}
+
+1;