From a743d5e9e562e727c8f2a9df7e0949148d2f4984 Mon Sep 17 00:00:00 2001
From: Marina Polyakova <m.polyakova@postgrespro.ru>
Date: Fri, 6 Apr 2018 21:12:41 +0300
Subject: [PATCH v8] Pgbench errors and serialization/deadlock retries

Client's run is aborted only in case of a serious error, for example, the
connection with the backend was lost. Otherwise if the execution of SQL or meta
command fails, the client's run continues normally until the end of the current
script execution (it is assumed that one transaction script contains only one
transaction).

Transactions with serialization or deadlock failures are rolled back and
repeated until they complete successfully or reach the maximum number of tries
(specified by the --max-tries option) / the maximum time of tries (specified by
the --latency-limit option). These options can be combined together; but if
none of them are used, failed transactions are not retried at all. If the last
transaction run fails, this transaction will be reported as failed, and the
client variables will be set as they were before the first run of this
transaction.

If there're retries and/or errors their statistics are printed in the progress,
in the transaction / aggregation logs and in the end with other results (all and
for each script). A transaction error is reported here only if the last try of
this transaction fails. Also retries and/or errors are printed per-command with
average latencies if you use the appropriate benchmarking option
(--report-per-command, -r) and the total number of retries and/or errors is not
zero.

If a failed transaction block does not terminate in the current script, the
commands of the following scripts are processed as usual so you can get a lot of
errors of type "in failed SQL transaction" (when the current SQL transaction is
aborted and commands ignored until end of transaction block). In such cases you
can use separate statistics of these errors in all reports.

If you want to distinguish between failures or errors by type (including which
limit for retries was violated and how far it was exceeded for the
serialization/deadlock errors), use the pgbench debugging output created with
the option --debug and with the debugging level "fails" or "all". The first
variant is recommended for this purpose because with in the second case the
debugging output can be very large.
---
 doc/src/sgml/ref/pgbench.sgml                      |  321 ++-
 src/bin/pgbench/pgbench.c                          | 2100 +++++++++++++++-----
 src/bin/pgbench/t/001_pgbench_with_server.pl       |   41 +-
 src/bin/pgbench/t/002_pgbench_no_server.pl         |    4 +-
 .../t/003_serialization_and_deadlock_fails.pl      |  761 +++++++
 5 files changed, 2715 insertions(+), 512 deletions(-)
 create mode 100644 src/bin/pgbench/t/003_serialization_and_deadlock_fails.pl

diff --git a/doc/src/sgml/ref/pgbench.sgml b/doc/src/sgml/ref/pgbench.sgml
index 41d9030..2756703 100644
--- a/doc/src/sgml/ref/pgbench.sgml
+++ b/doc/src/sgml/ref/pgbench.sgml
@@ -55,16 +55,19 @@ number of clients: 10
 number of threads: 1
 number of transactions per client: 1000
 number of transactions actually processed: 10000/10000
+maximum number of tries: 1
 tps = 85.184871 (including connections establishing)
 tps = 85.296346 (excluding connections establishing)
 </screen>
 
-  The first six lines report some of the most important parameter
-  settings.  The next line reports the number of transactions completed
-  and intended (the latter being just the product of number of clients
+  The first six lines and the eighth line report some of the most important
+  parameter settings.  The seventh line reports the number of transactions
+  completed and intended (the latter being just the product of number of clients
   and number of transactions per client); these will be equal unless the run
-  failed before completion.  (In <option>-T</option> mode, only the actual
-  number of transactions is printed.)
+  failed before completion or some SQL/meta command(s) failed.  (In
+  <option>-T</option> mode, only the actual number of transactions is printed.)
+  (see <xref linkend="errors-and-retries" endterm="errors-and-retries-title"/>
+  for more information)
   The last two lines report the number of transactions per second,
   figured with and without counting the time to start database sessions.
  </para>
@@ -380,11 +383,28 @@ pgbench <optional> <replaceable>options</replaceable> </optional> <replaceable>d
      </varlistentry>
 
      <varlistentry>
-      <term><option>-d</option></term>
-      <term><option>--debug</option></term>
+      <term><option>-d</option> <replaceable>debug_level</replaceable></term>
+      <term><option>--debug=</option><replaceable>debug_level</replaceable></term>
       <listitem>
        <para>
-        Print debugging output.
+        Print debugging output. You can use the following debugging levels:
+          <itemizedlist>
+           <listitem>
+            <para><literal>no</literal>: no debugging output (except built-in
+            function <function>debug</function>, see <xref
+            linkend="pgbench-functions"/>).</para>
+           </listitem>
+           <listitem>
+            <para><literal>fails</literal>: print only failure messages, errors
+            and retries (see <xref linkend="errors-and-retries"
+            endterm="errors-and-retries-title"/> for more information).</para>
+           </listitem>
+           <listitem>
+            <para><literal>all</literal>: print all debugging output
+            (throttling, executed/sent/received commands etc.).</para>
+           </listitem>
+          </itemizedlist>
+        The default is no debugging output.
        </para>
       </listitem>
      </varlistentry>
@@ -453,6 +473,16 @@ pgbench <optional> <replaceable>options</replaceable> </optional> <replaceable>d
         at all. They are counted and reported separately as
         <firstterm>skipped</firstterm>.
        </para>
+       <para>
+        The transaction with serialization or deadlock failure can be retried if
+        the total time of all its tries is less than
+        <replaceable>limit</replaceable> ms. This option can be combined with
+        the option <option>--max-tries</option> which limits the total number of
+        transaction tries. But if none of them are used, failed transactions are
+        not retried at all. See
+        <xref linkend="errors-and-retries" endterm="errors-and-retries-title"/>
+        for more information about retrying failed transactions.
+       </para>
        </listitem>
      </varlistentry>
 
@@ -513,22 +543,38 @@ pgbench <optional> <replaceable>options</replaceable> </optional> <replaceable>d
         Show progress report every <replaceable>sec</replaceable> seconds.  The report
         includes the time since the beginning of the run, the tps since the
         last report, and the transaction latency average and standard
-        deviation since the last report.  Under throttling (<option>-R</option>),
-        the latency is computed with respect to the transaction scheduled
-        start time, not the actual transaction beginning time, thus it also
-        includes the average schedule lag time.
+        deviation since the last report.  If any transactions ended with a
+        failed SQL or meta command since the last report, they are also reported
+        as failed.  If any transactions ended with an error "in failed SQL
+        transaction block", they are reported separatly as <literal>in failed
+        tx</literal> (see <xref linkend="errors-and-retries"
+        endterm="errors-and-retries-title"/> for more information).  Under
+        throttling (<option>-R</option>), the latency is computed with respect
+        to the transaction scheduled start time, not the actual transaction
+        beginning time, thus it also includes the average schedule lag time.  If
+        any transactions have been rolled back and retried after a
+        serialization/deadlock failure since the last report, the report
+        includes the number of such transactions and the sum of all retries. Use
+        the options <option>--max-tries</option> and/or
+        <option>--latency-limit</option> to enable transactions retries after
+        serialization/deadlock failures.
        </para>
       </listitem>
      </varlistentry>
 
      <varlistentry>
       <term><option>-r</option></term>
-      <term><option>--report-latencies</option></term>
+      <term><option>--report-per-command</option></term>
       <listitem>
        <para>
-        Report the average per-statement latency (execution time from the
-        perspective of the client) of each command after the benchmark
-        finishes.  See below for details.
+        Report the following statistics for each command after the benchmark
+        finishes: the average per-statement latency (execution time from the
+        perspective of the client), the number of all errors, the number of
+        errors "in failed SQL transaction block", and the number of retries
+        after serialization or deadlock failures.  The report displays the
+        columns with statistics on errors and retries only if the current
+        <application>pgbench</application> run has an error of the corresponding
+        type or retry, respectively. See below for details.
        </para>
       </listitem>
      </varlistentry>
@@ -667,6 +713,21 @@ pgbench <optional> <replaceable>options</replaceable> </optional> <replaceable>d
      </varlistentry>
 
      <varlistentry>
+      <term><option>--max-tries=<replaceable>number_of_tries</replaceable></option></term>
+      <listitem>
+       <para>
+        Set the maximum number of tries for transactions with
+        serialization/deadlock failures. This option can be combined with the
+        option <option>--latency-limit</option> which limits the total time of
+        transaction tries. But if none of them are used, failed transactions are
+        not retried at all. See
+        <xref linkend="errors-and-retries" endterm="errors-and-retries-title"/>
+        for more information about retrying failed transactions.
+       </para>
+      </listitem>
+     </varlistentry>
+
+     <varlistentry>
       <term><option>--progress-timestamp</option></term>
       <listitem>
        <para>
@@ -807,8 +868,8 @@ pgbench <optional> <replaceable>options</replaceable> </optional> <replaceable>d
  <refsect1>
   <title>Notes</title>
 
- <refsect2>
-  <title>What is the <quote>Transaction</quote> Actually Performed in <application>pgbench</application>?</title>
+ <refsect2 id="transactions-and-scripts">
+  <title id="transactions-and-scripts-title">What is the <quote>Transaction</quote> Actually Performed in <application>pgbench</application>?</title>
 
   <para>
    <application>pgbench</application> executes test scripts chosen randomly
@@ -1583,7 +1644,7 @@ END;
    The format of the log is:
 
 <synopsis>
-<replaceable>client_id</replaceable> <replaceable>transaction_no</replaceable> <replaceable>time</replaceable> <replaceable>script_no</replaceable> <replaceable>time_epoch</replaceable> <replaceable>time_us</replaceable> <optional> <replaceable>schedule_lag</replaceable> </optional>
+<replaceable>client_id</replaceable> <replaceable>transaction_no</replaceable> <replaceable>time</replaceable> <replaceable>script_no</replaceable> <replaceable>time_epoch</replaceable> <replaceable>time_us</replaceable> <optional> <replaceable>schedule_lag</replaceable> </optional> <optional> <replaceable>retries</replaceable> </optional>
 </synopsis>
 
    where
@@ -1604,6 +1665,17 @@ END;
    When both <option>--rate</option> and <option>--latency-limit</option> are used,
    the <replaceable>time</replaceable> for a skipped transaction will be reported as
    <literal>skipped</literal>.
+   <replaceable>retries</replaceable> is the sum of all the retries after the
+   serialization or deadlock failures during the current script execution. It is
+   only present when the maximum number of tries for transactions is more than 1
+   (<option>--max-tries</option>) and/or the maximum time of tries for
+   transactions is used (<option>--latency-limit</option>). If the transaction
+   ended with an error "in failed SQL transaction", its
+   <replaceable>time</replaceable> will be reported as
+   <literal>in_failed_tx</literal>. If the transaction ended with other error,
+   its <replaceable>time</replaceable> will be reported as
+   <literal>failed</literal> (see <xref linkend="errors-and-retries"
+   endterm="errors-and-retries-title"/> for more information).
   </para>
 
   <para>
@@ -1633,6 +1705,24 @@ END;
   </para>
 
   <para>
+   The following example shows a snippet of a log file with errors and retries,
+   with the maximum number of tries set to 10 (note the additional
+   <replaceable>retries</replaceable> column):
+<screen>
+3 0 47423 0 1499414498 34501 4
+3 1 8333 0 1499414498 42848 1
+3 2 8358 0 1499414498 51219 1
+4 0 72345 0 1499414498 59433 7
+1 3 41718 0 1499414498 67879 5
+1 4 8416 0 1499414498 76311 1
+3 3 33235 0 1499414498 84469 4
+0 0 failed 0 1499414498 84905 10
+2 0 failed 0 1499414498 86248 10
+3 4 8307 0 1499414498 92788 1
+</screen>
+  </para>
+
+  <para>
    When running a long test on hardware that can handle a lot of transactions,
    the log files can become very large.  The <option>--sampling-rate</option> option
    can be used to log only a random sample of transactions.
@@ -1647,7 +1737,7 @@ END;
    format is used for the log files:
 
 <synopsis>
-<replaceable>interval_start</replaceable> <replaceable>num_transactions</replaceable> <replaceable>sum_latency</replaceable> <replaceable>sum_latency_2</replaceable> <replaceable>min_latency</replaceable> <replaceable>max_latency</replaceable> <optional> <replaceable>sum_lag</replaceable> <replaceable>sum_lag_2</replaceable> <replaceable>min_lag</replaceable> <replaceable>max_lag</replaceable> <optional> <replaceable>skipped</replaceable> </optional> </optional>
+<replaceable>interval_start</replaceable> <replaceable>num_transactions</replaceable> <replaceable>sum_latency</replaceable> <replaceable>sum_latency_2</replaceable> <replaceable>min_latency</replaceable> <replaceable>max_latency</replaceable> <replaceable>failed_tx</replaceable> <replaceable>in_failed_tx</replaceable> <optional> <replaceable>sum_lag</replaceable> <replaceable>sum_lag_2</replaceable> <replaceable>min_lag</replaceable> <replaceable>max_lag</replaceable> <optional> <replaceable>skipped</replaceable> </optional> </optional> <optional> <replaceable>retried_tx</replaceable> <replaceable>retries</replaceable> </optional>
 </synopsis>
 
    where
@@ -1661,7 +1751,13 @@ END;
    transaction latencies within the interval,
    <replaceable>min_latency</replaceable> is the minimum latency within the interval,
    and
-   <replaceable>max_latency</replaceable> is the maximum latency within the interval.
+   <replaceable>max_latency</replaceable> is the maximum latency within the interval,
+   <replaceable>failed_tx</replaceable> is the number of transactions that ended
+   with a failed SQL or meta command within the interval,
+   <replaceable>in_failed_tx</replaceable> is the number of transactions that
+   ended with an error "in failed SQL transaction block" (see
+   <xref linkend="errors-and-retries" endterm="errors-and-retries-title"/>
+   for more information).
    The next fields,
    <replaceable>sum_lag</replaceable>, <replaceable>sum_lag_2</replaceable>, <replaceable>min_lag</replaceable>,
    and <replaceable>max_lag</replaceable>, are only present if the <option>--rate</option>
@@ -1669,21 +1765,28 @@ END;
    They provide statistics about the time each transaction had to wait for the
    previous one to finish, i.e. the difference between each transaction's
    scheduled start time and the time it actually started.
-   The very last field, <replaceable>skipped</replaceable>,
+   The next field, <replaceable>skipped</replaceable>,
    is only present if the <option>--latency-limit</option> option is used, too.
    It counts the number of transactions skipped because they would have
    started too late.
+   The <replaceable>retried_tx</replaceable> and
+   <replaceable>retries</replaceable> fields are only present if the maximum
+   number of tries for transactions is more than 1
+   (<option>--max-tries</option>) and/or the maximum time of tries for
+   transactions is used (<option>--latency-limit</option>). They report the
+   number of retried transactions and the sum of all the retries after
+   serialization or deadlock failures within the interval.
    Each transaction is counted in the interval when it was committed.
   </para>
 
   <para>
    Here is some example output:
 <screen>
-1345828501 5601 1542744 483552416 61 2573
-1345828503 7884 1979812 565806736 60 1479
-1345828505 7208 1979422 567277552 59 1391
-1345828507 7685 1980268 569784714 60 1398
-1345828509 7073 1979779 573489941 236 1411
+1345828501 5601 1542744 483552416 61 2573 0 0
+1345828503 7884 1979812 565806736 60 1479 0 0
+1345828505 7208 1979422 567277552 59 1391 0 0
+1345828507 7685 1980268 569784714 60 1398 0 0
+1345828509 7073 1979779 573489941 236 1411 0 0
 </screen></para>
 
   <para>
@@ -1695,15 +1798,54 @@ END;
  </refsect2>
 
  <refsect2>
-  <title>Per-Statement Latencies</title>
+  <title>Per-Statement Report</title>
+
+  <para>
+   With the <option>-r</option> option, <application>pgbench</application>
+   collects the following statistics for each statement:
+   <itemizedlist>
+     <listitem>
+       <para>
+         <literal>latency</literal> &mdash; elapsed transaction time for each
+         statement. <application>pgbench</application> reports an average value
+         of all successful runs of the statement.
+       </para>
+     </listitem>
+     <listitem>
+       <para>
+         The number of errors in this statement. See
+         <xref linkend="errors-and-retries" endterm="errors-and-retries-title"/>
+         for more information.
+       </para>
+     </listitem>
+     <listitem>
+       <para>
+         The number of errors "in failed SQL transaction" in this statement. See
+         <xref linkend="errors-and-retries" endterm="errors-and-retries-title"/>
+         for more information.
+       </para>
+     </listitem>
+     <listitem>
+       <para>
+         The number of retries after a serialization or a deadlock failure in
+         this statement. See <xref linkend="errors-and-retries"
+         endterm="errors-and-retries-title"/> for more information.
+       </para>
+     </listitem>
+   </itemizedlist>
+  </para>
 
   <para>
-   With the <option>-r</option> option, <application>pgbench</application> collects
-   the elapsed transaction time of each statement executed by every
-   client.  It then reports an average of those values, referred to
-   as the latency for each statement, after the benchmark has finished.
+   The report displays the columns with statistics on errors and retries only if
+   the current <application>pgbench</application> run has an error or retry,
+   respectively.
   </para>
 
+   <para>
+   All values are computed for each statement executed by every client and are
+   reported after the benchmark has finished.
+   </para>
+
   <para>
    For the default script, the output will look similar to this:
 <screen>
@@ -1715,6 +1857,7 @@ number of clients: 10
 number of threads: 1
 number of transactions per client: 1000
 number of transactions actually processed: 10000/10000
+maximum number of tries: 1
 latency average = 15.844 ms
 latency stddev = 2.715 ms
 tps = 618.764555 (including connections establishing)
@@ -1732,10 +1875,50 @@ statement latencies in milliseconds:
         0.371  INSERT INTO pgbench_history (tid, bid, aid, delta, mtime) VALUES (:tid, :bid, :aid, :delta, CURRENT_TIMESTAMP);
         1.212  END;
 </screen>
+
+   Another example of output for the default script using serializable default
+   transaction isolation level (<command>PGOPTIONS='-c
+   default_transaction_isolation=serializable' pgbench ...</command>):
+<screen>
+starting vacuum...end.
+transaction type: &lt;builtin: TPC-B (sort of)&gt;
+scaling factor: 1
+query mode: simple
+number of clients: 10
+number of threads: 1
+number of transactions per client: 1000
+number of transactions actually processed: 4473/10000
+number of errors: 5527 (55.270%)
+number of retried: 7467 (74.670%)
+number of retries: 257244
+maximum number of tries: 100
+number of transactions above the 100.0 ms latency limit: 5766/10000 (57.660 %) (including errors)
+latency average = 41.169 ms
+latency stddev = 51.783 ms
+tps = 50.322494 (including connections establishing)
+tps = 50.324595 (excluding connections establishing)
+statement latencies in milliseconds, errors and retries:
+  0.004     0       0  \set aid random(1, 100000 * :scale)
+  0.000     0       0  \set bid random(1, 1 * :scale)
+  0.000     0       0  \set tid random(1, 10 * :scale)
+  0.000     0       0  \set delta random(-5000, 5000)
+  0.213     0       0  BEGIN;
+  0.393     0       0  UPDATE pgbench_accounts
+                       SET abalance = abalance + :delta WHERE aid = :aid;
+  0.332     0       0  SELECT abalance FROM pgbench_accounts WHERE aid = :aid;
+  0.409  4971  250265  UPDATE pgbench_tellers
+                       SET tbalance = tbalance + :delta WHERE tid = :tid;
+  0.311   556    6975  UPDATE pgbench_branches
+                       SET bbalance = bbalance + :delta WHERE bid = :bid;
+  0.299     0       0  INSERT INTO pgbench_history
+                              (tid, bid, aid, delta, mtime)
+                       VALUES (:tid, :bid, :aid, :delta, CURRENT_TIMESTAMP);
+  0.520     0       4  END;
+</screen>
   </para>
 
   <para>
-   If multiple script files are specified, the averages are reported
+   If multiple script files are specified, all statistics are reported
    separately for each script file.
   </para>
 
@@ -1749,6 +1932,78 @@ statement latencies in milliseconds:
   </para>
  </refsect2>
 
+ <refsect2 id="errors-and-retries">
+  <title id="errors-and-retries-title">Errors and Serialization/Deadlock Retries</title>
+
+  <para>
+   Client's run is aborted only in case of a serious error, for example, the
+   connection with the backend was lost. Otherwise if the execution of SQL or
+   meta command fails, the client's run continues normally until the end of the
+   current script execution (it is assumed that one transaction script contains
+   only one transaction; see <xref linkend="transactions-and-scripts"
+   endterm="transactions-and-scripts-title"/> for more information).
+   Transactions with serialization or deadlock failures are rolled back and
+   repeated until they complete successfully or reach the maximum number of
+   tries (specified by the <option>--max-tries</option> option) / the maximum
+   time of tries (specified by the <option>--latency-limit</option> option). If
+   the last transaction run fails, this transaction will be reported as failed,
+   and the client variables will be set as they were before the first run of
+   this transaction.
+  </para>
+
+  <note>
+   <para>
+    Be careful when repeating scripts that contain multiple transactions: the
+    script is always retried completely, so the successful transactions can be
+    performed several times.
+   </para>
+   <para>
+    Be careful when repeating transactions with shell commands. Unlike the
+    results of SQL commands, the results of shell commands are not rolled back,
+    except for the variable value of the <command>\setshell</command> command.
+   </para>
+   <para>
+    If a failed transaction block does not terminate in the current script, the
+    commands of the following scripts are processed as usual so you can get a
+    lot of errors of type "in failed SQL transaction" (when the current SQL
+    transaction is aborted and commands ignored until end of transaction block).
+    In such cases you can use separate statistics of these errors in all
+    reports.
+   </para>
+  </note>
+
+  <para>
+   The latency of a successful transaction includes the entire time of
+   transaction execution with rollbacks and retries. The latency for failed
+   transactions and commands is not computed separately.
+  </para>
+
+  <para>
+   The main report contains the number of failed transactions if it is non-zero.
+   If the total number of transactions ended with an error "in failed SQL
+   transaction block" is non-zero, the main report also contains it. If the
+   total number of retried transactions is non-zero, the main report also
+   contains the statistics related to retries: the total number of retried
+   transactions and total number of retries (use the options
+   <option>--max-tries</option> and/or <option>--latency-limit</option> to make
+   it possible). The per-statement report inherits all columns from the main
+   report. Note that if a failure/error occurs, the following failures/errors in
+   the current script execution are not shown in the reports. The retry is only
+   reported for the first command where the failure occured during the current
+   script execution.
+  </para>
+
+  <para>
+   If you want to distinguish between failures or errors by type (including
+   which limit for retries was violated and how far it was exceeded for the
+   serialization/deadlock errors), use the <application>pgbench</application>
+   debugging output created with the option <option>--debug</option> and with
+   the debugging level <literal>fails</literal> or <literal>all</literal>. The
+   first variant is recommended for this purpose because with in the second case
+   the debugging output can be very large.
+  </para>
+ </refsect2>
+
  <refsect2>
   <title>Good Practices</title>
 
diff --git a/src/bin/pgbench/pgbench.c b/src/bin/pgbench/pgbench.c
index fd18568..8073421 100644
--- a/src/bin/pgbench/pgbench.c
+++ b/src/bin/pgbench/pgbench.c
@@ -59,6 +59,9 @@
 
 #include "pgbench.h"
 
+#define ERRCODE_IN_FAILED_SQL_TRANSACTION  "25P02"
+#define ERRCODE_T_R_SERIALIZATION_FAILURE  "40001"
+#define ERRCODE_T_R_DEADLOCK_DETECTED  "40P01"
 #define ERRCODE_UNDEFINED_TABLE  "42P01"
 
 /*
@@ -186,9 +189,25 @@ bool		progress_timestamp = false; /* progress report with Unix time */
 int			nclients = 1;		/* number of clients */
 int			nthreads = 1;		/* number of threads */
 bool		is_connect;			/* establish connection for each transaction */
-bool		is_latencies;		/* report per-command latencies */
+bool		report_per_command = false;	/* report per-command latencies, retries
+										 * after the failures and errors
+										 * (failures without retrying) */
 int			main_pid;			/* main process id used in log filename */
 
+/*
+ * There're different types of restrictions for deciding that the current failed
+ * transaction can no longer be retried and should be reported as failed:
+ * - max_tries can be used to limit the number of tries;
+ * - latency_limit can be used to limit the total time of tries.
+ *
+ * They can be combined together, and you need to use at least one of them to
+ * retry the failed transactions. By default, failed transactions are not
+ * retried at all.
+ */
+uint32		max_tries = 0;		/* we cannot retry a failed transaction if its
+								 * number of tries reaches this maximum; if its
+								 * value is zero, it is not used */
+
 char	   *pghost = "";
 char	   *pgport = "";
 char	   *login = NULL;
@@ -242,14 +261,74 @@ typedef struct SimpleStats
 typedef struct StatsData
 {
 	time_t		start_time;		/* interval start time, for aggregates */
-	int64		cnt;			/* number of transactions, including skipped */
+	int64		cnt;			/* number of sucessfull transactions, including
+								 * skipped */
 	int64		skipped;		/* number of transactions skipped under --rate
 								 * and --latency-limit */
+	int64		retries;
+	int64		retried;		/* number of transactions that were retried
+								 * after a serialization or a deadlock
+								 * failure */
+	int64		errors;			/* number of transactions that were not retried
+								 * after a serialization or a deadlock
+								 * failure or had another error (including meta
+								 * commands errors) */
+	int64		errors_in_failed_tx;	/* number of transactions that failed in
+										 * a error
+										 * ERRCODE_IN_FAILED_SQL_TRANSACTION */
 	SimpleStats latency;
 	SimpleStats lag;
 } StatsData;
 
 /*
+ * Data structure for client variables.
+ */
+typedef struct Variables
+{
+	Variable   *array;			/* array of variable definitions */
+	int			nvariables;		/* number of variables */
+	bool		vars_sorted;	/* are variables sorted by name? */
+} Variables;
+
+/*
+ * Data structure for thread/client random seed.
+ */
+typedef struct RandomState
+{
+	unsigned short data[3];
+} RandomState;
+
+/*
+ * Data structure for repeating a transaction from the beginnning with the same
+ * parameters.
+ */
+typedef struct RetryState
+{
+	RandomState random_state;	/* random seed */
+	Variables   variables;		/* client variables */
+} RetryState;
+
+/*
+ * For the failures during script execution.
+ */
+typedef enum FailureStatus
+{
+	NO_FAILURE = 0,
+	ANOTHER_FAILURE,			/* other failures that are not listed by
+								 * themselves below */
+	SERIALIZATION_FAILURE,
+	DEADLOCK_FAILURE,
+	IN_FAILED_SQL_TRANSACTION
+} FailureStatus;
+
+typedef struct Failure
+{
+	FailureStatus status;		/* type of the failure */
+	int			command;		/* command number in script where the failure
+								 * occurred */
+} Failure;
+
+/*
  * Connection state machine states.
  */
 typedef enum
@@ -304,6 +383,22 @@ typedef enum
 	CSTATE_END_COMMAND,
 
 	/*
+	 * States for transactions with serialization or deadlock failures.
+	 *
+	 * First, remember the failure in CSTATE_FAILURE. Then process other
+	 * commands of the failed transaction if any and go to CSTATE_RETRY. If we
+	 * can re-execute the transaction from the very beginning, report this as a
+	 * failure, set the same parameters for the transaction execution as in the
+	 * previous tries and process the first transaction command in
+	 * CSTATE_START_COMMAND. Otherwise, report this as an error, set the
+	 * parameters for the transaction execution as they were before the first
+	 * run of this transaction (except for a random state) and go to
+	 * CSTATE_END_TX to complete this transaction.
+	 */
+	CSTATE_FAILURE,
+	CSTATE_RETRY,
+
+	/*
 	 * CSTATE_END_TX performs end-of-transaction processing.  Calculates
 	 * latency, and logs the transaction.  In --connect mode, closes the
 	 * current connection.  Chooses the next script to execute and starts over
@@ -329,14 +424,13 @@ typedef struct
 	int			id;				/* client No. */
 	ConnectionStateEnum state;	/* state machine's current state. */
 	ConditionalStack cstack;	/* enclosing conditionals state */
+	RandomState random_state;	/* separate randomness for each client */
 
 	int			use_file;		/* index in sql_script for this client */
 	int			command;		/* command number in script */
 
 	/* client variables */
-	Variable   *variables;		/* array of variable definitions */
-	int			nvariables;		/* number of variables */
-	bool		vars_sorted;	/* are variables sorted by name? */
+	Variables   variables;
 
 	/* various times about current transaction */
 	int64		txn_scheduled;	/* scheduled start time of transaction (usec) */
@@ -346,6 +440,18 @@ typedef struct
 
 	bool		prepared[MAX_SCRIPTS];	/* whether client prepared the script */
 
+	/*
+	 * For processing errors and repeating transactions with serialization or
+	 * deadlock failures:
+	 */
+	Failure		first_failure;	/* status and command number of the first
+								 * failure in the current transaction execution;
+								 * status NO_FAILURE if there were no failures
+								 * or errors */
+	RetryState  retry_state;
+	uint32			retries;	/* how many times have we already retried the
+								 * current transaction? */
+
 	/* per client collected stats */
 	int64		cnt;			/* client transaction count, for -t */
 	int			ecnt;			/* error count */
@@ -380,6 +486,42 @@ typedef struct
 	ZipfCell	cells[ZIPF_CACHE_SIZE];
 } ZipfCache;
 
+typedef enum ErrorLevel
+{
+	/*
+	 * To report throttling, executed/sent/received commands etc.
+	 */
+	ELEVEL_DEBUG,
+
+	/*
+	 * Normal failure of the SQL/meta command, or processing of the failed
+	 * transaction (its end/retry).
+	 */
+	ELEVEL_CLIENT_FAIL,
+
+	/*
+	 * Something serious e.g. connection with the backend was lost.. therefore
+	 * abort the client.
+	 */
+	ELEVEL_CLIENT_ABORTED,
+
+	/*
+	 * To report the error/log messages of the main program and/or
+	 * PGBENCH_DEBUG.
+	 */
+	ELEVEL_MAIN,
+} ErrorLevel;
+
+/*
+ * Error state for error messages or other logging messages.
+ */
+typedef struct ErrorState
+{
+	bool		in_process;		/* are we processing the error now? */
+	char		message[2048];
+	int			message_length;
+} ErrorState;
+
 /*
  * Thread state
  */
@@ -389,17 +531,20 @@ typedef struct
 	pthread_t	thread;			/* thread handle */
 	CState	   *state;			/* array of CState */
 	int			nstate;			/* length of state[] */
-	unsigned short random_state[3]; /* separate randomness for each thread */
+	RandomState random_state; 	/* separate randomness for each thread */
 	int64		throttle_trigger;	/* previous/next throttling (us) */
 	FILE	   *logfile;		/* where to log, or NULL */
 	ZipfCache	zipf_cache;		/* for thread-safe  zipfian random number
 								 * generation */
+	ErrorState  error_state;	/* for thread-safe error messages or other
+								 * logging messages */
 
 	/* per thread collected stats */
 	instr_time	start_time;		/* thread start time */
 	instr_time	conn_time;
 	StatsData	stats;
-	int64		latency_late;	/* executed but late transactions */
+	int64		latency_late;	/* executed but late transactions (including
+								 * errors) */
 } TState;
 
 #define INVALID_THREAD		((pthread_t) 0)
@@ -445,6 +590,10 @@ typedef struct
 	char	   *argv[MAX_ARGS]; /* command word list */
 	PgBenchExpr *expr;			/* parsed expression, if needed */
 	SimpleStats stats;			/* time spent in this command */
+	int64		retries;
+	int64		errors;			/* number of failures that were not retried */
+	int64		errors_in_failed_tx;	/* number of errors
+										 * ERRCODE_IN_FAILED_SQL_TRANSACTION */
 } Command;
 
 typedef struct ParsedScript
@@ -460,7 +609,18 @@ static int	num_scripts;		/* number of scripts in sql_script[] */
 static int	num_commands = 0;	/* total number of Command structs */
 static int64 total_weight = 0;
 
-static int	debug = 0;			/* debug flag */
+typedef enum DebugLevel
+{
+	NO_DEBUG = 0,				/* no debugging output (except PGBENCH_DEBUG) */
+	DEBUG_FAILS,				/* print only failure messages, errors and
+								 * retries */
+	DEBUG_ALL,					/* print all debugging output (throttling,
+								 * executed/sent/received commands etc.) */
+	NUM_DEBUGLEVEL
+} DebugLevel;
+
+static DebugLevel debug_level = NO_DEBUG;	/* debug flag */
+static const char *DEBUGLEVEL[] = {"no", "fails", "all"};
 
 /* Builtin test scripts */
 typedef struct BuiltinScript
@@ -508,8 +668,14 @@ static const BuiltinScript builtin_script[] =
 	}
 };
 
+/*
+ * To handle error messages or other logging messages outside threads.
+ */
+static ErrorState main_error_state;
+
 
 /* Function prototypes */
+static int64 strtoint64_thread(TState *thread, const char *str);
 static void setNullValue(PgBenchValue *pv);
 static void setBoolValue(PgBenchValue *pv, bool bval);
 static void setIntValue(PgBenchValue *pv, int64 ival);
@@ -525,6 +691,42 @@ static void *threadRun(void *arg);
 static void setalarm(int seconds);
 static void finishCon(CState *st);
 
+/*
+ * To report error messages or other log messages, you can use the following
+ * constructs:
+ *
+ * elog(thread, ELEVEL_CLIENT_FAIL,
+ *      "too many function arguments, maximum is %d\n", MAX_FARGS);
+ *
+ * Or:
+ *
+ * if (errstart(thread, ELEVEL_CLIENT_FAIL))
+ * {
+ *     errmsg(thread,
+ *            "too many function arguments, maximum is %d\n", MAX_FARGS);
+ *     ... other errmsg() calls if needed ...
+ *     errfinish(thread);
+ * }
+ *
+ * In fact, the function elog() calls the functions errstart(), errmsg() and
+ * errfinish() in the same way, so it is just wrapper for more comfortable use.
+ *
+ * Pass the thread as not NULL for client commands and as NULL otherwise. In the
+ * first case the error state of the thread will be used to store the entire
+ * error message during the invokations of the function errmsg(). And the
+ * message will be printed to stderr in function errfinish() (it is assumed that
+ * it is not empty).
+ * Otherwise the main error state will be used for the same purposes.
+ */
+static void errmsg_internal(TState *thread, const char *fmt,
+							va_list *args) pg_attribute_printf(2, 0);
+static void elog(TState *thread, ErrorLevel error_level,
+				 const char *fmt,...) pg_attribute_printf(3, 4);
+static bool errstart(TState *thread, ErrorLevel error_level);
+static void errmsg(TState *thread,
+				   const char *fmt,...) pg_attribute_printf(2, 3);
+static void errfinish(TState *thread);
+
 
 /* callback functions for our flex lexer */
 static const PsqlScanCallbacks pgbench_callbacks = {
@@ -572,7 +774,7 @@ usage(void)
 		   "                           protocol for submitting queries (default: simple)\n"
 		   "  -n, --no-vacuum          do not run VACUUM before tests\n"
 		   "  -P, --progress=NUM       show thread progress report every NUM seconds\n"
-		   "  -r, --report-latencies   report average latency per command\n"
+		   "  -r, --report-per-command report latencies, errors and retries per command\n"
 		   "  -R, --rate=NUM           target rate in transactions per second\n"
 		   "  -s, --scale=NUM          report this scale factor in output\n"
 		   "  -t, --transactions=NUM   number of transactions each client runs (default: 10)\n"
@@ -581,11 +783,12 @@ usage(void)
 		   "  --aggregate-interval=NUM aggregate data over NUM seconds\n"
 		   "  --log-prefix=PREFIX      prefix for transaction time log file\n"
 		   "                           (default: \"pgbench_log\")\n"
+		   "  --max-tries=NUM          max number of tries to run transaction\n"
 		   "  --progress-timestamp     use Unix epoch timestamps for progress\n"
 		   "  --random-seed=SEED       set random seed (\"time\", \"rand\", integer)\n"
 		   "  --sampling-rate=NUM      fraction of transactions to log (e.g., 0.01 for 1%%)\n"
 		   "\nCommon options:\n"
-		   "  -d, --debug              print debugging output\n"
+		   "  -d, --debug=no|fails|all print debugging output (default: no)\n"
 		   "  -h, --host=HOSTNAME      database server host or socket directory\n"
 		   "  -p, --port=PORT          database server port number\n"
 		   "  -U, --username=USERNAME  connect as specified database user\n"
@@ -632,6 +835,12 @@ is_an_int(const char *str)
 int64
 strtoint64(const char *str)
 {
+	return strtoint64_thread(NULL, str);
+}
+
+static int64
+strtoint64_thread(TState *thread, const char *str)
+{
 	const char *ptr = str;
 	int64		result = 0;
 	int			sign = 1;
@@ -667,7 +876,10 @@ strtoint64(const char *str)
 
 	/* require at least one digit */
 	if (!isdigit((unsigned char) *ptr))
-		fprintf(stderr, "invalid input syntax for integer: \"%s\"\n", str);
+	{
+		elog(thread, ELEVEL_MAIN,
+			 "invalid input syntax for integer: \"%s\"\n", str);
+	}
 
 	/* process digits */
 	while (*ptr && isdigit((unsigned char) *ptr))
@@ -675,7 +887,10 @@ strtoint64(const char *str)
 		int64		tmp = result * 10 + (*ptr++ - '0');
 
 		if ((tmp / 10) != result)	/* overflow? */
-			fprintf(stderr, "value \"%s\" is out of range for type bigint\n", str);
+		{
+			elog(thread, ELEVEL_MAIN,
+				 "value \"%s\" is out of range for type bigint\n", str);
+		}
 		result = tmp;
 	}
 
@@ -686,14 +901,17 @@ gotdigits:
 		ptr++;
 
 	if (*ptr != '\0')
-		fprintf(stderr, "invalid input syntax for integer: \"%s\"\n", str);
+	{
+		elog(thread, ELEVEL_MAIN,
+			 "invalid input syntax for integer: \"%s\"\n", str);
+	}
 
 	return ((sign < 0) ? -result : result);
 }
 
 /* random number generator: uniform distribution from min to max inclusive */
 static int64
-getrand(TState *thread, int64 min, int64 max)
+getrand(RandomState *random_state, int64 min, int64 max)
 {
 	/*
 	 * Odd coding is so that min and max have approximately the same chance of
@@ -704,7 +922,7 @@ getrand(TState *thread, int64 min, int64 max)
 	 * protected by a mutex, and therefore a bottleneck on machines with many
 	 * CPUs.
 	 */
-	return min + (int64) ((max - min + 1) * pg_erand48(thread->random_state));
+	return min + (int64) ((max - min + 1) * pg_erand48(random_state->data));
 }
 
 /*
@@ -713,7 +931,8 @@ getrand(TState *thread, int64 min, int64 max)
  * value is exp(-parameter).
  */
 static int64
-getExponentialRand(TState *thread, int64 min, int64 max, double parameter)
+getExponentialRand(RandomState *random_state, int64 min, int64 max,
+				   double parameter)
 {
 	double		cut,
 				uniform,
@@ -723,7 +942,7 @@ getExponentialRand(TState *thread, int64 min, int64 max, double parameter)
 	Assert(parameter > 0.0);
 	cut = exp(-parameter);
 	/* erand in [0, 1), uniform in (0, 1] */
-	uniform = 1.0 - pg_erand48(thread->random_state);
+	uniform = 1.0 - pg_erand48(random_state->data);
 
 	/*
 	 * inner expression in (cut, 1] (if parameter > 0), rand in [0, 1)
@@ -736,7 +955,8 @@ getExponentialRand(TState *thread, int64 min, int64 max, double parameter)
 
 /* random number generator: gaussian distribution from min to max inclusive */
 static int64
-getGaussianRand(TState *thread, int64 min, int64 max, double parameter)
+getGaussianRand(RandomState *random_state, int64 min, int64 max,
+				double parameter)
 {
 	double		stdev;
 	double		rand;
@@ -764,8 +984,8 @@ getGaussianRand(TState *thread, int64 min, int64 max, double parameter)
 		 * are expected in (0, 1] (see
 		 * http://en.wikipedia.org/wiki/Box_muller)
 		 */
-		double		rand1 = 1.0 - pg_erand48(thread->random_state);
-		double		rand2 = 1.0 - pg_erand48(thread->random_state);
+		double		rand1 = 1.0 - pg_erand48(random_state->data);
+		double		rand2 = 1.0 - pg_erand48(random_state->data);
 
 		/* Box-Muller basic form transform */
 		double		var_sqrt = sqrt(-2.0 * log(rand1));
@@ -792,7 +1012,7 @@ getGaussianRand(TState *thread, int64 min, int64 max, double parameter)
  * will approximate a Poisson distribution centered on the given value.
  */
 static int64
-getPoissonRand(TState *thread, int64 center)
+getPoissonRand(RandomState *random_state, int64 center)
 {
 	/*
 	 * Use inverse transform sampling to generate a value > 0, such that the
@@ -801,7 +1021,7 @@ getPoissonRand(TState *thread, int64 center)
 	double		uniform;
 
 	/* erand in [0, 1), uniform in (0, 1] */
-	uniform = 1.0 - pg_erand48(thread->random_state);
+	uniform = 1.0 - pg_erand48(random_state->data);
 
 	return (int64) (-log(uniform) * ((double) center) + 0.5);
 }
@@ -879,7 +1099,7 @@ zipfFindOrCreateCacheCell(ZipfCache * cache, int64 n, double s)
  * Luc Devroye, p. 550-551, Springer 1986.
  */
 static int64
-computeIterativeZipfian(TState *thread, int64 n, double s)
+computeIterativeZipfian(RandomState *random_state, int64 n, double s)
 {
 	double		b = pow(2.0, s - 1.0);
 	double		x,
@@ -890,8 +1110,8 @@ computeIterativeZipfian(TState *thread, int64 n, double s)
 	while (true)
 	{
 		/* random variates */
-		u = pg_erand48(thread->random_state);
-		v = pg_erand48(thread->random_state);
+		u = pg_erand48(random_state->data);
+		v = pg_erand48(random_state->data);
 
 		x = floor(pow(u, -1.0 / (s - 1.0)));
 
@@ -909,10 +1129,11 @@ computeIterativeZipfian(TState *thread, int64 n, double s)
  * Jim Gray et al, SIGMOD 1994
  */
 static int64
-computeHarmonicZipfian(TState *thread, int64 n, double s)
+computeHarmonicZipfian(TState *thread, RandomState *random_state, int64 n,
+					   double s)
 {
 	ZipfCell   *cell = zipfFindOrCreateCacheCell(&thread->zipf_cache, n, s);
-	double		uniform = pg_erand48(thread->random_state);
+	double		uniform = pg_erand48(random_state->data);
 	double		uz = uniform * cell->harmonicn;
 
 	if (uz < 1.0)
@@ -924,7 +1145,8 @@ computeHarmonicZipfian(TState *thread, int64 n, double s)
 
 /* random number generator: zipfian distribution from min to max inclusive */
 static int64
-getZipfianRand(TState *thread, int64 min, int64 max, double s)
+getZipfianRand(TState *thread, RandomState *random_state, int64 min,
+			   int64 max, double s)
 {
 	int64		n = max - min + 1;
 
@@ -933,8 +1155,8 @@ getZipfianRand(TState *thread, int64 min, int64 max, double s)
 
 
 	return min - 1 + ((s > 1)
-					  ? computeIterativeZipfian(thread, n, s)
-					  : computeHarmonicZipfian(thread, n, s));
+					? computeIterativeZipfian(random_state, n, s)
+					: computeHarmonicZipfian(thread, random_state, n, s));
 }
 
 /*
@@ -1034,6 +1256,10 @@ initStats(StatsData *sd, time_t start_time)
 	sd->start_time = start_time;
 	sd->cnt = 0;
 	sd->skipped = 0;
+	sd->retries = 0;
+	sd->retried = 0;
+	sd->errors = 0;
+	sd->errors_in_failed_tx = 0;
 	initSimpleStats(&sd->latency);
 	initSimpleStats(&sd->lag);
 }
@@ -1042,8 +1268,30 @@ initStats(StatsData *sd, time_t start_time)
  * Accumulate one additional item into the given stats object.
  */
 static void
-accumStats(StatsData *stats, bool skipped, double lat, double lag)
+accumStats(StatsData *stats, bool skipped, double lat, double lag,
+		   FailureStatus first_error, int64 retries)
 {
+	/*
+	 * Record the number of retries regardless of whether the transaction was
+	 * successful or failed.
+	 */
+	stats->retries += retries;
+	if (retries > 0)
+		stats->retried++;
+
+	/* Record the failed transaction */
+	if (first_error != NO_FAILURE)
+	{
+		stats->errors++;
+
+		if (first_error == IN_FAILED_SQL_TRANSACTION)
+			stats->errors_in_failed_tx++;
+
+		return;
+	}
+
+	/* Record the successful transaction */
+
 	stats->cnt++;
 
 	if (skipped)
@@ -1070,7 +1318,7 @@ executeStatement(PGconn *con, const char *sql)
 	res = PQexec(con, sql);
 	if (PQresultStatus(res) != PGRES_COMMAND_OK)
 	{
-		fprintf(stderr, "%s", PQerrorMessage(con));
+		elog(NULL, ELEVEL_MAIN, "%s", PQerrorMessage(con));
 		exit(1);
 	}
 	PQclear(res);
@@ -1085,15 +1333,19 @@ tryExecuteStatement(PGconn *con, const char *sql)
 	res = PQexec(con, sql);
 	if (PQresultStatus(res) != PGRES_COMMAND_OK)
 	{
-		fprintf(stderr, "%s", PQerrorMessage(con));
-		fprintf(stderr, "(ignoring this error and continuing anyway)\n");
+		if (errstart(NULL, ELEVEL_MAIN))
+		{
+			errmsg(NULL, "%s", PQerrorMessage(con));
+			errmsg(NULL, "(ignoring this error and continuing anyway)\n");
+			errfinish(NULL);
+		}
 	}
 	PQclear(res);
 }
 
 /* set up a connection to the backend */
 static PGconn *
-doConnect(void)
+doConnect(TState *thread)
 {
 	PGconn	   *conn;
 	bool		new_pass;
@@ -1132,8 +1384,8 @@ doConnect(void)
 
 		if (!conn)
 		{
-			fprintf(stderr, "connection to database \"%s\" failed\n",
-					dbName);
+			elog(thread, ELEVEL_MAIN,
+				 "connection to database \"%s\" failed\n", dbName);
 			return NULL;
 		}
 
@@ -1151,8 +1403,9 @@ doConnect(void)
 	/* check to see that the backend connection was successfully made */
 	if (PQstatus(conn) == CONNECTION_BAD)
 	{
-		fprintf(stderr, "connection to database \"%s\" failed:\n%s",
-				dbName, PQerrorMessage(conn));
+		elog(thread, ELEVEL_MAIN,
+			 "connection to database \"%s\" failed:\n%s",
+			 dbName, PQerrorMessage(conn));
 		PQfinish(conn);
 		return NULL;
 	}
@@ -1184,39 +1437,39 @@ compareVariableNames(const void *v1, const void *v2)
 
 /* Locate a variable by name; returns NULL if unknown */
 static Variable *
-lookupVariable(CState *st, char *name)
+lookupVariable(Variables *variables, char *name)
 {
 	Variable	key;
 
 	/* On some versions of Solaris, bsearch of zero items dumps core */
-	if (st->nvariables <= 0)
+	if (variables->nvariables <= 0)
 		return NULL;
 
 	/* Sort if we have to */
-	if (!st->vars_sorted)
+	if (!variables->vars_sorted)
 	{
-		qsort((void *) st->variables, st->nvariables, sizeof(Variable),
-			  compareVariableNames);
-		st->vars_sorted = true;
+		qsort((void *) variables->array, variables->nvariables,
+			  sizeof(Variable), compareVariableNames);
+		variables->vars_sorted = true;
 	}
 
 	/* Now we can search */
 	key.name = name;
 	return (Variable *) bsearch((void *) &key,
-								(void *) st->variables,
-								st->nvariables,
+								(void *) variables->array,
+								variables->nvariables,
 								sizeof(Variable),
 								compareVariableNames);
 }
 
 /* Get the value of a variable, in string form; returns NULL if unknown */
 static char *
-getVariable(CState *st, char *name)
+getVariable(Variables *variables, char *name)
 {
 	Variable   *var;
 	char		stringform[64];
 
-	var = lookupVariable(st, name);
+	var = lookupVariable(variables, name);
 	if (var == NULL)
 		return NULL;			/* not found */
 
@@ -1244,7 +1497,7 @@ getVariable(CState *st, char *name)
 
 /* Try to convert variable to a value; return false on failure */
 static bool
-makeVariableValue(Variable *var)
+makeVariableValue(TState *thread, Variable *var)
 {
 	size_t slen;
 
@@ -1281,7 +1534,7 @@ makeVariableValue(Variable *var)
 	}
 	else if (is_an_int(var->svalue))
 	{
-		setIntValue(&var->value, strtoint64(var->svalue));
+		setIntValue(&var->value, strtoint64_thread(thread, var->svalue));
 	}
 	else						/* type should be double */
 	{
@@ -1290,9 +1543,9 @@ makeVariableValue(Variable *var)
 
 		if (sscanf(var->svalue, "%lf%c", &dv, &xs) != 1)
 		{
-			fprintf(stderr,
-					"malformed variable \"%s\" value: \"%s\"\n",
-					var->name, var->svalue);
+			elog(thread, ELEVEL_CLIENT_FAIL,
+				 "malformed variable \"%s\" value: \"%s\"\n",
+				 var->name, var->svalue);
 			return false;
 		}
 		setDoubleValue(&var->value, dv);
@@ -1338,13 +1591,16 @@ valid_variable_name(const char *name)
  * Lookup a variable by name, creating it if need be.
  * Caller is expected to assign a value to the variable.
  * Returns NULL on failure (bad name).
+ *
+ * Pass the thread as not NULL for client commands and as NULL otherwise.
  */
 static Variable *
-lookupCreateVariable(CState *st, const char *context, char *name)
+lookupCreateVariable(TState *thread, Variables *variables, const char *context,
+					 char *name)
 {
 	Variable   *var;
 
-	var = lookupVariable(st, name);
+	var = lookupVariable(variables, name);
 	if (var == NULL)
 	{
 		Variable   *newvars;
@@ -1355,29 +1611,34 @@ lookupCreateVariable(CState *st, const char *context, char *name)
 		 */
 		if (!valid_variable_name(name))
 		{
-			fprintf(stderr, "%s: invalid variable name: \"%s\"\n",
-					context, name);
+			/*
+			 * About the error level used: if we process client commands, it a
+			 * normal failure; otherwise it is not and we exit the program.
+			 */
+			elog(thread, thread ? ELEVEL_CLIENT_FAIL : ELEVEL_MAIN,
+				 "%s: invalid variable name: \"%s\"\n",
+				 context, name);
 			return NULL;
 		}
 
 		/* Create variable at the end of the array */
-		if (st->variables)
-			newvars = (Variable *) pg_realloc(st->variables,
-											  (st->nvariables + 1) * sizeof(Variable));
+		if (variables->array)
+			newvars = (Variable *) pg_realloc(variables->array,
+								(variables->nvariables + 1) * sizeof(Variable));
 		else
 			newvars = (Variable *) pg_malloc(sizeof(Variable));
 
-		st->variables = newvars;
+		variables->array = newvars;
 
-		var = &newvars[st->nvariables];
+		var = &newvars[variables->nvariables];
 
 		var->name = pg_strdup(name);
 		var->svalue = NULL;
 		/* caller is expected to initialize remaining fields */
 
-		st->nvariables++;
+		variables->nvariables++;
 		/* we don't re-sort the array till we have to */
-		st->vars_sorted = false;
+		variables->vars_sorted = false;
 	}
 
 	return var;
@@ -1386,12 +1647,13 @@ lookupCreateVariable(CState *st, const char *context, char *name)
 /* Assign a string value to a variable, creating it if need be */
 /* Returns false on failure (bad name) */
 static bool
-putVariable(CState *st, const char *context, char *name, const char *value)
+putVariable(Variables *variables, const char *context, char *name,
+			const char *value)
 {
 	Variable   *var;
 	char	   *val;
 
-	var = lookupCreateVariable(st, context, name);
+	var = lookupCreateVariable(NULL, variables, context, name);
 	if (!var)
 		return false;
 
@@ -1408,13 +1670,14 @@ putVariable(CState *st, const char *context, char *name, const char *value)
 
 /* Assign a value to a variable, creating it if need be */
 /* Returns false on failure (bad name) */
+/* Pass the thread as not NULL for client commands and as NULL otherwise */
 static bool
-putVariableValue(CState *st, const char *context, char *name,
-				  const PgBenchValue *value)
+putVariableValue(TState *thread, Variables *variables, const char *context,
+				 char *name, const PgBenchValue *value)
 {
 	Variable   *var;
 
-	var = lookupCreateVariable(st, context, name);
+	var = lookupCreateVariable(thread, variables, context, name);
 	if (!var)
 		return false;
 
@@ -1428,13 +1691,15 @@ putVariableValue(CState *st, const char *context, char *name,
 
 /* Assign an integer value to a variable, creating it if need be */
 /* Returns false on failure (bad name) */
+/* Pass the thread as not NULL for client commands and as NULL otherwise */
 static bool
-putVariableInt(CState *st, const char *context, char *name, int64 value)
+putVariableInt(TState *thread, Variables *variables, const char *context,
+			   char *name, int64 value)
 {
 	PgBenchValue val;
 
 	setIntValue(&val, value);
-	return putVariableValue(st, context, name, &val);
+	return putVariableValue(thread, variables, context, name, &val);
 }
 
 /*
@@ -1489,7 +1754,7 @@ replaceVariable(char **sql, char *param, int len, char *value)
 }
 
 static char *
-assignVariables(CState *st, char *sql)
+assignVariables(Variables *variables, char *sql)
 {
 	char	   *p,
 			   *name,
@@ -1510,7 +1775,7 @@ assignVariables(CState *st, char *sql)
 			continue;
 		}
 
-		val = getVariable(st, name);
+		val = getVariable(variables, name);
 		free(name);
 		if (val == NULL)
 		{
@@ -1525,12 +1790,13 @@ assignVariables(CState *st, char *sql)
 }
 
 static void
-getQueryParams(CState *st, const Command *command, const char **params)
+getQueryParams(Variables *variables, const Command *command,
+			   const char **params)
 {
 	int			i;
 
 	for (i = 0; i < command->argc - 1; i++)
-		params[i] = getVariable(st, command->argv[i + 1]);
+		params[i] = getVariable(variables, command->argv[i + 1]);
 }
 
 static char *
@@ -1556,7 +1822,7 @@ valueTypeName(PgBenchValue *pval)
 
 /* get a value as a boolean, or tell if there is a problem */
 static bool
-coerceToBool(PgBenchValue *pval, bool *bval)
+coerceToBool(TState *thread, PgBenchValue *pval, bool *bval)
 {
 	if (pval->type == PGBT_BOOLEAN)
 	{
@@ -1565,7 +1831,8 @@ coerceToBool(PgBenchValue *pval, bool *bval)
 	}
 	else /* NULL, INT or DOUBLE */
 	{
-		fprintf(stderr, "cannot coerce %s to boolean\n", valueTypeName(pval));
+		elog(thread, ELEVEL_CLIENT_FAIL,
+			 "cannot coerce %s to boolean\n", valueTypeName(pval));
 		*bval = false;			/* suppress uninitialized-variable warnings */
 		return false;
 	}
@@ -1597,7 +1864,7 @@ valueTruth(PgBenchValue *pval)
 
 /* get a value as an int, tell if there is a problem */
 static bool
-coerceToInt(PgBenchValue *pval, int64 *ival)
+coerceToInt(TState *thread, PgBenchValue *pval, int64 *ival)
 {
 	if (pval->type == PGBT_INT)
 	{
@@ -1610,7 +1877,8 @@ coerceToInt(PgBenchValue *pval, int64 *ival)
 
 		if (dval < PG_INT64_MIN || PG_INT64_MAX < dval)
 		{
-			fprintf(stderr, "double to int overflow for %f\n", dval);
+			elog(thread, ELEVEL_CLIENT_FAIL,
+				 "double to int overflow for %f\n", dval);
 			return false;
 		}
 		*ival = (int64) dval;
@@ -1618,14 +1886,15 @@ coerceToInt(PgBenchValue *pval, int64 *ival)
 	}
 	else /* BOOLEAN or NULL */
 	{
-		fprintf(stderr, "cannot coerce %s to int\n", valueTypeName(pval));
+		elog(thread, ELEVEL_CLIENT_FAIL,
+			 "cannot coerce %s to int\n", valueTypeName(pval));
 		return false;
 	}
 }
 
 /* get a value as a double, or tell if there is a problem */
 static bool
-coerceToDouble(PgBenchValue *pval, double *dval)
+coerceToDouble(TState *thread, PgBenchValue *pval, double *dval)
 {
 	if (pval->type == PGBT_DOUBLE)
 	{
@@ -1639,7 +1908,8 @@ coerceToDouble(PgBenchValue *pval, double *dval)
 	}
 	else /* BOOLEAN or NULL */
 	{
-		fprintf(stderr, "cannot coerce %s to double\n", valueTypeName(pval));
+		elog(thread, ELEVEL_CLIENT_FAIL,
+			 "cannot coerce %s to double\n", valueTypeName(pval));
 		return false;
 	}
 }
@@ -1707,7 +1977,7 @@ evalLazyFunc(TState *thread, CState *st,
 			return true;
 		}
 
-		if (!coerceToBool(&a1, &ba1))
+		if (!coerceToBool(thread, &a1, &ba1))
 			return false;
 
 		if (!ba1)
@@ -1724,7 +1994,7 @@ evalLazyFunc(TState *thread, CState *st,
 			setNullValue(retval);
 			return true;
 		}
-		else if (!coerceToBool(&a2, &ba2))
+		else if (!coerceToBool(thread, &a2, &ba2))
 			return false;
 		else
 		{
@@ -1742,7 +2012,7 @@ evalLazyFunc(TState *thread, CState *st,
 			return true;
 		}
 
-		if (!coerceToBool(&a1, &ba1))
+		if (!coerceToBool(thread, &a1, &ba1))
 			return false;
 
 		if (ba1)
@@ -1759,7 +2029,7 @@ evalLazyFunc(TState *thread, CState *st,
 			setNullValue(retval);
 			return true;
 		}
-		else if (!coerceToBool(&a2, &ba2))
+		else if (!coerceToBool(thread, &a2, &ba2))
 			return false;
 		else
 		{
@@ -1817,8 +2087,8 @@ evalStandardFunc(TState *thread, CState *st,
 
 	if (l != NULL)
 	{
-		fprintf(stderr,
-				"too many function arguments, maximum is %d\n", MAX_FARGS);
+		elog(thread, ELEVEL_CLIENT_FAIL,
+			 "too many function arguments, maximum is %d\n", MAX_FARGS);
 		return false;
 	}
 
@@ -1855,8 +2125,8 @@ evalStandardFunc(TState *thread, CState *st,
 					double		ld,
 								rd;
 
-					if (!coerceToDouble(lval, &ld) ||
-						!coerceToDouble(rval, &rd))
+					if (!coerceToDouble(thread, lval, &ld) ||
+						!coerceToDouble(thread, rval, &rd))
 						return false;
 
 					switch (func)
@@ -1903,8 +2173,8 @@ evalStandardFunc(TState *thread, CState *st,
 					int64		li,
 								ri;
 
-					if (!coerceToInt(lval, &li) ||
-						!coerceToInt(rval, &ri))
+					if (!coerceToInt(thread, lval, &li) ||
+						!coerceToInt(thread, rval, &ri))
 						return false;
 
 					switch (func)
@@ -1941,7 +2211,8 @@ evalStandardFunc(TState *thread, CState *st,
 						case PGBENCH_MOD:
 							if (ri == 0)
 							{
-								fprintf(stderr, "division by zero\n");
+								elog(thread, ELEVEL_CLIENT_FAIL,
+									 "division by zero\n");
 								return false;
 							}
 							/* special handling of -1 divisor */
@@ -1952,7 +2223,8 @@ evalStandardFunc(TState *thread, CState *st,
 									/* overflow check (needed for INT64_MIN) */
 									if (li == PG_INT64_MIN)
 									{
-										fprintf(stderr, "bigint out of range\n");
+										elog(thread, ELEVEL_CLIENT_FAIL,
+											 "bigint out of range\n");
 										return false;
 									}
 									else
@@ -1986,7 +2258,8 @@ evalStandardFunc(TState *thread, CState *st,
 			{
 				int64 li, ri;
 
-				if (!coerceToInt(&vargs[0], &li) || !coerceToInt(&vargs[1], &ri))
+				if (!coerceToInt(thread, &vargs[0], &li) ||
+					!coerceToInt(thread, &vargs[1], &ri))
 					return false;
 
 				if (func == PGBENCH_BITAND)
@@ -2009,7 +2282,7 @@ evalStandardFunc(TState *thread, CState *st,
 		case PGBENCH_NOT:
 			{
 				bool b;
-				if (!coerceToBool(&vargs[0], &b))
+				if (!coerceToBool(thread, &vargs[0], &b))
 					return false;
 
 				setBoolValue(retval, !b);
@@ -2051,19 +2324,24 @@ evalStandardFunc(TState *thread, CState *st,
 
 				Assert(nargs == 1);
 
-				fprintf(stderr, "debug(script=%d,command=%d): ",
-						st->use_file, st->command + 1);
-
-				if (varg->type == PGBT_NULL)
-					fprintf(stderr, "null\n");
-				else if (varg->type == PGBT_BOOLEAN)
-					fprintf(stderr, "boolean %s\n", varg->u.bval ? "true" : "false");
-				else if (varg->type == PGBT_INT)
-					fprintf(stderr, "int " INT64_FORMAT "\n", varg->u.ival);
-				else if (varg->type == PGBT_DOUBLE)
-					fprintf(stderr, "double %.*g\n", DBL_DIG, varg->u.dval);
-				else /* internal error, unexpected type */
-					Assert(0);
+				if (errstart(thread, ELEVEL_MAIN))
+				{
+					errmsg(thread, "debug(script=%d,command=%d): ",
+						   st->use_file, st->command + 1);
+
+					if (varg->type == PGBT_NULL)
+						errmsg(thread, "null\n");
+					else if (varg->type == PGBT_BOOLEAN)
+						errmsg(thread, "boolean %s\n", varg->u.bval ? "true" : "false");
+					else if (varg->type == PGBT_INT)
+						errmsg(thread, "int " INT64_FORMAT "\n", varg->u.ival);
+					else if (varg->type == PGBT_DOUBLE)
+						errmsg(thread, "double %.*g\n", DBL_DIG, varg->u.dval);
+					else /* internal error, unexpected type */
+						Assert(0);
+
+					errfinish(thread);
+				}
 
 				*retval = *varg;
 
@@ -2080,7 +2358,7 @@ evalStandardFunc(TState *thread, CState *st,
 
 				Assert(nargs == 1);
 
-				if (!coerceToDouble(&vargs[0], &dval))
+				if (!coerceToDouble(thread, &vargs[0], &dval))
 					return false;
 
 				if (func == PGBENCH_SQRT)
@@ -2102,7 +2380,7 @@ evalStandardFunc(TState *thread, CState *st,
 
 				Assert(nargs == 1);
 
-				if (!coerceToInt(&vargs[0], &ival))
+				if (!coerceToInt(thread, &vargs[0], &ival))
 					return false;
 
 				setIntValue(retval, ival);
@@ -2132,13 +2410,13 @@ evalStandardFunc(TState *thread, CState *st,
 				{
 					double		extremum;
 
-					if (!coerceToDouble(&vargs[0], &extremum))
+					if (!coerceToDouble(thread, &vargs[0], &extremum))
 						return false;
 					for (i = 1; i < nargs; i++)
 					{
 						double		dval;
 
-						if (!coerceToDouble(&vargs[i], &dval))
+						if (!coerceToDouble(thread, &vargs[i], &dval))
 							return false;
 						if (func == PGBENCH_LEAST)
 							extremum = Min(extremum, dval);
@@ -2151,13 +2429,13 @@ evalStandardFunc(TState *thread, CState *st,
 				{
 					int64		extremum;
 
-					if (!coerceToInt(&vargs[0], &extremum))
+					if (!coerceToInt(thread, &vargs[0], &extremum))
 						return false;
 					for (i = 1; i < nargs; i++)
 					{
 						int64		ival;
 
-						if (!coerceToInt(&vargs[i], &ival))
+						if (!coerceToInt(thread, &vargs[i], &ival))
 							return false;
 						if (func == PGBENCH_LEAST)
 							extremum = Min(extremum, ival);
@@ -2180,27 +2458,29 @@ evalStandardFunc(TState *thread, CState *st,
 
 				Assert(nargs >= 2);
 
-				if (!coerceToInt(&vargs[0], &imin) ||
-					!coerceToInt(&vargs[1], &imax))
+				if (!coerceToInt(thread, &vargs[0], &imin) ||
+					!coerceToInt(thread, &vargs[1], &imax))
 					return false;
 
 				/* check random range */
 				if (imin > imax)
 				{
-					fprintf(stderr, "empty range given to random\n");
+					elog(thread, ELEVEL_CLIENT_FAIL,
+						 "empty range given to random\n");
 					return false;
 				}
 				else if (imax - imin < 0 || (imax - imin) + 1 < 0)
 				{
 					/* prevent int overflows in random functions */
-					fprintf(stderr, "random range is too large\n");
+					elog(thread, ELEVEL_CLIENT_FAIL,
+						 "random range is too large\n");
 					return false;
 				}
 
 				if (func == PGBENCH_RANDOM)
 				{
 					Assert(nargs == 2);
-					setIntValue(retval, getrand(thread, imin, imax));
+					setIntValue(retval, getrand(&st->random_state, imin, imax));
 				}
 				else			/* gaussian & exponential */
 				{
@@ -2208,46 +2488,49 @@ evalStandardFunc(TState *thread, CState *st,
 
 					Assert(nargs == 3);
 
-					if (!coerceToDouble(&vargs[2], &param))
+					if (!coerceToDouble(thread, &vargs[2], &param))
 						return false;
 
 					if (func == PGBENCH_RANDOM_GAUSSIAN)
 					{
 						if (param < MIN_GAUSSIAN_PARAM)
 						{
-							fprintf(stderr,
-									"gaussian parameter must be at least %f "
-									"(not %f)\n", MIN_GAUSSIAN_PARAM, param);
+							elog(thread, ELEVEL_CLIENT_FAIL,
+								 "gaussian parameter must be at least %f "
+								 "(not %f)\n", MIN_GAUSSIAN_PARAM, param);
 							return false;
 						}
 
 						setIntValue(retval,
-									getGaussianRand(thread, imin, imax, param));
+									getGaussianRand(&st->random_state, imin,
+													imax, param));
 					}
 					else if (func == PGBENCH_RANDOM_ZIPFIAN)
 					{
 						if (param <= 0.0 || param == 1.0 || param > MAX_ZIPFIAN_PARAM)
 						{
-							fprintf(stderr,
-									"zipfian parameter must be in range (0, 1) U (1, %d]"
-									" (got %f)\n", MAX_ZIPFIAN_PARAM, param);
+							elog(thread, ELEVEL_CLIENT_FAIL,
+								 "zipfian parameter must be in range (0, 1) U (1, %d]"
+								 " (got %f)\n", MAX_ZIPFIAN_PARAM, param);
 							return false;
 						}
 						setIntValue(retval,
-									getZipfianRand(thread, imin, imax, param));
+									getZipfianRand(thread, &st->random_state,
+												   imin, imax, param));
 					}
 					else		/* exponential */
 					{
 						if (param <= 0.0)
 						{
-							fprintf(stderr,
-									"exponential parameter must be greater than zero"
-									" (got %f)\n", param);
+							elog(thread, ELEVEL_CLIENT_FAIL,
+								 "exponential parameter must be greater than zero"
+								 " (got %f)\n", param);
 							return false;
 						}
 
 						setIntValue(retval,
-									getExponentialRand(thread, imin, imax, param));
+									getExponentialRand(&st->random_state, imin,
+													   imax, param));
 					}
 				}
 
@@ -2263,8 +2546,8 @@ evalStandardFunc(TState *thread, CState *st,
 
 				Assert(nargs == 2);
 
-				if (!coerceToDouble(lval, &ld) ||
-					!coerceToDouble(rval, &rd))
+				if (!coerceToDouble(thread, lval, &ld) ||
+					!coerceToDouble(thread, rval, &rd))
 					return false;
 
 				setDoubleValue(retval, pow(ld, rd));
@@ -2291,8 +2574,8 @@ evalStandardFunc(TState *thread, CState *st,
 
 				Assert(nargs == 2);
 
-				if (!coerceToInt(&vargs[0], &val) ||
-					!coerceToInt(&vargs[1], &seed))
+				if (!coerceToInt(thread, &vargs[0], &val) ||
+					!coerceToInt(thread, &vargs[1], &seed))
 					return false;
 
 				if (func == PGBENCH_HASH_MURMUR2)
@@ -2346,14 +2629,15 @@ evaluateExpr(TState *thread, CState *st, PgBenchExpr *expr, PgBenchValue *retval
 			{
 				Variable   *var;
 
-				if ((var = lookupVariable(st, expr->u.variable.varname)) == NULL)
+				if ((var = lookupVariable(&st->variables, expr->u.variable.varname)) == NULL)
 				{
-					fprintf(stderr, "undefined variable \"%s\"\n",
-							expr->u.variable.varname);
+					elog(thread, ELEVEL_CLIENT_FAIL,
+						 "undefined variable \"%s\"\n",
+						 expr->u.variable.varname);
 					return false;
 				}
 
-				if (!makeVariableValue(var))
+				if (!makeVariableValue(thread, var))
 					return false;
 
 				*retval = var->value;
@@ -2368,8 +2652,8 @@ evaluateExpr(TState *thread, CState *st, PgBenchExpr *expr, PgBenchValue *retval
 
 		default:
 			/* internal error which should never occur */
-			fprintf(stderr, "unexpected enode type in evaluation: %d\n",
-					expr->etype);
+			elog(thread, ELEVEL_MAIN,
+				 "unexpected enode type in evaluation: %d\n", expr->etype);
 			exit(1);
 	}
 }
@@ -2410,7 +2694,8 @@ getMetaCommand(const char *cmd)
  * Return true if succeeded, or false on error.
  */
 static bool
-runShellCommand(CState *st, char *variable, char **argv, int argc)
+runShellCommand(TState *thread, Variables *variables, char *variable,
+				char **argv, int argc)
 {
 	char		command[SHELL_COMMAND_SIZE];
 	int			i,
@@ -2441,17 +2726,18 @@ runShellCommand(CState *st, char *variable, char **argv, int argc)
 		{
 			arg = argv[i] + 1;	/* a string literal starting with colons */
 		}
-		else if ((arg = getVariable(st, argv[i] + 1)) == NULL)
+		else if ((arg = getVariable(variables, argv[i] + 1)) == NULL)
 		{
-			fprintf(stderr, "%s: undefined variable \"%s\"\n",
-					argv[0], argv[i]);
+			elog(thread, ELEVEL_CLIENT_FAIL,
+				 "%s: undefined variable \"%s\"\n", argv[0], argv[i]);
 			return false;
 		}
 
 		arglen = strlen(arg);
 		if (len + arglen + (i > 0 ? 1 : 0) >= SHELL_COMMAND_SIZE - 1)
 		{
-			fprintf(stderr, "%s: shell command is too long\n", argv[0]);
+			elog(thread, ELEVEL_CLIENT_FAIL,
+				 "%s: shell command is too long\n", argv[0]);
 			return false;
 		}
 
@@ -2469,7 +2755,10 @@ runShellCommand(CState *st, char *variable, char **argv, int argc)
 		if (system(command))
 		{
 			if (!timer_exceeded)
-				fprintf(stderr, "%s: could not launch shell command\n", argv[0]);
+			{
+				elog(thread, ELEVEL_CLIENT_FAIL,
+					 "%s: could not launch shell command\n", argv[0]);
+			}
 			return false;
 		}
 		return true;
@@ -2478,19 +2767,24 @@ runShellCommand(CState *st, char *variable, char **argv, int argc)
 	/* Execute the command with pipe and read the standard output. */
 	if ((fp = popen(command, "r")) == NULL)
 	{
-		fprintf(stderr, "%s: could not launch shell command\n", argv[0]);
+		elog(thread, ELEVEL_CLIENT_FAIL,
+			 "%s: could not launch shell command\n", argv[0]);
 		return false;
 	}
 	if (fgets(res, sizeof(res), fp) == NULL)
 	{
 		if (!timer_exceeded)
-			fprintf(stderr, "%s: could not read result of shell command\n", argv[0]);
+		{
+			elog(thread, ELEVEL_CLIENT_FAIL,
+				 "%s: could not read result of shell command\n", argv[0]);
+		}
 		(void) pclose(fp);
 		return false;
 	}
 	if (pclose(fp) < 0)
 	{
-		fprintf(stderr, "%s: could not close shell command\n", argv[0]);
+		elog(thread, ELEVEL_CLIENT_FAIL,
+			 "%s: could not close shell command\n", argv[0]);
 		return false;
 	}
 
@@ -2500,11 +2794,12 @@ runShellCommand(CState *st, char *variable, char **argv, int argc)
 		endptr++;
 	if (*res == '\0' || *endptr != '\0')
 	{
-		fprintf(stderr, "%s: shell command must return an integer (not \"%s\")\n",
-				argv[0], res);
+		elog(thread, ELEVEL_CLIENT_FAIL,
+			 "%s: shell command must return an integer (not \"%s\")\n",
+			 argv[0], res);
 		return false;
 	}
-	if (!putVariableInt(st, "setshell", variable, retval))
+	if (!putVariableInt(thread, variables, "setshell", variable, retval))
 		return false;
 
 #ifdef DEBUG
@@ -2521,11 +2816,47 @@ preparedStatementName(char *buffer, int file, int state)
 }
 
 static void
-commandFailed(CState *st, const char *cmd, const char *message)
+commandFailed(TState *thread, CState *st, const char *cmd, const char *message,
+			  ErrorLevel error_level)
 {
-	fprintf(stderr,
-			"client %d aborted in command %d (%s) of script %d; %s\n",
-			st->id, st->command, cmd, st->use_file, message);
+	switch (error_level)
+	{
+		case ELEVEL_CLIENT_FAIL:
+			if (st->first_failure.status == NO_FAILURE)
+			{
+				/*
+				 * This is the first failure during the execution of the current
+				 * script.
+				 */
+				elog(thread, ELEVEL_CLIENT_FAIL,
+					 "client %d got a failure in command %d (%s) of script %d; %s\n",
+					 st->id, st->command, cmd, st->use_file, message);
+			}
+			else
+			{
+				/*
+				 * This is not the first failure during the execution of the
+				 * current script.
+				 */
+				elog(thread, ELEVEL_CLIENT_FAIL,
+					 "client %d continues a failed transaction in command %d (%s) of script %d; %s\n",
+					 st->id, st->command, cmd, st->use_file, message);
+			}
+			break;
+		case ELEVEL_CLIENT_ABORTED:
+			elog(thread, ELEVEL_CLIENT_ABORTED,
+				 "client %d aborted in command %d (%s) of script %d; %s\n",
+				 st->id, st->command, cmd, st->use_file, message);
+			break;
+		case ELEVEL_DEBUG:
+		case ELEVEL_MAIN:
+		default:
+			/* internal error which should never occur */
+			elog(thread, ELEVEL_MAIN,
+				 "unexpected error level when the command failed: %d\n",
+				 error_level);
+			exit(1);
+	}
 }
 
 /* return a script number with a weighted choice. */
@@ -2538,7 +2869,7 @@ chooseScript(TState *thread)
 	if (num_scripts == 1)
 		return 0;
 
-	w = getrand(thread, 0, total_weight - 1);
+	w = getrand(&thread->random_state, 0, total_weight - 1);
 	do
 	{
 		w -= sql_script[i++].weight;
@@ -2549,7 +2880,7 @@ chooseScript(TState *thread)
 
 /* Send a SQL command, using the chosen querymode */
 static bool
-sendCommand(CState *st, Command *command)
+sendCommand(TState *thread, CState *st, Command *command)
 {
 	int			r;
 
@@ -2558,10 +2889,9 @@ sendCommand(CState *st, Command *command)
 		char	   *sql;
 
 		sql = pg_strdup(command->argv[0]);
-		sql = assignVariables(st, sql);
+		sql = assignVariables(&st->variables, sql);
 
-		if (debug)
-			fprintf(stderr, "client %d sending %s\n", st->id, sql);
+		elog(thread, ELEVEL_DEBUG, "client %d sending %s\n", st->id, sql);
 		r = PQsendQuery(st->con, sql);
 		free(sql);
 	}
@@ -2570,10 +2900,9 @@ sendCommand(CState *st, Command *command)
 		const char *sql = command->argv[0];
 		const char *params[MAX_ARGS];
 
-		getQueryParams(st, command, params);
+		getQueryParams(&st->variables, command, params);
 
-		if (debug)
-			fprintf(stderr, "client %d sending %s\n", st->id, sql);
+		elog(thread, ELEVEL_DEBUG, "client %d sending %s\n", st->id, sql);
 		r = PQsendQueryParams(st->con, sql, command->argc - 1,
 							  NULL, params, NULL, NULL, 0);
 	}
@@ -2598,17 +2927,16 @@ sendCommand(CState *st, Command *command)
 				res = PQprepare(st->con, name,
 								commands[j]->argv[0], commands[j]->argc - 1, NULL);
 				if (PQresultStatus(res) != PGRES_COMMAND_OK)
-					fprintf(stderr, "%s", PQerrorMessage(st->con));
+					elog(thread, ELEVEL_MAIN, "%s", PQerrorMessage(st->con));
 				PQclear(res);
 			}
 			st->prepared[st->use_file] = true;
 		}
 
-		getQueryParams(st, command, params);
+		getQueryParams(&st->variables, command, params);
 		preparedStatementName(name, st->use_file, st->command);
 
-		if (debug)
-			fprintf(stderr, "client %d sending %s\n", st->id, name);
+		elog(thread, ELEVEL_DEBUG, "client %d sending %s\n", st->id, name);
 		r = PQsendQueryPrepared(st->con, name, command->argc - 1,
 								params, NULL, NULL, 0);
 	}
@@ -2617,10 +2945,8 @@ sendCommand(CState *st, Command *command)
 
 	if (r == 0)
 	{
-		if (debug)
-			fprintf(stderr, "client %d could not send %s\n",
-					st->id, command->argv[0]);
-		st->ecnt++;
+		elog(thread, ELEVEL_DEBUG,
+			 "client %d could not send %s\n", st->id, command->argv[0]);
 		return false;
 	}
 	else
@@ -2632,17 +2958,18 @@ sendCommand(CState *st, Command *command)
  * of delay, in microseconds.  Returns true on success, false on error.
  */
 static bool
-evaluateSleep(CState *st, int argc, char **argv, int *usecs)
+evaluateSleep(TState *thread, Variables *variables, int argc, char **argv,
+			  int *usecs)
 {
 	char	   *var;
 	int			usec;
 
 	if (*argv[1] == ':')
 	{
-		if ((var = getVariable(st, argv[1] + 1)) == NULL)
+		if ((var = getVariable(variables, argv[1] + 1)) == NULL)
 		{
-			fprintf(stderr, "%s: undefined variable \"%s\"\n",
-					argv[0], argv[1]);
+			elog(thread, ELEVEL_CLIENT_FAIL,
+				 "%s: undefined variable \"%s\"\n", argv[0], argv[1]);
 			return false;
 		}
 		usec = atoi(var);
@@ -2665,6 +2992,186 @@ evaluateSleep(CState *st, int argc, char **argv, int *usecs)
 }
 
 /*
+ * Get the number of all processed transactions including skipped ones and
+ * errors.
+ */
+static int64
+getTotalCnt(const CState *st)
+{
+	return st->cnt + st->ecnt;
+}
+
+/*
+ * Copy an array of random state.
+ */
+static void
+copyRandomState(RandomState *destination, const RandomState *source)
+{
+	memcpy(destination->data, source->data, sizeof(unsigned short) * 3);
+}
+
+/*
+ * Make a deep copy of variables array.
+ */
+static void
+copyVariables(Variables *destination_vars, const Variables *source_vars)
+{
+	Variable   *destination;
+	Variable   *current_destination;
+	const Variable *source;
+	const Variable *current_source;
+	int			nvariables;
+
+	if (!destination_vars || !source_vars)
+		return;
+
+	destination = destination_vars->array;
+	source = source_vars->array;
+	nvariables = source_vars->nvariables;
+
+	for (current_destination = destination;
+		 current_destination - destination < destination_vars->nvariables;
+		 ++current_destination)
+	{
+		pg_free(current_destination->name);
+		pg_free(current_destination->svalue);
+	}
+
+	destination_vars->array = pg_realloc(destination_vars->array,
+										 sizeof(Variable) * nvariables);
+	destination = destination_vars->array;
+
+	for (current_source = source, current_destination = destination;
+		 current_source - source < nvariables;
+		 ++current_source, ++current_destination)
+	{
+		current_destination->name = pg_strdup(current_source->name);
+		if (current_source->svalue)
+			current_destination->svalue = pg_strdup(current_source->svalue);
+		else
+			current_destination->svalue = NULL;
+		current_destination->value = current_source->value;
+	}
+
+	destination_vars->nvariables = nvariables;
+	destination_vars->vars_sorted = source_vars->vars_sorted;
+}
+
+/*
+ * Returns true if this type of failure can be retried.
+ */
+static bool
+canRetryFailure(FailureStatus failure_status)
+{
+	return (failure_status == SERIALIZATION_FAILURE ||
+			failure_status == DEADLOCK_FAILURE);
+}
+
+/*
+ * Returns true if the failure can be retried.
+ */
+static bool
+canRetry(CState *st, instr_time *now)
+{
+	FailureStatus failure_status = st->first_failure.status;
+
+	Assert(failure_status != NO_FAILURE);
+
+	/* We can only retry serialization or deadlock failures. */
+	if (!canRetryFailure(failure_status))
+		return false;
+
+	/*
+	 * We must have at least one option to limit the retrying of failed
+	 * transactions.
+	 */
+	Assert(max_tries || latency_limit);
+
+	/*
+	 * We cannot retry the failure if we have reached the maximum number of
+	 * tries.
+	 */
+	if (max_tries && st->retries + 1 >= max_tries)
+		return false;
+
+	/*
+	 * We cannot retry the failure if we spent too much time on this
+	 * transaction.
+	 */
+	if (latency_limit)
+	{
+		if (INSTR_TIME_IS_ZERO(*now))
+			INSTR_TIME_SET_CURRENT(*now);
+
+		if (INSTR_TIME_GET_MICROSEC(*now) - st->txn_scheduled >= latency_limit)
+			return false;
+	}
+
+	/* OK */
+	return true;
+}
+
+/*
+ * Process the conditional stack depending on the condition value; is used for
+ * the meta commands \if and \elif.
+ */
+static void
+executeCondition(CState *st, bool condition)
+{
+	Command    *command = sql_script[st->use_file].commands[st->command];
+
+	/* execute or not depending on evaluated condition */
+	if (command->meta == META_IF)
+	{
+		conditional_stack_push(st->cstack,
+							   condition ? IFSTATE_TRUE : IFSTATE_FALSE);
+	}
+	else if (command->meta == META_ELIF)
+	{
+		/* we should get here only if the "elif" needed evaluation */
+		Assert(conditional_stack_peek(st->cstack) == IFSTATE_FALSE);
+		conditional_stack_poke(st->cstack,
+							   condition ? IFSTATE_TRUE : IFSTATE_FALSE);
+	}
+}
+
+/*
+ * Get the failure status from the error code.
+ */
+static FailureStatus
+getFailureStatus(char *sqlState)
+{
+	if (sqlState)
+	{
+		if (strcmp(sqlState, ERRCODE_T_R_SERIALIZATION_FAILURE) == 0)
+			return SERIALIZATION_FAILURE;
+		else if (strcmp(sqlState, ERRCODE_T_R_DEADLOCK_DETECTED) == 0)
+			return DEADLOCK_FAILURE;
+		else if (strcmp(sqlState, ERRCODE_IN_FAILED_SQL_TRANSACTION) == 0)
+			return IN_FAILED_SQL_TRANSACTION;
+	}
+
+	return ANOTHER_FAILURE;
+}
+
+/*
+ * If the latency limit is used, return a percentage of the current transaction
+ * latency from the latency limit. Otherwise return zero.
+ */
+static double
+getLatencyUsed(CState *st, instr_time *now)
+{
+	if (!latency_limit)
+		return 0;
+
+	if (INSTR_TIME_IS_ZERO(*now))
+		INSTR_TIME_SET_CURRENT(*now);
+
+	return (100.0 * (INSTR_TIME_GET_MICROSEC(*now) - st->txn_scheduled) /
+			latency_limit);
+}
+
+/*
  * Advance the state machine of a connection, if possible.
  */
 static void
@@ -2675,6 +3182,7 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 	instr_time	now;
 	bool		end_tx_processed = false;
 	int64		wait;
+	FailureStatus failure_status = NO_FAILURE;
 
 	/*
 	 * gettimeofday() isn't free, so we get the current timestamp lazily the
@@ -2705,9 +3213,9 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 
 				st->use_file = chooseScript(thread);
 
-				if (debug)
-					fprintf(stderr, "client %d executing script \"%s\"\n", st->id,
-							sql_script[st->use_file].desc);
+				elog(thread, ELEVEL_DEBUG,
+					 "client %d executing script \"%s\"\n",
+					 st->id, sql_script[st->use_file].desc);
 
 				if (throttle_delay > 0)
 					st->state = CSTATE_START_THROTTLE;
@@ -2715,6 +3223,11 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 					st->state = CSTATE_START_TX;
 				/* check consistency */
 				Assert(conditional_stack_empty(st->cstack));
+
+				/* reset transaction variables to default values */
+				st->first_failure.status = NO_FAILURE;
+				st->retries = 0;
+
 				break;
 
 				/*
@@ -2732,7 +3245,7 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 				 * away.
 				 */
 				Assert(throttle_delay > 0);
-				wait = getPoissonRand(thread, throttle_delay);
+				wait = getPoissonRand(&thread->random_state, throttle_delay);
 
 				thread->throttle_trigger += wait;
 				st->txn_scheduled = thread->throttle_trigger;
@@ -2762,16 +3275,17 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 						INSTR_TIME_SET_CURRENT(now);
 					now_us = INSTR_TIME_GET_MICROSEC(now);
 					while (thread->throttle_trigger < now_us - latency_limit &&
-						   (nxacts <= 0 || st->cnt < nxacts))
+						   (nxacts <= 0 || getTotalCnt(st) < nxacts))
 					{
 						processXactStats(thread, st, &now, true, agg);
 						/* next rendez-vous */
-						wait = getPoissonRand(thread, throttle_delay);
+						wait = getPoissonRand(&thread->random_state,
+											  throttle_delay);
 						thread->throttle_trigger += wait;
 						st->txn_scheduled = thread->throttle_trigger;
 					}
 					/* stop client if -t exceeded */
-					if (nxacts > 0 && st->cnt >= nxacts)
+					if (nxacts > 0 && getTotalCnt(st) >= nxacts)
 					{
 						st->state = CSTATE_FINISHED;
 						break;
@@ -2779,9 +3293,9 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 				}
 
 				st->state = CSTATE_THROTTLE;
-				if (debug)
-					fprintf(stderr, "client %d throttling " INT64_FORMAT " us\n",
-							st->id, wait);
+				elog(thread, ELEVEL_DEBUG,
+					 "client %d throttling " INT64_FORMAT " us\n",
+					 st->id, wait);
 				break;
 
 				/*
@@ -2811,10 +3325,11 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 					if (INSTR_TIME_IS_ZERO(now))
 						INSTR_TIME_SET_CURRENT(now);
 					start = now;
-					if ((st->con = doConnect()) == NULL)
+					if ((st->con = doConnect(thread)) == NULL)
 					{
-						fprintf(stderr, "client %d aborted while establishing connection\n",
-								st->id);
+						elog(thread, ELEVEL_CLIENT_ABORTED,
+							 "client %d aborted while establishing connection\n",
+							 st->id);
 						st->state = CSTATE_ABORTED;
 						break;
 					}
@@ -2826,7 +3341,16 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 				}
 
 				/*
-				 * Record transaction start time under logging, progress or
+				 * It is the first try to run this transaction. Remember its
+				 * parameters just in case if it fails or we should repeat it in
+				 * future.
+				 */
+				copyRandomState(&st->retry_state.random_state,
+								&st->random_state);
+				copyVariables(&st->retry_state.variables, &st->variables);
+
+				/*
+				 * Record transaction start time under logging, progress,
 				 * throttling.
 				 */
 				if (use_log || progress || throttle_delay || latency_limit ||
@@ -2861,7 +3385,15 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 				 */
 				if (command == NULL)
 				{
-					st->state = CSTATE_END_TX;
+					if (st->first_failure.status == NO_FAILURE)
+					{
+						st->state = CSTATE_END_TX;
+					}
+					else
+					{
+						/* check if we can retry the failure */
+						st->state = CSTATE_RETRY;
+					}
 					break;
 				}
 
@@ -2869,7 +3401,7 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 				 * Record statement start time if per-command latencies are
 				 * requested
 				 */
-				if (is_latencies)
+				if (report_per_command)
 				{
 					if (INSTR_TIME_IS_ZERO(now))
 						INSTR_TIME_SET_CURRENT(now);
@@ -2878,9 +3410,11 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 
 				if (command->type == SQL_COMMAND)
 				{
-					if (!sendCommand(st, command))
+					if (!sendCommand(thread, st, command))
 					{
-						commandFailed(st, "SQL", "SQL command send failed");
+						commandFailed(thread, st, "SQL",
+									  "SQL command send failed",
+									  ELEVEL_CLIENT_ABORTED);
 						st->state = CSTATE_ABORTED;
 					}
 					else
@@ -2892,14 +3426,19 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 								i;
 					char	  **argv = command->argv;
 
-					if (debug)
+					if (errstart(thread, ELEVEL_DEBUG))
 					{
-						fprintf(stderr, "client %d executing \\%s", st->id, argv[0]);
+						errmsg(thread, "client %d executing \\%s",
+							   st->id, argv[0]);
 						for (i = 1; i < argc; i++)
-							fprintf(stderr, " %s", argv[i]);
-						fprintf(stderr, "\n");
+							errmsg(thread, " %s", argv[i]);
+						errmsg(thread, "\n");
+						errfinish(thread);
 					}
 
+					/* change it if the meta command fails */
+					failure_status = NO_FAILURE;
+
 					if (command->meta == META_SLEEP)
 					{
 						/*
@@ -2911,10 +3450,14 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 						 */
 						int			usec;
 
-						if (!evaluateSleep(st, argc, argv, &usec))
+						if (!evaluateSleep(thread, &st->variables, argc, argv,
+										   &usec))
 						{
-							commandFailed(st, "sleep", "execution of meta-command failed");
-							st->state = CSTATE_ABORTED;
+							commandFailed(thread, st, "sleep",
+										  "execution of meta-command failed",
+										  ELEVEL_CLIENT_FAIL);
+							failure_status = ANOTHER_FAILURE;
+							st->state = CSTATE_FAILURE;
 							break;
 						}
 
@@ -2942,35 +3485,37 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 
 						if (!evaluateExpr(thread, st, expr, &result))
 						{
-							commandFailed(st, argv[0], "evaluation of meta-command failed");
-							st->state = CSTATE_ABORTED;
+							commandFailed(thread, st, argv[0],
+										  "evaluation of meta-command failed",
+										  ELEVEL_CLIENT_FAIL);
+
+							/*
+							 * Do not ruin the following conditional commands,
+							 * if any.
+							 */
+							executeCondition(st, false);
+
+							failure_status = ANOTHER_FAILURE;
+							st->state = CSTATE_FAILURE;
 							break;
 						}
 
 						if (command->meta == META_SET)
 						{
-							if (!putVariableValue(st, argv[0], argv[1], &result))
+							if (!putVariableValue(thread, &st->variables,
+												  argv[0], argv[1], &result))
 							{
-								commandFailed(st, "set", "assignment of meta-command failed");
-								st->state = CSTATE_ABORTED;
+								commandFailed(thread, st, "set",
+											  "assignment of meta-command failed",
+											  ELEVEL_CLIENT_FAIL);
+								failure_status = ANOTHER_FAILURE;
+								st->state = CSTATE_FAILURE;
 								break;
 							}
 						}
 						else /* if and elif evaluated cases */
 						{
-							bool cond = valueTruth(&result);
-
-							/* execute or not depending on evaluated condition */
-							if (command->meta == META_IF)
-							{
-								conditional_stack_push(st->cstack, cond ? IFSTATE_TRUE : IFSTATE_FALSE);
-							}
-							else /* elif */
-							{
-								/* we should get here only if the "elif" needed evaluation */
-								Assert(conditional_stack_peek(st->cstack) == IFSTATE_FALSE);
-								conditional_stack_poke(st->cstack, cond ? IFSTATE_TRUE : IFSTATE_FALSE);
-							}
+							executeCondition(st, valueTruth(&result));
 						}
 					}
 					else if (command->meta == META_ELSE)
@@ -2999,7 +3544,10 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 					}
 					else if (command->meta == META_SETSHELL)
 					{
-						bool		ret = runShellCommand(st, argv[1], argv + 2, argc - 2);
+						bool		ret = runShellCommand(thread,
+														  &st->variables,
+														  argv[1], argv + 2,
+														  argc - 2);
 
 						if (timer_exceeded) /* timeout */
 						{
@@ -3008,8 +3556,11 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 						}
 						else if (!ret)	/* on error */
 						{
-							commandFailed(st, "setshell", "execution of meta-command failed");
-							st->state = CSTATE_ABORTED;
+							commandFailed(thread, st, "setshell",
+										  "execution of meta-command failed",
+										  ELEVEL_CLIENT_FAIL);
+							failure_status = ANOTHER_FAILURE;
+							st->state = CSTATE_FAILURE;
 							break;
 						}
 						else
@@ -3019,7 +3570,9 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 					}
 					else if (command->meta == META_SHELL)
 					{
-						bool		ret = runShellCommand(st, NULL, argv + 1, argc - 1);
+						bool		ret = runShellCommand(thread,
+														  &st->variables, NULL,
+														  argv + 1, argc - 1);
 
 						if (timer_exceeded) /* timeout */
 						{
@@ -3028,8 +3581,11 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 						}
 						else if (!ret)	/* on error */
 						{
-							commandFailed(st, "shell", "execution of meta-command failed");
-							st->state = CSTATE_ABORTED;
+							commandFailed(thread, st, "shell",
+										  "execution of meta-command failed",
+										  ELEVEL_CLIENT_FAIL);
+							failure_status = ANOTHER_FAILURE;
+							st->state = CSTATE_FAILURE;
 							break;
 						}
 						else
@@ -3134,37 +3690,56 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 				 * Wait for the current SQL command to complete
 				 */
 			case CSTATE_WAIT_RESULT:
-				command = sql_script[st->use_file].commands[st->command];
-				if (debug)
-					fprintf(stderr, "client %d receiving\n", st->id);
-				if (!PQconsumeInput(st->con))
-				{				/* there's something wrong */
-					commandFailed(st, "SQL", "perhaps the backend died while processing");
-					st->state = CSTATE_ABORTED;
-					break;
-				}
-				if (PQisBusy(st->con))
-					return;		/* don't have the whole result yet */
-
-				/*
-				 * Read and discard the query result;
-				 */
-				res = PQgetResult(st->con);
-				switch (PQresultStatus(res))
 				{
-					case PGRES_COMMAND_OK:
-					case PGRES_TUPLES_OK:
-					case PGRES_EMPTY_QUERY:
-						/* OK */
-						PQclear(res);
-						discard_response(st);
-						st->state = CSTATE_END_COMMAND;
-						break;
-					default:
-						commandFailed(st, "SQL", PQerrorMessage(st->con));
-						PQclear(res);
+					char	   *sqlState;
+
+					command = sql_script[st->use_file].commands[st->command];
+					elog(thread, ELEVEL_DEBUG, "client %d receiving\n", st->id);
+					if (!PQconsumeInput(st->con))
+					{				/* there's something wrong */
+						commandFailed(thread, st, "SQL",
+									  "perhaps the backend died while processing",
+									  ELEVEL_CLIENT_ABORTED);
 						st->state = CSTATE_ABORTED;
 						break;
+					}
+					if (PQisBusy(st->con))
+						return;		/* don't have the whole result yet */
+
+					/*
+					 * Read and discard the query result;
+					 */
+					res = PQgetResult(st->con);
+					sqlState = PQresultErrorField(res, PG_DIAG_SQLSTATE);
+					switch (PQresultStatus(res))
+					{
+						case PGRES_COMMAND_OK:
+						case PGRES_TUPLES_OK:
+						case PGRES_EMPTY_QUERY:
+							/* OK */
+							PQclear(res);
+							discard_response(st);
+							failure_status = NO_FAILURE;
+							st->state = CSTATE_END_COMMAND;
+							break;
+						case PGRES_NONFATAL_ERROR:
+						case PGRES_FATAL_ERROR:
+							failure_status = getFailureStatus(sqlState);
+							commandFailed(thread, st, "SQL",
+										  PQerrorMessage(st->con),
+										  ELEVEL_CLIENT_FAIL);
+							PQclear(res);
+							discard_response(st);
+							st->state = CSTATE_FAILURE;
+							break;
+						default:
+							commandFailed(thread, st, "SQL",
+										  PQerrorMessage(st->con),
+										  ELEVEL_CLIENT_ABORTED);
+							PQclear(res);
+							st->state = CSTATE_ABORTED;
+							break;
+					}
 				}
 				break;
 
@@ -3193,7 +3768,7 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 				 * in thread-local data structure, if per-command latencies
 				 * are requested.
 				 */
-				if (is_latencies)
+				if (report_per_command)
 				{
 					if (INSTR_TIME_IS_ZERO(now))
 						INSTR_TIME_SET_CURRENT(now);
@@ -3212,6 +3787,132 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 				break;
 
 				/*
+				 * Remember the failure and go ahead with next command.
+				 */
+			case CSTATE_FAILURE:
+
+				Assert(failure_status != NO_FAILURE);
+
+				/*
+				 * All subsequent failures will be "retried"/"failed" if the
+				 * first failure of this transaction can be/cannot be retried.
+				 * Therefore remember only the first failure.
+				 */
+				if (st->first_failure.status == NO_FAILURE)
+				{
+					st->first_failure.status = failure_status;
+					st->first_failure.command = st->command;
+				}
+
+				/* Go ahead with next command, to be executed or skipped */
+				st->command++;
+				st->state = conditional_active(st->cstack) ?
+					CSTATE_START_COMMAND : CSTATE_SKIP_COMMAND;
+				break;
+
+			/*
+			 * Retry the failed transaction if possible.
+			 */
+			case CSTATE_RETRY:
+				command = sql_script[st->use_file].commands[st->first_failure.command];
+
+				if (canRetry(st, &now))
+				{
+					/*
+					 * The failed transaction will be retried. So accumulate the
+					 * retry.
+					 */
+					st->retries++;
+					command->retries++;
+
+					/*
+					 * Report this with failures to indicate that the failed
+					 * transaction will be retried.
+					 */
+					if (errstart(thread, ELEVEL_CLIENT_FAIL))
+					{
+						errmsg(thread,
+							   "client %d repeats the failed transaction (try %d",
+							   st->id, st->retries + 1);
+						if (max_tries)
+							errmsg(thread, "/%d", max_tries);
+						if (latency_limit)
+						{
+							errmsg(thread,
+								   ", %.3f%% of the maximum time of tries was used",
+								   getLatencyUsed(st, &now));
+						}
+						errmsg(thread, ")\n");
+						errfinish(thread);
+					}
+
+					/*
+					 * Reset the execution parameters as they were at the
+					 * beginning of the transaction.
+					 */
+					copyRandomState(&st->random_state,
+									&st->retry_state.random_state);
+					copyVariables(&st->variables, &st->retry_state.variables);
+
+					/* Process the first transaction command */
+					st->command = 0;
+					st->first_failure.status = NO_FAILURE;
+					st->state = CSTATE_START_COMMAND;
+				}
+				else
+				{
+					/*
+					 * We will not be able to retry this failed transaction. So
+					 * accumulate the error.
+					 */
+					command->errors++;
+					if (st->first_failure.status ==
+						IN_FAILED_SQL_TRANSACTION)
+						command->errors_in_failed_tx++;
+
+					/*
+					 * Report this with failures to indicate that the failed
+					 * transaction will not be retried.
+					 */
+					if (errstart(thread, ELEVEL_CLIENT_FAIL))
+					{
+						errmsg(thread,
+							   "client %d ends the failed transaction (try %d",
+							   st->id, st->retries + 1);
+
+						/*
+						 * Report the actual number and/or time of tries. We
+						 * do not need this information if this type of
+						 * failure can be never retried.
+						 */
+						if (canRetryFailure(st->first_failure.status))
+						{
+							if (max_tries)
+								errmsg(thread, "/%d", max_tries);
+							if (latency_limit)
+							{
+								errmsg(thread,
+									   ", %.3f%% of the maximum time of tries was used",
+									   getLatencyUsed(st, &now));
+							}
+						}
+						errmsg(thread, ")\n");
+						errfinish(thread);
+					}
+
+					/*
+					 * Reset the execution parameters as they were at the
+					 * beginning of the transaction except for a random
+					 * state.
+					 */
+					copyVariables(&st->variables, &st->retry_state.variables);
+
+					/* End the failed transaction */
+					st->state = CSTATE_END_TX;
+				}
+				break;
+
+				/*
 				 * End of transaction.
 				 */
 			case CSTATE_END_TX:
@@ -3222,7 +3923,8 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 				/* conditional stack must be empty */
 				if (!conditional_stack_empty(st->cstack))
 				{
-					fprintf(stderr, "end of script reached within a conditional, missing \\endif\n");
+					elog(thread, ELEVEL_MAIN,
+						 "end of script reached within a conditional, missing \\endif\n");
 					exit(1);
 				}
 
@@ -3232,7 +3934,8 @@ doCustom(TState *thread, CState *st, StatsData *agg)
 					INSTR_TIME_SET_ZERO(now);
 				}
 
-				if ((st->cnt >= nxacts && duration <= 0) || timer_exceeded)
+				if ((getTotalCnt(st) >= nxacts && duration <= 0) ||
+					timer_exceeded)
 				{
 					/* exit success */
 					st->state = CSTATE_FINISHED;
@@ -3292,7 +3995,7 @@ doLog(TState *thread, CState *st,
 	 * to the random sample.
 	 */
 	if (sample_rate != 0.0 &&
-		pg_erand48(thread->random_state) > sample_rate)
+		pg_erand48(thread->random_state.data) > sample_rate)
 		return;
 
 	/* should we aggregate the results or not? */
@@ -3308,13 +4011,15 @@ doLog(TState *thread, CState *st,
 		while (agg->start_time + agg_interval <= now)
 		{
 			/* print aggregated report to logfile */
-			fprintf(logfile, "%ld " INT64_FORMAT " %.0f %.0f %.0f %.0f",
+			fprintf(logfile, "%ld " INT64_FORMAT " %.0f %.0f %.0f %.0f " INT64_FORMAT " " INT64_FORMAT,
 					(long) agg->start_time,
 					agg->cnt,
 					agg->latency.sum,
 					agg->latency.sum2,
 					agg->latency.min,
-					agg->latency.max);
+					agg->latency.max,
+					agg->errors,
+					agg->errors_in_failed_tx);
 			if (throttle_delay)
 			{
 				fprintf(logfile, " %.0f %.0f %.0f %.0f",
@@ -3325,6 +4030,10 @@ doLog(TState *thread, CState *st,
 				if (latency_limit)
 					fprintf(logfile, " " INT64_FORMAT, agg->skipped);
 			}
+			if (max_tries > 1 || latency_limit)
+				fprintf(logfile, " " INT64_FORMAT " " INT64_FORMAT,
+						agg->retried,
+						agg->retries);
 			fputc('\n', logfile);
 
 			/* reset data and move to next interval */
@@ -3332,7 +4041,8 @@ doLog(TState *thread, CState *st,
 		}
 
 		/* accumulate the current transaction */
-		accumStats(agg, skipped, latency, lag);
+		accumStats(agg, skipped, latency, lag, st->first_failure.status,
+				   st->retries);
 	}
 	else
 	{
@@ -3342,14 +4052,25 @@ doLog(TState *thread, CState *st,
 		gettimeofday(&tv, NULL);
 		if (skipped)
 			fprintf(logfile, "%d " INT64_FORMAT " skipped %d %ld %ld",
-					st->id, st->cnt, st->use_file,
+					st->id, getTotalCnt(st), st->use_file,
 					(long) tv.tv_sec, (long) tv.tv_usec);
-		else
+		else if (st->first_failure.status == NO_FAILURE)
 			fprintf(logfile, "%d " INT64_FORMAT " %.0f %d %ld %ld",
-					st->id, st->cnt, latency, st->use_file,
+					st->id, getTotalCnt(st), latency, st->use_file,
+					(long) tv.tv_sec, (long) tv.tv_usec);
+		else if (st->first_failure.status == IN_FAILED_SQL_TRANSACTION)
+			fprintf(logfile, "%d " INT64_FORMAT " in_failed_tx %d %ld %ld",
+					st->id, getTotalCnt(st), st->use_file,
 					(long) tv.tv_sec, (long) tv.tv_usec);
+		else
+			fprintf(logfile, "%d " INT64_FORMAT " failed %d %ld %ld",
+					st->id, getTotalCnt(st), st->use_file,
+					(long) tv.tv_sec, (long) tv.tv_usec);
+
 		if (throttle_delay)
 			fprintf(logfile, " %.0f", lag);
+		if (max_tries > 1 || latency_limit)
+			fprintf(logfile, " %d", st->retries);
 		fputc('\n', logfile);
 	}
 }
@@ -3369,7 +4090,8 @@ processXactStats(TState *thread, CState *st, instr_time *now,
 	bool		thread_details = progress || throttle_delay || latency_limit,
 				detailed = thread_details || use_log || per_script_stats;
 
-	if (detailed && !skipped)
+	if (detailed && !skipped &&
+		(st->first_failure.status == NO_FAILURE || latency_limit))
 	{
 		if (INSTR_TIME_IS_ZERO(*now))
 			INSTR_TIME_SET_CURRENT(*now);
@@ -3382,7 +4104,8 @@ processXactStats(TState *thread, CState *st, instr_time *now,
 	if (thread_details)
 	{
 		/* keep detailed thread stats */
-		accumStats(&thread->stats, skipped, latency, lag);
+		accumStats(&thread->stats, skipped, latency, lag,
+				   st->first_failure.status, st->retries);
 
 		/* count transactions over the latency limit, if needed */
 		if (latency_limit && latency > latency_limit)
@@ -3390,19 +4113,24 @@ processXactStats(TState *thread, CState *st, instr_time *now,
 	}
 	else
 	{
-		/* no detailed stats, just count */
-		thread->stats.cnt++;
+		/* no detailed stats */
+		accumStats(&thread->stats, skipped, 0, 0, st->first_failure.status,
+				   st->retries);
 	}
 
 	/* client stat is just counting */
-	st->cnt++;
+	if (st->first_failure.status == NO_FAILURE)
+		st->cnt++;
+	else
+		st->ecnt++;
 
 	if (use_log)
 		doLog(thread, st, agg, skipped, latency, lag);
 
 	/* XXX could use a mutex here, but we choose not to */
 	if (per_script_stats)
-		accumStats(&sql_script[st->use_file].stats, skipped, latency, lag);
+		accumStats(&sql_script[st->use_file].stats, skipped, latency, lag,
+				   st->first_failure.status, st->retries);
 }
 
 
@@ -3422,7 +4150,7 @@ disconnect_all(CState *state, int length)
 static void
 initDropTables(PGconn *con)
 {
-	fprintf(stderr, "dropping old tables...\n");
+	elog(NULL, ELEVEL_MAIN, "dropping old tables...\n");
 
 	/*
 	 * We drop all the tables in one command, so that whether there are
@@ -3497,7 +4225,7 @@ initCreateTables(PGconn *con)
 	};
 	int			i;
 
-	fprintf(stderr, "creating tables...\n");
+	elog(NULL, ELEVEL_MAIN, "creating tables...\n");
 
 	for (i = 0; i < lengthof(DDLs); i++)
 	{
@@ -3550,7 +4278,7 @@ initGenerateData(PGconn *con)
 				remaining_sec;
 	int			log_interval = 1;
 
-	fprintf(stderr, "generating data...\n");
+	elog(NULL, ELEVEL_MAIN, "generating data...\n");
 
 	/*
 	 * we do all of this in one transaction to enable the backend's
@@ -3596,7 +4324,7 @@ initGenerateData(PGconn *con)
 	res = PQexec(con, "copy pgbench_accounts from stdin");
 	if (PQresultStatus(res) != PGRES_COPY_IN)
 	{
-		fprintf(stderr, "%s", PQerrorMessage(con));
+		elog(NULL, ELEVEL_MAIN, "%s", PQerrorMessage(con));
 		exit(1);
 	}
 	PQclear(res);
@@ -3613,7 +4341,7 @@ initGenerateData(PGconn *con)
 				 j, k / naccounts + 1, 0);
 		if (PQputline(con, sql))
 		{
-			fprintf(stderr, "PQputline failed\n");
+			elog(NULL, ELEVEL_MAIN, "PQputline failed\n");
 			exit(1);
 		}
 
@@ -3629,10 +4357,11 @@ initGenerateData(PGconn *con)
 			elapsed_sec = INSTR_TIME_GET_DOUBLE(diff);
 			remaining_sec = ((double) scale * naccounts - j) * elapsed_sec / j;
 
-			fprintf(stderr, INT64_FORMAT " of " INT64_FORMAT " tuples (%d%%) done (elapsed %.2f s, remaining %.2f s)\n",
-					j, (int64) naccounts * scale,
-					(int) (((int64) j * 100) / (naccounts * (int64) scale)),
-					elapsed_sec, remaining_sec);
+			elog(NULL, ELEVEL_MAIN,
+				 INT64_FORMAT " of " INT64_FORMAT " tuples (%d%%) done (elapsed %.2f s, remaining %.2f s)\n",
+				 j, (int64) naccounts * scale,
+				 (int) (((int64) j * 100) / (naccounts * (int64) scale)),
+				 elapsed_sec, remaining_sec);
 		}
 		/* let's not call the timing for each row, but only each 100 rows */
 		else if (use_quiet && (j % 100 == 0))
@@ -3646,9 +4375,10 @@ initGenerateData(PGconn *con)
 			/* have we reached the next interval (or end)? */
 			if ((j == scale * naccounts) || (elapsed_sec >= log_interval * LOG_STEP_SECONDS))
 			{
-				fprintf(stderr, INT64_FORMAT " of " INT64_FORMAT " tuples (%d%%) done (elapsed %.2f s, remaining %.2f s)\n",
-						j, (int64) naccounts * scale,
-						(int) (((int64) j * 100) / (naccounts * (int64) scale)), elapsed_sec, remaining_sec);
+				elog(NULL, ELEVEL_MAIN,
+					 INT64_FORMAT " of " INT64_FORMAT " tuples (%d%%) done (elapsed %.2f s, remaining %.2f s)\n",
+					 j, (int64) naccounts * scale,
+					 (int) (((int64) j * 100) / (naccounts * (int64) scale)), elapsed_sec, remaining_sec);
 
 				/* skip to the next interval */
 				log_interval = (int) ceil(elapsed_sec / LOG_STEP_SECONDS);
@@ -3658,12 +4388,12 @@ initGenerateData(PGconn *con)
 	}
 	if (PQputline(con, "\\.\n"))
 	{
-		fprintf(stderr, "very last PQputline failed\n");
+		elog(NULL, ELEVEL_MAIN, "very last PQputline failed\n");
 		exit(1);
 	}
 	if (PQendcopy(con))
 	{
-		fprintf(stderr, "PQendcopy failed\n");
+		elog(NULL, ELEVEL_MAIN, "PQendcopy failed\n");
 		exit(1);
 	}
 
@@ -3676,7 +4406,7 @@ initGenerateData(PGconn *con)
 static void
 initVacuum(PGconn *con)
 {
-	fprintf(stderr, "vacuuming...\n");
+	elog(NULL, ELEVEL_MAIN, "vacuuming...\n");
 	executeStatement(con, "vacuum analyze pgbench_branches");
 	executeStatement(con, "vacuum analyze pgbench_tellers");
 	executeStatement(con, "vacuum analyze pgbench_accounts");
@@ -3696,7 +4426,7 @@ initCreatePKeys(PGconn *con)
 	};
 	int			i;
 
-	fprintf(stderr, "creating primary keys...\n");
+	elog(NULL, ELEVEL_MAIN, "creating primary keys...\n");
 	for (i = 0; i < lengthof(DDLINDEXes); i++)
 	{
 		char		buffer[256];
@@ -3733,7 +4463,7 @@ initCreateFKeys(PGconn *con)
 	};
 	int			i;
 
-	fprintf(stderr, "creating foreign keys...\n");
+	elog(NULL, ELEVEL_MAIN, "creating foreign keys...\n");
 	for (i = 0; i < lengthof(DDLKEYs); i++)
 	{
 		executeStatement(con, DDLKEYs[i]);
@@ -3754,7 +4484,7 @@ checkInitSteps(const char *initialize_steps)
 
 	if (initialize_steps[0] == '\0')
 	{
-		fprintf(stderr, "no initialization steps specified\n");
+		elog(NULL, ELEVEL_MAIN, "no initialization steps specified\n");
 		exit(1);
 	}
 
@@ -3762,9 +4492,13 @@ checkInitSteps(const char *initialize_steps)
 	{
 		if (strchr("dtgvpf ", *step) == NULL)
 		{
-			fprintf(stderr, "unrecognized initialization step \"%c\"\n",
-					*step);
-			fprintf(stderr, "allowed steps are: \"d\", \"t\", \"g\", \"v\", \"p\", \"f\"\n");
+			if (errstart(NULL, ELEVEL_MAIN))
+			{
+				errmsg(NULL, "unrecognized initialization step \"%c\"\n",
+					   *step);
+				errmsg(NULL, "allowed steps are: \"d\", \"t\", \"g\", \"v\", \"p\", \"f\"\n");
+				errfinish(NULL);
+			}
 			exit(1);
 		}
 	}
@@ -3779,7 +4513,7 @@ runInitSteps(const char *initialize_steps)
 	PGconn	   *con;
 	const char *step;
 
-	if ((con = doConnect()) == NULL)
+	if ((con = doConnect(NULL)) == NULL)
 		exit(1);
 
 	for (step = initialize_steps; *step != '\0'; step++)
@@ -3807,14 +4541,14 @@ runInitSteps(const char *initialize_steps)
 			case ' ':
 				break;			/* ignore */
 			default:
-				fprintf(stderr, "unrecognized initialization step \"%c\"\n",
-						*step);
+				elog(NULL, ELEVEL_MAIN,
+					 "unrecognized initialization step \"%c\"\n", *step);
 				PQfinish(con);
 				exit(1);
 		}
 	}
 
-	fprintf(stderr, "done.\n");
+	elog(NULL, ELEVEL_MAIN, "done.\n");
 	PQfinish(con);
 }
 
@@ -3852,8 +4586,9 @@ parseQuery(Command *cmd)
 
 		if (cmd->argc >= MAX_ARGS)
 		{
-			fprintf(stderr, "statement has too many arguments (maximum is %d): %s\n",
-					MAX_ARGS - 1, cmd->argv[0]);
+			elog(NULL, ELEVEL_MAIN,
+				 "statement has too many arguments (maximum is %d): %s\n",
+				 MAX_ARGS - 1, cmd->argv[0]);
 			pg_free(name);
 			return false;
 		}
@@ -3879,9 +4614,14 @@ pgbench_error(const char *fmt,...)
 	va_list		ap;
 
 	fflush(stdout);
-	va_start(ap, fmt);
-	vfprintf(stderr, _(fmt), ap);
-	va_end(ap);
+	if (errstart(NULL, ELEVEL_MAIN))
+	{
+		va_start(ap, fmt);
+		errmsg_internal(NULL, fmt, &ap);
+		va_end(ap);
+
+		errfinish(NULL);
+	}
 }
 
 /*
@@ -3901,25 +4641,29 @@ syntax_error(const char *source, int lineno,
 			 const char *line, const char *command,
 			 const char *msg, const char *more, int column)
 {
-	fprintf(stderr, "%s:%d: %s", source, lineno, msg);
-	if (more != NULL)
-		fprintf(stderr, " (%s)", more);
-	if (column >= 0 && line == NULL)
-		fprintf(stderr, " at column %d", column + 1);
-	if (command != NULL)
-		fprintf(stderr, " in command \"%s\"", command);
-	fprintf(stderr, "\n");
-	if (line != NULL)
-	{
-		fprintf(stderr, "%s\n", line);
-		if (column >= 0)
+	if (errstart(NULL, ELEVEL_MAIN))
+	{
+		errmsg(NULL, "%s:%d: %s", source, lineno, msg);
+		if (more != NULL)
+			errmsg(NULL, " (%s)", more);
+		if (column >= 0 && line == NULL)
+			errmsg(NULL, " at column %d", column + 1);
+		if (command != NULL)
+			errmsg(NULL, " in command \"%s\"", command);
+		errmsg(NULL, "\n");
+		if (line != NULL)
 		{
-			int			i;
+			errmsg(NULL, "%s\n", line);
+			if (column >= 0)
+			{
+				int			i;
 
-			for (i = 0; i < column; i++)
-				fprintf(stderr, " ");
-			fprintf(stderr, "^ error found here\n");
+				for (i = 0; i < column; i++)
+					errmsg(NULL, " ");
+				errmsg(NULL, "^ error found here\n");
+			}
 		}
+		errfinish(NULL);
 	}
 	exit(1);
 }
@@ -4170,9 +4914,8 @@ process_backslash_command(PsqlScanState sstate, const char *source)
 static void
 ConditionError(const char *desc, int cmdn, const char *msg)
 {
-	fprintf(stderr,
-			"condition error in script \"%s\" command %d: %s\n",
-			desc, cmdn, msg);
+	elog(NULL, ELEVEL_MAIN,
+		 "condition error in script \"%s\" command %d: %s\n", desc, cmdn, msg);
 	exit(1);
 }
 
@@ -4370,8 +5113,8 @@ process_file(const char *filename, int weight)
 		fd = stdin;
 	else if ((fd = fopen(filename, "r")) == NULL)
 	{
-		fprintf(stderr, "could not open file \"%s\": %s\n",
-				filename, strerror(errno));
+		elog(NULL, ELEVEL_MAIN,
+			 "could not open file \"%s\": %s\n", filename, strerror(errno));
 		exit(1);
 	}
 
@@ -4379,8 +5122,8 @@ process_file(const char *filename, int weight)
 
 	if (ferror(fd))
 	{
-		fprintf(stderr, "could not read file \"%s\": %s\n",
-				filename, strerror(errno));
+		elog(NULL, ELEVEL_MAIN,
+			 "could not read file \"%s\": %s\n", filename, strerror(errno));
 		exit(1);
 	}
 
@@ -4405,10 +5148,14 @@ listAvailableScripts(void)
 {
 	int			i;
 
-	fprintf(stderr, "Available builtin scripts:\n");
-	for (i = 0; i < lengthof(builtin_script); i++)
-		fprintf(stderr, "\t%s\n", builtin_script[i].name);
-	fprintf(stderr, "\n");
+	if (errstart(NULL, ELEVEL_MAIN))
+	{
+		errmsg(NULL, "Available builtin scripts:\n");
+		for (i = 0; i < lengthof(builtin_script); i++)
+			errmsg(NULL, "\t%s\n", builtin_script[i].name);
+		errmsg(NULL, "\n");
+		errfinish(NULL);
+	}
 }
 
 /* return builtin script "name" if unambiguous, fails if not found */
@@ -4435,10 +5182,16 @@ findBuiltin(const char *name)
 
 	/* error cases */
 	if (found == 0)
-		fprintf(stderr, "no builtin script found for name \"%s\"\n", name);
-	else						/* found > 1 */
-		fprintf(stderr,
-				"ambiguous builtin name: %d builtin scripts found for prefix \"%s\"\n", found, name);
+	{
+		elog(NULL, ELEVEL_MAIN,
+			 "no builtin script found for name \"%s\"\n", name);
+	}
+	else
+	{						/* found > 1 */
+		elog(NULL, ELEVEL_MAIN,
+			 "ambiguous builtin name: %d builtin scripts found for prefix \"%s\"\n",
+			 found, name);
+	}
 
 	listAvailableScripts();
 	exit(1);
@@ -4471,14 +5224,14 @@ parseScriptWeight(const char *option, char **script)
 		wtmp = strtol(sep + 1, &badp, 10);
 		if (errno != 0 || badp == sep + 1 || *badp != '\0')
 		{
-			fprintf(stderr, "invalid weight specification: %s\n", sep);
+			elog(NULL, ELEVEL_MAIN, "invalid weight specification: %s\n", sep);
 			exit(1);
 		}
 		if (wtmp > INT_MAX || wtmp < 0)
 		{
-			fprintf(stderr,
-					"weight specification out of range (0 .. %u): " INT64_FORMAT "\n",
-					INT_MAX, (int64) wtmp);
+			elog(NULL, ELEVEL_MAIN,
+				 "weight specification out of range (0 .. %u): " INT64_FORMAT "\n",
+				 INT_MAX, (int64) wtmp);
 			exit(1);
 		}
 		weight = wtmp;
@@ -4498,13 +5251,15 @@ addScript(ParsedScript script)
 {
 	if (script.commands == NULL || script.commands[0] == NULL)
 	{
-		fprintf(stderr, "empty command list for script \"%s\"\n", script.desc);
+		elog(NULL, ELEVEL_MAIN,
+			 "empty command list for script \"%s\"\n", script.desc);
 		exit(1);
 	}
 
 	if (num_scripts >= MAX_SCRIPTS)
 	{
-		fprintf(stderr, "at most %d SQL scripts are allowed\n", MAX_SCRIPTS);
+		elog(NULL, ELEVEL_MAIN,
+			 "at most %d SQL scripts are allowed\n", MAX_SCRIPTS);
 		exit(1);
 	}
 
@@ -4535,7 +5290,8 @@ printResults(TState *threads, StatsData *total, instr_time total_time,
 	double		time_include,
 				tps_include,
 				tps_exclude;
-	int64		ntx = total->cnt - total->skipped;
+	int64		ntx = total->cnt - total->skipped,
+				total_ntx = total->cnt + total->errors;
 	int			i,
 				totalCacheOverflows = 0;
 
@@ -4556,8 +5312,8 @@ printResults(TState *threads, StatsData *total, instr_time total_time,
 	if (duration <= 0)
 	{
 		printf("number of transactions per client: %d\n", nxacts);
-		printf("number of transactions actually processed: " INT64_FORMAT "/%d\n",
-			   ntx, nxacts * nclients);
+		printf("number of transactions actually processed: " INT64_FORMAT "/" INT64_FORMAT "\n",
+			   ntx, total_ntx);
 	}
 	else
 	{
@@ -4565,6 +5321,43 @@ printResults(TState *threads, StatsData *total, instr_time total_time,
 		printf("number of transactions actually processed: " INT64_FORMAT "\n",
 			   ntx);
 	}
+
+	if (total->errors > 0)
+		printf("number of errors: " INT64_FORMAT " (%.3f%%)\n",
+			   total->errors, 100.0 * total->errors / total_ntx);
+
+	if (total->errors_in_failed_tx > 0)
+		printf("number of errors \"in failed SQL transaction\": " INT64_FORMAT " (%.3f%%)\n",
+			   total->errors_in_failed_tx,
+			   100.0 * total->errors_in_failed_tx / total_ntx);
+
+	/*
+	 * It can be non-zero only if max_tries is greater than one or
+	 * latency_limit is used.
+	 */
+	if (total->retried > 0)
+	{
+		printf("number of retried: " INT64_FORMAT " (%.3f%%)\n",
+			   total->retried, 100.0 * total->retried / total_ntx);
+		printf("number of retries: " INT64_FORMAT "\n", total->retries);
+	}
+
+	if (max_tries)
+		printf("maximum number of tries: %d\n", max_tries);
+
+	if (latency_limit)
+	{
+		printf("number of transactions above the %.1f ms latency limit: " INT64_FORMAT "/" INT64_FORMAT " (%.3f %%)",
+			   latency_limit / 1000.0, latency_late, total_ntx,
+			   (total_ntx > 0) ? 100.0 * latency_late / total_ntx : 0.0);
+
+		/* this statistics includes both successful and failed transactions */
+		if (total->errors > 0)
+			printf(" (including errors)");
+
+		printf("\n");
+	}
+
 	/* Report zipfian cache overflow */
 	for (i = 0; i < nthreads; i++)
 	{
@@ -4584,18 +5377,19 @@ printResults(TState *threads, StatsData *total, instr_time total_time,
 			   total->skipped,
 			   100.0 * total->skipped / total->cnt);
 
-	if (latency_limit)
-		printf("number of transactions above the %.1f ms latency limit: " INT64_FORMAT "/" INT64_FORMAT " (%.3f %%)\n",
-			   latency_limit / 1000.0, latency_late, ntx,
-			   (ntx > 0) ? 100.0 * latency_late / ntx : 0.0);
-
 	if (throttle_delay || progress || latency_limit)
 		printSimpleStats("latency", &total->latency);
 	else
 	{
 		/* no measurement, show average latency computed from run time */
-		printf("latency average = %.3f ms\n",
-			   1000.0 * time_include * nclients / total->cnt);
+		printf("latency average = %.3f ms",
+			   1000.0 * time_include * nclients / total_ntx);
+
+		/* this statistics includes both successful and failed transactions */
+		if (total->errors > 0)
+			printf(" (including errors)");
+
+		printf("\n");
 	}
 
 	if (throttle_delay)
@@ -4614,7 +5408,7 @@ printResults(TState *threads, StatsData *total, instr_time total_time,
 	printf("tps = %f (excluding connections establishing)\n", tps_exclude);
 
 	/* Report per-script/command statistics */
-	if (per_script_stats || is_latencies)
+	if (per_script_stats || report_per_command)
 	{
 		int			i;
 
@@ -4623,6 +5417,7 @@ printResults(TState *threads, StatsData *total, instr_time total_time,
 			if (per_script_stats)
 			{
 				StatsData  *sstats = &sql_script[i].stats;
+				int64		script_total_ntx = sstats->cnt + sstats->errors;
 
 				printf("SQL script %d: %s\n"
 					   " - weight: %d (targets %.1f%% of total)\n"
@@ -4631,9 +5426,33 @@ printResults(TState *threads, StatsData *total, instr_time total_time,
 					   sql_script[i].weight,
 					   100.0 * sql_script[i].weight / total_weight,
 					   sstats->cnt,
-					   100.0 * sstats->cnt / total->cnt,
+					   100.0 * sstats->cnt / script_total_ntx,
 					   (sstats->cnt - sstats->skipped) / time_include);
 
+				if (total->errors > 0)
+					printf(" - number of errors: " INT64_FORMAT " (%.3f%%)\n",
+						   sstats->errors,
+						   100.0 * sstats->errors / script_total_ntx);
+
+				if (total->errors_in_failed_tx > 0)
+					printf(" - number of errors \"in failed SQL transaction\": " INT64_FORMAT " (%.3f%%)\n",
+						   sstats->errors_in_failed_tx,
+						   (100.0 * sstats->errors_in_failed_tx /
+							script_total_ntx));
+
+				/*
+				 * It can be non-zero only if max_tries is greater than one or
+				 * latency_limit is used.
+				 */
+				if (total->retried > 0)
+				{
+					printf(" - number of retried: " INT64_FORMAT " (%.3f%%)\n",
+						   sstats->retried,
+						   100.0 * sstats->retried / script_total_ntx);
+					printf(" - number of retries: " INT64_FORMAT "\n",
+						   sstats->retries);
+				}
+
 				if (throttle_delay && latency_limit && sstats->cnt > 0)
 					printf(" - number of transactions skipped: " INT64_FORMAT " (%.3f%%)\n",
 						   sstats->skipped,
@@ -4642,15 +5461,33 @@ printResults(TState *threads, StatsData *total, instr_time total_time,
 				printSimpleStats(" - latency", &sstats->latency);
 			}
 
-			/* Report per-command latencies */
-			if (is_latencies)
+			/* Report per-command latencies and errors */
+			if (report_per_command)
 			{
 				Command   **commands;
 
 				if (per_script_stats)
-					printf(" - statement latencies in milliseconds:\n");
+					printf(" - statement latencies in milliseconds");
 				else
-					printf("statement latencies in milliseconds:\n");
+					printf("statement latencies in milliseconds");
+
+				if (total->errors > 0)
+				{
+					printf("%s errors",
+						   ((total->errors_in_failed_tx == 0 &&
+							total->retried == 0) ?
+							" and" : ","));
+				}
+				if (total->errors_in_failed_tx > 0)
+				{
+					printf("%s errors \"in failed SQL transaction\"",
+						   total->retried == 0 ? " and" : ",");
+				}
+				if (total->retried > 0)
+				{
+					printf(" and retries");
+				}
+				printf(":\n");
 
 				for (commands = sql_script[i].commands;
 					 *commands != NULL;
@@ -4658,10 +5495,25 @@ printResults(TState *threads, StatsData *total, instr_time total_time,
 				{
 					SimpleStats *cstats = &(*commands)->stats;
 
-					printf("   %11.3f  %s\n",
+					printf("   %11.3f",
 						   (cstats->count > 0) ?
-						   1000.0 * cstats->sum / cstats->count : 0.0,
-						   (*commands)->line);
+						   1000.0 * cstats->sum / cstats->count : 0.0);
+					if (total->errors > 0)
+					{
+						printf("  %20" INT64_MODIFIER "d",
+							   (*commands)->errors);
+					}
+					if (total->errors_in_failed_tx > 0)
+					{
+						printf("  %20" INT64_MODIFIER "d",
+							   (*commands)->errors_in_failed_tx);
+					}
+					if (total->retried > 0)
+					{
+						printf("  %20" INT64_MODIFIER "d",
+							   (*commands)->retries);
+					}
+					printf("  %s\n", (*commands)->line);
 				}
 			}
 		}
@@ -4689,9 +5541,9 @@ set_random_seed(const char *seed)
 		if (!pg_strong_random(&iseed, sizeof(iseed)))
 #endif
 		{
-			fprintf(stderr,
-					"cannot seed random from a strong source, none available: "
-					"use \"time\" or an unsigned integer value.\n");
+			elog(NULL, ELEVEL_MAIN,
+				 "cannot seed random from a strong source, none available: "
+				 "use \"time\" or an unsigned integer value.\n");
 			return false;
 		}
 	}
@@ -4701,21 +5553,32 @@ set_random_seed(const char *seed)
 		char garbage;
 		if (sscanf(seed, "%u%c", &iseed, &garbage) != 1)
 		{
-			fprintf(stderr,
-					"unrecognized random seed option \"%s\": expecting an unsigned integer, \"time\" or \"rand\"\n",
-					seed);
+			elog(NULL, ELEVEL_MAIN,
+				 "unrecognized random seed option \"%s\": expecting an unsigned integer, \"time\" or \"rand\"\n",
+				 seed);
 			return false;
 		}
 	}
 
 	if (seed != NULL)
-		fprintf(stderr, "setting random seed to %u\n", iseed);
+		elog(NULL, ELEVEL_MAIN, "setting random seed to %u\n", iseed);
 	srandom(iseed);
 	/* no precision loss: 32 bit unsigned int cast to 64 bit int */
 	random_seed = iseed;
 	return true;
 }
 
+/*
+ * Initialize the random state of the client/thread.
+ */
+static void
+initRandomState(RandomState *random_state)
+{
+	random_state->data[0] = random();
+	random_state->data[1] = random();
+	random_state->data[2] = random();
+}
+
 
 int
 main(int argc, char **argv)
@@ -4725,7 +5588,7 @@ main(int argc, char **argv)
 		{"builtin", required_argument, NULL, 'b'},
 		{"client", required_argument, NULL, 'c'},
 		{"connect", no_argument, NULL, 'C'},
-		{"debug", no_argument, NULL, 'd'},
+		{"debug", required_argument, NULL, 'd'},
 		{"define", required_argument, NULL, 'D'},
 		{"file", required_argument, NULL, 'f'},
 		{"fillfactor", required_argument, NULL, 'F'},
@@ -4740,7 +5603,7 @@ main(int argc, char **argv)
 		{"progress", required_argument, NULL, 'P'},
 		{"protocol", required_argument, NULL, 'M'},
 		{"quiet", no_argument, NULL, 'q'},
-		{"report-latencies", no_argument, NULL, 'r'},
+		{"report-per-command", no_argument, NULL, 'r'},
 		{"rate", required_argument, NULL, 'R'},
 		{"scale", required_argument, NULL, 's'},
 		{"select-only", no_argument, NULL, 'S'},
@@ -4759,6 +5622,7 @@ main(int argc, char **argv)
 		{"log-prefix", required_argument, NULL, 7},
 		{"foreign-keys", no_argument, NULL, 8},
 		{"random-seed", required_argument, NULL, 9},
+		{"max-tries", required_argument, NULL, 10},
 		{NULL, 0, NULL, 0}
 	};
 
@@ -4827,14 +5691,21 @@ main(int argc, char **argv)
 	state = (CState *) pg_malloc(sizeof(CState));
 	memset(state, 0, sizeof(CState));
 
+	/*
+	 * Set the main error state early, because it may be used while setting
+	 * parameters from environment variables or from the command line.
+	 */
+	memset(&main_error_state, 0, sizeof(ErrorState));
+
 	/* set random seed early, because it may be used while parsing scripts. */
 	if (!set_random_seed(getenv("PGBENCH_RANDOM_SEED")))
 	{
-		fprintf(stderr, "error while setting random seed from PGBENCH_RANDOM_SEED environment variable\n");
+		elog(NULL, ELEVEL_MAIN,
+			 "error while setting random seed from PGBENCH_RANDOM_SEED environment variable\n");
 		exit(1);
 	}
 
-	while ((c = getopt_long(argc, argv, "iI:h:nvp:dqb:SNc:j:Crs:t:T:U:lf:D:F:M:P:R:L:", long_options, &optindex)) != -1)
+	while ((c = getopt_long(argc, argv, "iI:h:nvp:d:qb:SNc:j:Crs:t:T:U:lf:D:F:M:P:R:L:", long_options, &optindex)) != -1)
 	{
 		char	   *script;
 
@@ -4864,15 +5735,29 @@ main(int argc, char **argv)
 				pgport = pg_strdup(optarg);
 				break;
 			case 'd':
-				debug++;
-				break;
+				{
+					for (debug_level = 0;
+						 debug_level < NUM_DEBUGLEVEL;
+						 debug_level++)
+					{
+						if (strcmp(optarg, DEBUGLEVEL[debug_level]) == 0)
+							break;
+					}
+					if (debug_level >= NUM_DEBUGLEVEL)
+					{
+						elog(NULL, ELEVEL_MAIN,
+							 "invalid debug level (-d): \"%s\"\n", optarg);
+						exit(1);
+					}
+					break;
+				}
 			case 'c':
 				benchmarking_option_set = true;
 				nclients = atoi(optarg);
 				if (nclients <= 0 || nclients > MAXCLIENTS)
 				{
-					fprintf(stderr, "invalid number of clients: \"%s\"\n",
-							optarg);
+					elog(NULL, ELEVEL_MAIN,
+						 "invalid number of clients: \"%s\"\n", optarg);
 					exit(1);
 				}
 #ifdef HAVE_GETRLIMIT
@@ -4882,14 +5767,19 @@ main(int argc, char **argv)
 				if (getrlimit(RLIMIT_OFILE, &rlim) == -1)
 #endif							/* RLIMIT_NOFILE */
 				{
-					fprintf(stderr, "getrlimit failed: %s\n", strerror(errno));
+					elog(NULL, ELEVEL_MAIN,
+						 "getrlimit failed: %s\n", strerror(errno));
 					exit(1);
 				}
 				if (rlim.rlim_cur < nclients + 3)
 				{
-					fprintf(stderr, "need at least %d open files, but system limit is %ld\n",
-							nclients + 3, (long) rlim.rlim_cur);
-					fprintf(stderr, "Reduce number of clients, or use limit/ulimit to increase the system limit.\n");
+					if (errstart(NULL, ELEVEL_MAIN))
+					{
+						errmsg(NULL, "need at least %d open files, but system limit is %ld\n",
+							   nclients + 3, (long) rlim.rlim_cur);
+						errmsg(NULL, "Reduce number of clients, or use limit/ulimit to increase the system limit.\n");
+						errfinish(NULL);
+					}
 					exit(1);
 				}
 #endif							/* HAVE_GETRLIMIT */
@@ -4899,14 +5789,15 @@ main(int argc, char **argv)
 				nthreads = atoi(optarg);
 				if (nthreads <= 0)
 				{
-					fprintf(stderr, "invalid number of threads: \"%s\"\n",
-							optarg);
+					elog(NULL, ELEVEL_MAIN,
+						 "invalid number of threads: \"%s\"\n", optarg);
 					exit(1);
 				}
 #ifndef ENABLE_THREAD_SAFETY
 				if (nthreads != 1)
 				{
-					fprintf(stderr, "threads are not supported on this platform; use -j1\n");
+					elog(NULL, ELEVEL_MAIN,
+						 "threads are not supported on this platform; use -j1\n");
 					exit(1);
 				}
 #endif							/* !ENABLE_THREAD_SAFETY */
@@ -4917,14 +5808,15 @@ main(int argc, char **argv)
 				break;
 			case 'r':
 				benchmarking_option_set = true;
-				is_latencies = true;
+				report_per_command = true;
 				break;
 			case 's':
 				scale_given = true;
 				scale = atoi(optarg);
 				if (scale <= 0)
 				{
-					fprintf(stderr, "invalid scaling factor: \"%s\"\n", optarg);
+					elog(NULL, ELEVEL_MAIN,
+						 "invalid scaling factor: \"%s\"\n", optarg);
 					exit(1);
 				}
 				break;
@@ -4933,8 +5825,8 @@ main(int argc, char **argv)
 				nxacts = atoi(optarg);
 				if (nxacts <= 0)
 				{
-					fprintf(stderr, "invalid number of transactions: \"%s\"\n",
-							optarg);
+					elog(NULL, ELEVEL_MAIN,
+						 "invalid number of transactions: \"%s\"\n", optarg);
 					exit(1);
 				}
 				break;
@@ -4943,7 +5835,8 @@ main(int argc, char **argv)
 				duration = atoi(optarg);
 				if (duration <= 0)
 				{
-					fprintf(stderr, "invalid duration: \"%s\"\n", optarg);
+					elog(NULL, ELEVEL_MAIN,
+						 "invalid duration: \"%s\"\n", optarg);
 					exit(1);
 				}
 				break;
@@ -4992,13 +5885,13 @@ main(int argc, char **argv)
 
 					if ((p = strchr(optarg, '=')) == NULL || p == optarg || *(p + 1) == '\0')
 					{
-						fprintf(stderr, "invalid variable definition: \"%s\"\n",
-								optarg);
+						elog(NULL, ELEVEL_MAIN,
+							 "invalid variable definition: \"%s\"\n", optarg);
 						exit(1);
 					}
 
 					*p++ = '\0';
-					if (!putVariable(&state[0], "option", optarg, p))
+					if (!putVariable(&state[0].variables, "option", optarg, p))
 						exit(1);
 				}
 				break;
@@ -5007,7 +5900,8 @@ main(int argc, char **argv)
 				fillfactor = atoi(optarg);
 				if (fillfactor < 10 || fillfactor > 100)
 				{
-					fprintf(stderr, "invalid fillfactor: \"%s\"\n", optarg);
+					elog(NULL, ELEVEL_MAIN,
+						 "invalid fillfactor: \"%s\"\n", optarg);
 					exit(1);
 				}
 				break;
@@ -5018,8 +5912,8 @@ main(int argc, char **argv)
 						break;
 				if (querymode >= NUM_QUERYMODE)
 				{
-					fprintf(stderr, "invalid query mode (-M): \"%s\"\n",
-							optarg);
+					elog(NULL, ELEVEL_MAIN,
+						 "invalid query mode (-M): \"%s\"\n", optarg);
 					exit(1);
 				}
 				break;
@@ -5028,8 +5922,8 @@ main(int argc, char **argv)
 				progress = atoi(optarg);
 				if (progress <= 0)
 				{
-					fprintf(stderr, "invalid thread progress delay: \"%s\"\n",
-							optarg);
+					elog(NULL, ELEVEL_MAIN,
+						 "invalid thread progress delay: \"%s\"\n", optarg);
 					exit(1);
 				}
 				break;
@@ -5042,7 +5936,8 @@ main(int argc, char **argv)
 
 					if (throttle_value <= 0.0)
 					{
-						fprintf(stderr, "invalid rate limit: \"%s\"\n", optarg);
+						elog(NULL, ELEVEL_MAIN,
+							 "invalid rate limit: \"%s\"\n", optarg);
 						exit(1);
 					}
 					/* Invert rate limit into a time offset */
@@ -5055,8 +5950,8 @@ main(int argc, char **argv)
 
 					if (limit_ms <= 0.0)
 					{
-						fprintf(stderr, "invalid latency limit: \"%s\"\n",
-								optarg);
+						elog(NULL, ELEVEL_MAIN,
+							 "invalid latency limit: \"%s\"\n", optarg);
 						exit(1);
 					}
 					benchmarking_option_set = true;
@@ -5080,7 +5975,8 @@ main(int argc, char **argv)
 				sample_rate = atof(optarg);
 				if (sample_rate <= 0.0 || sample_rate > 1.0)
 				{
-					fprintf(stderr, "invalid sampling rate: \"%s\"\n", optarg);
+					elog(NULL, ELEVEL_MAIN,
+						 "invalid sampling rate: \"%s\"\n", optarg);
 					exit(1);
 				}
 				break;
@@ -5089,8 +5985,9 @@ main(int argc, char **argv)
 				agg_interval = atoi(optarg);
 				if (agg_interval <= 0)
 				{
-					fprintf(stderr, "invalid number of seconds for aggregation: \"%s\"\n",
-							optarg);
+					elog(NULL, ELEVEL_MAIN,
+						 "invalid number of seconds for aggregation: \"%s\"\n",
+						 optarg);
 					exit(1);
 				}
 				break;
@@ -5110,12 +6007,28 @@ main(int argc, char **argv)
 				benchmarking_option_set = true;
 				if (!set_random_seed(optarg))
 				{
-					fprintf(stderr, "error while setting random seed from --random-seed option\n");
+					elog(NULL, ELEVEL_MAIN,
+						 "error while setting random seed from --random-seed option\n");
 					exit(1);
 				}
 				break;
+			case 10:			/* max-tries */
+				{
+					int32		max_tries_arg = atoi(optarg);
+
+					if (max_tries_arg <= 0)
+					{
+						elog(NULL, ELEVEL_MAIN,
+							 "invalid number of maximum tries: \"%s\"\n", optarg);
+						exit(1);
+					}
+					benchmarking_option_set = true;
+					max_tries = (uint32) max_tries_arg;
+				}
+				break;
 			default:
-				fprintf(stderr, _("Try \"%s --help\" for more information.\n"), progname);
+				elog(NULL, ELEVEL_MAIN,
+					 _("Try \"%s --help\" for more information.\n"), progname);
 				exit(1);
 				break;
 		}
@@ -5154,7 +6067,7 @@ main(int argc, char **argv)
 
 	if (total_weight == 0 && !is_init_mode)
 	{
-		fprintf(stderr, "total script weight must not be zero\n");
+		elog(NULL, ELEVEL_MAIN, "total script weight must not be zero\n");
 		exit(1);
 	}
 
@@ -5189,7 +6102,8 @@ main(int argc, char **argv)
 	{
 		if (benchmarking_option_set)
 		{
-			fprintf(stderr, "some of the specified options cannot be used in initialization (-i) mode\n");
+			elog(NULL, ELEVEL_MAIN,
+				 "some of the specified options cannot be used in initialization (-i) mode\n");
 			exit(1);
 		}
 
@@ -5224,14 +6138,16 @@ main(int argc, char **argv)
 	{
 		if (initialization_option_set)
 		{
-			fprintf(stderr, "some of the specified options cannot be used in benchmarking mode\n");
+			elog(NULL, ELEVEL_MAIN,
+				 "some of the specified options cannot be used in benchmarking mode\n");
 			exit(1);
 		}
 	}
 
 	if (nxacts > 0 && duration > 0)
 	{
-		fprintf(stderr, "specify either a number of transactions (-t) or a duration (-T), not both\n");
+		elog(NULL, ELEVEL_MAIN,
+			 "specify either a number of transactions (-t) or a duration (-T), not both\n");
 		exit(1);
 	}
 
@@ -5242,47 +6158,60 @@ main(int argc, char **argv)
 	/* --sampling-rate may be used only with -l */
 	if (sample_rate > 0.0 && !use_log)
 	{
-		fprintf(stderr, "log sampling (--sampling-rate) is allowed only when logging transactions (-l)\n");
+		elog(NULL, ELEVEL_MAIN,
+			 "log sampling (--sampling-rate) is allowed only when logging transactions (-l)\n");
 		exit(1);
 	}
 
 	/* --sampling-rate may not be used with --aggregate-interval */
 	if (sample_rate > 0.0 && agg_interval > 0)
 	{
-		fprintf(stderr, "log sampling (--sampling-rate) and aggregation (--aggregate-interval) cannot be used at the same time\n");
+		elog(NULL, ELEVEL_MAIN,
+			 "log sampling (--sampling-rate) and aggregation (--aggregate-interval) cannot be used at the same time\n");
 		exit(1);
 	}
 
 	if (agg_interval > 0 && !use_log)
 	{
-		fprintf(stderr, "log aggregation is allowed only when actually logging transactions\n");
+		elog(NULL, ELEVEL_MAIN,
+			 "log aggregation is allowed only when actually logging transactions\n");
 		exit(1);
 	}
 
 	if (!use_log && logfile_prefix)
 	{
-		fprintf(stderr, "log file prefix (--log-prefix) is allowed only when logging transactions (-l)\n");
+		elog(NULL, ELEVEL_MAIN,
+			 "log file prefix (--log-prefix) is allowed only when logging transactions (-l)\n");
 		exit(1);
 	}
 
 	if (duration > 0 && agg_interval > duration)
 	{
-		fprintf(stderr, "number of seconds for aggregation (%d) must not be higher than test duration (%d)\n", agg_interval, duration);
+		elog(NULL, ELEVEL_MAIN,
+			 "number of seconds for aggregation (%d) must not be higher than test duration (%d)\n",
+			 agg_interval, duration);
 		exit(1);
 	}
 
 	if (duration > 0 && agg_interval > 0 && duration % agg_interval != 0)
 	{
-		fprintf(stderr, "duration (%d) must be a multiple of aggregation interval (%d)\n", duration, agg_interval);
+		elog(NULL, ELEVEL_MAIN,
+			 "duration (%d) must be a multiple of aggregation interval (%d)\n",
+			 duration, agg_interval);
 		exit(1);
 	}
 
 	if (progress_timestamp && progress == 0)
 	{
-		fprintf(stderr, "--progress-timestamp is allowed only under --progress\n");
+		elog(NULL, ELEVEL_MAIN,
+			 "--progress-timestamp is allowed only under --progress\n");
 		exit(1);
 	}
 
+	/* If necessary set the default tries limit  */
+	if (!max_tries && !latency_limit)
+		max_tries = 1;
+
 	/*
 	 * save main process id in the global variable because process id will be
 	 * changed after fork.
@@ -5300,19 +6229,19 @@ main(int argc, char **argv)
 			int			j;
 
 			state[i].id = i;
-			for (j = 0; j < state[0].nvariables; j++)
+			for (j = 0; j < state[0].variables.nvariables; j++)
 			{
-				Variable   *var = &state[0].variables[j];
+				Variable   *var = &state[0].variables.array[j];
 
 				if (var->value.type != PGBT_NO_VALUE)
 				{
-					if (!putVariableValue(&state[i], "startup",
-										   var->name, &var->value))
+					if (!putVariableValue(NULL, &state[i].variables, "startup",
+										  var->name, &var->value))
 						exit(1);
 				}
 				else
 				{
-					if (!putVariable(&state[i], "startup",
+					if (!putVariable(&state[i].variables, "startup",
 									 var->name, var->svalue))
 						exit(1);
 				}
@@ -5324,27 +6253,31 @@ main(int argc, char **argv)
 	for (i = 0; i < nclients; i++)
 	{
 		state[i].cstack = conditional_stack_create();
+		initRandomState(&state[i].random_state);
 	}
 
-	if (debug)
-	{
-		if (duration <= 0)
-			printf("pghost: %s pgport: %s nclients: %d nxacts: %d dbName: %s\n",
-				   pghost, pgport, nclients, nxacts, dbName);
-		else
-			printf("pghost: %s pgport: %s nclients: %d duration: %d dbName: %s\n",
-				   pghost, pgport, nclients, duration, dbName);
-	}
+	if (duration <= 0)
+		elog(NULL, ELEVEL_DEBUG,
+			 "pghost: %s pgport: %s nclients: %d nxacts: %d dbName: %s\n",
+			 pghost, pgport, nclients, nxacts, dbName);
+	else
+		elog(NULL, ELEVEL_DEBUG,
+			 "pghost: %s pgport: %s nclients: %d duration: %d dbName: %s\n",
+			 pghost, pgport, nclients, duration, dbName);
 
 	/* opening connection... */
-	con = doConnect();
+	con = doConnect(NULL);
 	if (con == NULL)
 		exit(1);
 
 	if (PQstatus(con) == CONNECTION_BAD)
 	{
-		fprintf(stderr, "connection to database \"%s\" failed\n", dbName);
-		fprintf(stderr, "%s", PQerrorMessage(con));
+		if (errstart(NULL, ELEVEL_MAIN))
+		{
+			errmsg(NULL, "connection to database \"%s\" failed\n", dbName);
+			errmsg(NULL, "%s", PQerrorMessage(con));
+			errfinish(NULL);
+		}
 		exit(1);
 	}
 
@@ -5359,10 +6292,15 @@ main(int argc, char **argv)
 		{
 			char	   *sqlState = PQresultErrorField(res, PG_DIAG_SQLSTATE);
 
-			fprintf(stderr, "%s", PQerrorMessage(con));
-			if (sqlState && strcmp(sqlState, ERRCODE_UNDEFINED_TABLE) == 0)
+			if (errstart(NULL, ELEVEL_MAIN))
 			{
-				fprintf(stderr, "Perhaps you need to do initialization (\"pgbench -i\") in database \"%s\"\n", PQdb(con));
+				errmsg(NULL, "%s", PQerrorMessage(con));
+				if (sqlState && strcmp(sqlState, ERRCODE_UNDEFINED_TABLE) == 0)
+				{
+					errmsg(NULL, "Perhaps you need to do initialization (\"pgbench -i\") in database \"%s\"\n",
+						   PQdb(con));
+				}
+				errfinish(NULL);
 			}
 
 			exit(1);
@@ -5370,28 +6308,30 @@ main(int argc, char **argv)
 		scale = atoi(PQgetvalue(res, 0, 0));
 		if (scale < 0)
 		{
-			fprintf(stderr, "invalid count(*) from pgbench_branches: \"%s\"\n",
-					PQgetvalue(res, 0, 0));
+			elog(NULL, ELEVEL_MAIN,
+				 "invalid count(*) from pgbench_branches: \"%s\"\n",
+				 PQgetvalue(res, 0, 0));
 			exit(1);
 		}
 		PQclear(res);
 
 		/* warn if we override user-given -s switch */
 		if (scale_given)
-			fprintf(stderr,
-					"scale option ignored, using count from pgbench_branches table (%d)\n",
-					scale);
+			elog(NULL, ELEVEL_MAIN,
+				 "scale option ignored, using count from pgbench_branches table (%d)\n",
+				 scale);
 	}
 
 	/*
 	 * :scale variables normally get -s or database scale, but don't override
 	 * an explicit -D switch
 	 */
-	if (lookupVariable(&state[0], "scale") == NULL)
+	if (lookupVariable(&state[0].variables, "scale") == NULL)
 	{
 		for (i = 0; i < nclients; i++)
 		{
-			if (!putVariableInt(&state[i], "startup", "scale", scale))
+			if (!putVariableInt(NULL, &state[i].variables, "startup", "scale",
+								scale))
 				exit(1);
 		}
 	}
@@ -5400,15 +6340,18 @@ main(int argc, char **argv)
 	 * Define a :client_id variable that is unique per connection. But don't
 	 * override an explicit -D switch.
 	 */
-	if (lookupVariable(&state[0], "client_id") == NULL)
+	if (lookupVariable(&state[0].variables, "client_id") == NULL)
 	{
 		for (i = 0; i < nclients; i++)
-			if (!putVariableInt(&state[i], "startup", "client_id", i))
+		{
+			if (!putVariableInt(NULL, &state[i].variables, "startup",
+								"client_id", i))
 				exit(1);
+		}
 	}
 
 	/* set default seed for hash functions */
-	if (lookupVariable(&state[0], "default_seed") == NULL)
+	if (lookupVariable(&state[0].variables, "default_seed") == NULL)
 	{
 		uint64	seed = ((uint64) (random() & 0xFFFF) << 48) |
 					   ((uint64) (random() & 0xFFFF) << 32) |
@@ -5416,31 +6359,33 @@ main(int argc, char **argv)
 					   (uint64) (random() & 0xFFFF);
 
 		for (i = 0; i < nclients; i++)
-			if (!putVariableInt(&state[i], "startup", "default_seed", (int64) seed))
+			if (!putVariableInt(NULL, &state[i].variables, "startup",
+								"default_seed", (int64) seed))
 				exit(1);
 	}
 
 	/* set random seed unless overwritten */
-	if (lookupVariable(&state[0], "random_seed") == NULL)
+	if (lookupVariable(&state[0].variables, "random_seed") == NULL)
 	{
 		for (i = 0; i < nclients; i++)
-			if (!putVariableInt(&state[i], "startup", "random_seed", random_seed))
+			if (!putVariableInt(NULL, &state[i].variables, "startup",
+								"random_seed", random_seed))
 				exit(1);
 	}
 
 	if (!is_no_vacuum)
 	{
-		fprintf(stderr, "starting vacuum...");
+		elog(NULL, ELEVEL_MAIN, "starting vacuum...");
 		tryExecuteStatement(con, "vacuum pgbench_branches");
 		tryExecuteStatement(con, "vacuum pgbench_tellers");
 		tryExecuteStatement(con, "truncate pgbench_history");
-		fprintf(stderr, "end.\n");
+		elog(NULL, ELEVEL_MAIN, "end.\n");
 
 		if (do_vacuum_accounts)
 		{
-			fprintf(stderr, "starting vacuum pgbench_accounts...");
+			elog(NULL, ELEVEL_MAIN, "starting vacuum pgbench_accounts...");
 			tryExecuteStatement(con, "vacuum analyze pgbench_accounts");
-			fprintf(stderr, "end.\n");
+			elog(NULL, ELEVEL_MAIN, "end.\n");
 		}
 	}
 	PQfinish(con);
@@ -5457,15 +6402,14 @@ main(int argc, char **argv)
 		thread->state = &state[nclients_dealt];
 		thread->nstate =
 			(nclients - nclients_dealt + nthreads - i - 1) / (nthreads - i);
-		thread->random_state[0] = random();
-		thread->random_state[1] = random();
-		thread->random_state[2] = random();
+		initRandomState(&thread->random_state);
 		thread->logfile = NULL; /* filled in later */
 		thread->latency_late = 0;
 		thread->zipf_cache.nb_cells = 0;
 		thread->zipf_cache.current = 0;
 		thread->zipf_cache.overflowCount = 0;
 		initStats(&thread->stats, 0);
+		memset(&(thread->error_state), 0, sizeof(ErrorState));
 
 		nclients_dealt += thread->nstate;
 	}
@@ -5500,7 +6444,8 @@ main(int argc, char **argv)
 
 			if (err != 0 || thread->thread == INVALID_THREAD)
 			{
-				fprintf(stderr, "could not create thread: %s\n", strerror(err));
+				elog(NULL, ELEVEL_MAIN,
+					 "could not create thread: %s\n", strerror(err));
 				exit(1);
 			}
 		}
@@ -5541,6 +6486,10 @@ main(int argc, char **argv)
 		mergeSimpleStats(&stats.lag, &thread->stats.lag);
 		stats.cnt += thread->stats.cnt;
 		stats.skipped += thread->stats.skipped;
+		stats.retries += thread->stats.retries;
+		stats.retried += thread->stats.retried;
+		stats.errors += thread->stats.errors;
+		stats.errors_in_failed_tx += thread->stats.errors_in_failed_tx;
 		latency_late += thread->latency_late;
 		INSTR_TIME_ADD(conn_total_time, thread->conn_time);
 	}
@@ -5610,8 +6559,9 @@ threadRun(void *arg)
 
 		if (thread->logfile == NULL)
 		{
-			fprintf(stderr, "could not open logfile \"%s\": %s\n",
-					logpath, strerror(errno));
+			elog(thread, ELEVEL_MAIN,
+				 "could not open logfile \"%s\": %s\n",
+				 logpath, strerror(errno));
 			goto done;
 		}
 	}
@@ -5621,7 +6571,7 @@ threadRun(void *arg)
 		/* make connections to the database */
 		for (i = 0; i < nstate; i++)
 		{
-			if ((state[i].con = doConnect()) == NULL)
+			if ((state[i].con = doConnect(NULL)) == NULL)
 				goto done;
 		}
 	}
@@ -5689,8 +6639,8 @@ threadRun(void *arg)
 
 				if (sock < 0)
 				{
-					fprintf(stderr, "invalid socket: %s",
-							PQerrorMessage(st->con));
+					elog(thread, ELEVEL_MAIN,
+						 "invalid socket: %s", PQerrorMessage(st->con));
 					goto done;
 				}
 
@@ -5766,7 +6716,8 @@ threadRun(void *arg)
 					continue;
 				}
 				/* must be something wrong */
-				fprintf(stderr, "select() failed: %s\n", strerror(errno));
+				elog(thread, ELEVEL_MAIN,
+					 "select() failed: %s\n", strerror(errno));
 				goto done;
 			}
 		}
@@ -5790,8 +6741,8 @@ threadRun(void *arg)
 
 				if (sock < 0)
 				{
-					fprintf(stderr, "invalid socket: %s",
-							PQerrorMessage(st->con));
+					elog(thread, ELEVEL_MAIN,
+						 "invalid socket: %s", PQerrorMessage(st->con));
 					goto done;
 				}
 
@@ -5825,7 +6776,11 @@ threadRun(void *arg)
 				/* generate and show report */
 				StatsData	cur;
 				int64		run = now - last_report,
-							ntx;
+							ntx,
+							retries,
+							retried,
+							errors,
+							errors_in_failed_tx;
 				double		tps,
 							total_run,
 							latency,
@@ -5852,6 +6807,11 @@ threadRun(void *arg)
 					mergeSimpleStats(&cur.lag, &thread[i].stats.lag);
 					cur.cnt += thread[i].stats.cnt;
 					cur.skipped += thread[i].stats.skipped;
+					cur.retries += thread[i].stats.retries;
+					cur.retried += thread[i].stats.retried;
+					cur.errors += thread[i].stats.errors;
+					cur.errors_in_failed_tx +=
+						thread[i].stats.errors_in_failed_tx;
 				}
 
 				/* we count only actually executed transactions */
@@ -5869,6 +6829,11 @@ threadRun(void *arg)
 				{
 					latency = sqlat = stdev = lag = 0;
 				}
+				retries = cur.retries - last.retries;
+				retried = cur.retried - last.retried;
+				errors = cur.errors - last.errors;
+				errors_in_failed_tx = cur.errors_in_failed_tx -
+					last.errors_in_failed_tx;
 
 				if (progress_timestamp)
 				{
@@ -5890,18 +6855,39 @@ threadRun(void *arg)
 					snprintf(tbuf, sizeof(tbuf), "%.1f s", total_run);
 				}
 
-				fprintf(stderr,
-						"progress: %s, %.1f tps, lat %.3f ms stddev %.3f",
-						tbuf, tps, latency, stdev);
-
-				if (throttle_delay)
+				if (errstart(NULL, ELEVEL_MAIN))
 				{
-					fprintf(stderr, ", lag %.3f ms", lag);
-					if (latency_limit)
-						fprintf(stderr, ", " INT64_FORMAT " skipped",
-								cur.skipped - last.skipped);
+					errmsg(NULL, "progress: %s, %.1f tps, lat %.3f ms stddev %.3f",
+						   tbuf, tps, latency, stdev);
+
+					if (errors > 0)
+					{
+						errmsg(NULL, ", " INT64_FORMAT " failed" , errors);
+						if (errors_in_failed_tx > 0)
+							errmsg(NULL, " (" INT64_FORMAT " in failed tx)",
+								   errors_in_failed_tx);
+					}
+
+					if (throttle_delay)
+					{
+						errmsg(NULL, ", lag %.3f ms", lag);
+						if (latency_limit)
+							errmsg(NULL, ", " INT64_FORMAT " skipped",
+								   cur.skipped - last.skipped);
+					}
+
+					/*
+					 * It can be non-zero only if max_tries is greater than one or
+					 * latency_limit is used.
+					 */
+					if (retried > 0)
+					{
+						errmsg(NULL, ", " INT64_FORMAT " retried, " INT64_FORMAT " retries",
+							   retried, retries);
+					}
+					errmsg(NULL, "\n");
+					errfinish(NULL);
 				}
-				fprintf(stderr, "\n");
 
 				last = cur;
 				last_report = now;
@@ -5986,7 +6972,7 @@ setalarm(int seconds)
 							   win32_timer_callback, NULL, seconds * 1000, 0,
 							   WT_EXECUTEINTIMERTHREAD | WT_EXECUTEONLYONCE))
 	{
-		fprintf(stderr, "failed to set timer\n");
+		elog(NULL, ELEVEL_MAIN, "failed to set timer\n");
 		exit(1);
 	}
 }
@@ -6058,3 +7044,169 @@ pthread_join(pthread_t th, void **thread_return)
 }
 
 #endif							/* WIN32 */
+
+/*
+ * Return the error state of the thread if the thread is not NULL; otherwise
+ * return the main error state.
+ */
+static ErrorState *
+getErrorState(TState *thread)
+{
+	return thread ? &(thread->error_state) : &main_error_state;
+}
+
+/*
+ * Add the formatted string to the end of the saved error/log message if the
+ * buffer size allows it.
+ *
+ * Only for use in the functions elog() / errmsg() / pgbench_error().
+ */
+static void
+errmsg_internal(TState *thread, const char *fmt, va_list *args)
+{
+	ErrorState  *error_state = getErrorState(thread);
+
+	error_state->message_length +=
+		vsnprintf(error_state->message + error_state->message_length,
+				  sizeof(error_state->message) - error_state->message_length,
+				  _(fmt), *args);
+
+	if (!error_state->in_process)
+	{
+		/* internal error which should never occur */
+		/* try to print an existing error message in stderr */
+		fprintf(stderr, "could not process an existing error message:\n%s",
+				error_state->message);
+		exit(1);
+	}
+}
+
+/*
+ * Report an error message or other log message if the debugging level resolves
+ * this error/logging level.
+ *
+ * Pass the thread as not NULL for client commands and as NULL otherwise.
+ */
+static void
+elog(TState *thread, ErrorLevel error_level, const char *fmt,...)
+{
+	va_list		ap;
+
+	if (errstart(thread, error_level))
+	{
+		va_start(ap, fmt);
+		errmsg_internal(thread, fmt, &ap);
+		va_end(ap);
+
+		errfinish(thread);
+	}
+}
+
+/*
+ * Returns true if the debugging level resolves this error/logging level and
+ * false otherwise.
+ *
+ * Pass the thread as not NULL for client commands and as NULL otherwise.
+ */
+static bool
+errstart(TState *thread, ErrorLevel error_level)
+{
+	ErrorState  *error_state = getErrorState(thread);
+	bool		start_error_reporting;
+
+	if (error_state->in_process)
+	{
+		/* internal error which should never occur */
+		fprintf(stderr, "cannot handle more than one error at a time\n");
+		exit(1);
+	}
+
+	/* Check if we have the appropriate debugging level */
+	switch (error_level)
+	{
+		case ELEVEL_DEBUG:
+			/*
+			 * Print the message only if there's a debugging mode for all types
+			 * of messages.
+			 */
+			start_error_reporting = debug_level >= DEBUG_ALL;
+			break;
+		case ELEVEL_CLIENT_FAIL:
+			/*
+			 * Print a failure message only if there's at least a debugging mode
+			 * for fails.
+			 */
+			start_error_reporting = debug_level >= DEBUG_FAILS;
+			break;
+		case ELEVEL_CLIENT_ABORTED:
+		case ELEVEL_MAIN:
+			/*
+			 * Always print an error message if the client is aborted or this is
+			 * the main program error/log message.
+			 */
+			start_error_reporting = true;
+			break;
+		default:
+			/* internal error which should never occur */
+			fprintf(stderr, "unexpected error level: %d\n", error_level);
+			exit(1);
+	}
+
+	if (start_error_reporting)
+	{
+		error_state->in_process = true;
+		error_state->message[0] = '\0';
+		error_state->message_length = 0;
+	}
+
+	return start_error_reporting;
+}
+
+/*
+ * Add the formatted string to the end of the stored error/log message if the
+ * buffer size allows it.
+ *
+ * Pass the thread as not NULL for client commands and as NULL otherwise.
+ */
+static void errmsg(TState *thread, const char *fmt,...)
+{
+	va_list		ap;
+
+	va_start(ap, fmt);
+	errmsg_internal(thread, fmt, &ap);
+	va_end(ap);
+}
+
+/*
+ * Print an error/log message to stderr (it is assumed that it is not
+ * empty).
+ *
+ * Pass the thread as not NULL for client commands and as NULL otherwise.
+ */
+static void
+errfinish(TState *thread)
+{
+	ErrorState  *error_state = getErrorState(thread);
+
+	if (!error_state->in_process)
+	{
+		/* internal error which should never occur */
+		/* try to print an existing error message in stderr */
+		fprintf(stderr, "could not complete an existing error message:\n%s",
+				error_state->message);
+		exit(1);
+	}
+
+	if (error_state->message_length)
+	{
+		fprintf(stderr, "%s", error_state->message);
+	}
+	else
+	{
+		/* internal error which should never occur */
+		fprintf(stderr, "empty error message cannot be reported\n");
+		exit(1);
+	}
+
+	error_state->in_process = false;
+}
diff --git a/src/bin/pgbench/t/001_pgbench_with_server.pl b/src/bin/pgbench/t/001_pgbench_with_server.pl
index be08b20..370fce6 100644
--- a/src/bin/pgbench/t/001_pgbench_with_server.pl
+++ b/src/bin/pgbench/t/001_pgbench_with_server.pl
@@ -118,7 +118,8 @@ pgbench(
 	[   qr{builtin: TPC-B},
 		qr{clients: 2\b},
 		qr{processed: 10/10},
-		qr{mode: simple} ],
+		qr{mode: simple},
+		qr{maximum number of tries: 1} ],
 	[qr{^$}],
 	'pgbench tpcb-like');
 
@@ -134,7 +135,7 @@ pgbench(
 	'pgbench simple update');
 
 pgbench(
-	'-t 100 -c 7 -M prepared -b se --debug',
+	'-t 100 -c 7 -M prepared -b se --debug all',
 	0,
 	[   qr{builtin: select only},
 		qr{clients: 7\b},
@@ -491,6 +492,10 @@ my @errors = (
 \set i 0
 SELECT LEAST(:i, :i, :i, :i, :i, :i, :i, :i, :i, :i, :i);
 } ],
+	[   'sql division by zero', 0, [qr{ERROR:  division by zero}],
+		q{-- SQL division by zero
+	SELECT 1 / 0;
+} ],
 
 	# SHELL
 	[   'shell bad command',               0,
@@ -621,6 +626,16 @@ SELECT LEAST(:i, :i, :i, :i, :i, :i, :i, :i, :i, :i, :i);
 	[   'sleep unknown unit',         1,
 		[qr{unrecognized time unit}], q{\sleep 1 week} ],
 
+	# CONDITIONAL BLOCKS
+	[   'if elif failed conditions', 0,
+		[qr{division by zero}],
+		q{-- failed conditions
+\if 1 / 0
+\elif 1 / 0
+\else
+\endif
+} ],
+
 	# MISC
 	[   'misc invalid backslash command',         1,
 		[qr{invalid command .* "nosuchcommand"}], q{\nosuchcommand} ],
@@ -635,14 +650,32 @@ for my $e (@errors)
 	my $n = '001_pgbench_error_' . $name;
 	$n =~ s/ /_/g;
 	pgbench(
-		'-n -t 1 -Dfoo=bla -Dnull=null -Dtrue=true -Done=1 -Dzero=0.0 -Dbadtrue=trueXXX -M prepared',
+		'-n -t 1 -Dfoo=bla -Dnull=null -Dtrue=true -Done=1 -Dzero=0.0 -Dbadtrue=trueXXX -M prepared -d fails',
 		$status,
-		[ $status ? qr{^$} : qr{processed: 0/1} ],
+		($status ?
+		 [ qr{^$} ] :
+		 [ qr{processed: 0/1}, qr{number of errors: 1 \(100.000%\)},
+		   qr{^((?!number of retried)(.|\n))*$} ]),
 		$re,
 		'pgbench script error: ' . $name,
 		{ $n => $script });
 }
 
+# reset client variables in case of failure
+pgbench(
+	'-n -t 2 -d fails', 0,
+	[ qr{processed: 0/2}, qr{number of errors: 2 \(100.000%\)},
+	  qr{^((?!number of retried)(.|\n))*$} ],
+	[ qr{(client 0 got a failure in command 1 \(SQL\) of script 0; ERROR:  syntax error at or near ":"(.|\n)*){2}} ],
+	'pgbench reset client variables in case of failure',
+	{	'001_pgbench_reset_client_variables' => q{
+BEGIN;
+-- select an unassigned variable
+SELECT :unassigned_var;
+\set unassigned_var 1
+END;
+} });
+
 # zipfian cache array overflow
 pgbench(
 	'-t 1', 0,
diff --git a/src/bin/pgbench/t/002_pgbench_no_server.pl b/src/bin/pgbench/t/002_pgbench_no_server.pl
index af21f04..ed8def9 100644
--- a/src/bin/pgbench/t/002_pgbench_no_server.pl
+++ b/src/bin/pgbench/t/002_pgbench_no_server.pl
@@ -57,7 +57,7 @@ my @options = (
 
 	# name, options, stderr checks
 	[   'bad option',
-		'-h home -p 5432 -U calvin -d --bad-option',
+		'-h home -p 5432 -U calvin -d all --bad-option',
 		[ qr{(unrecognized|illegal) option}, qr{--help.*more information} ] ],
 	[   'no file',
 		'-f no-such-file',
@@ -113,6 +113,8 @@ my @options = (
 	[ 'bad random seed', '--random-seed=one',
 		[qr{unrecognized random seed option "one": expecting an unsigned integer, "time" or "rand"},
 		 qr{error while setting random seed from --random-seed option} ] ],
+	[ 'bad maximum number of tries', '--max-tries -10',
+		[qr{invalid number of maximum tries: "-10"} ] ],
 
 	# loging sub-options
 	[   'sampling => log', '--sampling-rate=0.01',
diff --git a/src/bin/pgbench/t/003_serialization_and_deadlock_fails.pl b/src/bin/pgbench/t/003_serialization_and_deadlock_fails.pl
new file mode 100644
index 0000000..5e45cb1
--- /dev/null
+++ b/src/bin/pgbench/t/003_serialization_and_deadlock_fails.pl
@@ -0,0 +1,761 @@
+use strict;
+use warnings;
+
+use Config;
+use PostgresNode;
+use TestLib;
+use Test::More tests => 34;
+
+use constant
+{
+	READ_COMMITTED   => 0,
+	REPEATABLE_READ  => 1,
+	SERIALIZABLE     => 2,
+};
+
+my @isolation_level_shell = (
+	'read\\ committed',
+	'repeatable\\ read',
+	'serializable');
+
+# The keys of advisory locks for testing deadlock failures:
+use constant
+{
+	DEADLOCK_1         => 3,
+	WAIT_PGBENCH_2     => 4,
+	DEADLOCK_2         => 5,
+	TRANSACTION_ENDS_1 => 6,
+	TRANSACTION_ENDS_2 => 7,
+};
+
+# Test concurrent update in table row.
+my $node = get_new_node('main');
+$node->init;
+$node->start;
+$node->safe_psql('postgres',
+    'CREATE UNLOGGED TABLE xy (x integer, y integer); '
+  . 'INSERT INTO xy VALUES (1, 2), (2, 3);');
+
+my $script_serialization = $node->basedir . '/pgbench_script_serialization';
+append_to_file($script_serialization,
+		"\\set delta random(-5000, 5000)\n"
+	  . "BEGIN;\n"
+	  . "SELECT pg_sleep(1);\n"
+	  . "UPDATE xy SET y = y + :delta "
+	  . "WHERE x = 1 AND pg_advisory_lock(0) IS NOT NULL;\n"
+	  . "SELECT pg_advisory_unlock_all();\n"
+	  . "END;\n");
+
+my $script_deadlocks1 = $node->basedir . '/pgbench_script_deadlocks1';
+append_to_file($script_deadlocks1,
+		"BEGIN;\n"
+	  . "SELECT pg_advisory_lock(" . DEADLOCK_1 . ");\n"
+	  . "SELECT pg_advisory_lock(" . WAIT_PGBENCH_2 . ");\n"
+	  . "SELECT pg_advisory_lock(" . DEADLOCK_2 . ");\n"
+	  . "END;\n"
+	  . "SELECT pg_advisory_unlock_all();\n"
+	  . "SELECT pg_advisory_lock(" . TRANSACTION_ENDS_1 . ");\n"
+	  . "SELECT pg_advisory_unlock_all();");
+
+my $script_deadlocks2 = $node->basedir . '/pgbench_script_deadlocks2';
+append_to_file($script_deadlocks2,
+		"BEGIN;\n"
+	  . "SELECT pg_advisory_lock(" . DEADLOCK_2 . ");\n"
+	  . "SELECT pg_advisory_lock(" . DEADLOCK_1 . ");\n"
+	  . "END;\n"
+	  . "SELECT pg_advisory_unlock_all();\n"
+	  . "SELECT pg_advisory_lock(" . TRANSACTION_ENDS_2 . ");\n"
+	  . "SELECT pg_advisory_unlock_all();");
+
+sub test_pgbench_serialization_errors
+{
+	my ($max_tries, $latency_limit, $test_name) = @_;
+
+	my $isolation_level = REPEATABLE_READ;
+	my $isolation_level_shell = $isolation_level_shell[$isolation_level];
+
+	local $ENV{PGPORT} = $node->port;
+	local $ENV{PGOPTIONS} =
+		"-c default_transaction_isolation=" . $isolation_level_shell;
+	print "# PGOPTIONS: " . $ENV{PGOPTIONS} . "\n";
+
+	my ($h_psql, $in_psql, $out_psql);
+	my ($h_pgbench, $in_pgbench, $out_pgbench, $err_pgbench);
+
+	# Open a psql session, run a parallel transaction and aquire an advisory
+	# lock:
+	print "# Starting psql\n";
+	$h_psql = IPC::Run::start [ 'psql' ], \$in_psql, \$out_psql;
+
+	$in_psql = "begin;\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /BEGIN/;
+
+	$in_psql =
+		"update xy set y = y + 1 "
+	  . "where x = 1 and pg_advisory_lock(0) is not null;\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /UPDATE 1/;
+
+	my $retry_options =
+		($max_tries ? "--max-tries $max_tries" : "")
+	  . ($latency_limit ? "--latency-limit $latency_limit" : "");
+
+	# Start pgbench:
+	my @command = (
+		qw(pgbench --no-vacuum --transactions 1 --debug fails --file),
+		$script_serialization,
+		split /\s+/, $retry_options);
+	print "# Running: " . join(" ", @command) . "\n";
+	$h_pgbench = IPC::Run::start \@command, \$in_pgbench, \$out_pgbench,
+	  \$err_pgbench;
+
+	# Wait until pgbench also tries to acquire the same advisory lock:
+	do
+	{
+		$in_psql =
+			"select * from pg_locks where "
+		  . "locktype = 'advisory' and "
+		  . "objsubid = 1 and "
+		  . "((classid::bigint << 32) | objid::bigint = 0::bigint) and "
+		  . "not granted;\n";
+		print "# Running in psql: " . join(" ", $in_psql);
+		$h_psql->pump() while length $in_psql;
+	} while ($out_psql !~ /1 row/);
+
+	# In psql, commit the transaction, release advisory locks and end the
+	# session:
+	$in_psql = "end;\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /COMMIT/;
+
+	$in_psql = "select pg_advisory_unlock_all();\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /pg_advisory_unlock_all/;
+
+	$in_psql = "\\q\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() while length $in_psql;
+
+	$h_psql->finish();
+
+	# Get pgbench results
+	$h_pgbench->pump() until length $out_pgbench;
+	$h_pgbench->finish();
+
+	# On Windows, the exit status of the process is returned directly as the
+	# process's exit code, while on Unix, it's returned in the high bits
+	# of the exit code (see WEXITSTATUS macro in the standard <sys/wait.h>
+	# header file). IPC::Run's result function always returns exit code >> 8,
+	# assuming the Unix convention, which will always return 0 on Windows as
+	# long as the process was not terminated by an exception. To work around
+	# that, use $h->full_result on Windows instead.
+	my $result =
+	    ($Config{osname} eq "MSWin32")
+	  ? ($h_pgbench->full_results)[0]
+	  : $h_pgbench->result(0);
+
+	# Check pgbench results
+	ok(!$result, "@command exit code 0");
+
+	like($out_pgbench,
+		qr{processed: 0/1},
+		"$test_name: check processed transactions");
+
+	like($out_pgbench,
+		qr{number of errors: 1 \(100\.000%\)},
+		"$test_name: check errors");
+
+	like($out_pgbench,
+		qr{^((?!number of retried)(.|\n))*$},
+		"$test_name: check retried");
+
+	if ($max_tries)
+	{
+		like($out_pgbench,
+			qr{maximum number of tries: $max_tries},
+			"$test_name: check the maximum number of tries");
+	}
+	else
+	{
+		like($out_pgbench,
+			qr{^((?!maximum number of tries)(.|\n))*$},
+			"$test_name: check the maximum number of tries");
+	}
+
+	if ($latency_limit)
+	{
+		like($out_pgbench,
+			qr{number of transactions above the $latency_limit\.0 ms latency limit: 1/1 \(100.000 \%\) \(including errors\)},
+			"$test_name: check transactions above latency limit");
+	}
+	else
+	{
+		like($out_pgbench,
+			qr{^((?!latency limit)(.|\n))*$},
+			"$test_name: check transactions above latency limit");
+	}
+
+	my $pattern =
+		"client 0 got a failure in command 3 \\(SQL\\) of script 0; "
+	  . "ERROR:  could not serialize access due to concurrent update";
+
+	like($err_pgbench,
+		qr{$pattern},
+		"$test_name: check serialization failure");
+}
+
+sub test_pgbench_serialization_failures
+{
+	my $isolation_level = REPEATABLE_READ;
+	my $isolation_level_shell = $isolation_level_shell[$isolation_level];
+
+	local $ENV{PGPORT} = $node->port;
+	local $ENV{PGOPTIONS} =
+		"-c default_transaction_isolation=" . $isolation_level_shell;
+	print "# PGOPTIONS: " . $ENV{PGOPTIONS} . "\n";
+
+	my ($h_psql, $in_psql, $out_psql);
+	my ($h_pgbench, $in_pgbench, $out_pgbench, $err_pgbench);
+
+	# Open a psql session, run a parallel transaction and aquire an advisory
+	# lock:
+	print "# Starting psql\n";
+	$h_psql = IPC::Run::start [ 'psql' ], \$in_psql, \$out_psql;
+
+	$in_psql = "begin;\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /BEGIN/;
+
+	$in_psql =
+		"update xy set y = y + 1 "
+	  . "where x = 1 and pg_advisory_lock(0) is not null;\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /UPDATE 1/;
+
+	# Start pgbench:
+	my @command = (
+		qw(pgbench --no-vacuum --transactions 1 --debug all --max-tries 2),
+		"--file",
+		$script_serialization);
+	print "# Running: " . join(" ", @command) . "\n";
+	$h_pgbench = IPC::Run::start \@command, \$in_pgbench, \$out_pgbench,
+	  \$err_pgbench;
+
+	# Wait until pgbench also tries to acquire the same advisory lock:
+	do
+	{
+		$in_psql =
+			"select * from pg_locks where "
+		  . "locktype = 'advisory' and "
+		  . "objsubid = 1 and "
+		  . "((classid::bigint << 32) | objid::bigint = 0::bigint) and "
+		  . "not granted;\n";
+		print "# Running in psql: " . join(" ", $in_psql);
+		$h_psql->pump() while length $in_psql;
+	} while ($out_psql !~ /1 row/);
+
+	# In psql, commit the transaction, release advisory locks and end the
+	# session:
+	$in_psql = "end;\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /COMMIT/;
+
+	$in_psql = "select pg_advisory_unlock_all();\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /pg_advisory_unlock_all/;
+
+	$in_psql = "\\q\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() while length $in_psql;
+
+	$h_psql->finish();
+
+	# Get pgbench results
+	$h_pgbench->pump() until length $out_pgbench;
+	$h_pgbench->finish();
+
+	# On Windows, the exit status of the process is returned directly as the
+	# process's exit code, while on Unix, it's returned in the high bits
+	# of the exit code (see WEXITSTATUS macro in the standard <sys/wait.h>
+	# header file). IPC::Run's result function always returns exit code >> 8,
+	# assuming the Unix convention, which will always return 0 on Windows as
+	# long as the process was not terminated by an exception. To work around
+	# that, use $h->full_result on Windows instead.
+	my $result =
+	    ($Config{osname} eq "MSWin32")
+	  ? ($h_pgbench->full_results)[0]
+	  : $h_pgbench->result(0);
+
+	# Check pgbench results
+	ok(!$result, "@command exit code 0");
+
+	like($out_pgbench,
+		qr{processed: 1/1},
+		"concurrent update with retrying: check processed transactions");
+
+	like($out_pgbench,
+		qr{^((?!number of errors)(.|\n))*$},
+		"concurrent update with retrying: check errors");
+
+	like($out_pgbench,
+		qr{number of retried: 1 \(100\.000%\)},
+		"concurrent update with retrying: check retried");
+
+	like($out_pgbench,
+		qr{number of retries: 1},
+		"concurrent update with retrying: check retries");
+
+	like($out_pgbench,
+		qr{latency average = \d+\.\d{3} ms\n},
+		"concurrent update with retrying: check latency average");
+
+	my $pattern =
+		"client 0 sending UPDATE xy SET y = y \\+ (-?\\d+) "
+	  . "WHERE x = 1 AND pg_advisory_lock\\(0\\) IS NOT NULL;\n"
+	  . "(client 0 receiving\n)+"
+	  . "client 0 got a failure in command 3 \\(SQL\\) of script 0; "
+	  . "ERROR:  could not serialize access due to concurrent update\n\n"
+	  . "client 0 sending SELECT pg_advisory_unlock_all\\(\\);\n"
+	  . "\\g2+"
+	  . "client 0 continues a failed transaction in command 4 \\(SQL\\) of script 0; "
+	  . "ERROR:  current transaction is aborted, commands ignored until end of transaction block\n\n"
+	  . "client 0 sending END;\n"
+	  . "\\g2+"
+	  . "client 0 repeats the failed transaction \\(try 2/2\\)\n"
+	  . "client 0 executing \\\\set delta\n"
+	  . "client 0 sending BEGIN;\n"
+	  . "\\g2+"
+	  . "client 0 sending SELECT pg_sleep\\(1\\);\n"
+	  . "\\g2+"
+	  . "client 0 sending UPDATE xy SET y = y \\+ \\g1 "
+	  . "WHERE x = 1 AND pg_advisory_lock\\(0\\) IS NOT NULL;";
+
+	like($err_pgbench,
+		qr{$pattern},
+		"concurrent update with retrying: check the retried transaction");
+}
+
+sub test_pgbench_deadlock_errors
+{
+	my $isolation_level = READ_COMMITTED;
+	my $isolation_level_shell = $isolation_level_shell[$isolation_level];
+
+	local $ENV{PGPORT} = $node->port;
+	local $ENV{PGOPTIONS} =
+		"-c default_transaction_isolation=" . $isolation_level_shell;
+	print "# PGOPTIONS: " . $ENV{PGOPTIONS} . "\n";
+
+	my ($h_psql, $in_psql, $out_psql);
+	my ($h1, $in1, $out1, $err1);
+	my ($h2, $in2, $out2, $err2);
+
+	# Open a psql session and aquire an advisory lock:
+	print "# Starting psql\n";
+	$h_psql = IPC::Run::start [ 'psql' ], \$in_psql, \$out_psql;
+
+	$in_psql =
+		"select pg_advisory_lock(" . WAIT_PGBENCH_2 . ") "
+	  . "as pg_advisory_lock_" . WAIT_PGBENCH_2 . ";\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /pg_advisory_lock_@{[ WAIT_PGBENCH_2 ]}/;
+
+	# Run the first pgbench:
+	my @command1 = (
+		qw(pgbench --no-vacuum --transactions 1 --debug fails --file),
+		$script_deadlocks1);
+	print "# Running: " . join(" ", @command1) . "\n";
+	$h1 = IPC::Run::start \@command1, \$in1, \$out1, \$err1;
+
+	# Wait until the first pgbench also tries to acquire the same advisory lock:
+	do
+	{
+		$in_psql =
+			"select case count(*) "
+		  . "when 0 then '" . WAIT_PGBENCH_2 . "_zero' "
+		  . "else '" . WAIT_PGBENCH_2 . "_not_zero' end "
+		  . "from pg_locks where "
+		  . "locktype = 'advisory' and "
+		  . "objsubid = 1 and "
+		  . "((classid::bigint << 32) | objid::bigint = "
+		  . WAIT_PGBENCH_2
+		  . "::bigint) and "
+		  . "not granted;\n";
+		print "# Running in psql: " . join(" ", $in_psql);
+		$h_psql->pump() while length $in_psql;
+	} while ($out_psql !~ /@{[ WAIT_PGBENCH_2 ]}_not_zero/);
+
+	# Run the second pgbench:
+	my @command2 = (
+		qw(pgbench --no-vacuum --transactions 1 --debug fails --file),
+		$script_deadlocks2);
+	print "# Running: " . join(" ", @command2) . "\n";
+	$h2 = IPC::Run::start \@command2, \$in2, \$out2, \$err2;
+
+	# Wait until the second pgbench tries to acquire the lock held by the first
+	# pgbench:
+	do
+	{
+		$in_psql =
+			"select case count(*) "
+		  . "when 0 then '" . DEADLOCK_1 . "_zero' "
+		  . "else '" . DEADLOCK_1 . "_not_zero' end "
+		  . "from pg_locks where "
+		  . "locktype = 'advisory' and "
+		  . "objsubid = 1 and "
+		  . "((classid::bigint << 32) | objid::bigint = "
+		  . DEADLOCK_1
+		  . "::bigint) and "
+		  . "not granted;\n";
+		print "# Running in psql: " . join(" ", $in_psql);
+		$h_psql->pump() while length $in_psql;
+	} while ($out_psql !~ /@{[ DEADLOCK_1 ]}_not_zero/);
+
+	# In the psql session, release the lock that the first pgbench is waiting
+	# for and end the session:
+	$in_psql =
+		"select pg_advisory_unlock(" . WAIT_PGBENCH_2 . ") "
+	  . "as pg_advisory_unlock_" . WAIT_PGBENCH_2 . ";\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /pg_advisory_unlock_@{[ WAIT_PGBENCH_2 ]}/;
+
+	$in_psql = "\\q\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() while length $in_psql;
+
+	$h_psql->finish();
+
+	# Get results from all pgbenches:
+	$h1->pump() until length $out1;
+	$h1->finish();
+
+	$h2->pump() until length $out2;
+	$h2->finish();
+
+	# On Windows, the exit status of the process is returned directly as the
+	# process's exit code, while on Unix, it's returned in the high bits
+	# of the exit code (see WEXITSTATUS macro in the standard <sys/wait.h>
+	# header file). IPC::Run's result function always returns exit code >> 8,
+	# assuming the Unix convention, which will always return 0 on Windows as
+	# long as the process was not terminated by an exception. To work around
+	# that, use $h->full_result on Windows instead.
+	my $result1 =
+	    ($Config{osname} eq "MSWin32")
+	  ? ($h1->full_results)[0]
+	  : $h1->result(0);
+
+	my $result2 =
+	    ($Config{osname} eq "MSWin32")
+	  ? ($h2->full_results)[0]
+	  : $h2->result(0);
+
+	# Check all pgbench results
+	ok(!$result1, "@command1 exit code 0");
+	ok(!$result2, "@command2 exit code 0");
+
+	# The first or second pgbench should get a deadlock error
+	ok((($out1 =~ /processed: 0\/1/ and $out2 =~ /processed: 1\/1/) or
+		($out2 =~ /processed: 0\/1/ and $out1 =~ /processed: 1\/1/)),
+		"concurrent deadlock update: check processed transactions");
+
+	ok((($out1 =~ /number of errors: 1 \(100\.000%\)/ and
+		 $out2 =~ /^((?!number of errors)(.|\n))*$/) or
+		($out2 =~ /number of errors: 1 \(100\.000%\)/ and
+		 $out1 =~ /^((?!number of errors)(.|\n))*$/)),
+		"concurrent deadlock update: check errors");
+
+	ok(($err1 =~ /client 0 got a failure in command 3 \(SQL\) of script 0; ERROR:  deadlock detected/ or
+		$err2 =~ /client 0 got a failure in command 2 \(SQL\) of script 0; ERROR:  deadlock detected/),
+		"concurrent deadlock update: check deadlock failure");
+
+	# Both pgbenches do not have retried transactions
+	like($out1 . $out2,
+		qr{^((?!number of retried)(.|\n))*$},
+		"concurrent deadlock update: check retried");
+}
+
+sub test_pgbench_deadlock_failures
+{
+	my $isolation_level = READ_COMMITTED;
+	my $isolation_level_shell = $isolation_level_shell[$isolation_level];
+
+	local $ENV{PGPORT} = $node->port;
+	local $ENV{PGOPTIONS} =
+		"-c default_transaction_isolation=" . $isolation_level_shell;
+	print "# PGOPTIONS: " . $ENV{PGOPTIONS} . "\n";
+
+	my ($h_psql, $in_psql, $out_psql);
+	my ($h1, $in1, $out1, $err1);
+	my ($h2, $in2, $out2, $err2);
+
+	# Open a psql session and aquire an advisory lock:
+	print "# Starting psql\n";
+	$h_psql = IPC::Run::start [ 'psql' ], \$in_psql, \$out_psql;
+
+	$in_psql =
+		"select pg_advisory_lock(" . WAIT_PGBENCH_2 . ") "
+	  . "as pg_advisory_lock_" . WAIT_PGBENCH_2 . ";\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /pg_advisory_lock_@{[ WAIT_PGBENCH_2 ]}/;
+
+	# Run the first pgbench:
+	my @command1 = (
+		qw(pgbench --no-vacuum --transactions 1 --debug all --max-tries 2),
+		"--file",
+		$script_deadlocks1);
+	print "# Running: " . join(" ", @command1) . "\n";
+	$h1 = IPC::Run::start \@command1, \$in1, \$out1, \$err1;
+
+	# Wait until the first pgbench also tries to acquire the same advisory lock:
+	do
+	{
+		$in_psql =
+			"select case count(*) "
+		  . "when 0 then '" . WAIT_PGBENCH_2 . "_zero' "
+		  . "else '" . WAIT_PGBENCH_2 . "_not_zero' end "
+		  . "from pg_locks where "
+		  . "locktype = 'advisory' and "
+		  . "objsubid = 1 and "
+		  . "((classid::bigint << 32) | objid::bigint = "
+		  . WAIT_PGBENCH_2
+		  . "::bigint) and "
+		  . "not granted;\n";
+		print "# Running in psql: " . join(" ", $in_psql);
+		$h_psql->pump() while length $in_psql;
+	} while ($out_psql !~ /@{[ WAIT_PGBENCH_2 ]}_not_zero/);
+
+	# Run the second pgbench:
+	my @command2 = (
+		qw(pgbench --no-vacuum --transactions 1 --debug all --max-tries 2),
+		"--file",
+		$script_deadlocks2);
+	print "# Running: " . join(" ", @command2) . "\n";
+	$h2 = IPC::Run::start \@command2, \$in2, \$out2, \$err2;
+
+	# Wait until the second pgbench tries to acquire the lock held by the first
+	# pgbench:
+	do
+	{
+		$in_psql =
+			"select case count(*) "
+		  . "when 0 then '" . DEADLOCK_1 . "_zero' "
+		  . "else '" . DEADLOCK_1 . "_not_zero' end "
+		  . "from pg_locks where "
+		  . "locktype = 'advisory' and "
+		  . "objsubid = 1 and "
+		  . "((classid::bigint << 32) | objid::bigint = "
+		  . DEADLOCK_1
+		  . "::bigint) and "
+		  . "not granted;\n";
+		print "# Running in psql: " . join(" ", $in_psql);
+		$h_psql->pump() while length $in_psql;
+	} while ($out_psql !~ /@{[ DEADLOCK_1 ]}_not_zero/);
+
+	# In the psql session, acquire the locks that pgbenches will wait for:
+	$in_psql =
+		"select pg_advisory_lock(" . TRANSACTION_ENDS_1 . ") "
+	  . "as pg_advisory_lock_" . TRANSACTION_ENDS_1 . ";\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /pg_advisory_lock_@{[ TRANSACTION_ENDS_1 ]}/;
+
+	$in_psql =
+		"select pg_advisory_lock(" . TRANSACTION_ENDS_2 . ") "
+	  . "as pg_advisory_lock_" . TRANSACTION_ENDS_2 . ";\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /pg_advisory_lock_@{[ TRANSACTION_ENDS_2 ]}/;
+
+	# In the psql session, release the lock that the first pgbench is waiting
+	# for:
+	$in_psql =
+		"select pg_advisory_unlock(" . WAIT_PGBENCH_2 . ") "
+	  . "as pg_advisory_unlock_" . WAIT_PGBENCH_2 . ";\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /pg_advisory_unlock_@{[ WAIT_PGBENCH_2 ]}/;
+
+	# Wait until pgbenches try to acquire the locks held by the psql session:
+	do
+	{
+		$in_psql =
+			"select case count(*) "
+		  . "when 0 then '" . TRANSACTION_ENDS_1 . "_zero' "
+		  . "else '" . TRANSACTION_ENDS_1 . "_not_zero' end "
+		  . "from pg_locks where "
+		  . "locktype = 'advisory' and "
+		  . "objsubid = 1 and "
+		  . "((classid::bigint << 32) | objid::bigint = "
+		  . TRANSACTION_ENDS_1
+		  . "::bigint) and "
+		  . "not granted;\n";
+		print "# Running in psql: " . join(" ", $in_psql);
+		$h_psql->pump() while length $in_psql;
+	} while ($out_psql !~ /@{[ TRANSACTION_ENDS_1 ]}_not_zero/);
+
+	do
+	{
+		$in_psql =
+			"select case count(*) "
+		  . "when 0 then '" . TRANSACTION_ENDS_2 . "_zero' "
+		  . "else '" . TRANSACTION_ENDS_2 . "_not_zero' end "
+		  . "from pg_locks where "
+		  . "locktype = 'advisory' and "
+		  . "objsubid = 1 and "
+		  . "((classid::bigint << 32) | objid::bigint = "
+		  . TRANSACTION_ENDS_2
+		  . "::bigint) and "
+		  . "not granted;\n";
+		print "# Running in psql: " . join(" ", $in_psql);
+		$h_psql->pump() while length $in_psql;
+	} while ($out_psql !~ /@{[ TRANSACTION_ENDS_2 ]}_not_zero/);
+
+	# In the psql session, release advisory locks and end the session:
+	$in_psql = "select pg_advisory_unlock_all() as pg_advisory_unlock_all;\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() until $out_psql =~ /pg_advisory_unlock_all/;
+
+	$in_psql = "\\q\n";
+	print "# Running in psql: " . join(" ", $in_psql);
+	$h_psql->pump() while length $in_psql;
+
+	$h_psql->finish();
+
+	# Get results from all pgbenches:
+	$h1->pump() until length $out1;
+	$h1->finish();
+
+	$h2->pump() until length $out2;
+	$h2->finish();
+
+	# On Windows, the exit status of the process is returned directly as the
+	# process's exit code, while on Unix, it's returned in the high bits
+	# of the exit code (see WEXITSTATUS macro in the standard <sys/wait.h>
+	# header file). IPC::Run's result function always returns exit code >> 8,
+	# assuming the Unix convention, which will always return 0 on Windows as
+	# long as the process was not terminated by an exception. To work around
+	# that, use $h->full_result on Windows instead.
+	my $result1 =
+	    ($Config{osname} eq "MSWin32")
+	  ? ($h1->full_results)[0]
+	  : $h1->result(0);
+
+	my $result2 =
+	    ($Config{osname} eq "MSWin32")
+	  ? ($h2->full_results)[0]
+	  : $h2->result(0);
+
+	# Check all pgbench results
+	ok(!$result1, "@command1 exit code 0");
+	ok(!$result2, "@command2 exit code 0");
+
+	like($out1,
+		qr{processed: 1/1},
+		"concurrent deadlock update with retrying: pgbench 1: "
+	  . "check processed transactions");
+	like($out2,
+		qr{processed: 1/1},
+		"concurrent deadlock update with retrying: pgbench 2: "
+	  . "check processed transactions");
+
+	# The first or second pgbench should get a deadlock error which was retried:
+	like($out1 . $out2,
+		qr{^((?!number of errors)(.|\n))*$},
+		"concurrent deadlock update with retrying: check errors");
+
+	ok((($out1 =~ /number of retried: 1 \(100\.000%\)/ and
+		 $out2 =~ /^((?!number of retried)(.|\n))*$/) or
+		($out2 =~ /number of retried: 1 \(100\.000%\)/ and
+		 $out1 =~ /^((?!number of retried)(.|\n))*$/)),
+		"concurrent deadlock update with retrying: check retries");
+
+	my $pattern1 =
+		"client 0 sending BEGIN;\n"
+	  . "(client 0 receiving\n)+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . DEADLOCK_1 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . WAIT_PGBENCH_2 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . DEADLOCK_2 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 got a failure in command 3 \\(SQL\\) of script 0; "
+	  . "ERROR:  deadlock detected\n"
+	  . "((?!client 0)(.|\n))*"
+	  . "client 0 sending END;\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_unlock_all\\(\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . TRANSACTION_ENDS_1 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_unlock_all\\(\\);\n"
+	  . "\\g1+"
+	  . "client 0 repeats the failed transaction \\(try 2/2\\)\n"
+	  . "client 0 sending BEGIN;\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . DEADLOCK_1 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . WAIT_PGBENCH_2 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . DEADLOCK_2 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending END;\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_unlock_all\\(\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . TRANSACTION_ENDS_1 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_unlock_all\\(\\);\n"
+	  . "\\g1+";
+
+	my $pattern2 =
+		"client 0 sending BEGIN;\n"
+	  . "(client 0 receiving\n)+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . DEADLOCK_2 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . DEADLOCK_1 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 got a failure in command 2 \\(SQL\\) of script 0; "
+	  . "ERROR:  deadlock detected\n"
+	  . "((?!client 0)(.|\n))*"
+	  . "client 0 sending END;\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_unlock_all\\(\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . TRANSACTION_ENDS_2 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_unlock_all\\(\\);\n"
+	  . "\\g1+"
+	  . "client 0 repeats the failed transaction \\(try 2/2\\)\n"
+	  . "client 0 sending BEGIN;\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . DEADLOCK_2 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . DEADLOCK_1 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending END;\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_unlock_all\\(\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_lock\\(" . TRANSACTION_ENDS_2 . "\\);\n"
+	  . "\\g1+"
+	  . "client 0 sending SELECT pg_advisory_unlock_all\\(\\);\n"
+	  . "\\g1+";
+
+	ok(($err1 =~ /$pattern1/ or $err2 =~ /$pattern2/),
+		"concurrent deadlock update with retrying: "
+	  . "check the retried transaction");
+}
+
+test_pgbench_serialization_errors(
+								1,      # --max-tries
+								0,      # --latency-limit (will not be used)
+								"concurrent update");
+test_pgbench_serialization_errors(
+								0,	    # --max-tries (will not be used)
+								900,    # --latency-limit
+								"concurrent update with maximum time of tries");
+
+test_pgbench_serialization_failures();
+
+test_pgbench_deadlock_errors();
+test_pgbench_deadlock_failures();
+
+#done
+$node->stop;
-- 
2.7.4

