From f4c20c13b09f35427f115ba32599134eeeefb316 Mon Sep 17 00:00:00 2001 From: Ole Tange Date: Fri, 1 Jan 2016 15:12:43 +0100 Subject: [PATCH] Released as 20160101 ('20160101alpha') --- README | 12 +- configure | 20 +- configure.ac | 2 +- doc/release_new_version | 30 +- src/Makefile.in | 2 +- src/niceload | 2 +- src/parallel | 583 +++++++++++- src/parallel.pod | 110 ++- src/parallel_design.pod | 277 +++--- src/parallel_tutorial.html | 769 ++++++++++------ src/parallel_tutorial.pod | 889 +++++++++++++------ src/sql | 2 +- testsuite/tests-to-run/parallel-local-sql.sh | 75 ++ 13 files changed, 2015 insertions(+), 758 deletions(-) create mode 100644 testsuite/tests-to-run/parallel-local-sql.sh diff --git a/README b/README index 250beba5..affecffd 100644 --- a/README +++ b/README @@ -40,9 +40,9 @@ document. Full installation of GNU Parallel is as simple as: - wget http://ftpmirror.gnu.org/parallel/parallel-20151222.tar.bz2 - bzip2 -dc parallel-20151222.tar.bz2 | tar xvf - - cd parallel-20151222 + wget http://ftpmirror.gnu.org/parallel/parallel-20160101.tar.bz2 + bzip2 -dc parallel-20160101.tar.bz2 | tar xvf - + cd parallel-20160101 ./configure && make && sudo make install @@ -51,9 +51,9 @@ Full installation of GNU Parallel is as simple as: If you are not root you can add ~/bin to your path and install in ~/bin and ~/share: - wget http://ftpmirror.gnu.org/parallel/parallel-20151222.tar.bz2 - bzip2 -dc parallel-20151222.tar.bz2 | tar xvf - - cd parallel-20151222 + wget http://ftpmirror.gnu.org/parallel/parallel-20160101.tar.bz2 + bzip2 -dc parallel-20160101.tar.bz2 | tar xvf - + cd parallel-20160101 ./configure --prefix=$HOME && make && make install Or if your system lacks 'make' you can simply copy src/parallel diff --git a/configure b/configure index 01b791ed..58a12fe9 100755 --- a/configure +++ b/configure @@ -1,6 +1,6 @@ #! /bin/sh # Guess values for system-dependent variables and create Makefiles. -# Generated by GNU Autoconf 2.69 for parallel 20151222. 
+# Generated by GNU Autoconf 2.69 for parallel 20160101. # # Report bugs to . # @@ -579,8 +579,8 @@ MAKEFLAGS= # Identity of this package. PACKAGE_NAME='parallel' PACKAGE_TARNAME='parallel' -PACKAGE_VERSION='20151222' -PACKAGE_STRING='parallel 20151222' +PACKAGE_VERSION='20160101' +PACKAGE_STRING='parallel 20160101' PACKAGE_BUGREPORT='bug-parallel@gnu.org' PACKAGE_URL='' @@ -1203,7 +1203,7 @@ if test "$ac_init_help" = "long"; then # Omit some internal or obsolete options to make the list less imposing. # This message is too long to be a string in the A/UX 3.1 sh. cat <<_ACEOF -\`configure' configures parallel 20151222 to adapt to many kinds of systems. +\`configure' configures parallel 20160101 to adapt to many kinds of systems. Usage: $0 [OPTION]... [VAR=VALUE]... @@ -1269,7 +1269,7 @@ fi if test -n "$ac_init_help"; then case $ac_init_help in - short | recursive ) echo "Configuration of parallel 20151222:";; + short | recursive ) echo "Configuration of parallel 20160101:";; esac cat <<\_ACEOF @@ -1345,7 +1345,7 @@ fi test -n "$ac_init_help" && exit $ac_status if $ac_init_version; then cat <<\_ACEOF -parallel configure 20151222 +parallel configure 20160101 generated by GNU Autoconf 2.69 Copyright (C) 2012 Free Software Foundation, Inc. @@ -1362,7 +1362,7 @@ cat >config.log <<_ACEOF This file contains any messages produced by compilers while running configure, to aid debugging if configure makes a mistake. -It was created by parallel $as_me 20151222, which was +It was created by parallel $as_me 20160101, which was generated by GNU Autoconf 2.69. Invocation command line was $ $0 $@ @@ -2225,7 +2225,7 @@ fi # Define the identity of the package. PACKAGE='parallel' - VERSION='20151222' + VERSION='20160101' cat >>confdefs.h <<_ACEOF @@ -2867,7 +2867,7 @@ cat >>$CONFIG_STATUS <<\_ACEOF || ac_write_fail=1 # report actual input values of CONFIG_FILES etc. instead of their # values after options handling. 
ac_log=" -This file was extended by parallel $as_me 20151222, which was +This file was extended by parallel $as_me 20160101, which was generated by GNU Autoconf 2.69. Invocation command line was CONFIG_FILES = $CONFIG_FILES @@ -2929,7 +2929,7 @@ _ACEOF cat >>$CONFIG_STATUS <<_ACEOF || ac_write_fail=1 ac_cs_config="`$as_echo "$ac_configure_args" | sed 's/^ //; s/[\\""\`\$]/\\\\&/g'`" ac_cs_version="\\ -parallel config.status 20151222 +parallel config.status 20160101 configured by $0, generated by GNU Autoconf 2.69, with options \\"\$ac_cs_config\\" diff --git a/configure.ac b/configure.ac index 0edb3d93..0bc961f3 100644 --- a/configure.ac +++ b/configure.ac @@ -1,4 +1,4 @@ -AC_INIT([parallel], [20151222], [bug-parallel@gnu.org]) +AC_INIT([parallel], [20160101], [bug-parallel@gnu.org]) AM_INIT_AUTOMAKE([-Wall -Werror foreign]) AC_CONFIG_HEADERS([config.h]) AC_CONFIG_FILES([ diff --git a/doc/release_new_version b/doc/release_new_version index ef44512c..3db0601c 100644 --- a/doc/release_new_version +++ b/doc/release_new_version @@ -212,9 +212,9 @@ cc:Tim Cuthbertson , Ryoichiro Suzuki , Jesse Alama -Subject: GNU Parallel 20151222 ('') released <<[stable]>> +Subject: GNU Parallel 20160122 ('') released <<[stable]>> -GNU Parallel 20151222 ('') <<[stable]>> has been released. It is available for download at: http://ftp.gnu.org/gnu/parallel/ +GNU Parallel 20160122 ('') <<[stable]>> has been released. It is available for download at: http://ftp.gnu.org/gnu/parallel/ <> @@ -227,11 +227,19 @@ Haiku of the month: New in this release: -* --transfer is now an alias for --transferfile {}. +* --sql DBURL uses DBURL as storage for jobs and output. It does not run any jobs so it requires at least one --sqlworker. DBURL must point to a table. -* --transferfile works like --transfer, but takes an argument like --return. 
This makes it possible to combine transferring files with multiple input sources: parallel -S server --tf {1} wc {2} {1} ::: * ::: -l -w -c +* --sqlworker DBURL gets jobs from DBURL and stores the result back to DBURL. -* total_jobs() can now be used in {= =}: parallel echo job {#} of '{= $_=total_jobs() =}' ::: {1..50} +* --sqlandworker is a shorthand for --sql and --sqlworker. + +* --sqlworker requires the output of a single job to fit in memory. + +* --results now also saves a file called 'seq' containing the sequence number. + +* If $PARALLEL_ENV is a file, then that file will be read into $PARALLEL_ENV. + +* man parallel_tutorial has been given an overhaul. * << kontakt GNU Parallel was used (unfortunately without citation) in: Instrumentation and Trace Analysis for Ad-hoc Python Workflows in Cloud Environments http://ieeexplore.ieee.org/xpl/articleDetails.jsp?arnumber=7214035>> @@ -249,17 +257,13 @@ for Big Data Applications https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumb * <> -* GNU Parallel was cited in: Evolution and Learning in Heterogeneous Environments http://research.gold.ac.uk/15078/1/COM_thesis_JonesD_2015.pdf +* GNU Parallel is used in LAST: http://last.cbrc.jp/ -* GNU Parallel was cited in: Contrasting genetic architectures of schizophrenia and other complex diseases using fast variance-components analysis http://www.nature.com/ng/journal/v47/n12/full/ng.3431.html +* GNU Parallel was cited in: Possum - A Framework for Three-Dimensional Reconstruction of Brain Images rfom Serial Sections http://link.springer.com/article/10.1007/s12021-015-9286-1 -* GNU Parallel was cited in: Efficient Retrieval of Key Material for Inspecting Potentially Malicious Traffic in the Cloud http://www.cs.bham.ac.uk/~bxb/Papres/2015.1.pdf +* GNU Parallel was used in: Mission Impossible: you have 1 minute to analyze the Ebola Genome https://www.biostars.org/p/119397 -* GNU Parallel was cited in: Achieving Consistent Doppler Measurements from SDO/HMI Vector Field 
Inversions http://arxiv.org/pdf/1511.06500.pdf - -* Flo uses GNU Parallel: https://github.com/wurmlab/flo - -* 使用 GNU parallel 來平行運算http://mutolisp.logdown.com/posts/316959-using-gnu-parallel-to-parallel-computing +* Distributed Log Search Using GNU Parallel http://blog.codehate.com/post/134320079974/distributed-log-search-using-gnu-parallel * Bug fixes and man page updates. diff --git a/src/Makefile.in b/src/Makefile.in index aa536945..d2675532 100644 --- a/src/Makefile.in +++ b/src/Makefile.in @@ -78,7 +78,7 @@ NORMAL_UNINSTALL = : PRE_UNINSTALL = : POST_UNINSTALL = : subdir = src -DIST_COMMON = $(srcdir)/Makefile.in $(srcdir)/Makefile.am README +DIST_COMMON = $(srcdir)/Makefile.in $(srcdir)/Makefile.am ACLOCAL_M4 = $(top_srcdir)/aclocal.m4 am__aclocal_m4_deps = $(top_srcdir)/configure.ac am__configure_deps = $(am__aclocal_m4_deps) $(CONFIGURE_DEPENDENCIES) \ diff --git a/src/niceload b/src/niceload index ff0f4847..9679af82 100755 --- a/src/niceload +++ b/src/niceload @@ -24,7 +24,7 @@ use strict; use Getopt::Long; $Global::progname="niceload"; -$Global::version = 20151222; +$Global::version = 20160101; Getopt::Long::Configure("bundling","require_order"); get_options_from_array(\@ARGV) || die_usage(); if($opt::version) { diff --git a/src/parallel b/src/parallel index 73c52f56..1e945f00 100755 --- a/src/parallel +++ b/src/parallel @@ -40,7 +40,7 @@ parse_options(); ::debug("init", "Open file descriptors: ", join(" ",keys %Global::fd), "\n"); my $number_of_args; if($Global::max_number_of_args) { - $number_of_args=$Global::max_number_of_args; + $number_of_args = $Global::max_number_of_args; } elsif ($opt::X or $opt::m or $opt::xargs) { $number_of_args = undef; } else { @@ -59,6 +59,15 @@ if($opt::pipepart) { @input_source_fh = (*STDIN); } } +if($opt::sql) { + # Create SQL table to hold joblog + output + $Global::sql->create_table($#input_source_fh+1); + if($opt::sqlworker) { + # Start a real --sqlworker in the background later + $Global::sqlworker = 1; + 
$opt::sqlworker = undef; + } +} if($opt::skip_first_line) { # Skip the first line for the first file handle @@ -751,6 +760,9 @@ sub options_hash { "m" => \$opt::m, "X" => \$opt::X, "v" => \@opt::v, + "sql=s" => \$opt::sql, + "sqlworker=s" => \$opt::sqlworker, + "sqlandworker=s" => \$opt::sqlandworker, "joblog=s" => \$opt::joblog, "results|result|res=s" => \$opt::results, "resume" => \$opt::resume, @@ -935,7 +947,7 @@ sub get_options_from_array { sub parse_options { # Returns: N/A init_globals(); - @ARGV=read_options(); + @ARGV = read_options(); # no-* overrides * if($opt::nokeeporder) { $opt::keeporder = undef; } @@ -960,6 +972,7 @@ sub parse_options { if(defined $opt::tmpdir) { $ENV{'TMPDIR'} = $opt::tmpdir; } $opt::nice ||= 0; if(defined $opt::help) { die_usage(); } + if(defined $opt::sqlandworker) { $opt::sql = $opt::sqlworker = $opt::sqlandworker; } if(defined $opt::colsep) { $Global::trim = 'lr'; } if(defined $opt::header) { $opt::colsep = defined $opt::colsep ? $opt::colsep : "\t"; } if(defined $opt::trim) { $Global::trim = $opt::trim; } @@ -1108,6 +1121,7 @@ sub parse_options { $opt::jobs = "100%"; } open_joblog(); + ($opt::sql or $opt::sqlworker) and $Global::sql = SQL->new($opt::sql || $opt::sqlworker); } sub check_invalid_option_combinations { @@ -1162,7 +1176,7 @@ sub check_invalid_option_combinations { sub init_globals { # Defaults: - $Global::version = 20151222; + $Global::version = 20160101; $Global::progname = 'parallel'; $Global::infinity = 2**31; $Global::debug = 0; @@ -1595,6 +1609,7 @@ sub read_options { Getopt::Long::Configure("bundling","require_order"); my @ARGV_copy = @ARGV; + my @ARGV_orig = @ARGV; # Check if there is a --profile to set @opt::profile get_options_from_array(\@ARGV_copy,"profile|J=s","plain") || die_usage(); my @ARGV_profile = (); @@ -1644,12 +1659,29 @@ sub read_options { get_options_from_array(\@ARGV_profile) || die_usage(); get_options_from_array(\@ARGV_env) || die_usage(); get_options_from_array(\@ARGV) || die_usage(); - + 
# What were the options given on the command line? + # Used to start --sqlworker + my $ai = arrayindex(\@ARGV_orig, \@ARGV); + @Global::options_in_argv = @ARGV_orig[0..$ai-1]; # Prepend non-options to @ARGV (such as commands like 'nice') unshift @ARGV, @ARGV_profile, @ARGV_env; return @ARGV; } +sub arrayindex { + # Similar to Perl's index function, but for arrays + # Input: + # $arr_ref1 = ref to @array1 to search in + # $arr_ref2 = ref to @array2 to search for + my ($arr_ref1,$arr_ref2) = @_; + my $array1_as_string = join "", map { "\257\257".$_ } @$arr_ref1; + my $array2_as_string = join "", map { "\257\257".$_ } @$arr_ref2; + my $i = index($array1_as_string,$array2_as_string,0); + if($i == -1) { return -1 } + my @before = split /\257\257/, substr($array1_as_string,0,$i); + return $#before; +} + sub read_args_from_command_line { # Arguments given on the command line after: # ::: ($Global::arg_sep) @@ -2322,9 +2354,27 @@ sub drain_job_queue { ::warning("There are no job slots available. 
Increase --jobs."); } } + while($opt::sql and not $Global::sql->finished()) { + # SQL master + $sleep = ::reap_usleep($sleep); + if($Global::sqlworker) { + # Start an SQL worker as we are now sure there is work to do + $Global::sqlworker = 0; + if(fork()) { + # skip + } else { + # Replace --sql/--sqlandworker with --sqlworker + my @ARGV = map { s/^--sql(andworker)?$/--sqlworker/; $_ } @Global::options_in_argv; + # exec the --sqlworker + exec($0,::shell_quote(@ARGV),@command); + } + } + } } while ($Global::total_running > 0 or - not $Global::start_no_new_jobs and not $Global::JobQueue->empty()); + not $Global::start_no_new_jobs and not $Global::JobQueue->empty() + or + $opt::sql and not $Global::sql->finished()); if($opt::progress) { my %progress = progress(); ::status("\r", $progress{'status'}, "\n"); @@ -3291,6 +3341,8 @@ sub reaper { my $stiff; my @pids_reaped; debug("run", "Reaper "); + # For efficiency surround with BEGIN/COMMIT when using $opt::sql + $opt::sql and $Global::sql->run("BEGIN;"); while (($stiff = waitpid(-1, &WNOHANG)) > 0) { # $stiff = pid of dead process push(@pids_reaped,$stiff); @@ -3348,6 +3400,7 @@ sub reaper { ::status("\r",$progress{'status'}); } } + $opt::sql and $Global::sql->run("COMMIT;"); debug("run", "done "); return @pids_reaped; } @@ -3741,6 +3794,13 @@ sub undef_as_empty { return $a ? 
$a : ""; } +sub undef_if_empty { + if(defined($_[0]) and $_[0] eq "") { + return undef; + } + return $_[0]; +} + sub multiply_binary_prefix { # Evalualte numbers with binary prefix # Ki=2^10, Mi=2^20, Gi=2^30, Ti=2^40, Pi=2^50, Ei=2^70, Zi=2^80, Yi=2^80 @@ -6092,6 +6152,15 @@ sub openoutputfiles { $dir = $opt::results."/".$args_as_dirname; File::Path::mkpath($dir); } + # prefix/name1/val1/name2/val2/seq + my $seqname = "$dir/seq"; + my $seqfhw; + if(not open($seqfhw, "+>", $seqname)) { + ::error("Cannot write to `$seqname'."); + ::wait_and_exit(255); + } + print $seqfhw $self->seq(); + close $seqfhw; # prefix/name1/val1/name2/val2/stdout $outname = "$dir/stdout"; if(not open($outfhw, "+>", $outname)) { @@ -6106,6 +6175,13 @@ sub openoutputfiles { } $self->set_fh(1,"unlink",""); $self->set_fh(2,"unlink",""); + if($opt::sqlworker) { + # Save the filenames in SQL table + $Global::sql->update("SET Stdout = ? WHERE Seq = ".$self->seq(), + $outname); + $Global::sql->update("SET Stderr = ? WHERE Seq = ".$self->seq(), + $errname); + } } elsif(not $opt::ungroup) { # To group we create temporary files for STDOUT and STDERR # To avoid the cleanup unlink the files immediately (but keep them open) @@ -6404,6 +6480,9 @@ sub set_starttime { my $self = shift; my $starttime = shift || ::now(); $self->{'starttime'} = $starttime; + $opt::sqlworker and + $Global::sql->update("SET Starttime = ? WHERE Seq = ".$self->seq(), + $starttime); } sub runtime { @@ -6425,6 +6504,9 @@ sub set_endtime { my $self = shift; my $endtime = shift; $self->{'endtime'} = $endtime; + $opt::sqlworker and + $Global::sql->update("SET JobRuntime = ? 
WHERE Seq = ".$self->seq(), + $self->runtime()); } sub is_timedout { @@ -6635,6 +6717,14 @@ sub wrapped { ';'; } if($ENV{'PARALLEL_ENV'}) { + if(-e $ENV{'PARALLEL_ENV'}) { + # This is a file/fifo: Replace envvar with content of file + open(my $parallel_env, "<", $ENV{'PARALLEL_ENV'}) || + ::die_bug("Cannot read parallel_env from $ENV{'PARALLEL_ENV'}"); + local $/; + $ENV{'PARALLEL_ENV'} = <$parallel_env>; + close $parallel_env; + } # If $PARALLEL_ENV set, put that in front of the command # Used for importing functions for fish # Map \001 to \n to make it easer to quote \n in $PARALLEL_ENV @@ -6664,8 +6754,11 @@ sub wrapped { and length $command > 499) { # csh does not like words longer than 1000 (499 quoted) - $command = "perl -e '".base64_zip_eval()."' ". - join" ",string_zip_base64('exec "'.::perl_quote_scalar($command).'"'); + # bzip2 breaks --sql mysql://... + # $command = "perl -e '".base64_zip_eval()."' ". + # join" ",string_zip_base64('exec "'.::perl_quote_scalar($command).'"'); + $command = "perl -e '".base64_eval()."' ". + join" ",string_base64('exec "'.::perl_quote_scalar($command).'"'); } $self->{'wrapped'} = $command; } @@ -6678,6 +6771,9 @@ sub set_sshlogin { $self->{'sshlogin'} = $sshlogin; delete $self->{'sshlogin_wrap'}; # If sshlogin is changed the wrap is wrong delete $self->{'wrapped'}; + $opt::sqlworker and + $Global::sql->update("SET Host = ? WHERE Seq = ".$self->seq(), + $sshlogin->string()); } sub sshlogin { @@ -6685,6 +6781,18 @@ sub sshlogin { return $self->{'sshlogin'}; } +sub string_base64 { + # Base64 encode it into 1000 byte blocks. + # 1000 bytes is the largest word size csh supports + # Input: + # @strings = to be encoded + # Returns: + # @base64 = 1000 byte block + $Global::use{"MIME::Base64"} ||= eval "use MIME::Base64; 1;"; + my @base64 = unpack("(A1000)*",encode_base64((join"",@_),"")); + return @base64; +} + sub string_zip_base64 { # Pipe string through 'bzip2 -9' and base64 encode it into 1000 # byte blocks. 
@@ -6707,7 +6815,7 @@ sub string_zip_base64 { close $zipin_fh; exit; } - ::debug("base64","Orig:@_\nAs base64:@base64\n"); + ::debug("base64","Orig:@_\nAs bzip2 base64:@base64\n"); return @base64; } @@ -6725,11 +6833,11 @@ sub base64_zip_eval { @GNU_Parallel=("use","IPC::Open3;","use","MIME::Base64"); eval "@GNU_Parallel"; - $SIG{CHLD}="IGNORE"; - # Search for bzip2. Not found => use default path + $SIG{CHLD}="IGNORE"; + # Search for bzip2. Not found => use default path my $zip = (grep { -x $_ } "/usr/local/bin/bzip2")[0] || "bzip2"; - # $in = stdin on $zip, $out = stdout from $zip - my($in, $out,$eval); + # $in = stdin on $zip, $out = stdout from $zip + my($in, $out,$eval); open3($in,$out,">&STDERR",$zip,"-dc"); if(my $perlpid = fork) { close $in; @@ -6742,7 +6850,27 @@ sub base64_zip_eval { close $in; exit; } - wait; + wait; + eval $eval; + }); + ::debug("base64",$script,"\n"); + return $script; +} + +sub base64_eval { + # Script that: + # * reads base64 strings from @ARGV + # * decodes them + # * evals the result + # Reverse of string_base64 + eval + # Will be wrapped in ' so single quote is forbidden + # Returns: + # $script = 1-liner for perl -e + my $script = ::spacefree(0,q{ + @GNU_Parallel=("use","IPC::Open3;","use","MIME::Base64"); + eval "@GNU_Parallel"; + my $eval; + $eval = decode_base64(join"",@ARGV); eval $eval; }); ::debug("base64",$script,"\n"); @@ -6913,8 +7041,11 @@ sub sshlogin_wrap { $command =~ /\n/) { # csh does not deal well with > 1000 chars in one word # csh does not deal well with $ENV with \n - $env_command = "perl -e '".base64_zip_eval()."' ". - join" ",string_zip_base64($env_command); + # bzip2 breaks --sql mysql://... + # $env_command = "perl -e '".base64_zip_eval()."' ". + # join" ",string_zip_base64($env_command); + $env_command = "perl -e '".base64_eval()."' ". 
+ join" ",string_base64($env_command); $self->{'sshlogin_wrap'} = $env_command; } else { $self->{'sshlogin_wrap'} = "perl -e ".::shell_quote_scalar($env_command); @@ -6942,8 +7073,11 @@ sub sshlogin_wrap { $command =~ /\n/) { # csh does not deal well with > 1000 chars in one word # csh does not deal well with $ENV with \n - $quoted_remote_command = "perl -e \\''".base64_zip_eval()."'\\' ". - join" ",string_zip_base64($remote_command); + # bzip2 breaks --sql mysql://... + # $quoted_remote_command = "perl -e \\''".base64_zip_eval()."'\\' "."". + # join" ",string_zip_base64($remote_command); + $quoted_remote_command = "perl -e \\''".base64_eval()."'\\' ". + join" ",string_base64($remote_command); } else { $quoted_remote_command = $dq_remote_command; } @@ -6999,6 +7133,9 @@ sub add_transfersize { my $self = shift; my $transfersize = shift; $self->{'transfersize'} += $transfersize; + $opt::sqlworker and + $Global::sql->update("SET Send = ? WHERE Seq = ".$self->seq(), + $self->{'transfersize'}); } sub sshtransfer { @@ -7041,6 +7178,9 @@ sub add_returnsize { my $self = shift; my $returnsize = shift; $self->{'returnsize'} += $returnsize; + $opt::sqlworker and + $Global::sql->update("SET Receive = ? WHERE Seq = ".$self->seq(), + $self->{'returnsize'}); } sub sshreturn { @@ -7275,10 +7415,10 @@ sub start { } $job->openoutputfiles(); my($stdout_fh,$stderr_fh) = ($job->fh(1,"w"),$job->fh(2,"w")); - if($opt::ungroup) { + if($opt::ungroup or $opt::sqlworker) { print_dryrun_and_verbose($stdout_fh,$job,$command); } - if($opt::dryrun) { $command = "true"; } + if($opt::dryrun or $opt::sql) { $command = "true"; } $ENV{'PARALLEL_SEQ'} = $job->seq(); $ENV{'PARALLEL_PID'} = $$; $ENV{'PARALLEL_TMP'} = ::tmpname("par"); @@ -7381,6 +7521,10 @@ sub print_dryrun_and_verbose { print $stdout_fh $command,"\n"; } } + if($opt::sqlworker) { + $Global::sql->update("SET Command = ? 
WHERE Seq = ".$job->seq(), + $job->replaced()); + } } { @@ -7567,7 +7711,11 @@ sub print { if(($opt::dryrun or $Global::verbose) and - not $self->{'verbose_printed'}) { + not $self->{'verbose_printed'} + and + not $opt::sql + and + not $opt::sqlworker) { $self->{'verbose_printed'}++; if($Global::verbose <= 1) { print STDOUT $self->replaced(),"\n"; @@ -7638,6 +7786,10 @@ sub files_print { } } elsif($fdno == 1 and $self->fh($fdno,"name")) { print $out_fd $self->tag(),$self->fh($fdno,"name"),"\n"; + if($opt::sqlworker) { + $Global::sql->update("SET Stdout = ? WHERE Seq = ".$self->seq(), + $self->tag().$self->fh($fdno,"name")); + } $self->add_returnsize(-s $self->fh($fdno,"name")); } } @@ -7781,12 +7933,25 @@ sub normal_print { seek $in_fh, 0, 0; # $in_fh is now ready for reading at position 0 my $outputlength = 0; + my @output; while(sysread($in_fh,$buf,131072)) { print $out_fd $buf; $outputlength += length $buf; + if($opt::sqlworker) { + push @output, $buf; + } } if($fdno == 1) { $self->add_returnsize($outputlength); + if($opt::sqlworker and not $opt::results) { + $Global::sql->update("SET Stdout = ? WHERE Seq = ".$self->seq(), + join("",@output)); + } + } else { + if($opt::sqlworker and not $opt::results) { + $Global::sql->update("SET Stderr = ? WHERE Seq = ".$self->seq(), + join("",@output)); + } } close $in_fh; if($? and $opt::compress) { @@ -7851,6 +8016,9 @@ sub set_exitstatus { # Status may have been set by --timeout $self->{'exitstatus'} ||= $exitstatus; } + $opt::sqlworker and + $Global::sql->update("SET Exitval = ? WHERE Seq = ".$self->seq(), + $exitstatus); } sub reset_exitstatus { @@ -7867,9 +8035,11 @@ sub set_exitsignal { my $self = shift; my $exitsignal = shift; $self->{'exitsignal'} = $exitsignal; + $opt::sqlworker and + $Global::sql->update("SET _Signal = ? 
WHERE Seq = ".$self->seq(), + $exitsignal); } - { my $status_printed; my $total_jobs; @@ -8092,6 +8262,10 @@ sub populate { } } } + if($opt::sql) { + # Insert the V1..Vn for this $seq in SQL table instead of generating one + $Global::sql->insert_records($self->seq(),$self->{'arg_list_flat_orig'}); + } } sub push { @@ -8715,6 +8889,10 @@ sub get { $self->{'len'}, ); $cmd_line->populate(); + if($opt::sqlworker) { + # Get the sequence number from the SQL table + $cmd_line->set_seq($SQL::next_seq); + } ::debug("init","cmd_line->number_of_args ", $cmd_line->number_of_args(), "\n"); if(not $Global::no_more_input and ($opt::pipe or $opt::pipepart)) { @@ -8893,7 +9071,10 @@ sub new { my $colsep = shift; my @unget = (); my $arg_sub_queue; - if($colsep) { + if($opt::sqlworker) { + # Open SQL table + $arg_sub_queue = SQLRecordQueue->new(); + } elsif($colsep) { # Open one file with colsep $arg_sub_queue = RecordColQueue->new($fhs); } else { @@ -8978,7 +9159,7 @@ sub get { if(@{$self->{'unget'}}) { return shift @{$self->{'unget'}}; } - my $unget_ref=$self->{'unget'}; + my $unget_ref = $self->{'unget'}; if($self->{'arg_sub_queue'}->empty()) { return undef; } @@ -9017,6 +9198,45 @@ sub empty { } +package SQLRecordQueue; + +sub new { + my $class = shift; + my @unget = (); + return bless { + 'unget' => \@unget, + }, ref($class) || $class; +} + +sub get { + # Returns: + # reference to array of Arg-objects + my $self = shift; + if(@{$self->{'unget'}}) { + return shift @{$self->{'unget'}}; + } + return $Global::sql->get_record(); +} + +sub unget { + my $self = shift; + ::debug("run", "SQLRecordQueue-unget '@_'\n"); + unshift @{$self->{'unget'}}, @_; +} + +sub empty { + my $self = shift; + if(@{$self->{'unget'}}) { return 0; } + my $get = $self->get(); + if(defined $get) { + $self->unget($get); + } + my $empty = not $get; + ::debug("run", "SQLRecordQueue->empty $empty"); + return $empty; +} + + package MultifileQueue; @Global::unget_argv=(); @@ -9463,6 +9683,323 @@ sub insert { } 
+package SQL; + +sub new { + my $class = shift; + my $dburl = shift; + $Global::use{"DBI"} ||= eval "use DBI; 1;"; + my %options = parse_dburl(get_alias($dburl)); + my %driveralias = ("sqlite" => "SQLite", + "sqlite3" => "SQLite", + "pg" => "Pg", + "postgres" => "Pg", + "postgresql" => "Pg"); + my $driver = $driveralias{$options{'databasedriver'}} || $options{'databasedriver'}; + my $database = $options{'database'}; + my $host = $options{'host'} ? ";host=".$options{'host'} : ""; + my $port = $options{'port'} ? ";port=".$options{'port'} : ""; + my $dsn = "DBI:$driver:dbname=$database$host$port"; + my $userid = $options{'user'}; + my $password = $options{'password'};; + my $dbh = DBI->connect($dsn, $userid, $password, { RaiseError => 1 }) + or die $DBI::errstr; + return bless { + 'dbh' => $dbh, + 'max_number_of_args' => undef, + 'table' => $options{'table'}, + }, ref($class) || $class; +} + +sub get_alias { + my $alias = shift; + $alias =~ s/^(sql:)*//; # Accept aliases prepended with sql: + if ($alias !~ /^:/) { + return $alias; + } + + # Find the alias + my $path; + if (-l $0) { + ($path) = readlink($0) =~ m|^(.*)/|; + } else { + ($path) = $0 =~ m|^(.*)/|; + } + + my @deprecated = ("$ENV{HOME}/.dburl.aliases", + "$path/dburl.aliases", "$path/dburl.aliases.dist"); + for (@deprecated) { + if(-r $_) { + print STDERR "$_ is deprecated. 
Use .sql/aliases instead (read man sql)\n"; + } + } + my @urlalias=(); + check_permissions("$ENV{HOME}/.sql/aliases"); + check_permissions("$ENV{HOME}/.dburl.aliases"); + my @search = ("$ENV{HOME}/.sql/aliases", + "$ENV{HOME}/.dburl.aliases", "/etc/sql/aliases", + "$path/dburl.aliases", "$path/dburl.aliases.dist"); + for my $alias_file (@search) { + if(-r $alias_file) { + push @urlalias, `cat "$alias_file"`; + } + } + my ($alias_part,$rest) = $alias=~/(:\w*)(.*)/; + # If we saw this before: we have an alias loop + if(grep {$_ eq $alias_part } @Private::seen_aliases) { + print STDERR "$alias_part is a cyclic alias\n"; + exit -1; + } else { + push @Private::seen_aliases, $alias_part; + } + + my $dburl; + for (@urlalias) { + /^$alias_part\s+(\S+.*)/ and do { $dburl = $1; last; } + } + + if($dburl) { + return get_alias($dburl.$rest); + } else { + Usage("$alias is not defined in @search"); + exit(-1); + } +} + +sub check_permissions { + my $file = shift; + + if(-e $file) { + if(not -o $file) { + my $username = (getpwuid($<))[0]; + print STDERR "$file should be owned by $username: chown $username $file\n"; + } + my ($dev,$ino,$mode,$nlink,$uid,$gid,$rdev,$size, + $atime,$mtime,$ctime,$blksize,$blocks) = stat($file); + if($mode & 077) { + my $username = (getpwuid($<))[0]; + print STDERR "$file should be only be readable by $username: chmod 600 $file\n"; + } + } +} + +sub parse_dburl { + my $url = shift; + my %options = (); + # sql:mysql://[[user][:password]@][host][:port]/[database[/table][?sql query]] + + if($url=~m!(?:sql:)? # You can prefix with 'sql:' + ((?:oracle|ora|mysql|pg|postgres|postgresql)(?:s|ssl|)| + (?:sqlite|sqlite2|sqlite3)):// # Databasedriver ($1) + (?: + ([^:@/][^:@]*|) # Username ($2) + (?: + :([^@]*) # Password ($3) + )? + @)? + ([^:/]*)? # Hostname ($4) + (?: + : + ([^/]*)? # Port ($5) + )? + (?: + / + ([^/?]*)? # Database ($6) + )? + (?: + / + ([^?]*)? # Table ($7) + )? + (?: + \? + (.*)? # Query ($8) + )? 
+ !ix) { + $options{databasedriver} = ::undef_if_empty(lc(uri_unescape($1))); + $options{user} = ::undef_if_empty(uri_unescape($2)); + $options{password} = ::undef_if_empty(uri_unescape($3)); + $options{host} = ::undef_if_empty(uri_unescape($4)); + $options{port} = ::undef_if_empty(uri_unescape($5)); + $options{database} = ::undef_if_empty(uri_unescape($6)); + $options{table} = ::undef_if_empty(uri_unescape($7)); + $options{query} = ::undef_if_empty(uri_unescape($8)); + ::debug("sql","dburl $url\n"); + ::debug("sql","databasedriver ",$options{databasedriver}, " user ", $options{user}, + " password ", $options{password}, " host ", $options{host}, + " port ", $options{port}, " database ", $options{database}, + " table ",$options{table}," query ",$options{query}, "\n"); + + } else { + ::error("$url is not a valid DBURL"); + exit 255; + } + return %options; +} + +sub uri_unescape { + # Copied from http://cpansearch.perl.org/src/GAAS/URI-1.55/URI/Escape.pm + # to avoid depending on URI::Escape + # This section is (C) Gisle Aas. 
+ # Note from RFC1630: "Sequences which start with a percent sign + # but are not followed by two hexadecimal characters are reserved + # for future extension" + my $str = shift; + if (@_ && wantarray) { + # not executed for the common case of a single argument + my @str = ($str, @_); # need to copy + foreach (@str) { + s/%([0-9A-Fa-f]{2})/chr(hex($1))/eg; + } + return @str; + } + $str =~ s/%([0-9A-Fa-f]{2})/chr(hex($1))/eg if defined $str; + $str; +} + +sub run { + my $self = shift; + my $stmt = shift; + my @retval; + my $dbh = $self->{'dbh'}; + ::debug("sql","$opt::sql$opt::sqlworker run $stmt\n"); + # Execute with the rest of the args - if any + my $rv; + my $sth; + my $lockretry = 0; + while($lockretry < 10) { + $sth = $dbh->prepare($stmt); + if($rv = $sth->execute(@_)) { + last; + } else { + if($DBI::errstr =~ /locked/) { + ::debug("sql","Lock retry: $lockretry"); + $lockretry++; + } else { + ::error($DBI::errstr); + } + } + } + if($rv < 0){ + print $DBI::errstr; + } + return $sth; +} + +sub get { + my $self = shift; + my $sth = $self->run(@_); + my @retval; + while(1) { + my @row = $sth->fetchrow_array(); + @row or last; + push @retval, \@row; + } + return \@retval; +} + +sub table { + my $self = shift; + return $self->{'table'}; +} + +sub update { + my $self = shift; + my $stmt = shift; + my $table = $self->table(); + $self->run("UPDATE $table $stmt",@_); +} + +sub max_number_of_args { + # Maximal number of args for this table + my $self = shift; + if(not $self->{'max_number_of_args'}) { + # Read the number of args from the SQL table + my $table = $self->table(); + my $v = $self->get("SELECT * FROM $table LIMIT 1;"); + my @reserved_columns = qw(Seq Host Starttime JobRuntime Send + Receive Exitval _Signal Command Stdout Stderr); + if(not $v) { + ::error("$table contains no records"); + } + # Count the number of Vx columns + $self->{'max_number_of_args'} = $#{$v->[0]} - $#reserved_columns; + } + return $self->{'max_number_of_args'}; +} + +sub 
set_max_number_of_args { + my $self = shift; + $self->{'max_number_of_args'} = shift; +} + +sub create_table { + my $self = shift; + my $max_number_of_args = shift; + $self->set_max_number_of_args($max_number_of_args); + my $table = $self->table(); + $self->run(qq(DROP TABLE IF EXISTS $table;)); + my $v_def = join "", map { "V$_ TEXT," } (1..$self->max_number_of_args()); + $self->run(qq{CREATE TABLE $table + (Seq INT, + Host TEXT, + Starttime REAL, + JobRuntime REAL, + Send INT, + Receive INT, + Exitval INT, + _Signal INT, + Command TEXT,}. + $v_def. + qq{Stdout TEXT, + Stderr TEXT);}); +} + +sub insert_records { + my $self = shift; + my $seq = shift; + my $record_ref = shift; + my $table = $self->table(); + my $v_cols = join ",", map { "V$_" } (1..$self->max_number_of_args()); + # Two extra value due to $seq, Exitval + my $v_vals = join ",", map { "?" } (1..$self->max_number_of_args()+2); + $self->run("INSERT INTO $table (Seq,Exitval,$v_cols) ". + "VALUES ($v_vals);", $seq, -1000, @$record_ref[1..$#$record_ref]); +} + +sub get_record { + my $self = shift; + my @retval; + my $table = $self->table(); + my $v_cols = join ",", map { "V$_" } (1..$self->max_number_of_args()); + my $v = $self->get("SELECT Seq, $v_cols FROM $table ". + "WHERE Exitval = -1000 ORDER BY Seq LIMIT 1;"); + if($v->[0]) { + my $val_ref = $v->[0]; + # Mark record as taken + my $seq = shift @$val_ref; + # Save the sequence number to use when running the job + $SQL::next_seq = $seq; + $self->update("SET Exitval = ? 
WHERE Seq = ".$seq, -1220); + for (@$val_ref) { + push @retval, Arg->new($_); + } + } + if(@retval) { + return \@retval; + } else { + return undef; + } +} + +sub finished { + # Check if there are any jobs left in the SQL table that do not + # have a "real" exitval + my $self = shift; + my $table = $self->table(); + my $rv = $self->get("select Seq,Exitval from $table where Exitval <= -1000 limit 1"); + return not $rv->[0]; +} + package Semaphore; # This package provides a counting semaphore diff --git a/src/parallel.pod b/src/parallel.pod index eea52090..f4ececf0 100644 --- a/src/parallel.pod +++ b/src/parallel.pod @@ -514,7 +514,7 @@ should feel free to use B<--will-cite>. Size of block in bytes to read at a time. The I can be postfixed with K, M, G, T, P, k, m, g, t, or p which would multiply the size with 1024, 1048576, 1073741824, 1099511627776, 1125899906842624, 1000, -1000000, 1000000000, 1000000000000, or 1000000000000000 respectively. +1000000, 1000000000, 1000000000000, or 1000000000000000, respectively. GNU B tries to meet the block size but can be off by the length of one record. For performance reasons I should be bigger @@ -1088,7 +1088,7 @@ most likely do what is needed. Multiple arguments. Insert as many arguments as the command line length permits. If multiple jobs are being run in parallel: distribute -the arguments evenly among the jobs. Use B<-j1> to avoid this. +the arguments evenly among the jobs. Use B<-j1> or B<--xargs> to avoid this. If B<{}> is not used the arguments will be appended to the line. If B<{}> is used multiple times each B<{}> will be replaced @@ -1106,7 +1106,7 @@ Minimum memory free when starting another job. The I can be postfixed with K, M, G, T, P, k, m, g, t, or p which would multiply the size with 1024, 1048576, 1073741824, 1099511627776, 1125899906842624, 1000, 1000000, 1000000000, 1000000000000, or -1000000000000000 respectively. +1000000000000000, respectively. 
If the jobs take up very different amount of RAM, GNU B will only start as many as there is memory for. If less than I bytes @@ -1791,6 +1791,50 @@ Do not use the first line of input (used by GNU B itself when called with B<--shebang>). +=item B<--sql> I (alpha testing) + +Submit jobs via SQL server. I must point to a table, which will +contain the same information as B<--joblog>, the values from the input +sources (stored in columns V1 .. Vn), and the output (stored in +columns Stdout and Stderr). + +The table will be dropped and created with the correct amount of +V-columns. + +B<--sql> does not run any jobs, but it creates the values for the jobs +to be run and wait for them to complete. One or more B<--sqlworker> +must be run to actually execute the jobs. + +The format of a DBURL is: + + [sql:]vendor://[[user][:password]@][host][:port]/[database]/table + +E.g. + + sql:mysql://hr:hr@localhost:3306/hrdb/jobs + mysql://scott:tiger@my.example.com/pardb/paralleljobs + sql:oracle://scott:tiger@ora.example.com/xe/parjob + postgresql://scott:tiger@pg.example.com/pgdb/parjob + pg:///parjob + sqlite3:///pardb/parjob + +It can also be an alias from ~/.sql/aliases: + + :myalias mysql:///mydb/paralleljobs + + +=item B<--sqlandworker> I (alpha testing) + +Shorthand for: B<--sql> I B<--sqlworker> I. + + +=item B<--sqlworker> I (alpha testing) + +Execute jobs via SQL server. Read the input sources variables from the +table pointed to by I. The I on the command line +should be the same as given by B<--sql>. + + =item B<--ssh> I GNU B defaults to using B for remote access. This can @@ -2579,7 +2623,8 @@ files. tar xvf foo.tgz | perl -ne 'print $l;$l=$_;END{print $l}' | \ parallel echo -The Perl one-liner is needed to avoid race condition. +The Perl one-liner is needed to make sure the file is complete before +handing it to GNU B. =head1 EXAMPLE: Rewriting a for-loop and a while-read-loop @@ -3410,6 +3455,35 @@ computers: true >jobqueue; tail -n+0 -f jobqueue | parallel -S .. 
+If you keep this running for a long time, jobqueue will grow. A way of +removing the jobs already run is by making GNU B stop when +it hits a special value and then restart. To use B<--eof> to make GNU +B exit, B also needs to be forced to exit: + + true >jobqueue; + while true; do + tail -n+0 -f jobqueue | + (parallel -E StOpHeRe -S ..; echo GNU Parallel is now done; + perl -e 'while(<>){/StOpHeRe/ and last};print <>' jobqueue > j2; + (seq 1000 >> jobqueue &); + echo Done appending dummy data forcing tail to exit) + echo tail exited; + mv j2 jobqueue + done + +In some cases you can run on more CPUs and computers during the night: + + # Day time + echo 50% > jobfile + cp day_server_list ~/.parallel/sshloginfile + # Night time + echo 100% > jobfile + cp night_server_list ~/.parallel/sshloginfile + tail -n+0 -f jobqueue | parallel --jobs jobfile -S .. + +GNU Parallel discovers if B or B<~/.parallel/sshloginfile> +changes. + There is a a small issue when using GNU B as queue system/batch manager: You have to submit JobSlot number of jobs before they will start, and after that you can submit one at a time, and job @@ -3421,14 +3495,6 @@ E.g. if you have 10 jobslots then the output from the first completed job will only be printed when job 11 has started, and the output of second completed job will only be printed when job 12 has started. -To use B<--eof> to make GNU B exit, B also needs to be -forced to exit: - - tail -n+0 -f command-list.txt | - (parallel --eof=EXIT {}; echo Parallel is now done; - (seq 1000 >> command-list.txt &); - echo Done appending dummy data forcing tail to exit) - =head1 EXAMPLE: GNU Parallel as dir processor @@ -3773,6 +3839,26 @@ More than 100 jobs failed. Other error. +=item Z<>-1 (In joblog and SQL table) + +Killed by Ctrl-C, timeout, not enough memory or similar. + +=item Z<>-2 (In joblog and SQL table) + +$job->skip() was called in {= =}. + +=item Z<>-1200 (In SQL table) + +Job is ready to run (used with --sql). 
+ +=item Z<>-1220 (In SQL table) + +Job is taken by worker to be started (used with --sql). + +=item Z<>-1250 (In SQL table) + +Job is running (used with --sql). + =back If fail=1 is used, the exit status will be the exit status of the diff --git a/src/parallel_design.pod b/src/parallel_design.pod index 4ff06cdc..cda28c58 100644 --- a/src/parallel_design.pod +++ b/src/parallel_design.pod @@ -32,7 +32,7 @@ is CentOS 3.9 and Perl 5.8.0. GNU B busy waits. This is because the reason why a job is not started may be due to load average, and thus it will not make sense to wait for a job to finish. Instead the load average must be -checked again. Load average is not the only reason: --timeout has a +checked again. Load average is not the only reason: B<--timeout> has a similar problem. To not burn up too much CPU GNU B sleeps exponentially @@ -56,14 +56,13 @@ The easiest way to explain what GNU B does is to assume that there are a number of job slots, and when a slot becomes available a job from the queue will be run in that slot. But originally GNU B did not model job slots in the code. Job slots have been -added to make it possible to use {%} as a replacement string. +added to make it possible to use B<{%}> as a replacement string. -While the job -sequence number can be computed in advance, the job slot can only be -computed the moment a slot becomes available. So it has been -implemented as a stack with lazy evaluation: Draw one from an empty -stack and the stack is extended by one. When a job is done, push the -available job slot back on the stack. +While the job sequence number can be computed in advance, the job slot +can only be computed the moment a slot becomes available. So it has +been implemented as a stack with lazy evaluation: Draw one from an +empty stack and the stack is extended by one. When a job is done, push +the available job slot back on the stack. 
This implementation also means that if you use remote executions, you cannot assume that a given job slot will remain on the same remote @@ -89,7 +88,7 @@ B<--compress> compresses the data in the temporary files. This is a bit tricky because there should be no files to clean up if GNU B is killed by a power outage. -GNU B first selects a compress program. If the user has not +GNU B first selects a compression program. If the user has not selected one, the first of these that are in $PATH is used: B. They are sorted by speed on a 16 core machine. @@ -102,16 +101,16 @@ Schematically the setup is as follows: The setup is duplicated for both standard output (stdout) and standard error (stderr). -GNU B pipes output from the command run into the compress +GNU B pipes output from the command run into the compression program which saves to a tmpfile. GNU B records the pid of the compress program. At the same time a small perl script (called B above) is started: It basically does B followed by B, but it also removes the tmpfile as soon as the first byte -is read, and it continously checks if the pid of the compress program -is dead. If the compress program is dead, B reads the rest of -tmpfile and exits. +is read, and it continously checks if the pid of the compression +program is dead. If the compress program is dead, B reads the +rest of tmpfile and exits. -As most compress programs write out a header when they start, the +As most compression programs write out a header when they start, the tmpfile in practice is unlinked after around 40 ms. @@ -134,16 +133,12 @@ Local: B =item --cat -cat > {}; I {}; -perl -e '$bash = shift; - $csh = shift; - for(@ARGV) { - unlink;rmdir; - } - if($bash =~ s/h//) { - exit $bash; - } - exit $csh;' "$?h" "$status" {}; + cat > {}; I {}; + perl -e '$bash = shift; + $csh = shift; + for(@ARGV) { unlink;rmdir; } + if($bash =~ s/h//) { exit $bash; } + exit $csh;' "$?h" "$status" {}; {} is set to $PARALLEL_TMP which is a tmpfile. 
The Perl script saves the exit value, unlinks the tmpfile, and returns the exit value - no @@ -151,22 +146,22 @@ matter if the shell is B (using $?) or B<*csh> (using $status). =item --fifo -perl -e '($s,$c,$f) = @ARGV; - # mkfifo $PARALLEL_TMP - system "mkfifo", $f; - # spawn $shell -c $command & - $pid = fork || exec $s, "-c", $c; - open($o,">",$f) || die $!; - # cat > $PARALLEL_TMP - while(sysread(STDIN,$buf,131072)){ - syswrite $o, $buf; - } - close $o; - # waitpid to get the exit code from $command - waitpid $pid,0; - # Cleanup - unlink $f; - exit $?/256;' I I $PARALLEL_TMP + perl -e '($s,$c,$f) = @ARGV; + # mkfifo $PARALLEL_TMP + system "mkfifo", $f; + # spawn $shell -c $command & + $pid = fork || exec $s, "-c", $c; + open($o,">",$f) || die $!; + # cat > $PARALLEL_TMP + while(sysread(STDIN,$buf,131072)){ + syswrite $o, $buf; + } + close $o; + # waitpid to get the exit code from $command + waitpid $pid,0; + # Cleanup + unlink $f; + exit $?/256;' I I $PARALLEL_TMP This is an elaborate way of: mkfifo {}; run I in the background using I; copying STDIN to {}; waiting for background @@ -214,19 +209,19 @@ B<$_EXIT_status>: see B<--return> above. =item --pipe -perl -e 'if(sysread(STDIN, $buf, 1)) { - open($fh, "|-", "@ARGV") || die; - syswrite($fh, $buf); - # Align up to 128k block - if($read = sysread(STDIN, $buf, 131071)) { - syswrite($fh, $buf); - } - while($read = sysread(STDIN, $buf, 131072)) { - syswrite($fh, $buf); - } - close $fh; - exit ($?&127 ? 128+($?&127) : 1+$?>>8) - }' I -c I + perl -e 'if(sysread(STDIN, $buf, 1)) { + open($fh, "|-", "@ARGV") || die; + syswrite($fh, $buf); + # Align up to 128k block + if($read = sysread(STDIN, $buf, 131071)) { + syswrite($fh, $buf); + } + while($read = sysread(STDIN, $buf, 131072)) { + syswrite($fh, $buf); + } + close $fh; + exit ($?&127 ? 128+($?&127) : 1+$?>>8) + }' I -c I This small wrapper makes sure that I will never be run if there is no data. @@ -261,8 +256,6 @@ the FIFO, and this value is used as exit value. 
To make it compatible with B and B the exit value is printed as: $?h/$status and this is parsed by B. -Works in B. - There is a bug that makes it necessary to print the exit value 3 times. @@ -272,17 +265,17 @@ are added to the title to force it to be outside the limits. You can map the bad limits using: -perl -e 'sub r { int(rand(shift)).($_[0] && "\t".r(@_)) } print map { r(@ARGV)."\n" } 1..10000' 1600 1500 90 | - perl -ane '$F[0]+$F[1]+$F[2] < 2037 and print ' | - parallel --colsep '\t' --tagstring '{1}\t{2}\t{3}' tmux -S /tmp/p{%}-'{=3 $_="O"x$_ =}' \ - new-session -d -n '{=1 $_="O"x$_ =}' true'\ {=2 $_="O"x$_ =};echo $?;rm -f /tmp/p{%}-O*' + perl -e 'sub r { int(rand(shift)).($_[0] && "\t".r(@_)) } print map { r(@ARGV)."\n" } 1..10000' 1600 1500 90 | + perl -ane '$F[0]+$F[1]+$F[2] < 2037 and print ' | + parallel --colsep '\t' --tagstring '{1}\t{2}\t{3}' tmux -S /tmp/p{%}-'{=3 $_="O"x$_ =}' \ + new-session -d -n '{=1 $_="O"x$_ =}' true'\ {=2 $_="O"x$_ =};echo $?;rm -f /tmp/p{%}-O*' -perl -e 'sub r { int(rand(shift)).($_[0] && "\t".r(@_)) } print map { r(@ARGV)."\n" } 1..10000' 17000 17000 90 | - parallel --colsep '\t' --tagstring '{1}\t{2}\t{3}' \ -tmux -S /tmp/p{%}-'{=3 $_="O"x$_ =}' new-session -d -n '{=1 $_="O"x$_ =}' true'\ {=2 $_="O"x$_ =};echo $?;rm /tmp/p{%}-O*' -> value.csv 2>/dev/null + perl -e 'sub r { int(rand(shift)).($_[0] && "\t".r(@_)) } print map { r(@ARGV)."\n" } 1..10000' 17000 17000 90 | + parallel --colsep '\t' --tagstring '{1}\t{2}\t{3}' \ + tmux -S /tmp/p{%}-'{=3 $_="O"x$_ =}' new-session -d -n '{=1 $_="O"x$_ =}' true'\ {=2 $_="O"x$_ =};echo $?;rm /tmp/p{%}-O*' + > value.csv 2>/dev/null -R -e 'a<-read.table("value.csv");X11();plot(a[,1],a[,2],col=a[,3]+5,cex=0.1);Sys.sleep(1000)' + R -e 'a<-read.table("value.csv");X11();plot(a[,1],a[,2],col=a[,3]+5,cex=0.1);Sys.sleep(1000)' For B 17000 can be lowered to 2100. 
@@ -306,23 +299,6 @@ B<--pipepart>/B<--pipe> should be done on the local machine inside B<--tmux> =back -=head2 --block-size adjustment - -Every time GNU B detects a record bigger than -B<--block-size> it increases the block size by 30%. A small -B<--block-size> gives very poor performance; by exponentially -increasing the block size performance will not suffer. - -GNU B will waste CPU power if B<--block-size> does not -contain a full record, because it tries to find a full record and will -fail to do so. The recommendation is therefore to use a -B<--block-size> > 2 records, so you always get at least one full -record when you read one block. - -If you use B<-N> then B<--block-size> should be big enough to contain -N+1 records. - - =head2 Convenience options --nice --basefile --transfer --return --cleanup --tmux --group --compress --cat --fifo --workdir @@ -360,6 +336,23 @@ that correctly for all corner cases is next to impossible to do by hand. +=head2 --block-size adjustment + +Every time GNU B detects a record bigger than +B<--block-size> it increases the block size by 30%. A small +B<--block-size> gives very poor performance; by exponentially +increasing the block size performance will not suffer. + +GNU B will waste CPU power if B<--block-size> does not +contain a full record, because it tries to find a full record and will +fail to do so. The recommendation is therefore to use a +B<--block-size> > 2 records, so you always get at least one full +record when you read one block. + +If you use B<-N> then B<--block-size> should be big enough to contain +N+1 records. + + =head2 Shell shock The shell shock bug in B did not affect GNU B, but the @@ -402,10 +395,14 @@ exec'ing a Perl wrapper to monitor the parent pid and kill the child if the parent pid becomes 1, then Ctrl-C works and stderr is kept on stderr. +To be able to kill all (grand)*children a new process group is +started. + =head3 --nice Bing the remote process is done by B. 
A -few old systems do not implement this and is thus unsupported. +few old systems do not implement this and B<--nice> is unsupported on +those. =head3 Setting $PARALLEL_TMP @@ -417,39 +414,39 @@ remote system. The wrapper looks like this: - $shell = $PARALLEL_SHELL || $SHELL; - $tmpdir = $TMPDIR; - $nice = $opt::nice; - # Set $PARALLEL_TMP to a non-existent file name in $TMPDIR - do { - $ENV{PARALLEL_TMP} = $tmpdir."/par". - join"", map { (0..9,"a".."z","A".."Z")[rand(62)] } (1..5); - } while(-e $ENV{PARALLEL_TMP}); - $SIG{CHLD} = sub { $done = 1; }; - $pid = fork; - unless($pid) { - # Make own process group to be able to kill HUP it later - setpgrp; - eval { setpriority(0,0,$nice) }; - exec $shell, "-c", ($bashfunc."@ARGV"); - die "exec: $!\n"; - } - do { - # Parent is not init (ppid=1), so sshd is alive - # Exponential sleep up to 1 sec - $s = $s < 1 ? 0.001 + $s * 1.03 : $s; - select(undef, undef, undef, $s); - } until ($done || getppid == 1); - # Kill HUP the process group if job not done - kill(SIGHUP, -${pid}) unless $done; - wait; - exit ($?&127 ? 128+($?&127) : 1+$?>>8) + $shell = $PARALLEL_SHELL || $SHELL; + $tmpdir = $TMPDIR; + $nice = $opt::nice; + # Set $PARALLEL_TMP to a non-existent file name in $TMPDIR + do { + $ENV{PARALLEL_TMP} = $tmpdir."/par". + join"", map { (0..9,"a".."z","A".."Z")[rand(62)] } (1..5); + } while(-e $ENV{PARALLEL_TMP}); + $SIG{CHLD} = sub { $done = 1; }; + $pid = fork; + unless($pid) { + # Make own process group to be able to kill HUP it later + setpgrp; + eval { setpriority(0,0,$nice) }; + exec $shell, "-c", ($bashfunc."@ARGV"); + die "exec: $!\n"; + } + do { + # Parent is not init (ppid=1), so sshd is alive + # Exponential sleep up to 1 sec + $s = $s < 1 ? 0.001 + $s * 1.03 : $s; + select(undef, undef, undef, $s); + } until ($done || getppid == 1); + # Kill HUP the process group if job not done + kill(SIGHUP, -${pid}) unless $done; + wait; + exit ($?&127 ? 
128+($?&127) : 1+$?>>8) =head2 Transferring of variables and functions Transferring of variables and functions given by B<--env> is done by running a Perl script remotely that calls the actual command. The Perl -script sets $ENV{variable} to the correct value before exec'ing the a +script sets B<$ENV{>IB<}> to the correct value before exec'ing the a shell that runs the function definition followed by the actual command. @@ -512,9 +509,9 @@ shell is used when GNU B executes commands. GNU B tries hard to use the right shell. If GNU B is called from B it will use B. If it is called from B it will use B. It does this by looking at the -(grand*)parent process: If the (grand*)parent process is a shell, use -this shell; otherwise look at the parent of this (grand*)parent. If -none of the (grand*)parents are shells, then $SHELL is used. +(grand)*parent process: If the (grand)*parent process is a shell, use +this shell; otherwise look at the parent of this (grand)*parent. If +none of the (grand)*parents are shells, then $SHELL is used. This will do the right thing if called from: @@ -570,7 +567,7 @@ not known to B. =back If GNU B guesses wrong in these situation, set the shell using -$PARALLEL_SHELL. +B<$PARALLEL_SHELL>. =head2 Quoting @@ -596,7 +593,7 @@ implemented very differently. With B<--pipe> GNU B reads the blocks from standard input (stdin), which is then given to the command on standard input (stdin); so every block is being processed by GNU B itself. This is -the reason why B<--pipe> maxes out at around 100 MB/sec. +the reason why B<--pipe> maxes out at around 500 MB/sec. B<--pipepart>, on the other hand, first identifies at which byte positions blocks start and how long they are. It does that by seeking @@ -766,42 +763,32 @@ B and put the result in a file, which is then used next time. =head2 Killing jobs -B<--memfree>, B<--halt> and when GNU B meets a condition -from which it cannot recover, jobs are killed. 
This is done by finding -the (grand)*children of the jobs and killing those processes. +GNU B kills jobs. It can be due to B<--memfree>, B<--halt>, +or when GNU B meets a condition from which it cannot +recover. Every job is started as its own process group. This way any +(grand)*children will get killed, too. The process group is killed with +the specification mentioned in B<--termseq>. -More specifically GNU B maintains a list of processes to be -killed, sends a signal to all processes (first round this is a TERM). -It weeds out the processes that exited from the list then waits a -while and weeds out again. It does that until all processes are dead -or 200 ms passed. Then it does another round with TERM, and finally a -round with KILL. - pids = family_pids(jobs) - for signal in TERM, TERM, KILL: - for pid in pids: - kill signal, pid - while kill 0, pids and slept < 200 ms: - sleep sleeptime - pids = kill 0, pids - slept += sleeptime - sleeptime = sleeptime * 1.1 +=head2 SQL interface -By doing so there is a tiny risk, that GNU B will kill -processes that are not started from GNU B. It, however, -requires all of these to be true: +GNU B uses the DBURL from GNU B to give database +software, username, password, host, port, database, and table in a +single string. -* Process A is sent a signal -* It dies during a I cycle -* A new process B is spawned (by an unrelated process) -* This is done during the same I cycle -* B is owned by the same user -* B reuses the pid of the A +The DBURL must point to a table name. The table will be dropped and +created. The reason for not reusing an exising table is that the user +may have added more input sources which would require more columns in +the table. -It is considered unlikely to ever happen due to: +The table columns are similar to joblog with the addition of B +.. B which are values from the input sources, and stdout and +stderr which are the output from standard output and standard error, +respectively. 
+ +The Signal column has been renamed to _Signal due to Signal being a +reserved word in MySQL. -* The longest I sleeps is 10 ms -* Re-use of a dead pid rarely happens within a few seconds =head1 Ideas for new design diff --git a/src/parallel_tutorial.html b/src/parallel_tutorial.html index 6e9bb581..f9467795 100644 --- a/src/parallel_tutorial.html +++ b/src/parallel_tutorial.html @@ -40,6 +40,7 @@
  • Positional perl expression replacement string
  • Input from columns
  • Header defined replacement strings
  • +
  • More pre-defined replacement strings
  • More than one argument
  • @@ -52,15 +53,19 @@
  • Saving output into files
  • -
  • Control the execution +
  • Controlling the execution
  • @@ -72,10 +77,15 @@
  • Avoid overloading sshd
  • Ignore hosts that are down
  • Running the same commands on all hosts
  • -
  • Transfer environment variables and functions
  • +
  • Transferring environment variables and functions
  • Showing what is actually run
  • +
  • Saving to an SQL base (advanced) + +
  • --pipe
    • Chunk size
    • @@ -93,6 +103,7 @@
    • Semaphore @@ -104,7 +115,7 @@

      GNU Parallel Tutorial

      -

      This tutorial shows off much of GNU Parallel's functionality. The tutorial is meant to learn the options in GNU Parallel. The tutorial is not to show realistic examples from the real world.

      +

      This tutorial shows off much of GNU parallel's functionality. The tutorial is meant to learn the options in GNU parallel. The tutorial is not to show realistic examples from the real world.

      Spend an hour walking through the tutorial. Your command line will love you for it.

      @@ -226,7 +237,7 @@

      Input sources

      -

      GNU Parallel reads input from input sources. These can be files, the command line, and stdin (standard input or a pipe).

      +

      GNU parallel reads input from input sources. These can be files, the command line, and stdin (standard input or a pipe).

      A single input source

      @@ -254,7 +265,7 @@

      Multiple input sources

      -

      GNU Parallel can take multiple input sources given on the command line. GNU Parallel then generates all combinations of the input sources:

      +

      GNU parallel can take multiple input sources given on the command line. GNU parallel then generates all combinations of the input sources:

        parallel echo ::: A B C ::: D E F
      @@ -276,13 +287,13 @@

      Output: Same as above.

      -

      STDIN (standard input) can be one of the input sources using '-':

      +

      STDIN (standard input) can be one of the input sources using -:

        cat abc-file | parallel -a - -a def-file echo 

      Output: Same as above.

      -

      Instead of -a files can be given after '::::':

      +

      Instead of -a files can be given after :::::

        cat abc-file | parallel echo :::: - def-file
      @@ -296,7 +307,7 @@

      Matching arguments from all input sources

      -

      With --xapply you can get one argument from each input source:

      +

      With --xapply you can get one argument from each input source:

        parallel --xapply echo ::: A B C ::: D E F
      @@ -320,7 +331,7 @@

      Changing the argument separator.

      -

      GNU Parallel can use other separators than ::: or ::::. This is typically useful if ::: or :::: is used in the command to run:

      +

      GNU parallel can use other separators than ::: or ::::. This is typically useful if ::: or :::: is used in the command to run:

        parallel --arg-sep ,, echo ,, A B C :::: def-file
      @@ -344,7 +355,7 @@

      Changing the argument delimiter

      -

      GNU Parallel will normally treat a full line as a single argument: It uses \n as argument delimiter. This can be changed with -d:

      +

      GNU parallel will normally treat a full line as a single argument: It uses \n as argument delimiter. This can be changed with -d:

        parallel -d _ echo :::: abc_-file
      @@ -354,13 +365,13 @@ B C -

      NULL can be given as \0:

      +

      NULL can be given as \0:

        parallel -d '\0' echo :::: abc0-file

      Output: Same as above.

      -

      A shorthand for -d '\0' is -0 (this will often be used to read files from find ... -print0):

      +

      A shorthand for -d '\0' is -0 (this will often be used to read files from find ... -print0):

        parallel -0 echo :::: abc0-file
      @@ -368,7 +379,7 @@

      End-of-file value for input source

      -

      GNU Parallel can stop reading when it encounters a certain value:

      +

      GNU parallel can stop reading when it encounters a certain value:

        parallel -E stop echo ::: A B stop C D
      @@ -379,7 +390,7 @@

      Skipping empty lines

      -

      Using --no-run-if-empty GNU Parallel will skip empty lines.

      +

      Using --no-run-if-empty GNU parallel will skip empty lines.

        (echo 1; echo; echo 2) | parallel --no-run-if-empty echo
      @@ -402,7 +413,7 @@ foo [/path/to/current/working/dir] -

      The command can be a script, a binary or a Bash function if the function is exported using 'export -f':

      +

      The command can be a script, a binary or a Bash function if the function is exported using export -f:

        # Only works in Bash
         my_func() {
      @@ -421,7 +432,7 @@
       
       

      The 7 predefined replacement strings

      -

      GNU Parallel has several replacement strings. If no replacement strings are used the default is to append {}:

      +

      GNU parallel has several replacement strings. If no replacement strings are used the default is to append {}:

        parallel echo ::: A/B.C
      @@ -429,7 +440,7 @@
        A/B.C
      -

      The default replacement string is {}:

      +

      The default replacement string is {}:

        parallel echo {} ::: A/B.C
      @@ -437,7 +448,7 @@
        A/B.C
      -

      The replacement string {.} removes the extension:

      +

      The replacement string {.} removes the extension:

        parallel echo {.} ::: A/B.C
      @@ -445,7 +456,7 @@
        A/B
      -

      The replacement string {/} removes the path:

      +

      The replacement string {/} removes the path:

        parallel echo {/} ::: A/B.C
      @@ -453,7 +464,7 @@
        B.C
      -

      The replacement string {//} keeps only the path:

      +

      The replacement string {//} keeps only the path:

        parallel echo {//} ::: A/B.C
      @@ -461,7 +472,7 @@
        A
      -

      The replacement string {/.} removes the path and the extension:

      +

      The replacement string {/.} removes the path and the extension:

        parallel echo {/.} ::: A/B.C
      @@ -469,7 +480,7 @@
        B
      -

      The replacement string {#} gives the job number:

      +

      The replacement string {#} gives the job number:

        parallel echo {#} ::: A B C
      @@ -479,7 +490,7 @@ 2 3
      -

      The replacement string {%} gives the job slot number (between 1 and number of jobs to run in parallel):

      +

      The replacement string {%} gives the job slot number (between 1 and number of jobs to run in parallel):

        parallel -j 2 echo {%} ::: A B C
      @@ -491,7 +502,7 @@

      Changing the replacement strings

      -

      The replacement string {} can be changed with -I:

      +

      The replacement string {} can be changed with -I:

        parallel -I ,, echo ,, ::: A/B.C
      @@ -499,7 +510,7 @@
        A/B.C
      -

      The replacement string {.} can be changed with --extensionreplace:

      +

      The replacement string {.} can be changed with --extensionreplace:

        parallel --extensionreplace ,, echo ,, ::: A/B.C
      @@ -507,7 +518,7 @@
        A/B
      -

      The replacement string {/} can be replaced with --basenamereplace:

      +

      The replacement string {/} can be replaced with --basenamereplace:

        parallel --basenamereplace ,, echo ,, ::: A/B.C
      @@ -515,7 +526,7 @@
        B.C
      -

      The replacement string {//} can be changed with --dirnamereplace:

      +

      The replacement string {//} can be changed with --dirnamereplace:

        parallel --dirnamereplace ,, echo ,, ::: A/B.C
      @@ -523,7 +534,7 @@
        A
      -

      The replacement string {/.} can be changed with --basenameextensionreplace:

      +

      The replacement string {/.} can be changed with --basenameextensionreplace:

        parallel --basenameextensionreplace ,, echo ,, ::: A/B.C
      @@ -531,7 +542,7 @@
        B
      -

      The replacement string {#} can be changed with --seqreplace:

      +

      The replacement string {#} can be changed with --seqreplace:

        parallel --seqreplace ,, echo ,, ::: A B C
      @@ -541,7 +552,7 @@ 2 3 -

      The replacement string {%} can be changed with --slotreplace:

      +

      The replacement string {%} can be changed with --slotreplace:

        parallel -j2 --slotreplace ,, echo ,, ::: A B C
      @@ -553,7 +564,7 @@

      Perl expression replacement string

      -

      When predefined replacement strings are not flexible enough a perl expression can be used instead. One example is to remove two extensions: foo.tar.gz -> foo

      +

      When predefined replacement strings are not flexible enough a perl expression can be used instead. One example is to remove two extensions: foo.tar.gz becomes foo

        parallel echo '{= s:\.[^.]+$::;s:\.[^.]+$::; =}' ::: foo.tar.gz
      @@ -561,25 +572,67 @@
        foo
      -

      If the strings {= and =} cause problems they can be replaced with --parens:

      +

      In {= =} you can access all of GNU parallel's internal functions and variables. A few are worth mentioning.

      + +

      total_jobs() returns the total number of jobs:

      + +
        parallel echo Job {#} of {= '$_=total_jobs()' =} ::: {1..5}
      + +

      Output:

      + +
        Job 1 of 5
      +  Job 2 of 5
      +  Job 3 of 5
      +  Job 4 of 5
      +  Job 5 of 5
      + +

      Q(...) shell quotes the string:

      + +
        parallel echo {} shell quoted is {= '$_=Q($_)' =} ::: '*/!#$'
      + +

      $job->skip() skips the job:

      + +
        parallel echo {= 'if($_==3) { $job->skip() }' =} ::: {1..5}
      + +

      Output:

      + +
        1
      +  2
      +  4
      +  5
      + +

      @arg contains the input source variables:

      + +
        parallel echo {= 'if($arg[1]==$arg[2]) { $job->skip() }' =} ::: {1..3} ::: {1..3}
      + +

      Output:

      + +
        1 2
      +  1 3
      +  2 1
      +  2 3
      +  3 1
      +  3 2
      + +

      If the strings {= and =} cause problems they can be replaced with --parens:

        parallel --parens ,,,, echo ',, s:\.[^.]+$::;s:\.[^.]+$::; ,,' ::: foo.tar.gz

      Output: Same as above.

      -

      To define a short hand replacement string use --rpl:

      +

      To define a shorthand replacement string use --rpl:

        parallel --rpl '.. s:\.[^.]+$::;s:\.[^.]+$::;' echo '..' ::: foo.tar.gz

      Output: Same as above.

      -

      If the short hand starts with '{' it can be used as a positional replacement string, too:

      +

      If the shorthand starts with { it can be used as a positional replacement string, too:

        parallel --rpl '{..} s:\.[^.]+$::;s:\.[^.]+$::;' echo '{..}' ::: foo.tar.gz

      Output: Same as above.

      -

      GNU parallel's 7 replacement strings are implemented as:

      +

      GNU parallel's 7 replacement strings are implemented as this:

        --rpl '{} '
         --rpl '{#} $_=$job->seq()'
      @@ -591,7 +644,7 @@
       
       

      Positional replacement strings

      -

      With multiple input sources the argument from the individual input sources can be access with {number}:

      +

      With multiple input sources the argument from the individual input sources can be accessed with {number}:

        parallel echo {1} and {2} ::: A B ::: C D
      @@ -602,7 +655,7 @@ B and C B and D
      -

      The positional replacement strings can also be modified using / // /. and .:

      +

      The positional replacement strings can also be modified using /, //, /., and .:

        parallel echo /={1/} //={1//} /.={1/.} .={1.} ::: A/B.C D/E.F
      @@ -636,7 +689,7 @@
        foo bar
      -

      If a defined short hand starts with '{' it can be used as a positional replacement string, too:

      +

      If shorthand defined using --rpl starts with { it can be used as a positional replacement string, too:

        parallel --rpl '{..} s:\.[^.]+$::;s:\.[^.]+$::;' echo '{2..} {1}' ::: bar ::: foo.tar.gz
      @@ -644,7 +697,7 @@

      Input from columns

      -

      The columns in a file can be bound to positional replacement strings using --colsep. Here the columns are separated with TAB (\t):

      +

      The columns in a file can be bound to positional replacement strings using --colsep. Here the columns are separated by TAB (\t):

        parallel --colsep '\t' echo 1={1} 2={2} :::: tsv-file.tsv
      @@ -656,7 +709,7 @@

      Header defined replacement strings

      -

      With --header GNU Parallel will use the first value of the input source as the name of the replacement string. Only the non-modified version {} is supported:

      +

      With --header GNU parallel will use the first value of the input source as the name of the replacement string. Only the non-modified version {} is supported:

        parallel --header : echo f1={f1} f2={f2} ::: f1 A B ::: f2 C D
      @@ -667,7 +720,7 @@ f1=B f2=C f1=B f2=D -

      It is useful with --colsep for processing files with TAB separated values:

      +

      It is useful with --colsep for processing files with TAB separated values:

        parallel --header : --colsep '\t' echo f1={f1} f2={f2} :::: tsv-file.tsv
      @@ -676,9 +729,38 @@
        f1=A f2=B
         f1=C f2=D
      +

      More pre-defined replacement strings

      + +

      --plus adds the replacement strings {+/} {+.} {+..} {+...} {..} {...} {/..} {/...} {##}. The idea being that {+foo} matches the opposite of {foo} and {} = {+/}/{/} = {.}.{+.} = {+/}/{/.}.{+.} = {..}.{+..} = {+/}/{/..}.{+..} = {...}.{+...} = {+/}/{/...}.{+...}.

      + +
        parallel --plus echo {} ::: dir/sub/file.ext1.ext2.ext3
      +  parallel --plus echo {+/}/{/} ::: dir/sub/file.ext1.ext2.ext3
      +  parallel --plus echo {.}.{+.} ::: dir/sub/file.ext1.ext2.ext3
      +  parallel --plus echo {+/}/{/.}.{+.} ::: dir/sub/file.ext1.ext2.ext3
      +  parallel --plus echo {..}.{+..} ::: dir/sub/file.ext1.ext2.ext3
      +  parallel --plus echo {+/}/{/..}.{+..} ::: dir/sub/file.ext1.ext2.ext3
      +  parallel --plus echo {...}.{+...} ::: dir/sub/file.ext1.ext2.ext3
      +  parallel --plus echo {+/}/{/...}.{+...} ::: dir/sub/file.ext1.ext2.ext3
      + +

      Output:

      + +
        dir/sub/file.ext1.ext2.ext3
      + +

      {##} is simply the number of jobs:

      + +
        parallel --plus echo Job {#} of {##} ::: {1..5}
      + +

      Output:

      + +
        Job 1 of 5
      +  Job 2 of 5
      +  Job 3 of 5
      +  Job 4 of 5
      +  Job 5 of 5
      +

      More than one argument

      -

      With --xargs will GNU Parallel fit as many arguments as possible on a single line:

      +

      With --xargs GNU parallel will fit as many arguments as possible on a single line:

        cat num30000 | parallel --xargs echo | wc -l
      @@ -688,7 +770,7 @@

      The 30000 arguments fitted on 2 lines.

      -

      The maximal length of a single line can be set with -s. With a maximal line length of 10000 chars 17 commands will be run:

      +

      The maximal length of a single line can be set with -s. With a maximal line length of 10000 chars 17 commands will be run:

        cat num30000 | parallel --xargs -s 10000 echo | wc -l
      @@ -696,11 +778,11 @@
        17
      -

      For better parallelism GNU Parallel can distribute the arguments between all the parallel jobs when end of file is met.

      +

      For better parallelism GNU parallel can distribute the arguments between all the parallel jobs when end of file is met.

      -

      Below GNU Parallel reads the last argument when generating the second job. When GNU Parallel reads the last argument, it spreads all the arguments for the second job over 4 jobs instead, as 4 parallel jobs are requested.

      +

      Below GNU parallel reads the last argument when generating the second job. When GNU parallel reads the last argument, it spreads all the arguments for the second job over 4 jobs instead, as 4 parallel jobs are requested.

      -

      The first job will be the same as the --xargs example above, but the second job will be split into 4 evenly sized jobs, resulting in a total of 5 jobs:

      +

      The first job will be the same as the --xargs example above, but the second job will be split into 4 evenly sized jobs, resulting in a total of 5 jobs:

        cat num30000 | parallel --jobs 4 -m echo | wc -l
      @@ -719,7 +801,7 @@ 7 8 9 10 -

      A replacement string can be part of a word. -m will not repeat the context:

      +

      A replacement string can be part of a word. -m will not repeat the context:

        parallel --jobs 4 -m echo pre-{}-post ::: A B C D E F G
      @@ -730,7 +812,7 @@ pre-E F-post pre-G-post -

      To repeat the context use -X which otherwise works like -m:

      +

      To repeat the context use -X which otherwise works like -m:

        parallel --jobs 4 -X echo pre-{}-post ::: A B C D E F G
      @@ -741,7 +823,7 @@ pre-E-post pre-F-post pre-G-post -

      To limit the number of arguments use -N:

      +

      To limit the number of arguments use -N:

        parallel -N3 echo ::: A B C D E F G H
      @@ -751,7 +833,7 @@ D E F G H -

      -N also sets the positional replacement strings:

      +

      -N also sets the positional replacement strings:

        parallel -N3 echo 1={1} 2={2} 3={3} ::: A B C D E F G H
      @@ -761,7 +843,7 @@ 1=D 2=E 3=F 1=G 2=H 3= -

      -N0 reads 1 argument but inserts none:

      +

      -N0 reads 1 argument but inserts none:

        parallel -N0 echo foo ::: 1 2 3
      @@ -775,7 +857,7 @@

      Command lines that contain special characters may need to be protected from the shell.

      -

      The perl program 'print "@ARGV\n"' basically works like echo.

      +

      The perl program print "@ARGV\n" basically works like echo.

        perl -e 'print "@ARGV\n"' A
      @@ -791,7 +873,7 @@
        [Nothing]
      -

      To quote the command use -q:

      +

      To quote the command use -q:

        parallel -q perl -e 'print "@ARGV\n"' ::: This works
      @@ -800,7 +882,7 @@
        This
         works
      -

      Or you can quote the critical part using \':

      +

      Or you can quote the critical part using \':

        parallel perl -e \''print "@ARGV\n"'\' ::: This works, too
      @@ -810,7 +892,7 @@ works, too -

      GNU Parallel can also \-quote full lines. Simply run:

      +

      GNU parallel can also \-quote full lines. Simply run this:

        parallel --shellquote
         parallel: Warning: Input is read from the terminal. Only experts do this on purpose. Press CTRL-D to exit.
      @@ -833,7 +915,7 @@
       
       

      Trimming space

      -

      Space can be trimmed on the arguments using --trim:

      +

      Space can be trimmed on the arguments using --trim:

        parallel --trim r echo pre-{}-post ::: ' A '
      @@ -869,7 +951,7 @@ B foo-B C foo-C
      -

      To prefix it with another string use --tagstring:

      +

      To prefix it with another string use --tagstring:

        parallel --tagstring {}-bar echo foo-{} ::: A B C
      @@ -879,7 +961,7 @@ B-bar foo-B C-bar foo-C -

      To see what commands will be run without running them:

      +

      To see what commands will be run without running them use --dryrun:

        parallel --dryrun echo {} ::: A B C
      @@ -889,7 +971,7 @@ echo B echo C -

      To print the command before running them use --verbose:

      +

      To print the command before running them use --verbose:

        parallel --verbose echo {} ::: A B C
      @@ -902,7 +984,7 @@ B C -

      GNU Parallel will postpone the output until the command completes:

      +

      GNU parallel will postpone the output until the command completes:

        parallel -j2 'printf "%s-start\n%s" {} {};sleep {};printf "%s\n" -middle;echo {}-end' ::: 4 2 1
      @@ -918,7 +1000,7 @@ 4-middle 4-end -

      To get the output immediately use --ungroup:

      +

      To get the output immediately use --ungroup:

        parallel -j2 --ungroup 'printf "%s-start\n%s" {} {};sleep {};printf "%s\n" -middle;echo {}-end' ::: 4 2 1
      @@ -934,9 +1016,9 @@ -middle 4-end -

      --ungroup is fast, but can cause half a line from one job to be mixed with half a line of another job. That has happend in the second line, where the line '4-middle' is mixed with '2-start'.

      +

      --ungroup is fast, but can cause half a line from one job to be mixed with half a line of another job. That has happened in the second line, where the line '4-middle' is mixed with '2-start'.

      -

      To avoid this use --linebuffer:

      +

      To avoid this use --linebuffer:

        parallel -j2 --linebuffer 'printf "%s-start\n%s" {} {};sleep {};printf "%s\n" -middle;echo {}-end' ::: 4 2 1
      @@ -952,7 +1034,7 @@ 4-middle 4-end -

      To force the output in the same order as the arguments use --keep-order/-k:

      +

      To force the output in the same order as the arguments use --keep-order/-k:

        parallel -j2 -k 'printf "%s-start\n%s" {} {};sleep {};printf "%s\n" -middle;echo {}-end' ::: 4 2 1
      @@ -970,21 +1052,21 @@

      Saving output into files

      -

      GNU Parallel can save the output of each job into files:

      +

      GNU parallel can save the output of each job into files:

        parallel --files echo ::: A B C
      -

      Output will be similar to:

      +

      Output will be similar to this:

        /tmp/pAh6uWuQCg.par
         /tmp/opjhZCzAX4.par
         /tmp/W0AT_Rph2o.par
      -

      By default GNU Parallel will cache the output in files in /tmp. This can be changed by setting $TMPDIR or --tmpdir:

      +

      By default GNU parallel will cache the output in files in /tmp. This can be changed by setting $TMPDIR or --tmpdir:

        parallel --tmpdir /var/tmp --files echo ::: A B C
      -

      Output will be similar to:

      +

      Output will be similar to this:

        /var/tmp/N_vk7phQRc.par
         /var/tmp/7zA4Ccf3wZ.par
      @@ -996,7 +1078,7 @@
       
       

      Output: Same as above.

      -

      The output files can be saved in a structured way using --results:

      +

      The output files can be saved in a structured way using --results:

        parallel --results outdir echo ::: A B C
      @@ -1006,43 +1088,50 @@ B C
      -

      but also these files were generated containing the standard output (stdout) and standard error (stderr):

      +

      These files were also generated containing the standard output (stdout), standard error (stderr), and the sequence number (seq):

      -
        outdir/1/A/stderr
      +
        outdir/1/A/seq
      +  outdir/1/A/stderr
         outdir/1/A/stdout
      +  outdir/1/B/seq
         outdir/1/B/stderr
         outdir/1/B/stdout
      +  outdir/1/C/seq
         outdir/1/C/stderr
         outdir/1/C/stdout
      -

      This is useful if you are running multiple variables:

      +

      --header : will take the first value as name and use that in the directory structure. This is useful if you are using multiple input sources:

        parallel --header : --results outdir echo ::: f1 A B ::: f2 C D

      Generated files:

      -
        outdir/f1/A/f2/C/stderr
      +
        outdir/f1/A/f2/C/seq
      +  outdir/f1/A/f2/C/stderr
         outdir/f1/A/f2/C/stdout
      +  outdir/f1/A/f2/D/seq
         outdir/f1/A/f2/D/stderr
         outdir/f1/A/f2/D/stdout
      +  outdir/f1/B/f2/C/seq
         outdir/f1/B/f2/C/stderr
         outdir/f1/B/f2/C/stdout
      +  outdir/f1/B/f2/D/seq
         outdir/f1/B/f2/D/stderr
         outdir/f1/B/f2/D/stdout

      The directories are named after the variables and their values.

      -

      Control the execution

      +

      Controlling the execution

      Number of simultaneous jobs

      -

      The number of concurrent jobs is given with --jobs/-j:

      +

      The number of concurrent jobs is given with --jobs/-j:

        /usr/bin/time parallel -N0 -j64 sleep 1 :::: num128
      -

      With 64 jobs in parallel the 128 sleeps will take 2-8 seconds to run - depending on how fast your machine is.

      +

      With 64 jobs in parallel the 128 sleeps will take 2-8 seconds to run - depending on how fast your machine is.

      -

      By default --jobs is the same as the number of CPU cores. So this:

      +

      By default --jobs is the same as the number of CPU cores. So this:

        /usr/bin/time parallel -N0 sleep 1 :::: num128
      @@ -1050,13 +1139,13 @@
        /usr/bin/time parallel -N0 --jobs 200% sleep 1 :::: num128
      -

      --jobs 0 will run as many jobs in parallel as possible:

      +

      --jobs 0 will run as many jobs in parallel as possible:

        /usr/bin/time parallel -N0 --jobs 0 sleep 1 :::: num128

      which should take 1-7 seconds depending on how fast your machine is.

      -

      --jobs can read from a file which is re-read when a job finishes:

      +

      --jobs can read from a file which is re-read when a job finishes:

        echo 50% > my_jobs
         /usr/bin/time parallel -N0 --jobs my_jobs sleep 1 :::: num128 &
      @@ -1064,15 +1153,15 @@
         echo 0 > my_jobs
         wait
      -

      The first second only 50% of the CPU cores will run a job. The '0' is put into my_jobs and then the rest of the jobs will be started in parallel.

      +

      The first second only 50% of the CPU cores will run a job. Then 0 is put into my_jobs and then the rest of the jobs will be started in parallel.

      -

      Instead of basing the percentage on the number of CPU cores GNU Parallel can base it on the number of CPUs:

      +

      Instead of basing the percentage on the number of CPU cores GNU parallel can base it on the number of CPUs:

        parallel --use-cpus-instead-of-cores -N0 sleep 1 :::: num8

      Shuffle job order

      -

      If you have many jobs (e.g. by multiple combinations of input sources), it can be handy to shuffle the jobs, so you get different values run.

      +

      If you have many jobs (e.g. by multiple combinations of input sources), it can be handy to shuffle the jobs, so you get different values run. Use --shuf for that:

        parallel --shuf echo ::: 1 2 3 ::: a b c ::: A B C
      @@ -1082,7 +1171,7 @@

      Interactivity

      -

      GNU Parallel can ask the user if a command should be run using --interactive:

      +

      GNU parallel can ask the user if a command should be run using --interactive:

        parallel --interactive echo ::: 1 2 3
      @@ -1094,7 +1183,7 @@ echo 3 ?...y 3
      -

      GNU Parallel can be used to put arguments on the command line for an interactive command such as emacs to edit one file at a time:

      +

      GNU parallel can be used to put arguments on the command line for an interactive command such as emacs to edit one file at a time:

        parallel --tty emacs ::: 1 2 3
      @@ -1104,7 +1193,7 @@

      A terminal for every job

      -

      Using tmux GNU Parallel can start a terminal for every job run:

      +

      Using --tmux GNU parallel can start a terminal for every job run:

        seq 10 20 | parallel --tmux 'echo start {}; sleep {}; echo done {}'
      @@ -1112,11 +1201,11 @@
        tmux -S /tmp/tmsrPrO0 attach
      -

      Using normal tmux keystrokes (CTRL-b n or CTRL-b p) you can cycle between windows of the running jobs. When a job is finished it will pause for 10 seconds before closing the window.

      +

      Using normal tmux keystrokes (CTRL-b n or CTRL-b p) you can cycle between windows of the running jobs. When a job is finished it will pause for 10 seconds before closing the window.

      Timing

      -

      Some jobs do heavy I/O when they start. To avoid a thundering herd GNU Parallel can delay starting new jobs. --delay X will make sure there is at least X seconds between each start:

      +

      Some jobs do heavy I/O when they start. To avoid a thundering herd GNU parallel can delay starting new jobs. --delay X will make sure there is at least X seconds between each start:

        parallel --delay 2.5 echo Starting {}\;date ::: 1 2 3
      @@ -1129,7 +1218,7 @@ Starting 3 Thu Aug 15 16:24:38 CEST 2013
      -

      If jobs taking more than a certain amount of time are known to fail, they can be stopped with --timeout. The accuracy of --timeout is 2 seconds:

      +

      If jobs taking more than a certain amount of time are known to fail, they can be stopped with --timeout. The accuracy of --timeout is 2 seconds:

        parallel --timeout 4.1 sleep {}\; echo {} ::: 2 4 6 8
      @@ -1138,7 +1227,7 @@
        2
         4
      -

      GNU Parallel can compute the median runtime for jobs and kill those that take more than 200% of the median runtime:

      +

      GNU parallel can compute the median runtime for jobs and kill those that take more than 200% of the median runtime:

        parallel --timeout 200% sleep {}\; echo {} ::: 2.1 2.2 3 7 2.3
      @@ -1149,7 +1238,9 @@ 3 2.3 -

      Based on the runtime of completed jobs GNU Parallel can estimate the total runtime:

      +

      Progress information

      + +

      Based on the runtime of completed jobs GNU parallel can estimate the total runtime:

        parallel --eta sleep ::: 1 3 2 2 1 3 3 2 1
      @@ -1161,9 +1252,7 @@ Computer:jobs running/jobs completed/%of started jobs/Average seconds to complete ETA: 2s 0left 1.11avg local:0/9/100%/1.1s -

      Progress

      - -

      GNU Parallel can give progress information with --progress:

      +

      GNU parallel can give progress information with --progress:

        parallel --progress sleep ::: 1 3 2 2 1 3 3 2 1
      @@ -1175,15 +1264,15 @@ Computer:jobs running/jobs completed/%of started jobs/Average seconds to complete local:0/9/100%/1.1s -

      A progress bar can be shown with --bar:

      +

      A progress bar can be shown with --bar:

        parallel --bar sleep ::: 1 3 2 2 1 3 3 2 1
      -

      And a graphic bar can be shown with --bar and zenity:

      +

      And a graphic bar can be shown with --bar and zenity:

        seq 1000 | parallel -j10 --bar '(echo -n {};sleep 0.1)' 2> >(zenity --progress --auto-kill)
      -

      A logfile of the jobs completed so far can be generated with --joblog:

      +

      A logfile of the jobs completed so far can be generated with --joblog:

        parallel --joblog /tmp/log exit  ::: 1 2 3 0 
         cat /tmp/log
      @@ -1196,9 +1285,9 @@ 3 : 1376577364.990 0.013 0 0 3 0 exit 3 4 : 1376577365.003 0.003 0 0 0 0 exit 0 -

      The log contains the job sequence, which host the job was run on, the start time and run time, how much data was transferred if the job was run on a remote host, the exit value, the signal that killed the job, and finally the command being run.

      +

      The log contains the job sequence, which host the job was run on, the start time and run time, how much data was transferred, the exit value, the signal that killed the job, and finally the command being run.

      -

      With a joblog GNU Parallel can be stopped and later pickup where it left off. It it important that the input of the completed jobs is unchanged.

      +

      With a joblog GNU parallel can be stopped and later pick up where it left off. It is important that the input of the completed jobs is unchanged.

        parallel --joblog /tmp/log exit  ::: 1 2 3 0 
         cat /tmp/log
      @@ -1221,9 +1310,9 @@
         5       :       1376580070.028  0.009   0       0       0       0       exit 0
         6       :       1376580070.038  0.007   0       0       0       0       exit 0
      -

      Note how the start time of the last 2 jobs is clearly from the second run.

      +

      Note how the start time of the last 2 jobs is clearly different from the second run.

      -

      With --resume-failed GNU Parallel will re-run the jobs that failed:

      +

      With --resume-failed GNU parallel will re-run the jobs that failed:

        parallel --resume-failed --joblog /tmp/log exit  ::: 1 2 3 0 0 0
         cat /tmp/log
      @@ -1241,11 +1330,32 @@ 2 : 1376580154.444 0.022 0 0 2 0 exit 2 3 : 1376580154.466 0.005 0 0 3 0 exit 3 -

      Note how seq 1 2 3 have been repeated because they had exit value != 0.

      +

      Note how seq 1 2 3 have been repeated because they had exit value different from 0.

      + +

      --retry-failed does almost the same as --resume-failed. Where --resume-failed reads the commands from the command line (and ignores the commands in the joblog), --retry-failed ignores the command line and reruns the commands mentioned in the joblog.

      + +
        parallel --retry-failed --joblog /tmp/log
      +  cat /tmp/log
      + +

      Output:

      + +
        Seq     Host    Starttime       Runtime Send    Receive Exitval Signal  Command
      +  1       :       1376580069.544  0.008   0       0       1       0       exit 1
      +  2       :       1376580069.552  0.009   0       0       2       0       exit 2
      +  3       :       1376580069.560  0.012   0       0       3       0       exit 3
      +  4       :       1376580069.571  0.005   0       0       0       0       exit 0
      +  5       :       1376580070.028  0.009   0       0       0       0       exit 0
      +  6       :       1376580070.038  0.007   0       0       0       0       exit 0
      +  1       :       1376580154.433  0.010   0       0       1       0       exit 1
      +  2       :       1376580154.444  0.022   0       0       2       0       exit 2
      +  3       :       1376580154.466  0.005   0       0       3       0       exit 3
      +  1       :       1376580164.633  0.010   0       0       1       0       exit 1
      +  2       :       1376580164.644  0.022   0       0       2       0       exit 2
      +  3       :       1376580164.666  0.005   0       0       3       0       exit 3

      Termination

      -

      For certain jobs there is no need to continue if one of the jobs fails and has an exit code != 0. GNU Parallel will stop spawning new jobs with --halt soon,fail=1:

      +

      For certain jobs there is no need to continue if one of the jobs fails and has an exit code different from 0. GNU parallel will stop spawning new jobs with --halt soon,fail=1:

        parallel -j2 --halt soon,fail=1 echo {}\; exit {} ::: 0 0 1 2 3
      @@ -1260,7 +1370,7 @@ parallel: Starting no more jobs. Waiting for 1 jobs to finish. This job failed: echo 2; exit 2 -

      With --halt now,fail=1 the running jobs will be killed immediately:

      +

      With --halt now,fail=1 the running jobs will be killed immediately:

        parallel -j2 --halt now,fail=1 echo {}\; exit {} ::: 0 0 1 2 3
      @@ -1272,7 +1382,7 @@ parallel: This job failed: echo 1; exit 1 -

      If --halt is given a percentage this percentage of the jobs must fail before GNU Parallel stops spawning more jobs:

      +

      If --halt is given a percentage this percentage of the jobs must fail before GNU parallel stops spawning more jobs:

        parallel -j2 --halt soon,fail=20% echo {}\; exit {} ::: 0 1 2 3 4 5 6 7 8 9
      @@ -1290,9 +1400,9 @@ parallel: This job failed: echo 3; exit 3 -

      If you are looking for success instead of failures, you can use success:

      +

      If you are looking for success instead of failures, you can use success. This will finish as soon as the first job succeeds:

      -
        parallel -j2 --halt soon,success=1 echo {}\; exit {} ::: 1 2 3 0 4 5 6
      +
        parallel -j2 --halt now,success=1 echo {}\; exit {} ::: 1 2 3 0 4 5 6

      Output:

      @@ -1301,11 +1411,9 @@ 3 0 parallel: This job succeeded: - echo 0; exit 0 - parallel: Starting no more jobs. Waiting for 1 jobs to finish. - 4 + echo 0; exit 0 -

      GNU Parallel can retry the command with --retries. This is useful if a command fails for unknown reasons now and then.

      +

      GNU parallel can retry the command with --retries. This is useful if a command fails for unknown reasons now and then.

        parallel -k --retries 3 'echo tried {} >>/tmp/runs; echo completed {}; exit {}' ::: 1 2 0
         cat /tmp/runs
      @@ -1326,9 +1434,42 @@

      Note how job 1 and 2 were tried 3 times, but 0 was not retried because it had exit code 0.

      +

      Termination signals (advanced)

      + +

      Using --termseq you can control which signals are sent when killing children. Normally children will be killed by sending them SIGTERM, waiting 200 ms, then another SIGTERM, waiting 100 ms, then another SIGTERM, waiting 50 ms, then a SIGKILL, finally waiting 25 ms before giving up. It looks like this:

      + +
        show_signals() {
      +    perl -e 'for(keys %SIG) { $SIG{$_} = eval "sub { print \"Got $_\\n\"; }";} while(1){sleep 1}' 
      +  }
      +  export -f show_signals
      +  echo | parallel --termseq TERM,200,TERM,100,TERM,50,KILL,25 -u --timeout 1 show_signals
      + +

      Output:

      + +
        Got TERM
      +  Got TERM
      +  Got TERM
      + +

      Or just:

      + +
        echo | parallel -u --timeout 1 show_signals
      + +

      Output: Same as above.

      + +

      You can change this to SIGINT, SIGTERM, SIGKILL:

      + +
        echo | parallel --termseq INT,200,TERM,100,KILL,25 -u --timeout 1 show_signals
      + +

      Output:

      + +
        Got INT
      +  Got TERM
      + +

      The SIGKILL does not show because it cannot be caught, and thus the child dies.

      +

      Limiting the resources

      -

      To avoid overloading systems GNU Parallel can look at the system load before starting another job:

      +

      To avoid overloading systems GNU parallel can look at the system load before starting another job:

        parallel --load 100% echo load is less than {} job per cpu ::: 1 
      @@ -1337,7 +1478,7 @@
        [when then load is less than the number of cpu cores]
         load is less than 1 job per cpu
      -

      GNU Parallel can also check if the system is swapping.

      +

      GNU parallel can also check if the system is swapping.

        parallel --noswap echo the system is not swapping ::: now
      @@ -1346,7 +1487,11 @@
        [when then system is not swapping]
         the system is not swapping now
      -

      GNU Parallel can run the jobs with a nice value. This will work both locally and remotely.

      +

      Some jobs need a lot of memory, and should only be started when there is enough memory free. Using --memfree GNU parallel can check if there is enough memory free. Additionally, GNU parallel will kill off the youngest job if the memory free falls below 50% of the size. The killed job will be put back on the queue and retried later.

      + +
        parallel --memfree 1G echo will run if more than 1 GB is ::: free
      + +

      GNU parallel can run the jobs with a nice value. This will work both locally and remotely.

        parallel --nice 17 echo this is being run with nice -n ::: 17
      @@ -1356,11 +1501,11 @@

      Remote execution

      -

      GNU Parallel can run jobs on remote servers. It uses ssh to communicate with the remote machines.

      +

      GNU parallel can run jobs on remote servers. It uses ssh to communicate with the remote machines.

      Sshlogin

      -

      The most basic sshlogin is -S host:

      +

      The most basic sshlogin is -S host:

        parallel -S $SERVER1 echo running on ::: $SERVER1
      @@ -1368,7 +1513,7 @@
        running on [$SERVER1]
      -

      To use a different username prepend the server with username@

      +

      To use a different username prepend the server with username@:

        parallel -S username@$SERVER1 echo running on ::: username@$SERVER1
      @@ -1376,7 +1521,7 @@
        running on [username@$SERVER1]
      -

      The special sshlogin ':' is the local machine:

      +

      The special sshlogin : is the local machine:

        parallel -S : echo running on ::: the_local_machine
      @@ -1384,7 +1529,7 @@
        running on the_local_machine
      -

      If ssh is not in $PATH it can be prepended to $SERVER1:

      +

      If ssh is not in $PATH it can be prepended to $SERVER1:

        parallel -S '/usr/bin/ssh '$SERVER1 echo custom ::: ssh
      @@ -1392,7 +1537,16 @@
        custom ssh
      -

      Several servers can be given using multiple -S:

      +

      The ssh command can also be given using --ssh:

      + +
        parallel --ssh /usr/bin/ssh -S $SERVER1 echo custom ::: ssh
      + +

      or by setting $PARALLEL_SSH:

      + +
        export PARALLEL_SSH=/usr/bin/ssh
      +  parallel -S $SERVER1 echo custom ::: ssh
      + +

      Several servers can be given using multiple -S:

        parallel -S $SERVER1 -S $SERVER2 echo ::: running on more hosts
      @@ -1403,7 +1557,7 @@ more hosts -

      Or they can be separated by ,:

      +

      Or they can be separated by ,:

        parallel -S $SERVER1,$SERVER2 echo ::: running on more hosts
      @@ -1415,7 +1569,7 @@ SERVERS="`echo $SERVER1; echo $SERVER2`" parallel -S "$SERVERS" echo ::: running on more hosts -

      The can also be read from a file (replace user@ with the user on $SERVER2):

      +

      They can also be read from a file (replace user@ with the user on $SERVER2):

        echo $SERVER1 > nodefile
         # Force 4 cores, special ssh-command, username
      @@ -1424,9 +1578,11 @@
       
       

      Output: Same as above.

      -

      The special --sshloginfile '..' reads from ~/.parallel/sshloginfile.

      +

      Every time a job finishes, the --sshloginfile will be re-read, so it is possible to both add and remove hosts while running.

      -

      To force GNU Parallel to treat a server having a given number of CPU cores prepend #/ to the sshlogin:

      +

      The special --sshloginfile .. reads from ~/.parallel/sshloginfile.

      + +

      To force GNU parallel to treat a server having a given number of CPU cores prepend the number of cores followed by / to the sshlogin:

        parallel -S 4/$SERVER1 echo force {} cpus on server ::: 4
      @@ -1434,18 +1590,20 @@
        force 4 cpus on server
      -

      Servers can be put into groups by prepending '@groupname' to the server and the group can then be selected by appending '@groupname' to the argument if using '--hostgroup'.

      +

      Servers can be put into groups by prepending @groupname to the server and the group can then be selected by appending @groupname to the argument if using --hostgroup:

      -
        parallel --hostgroup -S @grp1/$SERVER1 -S @grp2/$SERVER2 echo {} ::: run_on_grp1@grp1 run_on_grp2@grp2
      +
        parallel --hostgroup -S @grp1/$SERVER1 -S @grp2/$SERVER2 echo {} ::: \
      +    run_on_grp1@grp1 run_on_grp2@grp2

      Output:

        run_on_grp1
         run_on_grp2
      -

      A host can be in multiple groups by separating groups with '+', and you can force GNU parallel to limit the groups on which the command can be run with '-S @groupname':

      +

      A host can be in multiple groups by separating the groups with +, and you can force GNU parallel to limit the groups on which the command can be run with -S @groupname:

      -
        parallel -S @grp1 -S @grp1+grp2/$SERVER1 -S @grp2/SERVER2 echo {} ::: run_on_grp1 also_grp1
      +
        parallel -S @grp1 -S @grp1+grp2/$SERVER1 -S @grp2/SERVER2 echo {} ::: \
      +    run_on_grp1 also_grp1

      Output:

      @@ -1454,32 +1612,32 @@

      Transferring files

      -

      GNU Parallel can transfer the files to be processed to the remote host. It does that using rsync.

      +

      GNU parallel can transfer the files to be processed to the remote host. It does that using rsync.

        echo This is input_file > input_file
      -  parallel -S $SERVER1 --transfer cat ::: input_file 
      + parallel -S $SERVER1 --transferfile {} cat ::: input_file

      Output:

        This is input_file
      -

      If the files is processed into another file, the resulting file can be transferred back:

      +

      If the files are processed into another file, the resulting file can be transferred back:

        echo This is input_file > input_file
      -  parallel -S $SERVER1 --transfer --return {}.out cat {} ">"{}.out ::: input_file 
      +  parallel -S $SERVER1 --transferfile {} --return {}.out cat {} ">"{}.out ::: input_file 
         cat input_file.out

      Output: Same as above.

      -

      To remove the input and output file on the remote server use --cleanup:

      +

      To remove the input and output file on the remote server use --cleanup:

        echo This is input_file > input_file
      -  parallel -S $SERVER1 --transfer --return {}.out --cleanup cat {} ">"{}.out ::: input_file 
      +  parallel -S $SERVER1 --transferfile {} --return {}.out --cleanup cat {} ">"{}.out ::: input_file 
         cat input_file.out

      Output: Same as above.

      -

      There is a short hand for --transfer --return --cleanup called --trc:

      +

      There is a shorthand for --transferfile {} --return --cleanup called --trc:

        echo This is input_file > input_file
         parallel -S $SERVER1 --trc {}.out cat {} ">"{}.out ::: input_file 
      @@ -1487,7 +1645,7 @@
       
       

      Output: Same as above.

      -

      Some jobs need a common database for all jobs. GNU Parallel can transfer that using --basefile which will transfer the file before the first job:

      +

      Some jobs need a common database for all jobs. GNU parallel can transfer that using --basefile which will transfer the file before the first job:

        echo common data > common_file
         parallel --basefile common_file -S $SERVER1 cat common_file\; echo {} ::: foo
      @@ -1497,17 +1655,17 @@
        common data
         foo
      -

      To remove it from the remote host after the last job use --cleanup.

      +

      To remove it from the remote host after the last job use --cleanup.

      Working dir

      -

      The default working dir on the remote machines is the login dir. This can be changed with --workdir mydir.

      +

      The default working dir on the remote machines is the login dir. This can be changed with --workdir mydir.

      -

      Files transferred using --transfer and --return will be relative to mydir on remote computers, and the command will be executed in the dir mydir.

      +

      Files transferred using --transferfile and --return will be relative to mydir on remote computers, and the command will be executed in the dir mydir.

      -

      The special mydir value ... will create working dirs under ~/.parallel/tmp/ on the remote computers. If --cleanup is given these dirs will be removed.

      +

      The special mydir value ... will create working dirs under ~/.parallel/tmp on the remote computers. If --cleanup is given these dirs will be removed.

      -

      The special mydir value . uses the current working dir. If the current working dir is beneath your home dir, the value . is treated as the relative path to your home dir. This means that if your home dir is different on remote computers (e.g. if your login is different) the relative path will still be relative to your home dir.

      +

      The special mydir value . uses the current working dir. If the current working dir is beneath your home dir, the value . is treated as the relative path to your home dir. This means that if your home dir is different on remote computers (e.g. if your login is different) the relative path will still be relative to your home dir.

        parallel -S $SERVER1 pwd ::: ""
         parallel --workdir . -S $SERVER1 pwd ::: ""
      @@ -1521,7 +1679,7 @@
       
       

      Avoid overloading sshd

      -

      If many jobs are started on the same server, sshd can be overloaded. GNU Parallel can insert a delay between each job run on the same server:

      +

      If many jobs are started on the same server, sshd can be overloaded. GNU parallel can insert a delay between each job run on the same server:

        parallel -S $SERVER1 --sshdelay 0.2 echo ::: 1 2 3
      @@ -1531,7 +1689,7 @@ 2 3
      -

      Sshd will be less overloaded if using --controlmaster, which will multiplex ssh connections:

      +

      sshd will be less overloaded if using --controlmaster, which will multiplex ssh connections:

        parallel --controlmaster -S $SERVER1 echo ::: 1 2 3
      @@ -1539,7 +1697,7 @@

      Ignore hosts that are down

      -

      In clusters with many hosts a few of the are often down. GNU Parallel can ignore those hosts. In this case the host 173.194.32.46 is down:

      +

      In clusters with many hosts a few of them are often down. GNU parallel can ignore those hosts. In this case the host 173.194.32.46 is down:

        parallel --filter-hosts -S 173.194.32.46,$SERVER1 echo ::: bar 
      @@ -1549,7 +1707,7 @@

      Running the same commands on all hosts

      -

      GNU Parallel can run the same command on all the hosts:

      +

      GNU parallel can run the same command on all the hosts:

        parallel --onall -S $SERVER1,$SERVER2 echo ::: foo bar
      @@ -1560,7 +1718,7 @@ foo bar
      -

      Often you will just want to run a single command on all hosts with out arguments. --nonall is a no argument --onall:

      +

      Often you will just want to run a single command on all hosts without arguments. --nonall is a no argument --onall:

        parallel --nonall -S $SERVER1,$SERVER2 echo foo bar
      @@ -1569,7 +1727,7 @@
        foo bar
         foo bar
      -

      When --tag is used with --nonall and --onall the --tagstring is the host:

      +

      When --tag is used with --nonall and --onall the --tagstring is the host:

        parallel --nonall --tag -S $SERVER1,$SERVER2 echo foo bar
      @@ -1578,11 +1736,11 @@
        $SERVER1 foo bar
         $SERVER2 foo bar
      -

      --jobs sets the number of servers to log in to in parallel.

      +

      --jobs sets the number of servers to log in to in parallel.

      -

      Transfer environment variables and functions

      +

      Transferring environment variables and functions

      -

      Using --env GNU Parallel can transfer an environment variable to the remote system.

      +

      Using --env GNU parallel can transfer an environment variable to the remote system.

        MYVAR='foo bar'
         export MYVAR
      @@ -1592,7 +1750,7 @@
       
       
        foo bar baz
      -

      This works for functions too if your shell is Bash:

      +

      This works for functions, too, if your shell is Bash:

        # This only works in Bash
         my_func() {
      @@ -1605,7 +1763,7 @@
       
       
        in my_func baz
      -

      GNU Parallel can copy all defined variables and functions to the remote system. It just needs to record which ones to ignore in ~/.parallel/ignored_vars. Do that by running this once:

      +

      GNU parallel can copy all defined variables and functions to the remote system. It just needs to record which ones to ignore in ~/.parallel/ignored_vars. Do that by running this once:

        parallel --record-env
         cat ~/.parallel/ignored_vars
      @@ -1614,7 +1772,7 @@
        [list of variables to ignore - including $PATH and $HOME]
      -

      Now all new variables and functions defined will be copied when using --env _:

      +

      Now all new variables and functions defined will be copied when using --env _:

        # The function is only copied if using Bash
         my_func2() {
      @@ -1633,21 +1791,25 @@
       
       

      Showing what is actually run

      -

      --verbose will show the command that would be run on the local machine. When a job is run on a remote machine this is wrapped with ssh and possibly transferring files and environment variables, setting the workdir, and setting --nice value. -vv shows all of this.

      +

      --verbose will show the command that would be run on the local machine. When a job is run on a remote machine, this is wrapped with ssh and possibly transferring files and environment variables, setting the workdir, and setting --nice value. -vv shows all of this.

        parallel -vv -S $SERVER1 echo ::: bar

      Output:

      -
        ssh lo exec perl\ -e\ \\\$ENV\\\{\\\"PARALLEL_PID\\\"\\\}=\\\"2554030\\\"\\\;\
      -  \\$ENV\\\{\\\"PARALLEL_SEQ\\\"\\\}=\\\"1\\\"\\\;\\\$bashfunc\\\ =\\\ \\\"\\\"\
      -  \\;@ARGV=\\\"echo\\\ bar\\\"\\\;\\\$SIG\\\{CHLD\\\}=sub\\\{\\\$done=1\\\;\\\}\
      -  \\;\\\$pid=fork\\\;unless\\\(\\\$pid\\\)\\\{setpgrp\\\;exec\\\$ENV\\\{SHELL\\\
      -  },\\\"-c\\\",\\\(\\\$bashfunc.\\\"@ARGV\\\"\\\)\\\;die\\\"exec:\\\$\\\!\\\\n\\
      -  \"\\\;\\\}do\\\{\\\$s=\\\$s\\\<1\\\?0.001+\\\$s\\\*1.03:\\\$s\\\;select\\\(
      -  undef,undef,undef,\\\$s\\\)\\\;\\\}until\\\(\\\$done\\\|\\\|getppid==1\\\)\\\;
      -  kill\\\(SIGHUP,-\\\$\\\{pid\\\}\\\)unless\\\$done\\\;wait\\\;exit\\\(\\\$\\\?\
      -  \\&127\\\?128+\\\(\\\$\\\?\\\&127\\\):1+\\\$\\\?\\\>\\\>8\\\);
      +
        ssh lo -- exec perl -e \''@GNU_Parallel=("use","IPC::Open3;","use","MIME::Base64");
      +  eval"@GNU_Parallel";my$eval;$eval=decode_base64(join"",@ARGV);eval$eval;'\' 
      +  JEVOVnsiUEFSQUxMRUxfUElEIn09IjI3MzQiOyRFTlZ7IlBBUkFMTEVMX1NFUSJ9PSIx
      +  IjskYmFzaGZ1bmMgPSAiIjtAQVJHVj0iZWNobyBiYXIiOyRzaGVsbD0iJEVOVntTSEVM
      +  TH0iOyR0bXBkaXI9Ii90bXAiOyRuaWNlPTA7ZG97JEVOVntQQVJBTExFTF9UTVB9PSR0
      +  bXBkaXIuIi9wYXIiLmpvaW4iIixtYXB7KDAuLjksImEiLi4ieiIsIkEiLi4iWiIpW3Jh
      +  bmQoNjIpXX0oMS4uNSk7fXdoaWxlKC1lJEVOVntQQVJBTExFTF9UTVB9KTskU0lHe0NI
      +  TER9PXN1YnskZG9uZT0xO307JHBpZD1mb3JrO3VubGVzcygkcGlkKXtzZXRwZ3JwO2V2
      +  YWx7c2V0cHJpb3JpdHkoMCwwLCRuaWNlKX07ZXhlYyRzaGVsbCwiLWMiLCgkYmFzaGZ1
      +  bmMuIkBBUkdWIik7ZGllImV4ZWM6JCFcbiI7fWRveyRzPSRzPDE/MC4wMDErJHMqMS4w
      +  MzokcztzZWxlY3QodW5kZWYsdW5kZWYsdW5kZWYsJHMpO311bnRpbCgkZG9uZXx8Z2V0
      +  cHBpZD09MSk7a2lsbChTSUdIVVAsLSR7cGlkfSl1bmxlc3MkZG9uZTt3YWl0O2V4aXQo
      +  JD8mMTI3PzEyOCsoJD8mMTI3KToxKyQ/Pj44KQ==;
         bar

      When the command gets more complex, the output is so hard to read, that it is only useful for debugging:

      @@ -1660,37 +1822,104 @@

      Output will be similar to:

      -
        ( ssh lo mkdir -p ./.parallel/tmp/aspire-2554425-1;rsync --protocol 30 -rlDzR 
      -  -essh ./abc-file lo:./.parallel/tmp/aspire-2554425-1 );ssh lo exec perl -e \''
      -  @GNU_Parallel=("use","IPC::Open3;","use","MIME::Base64");eval"@GNU_Parallel";
      -  $SIG{CHLD}="IGNORE";my$zip=(grep{-x$_}"/usr/local/bin/bzip2")[0]||"bzip2";my(
      -  $in,$out,$eval);open3($in,$out,">&STDERR",$zip,"-dc");if(my$perlpid=fork){
      -  close$in;$eval=join"",<$out>;close$out;}else{close$out;print$in(decode_base64(
      -  join"",@ARGV));close$in;exit;}wait;eval$eval;'\' QlpoOTFBWSZTWayP388AAbdfgAAQd
      -  X/+3//l/wS/7//vQAIq3U6bauIpk1NPUwnqGgND1NGI9TTQ0A0ADIDQNITU9NGqfonpPJRvU0ZQZAA
      -  GhpoBoABpqaFNBMh+kGoybUaHogwCYBAADCSgRNqek1TxTeknqemhGyBqek8pk2jRPSeo002mQRo5f
      -  oSZYrgzQFDd3HNWaskbx+MxNR89BdDzESFbADOJkI+QhIlnojHCWRVuGc2j2lzMzE41wC7auAMQ06c
      -  S3AlqQfKcdo0gd506U0HzAAxMkGJBHjDCZULOMpVbowhIVxxaQz7yansTsBgurEZaGO/6K0Nc4iodr
      -  BW4m9SXErqRbLNy5eANDvZ+TIt2c2GBcWSlmYuloxY5u2bGUdU/dGsO5EhyrvKCpZMhIgmQFAQhcwR
      -  mD+jMKRawkRFJSGyTNC3PqWnE51ucPyx29Yxjnkyub98lytpyk+v8BUc4eA3xz98dMYjxvb0pgWksh
      -  oHZ7HwGQRq1vuDyzKgkwPL9lwGIdL+WPNJFSljlVAahIhQpDCAOJpTqDhgmfoRQcy54PC9T0T3iMnV
      -  JeTUdL8P0/s18NqDSUavMNV3qD0CtYi6entl0neNsOQN2VDSLHj0xOMls65LNPo+Wh28rJtVoh2JgE
      -  7Q9Qo/XBr6krGIsYpQR6nRDuJCD/5aaQBBFFQGtv2VoFTwkXiUTxFP1CC4AGBznAaMklgWQvVtKguJ
      -  zQnPqr9ABtHwbB5GTzPOQ4iWAmrUxvl4j5wqrVchOZcs3NYUQmGO2+VYBimFVxhGcaxDALMZ6bWEUo
      -  yt8eC8W5o1ObFtTnHAvjOQgYEL/nHTcxU0G57QMKCzJcASQWFNpe2CpQcgYlBxIN4kwtfxdyRThQkK
      -  yP388;_EXIT_status=$?; mkdir -p ./.; rsync --protocol 30 --rsync-path=cd\ 
      -  ./.parallel/tmp/aspire-2554425-1/./.\;\ rsync -rlDzR -essh lo:./abc-file.out 
      -  ./.;ssh lo \(rm\ -f\ ./.parallel/tmp/aspire-2554425-1/abc-file\;\ sh\ -c\ \'
      -  rmdir\ ./.parallel/tmp/aspire-2554425-1/\ ./.parallel/tmp/\ ./.parallel/\ 2\>
      -  /dev/null\'\;rm\ -rf\ ./.parallel/tmp/aspire-2554425-1\;\);ssh lo \(rm\ -f\ 
      -  ./.parallel/tmp/aspire-2554425-1/abc-file.out\;\ sh\ -c\ \'rmdir\ ./.parallel
      -  /tmp/aspire-2554425-1/\ ./.parallel/tmp/\ ./.parallel/\ 2\>/dev/null\'\;rm\ 
      -  -rf\ ./.parallel/tmp/aspire-2554425-1\;\);ssh lo rm -rf .parallel/tmp/
      -  aspire-2554425-1; exit $_EXIT_status;
      +
        ( ssh lo -- mkdir -p ./.parallel/tmp/hk-3492-1;rsync --protocol 30
      +  -rlDzR -essh ./abc-file lo:./.parallel/tmp/hk-3492-1 );ssh lo --
      +  exec perl -e \''@GNU_Parallel=("use","IPC::Open3;","use","MIME::Base64");
      +  eval"@GNU_Parallel";my$eval;$eval=decode_base64(join"",@ARGV);eval$eval;'\'
      +  c3lzdGVtKCJta2RpciIsIi1wIiwiLS0iLCIucGFyYWxsZWwvdG1wL2hrLTM0OTItMSIp
      +  OyBjaGRpciAiLnBhcmFsbGVsL3RtcC9oay0zNDkyLTEiIHx8cHJpbnQoU1RERVJSICJw
      +  YXJhbGxlbDogQ2Fubm90IGNoZGlyIHRvIC5wYXJhbGxlbC90bXAvaGstMzQ5Mi0xXG4i
      +  KSAmJiBleGl0IDI1NTskRU5WeyJHUEdfQUdFTlRfSU5GTyJ9PSIvdG1wL2dwZy10WjVI
      +  U0QvUy5ncGctYWdlbnQ6MjM5NzoxIjskRU5WeyJQQVJBTExFTF9TRVEifT0iMSI7JEVO
      +  VnsiU1FMSVRFVEJMIn09InNxbGl0ZTM6Ly8vJTJGdG1wJTJGcGFyYWxsZWwuZGIyL3Bh
      +  cnNxbDIiOyRFTlZ7IlBBUkFMTEVMX1BJRCJ9PSIzNDkyIjskRU5WeyJTUUxJVEUifT0i
      +  c3FsaXRlMzovLy8lMkZ0bXAlMkZwYXJhbGxlbC5kYjIiOyRFTlZ7IlBBUkFMTEVMX1BJ
      +  RCJ9PSIzNDkyIjskRU5WeyJQQVJBTExFTF9TRVEifT0iMSI7QGJhc2hfZnVuY3Rpb25z
      +  PXF3KG15X2Z1bmMzKTsgaWYoJEVOVnsiU0hFTEwifT1+L2NzaC8pIHsgcHJpbnQgU1RE
      +  RVJSICJDU0gvVENTSCBETyBOT1QgU1VQUE9SVCBuZXdsaW5lcyBJTiBWQVJJQUJMRVMv
      +  RlVOQ1RJT05TLiBVbnNldCBAYmFzaF9mdW5jdGlvbnNcbiI7IGV4ZWMgImZhbHNlIjsg
      +  fSAKJGJhc2hmdW5jID0gIm15X2Z1bmMzKCkgeyAgZWNobyBpbiBteV9mdW5jIFwkMSA+
      +  IFwkMS5vdXQKfTtleHBvcnQgLWYgbXlfZnVuYzMgPi9kZXYvbnVsbDsiO0BBUkdWPSJt
      +  eV9mdW5jMyBhYmMtZmlsZSI7JHNoZWxsPSIkRU5We1NIRUxM
      +  fSI7JHRtcGRpcj0iL3RtcCI7JG5pY2U9MTc7ZG97JEVOVntQQVJBTExFTF9UTVB9PSR0
      +  bXBkaXIuIi9wYXIiLmpvaW4iIixtYXB7KDAuLjksImEiLi4ieiIsIkEiLi4iWiIpW3Jh
      +  bmQoNjIpXX0oMS4uNSk7fXdoaWxlKC1lJEVOVntQQVJBTExFTF9UTVB9KTskU0lHe0NI
      +  TER9PXN1YnskZG9uZT0xO307JHBpZD1mb3JrO3VubGVzcygkcGlkKXtzZXRwZ3JwO2V2
      +  YWx7c2V0cHJpb3JpdHkoMCwwLCRuaWNlKX07ZXhlYyRzaGVsbCwiLWMiLCgkYmFzaGZ1
      +  bmMuIkBBUkdWIik7ZGllImV4ZWM6JCFcbiI7fWRveyRzPSRzPDE/MC4wMDErJHMqMS4w
      +  MzokcztzZWxlY3QodW5kZWYsdW5kZWYsdW5kZWYsJHMpO311bnRpbCgkZG9uZXx8Z2V0
      +  cHBpZD09MSk7a2lsbChTSUdIVVAsLSR7cGlkfSl1bmxlc3MkZG9uZTt3YWl0O2V4aXQo
      +  JD8mMTI3PzEyOCsoJD8mMTI3KToxKyQ/Pj44KQ==;_EXIT_status=$?;
      +  mkdir -p ./.; rsync --protocol 30 --rsync-path=cd\
      +  ./.parallel/tmp/hk-3492-1/./.\;\ rsync -rlDzR -essh
      +  lo:./abc-file.out ./.;ssh lo -- \(rm\ -f\
      +  ./.parallel/tmp/hk-3492-1/abc-file\;\ sh\ -c\ \'rmdir\
      +  ./.parallel/tmp/hk-3492-1/\ ./.parallel/tmp/\ ./.parallel/\
      +  2\>/dev/null\'\;rm\ -rf\ ./.parallel/tmp/hk-3492-1\;\);ssh lo --
      +  \(rm\ -f\ ./.parallel/tmp/hk-3492-1/abc-file.out\;\ sh\ -c\ \'rmdir\
      +  ./.parallel/tmp/hk-3492-1/\ ./.parallel/tmp/\ ./.parallel/\
      +  2\>/dev/null\'\;rm\ -rf\ ./.parallel/tmp/hk-3492-1\;\);ssh lo -- rm
      +  -rf .parallel/tmp/hk-3492-1; exit $_EXIT_status;
      + +

      Saving to an SQL base (advanced)

      + +

      GNU parallel can save into an SQL base. Point GNU parallel to a table and it will put the joblog there together with the variables and the output each in their own column.

      + +

      GNU parallel uses a DBURL to address the table. A DBURL has this format:

      + +
        vendor://[[user][:password]@][host][:port]/[database[/table]]
      + +

      Example:

      + +
        mysql://scott:tiger@my.example.com/mydatabase/mytable
      +  postgresql://scott:tiger@pg.example.com/mydatabase/mytable
      +  sqlite3:///%2Ftmp%2Fmydatabase/mytable
      + +

      To refer to /tmp/mydatabase with sqlite you need to encode the / as %2F.

      + +

      Run a job using sqlite on mytable in /tmp/mydatabase:

      + +
        DBURL=sqlite3:///%2Ftmp%2Fmydatabase
      +  DBURLTABLE=$DBURL/mytable
      +  parallel --sqlandworker $DBURLTABLE echo ::: foo bar ::: baz quuz
      + +

      To see the result:

      + +
        sql $DBURL 'SELECT * FROM mytable ORDER BY Seq;'
      + +

      Output will be similar to:

      + +
        Seq|Host|Starttime|JobRuntime|Send|Receive|Exitval|_Signal|Command|V1|V2|Stdout|Stderr
      +  1|:|1451619638.903|0.806||8|0|0|echo foo baz|foo|baz|foo baz
      +  |
      +  2|:|1451619639.265|1.54||9|0|0|echo foo quuz|foo|quuz|foo quuz
      +  |
      +  3|:|1451619640.378|1.43||8|0|0|echo bar baz|bar|baz|bar baz
      +  |
      +  4|:|1451619641.473|0.958||9|0|0|echo bar quuz|bar|quuz|bar quuz
      +  |
      + +

      The first columns are well known from --joblog. V1 and V2 are data from the input sources. Stdout and Stderr are standard output and standard error, respectively.

      + +

      Using multiple workers

      + +

      Using an SQL base as storage costs a lot of performance.

      + +

      One of the situations where it makes sense is if you have multiple workers.

      + +

      You can then have a single master machine that submits jobs to the SQL base (but does not do any of the work):

      + +
        parallel --sql $DBURLTABLE echo ::: foo bar ::: baz quuz
      + +

      On the worker machines you run exactly the same command except you replace --sql with --sqlworker.

      + +
        parallel --sqlworker $DBURLTABLE echo ::: foo bar ::: baz quuz
      + +

      To run a master and a worker on the same machine use --sqlandworker as shown earlier.

      --pipe

      -

      The --pipe functionality puts GNU Parallel in a different mode: Instead of treating the data on stdin (standard input) as arguments for a command to run, the data will be sent to stdin (standard input) of the command.

      +

      The --pipe functionality puts GNU parallel in a different mode: Instead of treating the data on stdin (standard input) as arguments for a command to run, the data will be sent to stdin (standard input) of the command.

      The typical situation is:

      @@ -1700,7 +1929,7 @@

      Chunk size

      -

      By default GNU Parallel will start an instance of command_B, read a chunk of 1 MB, and pass that to the instance. Then start another instance, read another chunk, and pass that to the second instance.

      +

      By default GNU parallel will start an instance of command_B, read a chunk of 1 MB, and pass that to the instance. Then start another instance, read another chunk, and pass that to the second instance.

        cat num1000000 | parallel --pipe wc
      @@ -1714,7 +1943,7 @@ 149796 149796 1048572 85349 85349 597444
      -

      The size of the chunk is not exactly 1 MB because GNU Parallel only passes full lines - never half a line, thus the blocksize is only average 1 MB. You can change the block size to 2 MB with --block:

      +

      The size of the chunk is not exactly 1 MB because GNU parallel only passes full lines - never half a line, thus the blocksize is only average 1 MB. You can change the block size to 2 MB with --block:

        cat num1000000 | parallel --pipe --block 2M wc
      @@ -1725,7 +1954,7 @@ 299593 299593 2097151 85349 85349 597444
      -

      GNU Parallel treats each line as a record. If the order of record is unimportant (e.g. you need all lines processed, but you do not care which is processed first), then you can use --round-robin. Without --round-robin GNU Parallel will start a command per block; with --round-robin only the requested number of jobs will be started (--jobs). The records will then be distributed between the running jobs:

      +

      GNU parallel treats each line as a record. If the order of record is unimportant (e.g. you need all lines processed, but you do not care which is processed first), then you can use --round-robin. Without --round-robin GNU parallel will start a command per block; with --round-robin only the requested number of jobs will be started (--jobs). The records will then be distributed between the running jobs:

        cat num1000000 | parallel --pipe -j4 --round-robin wc
      @@ -1740,9 +1969,9 @@

      Records

      -

      GNU Parallel sees the input as records. The default record is a single line.

      +

      GNU parallel sees the input as records. The default record is a single line.

      -

      Using -N140000 GNU Parallel will read 140000 records at a time:

      +

      Using -N140000 GNU parallel will read 140000 records at a time:

        cat num1000000 | parallel --pipe -N140000 wc
      @@ -1759,7 +1988,7 @@

      Notice that the last job could not get the full 140000 lines, but only 20000 lines.

      -

      If a record is 75 lines -L can be used:

      +

      If a record is 75 lines -L can be used:

        cat num1000000 | parallel --pipe -L75 wc
      @@ -1774,17 +2003,17 @@ 85350 85350 597450 25 25 176
      -

      Notice GNU Parallel still reads a block of around 1 MB; but instead of passing full lines to 'wc' it passes full 75 lines at a time. This of course does not hold for the last job (which in this case got 25 lines).

      +

      Notice GNU parallel still reads a block of around 1 MB; but instead of passing full lines to wc it passes full 75 lines at a time. This of course does not hold for the last job (which in this case got 25 lines).

      Record separators

      -

      GNU Parallel uses separators to determine where two records split.

      +

      GNU parallel uses separators to determine where two records split.

      -

      --recstart gives the string that starts a record; --recend gives the string that ends a record. The default is --recend '\n' (newline).

      +

      --recstart gives the string that starts a record; --recend gives the string that ends a record. The default is --recend '\n' (newline).

      -

      If both --recend and --recstart are given, then the record will only split if the recend string is immediately followed by the recstart string.

      +

      If both --recend and --recstart are given, then the record will only split if the recend string is immediately followed by the recstart string.

      -

      Here the --recend is set to ', ':

      +

      Here the --recend is set to ', ':

        echo /foo, bar/, /baz, qux/, | parallel -kN1 --recend ', ' --pipe echo JOB{#}\;cat\;echo END
      @@ -1800,9 +2029,9 @@ qux/, END
      -

      Here the --recstart is set to '/':

      +

      Here the --recstart is set to /:

      -
        echo /foo, bar/, /baz, qux/, | parallel -kN1 --recstart '/' --pipe echo JOB{#}\;cat\;echo END
      +
        echo /foo, bar/, /baz, qux/, | parallel -kN1 --recstart / --pipe echo JOB{#}\;cat\;echo END

      Output:

      @@ -1816,9 +2045,9 @@ /, END -

      Here both --recend and --recstart are set:

      +

      Here both --recend and --recstart are set:

      -
        echo /foo, bar/, /baz, qux/, | parallel -kN1 --recend ', ' --recstart '/' --pipe echo JOB{#}\;cat\;echo END
      +
        echo /foo, bar/, /baz, qux/, | parallel -kN1 --recend ', ' --recstart / --pipe echo JOB{#}\;cat\;echo END

      Output:

      @@ -1830,9 +2059,9 @@

      Note the difference between setting one string and setting both strings.

      -

      With --regexp the --recend and --recstart will be treated as a regular expression:

      +

      With --regexp the --recend and --recstart will be treated as a regular expression:

      -
        echo foo,bar,_baz,__qux, | parallel -kN1 --regexp --recend ',_+' --pipe echo JOB{#}\;cat\;echo END
      +
        echo foo,bar,_baz,__qux, | parallel -kN1 --regexp --recend ,_+ --pipe echo JOB{#}\;cat\;echo END

      Output:

      @@ -1844,9 +2073,9 @@ qux, END -

      GNU Parallel can remove the record separators with --remove-rec-sep/--rrs:

      +

      GNU parallel can remove the record separators with --remove-rec-sep/--rrs:

      -
        echo foo,bar,_baz,__qux, | parallel -kN1 --rrs --regexp --recend ',_+' --pipe echo JOB{#}\;cat\;echo END
      +
        echo foo,bar,_baz,__qux, | parallel -kN1 --rrs --regexp --recend ,_+ --pipe echo JOB{#}\;cat\;echo END

      Output:

      @@ -1860,7 +2089,7 @@ -

      If the input data has a header, the header can be repeated for each job by matching the header with --header. If headers start with %:

      +

      If the input data has a header, the header can be repeated for each job by matching the header with --header. If headers start with % you can do this:

        cat num_%header | parallel --header '(%.*\n)*' --pipe -N3 echo JOB{#}\;cat
      @@ -1889,7 +2118,7 @@ %head2 10 -

      If the header is 2 lines, --header 2 will work:

      +

      If the header is 2 lines, --header 2 will work:

        cat num_%header | parallel --header 2 --pipe -N3 echo JOB{#}\;cat
      @@ -1897,7 +2126,7 @@

      --pipepart

      -

      --pipe is not very efficient. It maxes out at around 500 MB/s. --pipepart can easily deliver 5 GB/s. But there are a few limitations. The input has to be a normal file (not a pipe) given by -a or :::: and -L/-l/-N do not work.

      +

      --pipe is not very efficient. It maxes out at around 500 MB/s. --pipepart can easily deliver 5 GB/s. But there are a few limitations. The input has to be a normal file (not a pipe) given by -a or :::: and -L/-l/-N do not work.

        parallel --pipepart -a num1000000 --block 3m wc
      @@ -1911,17 +2140,17 @@

      Input data and parallel command in the same file

      -

      GNU Parallel is often called as:

      +

      GNU parallel is often called as this:

        cat input_file | parallel command
      -

      With --shebang the input_file and parallel can be combined into the same script.

      +

      With --shebang the input_file and parallel can be combined into the same script.

      -

      UNIX-scripts start with a shebang line like:

      +

      UNIX-scripts start with a shebang line like this:

        #!/bin/bash
      -

      GNU Parallel can do that, too. With --shebang the arguments can be listed in the file. The parallel command is the first line of the script:

      +

      GNU parallel can do that, too. With --shebang the arguments can be listed in the file. The parallel command is the first line of the script:

        #!/usr/bin/parallel --shebang -r echo
       
      @@ -1937,19 +2166,19 @@
       
       

      Parallelizing existing scripts

      -

      GNU Parallel is often called as:

      +

      GNU parallel is often called as:

        cat input_file | parallel command
         parallel command ::: foo bar
      -

      If command is a script parallel can be combined into a single file so:

      +

      If command is a script parallel can be combined into a single file so:

        cat input_file | command
         command foo bar
      -

      will run the script in parallel.

      +

      will run the script in parallel.

      -

      This perl script perl_echo works like echo:

      +

      This perl script perl_echo works like echo:

        #!/usr/bin/perl
       
      @@ -1959,7 +2188,7 @@
       
       
        parallel perl_echo ::: foo bar
      -

      By changing the #!-line it can be run in parallel

      +

      By changing the #!-line it can be run in parallel:

        #!/usr/bin/parallel --shebang-wrap /usr/bin/perl
       
      @@ -1983,56 +2212,92 @@
       
       

      #!/usr/bin/parallel --shebang-wrap /usr/bin/perl

      +

      print "Arguments @ARGV\n";

      +
      Python:

      #!/usr/bin/parallel --shebang-wrap /usr/bin/python

      +

      import sys

      + +

      print 'Arguments', str(sys.argv)

      +
      Bash:

      #!/usr/bin/parallel --shebang-wrap /bin/bash

      +

      echo Arguments "$@"

      +
      R:

      #!/usr/bin/parallel --shebang-wrap /usr/bin/Rscript --vanilla --slave

      +

      args <- commandArgs(trailingOnly = TRUE)
      print(paste("Arguments ",args))

      +
      GNUplot:

      #!/usr/bin/parallel --shebang-wrap ARG={} /usr/bin/gnuplot

      +

      print "Arguments ", system('echo $ARG')

      +
      Ruby:

      #!/usr/bin/parallel --shebang-wrap /usr/bin/ruby

      +

      print "Arguments "
      puts ARGV

      + +
      +
      Octave:
      +
      + +

      #!/usr/bin/parallel --shebang-wrap /usr/bin/octave

      + +

      printf ("Arguments"); arg_list = argv (); for i = 1:nargin printf (" %s", arg_list{i}); endfor printf ("\n");

      + +
      +
      Common LISP:
      +
      + +

      #!/usr/bin/parallel --shebang-wrap /usr/bin/clisp

      + +

      (format t "~&~S~&" 'Arguments) (format t "~&~S~&" *args*)

      + +

      LUA PHP Javascript nodejs Tcl C#?

      +

      Semaphore

      -

      GNU Parallel can work as a counting semaphore. This is slower and less efficient than its normal mode.

      +

      GNU parallel can work as a counting semaphore. This is slower and less efficient than its normal mode.

      A counting semaphore is like a row of toilets. People needing a toilet can use any toilet, but if there are more people than toilets, they will have to wait for one of the toilets to be available.

      -

      An alias for 'parallel --semaphore' is 'sem'.

      +

      An alias for parallel --semaphore is sem.

      -

      'sem' will follow a person to the toilets, wait until a toilet is available, leave the person in the toilet and exit.

      +

      sem will follow a person to the toilets, wait until a toilet is available, leave the person in the toilet and exit.

      -

      'sem --fg' will follow a person to the toilets, wait until a toilet is available, stay with the person in the toilet and exit when the person exits.

      +

      sem --fg will follow a person to the toilets, wait until a toilet is available, stay with the person in the toilet and exit when the person exits.

      -

      'sem --wait' will wait for all persons to leave the toilets.

      +

      sem --wait will wait for all persons to leave the toilets.

      -

      'sem' does not have a queue discipline, so the next person is chosen randomly.

      +

      sem does not have a queue discipline, so the next person is chosen randomly.

      -

      -j sets the number of toilets. The default is to have only one toilet (technically this is called a mutex). The program is started in the background and 'sem' exits immediately. Use --wait to wait for all 'sem's to finish:

      +

      -j sets the number of toilets.

      + +

      Mutex

      + +

      The default is to have only one toilet (this is called a mutex). The program is started in the background and sem exits immediately. Use --wait to wait for all sems to finish:

        sem 'sleep 1; echo The first finished' &&
           echo The first is now running in the background &&
      @@ -2047,7 +2312,7 @@
         The second is now running in the background
         The second finished
      -

      The command can be run in the foreground with --fg, which will only exit when the command completes:

      +

      The command can be run in the foreground with --fg, which will only exit when the command completes:

        sem --fg 'sleep 1; echo The first finished' &&
           echo The first finished running in the foreground &&
      @@ -2055,9 +2320,9 @@
           echo The second finished running in the foreground
         sem --wait
      -

      The difference between this and just running the command, is that a mutex is set, so if other sems were running in the background only one would run at the same time.

      +

      The difference between this and just running the command, is that a mutex is set, so if other sems were running in the background only one would run at a time.

      -

      To tell the difference between which semaphore is used, use --semaphorename/--id. Run this in one terminal:

      +

      To tell the difference between which semaphore is used, use --semaphorename/--id. Run this in one terminal:

        sem --id my_id -u 'echo First started; sleep 10; echo The first finished'
      @@ -2071,7 +2336,7 @@

      A mutex is like having a single toilet: When it is in use everyone else will have to wait. A counting semaphore is like having multiple toilets: Several people can use the toilets, but when they all are in use, everyone else will have to wait.

      -

      sem can emulate a counting semaphore. Use --jobs to set the number of toilets:

      +

      sem can emulate a counting semaphore. Use --jobs to set the number of toilets like this:

        sem --jobs 3 --id my_id -u 'echo First started; sleep 5; echo The first finished' &&
         sem --jobs 3 --id my_id -u 'echo Second started; sleep 6; echo The second finished' &&
      @@ -2092,7 +2357,7 @@
       
       

      Timeout

      -

      With --semaphoretimeout you can force running the command anyway after a period (positive number) or give up (negative number):

      +

      With --semaphoretimeout you can force running the command anyway after a period (positive number) or give up (negative number):

        sem --id foo -u 'echo Slow started; sleep 5; echo Slow ended' &&
         sem --id foo --semaphoretimeout 1 'echo Force this running after 1 sec' &&
      @@ -2111,9 +2376,9 @@
       
       

      Informational

      -

      GNU Parallel has some options to give short information about the configuration.

      +

      GNU parallel has some options to give short information about the configuration.

      -

      --help will print a summary of the most important options:

      +

      --help will print a summary of the most important options:

        parallel --help
      @@ -2146,11 +2411,11 @@ When using GNU Parallel for a publication please cite: O. Tange (2011): GNU Parallel - The Command-Line Power Tool, - ;login: The USENIX Magazine, February 2011:42-47.
      + ;login: The USENIX Magazine, February 2011:42-47. -

      When asking for help, always report the full output of:

      + When asking for help, always report the full output of this: -
        parallel --version
      + parallel --version

      Output:

      @@ -2167,7 +2432,7 @@ O. Tange (2011): GNU Parallel - The Command-Line Power Tool, ;login: The USENIX Magazine, February 2011:42-47.
      -

      In scripts --minversion can be used to ensure the user has at least this version:

      +

      In scripts --minversion can be used to ensure the user has at least this version:

        parallel --minversion 20130722 && echo Your version is at least 20130722.
      @@ -2176,7 +2441,7 @@
        20130722
         Your version is at least 20130722.
      -

      If using GNU Parallel for research the BibTeX citation can be generated using --bibtex.

      +

      If using GNU parallel for research the BibTeX citation can be generated using --bibtex:

        parallel --bibtex
      @@ -2195,7 +2460,7 @@ pages = {42-47} }
      -

      With --max-line-length-allowed GNU Parallel will report the maximal size of the command line:

      +

      With --max-line-length-allowed GNU parallel will report the maximal size of the command line:

        parallel --max-line-length-allowed
      @@ -2203,7 +2468,7 @@
        131071
      -

      --number-of-cpus and --number-of-cores run system specific code to determine the number of CPUs and CPU cores on the system. On unsupported platforms they will return 1:

      +

      --number-of-cpus and --number-of-cores run system specific code to determine the number of CPUs and CPU cores on the system. On unsupported platforms they will return 1:

        parallel --number-of-cpus 
         parallel --number-of-cores
      @@ -2215,9 +2480,9 @@

      Profiles

      -

      The defaults for GNU Parallel can be changed systemwise by putting the command line options in /etc/parallel/config. They can be changed for a user by putting them in ~/.parallel/config.

      +

      The defaults for GNU parallel can be changed systemwide by putting the command line options in /etc/parallel/config. They can be changed for a user by putting them in ~/.parallel/config.

      -

      Profiles work the same way, but have to be referred to with --profile:

      +

      Profiles work the same way, but have to be referred to with --profile:

        echo '--nice 17' > ~/.parallel/nicetimeout
         echo '--timeout 300%' >> ~/.parallel/nicetimeout
      @@ -2244,7 +2509,7 @@
       
       

      I hope you have learned something from this tutorial.

      -

      If you like GNU Parallel:

      +

      If you like GNU parallel:

        @@ -2257,7 +2522,7 @@
      • Post the intro videos and the tutorial on Reddit, Diaspora*, forums, blogs, Identi.ca, Google+, Twitter, Facebook, Linkedin, mailing lists

      • -
      • Request or write a review for your favourite blog or magazine

        +
      • Request or write a review for your favourite blog or magazine (especially if you do something cool with GNU parallel)

      • Invite me for your next conference

        @@ -2265,16 +2530,16 @@
      -

      If you use GNU Parallel for research:

      +

      If you use GNU parallel for research:

        -
      • Please cite GNU Parallel in your publications (use --bibtex)

        +
      • Please cite GNU parallel in your publications (use --bibtex)

      -

      If GNU Parallel saves you money:

      +

      If GNU parallel saves you money:

        @@ -2283,7 +2548,7 @@
      -

      (C) 2013,2014,2015 Ole Tange, GPLv3

      +

      (C) 2013,2014,2015,2016 Ole Tange, GPLv3

      diff --git a/src/parallel_tutorial.pod b/src/parallel_tutorial.pod index a0af2232..e2894562 100644 --- a/src/parallel_tutorial.pod +++ b/src/parallel_tutorial.pod @@ -2,8 +2,8 @@ =head1 GNU Parallel Tutorial -This tutorial shows off much of GNU Parallel's functionality. The -tutorial is meant to learn the options in GNU Parallel. The tutorial +This tutorial shows off much of GNU B's functionality. The +tutorial is meant to learn the options in GNU B. The tutorial is not to show realistic examples from the real world. Spend an hour walking through the tutorial. Your command line will @@ -107,7 +107,7 @@ and using an empty pass phrase. =head1 Input sources -GNU Parallel reads input from input sources. These can be files, the +GNU B reads input from input sources. These can be files, the command line, and stdin (standard input or a pipe). =head2 A single input source @@ -138,8 +138,8 @@ Output: Same as above. =head2 Multiple input sources -GNU Parallel can take multiple input sources given on the command -line. GNU Parallel then generates all combinations of the input +GNU B can take multiple input sources given on the command +line. GNU B then generates all combinations of the input sources: parallel echo ::: A B C ::: D E F @@ -162,13 +162,13 @@ The input sources can be files: Output: Same as above. -STDIN (standard input) can be one of the input sources using '-': +STDIN (standard input) can be one of the input sources using B<->: cat abc-file | parallel -a - -a def-file echo Output: Same as above. -Instead of -a files can be given after '::::': +Instead of B<-a> files can be given after B<::::>: cat abc-file | parallel echo :::: - def-file @@ -182,7 +182,7 @@ Output: Same as above. 
=head3 Matching arguments from all input sources -With --xapply you can get one argument from each input source: +With B<--xapply> you can get one argument from each input source: parallel --xapply echo ::: A B C ::: D E F @@ -206,8 +206,8 @@ Output (the order may be different): =head2 Changing the argument separator. -GNU Parallel can use other separators than ::: or ::::. This is -typically useful if ::: or :::: is used in the command to run: +GNU B can use other separators than B<:::> or B<::::>. This is +typically useful if B<:::> or B<::::> is used in the command to run: parallel --arg-sep ,, echo ,, A B C :::: def-file @@ -232,8 +232,8 @@ Output: Same as above. =head2 Changing the argument delimiter -GNU Parallel will normally treat a full line as a single argument: It -uses \n as argument delimiter. This can be changed with -d: +GNU B will normally treat a full line as a single argument: It +uses B<\n> as argument delimiter. This can be changed with B<-d>: parallel -d _ echo :::: abc_-file @@ -243,14 +243,14 @@ Output (the order may be different): B C -NULL can be given as \0: +NULL can be given as B<\0>: parallel -d '\0' echo :::: abc0-file Output: Same as above. -A shorthand for -d '\0' is -0 (this will often be used to read files -from find ... -print0): +A shorthand for B<-d '\0'> is B<-0> (this will often be used to read files +from B): parallel -0 echo :::: abc0-file @@ -258,7 +258,7 @@ Output: Same as above. =head2 End-of-file value for input source -GNU Parallel can stop reading when it encounters a certain value: +GNU B can stop reading when it encounters a certain value: parallel -E stop echo ::: A B stop C D @@ -269,7 +269,7 @@ Output: =head2 Skipping empty lines -Using --no-run-if-empty GNU Parallel will skip empty lines. +Using B<--no-run-if-empty> GNU B will skip empty lines. 
(echo 1; echo; echo 2) | parallel --no-run-if-empty echo @@ -295,7 +295,7 @@ Output (the order may be different): [/path/to/current/working/dir] The command can be a script, a binary or a Bash function if the function is -exported using 'export -f': +exported using B: # Only works in Bash my_func() { @@ -314,8 +314,8 @@ Output (the order may be different): =head3 The 7 predefined replacement strings -GNU Parallel has several replacement strings. If no replacement -strings are used the default is to append {}: +GNU B has several replacement strings. If no replacement +strings are used the default is to append B<{}>: parallel echo ::: A/B.C @@ -323,7 +323,7 @@ Output: A/B.C -The default replacement string is {}: +The default replacement string is B<{}>: parallel echo {} ::: A/B.C @@ -331,7 +331,7 @@ Output: A/B.C -The replacement string {.} removes the extension: +The replacement string B<{.}> removes the extension: parallel echo {.} ::: A/B.C @@ -339,7 +339,7 @@ Output: A/B -The replacement string {/} removes the path: +The replacement string B<{/}> removes the path: parallel echo {/} ::: A/B.C @@ -347,7 +347,7 @@ Output: B.C -The replacement string {//} keeps only the path: +The replacement string B<{//}> keeps only the path: parallel echo {//} ::: A/B.C @@ -355,7 +355,7 @@ Output: A -The replacement string {/.} removes the path and the extension: +The replacement string B<{/.}> removes the path and the extension: parallel echo {/.} ::: A/B.C @@ -363,7 +363,7 @@ Output: B -The replacement string {#} gives the job number: +The replacement string B<{#}> gives the job number: parallel echo {#} ::: A B C @@ -373,7 +373,7 @@ Output (the order may be different): 2 3 -The replacement string {%} gives the job slot number (between 1 and +The replacement string B<{%}> gives the job slot number (between 1 and number of jobs to run in parallel): parallel -j 2 echo {%} ::: A B C @@ -386,7 +386,7 @@ Output (the order may be different and 1 and 2 may be swapped): =head3 Changing 
the replacement strings -The replacement string {} can be changed with -I: +The replacement string B<{}> can be changed with B<-I>: parallel -I ,, echo ,, ::: A/B.C @@ -394,7 +394,7 @@ Output: A/B.C -The replacement string {.} can be changed with --extensionreplace: +The replacement string B<{.}> can be changed with B<--extensionreplace>: parallel --extensionreplace ,, echo ,, ::: A/B.C @@ -402,7 +402,7 @@ Output: A/B -The replacement string {/} can be replaced with --basenamereplace: +The replacement string B<{/}> can be replaced with B<--basenamereplace>: parallel --basenamereplace ,, echo ,, ::: A/B.C @@ -410,7 +410,7 @@ Output: B.C -The replacement string {//} can be changed with --dirnamereplace: +The replacement string B<{//}> can be changed with B<--dirnamereplace>: parallel --dirnamereplace ,, echo ,, ::: A/B.C @@ -418,7 +418,7 @@ Output: A -The replacement string {/.} can be changed with --basenameextensionreplace: +The replacement string B<{/.}> can be changed with B<--basenameextensionreplace>: parallel --basenameextensionreplace ,, echo ,, ::: A/B.C @@ -426,7 +426,7 @@ Output: B -The replacement string {#} can be changed with --seqreplace: +The replacement string B<{#}> can be changed with B<--seqreplace>: parallel --seqreplace ,, echo ,, ::: A B C @@ -436,7 +436,7 @@ Output (the order may be different): 2 3 -The replacement string {%} can be changed with --slotreplace: +The replacement string B<{%}> can be changed with B<--slotreplace>: parallel -j2 --slotreplace ,, echo ,, ::: A B C @@ -450,7 +450,7 @@ Output (the order may be different and 1 and 2 may be swapped): When predefined replacement strings are not flexible enough a perl expression can be used instead. 
One example is to remove two -extensions: foo.tar.gz -> foo +extensions: foo.tar.gz becomes foo parallel echo '{= s:\.[^.]+$::;s:\.[^.]+$::; =}' ::: foo.tar.gz @@ -458,26 +458,69 @@ Output: foo -If the strings B<{=> and B<=}> cause problems they can be replaced with --parens: +In B<{= =}> you can access all of GNU B's internal functions +and variables. A few are worth mentioning. + +B returns the total number of jobs: + + parallel echo Job {#} of {= '$_=total_jobs()' =} ::: {1..5} + +Output: + + Job 1 of 5 + Job 2 of 5 + Job 3 of 5 + Job 4 of 5 + Job 5 of 5 + +B shell quotes the string: + + parallel echo {} shell quoted is {= '$_=Q($_)' =} ::: '*/!#$' + +B<$job->>B skips the job: + + parallel echo {= 'if($_==3) { $job->skip() }' =} ::: {1..5} + +Output: + + 1 + 2 + 4 + 5 + +B<@arg> contains the input source variables: + + parallel echo {= 'if($arg[1]==$arg[2]) { $job->skip() }' =} ::: {1..3} ::: {1..3} + +Output: + + 1 2 + 1 3 + 2 1 + 2 3 + 3 1 + 3 2 + +If the strings B<{=> and B<=}> cause problems they can be replaced with B<--parens>: parallel --parens ,,,, echo ',, s:\.[^.]+$::;s:\.[^.]+$::; ,,' ::: foo.tar.gz Output: Same as above. -To define a short hand replacement string use B<--rpl>: +To define a shorthand replacement string use B<--rpl>: parallel --rpl '.. s:\.[^.]+$::;s:\.[^.]+$::;' echo '..' ::: foo.tar.gz Output: Same as above. -If the short hand starts with '{' it can be used as a positional +If the shorthand starts with B<{> it can be used as a positional replacement string, too: parallel --rpl '{..} s:\.[^.]+$::;s:\.[^.]+$::;' echo '{..}' ::: foo.tar.gz Output: Same as above. 
-GNU B's 7 replacement strings are implemented as: +GNU B's 7 replacement strings are implemented as this: --rpl '{} ' --rpl '{#} $_=$job->seq()' @@ -490,7 +533,7 @@ GNU B's 7 replacement strings are implemented as: =head3 Positional replacement strings With multiple input sources the argument from the individual input -sources can be access with {number}: +sources can be accessed with B<{>numberB<}>: parallel echo {1} and {2} ::: A B ::: C D @@ -501,7 +544,7 @@ Output (the order may be different): B and C B and D -The positional replacement strings can also be modified using / // /. and .: +The positional replacement strings can also be modified using B, B, B, and B<.>: parallel echo /={1/} //={1//} /.={1/.} .={1.} ::: A/B.C D/E.F @@ -538,8 +581,8 @@ Output: foo bar -If a defined short hand starts with '{' it can be used as a positional -replacement string, too: +If shorthand defined using B<--rpl> starts with B<{> it can be used as +a positional replacement string, too: parallel --rpl '{..} s:\.[^.]+$::;s:\.[^.]+$::;' echo '{2..} {1}' ::: bar ::: foo.tar.gz @@ -549,7 +592,7 @@ Output: Same as above. =head3 Input from columns The columns in a file can be bound to positional replacement strings -using --colsep. Here the columns are separated with TAB (\t): +using B<--colsep>. Here the columns are separated by TAB (\t): parallel --colsep '\t' echo 1={1} 2={2} :::: tsv-file.tsv @@ -561,9 +604,9 @@ Output (the order may be different): =head3 Header defined replacement strings -With --header GNU Parallel will use the first value of the input +With B<--header> GNU B will use the first value of the input source as the name of the replacement string. 
Only the non-modified -version {} is supported: +version B<{}> is supported: parallel --header : echo f1={f1} f2={f2} ::: f1 A B ::: f2 C D @@ -574,7 +617,7 @@ Output (the order may be different): f1=B f2=C f1=B f2=D -It is useful with --colsep for processing files with TAB separated values: +It is useful with B<--colsep> for processing files with TAB separated values: parallel --header : --colsep '\t' echo f1={f1} f2={f2} :::: tsv-file.tsv @@ -583,9 +626,41 @@ Output (the order may be different): f1=A f2=B f1=C f2=D +=head3 More pre-defined replacement strings + +B<--plus> adds the replacement strings B<{+/} {+.} {+..} {+...} {..} {...} +{/..} {/...} {##}>. The idea being that B<{+foo}> matches the opposite of B<{foo}> +and B<{}> = B<{+/}>/B<{/}> = B<{.}>.B<{+.}> = B<{+/}>/B<{/.}>.B<{+.}> = B<{..}>.B<{+..}> = +B<{+/}>/B<{/..}>.B<{+..}> = B<{...}>.B<{+...}> = B<{+/}>/B<{/...}>.B<{+...}>. + + parallel --plus echo {} ::: dir/sub/file.ext1.ext2.ext3 + parallel --plus echo {+/}/{/} ::: dir/sub/file.ext1.ext2.ext3 + parallel --plus echo {.}.{+.} ::: dir/sub/file.ext1.ext2.ext3 + parallel --plus echo {+/}/{/.}.{+.} ::: dir/sub/file.ext1.ext2.ext3 + parallel --plus echo {..}.{+..} ::: dir/sub/file.ext1.ext2.ext3 + parallel --plus echo {+/}/{/..}.{+..} ::: dir/sub/file.ext1.ext2.ext3 + parallel --plus echo {...}.{+...} ::: dir/sub/file.ext1.ext2.ext3 + parallel --plus echo {+/}/{/...}.{+...} ::: dir/sub/file.ext1.ext2.ext3 + +Output: + + dir/sub/file.ext1.ext2.ext3 + +B<{##}> is simply the number of jobs: + + parallel --plus echo Job {#} of {##} ::: {1..5} + +Output: + + Job 1 of 5 + Job 2 of 5 + Job 3 of 5 + Job 4 of 5 + Job 5 of 5 + =head2 More than one argument -With --xargs will GNU Parallel fit as many arguments as possible on a +With B<--xargs> GNU B will fit as many arguments as possible on a single line: cat num30000 | parallel --xargs echo | wc -l @@ -596,7 +671,7 @@ Output (if you run this under Bash on GNU/Linux): The 30000 arguments fitted on 2 lines. 
-The maximal length of a single line can be set with -s. With a maximal +The maximal length of a single line can be set with B<-s>. With a maximal line length of 10000 chars 17 commands will be run: cat num30000 | parallel --xargs -s 10000 echo | wc -l @@ -605,15 +680,15 @@ Output: 17 -For better parallelism GNU Parallel can distribute the arguments +For better parallelism GNU B can distribute the arguments between all the parallel jobs when end of file is met. -Below GNU Parallel reads the last argument when generating the second -job. When GNU Parallel reads the last argument, it spreads all the +Below GNU B reads the last argument when generating the second +job. When GNU B reads the last argument, it spreads all the arguments for the second job over 4 jobs instead, as 4 parallel jobs are requested. -The first job will be the same as the --xargs example above, but the +The first job will be the same as the B<--xargs> example above, but the second job will be split into 4 evenly sized jobs, resulting in a total of 5 jobs: @@ -635,7 +710,7 @@ Output: 7 8 9 10 -A replacement string can be part of a word. -m will not repeat the context: +A replacement string can be part of a word. 
B<-m> will not repeat the context: parallel --jobs 4 -m echo pre-{}-post ::: A B C D E F G @@ -646,7 +721,7 @@ Output (the order may be different): pre-E F-post pre-G-post -To repeat the context use -X which otherwise works like -m: +To repeat the context use B<-X> which otherwise works like B<-m>: parallel --jobs 4 -X echo pre-{}-post ::: A B C D E F G @@ -657,7 +732,7 @@ Output (the order may be different): pre-E-post pre-F-post pre-G-post -To limit the number of arguments use -N: +To limit the number of arguments use B<-N>: parallel -N3 echo ::: A B C D E F G H @@ -667,7 +742,7 @@ Output (the order may be different): D E F G H --N also sets the positional replacement strings: +B<-N> also sets the positional replacement strings: parallel -N3 echo 1={1} 2={2} 3={3} ::: A B C D E F G H @@ -677,7 +752,7 @@ Output (the order may be different): 1=D 2=E 3=F 1=G 2=H 3= --N0 reads 1 argument but inserts none: +B<-N0> reads 1 argument but inserts none: parallel -N0 echo foo ::: 1 2 3 @@ -691,7 +766,7 @@ Output: Command lines that contain special characters may need to be protected from the shell. -The perl program 'print "@ARGV\n"' basically works like echo. +The B program B basically works like B. perl -e 'print "@ARGV\n"' A @@ -707,7 +782,7 @@ Output: [Nothing] -To quote the command use -q: +To quote the command use B<-q>: parallel -q perl -e 'print "@ARGV\n"' ::: This works @@ -716,7 +791,7 @@ Output (the order may be different): This works -Or you can quote the critical part using \': +Or you can quote the critical part using B<\'>: parallel perl -e \''print "@ARGV\n"'\' ::: This works, too @@ -726,7 +801,7 @@ Output (the order may be different): works, too -GNU Parallel can also \-quote full lines. Simply run: +GNU B can also \-quote full lines. Simply run this: parallel --shellquote parallel: Warning: Input is read from the terminal. Only experts do this on purpose. Press CTRL-D to exit. 
@@ -750,7 +825,7 @@ Output (the order may be different): =head2 Trimming space -Space can be trimmed on the arguments using --trim: +Space can be trimmed on the arguments using B<--trim>: parallel --trim r echo pre-{}-post ::: ' A ' @@ -787,7 +862,7 @@ Output (the order may be different): B foo-B C foo-C -To prefix it with another string use --tagstring: +To prefix it with another string use B<--tagstring>: parallel --tagstring {}-bar echo foo-{} ::: A B C @@ -797,7 +872,7 @@ Output (the order may be different): B-bar foo-B C-bar foo-C -To see what commands will be run without running them: +To see what commands will be run without running them use B<--dryrun>: parallel --dryrun echo {} ::: A B C @@ -807,7 +882,7 @@ Output (the order may be different): echo B echo C -To print the command before running them use --verbose: +To print the command before running them use B<--verbose>: parallel --verbose echo {} ::: A B C @@ -820,7 +895,7 @@ Output (the order may be different): B C -GNU Parallel will postpone the output until the command completes: +GNU B will postpone the output until the command completes: parallel -j2 'printf "%s-start\n%s" {} {};sleep {};printf "%s\n" -middle;echo {}-end' ::: 4 2 1 @@ -836,7 +911,7 @@ Output: 4-middle 4-end -To get the output immediately use --ungroup: +To get the output immediately use B<--ungroup>: parallel -j2 --ungroup 'printf "%s-start\n%s" {} {};sleep {};printf "%s\n" -middle;echo {}-end' ::: 4 2 1 @@ -852,11 +927,11 @@ Output: -middle 4-end ---ungroup is fast, but can cause half a line from one job to be mixed +B<--ungroup> is fast, but can cause half a line from one job to be mixed with half a line of another job. That has happend in the second line, where the line '4-middle' is mixed with '2-start'. 
-To avoid this use --linebuffer: +To avoid this use B<--linebuffer>: parallel -j2 --linebuffer 'printf "%s-start\n%s" {} {};sleep {};printf "%s\n" -middle;echo {}-end' ::: 4 2 1 @@ -872,7 +947,7 @@ Output: 4-middle 4-end -To force the output in the same order as the arguments use --keep-order/-k: +To force the output in the same order as the arguments use B<--keep-order>/B<-k>: parallel -j2 -k 'printf "%s-start\n%s" {} {};sleep {};printf "%s\n" -middle;echo {}-end' ::: 4 2 1 @@ -888,24 +963,25 @@ Output: 1-middle 1-end + =head2 Saving output into files -GNU Parallel can save the output of each job into files: +GNU B can save the output of each job into files: parallel --files echo ::: A B C -Output will be similar to: +Output will be similar to this: /tmp/pAh6uWuQCg.par /tmp/opjhZCzAX4.par /tmp/W0AT_Rph2o.par -By default GNU Parallel will cache the output in files in /tmp. This -can be changed by setting $TMPDIR or --tmpdir: +By default GNU B will cache the output in files in B. This +can be changed by setting B<$TMPDIR> or B<--tmpdir>: parallel --tmpdir /var/tmp --files echo ::: A B C -Output will be similar to: +Output will be similar to this: /var/tmp/N_vk7phQRc.par /var/tmp/7zA4Ccf3wZ.par @@ -917,7 +993,7 @@ Or: Output: Same as above. 
-The output files can be saved in a structured way using --results: +The output files can be saved in a structured way using B<--results>: parallel --results outdir echo ::: A B C @@ -927,45 +1003,54 @@ Output: B C -but also these files were generated containing the standard output -(stdout) and standard error (stderr): +These files were also generated containing the standard output +(stdout), standard error (stderr), and the sequence number (seq): + outdir/1/A/seq outdir/1/A/stderr outdir/1/A/stdout + outdir/1/B/seq outdir/1/B/stderr outdir/1/B/stdout + outdir/1/C/seq outdir/1/C/stderr outdir/1/C/stdout -This is useful if you are running multiple variables: +B<--header :> will take the first value as name and use that in the +directory structure. This is useful if you are using multiple input +sources: parallel --header : --results outdir echo ::: f1 A B ::: f2 C D Generated files: + outdir/f1/A/f2/C/seq outdir/f1/A/f2/C/stderr outdir/f1/A/f2/C/stdout + outdir/f1/A/f2/D/seq outdir/f1/A/f2/D/stderr outdir/f1/A/f2/D/stdout + outdir/f1/B/f2/C/seq outdir/f1/B/f2/C/stderr outdir/f1/B/f2/C/stdout + outdir/f1/B/f2/D/seq outdir/f1/B/f2/D/stderr outdir/f1/B/f2/D/stdout The directories are named after the variables and their values. -=head1 Control the execution +=head1 Controlling the execution =head2 Number of simultaneous jobs -The number of concurrent jobs is given with --jobs/-j: +The number of concurrent jobs is given with B<--jobs>/B<-j>: /usr/bin/time parallel -N0 -j64 sleep 1 :::: num128 -With 64 jobs in parallel the 128 sleeps will take 2-8 seconds to run - +With 64 jobs in parallel the 128 Bs will take 2-8 seconds to run - depending on how fast your machine is. -By default --jobs is the same as the number of CPU cores. So this: +By default B<--jobs> is the same as the number of CPU cores. 
So this: /usr/bin/time parallel -N0 sleep 1 :::: num128 @@ -973,13 +1058,13 @@ should take twice the time of running 2 jobs per CPU core: /usr/bin/time parallel -N0 --jobs 200% sleep 1 :::: num128 ---jobs 0 will run as many jobs in parallel as possible: +B<--jobs 0> will run as many jobs in parallel as possible: /usr/bin/time parallel -N0 --jobs 0 sleep 1 :::: num128 which should take 1-7 seconds depending on how fast your machine is. ---jobs can read from a file which is re-read when a job finishes: +B<--jobs> can read from a file which is re-read when a job finishes: echo 50% > my_jobs /usr/bin/time parallel -N0 --jobs my_jobs sleep 1 :::: num128 & @@ -987,12 +1072,12 @@ which should take 1-7 seconds depending on how fast your machine is. echo 0 > my_jobs wait -The first second only 50% of the CPU cores will run a job. The '0' is -put into my_jobs and then the rest of the jobs will be started in +The first second only 50% of the CPU cores will run a job. Then B<0> is +put into B and then the rest of the jobs will be started in parallel. Instead of basing the percentage on the number of CPU cores -GNU Parallel can base it on the number of CPUs: +GNU B can base it on the number of CPUs: parallel --use-cpus-instead-of-cores -N0 sleep 1 :::: num8 @@ -1000,7 +1085,7 @@ GNU Parallel can base it on the number of CPUs: If you have many jobs (e.g. by multiple combinations of input sources), it can be handy to shuffle the jobs, so you get different -values run. +values run. 
Use B<--shuf> for that: parallel --shuf echo ::: 1 2 3 ::: a b c ::: A B C @@ -1010,7 +1095,7 @@ Output: =head2 Interactivity -GNU Parallel can ask the user if a command should be run using --interactive: +GNU B can ask the user if a command should be run using B<--interactive>: parallel --interactive echo ::: 1 2 3 @@ -1022,8 +1107,8 @@ Output: echo 3 ?...y 3 -GNU Parallel can be used to put arguments on the command line for an -interactive command such as emacs to edit one file at a time: +GNU B can be used to put arguments on the command line for an +interactive command such as B to edit one file at a time: parallel --tty emacs ::: 1 2 3 @@ -1033,7 +1118,7 @@ Or give multiple argument in one go to open multiple files: =head2 A terminal for every job -Using tmux GNU Parallel can start a terminal for every job run: +Using B<--tmux> GNU B can start a terminal for every job run: seq 10 20 | parallel --tmux 'echo start {}; sleep {}; echo done {}' @@ -1041,15 +1126,15 @@ This will tell you to run something similar to: tmux -S /tmp/tmsrPrO0 attach -Using normal tmux keystrokes (CTRL-b n or CTRL-b p) you can cycle +Using normal B keystrokes (CTRL-b n or CTRL-b p) you can cycle between windows of the running jobs. When a job is finished it will pause for 10 seconds before closing the window. =head2 Timing Some jobs do heavy I/O when they start. To avoid a thundering herd GNU -Parallel can delay starting new jobs. --delay X will make sure there is -at least X seconds between each start: +B can delay starting new jobs. B<--delay> I will make +sure there is at least I seconds between each start: parallel --delay 2.5 echo Starting {}\;date ::: 1 2 3 @@ -1064,8 +1149,8 @@ Output: If jobs taking more than a certain amount of time are known to fail, -they can be stopped with --timeout. The accuracy of --timeout is 2 -seconds: +they can be stopped with B<--timeout>. 
The accuracy of B<--timeout> is +2 seconds: parallel --timeout 4.1 sleep {}\; echo {} ::: 2 4 6 8 @@ -1074,7 +1159,7 @@ Output: 2 4 -GNU Parallel can compute the median runtime for jobs and kill those +GNU B can compute the median runtime for jobs and kill those that take more than 200% of the median runtime: parallel --timeout 200% sleep {}\; echo {} ::: 2.1 2.2 3 7 2.3 @@ -1086,7 +1171,9 @@ Output: 3 2.3 -Based on the runtime of completed jobs GNU Parallel can estimate the +=head2 Progress information + +Based on the runtime of completed jobs GNU B can estimate the total runtime: parallel --eta sleep ::: 1 3 2 2 1 3 3 2 1 @@ -1099,9 +1186,7 @@ Output: Computer:jobs running/jobs completed/%of started jobs/Average seconds to complete ETA: 2s 0left 1.11avg local:0/9/100%/1.1s -=head2 Progress - -GNU Parallel can give progress information with --progress: +GNU B can give progress information with B<--progress>: parallel --progress sleep ::: 1 3 2 2 1 3 3 2 1 @@ -1113,15 +1198,15 @@ Output: Computer:jobs running/jobs completed/%of started jobs/Average seconds to complete local:0/9/100%/1.1s -A progress bar can be shown with --bar: +A progress bar can be shown with B<--bar>: parallel --bar sleep ::: 1 3 2 2 1 3 3 2 1 -And a graphic bar can be shown with --bar and zenity: +And a graphic bar can be shown with B<--bar> and B: seq 1000 | parallel -j10 --bar '(echo -n {};sleep 0.1)' 2> >(zenity --progress --auto-kill) -A logfile of the jobs completed so far can be generated with --joblog: +A logfile of the jobs completed so far can be generated with B<--joblog>: parallel --joblog /tmp/log exit ::: 1 2 3 0 cat /tmp/log @@ -1135,11 +1220,11 @@ Output: 4 : 1376577365.003 0.003 0 0 0 0 exit 0 The log contains the job sequence, which host the job was run on, the -start time and run time, how much data was transferred if the job was -run on a remote host, the exit value, the signal that killed the job, -and finally the command being run. 
+start time and run time, how much data was transferred, the exit +value, the signal that killed the job, and finally the command being +run. -With a joblog GNU Parallel can be stopped and later pickup where it +With a joblog GNU B can be stopped and later pickup where it left off. It it important that the input of the completed jobs is unchanged. @@ -1164,9 +1249,9 @@ Output: 5 : 1376580070.028 0.009 0 0 0 0 exit 0 6 : 1376580070.038 0.007 0 0 0 0 exit 0 -Note how the start time of the last 2 jobs is clearly from the second run. +Note how the start time of the last 2 jobs is clearly different from the second run. -With --resume-failed GNU Parallel will re-run the jobs that failed: +With B<--resume-failed> GNU B will re-run the jobs that failed: parallel --resume-failed --joblog /tmp/log exit ::: 1 2 3 0 0 0 cat /tmp/log @@ -1184,13 +1269,39 @@ Output: 2 : 1376580154.444 0.022 0 0 2 0 exit 2 3 : 1376580154.466 0.005 0 0 3 0 exit 3 -Note how seq 1 2 3 have been repeated because they had exit value != 0. +Note how seq 1 2 3 have been repeated because they had exit value +different from 0. + +B<--retry-failed> does almost the same as B<--resume-failed>. Where +B<--resume-failed> reads the commands from the command line (and +ignores the commands in the joblog), B<--retry-failed> ignores the +command line and reruns the commands mentioned in the joblog. 
parallel --retry-failed --joblog /tmp/log
This will finish as soon as the first job succeeds: - parallel -j2 --halt soon,success=1 echo {}\; exit {} ::: 1 2 3 0 4 5 6 + parallel -j2 --halt now,success=1 echo {}\; exit {} ::: 1 2 3 0 4 5 6 Output: - + 1 2 3 0 parallel: This job succeeded: echo 0; exit 0 - parallel: Starting no more jobs. Waiting for 1 jobs to finish. - 4 -GNU Parallel can retry the command with --retries. This is useful if a +GNU B can retry the command with B<--retries>. This is useful if a command fails for unknown reasons now and then. parallel -k --retries 3 'echo tried {} >>/tmp/runs; echo completed {}; exit {}' ::: 1 2 0 @@ -1273,9 +1383,47 @@ Output: Note how job 1 and 2 were tried 3 times, but 0 was not retried because it had exit code 0. +=head3 Termination signals (advanced) + +Using B<--termseq> you can control which signals are sent when killing +children. Normally children will be killed by sending them B, +waiting 200 ms, then another B, waiting 100 ms, then another +B, waiting 50 ms, then a B, finally waiting 25 ms +before giving up. It looks like this: + + show_signals() { + perl -e 'for(keys %SIG) { $SIG{$_} = eval "sub { print \"Got $_\\n\"; }";} while(1){sleep 1}' + } + export -f show_signals + echo | parallel --termseq TERM,200,TERM,100,TERM,50,KILL,25 -u --timeout 1 show_signals + +Output: + + Got TERM + Got TERM + Got TERM + +Or just: + + echo | parallel -u --timeout 1 show_signals + +Output: Same as above. + +You can change this to B, B, B: + + echo | parallel --termseq INT,200,TERM,100,KILL,25 -u --timeout 1 show_signals + +Output: + + Got INT + Got TERM + +The B does not show because it cannot be caught, and thus the child dies. 
+ + =head2 Limiting the resources -To avoid overloading systems GNU Parallel can look at the system load +To avoid overloading systems GNU B can look at the system load before starting another job: parallel --load 100% echo load is less than {} job per cpu ::: 1 @@ -1285,7 +1433,7 @@ Output: [when then load is less than the number of cpu cores] load is less than 1 job per cpu -GNU Parallel can also check if the system is swapping. +GNU B can also check if the system is swapping. parallel --noswap echo the system is not swapping ::: now @@ -1294,7 +1442,15 @@ Output: [when then system is not swapping] the system is not swapping now -GNU Parallel can run the jobs with a nice value. This will work both +Some jobs need a lot of memory, and should only be started when there +is enough memory free. Using B<--memfree> GNU B can check if +there is enough memory free. Additionally, GNU B will kill +off the youngest job if the memory free falls below 50% of the +size. The killed job will put back on the queue and retried later. + + parallel --memfree 1G echo will run if more than 1 GB is ::: free + +GNU B can run the jobs with a nice value. This will work both locally and remotely. parallel --nice 17 echo this is being run with nice -n ::: 17 @@ -1305,12 +1461,12 @@ Output: =head1 Remote execution -GNU Parallel can run jobs on remote servers. It uses ssh to +GNU B can run jobs on remote servers. It uses B to communicate with the remote machines. 
=head2 Sshlogin -The most basic sshlogin is -S host: +The most basic sshlogin is B<-S> I: parallel -S $SERVER1 echo running on ::: $SERVER1 @@ -1318,7 +1474,7 @@ Output: running on [$SERVER1] -To use a different username prepend the server with username@ +To use a different username prepend the server with I: parallel -S username@$SERVER1 echo running on ::: username@$SERVER1 @@ -1326,7 +1482,7 @@ Output: running on [username@$SERVER1] -The special sshlogin ':' is the local machine: +The special sshlogin B<:> is the local machine: parallel -S : echo running on ::: the_local_machine @@ -1334,7 +1490,7 @@ Output: running on the_local_machine -If ssh is not in $PATH it can be prepended to $SERVER1: +If B is not in $PATH it can be prepended to $SERVER1: parallel -S '/usr/bin/ssh '$SERVER1 echo custom ::: ssh @@ -1342,7 +1498,16 @@ Output: custom ssh -Several servers can be given using multiple -S: +The B command can also be given using B<--ssh>: + + parallel --ssh /usr/bin/ssh -S $SERVER1 echo custom ::: ssh + +or by setting B<$PARALLEL_SSH>: + + export PARALLEL_SSH=/usr/bin/ssh + parallel -S $SERVER1 echo custom ::: ssh + +Several servers can be given using multiple B<-S>: parallel -S $SERVER1 -S $SERVER2 echo ::: running on more hosts @@ -1353,7 +1518,7 @@ Output (the order may be different): more hosts -Or they can be separated by ,: +Or they can be separated by B<,>: parallel -S $SERVER1,$SERVER2 echo ::: running on more hosts @@ -1365,7 +1530,7 @@ Or newline: SERVERS="`echo $SERVER1; echo $SERVER2`" parallel -S "$SERVERS" echo ::: running on more hosts -The can also be read from a file (replace user@ with the user on $SERVER2): +They can also be read from a file (replace I with the user on B<$SERVER2>): echo $SERVER1 > nodefile # Force 4 cores, special ssh-command, username @@ -1374,10 +1539,13 @@ The can also be read from a file (replace user@ with the user on $SERVER2): Output: Same as above. -The special --sshloginfile '..' reads from ~/.parallel/sshloginfile. 
+Every time a job finished, the B<--sshloginfile> will be re-read, so +it is possible to both add and remove hosts while running. -To force GNU Parallel to treat a server having a given number of CPU -cores prepend #/ to the sshlogin: +The special B<--sshloginfile ..> reads from B<~/.parallel/sshloginfile>. + +To force GNU B to treat a server having a given number of CPU +cores prepend the number of core followed by B to the sshlogin: parallel -S 4/$SERVER1 echo force {} cpus on server ::: 4 @@ -1385,22 +1553,24 @@ Output: force 4 cpus on server -Servers can be put into groups by prepending '@groupname' to the -server and the group can then be selected by appending '@groupname' to -the argument if using '--hostgroup'. +Servers can be put into groups by prepending I<@groupname> to the +server and the group can then be selected by appending I<@groupname> to +the argument if using B<--hostgroup>: - parallel --hostgroup -S @grp1/$SERVER1 -S @grp2/$SERVER2 echo {} ::: run_on_grp1@grp1 run_on_grp2@grp2 + parallel --hostgroup -S @grp1/$SERVER1 -S @grp2/$SERVER2 echo {} ::: \ + run_on_grp1@grp1 run_on_grp2@grp2 Output: run_on_grp1 run_on_grp2 -A host can be in multiple groups by separating groups with '+', and +A host can be in multiple groups by separating the groups with B<+>, and you can force GNU B to limit the groups on which the command -can be run with '-S @groupname': +can be run with B<-S> I<@groupname>: - parallel -S @grp1 -S @grp1+grp2/$SERVER1 -S @grp2/SERVER2 echo {} ::: run_on_grp1 also_grp1 + parallel -S @grp1 -S @grp1+grp2/$SERVER1 -S @grp2/SERVER2 echo {} ::: \ + run_on_grp1 also_grp1 Output: @@ -1409,34 +1579,34 @@ Output: =head2 Transferring files -GNU Parallel can transfer the files to be processed to the remote +GNU B can transfer the files to be processed to the remote host. It does that using rsync. 
echo This is input_file > input_file - parallel -S $SERVER1 --transfer cat ::: input_file + parallel -S $SERVER1 --transferfile {} cat ::: input_file Output: This is input_file -If the files is processed into another file, the resulting file can be +If the files are processed into another file, the resulting file can be transferred back: echo This is input_file > input_file - parallel -S $SERVER1 --transfer --return {}.out cat {} ">"{}.out ::: input_file + parallel -S $SERVER1 --transferfile {} --return {}.out cat {} ">"{}.out ::: input_file cat input_file.out Output: Same as above. -To remove the input and output file on the remote server use --cleanup: +To remove the input and output file on the remote server use B<--cleanup>: echo This is input_file > input_file - parallel -S $SERVER1 --transfer --return {}.out --cleanup cat {} ">"{}.out ::: input_file + parallel -S $SERVER1 --transferfile {} --return {}.out --cleanup cat {} ">"{}.out ::: input_file cat input_file.out Output: Same as above. -There is a short hand for --transfer --return --cleanup called --trc: +There is a shorthand for B<--transferfile {} --return --cleanup> called B<--trc>: echo This is input_file > input_file parallel -S $SERVER1 --trc {}.out cat {} ">"{}.out ::: input_file @@ -1444,8 +1614,8 @@ There is a short hand for --transfer --return --cleanup called --trc: Output: Same as above. -Some jobs need a common database for all jobs. GNU Parallel can -transfer that using --basefile which will transfer the file before the +Some jobs need a common database for all jobs. GNU B can +transfer that using B<--basefile> which will transfer the file before the first job: echo common data > common_file @@ -1456,24 +1626,24 @@ Output: common data foo -To remove it from the remote host after the last job use --cleanup. +To remove it from the remote host after the last job use B<--cleanup>. =head2 Working dir The default working dir on the remote machines is the login dir. 
This -can be changed with --workdir I. +can be changed with B<--workdir> I. -Files transferred using --transfer and --return will be relative +Files transferred using B<--transferfile> and B<--return> will be relative to I on remote computers, and the command will be executed in the dir I. -The special I value ... will create working dirs under -~/.parallel/tmp/ on the remote computers. If --cleanup is given +The special I value B<...> will create working dirs under +B<~/.parallel/tmp> on the remote computers. If B<--cleanup> is given these dirs will be removed. -The special I value . uses the current working dir. If the -current working dir is beneath your home dir, the value . is +The special I value B<.> uses the current working dir. If the +current working dir is beneath your home dir, the value B<.> is treated as the relative path to your home dir. This means that if your home dir is different on remote computers (e.g. if your login is different) the relative path will still be relative to your home dir. @@ -1491,8 +1661,8 @@ Output: =head2 Avoid overloading sshd -If many jobs are started on the same server, sshd can be -overloaded. GNU Parallel can insert a delay between each job run on +If many jobs are started on the same server, B can be +overloaded. GNU B can insert a delay between each job run on the same server: parallel -S $SERVER1 --sshdelay 0.2 echo ::: 1 2 3 @@ -1503,7 +1673,7 @@ Output (the order may be different): 2 3 -Sshd will be less overloaded if using --controlmaster, which will +B will be less overloaded if using B<--controlmaster>, which will multiplex ssh connections: parallel --controlmaster -S $SERVER1 echo ::: 1 2 3 @@ -1512,7 +1682,7 @@ Output: Same as above. =head2 Ignore hosts that are down -In clusters with many hosts a few of the are often down. GNU Parallel +In clusters with many hosts a few of them are often down. GNU B can ignore those hosts. 
In this case the host 173.194.32.46 is down: parallel --filter-hosts -S 173.194.32.46,$SERVER1 echo ::: bar @@ -1523,7 +1693,7 @@ Output: =head2 Running the same commands on all hosts -GNU Parallel can run the same command on all the hosts: +GNU B can run the same command on all the hosts: parallel --onall -S $SERVER1,$SERVER2 echo ::: foo bar @@ -1535,7 +1705,7 @@ Output (the order may be different): bar Often you will just want to run a single command on all hosts with out -arguments. --nonall is a no argument --onall: +arguments. B<--nonall> is a no argument B<--onall>: parallel --nonall -S $SERVER1,$SERVER2 echo foo bar @@ -1544,7 +1714,7 @@ Output: foo bar foo bar -When --tag is used with --nonall and --onall the --tagstring is the host: +When B<--tag> is used with B<--nonall> and B<--onall> the B<--tagstring> is the host: parallel --nonall --tag -S $SERVER1,$SERVER2 echo foo bar @@ -1553,11 +1723,11 @@ Output (the order may be different): $SERVER1 foo bar $SERVER2 foo bar ---jobs sets the number of servers to log in to in parallel. +B<--jobs> sets the number of servers to log in to in parallel. -=head2 Transfer environment variables and functions +=head2 Transferring environment variables and functions -Using --env GNU Parallel can transfer an environment variable to the +Using B<--env> GNU B can transfer an environment variable to the remote system. MYVAR='foo bar' @@ -1568,7 +1738,7 @@ Output: foo bar baz -This works for functions too if your shell is Bash: +This works for functions, too, if your shell is Bash: # This only works in Bash my_func() { @@ -1581,9 +1751,9 @@ Output: in my_func baz -GNU Parallel can copy all defined variables and functions to the +GNU B can copy all defined variables and functions to the remote system. It just needs to record which ones to ignore in -~/.parallel/ignored_vars. Do that by running this once: +B<~/.parallel/ignored_vars>. 
Do that by running this once: parallel --record-env cat ~/.parallel/ignored_vars @@ -1593,7 +1763,7 @@ Output: [list of variables to ignore - including $PATH and $HOME] Now all new variables and functions defined will be copied when using ---env _: +B<--env _>: # The function is only copied if using Bash my_func2() { @@ -1612,24 +1782,28 @@ Output: =head2 Showing what is actually run ---verbose will show the command that would be run on the local -machine. When a job is run on a remote machine this is wrapped with -ssh and possibly transferring files and environment variables, setting -the workdir, and setting --nice value. -vv shows all of this. +B<--verbose> will show the command that would be run on the local +machine. When a job is run on a remote machine, this is wrapped with +B and possibly transferring files and environment variables, setting +the workdir, and setting B<--nice> value. B<-vv> shows all of this. parallel -vv -S $SERVER1 echo ::: bar Output: - - ssh lo exec perl\ -e\ \\\$ENV\\\{\\\"PARALLEL_PID\\\"\\\}=\\\"2554030\\\"\\\;\ - \\$ENV\\\{\\\"PARALLEL_SEQ\\\"\\\}=\\\"1\\\"\\\;\\\$bashfunc\\\ =\\\ \\\"\\\"\ - \\;@ARGV=\\\"echo\\\ bar\\\"\\\;\\\$SIG\\\{CHLD\\\}=sub\\\{\\\$done=1\\\;\\\}\ - \\;\\\$pid=fork\\\;unless\\\(\\\$pid\\\)\\\{setpgrp\\\;exec\\\$ENV\\\{SHELL\\\ - },\\\"-c\\\",\\\(\\\$bashfunc.\\\"@ARGV\\\"\\\)\\\;die\\\"exec:\\\$\\\!\\\\n\\ - \"\\\;\\\}do\\\{\\\$s=\\\$s\\\<1\\\?0.001+\\\$s\\\*1.03:\\\$s\\\;select\\\( - undef,undef,undef,\\\$s\\\)\\\;\\\}until\\\(\\\$done\\\|\\\|getppid==1\\\)\\\; - kill\\\(SIGHUP,-\\\$\\\{pid\\\}\\\)unless\\\$done\\\;wait\\\;exit\\\(\\\$\\\?\ - \\&127\\\?128+\\\(\\\$\\\?\\\&127\\\):1+\\\$\\\?\\\>\\\>8\\\); + + ssh lo -- exec perl -e \''@GNU_Parallel=("use","IPC::Open3;","use","MIME::Base64"); + eval"@GNU_Parallel";my$eval;$eval=decode_base64(join"",@ARGV);eval$eval;'\' + JEVOVnsiUEFSQUxMRUxfUElEIn09IjI3MzQiOyRFTlZ7IlBBUkFMTEVMX1NFUSJ9PSIx + IjskYmFzaGZ1bmMgPSAiIjtAQVJHVj0iZWNobyBiYXIiOyRzaGVsbD0iJEVOVntTSEVM + 
TH0iOyR0bXBkaXI9Ii90bXAiOyRuaWNlPTA7ZG97JEVOVntQQVJBTExFTF9UTVB9PSR0 + bXBkaXIuIi9wYXIiLmpvaW4iIixtYXB7KDAuLjksImEiLi4ieiIsIkEiLi4iWiIpW3Jh + bmQoNjIpXX0oMS4uNSk7fXdoaWxlKC1lJEVOVntQQVJBTExFTF9UTVB9KTskU0lHe0NI + TER9PXN1YnskZG9uZT0xO307JHBpZD1mb3JrO3VubGVzcygkcGlkKXtzZXRwZ3JwO2V2 + YWx7c2V0cHJpb3JpdHkoMCwwLCRuaWNlKX07ZXhlYyRzaGVsbCwiLWMiLCgkYmFzaGZ1 + bmMuIkBBUkdWIik7ZGllImV4ZWM6JCFcbiI7fWRveyRzPSRzPDE/MC4wMDErJHMqMS4w + MzokcztzZWxlY3QodW5kZWYsdW5kZWYsdW5kZWYsJHMpO311bnRpbCgkZG9uZXx8Z2V0 + cHBpZD09MSk7a2lsbChTSUdIVVAsLSR7cGlkfSl1bmxlc3MkZG9uZTt3YWl0O2V4aXQo + JD8mMTI3PzEyOCsoJD8mMTI3KToxKyQ/Pj44KQ==; bar When the command gets more complex, the output is so hard to read, that it is only useful for debugging: @@ -1642,37 +1816,113 @@ When the command gets more complex, the output is so hard to read, that it is on Output will be similar to: - ( ssh lo mkdir -p ./.parallel/tmp/aspire-2554425-1;rsync --protocol 30 -rlDzR - -essh ./abc-file lo:./.parallel/tmp/aspire-2554425-1 );ssh lo exec perl -e \'' - @GNU_Parallel=("use","IPC::Open3;","use","MIME::Base64");eval"@GNU_Parallel"; - $SIG{CHLD}="IGNORE";my$zip=(grep{-x$_}"/usr/local/bin/bzip2")[0]||"bzip2";my( - $in,$out,$eval);open3($in,$out,">&STDERR",$zip,"-dc");if(my$perlpid=fork){ - close$in;$eval=join"",<$out>;close$out;}else{close$out;print$in(decode_base64( - join"",@ARGV));close$in;exit;}wait;eval$eval;'\' QlpoOTFBWSZTWayP388AAbdfgAAQd - X/+3//l/wS/7//vQAIq3U6bauIpk1NPUwnqGgND1NGI9TTQ0A0ADIDQNITU9NGqfonpPJRvU0ZQZAA - GhpoBoABpqaFNBMh+kGoybUaHogwCYBAADCSgRNqek1TxTeknqemhGyBqek8pk2jRPSeo002mQRo5f - oSZYrgzQFDd3HNWaskbx+MxNR89BdDzESFbADOJkI+QhIlnojHCWRVuGc2j2lzMzE41wC7auAMQ06c - S3AlqQfKcdo0gd506U0HzAAxMkGJBHjDCZULOMpVbowhIVxxaQz7yansTsBgurEZaGO/6K0Nc4iodr - BW4m9SXErqRbLNy5eANDvZ+TIt2c2GBcWSlmYuloxY5u2bGUdU/dGsO5EhyrvKCpZMhIgmQFAQhcwR - mD+jMKRawkRFJSGyTNC3PqWnE51ucPyx29Yxjnkyub98lytpyk+v8BUc4eA3xz98dMYjxvb0pgWksh - oHZ7HwGQRq1vuDyzKgkwPL9lwGIdL+WPNJFSljlVAahIhQpDCAOJpTqDhgmfoRQcy54PC9T0T3iMnV - 
JeTUdL8P0/s18NqDSUavMNV3qD0CtYi6entl0neNsOQN2VDSLHj0xOMls65LNPo+Wh28rJtVoh2JgE - 7Q9Qo/XBr6krGIsYpQR6nRDuJCD/5aaQBBFFQGtv2VoFTwkXiUTxFP1CC4AGBznAaMklgWQvVtKguJ - zQnPqr9ABtHwbB5GTzPOQ4iWAmrUxvl4j5wqrVchOZcs3NYUQmGO2+VYBimFVxhGcaxDALMZ6bWEUo - yt8eC8W5o1ObFtTnHAvjOQgYEL/nHTcxU0G57QMKCzJcASQWFNpe2CpQcgYlBxIN4kwtfxdyRThQkK - yP388;_EXIT_status=$?; mkdir -p ./.; rsync --protocol 30 --rsync-path=cd\ - ./.parallel/tmp/aspire-2554425-1/./.\;\ rsync -rlDzR -essh lo:./abc-file.out - ./.;ssh lo \(rm\ -f\ ./.parallel/tmp/aspire-2554425-1/abc-file\;\ sh\ -c\ \' - rmdir\ ./.parallel/tmp/aspire-2554425-1/\ ./.parallel/tmp/\ ./.parallel/\ 2\> - /dev/null\'\;rm\ -rf\ ./.parallel/tmp/aspire-2554425-1\;\);ssh lo \(rm\ -f\ - ./.parallel/tmp/aspire-2554425-1/abc-file.out\;\ sh\ -c\ \'rmdir\ ./.parallel - /tmp/aspire-2554425-1/\ ./.parallel/tmp/\ ./.parallel/\ 2\>/dev/null\'\;rm\ - -rf\ ./.parallel/tmp/aspire-2554425-1\;\);ssh lo rm -rf .parallel/tmp/ - aspire-2554425-1; exit $_EXIT_status; + ( ssh lo -- mkdir -p ./.parallel/tmp/hk-3492-1;rsync --protocol 30 + -rlDzR -essh ./abc-file lo:./.parallel/tmp/hk-3492-1 );ssh lo -- + exec perl -e \''@GNU_Parallel=("use","IPC::Open3;","use","MIME::Base64"); + eval"@GNU_Parallel";my$eval;$eval=decode_base64(join"",@ARGV);eval$eval;'\' + c3lzdGVtKCJta2RpciIsIi1wIiwiLS0iLCIucGFyYWxsZWwvdG1wL2hrLTM0OTItMSIp + OyBjaGRpciAiLnBhcmFsbGVsL3RtcC9oay0zNDkyLTEiIHx8cHJpbnQoU1RERVJSICJw + YXJhbGxlbDogQ2Fubm90IGNoZGlyIHRvIC5wYXJhbGxlbC90bXAvaGstMzQ5Mi0xXG4i + KSAmJiBleGl0IDI1NTskRU5WeyJHUEdfQUdFTlRfSU5GTyJ9PSIvdG1wL2dwZy10WjVI + U0QvUy5ncGctYWdlbnQ6MjM5NzoxIjskRU5WeyJQQVJBTExFTF9TRVEifT0iMSI7JEVO + VnsiU1FMSVRFVEJMIn09InNxbGl0ZTM6Ly8vJTJGdG1wJTJGcGFyYWxsZWwuZGIyL3Bh + cnNxbDIiOyRFTlZ7IlBBUkFMTEVMX1BJRCJ9PSIzNDkyIjskRU5WeyJTUUxJVEUifT0i + c3FsaXRlMzovLy8lMkZ0bXAlMkZwYXJhbGxlbC5kYjIiOyRFTlZ7IlBBUkFMTEVMX1BJ + RCJ9PSIzNDkyIjskRU5WeyJQQVJBTExFTF9TRVEifT0iMSI7QGJhc2hfZnVuY3Rpb25z + PXF3KG15X2Z1bmMzKTsgaWYoJEVOVnsiU0hFTEwifT1+L2NzaC8pIHsgcHJpbnQgU1RE + 
RVJSICJDU0gvVENTSCBETyBOT1QgU1VQUE9SVCBuZXdsaW5lcyBJTiBWQVJJQUJMRVMv + RlVOQ1RJT05TLiBVbnNldCBAYmFzaF9mdW5jdGlvbnNcbiI7IGV4ZWMgImZhbHNlIjsg + fSAKJGJhc2hmdW5jID0gIm15X2Z1bmMzKCkgeyAgZWNobyBpbiBteV9mdW5jIFwkMSA+ + IFwkMS5vdXQKfTtleHBvcnQgLWYgbXlfZnVuYzMgPi9kZXYvbnVsbDsiO0BBUkdWPSJt + eV9mdW5jMyBhYmMtZmlsZSI7JHNoZWxsPSIkRU5We1NIRUxM + fSI7JHRtcGRpcj0iL3RtcCI7JG5pY2U9MTc7ZG97JEVOVntQQVJBTExFTF9UTVB9PSR0 + bXBkaXIuIi9wYXIiLmpvaW4iIixtYXB7KDAuLjksImEiLi4ieiIsIkEiLi4iWiIpW3Jh + bmQoNjIpXX0oMS4uNSk7fXdoaWxlKC1lJEVOVntQQVJBTExFTF9UTVB9KTskU0lHe0NI + TER9PXN1YnskZG9uZT0xO307JHBpZD1mb3JrO3VubGVzcygkcGlkKXtzZXRwZ3JwO2V2 + YWx7c2V0cHJpb3JpdHkoMCwwLCRuaWNlKX07ZXhlYyRzaGVsbCwiLWMiLCgkYmFzaGZ1 + bmMuIkBBUkdWIik7ZGllImV4ZWM6JCFcbiI7fWRveyRzPSRzPDE/MC4wMDErJHMqMS4w + MzokcztzZWxlY3QodW5kZWYsdW5kZWYsdW5kZWYsJHMpO311bnRpbCgkZG9uZXx8Z2V0 + cHBpZD09MSk7a2lsbChTSUdIVVAsLSR7cGlkfSl1bmxlc3MkZG9uZTt3YWl0O2V4aXQo + JD8mMTI3PzEyOCsoJD8mMTI3KToxKyQ/Pj44KQ==;_EXIT_status=$?; + mkdir -p ./.; rsync --protocol 30 --rsync-path=cd\ + ./.parallel/tmp/hk-3492-1/./.\;\ rsync -rlDzR -essh + lo:./abc-file.out ./.;ssh lo -- \(rm\ -f\ + ./.parallel/tmp/hk-3492-1/abc-file\;\ sh\ -c\ \'rmdir\ + ./.parallel/tmp/hk-3492-1/\ ./.parallel/tmp/\ ./.parallel/\ + 2\>/dev/null\'\;rm\ -rf\ ./.parallel/tmp/hk-3492-1\;\);ssh lo -- + \(rm\ -f\ ./.parallel/tmp/hk-3492-1/abc-file.out\;\ sh\ -c\ \'rmdir\ + ./.parallel/tmp/hk-3492-1/\ ./.parallel/tmp/\ ./.parallel/\ + 2\>/dev/null\'\;rm\ -rf\ ./.parallel/tmp/hk-3492-1\;\);ssh lo -- rm + -rf .parallel/tmp/hk-3492-1; exit $_EXIT_status; + +=head1 Saving to an SQL base (advanced) + +GNU B can save into an SQL base. Point GNU B to a +table and it will put the joblog there together with the variables and +the outout each in their own column. + +GNU B uses a DBURL to address the table. 
A DBURL has this format: + + vendor://[[user][:password]@][host][:port]/[database[/table] + +Example: + + mysql://scott:tiger@my.example.com/mydatabase/mytable + postgresql://scott:tiger@pg.example.com/mydatabase/mytable + sqlite3:///%2Ftmp%2Fmydatabase/mytable + +To refer to B with B you need to encode the B as B<%2F>. + +Run a job using B on B in B: + + DBURL=sqlite3:///%2Ftmp%2Fmydatabase + DBURLTABLE=$DBURL/mytable + parallel --sqlandworker $DBURLTABLE echo ::: foo bar ::: baz quuz + +To see the result: + + sql $DBURL 'SELECT * FROM mytable ORDER BY Seq;' + +Output will be similar to: + + Seq|Host|Starttime|JobRuntime|Send|Receive|Exitval|_Signal|Command|V1|V2|Stdout|Stderr + 1|:|1451619638.903|0.806||8|0|0|echo foo baz|foo|baz|foo baz + | + 2|:|1451619639.265|1.54||9|0|0|echo foo quuz|foo|quuz|foo quuz + | + 3|:|1451619640.378|1.43||8|0|0|echo bar baz|bar|baz|bar baz + | + 4|:|1451619641.473|0.958||9|0|0|echo bar quuz|bar|quuz|bar quuz + | + +The first columns are well known from B<--joblog>. B and B are +data from the input sources. B and B are standard +output and standard error, respectively. + +=head2 Using multiple workers + +Using an SQL base as storage costs a lot of performance. + +One of the situations where it makes sense is if you have multiple +workers. + +You can then have a single master machine that submits jobs to the SQL +base (but does not do any of the work): + + parallel --sql $DBURLTABLE echo ::: foo bar ::: baz quuz + +On the worker machines you run exactly the same command except you +replace B<--sql> with B<--sqlworker>. + + parallel --sqlworker $DBURLTABLE echo ::: foo bar ::: baz quuz + +To run a master and a worker on the same machine use B<--sqlandworker> +as shown earlier. 
+ =head1 --pipe -The --pipe functionality puts GNU Parallel in a different mode: +The B<--pipe> functionality puts GNU B in a different mode: Instead of treating the data on stdin (standard input) as arguments for a command to run, the data will be sent to stdin (standard input) of the command. @@ -1685,7 +1935,7 @@ where command_B is slow, and you want to speed up command_B. =head2 Chunk size -By default GNU Parallel will start an instance of command_B, read a +By default GNU B will start an instance of command_B, read a chunk of 1 MB, and pass that to the instance. Then start another instance, read another chunk, and pass that to the second instance. @@ -1701,9 +1951,9 @@ Output (the order may be different): 149796 149796 1048572 85349 85349 597444 -The size of the chunk is not exactly 1 MB because GNU Parallel only +The size of the chunk is not exactly 1 MB because GNU B only passes full lines - never half a line, thus the blocksize is only -average 1 MB. You can change the block size to 2 MB with --block: +average 1 MB. You can change the block size to 2 MB with B<--block>: cat num1000000 | parallel --pipe --block 2M wc @@ -1714,12 +1964,12 @@ Output (the order may be different): 299593 299593 2097151 85349 85349 597444 -GNU Parallel treats each line as a record. If the order of record is +GNU B treats each line as a record. If the order of record is unimportant (e.g. you need all lines processed, but you do not care -which is processed first), then you can use --round-robin. Without ---round-robin GNU Parallel will start a command per block; with ---round-robin only the requested number of jobs will be started -(--jobs). The records will then be distributed between the running +which is processed first), then you can use B<--round-robin>. Without +B<--round-robin> GNU B will start a command per block; with +B<--round-robin> only the requested number of jobs will be started +(B<--jobs>). 
The records will then be distributed between the running jobs: cat num1000000 | parallel --pipe -j4 --round-robin wc @@ -1736,10 +1986,10 @@ records each, and one instance got 1 full and 1 partial record. =head2 Records -GNU Parallel sees the input as records. The default record is a single +GNU B sees the input as records. The default record is a single line. -Using -N140000 GNU Parallel will read 140000 records at a time: +Using B<-N140000> GNU B will read 140000 records at a time: cat num1000000 | parallel --pipe -N140000 wc @@ -1757,7 +2007,7 @@ Output (the order may be different): Notice that the last job could not get the full 140000 lines, but only 20000 lines. -If a record is 75 lines -L can be used: +If a record is 75 lines B<-L> can be used: cat num1000000 | parallel --pipe -L75 wc @@ -1772,23 +2022,23 @@ Output (the order may be different): 85350 85350 597450 25 25 176 -Notice GNU Parallel still reads a block of around 1 MB; but instead of -passing full lines to 'wc' it passes full 75 lines at a time. This +Notice GNU B still reads a block of around 1 MB; but instead of +passing full lines to B it passes full 75 lines at a time. This of course does not hold for the last job (which in this case got 25 lines). =head2 Record separators -GNU Parallel uses separators to determine where two records split. +GNU B uses separators to determine where two records split. ---recstart gives the string that starts a record; --recend gives the -string that ends a record. The default is --recend '\n' (newline). +B<--recstart> gives the string that starts a record; B<--recend> gives the +string that ends a record. The default is B<--recend '\n'> (newline). -If both --recend and --recstart are given, then the record will only +If both B<--recend> and B<--recstart> are given, then the record will only split if the recend string is immediately followed by the recstart string. 
-Here the --recend is set to ', ': +Here the B<--recend> is set to B<', '>: echo /foo, bar/, /baz, qux/, | parallel -kN1 --recend ', ' --pipe echo JOB{#}\;cat\;echo END @@ -1804,9 +2054,9 @@ Output: qux/, END -Here the --recstart is set to '/': +Here the B<--recstart> is set to B: - echo /foo, bar/, /baz, qux/, | parallel -kN1 --recstart '/' --pipe echo JOB{#}\;cat\;echo END + echo /foo, bar/, /baz, qux/, | parallel -kN1 --recstart / --pipe echo JOB{#}\;cat\;echo END Output: @@ -1820,9 +2070,9 @@ Output: /, END -Here both --recend and --recstart are set: +Here both B<--recend> and B<--recstart> are set: - echo /foo, bar/, /baz, qux/, | parallel -kN1 --recend ', ' --recstart '/' --pipe echo JOB{#}\;cat\;echo END + echo /foo, bar/, /baz, qux/, | parallel -kN1 --recend ', ' --recstart / --pipe echo JOB{#}\;cat\;echo END Output: @@ -1834,9 +2084,9 @@ Output: Note the difference between setting one string and setting both strings. -With --regexp the --recend and --recstart will be treated as a regular expression: +With B<--regexp> the B<--recend> and B<--recstart> will be treated as a regular expression: - echo foo,bar,_baz,__qux, | parallel -kN1 --regexp --recend ',_+' --pipe echo JOB{#}\;cat\;echo END + echo foo,bar,_baz,__qux, | parallel -kN1 --regexp --recend ,_+ --pipe echo JOB{#}\;cat\;echo END Output: @@ -1848,9 +2098,9 @@ Output: qux, END -GNU Parallel can remove the record separators with --remove-rec-sep/--rrs: +GNU B can remove the record separators with B<--remove-rec-sep>/B<--rrs>: - echo foo,bar,_baz,__qux, | parallel -kN1 --rrs --regexp --recend ',_+' --pipe echo JOB{#}\;cat\;echo END + echo foo,bar,_baz,__qux, | parallel -kN1 --rrs --regexp --recend ,_+ --pipe echo JOB{#}\;cat\;echo END Output: @@ -1865,7 +2115,8 @@ Output: =head2 Header If the input data has a header, the header can be repeated for each -job by matching the header with --header. If headers start with %: +job by matching the header with B<--header>. 
If headers start with +B<%> you can do this: cat num_%header | parallel --header '(%.*\n)*' --pipe -N3 echo JOB{#}\;cat @@ -1894,7 +2145,7 @@ Output (the order may be different): %head2 10 -If the header is 2 lines, --header 2 will work: +If the header is 2 lines, B<--header> 2 will work: cat num_%header | parallel --header 2 --pipe -N3 echo JOB{#}\;cat @@ -1902,10 +2153,10 @@ Output: Same as above. =head2 --pipepart ---pipe is not very efficient. It maxes out at around 500 -MB/s. --pipepart can easily deliver 5 GB/s. But there are a few +B<--pipe> is not very efficient. It maxes out at around 500 +MB/s. B<--pipepart> can easily deliver 5 GB/s. But there are a few limitations. The input has to be a normal file (not a pipe) given by --a or :::: and -L/-l/-N do not work. +B<-a> or B<::::> and B<-L>/B<-l>/B<-N> do not work. parallel --pipepart -a num1000000 --block 3m wc @@ -1920,18 +2171,18 @@ Output (the order may be different): =head2 Input data and parallel command in the same file -GNU Parallel is often called as: +GNU B is often called as this: cat input_file | parallel command -With --shebang the input_file and parallel can be combined into the same script. +With B<--shebang> the I and B can be combined into the same script. -UNIX-scripts start with a shebang line like: +UNIX-scripts start with a shebang line like this: #!/bin/bash -GNU Parallel can do that, too. With --shebang the arguments can be -listed in the file. The parallel command is the first line of the +GNU B can do that, too. With B<--shebang> the arguments can be +listed in the file. 
The B command is the first line of the script: #!/usr/bin/parallel --shebang -r echo @@ -1948,19 +2199,19 @@ Output (the order may be different): =head2 Parallelizing existing scripts -GNU Parallel is often called as: +GNU B is often called as: cat input_file | parallel command parallel command ::: foo bar -If command is a script parallel can be combined into a single file so: +If command is a script B can be combined into a single file so: cat input_file | command command foo bar -will run the script in parallel. +will run the script in B. -This perl script perl_echo works like echo: +This B script B works like B: #!/usr/bin/perl @@ -1970,7 +2221,7 @@ It can be called as: parallel perl_echo ::: foo bar -By changing the #!-line it can be run in parallel +By changing the B<#!>-line it can be run in parallel: #!/usr/bin/parallel --shebang-wrap /usr/bin/perl @@ -1993,55 +2244,106 @@ This technique can be used for: #!/usr/bin/parallel --shebang-wrap /usr/bin/perl +print "Arguments @ARGV\n"; + + =item Python: #!/usr/bin/parallel --shebang-wrap /usr/bin/python +import sys + +print 'Arguments', str(sys.argv) + + =item Bash: #!/usr/bin/parallel --shebang-wrap /bin/bash +echo Arguments "$@" + + =item R: #!/usr/bin/parallel --shebang-wrap /usr/bin/Rscript --vanilla --slave +args <- commandArgs(trailingOnly = TRUE) +print(paste("Arguments ",args)) + + =item GNUplot: #!/usr/bin/parallel --shebang-wrap ARG={} /usr/bin/gnuplot +print "Arguments ", system('echo $ARG') + + =item Ruby: #!/usr/bin/parallel --shebang-wrap /usr/bin/ruby +print "Arguments " +puts ARGV + + +=item Octave: + +#!/usr/bin/parallel --shebang-wrap /usr/bin/octave + +printf ("Arguments"); +arg_list = argv (); +for i = 1:nargin + printf (" %s", arg_list{i}); +endfor +printf ("\n"); + +=item Common LISP: + +#!/usr/bin/parallel --shebang-wrap /usr/bin/clisp + +(format t "~&~S~&" 'Arguments) +(format t "~&~S~&" *args*) + +LUA +PHP +Javascript +nodejs +Tcl +C#? 
+ + =back =head1 Semaphore -GNU Parallel can work as a counting semaphore. This is slower and less +GNU B can work as a counting semaphore. This is slower and less efficient than its normal mode. A counting semaphore is like a row of toilets. People needing a toilet can use any toilet, but if there are more people than toilets, they will have to wait for one of the toilets to be available. -An alias for 'parallel --semaphore' is 'sem'. +An alias for B is B. -'sem' will follow a person to the toilets, wait until a toilet is +B will follow a person to the toilets, wait until a toilet is available, leave the person in the toilet and exit. -'sem --fg' will follow a person to the toilets, wait until a toilet is +B will follow a person to the toilets, wait until a toilet is available, stay with the person in the toilet and exit when the person exits. -'sem --wait' will wait for all persons to leave the toilets. +B will wait for all persons to leave the toilets. -'sem' does not have a queue discipline, so the next person is chosen +B does not have a queue discipline, so the next person is chosen randomly. --j sets the number of toilets. The default is to have only one toilet -(technically this is called a mutex). The program is started in the -background and 'sem' exits immediately. Use --wait to wait for all -'sem's to finish: +B<-j> sets the number of toilets. + +=head2 Mutex + +The default is to have only one toilet (this is called a mutex). The +program is started in the background and B exits immediately. 
Use +B<--wait> to wait for all Bs to finish: sem 'sleep 1; echo The first finished' && echo The first is now running in the background && @@ -2056,7 +2358,7 @@ Output: The second is now running in the background The second finished -The command can be run in the foreground with --fg, which will only +The command can be run in the foreground with B<--fg>, which will only exit when the command completes: sem --fg 'sleep 1; echo The first finished' && @@ -2066,11 +2368,11 @@ exit when the command completes: sem --wait The difference between this and just running the command, is that a -mutex is set, so if other sems were running in the background only one -would run at the same time. +mutex is set, so if other Bs were running in the background only one +would run at a time. To tell the difference between which semaphore is used, use ---semaphorename/--id. Run this in one terminal: +B<--semaphorename>/B<--id>. Run this in one terminal: sem --id my_id -u 'echo First started; sleep 10; echo The first finished' @@ -2087,8 +2389,8 @@ else will have to wait. A counting semaphore is like having multiple toilets: Several people can use the toilets, but when they all are in use, everyone else will have to wait. -sem can emulate a counting semaphore. Use --jobs to set the number of -toilets: +B can emulate a counting semaphore. Use B<--jobs> to set the number of +toilets like this: sem --jobs 3 --id my_id -u 'echo First started; sleep 5; echo The first finished' && sem --jobs 3 --id my_id -u 'echo Second started; sleep 6; echo The second finished' && @@ -2109,7 +2411,7 @@ Output: =head2 Timeout -With --semaphoretimeout you can force running the command anyway after +With B<--semaphoretimeout> you can force running the command anyway after a period (postive number) or give up (negative number): sem --id foo -u 'echo Slow started; sleep 5; echo Slow ended' && @@ -2129,10 +2431,10 @@ Note how the 'Give up' was not run. 
=head1 Informational -GNU Parallel has some options to give short information about the +GNU B has some options to give short information about the configuration. ---help will print a summary of the most important options: +B<--help> will print a summary of the most important options: parallel --help @@ -2167,7 +2469,7 @@ Output: O. Tange (2011): GNU Parallel - The Command-Line Power Tool, ;login: The USENIX Magazine, February 2011:42-47. -When asking for help, always report the full output of: + When asking for help, always report the full output of this: parallel --version @@ -2186,7 +2488,7 @@ Output: O. Tange (2011): GNU Parallel - The Command-Line Power Tool, ;login: The USENIX Magazine, February 2011:42-47. -In scripts --minversion can be used to ensure the user has at least +In scripts B<--minversion> can be used to ensure the user has at least this version: parallel --minversion 20130722 && echo Your version is at least 20130722. @@ -2196,8 +2498,8 @@ Output: 20130722 Your version is at least 20130722. -If using GNU Parallel for research the BibTeX citation can be -generated using --bibtex. +If using GNU B for research the BibTeX citation can be +generated using B<--bibtex>: parallel --bibtex @@ -2216,7 +2518,7 @@ Output: pages = {42-47} } -With --max-line-length-allowed GNU Parallel will report the maximal +With B<--max-line-length-allowed> GNU B will report the maximal size of the command line: parallel --max-line-length-allowed @@ -2225,7 +2527,7 @@ Output (may vary on different systems): 131071 ---number-of-cpus and --number-of-cores run system specific code to +B<--number-of-cpus> and B<--number-of-cores> run system specific code to determine the number of CPUs and CPU cores on the system. On unsupported platforms they will return 1: @@ -2239,11 +2541,11 @@ Output (may vary on different systems): =head1 Profiles -The defaults for GNU Parallel can be changed systemwise by putting the -command line options in /etc/parallel/config. 
They can be changed for -a user by putting them in ~/.parallel/config. +The defaults for GNU B can be changed systemwide by putting the +command line options in B. They can be changed for +a user by putting them in B<~/.parallel/config>. -Profiles work the same way, but have to be referred to with --profile: +Profiles work the same way, but have to be referred to with B<--profile>: echo '--nice 17' > ~/.parallel/nicetimeout echo '--timeout 300%' >> ~/.parallel/nicetimeout @@ -2271,7 +2573,7 @@ Output: I hope you have learned something from this tutorial. -If you like GNU Parallel: +If you like GNU B: =over 2 @@ -2293,6 +2595,7 @@ mailing lists =item * Request or write a review for your favourite blog or magazine +(especially if you do something cool with GNU B) =item * @@ -2300,17 +2603,17 @@ Invite me for your next conference =back -If you use GNU Parallel for research: +If you use GNU B for research: =over 2 =item * -Please cite GNU Parallel in you publications (use --bibtex) +Please cite GNU B in you publications (use B<--bibtex>) =back -If GNU Parallel saves you money: +If GNU B saves you money: =over 2 @@ -2321,7 +2624,7 @@ https://my.fsf.org/donate/ =back -(C) 2013,2014,2015 Ole Tange, GPLv3 +(C) 2013,2014,2015,2016 Ole Tange, GPLv3 =cut diff --git a/src/sql b/src/sql index 46f1f53e..acbd2db4 100755 --- a/src/sql +++ b/src/sql @@ -566,7 +566,7 @@ $Global::Initfile && unlink $Global::Initfile; exit ($err); sub parse_options { - $Global::version = 20151222; + $Global::version = 20160101; $Global::progname = 'sql'; # This must be done first as this may exec myself diff --git a/testsuite/tests-to-run/parallel-local-sql.sh b/testsuite/tests-to-run/parallel-local-sql.sh new file mode 100644 index 00000000..9f4a9a78 --- /dev/null +++ b/testsuite/tests-to-run/parallel-local-sql.sh @@ -0,0 +1,75 @@ +#!/bin/bash + +export SQLITE=sqlite3:///%2Frun%2Fshm%2Fparallel.db +export SQLITETBL=$SQLITE/parsql +export PG=pg://tange:tange@lo/tange +export PGTBL=$PG/parsql +export 
MYSQL=mysql://tange:tange@lo/tange +export MYSQLTBL=$MYSQL/parsql +export PGTBL2=${PGTBL}2 +export PGTBL3=${PGTBL}3 +export PGTBL4=${PGTBL}4 +export PGTBL5=${PGTBL}5 +export T1=$(tempfile) +export T2=$(tempfile) +export T3=$(tempfile) +export T4=$(tempfile) +export T5=$(tempfile) +export T6=$(tempfile) +export T7=$(tempfile) +export T8=$(tempfile) +export T9=$(tempfile) +export T10=$(tempfile) +export T11=$(tempfile) +export T12=$(tempfile) +export T13=$(tempfile) +export T14=$(tempfile) + +#sql mysql://tange:tange@lo/ 'create database tange;'; +cat <<'EOF' | sed -e 's/;$/; /;' | stdout parallel -vj0 -k --joblog /tmp/jl-`basename $0` -L1 | perl -pe 's/\s*\d+\.?\d+\s*/999/g;s/999e+999.\s+.\s+/999e+999|999/g;' +echo '### --sqlandworker mysql' + (sleep 2; parallel --sqlworker $MYSQLTBL sleep .3\;echo >$T1) & + parallel --sqlandworker $MYSQLTBL sleep .3\;echo ::: {1..5} ::: {a..e} >$T2; + true sort -u $T1 $T2; + sql $MYSQL 'select * from parsql order by seq;' + +echo '### --sqlandworker postgresql' + (sleep 2; parallel --sqlworker $PGTBL sleep .3\;echo >$T3) & + parallel --sqlandworker $PGTBL sleep .3\;echo ::: {1..5} ::: {a..e} >$T4; + true sort -u $T3 $T4; + sql $PG 'select * from parsql order by seq;' + +echo '### --sqlandworker sqlite' + (sleep 2; parallel --sqlworker $SQLITETBL sleep .3\;echo >$T5) & + parallel --sqlandworker $SQLITETBL sleep .3\;echo ::: {1..5} ::: {a..e} >$T6; + true sort -u $T5 $T6; + sql $SQLITE 'select * from parsql order by seq;' + +echo '### --sqlandworker postgresql -S lo' + (sleep 2; parallel -S lo --sqlworker $PGTBL2 sleep .3\;echo >$T7) & + parallel -S lo --sqlandworker $PGTBL2 sleep .3\;echo ::: {1..5} ::: {a..e} >$T8; + true sort -u $T7 $T8; + sql $PG 'select * from parsql2 order by seq;' + +echo '### --sqlandworker postgresql --results' + mkdir -p /tmp/out--sql + (sleep 2; parallel --results /tmp/out--sql --sqlworker $PGTBL3 sleep .3\;echo >$T9) & + parallel --results /tmp/out--sql --sqlandworker $PGTBL3 sleep .3\;echo ::: {1..5} ::: 
{a..e} >$T10; + true sort -u $T9 $T10; + sql $PG 'select * from parsql3 order by seq;' + +echo '### --sqlandworker postgresql --linebuffer' + (sleep 2; parallel --linebuffer --sqlworker $PGTBL4 sleep .3\;echo >$T11) & + parallel --linebuffer --sqlandworker $PGTBL4 sleep .3\;echo ::: {1..5} ::: {a..e} >$T12; + true sort -u $T11 $T12; + sql $PG 'select * from parsql4 order by seq;' + +echo '### --sqlandworker postgresql -u' + (sleep 2; parallel -u --sqlworker $PGTBL5 sleep .3\;echo >$T13) & + parallel -u --sqlandworker $PGTBL5 sleep .3\;echo ::: {1..5} ::: {a..e} >$T14; + true sort -u $T13 $T14; + sql $PG 'select * from parsql5 order by seq;' + +EOF + +eval rm '$T'{1..14} \ No newline at end of file