parallel_design.pod: GNU Parallel design considerations.

2024-12-23 13:17:54 +00:00 · 2015-01-19 00:07:12 +01:00 · 2015-01-19 00:07:12 +01:00 · 649e2ec7c3
parent 8c4f4c2b20
commit 649e2ec7c3
3 changed files with 616 additions and 40 deletions
--- a/src/Makefile.am
+++ b/src/Makefile.am
@ -5,8 +5,10 @@ install-exec-hook:
 	$(LN_S) parallel $(DESTDIR)$(bindir)/sem
 if DOCUMENTATION
-man_MANS = parallel.1 sem.1 sql.1 niceload.1 parallel_tutorial.1
+man_MANS = parallel.1 sem.1 sql.1 niceload.1 parallel_tutorial.7 parallel_design.7
-doc_DATA = parallel.html sem.html sql.html niceload.html parallel_tutorial.html parallel.texi sem.texi sql.texi niceload.texi parallel_tutorial.texi parallel.pdf sem.pdf sql.pdf niceload.pdf parallel_tutorial.pdf
+doc_DATA = parallel.html sem.html sql.html niceload.html parallel_tutorial.html parallel_design.html \
 	parallel.texi sem.texi sql.texi niceload.texi parallel_tutorial.texi parallel_design.texi \
 	parallel.pdf sem.pdf sql.pdf niceload.pdf parallel_tutorial.pdf parallel_design.pdf
 endif
 # Build documentation file if the tool to build exists.
@ -17,11 +19,17 @@ parallel.1: parallel.pod
 	&& mv $(srcdir)/parallel.1n $(srcdir)/parallel.1 \
 	|| echo "Warning: pod2man not found. Using old parallel.1"
-parallel_tutorial.1: parallel_tutorial.pod
+parallel_tutorial.7: parallel_tutorial.pod
 	pod2man --release='$(PACKAGE_VERSION)' --center='$(PACKAGE_NAME)' \
-		--section=1 $(srcdir)/parallel_tutorial.pod > $(srcdir)/parallel_tutorial.1n \
+		--section=7 $(srcdir)/parallel_tutorial.pod > $(srcdir)/parallel_tutorial.7n \
-	&& mv $(srcdir)/parallel_tutorial.1n $(srcdir)/parallel_tutorial.1 \
+	&& mv $(srcdir)/parallel_tutorial.7n $(srcdir)/parallel_tutorial.7 \
-	|| echo "Warning: pod2man not found. Using old parallel_tutorial.1"
+	|| echo "Warning: pod2man not found. Using old parallel_tutorial.7"
 parallel_design.7: parallel_design.pod
 	pod2man --release='$(PACKAGE_VERSION)' --center='$(PACKAGE_NAME)' \
 		--section=7 $(srcdir)/parallel_design.pod > $(srcdir)/parallel_design.7n \
 	&& mv $(srcdir)/parallel_design.7n $(srcdir)/parallel_design.7 \
 	|| echo "Warning: pod2man not found. Using old parallel_design.7"
 sem.1: sem.pod
 	pod2man --release='$(PACKAGE_VERSION)' --center='$(PACKAGE_NAME)' \
@ -55,7 +63,14 @@ parallel_tutorial.html: parallel_tutorial.pod parallel.html
 	rm -f $(srcdir)/pod2htm*
 # Depending on parallel_tutorial.html to avoid stupid pod2html race condition
-sem.html: sem.pod parallel_tutorial.html
+parallel_design.html: parallel_design.pod parallel.html
 	pod2html --title "GNU Parallel design" $(srcdir)/parallel_design.pod > $(srcdir)/parallel_design.htmln \
 	&& mv $(srcdir)/parallel_design.htmln $(srcdir)/parallel_design.html \
 	|| echo "Warning: pod2html not found. Using old parallel_design.html"
 	rm -f $(srcdir)/pod2htm*
 # Depending on parallel_design.html to avoid stupid pod2html race condition
 sem.html: sem.pod parallel_design.html
 	pod2html --title "sem (GNU Parallel)" $(srcdir)/sem.pod > $(srcdir)/sem.htmln \
 	&& mv $(srcdir)/sem.htmln $(srcdir)/sem.html \
 	|| echo "Warning: pod2html not found. Using old sem.html"
@ -83,6 +98,10 @@ parallel_tutorial.texi: parallel_tutorial.pod
 	pod2texi --output=$(srcdir)/parallel_tutorial.texi $(srcdir)/parallel_tutorial.pod \
 	|| echo "Warning: pod2texi not found. Using old parallel_tutorial.texi"
 parallel_design.texi: parallel_design.pod
 	pod2texi --output=$(srcdir)/parallel_design.texi $(srcdir)/parallel_design.pod \
 	|| echo "Warning: pod2texi not found. Using old parallel_design.texi"
 sem.texi: sem.pod
 	pod2texi --output=$(srcdir)/sem.texi $(srcdir)/sem.pod \
 	|| echo "Warning: pod2texi not found. Using old sem.texi"
@ -103,6 +122,10 @@ parallel_tutorial.pdf: parallel_tutorial.pod
 	pod2pdf --output-file $(srcdir)/parallel_tutorial.pdf $(srcdir)/parallel_tutorial.pod --title "GNU Parallel Tutorial" \
 	|| echo "Warning: pod2pdf not found. Using old parallel_tutorial.pdf"
 parallel_design.pdf: parallel_design.pod
 	pod2pdf --output-file $(srcdir)/parallel_design.pdf $(srcdir)/parallel_design.pod --title "GNU Parallel Design" \
 	|| echo "Warning: pod2pdf not found. Using old parallel_design.pdf"
 sem.pdf: sem.pod
 	pod2pdf --output-file $(srcdir)/sem.pdf $(srcdir)/sem.pod --title "GNU sem" \
 	|| echo "Warning: pod2pdf not found. Using old sem.pdf"
@ -118,14 +141,11 @@ niceload.pdf: niceload.pod
 sem: parallel
 	ln -fs parallel sem
-DISTCLEANFILES = parallel.1 sem.1 sql.1 niceload.1 parallel_tutorial.1 \
+DISTCLEANFILES = parallel.1 sem.1 sql.1 niceload.1 parallel_tutorial.7 parallel_design.7 \
-	parallel.html sem.html sql.html niceload.html parallel_tutorial.html \
+	parallel.html sem.html sql.html niceload.html parallel_tutorial.html parallel_design.html \
-	parallel.texi sem.texi sql.texi niceload.texi parallel_tutorial.texi \
+	parallel.texi sem.texi sql.texi niceload.texi parallel_tutorial.texi parallel_design.texi \
-	parallel.pdf sem.pdf sql.pdf niceload.pdf parallel_tutorial.pdf
+	parallel.pdf sem.pdf sql.pdf niceload.pdf parallel_tutorial.pdf parallel_design.pdf
 EXTRA_DIST = parallel sem sql niceload \
 	parallel.1 sem.1 sql.1 niceload.1 parallel_tutorial.1 \
 	parallel.html sem.html sql.html niceload.html parallel_tutorial.html \
 	sem.pod parallel.pod niceload.pod parallel_tutorial.pod \
-	parallel.texi sem.texi sql.texi niceload.texi parallel_tutorial.texi \
+	$(DISTCLEANFILES)
 	parallel.pdf sem.pdf sql.pdf niceload.pdf parallel_tutorial.pdf
--- a/src/Makefile.in
+++ b/src/Makefile.in
@ -115,7 +115,7 @@ am__uninstall_files_from_dir = { \
         $(am__cd) "$$dir" && rm -f $$files; }; \
  }
 am__installdirs = "$(DESTDIR)$(bindir)" "$(DESTDIR)$(man1dir)" \
-	"$(DESTDIR)$(docdir)"
+	"$(DESTDIR)$(man7dir)" "$(DESTDIR)$(docdir)"
 SCRIPTS = $(bin_SCRIPTS)
 AM_V_P = $(am__v_P_@AM_V@)
 am__v_P_ = $(am__v_P_@AM_DEFAULT_V@)
@ -137,6 +137,7 @@ am__can_run_installinfo = \
    *) (install-info --version) >/dev/null 2>&1;; \
  esac
 man1dir = $(mandir)/man1
 man7dir = $(mandir)/man7
 NROFF = nroff
 MANS = $(man_MANS)
 DATA = $(doc_DATA)
@ -217,19 +218,19 @@ top_build_prefix = @top_build_prefix@
 top_builddir = @top_builddir@
 top_srcdir = @top_srcdir@
 bin_SCRIPTS = parallel sql niceload
-@DOCUMENTATION_TRUE@man_MANS = parallel.1 sem.1 sql.1 niceload.1 parallel_tutorial.1
+@DOCUMENTATION_TRUE@man_MANS = parallel.1 sem.1 sql.1 niceload.1 parallel_tutorial.7 parallel_design.7
-@DOCUMENTATION_TRUE@doc_DATA = parallel.html sem.html sql.html niceload.html parallel_tutorial.html parallel.texi sem.texi sql.texi niceload.texi parallel_tutorial.texi parallel.pdf sem.pdf sql.pdf niceload.pdf parallel_tutorial.pdf
+@DOCUMENTATION_TRUE@doc_DATA = parallel.html sem.html sql.html niceload.html parallel_tutorial.html parallel_design.html \
-DISTCLEANFILES = parallel.1 sem.1 sql.1 niceload.1 parallel_tutorial.1 \
+@DOCUMENTATION_TRUE@	parallel.texi sem.texi sql.texi niceload.texi parallel_tutorial.texi parallel_design.texi \
-	parallel.html sem.html sql.html niceload.html parallel_tutorial.html \
+@DOCUMENTATION_TRUE@	parallel.pdf sem.pdf sql.pdf niceload.pdf parallel_tutorial.pdf parallel_design.pdf
-	parallel.texi sem.texi sql.texi niceload.texi parallel_tutorial.texi \
+
-	parallel.pdf sem.pdf sql.pdf niceload.pdf parallel_tutorial.pdf
+DISTCLEANFILES = parallel.1 sem.1 sql.1 niceload.1 parallel_tutorial.7 parallel_design.7 \
 	parallel.html sem.html sql.html niceload.html parallel_tutorial.html parallel_design.html \
 	parallel.texi sem.texi sql.texi niceload.texi parallel_tutorial.texi parallel_design.texi \
 	parallel.pdf sem.pdf sql.pdf niceload.pdf parallel_tutorial.pdf parallel_design.pdf
 EXTRA_DIST = parallel sem sql niceload \
 	parallel.1 sem.1 sql.1 niceload.1 parallel_tutorial.1 \
 	parallel.html sem.html sql.html niceload.html parallel_tutorial.html \
 	sem.pod parallel.pod niceload.pod parallel_tutorial.pod \
-	parallel.texi sem.texi sql.texi niceload.texi parallel_tutorial.texi \
+	$(DISTCLEANFILES)
 	parallel.pdf sem.pdf sql.pdf niceload.pdf parallel_tutorial.pdf
 all: all-am
@ -342,6 +343,49 @@ uninstall-man1:
 	} | sed -e 's,.*/,,;h;s,.*\.,,;s,^[^1][0-9a-z]*$$,1,;x' \
 	      -e 's,\.[0-9a-z]*$$,,;$(transform);G;s,\n,.,'`; \
 	dir='$(DESTDIR)$(man1dir)'; $(am__uninstall_files_from_dir)
 install-man7: $(man_MANS)
 	@$(NORMAL_INSTALL)
 	@list1=''; \
 	list2='$(man_MANS)'; \
 	test -n "$(man7dir)" \
 	  && test -n "`echo $$list1$$list2`" \
 	  || exit 0; \
 	echo " $(MKDIR_P) '$(DESTDIR)$(man7dir)'"; \
 	$(MKDIR_P) "$(DESTDIR)$(man7dir)" || exit 1; \
 	{ for i in $$list1; do echo "$$i"; done;  \
 	if test -n "$$list2"; then \
 	  for i in $$list2; do echo "$$i"; done \
 	    | sed -n '/\.7[a-z]*$$/p'; \
 	fi; \
 	} | while read p; do \
 	  if test -f $$p; then d=; else d="$(srcdir)/"; fi; \
 	  echo "$$d$$p"; echo "$$p"; \
 	done | \
 	sed -e 'n;s,.*/,,;p;h;s,.*\.,,;s,^[^7][0-9a-z]*$$,7,;x' \
 	      -e 's,\.[0-9a-z]*$$,,;$(transform);G;s,\n,.,' | \
 	sed 'N;N;s,\n, ,g' | { \
 	list=; while read file base inst; do \
 	  if test "$$base" = "$$inst"; then list="$$list $$file"; else \
 	    echo " $(INSTALL_DATA) '$$file' '$(DESTDIR)$(man7dir)/$$inst'"; \
 	    $(INSTALL_DATA) "$$file" "$(DESTDIR)$(man7dir)/$$inst" || exit $$?; \
 	  fi; \
 	done; \
 	for i in $$list; do echo "$$i"; done | $(am__base_list) | \
 	while read files; do \
 	  test -z "$$files" || { \
 	    echo " $(INSTALL_DATA) $$files '$(DESTDIR)$(man7dir)'"; \
 	    $(INSTALL_DATA) $$files "$(DESTDIR)$(man7dir)" || exit $$?; }; \
 	done; }
 uninstall-man7:
 	@$(NORMAL_UNINSTALL)
 	@list=''; test -n "$(man7dir)" || exit 0; \
 	files=`{ for i in $$list; do echo "$$i"; done; \
 	l2='$(man_MANS)'; for i in $$l2; do echo "$$i"; done | \
 	  sed -n '/\.7[a-z]*$$/p'; \
 	} | sed -e 's,.*/,,;h;s,.*\.,,;s,^[^7][0-9a-z]*$$,7,;x' \
 	      -e 's,\.[0-9a-z]*$$,,;$(transform);G;s,\n,.,'`; \
 	dir='$(DESTDIR)$(man7dir)'; $(am__uninstall_files_from_dir)
 install-docDATA: $(doc_DATA)
 	@$(NORMAL_INSTALL)
 	@list='$(doc_DATA)'; test -n "$(docdir)" || list=; \
@ -404,7 +448,7 @@ check-am: all-am
 check: check-am
 all-am: Makefile $(SCRIPTS) $(MANS) $(DATA)
 installdirs:
-	for dir in "$(DESTDIR)$(bindir)" "$(DESTDIR)$(man1dir)" "$(DESTDIR)$(docdir)"; do \
+	for dir in "$(DESTDIR)$(bindir)" "$(DESTDIR)$(man1dir)" "$(DESTDIR)$(man7dir)" "$(DESTDIR)$(docdir)"; do \
 	  test -z "$$dir" || $(MKDIR_P) "$$dir"; \
 	done
 install: install-am
@ -475,7 +519,7 @@ install-info: install-info-am
 install-info-am:
-install-man: install-man1
+install-man: install-man1 install-man7
 install-pdf: install-pdf-am
@ -505,7 +549,7 @@ ps-am:
 uninstall-am: uninstall-binSCRIPTS uninstall-docDATA uninstall-man
-uninstall-man: uninstall-man1
+uninstall-man: uninstall-man1 uninstall-man7
 .MAKE: install-am install-exec-am install-strip
@ -515,12 +559,13 @@ uninstall-man: uninstall-man1
 	install-data install-data-am install-docDATA install-dvi \
 	install-dvi-am install-exec install-exec-am install-exec-hook \
 	install-html install-html-am install-info install-info-am \
-	install-man install-man1 install-pdf install-pdf-am install-ps \
+	install-man install-man1 install-man7 install-pdf \
-	install-ps-am install-strip installcheck installcheck-am \
+	install-pdf-am install-ps install-ps-am install-strip \
-	installdirs maintainer-clean maintainer-clean-generic \
+	installcheck installcheck-am installdirs maintainer-clean \
-	mostlyclean mostlyclean-generic pdf pdf-am ps ps-am tags-am \
+	maintainer-clean-generic mostlyclean mostlyclean-generic pdf \
-	uninstall uninstall-am uninstall-binSCRIPTS uninstall-docDATA \
+	pdf-am ps ps-am tags-am uninstall uninstall-am \
-	uninstall-man uninstall-man1
+	uninstall-binSCRIPTS uninstall-docDATA uninstall-man \
 	uninstall-man1 uninstall-man7
 install-exec-hook:
@ -535,11 +580,17 @@ parallel.1: parallel.pod
 	&& mv $(srcdir)/parallel.1n $(srcdir)/parallel.1 \
 	|| echo "Warning: pod2man not found. Using old parallel.1"
-parallel_tutorial.1: parallel_tutorial.pod
+parallel_tutorial.7: parallel_tutorial.pod
 	pod2man --release='$(PACKAGE_VERSION)' --center='$(PACKAGE_NAME)' \
-		--section=1 $(srcdir)/parallel_tutorial.pod > $(srcdir)/parallel_tutorial.1n \
+		--section=7 $(srcdir)/parallel_tutorial.pod > $(srcdir)/parallel_tutorial.7n \
-	&& mv $(srcdir)/parallel_tutorial.1n $(srcdir)/parallel_tutorial.1 \
+	&& mv $(srcdir)/parallel_tutorial.7n $(srcdir)/parallel_tutorial.7 \
-	|| echo "Warning: pod2man not found. Using old parallel_tutorial.1"
+	|| echo "Warning: pod2man not found. Using old parallel_tutorial.7"
 parallel_design.7: parallel_design.pod
 	pod2man --release='$(PACKAGE_VERSION)' --center='$(PACKAGE_NAME)' \
 		--section=7 $(srcdir)/parallel_design.pod > $(srcdir)/parallel_design.7n \
 	&& mv $(srcdir)/parallel_design.7n $(srcdir)/parallel_design.7 \
 	|| echo "Warning: pod2man not found. Using old parallel_design.7"
 sem.1: sem.pod
 	pod2man --release='$(PACKAGE_VERSION)' --center='$(PACKAGE_NAME)' \
@ -573,7 +624,14 @@ parallel_tutorial.html: parallel_tutorial.pod parallel.html
 	rm -f $(srcdir)/pod2htm*
 # Depending on parallel_tutorial.html to avoid stupid pod2html race condition
-sem.html: sem.pod parallel_tutorial.html
+parallel_design.html: parallel_design.pod parallel.html
 	pod2html --title "GNU Parallel design" $(srcdir)/parallel_design.pod > $(srcdir)/parallel_design.htmln \
 	&& mv $(srcdir)/parallel_design.htmln $(srcdir)/parallel_design.html \
 	|| echo "Warning: pod2html not found. Using old parallel_design.html"
 	rm -f $(srcdir)/pod2htm*
 # Depending on parallel_design.html to avoid stupid pod2html race condition
 sem.html: sem.pod parallel_design.html
 	pod2html --title "sem (GNU Parallel)" $(srcdir)/sem.pod > $(srcdir)/sem.htmln \
 	&& mv $(srcdir)/sem.htmln $(srcdir)/sem.html \
 	|| echo "Warning: pod2html not found. Using old sem.html"
@ -601,6 +659,10 @@ parallel_tutorial.texi: parallel_tutorial.pod
 	pod2texi --output=$(srcdir)/parallel_tutorial.texi $(srcdir)/parallel_tutorial.pod \
 	|| echo "Warning: pod2texi not found. Using old parallel_tutorial.texi"
 parallel_design.texi: parallel_design.pod
 	pod2texi --output=$(srcdir)/parallel_design.texi $(srcdir)/parallel_design.pod \
 	|| echo "Warning: pod2texi not found. Using old parallel_design.texi"
 sem.texi: sem.pod
 	pod2texi --output=$(srcdir)/sem.texi $(srcdir)/sem.pod \
 	|| echo "Warning: pod2texi not found. Using old sem.texi"
@ -621,6 +683,10 @@ parallel_tutorial.pdf: parallel_tutorial.pod
 	pod2pdf --output-file $(srcdir)/parallel_tutorial.pdf $(srcdir)/parallel_tutorial.pod --title "GNU Parallel Tutorial" \
 	|| echo "Warning: pod2pdf not found. Using old parallel_tutorial.pdf"
 parallel_design.pdf: parallel_design.pod
 	pod2pdf --output-file $(srcdir)/parallel_design.pdf $(srcdir)/parallel_design.pod --title "GNU Parallel Design" \
 	|| echo "Warning: pod2pdf not found. Using old parallel_design.pdf"
 sem.pdf: sem.pod
 	pod2pdf --output-file $(srcdir)/sem.pdf $(srcdir)/sem.pod --title "GNU sem" \
 	|| echo "Warning: pod2pdf not found. Using old sem.pdf"
--- a/src/parallel_design.pod
+++ b/src/parallel_design.pod
@ -0,0 +1,490 @@
 #!/usr/bin/perl -w
 =encoding utf8
 =head1 Design of GNU Parallel
 This document describes design decisions made in the development of
 GNU B<parallel> and the reasoning behind them. It will give an
 overview of why some of the code looks like it does, and help new
 maintainers understand the code better.
 =head2 Job slots
 The easiest way to explain what GNU B<parallel> does is to assume that
 there are a number of job slots, and when a slot becomes available a
 job from the queue will be run in that slot. But originally GNU
 B<parallel> did not model job slots in the code. Job slots have been
 added to make it possible to use {%} as a replacement string.
 Job slots were added to the code in 20140522, but while the job
 sequence number can be computed in advance, the job slot can only be
 computed the moment a slot becomes available. So it has been
 implemented as a stack with lazy evaluation: Draw one from an empty
 stack and the stack is extended by one. When a job is done, push the
 available job slot back on the stack.
 This implementation also means that if you use remote executions, you
 cannot assume that a given job slot will remain on the same remote
 server. This goes double since number of job slots can be adjusted on
 the fly (by giving B<--jobs> a file name).
 =head2 Rsync protocol version
 B<rsync> 3.1.x uses protocol 31 which is unsupported by version
 2.5.7. That means that you cannot push a file to a remote system using
 B<rsync> protocol 31, if the remote system uses 2.5.7. B<rsync> does
 not automatically downgrade to protocol 30.
 GNU B<parallel> does not require protocol 31, so if the B<rsync>
 version is >= 3.1.0 then B<--protocol 30> is added to force newer
 B<rsync>s to talk to version 2.5.7.
 =head2 Wrapping
 The command given by the user can be wrapped in multiple
 templates. Templates can be wrapped in other templates.
 =over 15
 =item --shellquote
 echo <<shell double quoted input>>
 =item --nice I<pri>
 \nice -n I<pri> $shell -c <<shell quoted input>>
 The \ is needed to avoid using the builtin nice command, which does not
 support -n in B<tcsh>. B<$shell -c> is needed to nice composed commands
 command.
 =item --cat
 (cat > {}; <<input>> {}; perl -e '$bash=shift; $csh=shift; for(@ARGV)
 {unlink;rmdir;} if($bash=~s/h//) {exit$bash;} exit$csh;' "$?h"
 "$status" {});
 {} is really just a tmpfile. The Perl script saves the exit value,
 unlinks the tmpfile, and returns the exit value - no matter if the
 shell is B<bash> (using $?) or B<*csh> (using $status).
 =item --fifo
 (mkfifo {};
 (<<input>> {};) & _PID=$!; cat > {};  wait $_PID; perl -e '$bash=shift; $csh=shift; for(@ARGV)
 {unlink;rmdir;} if($bash=~s/h//) {exit$bash;} exit$csh;' "$?h"
 "$status" {});
 B<wait $_PID> makes sure the exit value is from that PID. This makes it 
 incompatible with B<*csh>. The Perl script is the same as from B<--cat>.
 =item --sshlogin I<sln>
 ssh I<sln> <<shell quoted input>>
 =item --transfer
 ( ssh I<sln> mkdir -p ./I<workdir>;rsync --protocol 30 -rlDzR -essh ./{} I<sln>:./I<workdir> ); <<input>>
 Read about B<--protocol 30> in the section B<Rsync protocol version>.
 =item --basefile
 <<todo>>
 =item --return I<file>
 <<input>>; _EXIT_status=$?; mkdir -p I<workdir>; rsync --protocol 30 --rsync-path=cd\ ./I<workdir>\;\ rsync -rlDzR -essh I<sln>:./I<file> ./I<workdir>; exit $_EXIT_status;
 The B<--rsync-path=cd ...> is needed because old versions of B<rsync>
 do not support B<--no-implied-dirs>.
 The B<$_EXIT_status> trick is to postpone the exit value. This makes it
 incompatible with B<*csh> and should be fixed in the future. Maybe a
 wrapping 'sh -c' is enough?
 =item --cleanup
 <<input>> _EXIT_status=$?; <<return>>
 ssh I<sln> \(rm\ -f\ ./I<workdir>/{}\;\ rmdir\ ./I<workdir>\ \>\&/dev/null\;\); exit $_EXIT_status;
 B<$_EXIT_status>: see B<--return> above.
 =item --pipe
 sh -c 'dd bs=1 count=1 of=I<tmpfile> 2>/dev/null'; test ! -s "I<tmpfile>" && rm -f "I<tmpfile>" && exec true; (cat I<tmpfile>; rm I<tmpfile>; cat - ) | ( <<input>> );
 This small wrapper makes sure that <<input>> will never be run if
 there is no data. B<sh -c> is needed to hide stderr if the user's
 shell is B<csh> (which cannot hide stderr).
 =item --tmux
 mkfifo I<tmpfile>; tmux new-session -s pI<PID> -d -n <<shell quoted input>> \( <<shell quoted input>> \)\;\(echo\ \$\?\$status\;echo\ 255\)\ \>I<tmpfile>\&echo\ <<shell double quoted input>>\;echo\ \Job\ finished\ at:\ \`date\`\;sleep\ 10;  exit `perl -ne 'unlink $ARGV; 1..1 and print' I<tmpfile>` 
 The input is used as the name of the windows in B<tmux>. To get the
 exit value out from B<tmux> a fifo is used. This fifo is being opened
 by perl and the first value read is used as exit value. Works in
 B<csh>.
 =back
 The ordering of the wrapping is important:
 =over 5
 =item *
 B<--nice>/B<--cat>/B<--fifo> should be done on the remote machine
 =item *
 B<--pipepart>/B<--pipe> should be done on the local machine inside B<--tmux>
 =back
 =head2 Shell shock
 The shell shock bug in B<bash> did not affect GNU B<parallel>, but the
 solutions did. B<bash> first introduced functions in variables named:
 I<BASH_FUNC_myfunc()> and later changed that to I<BASH_FUNC_myfunc%%>. When
 transferring functions GNU B<parallel> reads off the function and changes
 that into a function definition, which is copied to the remote system and
 executed before the actual command is executed. Therefore GNU B<parallel>
 needs to know how to read the function.
 From version 20150122 GNU B<parallel> tries both the ()-version and
 the %%-version, and the function definition works on both pre- and
 post-shellshock versions of B<bash>.
 =head2 Remote Ctrl-C and standard error (stderr)
 If the user presses Ctrl-C the user expect jobs to stop. This works
 out of the box if the jobs are run locally. Unfortunately it is not so
 simple if the jobs are run remotely.
 If remote jobs are run in a tty using B<ssh -tt>, then Ctrl-C works,
 but all output to standard error (stderr) is sent to standard output
 (stdout). This is not what the user expects.
 If remote jobs are run without a tty using B<ssh> (without B<-tt>),
 then output to standard error (stderr) is kept on stderr, but Ctrl-C
 does not kill remote jobs. This is not what the user expects.
 So what is needed is a way to have both. It seems the reason why
 Ctrl-C does not kill the remote jobs is because the shell does not
 propagate the hang-up signal from B<sshd>. But when B<sshd> dies, the
 parent of the login shell becomes B<init> (process id 1). So by
 exec'ing a Perl wrapper to monitor the parent pid and kill the child
 if the parent pid becomes 1, then Ctrl-C works and stderr is kept on
 stderr. The wrapper looks like this:
    $SIG{CHLD} = sub { $done = 1; };
    $pid = fork;
    unless($pid) {
        # Make own process group to be able to kill HUP it later
        setpgrp;
        exec $ENV{SHELL}, "-c", ($bashfunc."@ARGV");
        die "exec: $!\n";
    }
    do {
        # Parent is not init (ppid=1), so sshd is alive
        # Exponential sleep up to 1 sec
        $s = $s < 1 ? 0.001 + $s * 1.03 : $s;
        select(undef, undef, undef, $s);
    } until ($done || getppid == 1);
    # Kill HUP the process group if job not done
    kill(SIGHUP, -${pid}) unless $done;
    wait;
    exit ($?&127 ? 128+($?&127) : 1+$?>>8)
 =head2 Transferring of variables and functions
 Transferring of variables and functions is done by running a Perl
 script before running the actual command. The Perl script sets
 $ENV{variable} to the correct value before exec'ing the a shell that
 runs the function definition followed by the actual command.
 B<env_parallel> (mentioned in the man page) copies the full current
 environment into the environment variable
 B<parallel_bash_environment>. This variable is picked up by GNU
 B<parallel> and used to create the Perl script mentioned above.
 =head2 Base64 encode bzip2
 B<csh> limits words of commands to 1024 chars. This is often too little
 when GNU B<parallel> encodes environment variables and wraps the
 command with different templates. All of these are combined and quoted
 into one single word, which often is longer than 1024 chars.
 When the line to run is > 1000 chars, GNU B<parallel> therefore
 encodes the line to run. The encoding B<bzip2>s the line to run,
 converts this to base64, splits the base64 into 1000 char blocks (so B<csh>
 does not fail), and prepends it with this Perl script that decodes,
 decompresses and B<eval>s the line.
    @GNU_Parallel=("use","IPC::Open3;","use","MIME::Base64");
    eval "@GNU_Parallel";
    $SIG{CHLD}="IGNORE";
    # Search for bzip2. Not found => use default path
    my $zip = (grep { -x $_ } "/usr/local/bin/bzip2")[0] || "bzip2";
    # $in = stdin on $zip, $out = stdout from $zip
    my($in, $out,$eval);
    open3($in,$out,">&STDERR",$zip,"-dc");
    if(my $perlpid = fork) {
        close $in;
        $eval = join "", <$out>;
        close $out;
    } else {
        close $out;
        # Pipe decoded base64 into 'bzip2 -dc'
        print $in (decode_base64(join"",@ARGV));
        close $in;
        exit;
    }
    wait;
    eval $eval;
 Perl and B<bzip2> must be installed on the remote system, but a small
 test showed that B<bzip2> is installed by default on all platforms
 that runs GNU B<parallel>, so this is not a big problem.
 The added bonus of this is that much bigger environments can now be
 transferred as they will be below B<bash>'s limit of 131072 chars.
 =head2 Which shell to use
 Different shells behave differently. A command that works in B<tcsh>
 may not work in B<bash>.  It is therefore important that the correct
 shell is used when GNU B<parallel> executes commands.
 GNU B<parallel> tries hard to use the right shell. If GNU B<parallel>
 is called from B<tcsh> it will use B<tcsh>.  If it is called from
 B<bash> it will use B<bash>. It does this by looking at the
 (grand*)parent process: If the (grand*)parent process is a shell, use
 this shell; otherwise look at the parent of this (grand*)parent. If
 none of the (grand*)parents are shells, then $SHELL is used.
 This will do the right thing in most cases. If called from:
 =over 2
 =item *
 an interactive shell
 =item *
 a shell script
 =item *
 a Perl script in `` or using B<system> if called as a single string
 =back
 But there are situations where it will fail:
  #!/usr/bin/perl
  system("parallel",'setenv a {}; echo $a',":::",2);
 Here it depends on which shell is used to call the Perl script. If the
 Perl script is called from B<tcsh> it will work just fine, but if it
 is called from B<bash> it will fail.
 =head2 Quoting
 Quoting is kept simple: Use \ for all special chars and ' for
 newline. Whether a char is special depends on the shell and the
 context. Luckily quoting a bit too many does not break things.
 It is fast, but had the distinct disadvantage that if at string needs
 to be quoted multiple times, the \'s double every time.
 =head2 --pipepart vs. --pipe
 While B<--pipe> and B<--pipepart> look much the same to the user, they are
 implemented very differently.
 With B<--pipe> GNU B<parallel> reads the blocks from standard input
 (stdin), which is then given to the command on standard input (stdin);
 so every block is being processed by GNU B<parallel> itself. This is
 the reason why B<--pipe> maxes out at around 100 MB/sec.
 B<--pipepart> on the other hand first identifies at which byte
 position blocks starts and how long they are. It does that by seeking
 into the file by the size of a block and then reading until it meets
 end of a block. The seeking explains why GNU B<parallel> does not know
 the line number and why B<-L/-l> and B<-N> do not work.
 With a reasonable block and file size this seeking is often more than
 1000 faster than reading the full file. The byte positions are then
 given to a small script that reads from position X to Y and sends
 output to standard output (stdout). This small script is prepended to
 the command and the full command is executed just as if GNU
 B<parallel> had been in its normal mode. The script looks like this:
  < file perl -e 'while(@ARGV) { 
     sysseek(STDIN,shift,0) || die;
     $left = shift;
     while($read = sysread(STDIN,$buf, ($left > 32768 ? 32768 : $left))){
       $left -= $read; syswrite(STDOUT,$buf);
     }
  }' startbyte length_in_bytes
 It delivers 1 GB/s per core.
 Instead of the script B<dd> was tried, but many versions of B<dd> do
 not support reading from one byte to another and might cause partial
 data:
  yes | dd bs=1024k count=10 | wc
 =head2 --jobs and --onall
 When running the same commands on many servers what should B<--jobs>
 signify? Is it the number of servers to run on in parallel?  Is it the
 number of jobs run in parallel on each server?
 GNU B<parallel> lets B<--jobs> represent the number of servers to run
 on in parallel. This is to make it possible to run a sequence of
 commands (that cannot be parallelized) on each server, but run the
 same sequence on multiple servers.
 =head2 Disk full
 GNU B<parallel> buffers on disk. If the disk is full data may be
 lost. To check if the disk is full GNU B<parallel> writes a 8193 byte
 file when a job finishes. If this file is written succesfully, it is
 removed immediately. If it is not written succesfully, the disk is
 full. The size 8193 was chosen because 8192 gave wrong result on some
 file systems, whereas 8193 did the correct thing on all tested
 filesystems.
 =head2 Perl replacement strings, {= =}, and --rpl
 The shorthands for replacement strings makes a command look more
 cryptic. Different users will need different replacement
 strings. Instead of inventing more shorthands you get more more
 flexible replacement strings if they can be programmed by the user.
 The language Perl was chosen because GNU B<parallel> is written in
 Perl and it was easy and reasonably fast to run the code given by the
 user.
 If a user needs the same programmed replacement string again and
 again, the user may want to make his own shorthand for it. This is
 what B<--rpl> is for. It works so well, that even GNU B<parallel>'s
 own shorthands are implemented using B<--rpl>.
 In Perl code the bigrams {= and =} rarely exist. They look like a
 matching pair and can be entered on all keyboards. This made them good
 candidates for enclosing the Perl expression in the replacement
 strings. Another candidate ,, and ,, was rejected because they do not
 look like a matching pair. B<--parens> was made, so that the users can
 still use ,, and ,, if they like: B<--parens ,,,,>
 Internally, however, the {= and =} are replaced by \257< and
 \257>. This is to make it simple to make regular expressions: \257 is
 disallowed on the command line, so when that is matched, it is known
 that this is a replacement string.
 =head2 Test suite
 GNU B<parallel> uses its own testing framework. This is mostly due to
 historical reasons. It deals reasonably well with tests that are
 dependent on how long a given test runs (e.g. more than 10 secs is a
 pass, but less is a fail). It parallelizes most tests, but it is easy
 to force a test to run as the single test (which may be important for
 timing issues). It deals reasonably well with tests that fail
 intermittently. It detects which tests that failed and pushes these to
 the top, so when running the test suite again, the tests that failed
 most recently are run first.
 If GNU B<parallel> should adopt a real testing framework then those
 elements would be important.
 Since many tests are dependent on which hardware it is running on,
 these tests break when run on a different hardware than what the test
 was written for.
 When most bugs are fixed a test is added, so this bug will not
 reappear. That is, however, sometimes hard to create the environment
 in which the bug shows up. One of the harder problems is to make a
 machine start swapping without forcing it to its knees.
 =head1 Ideas for new design
 =head2 Multiple processes working together
 Open3 is slow. Printing is slow. It would be good if they did not tie
 up ressources, but were run in separate threads.
 =head2 Transferring of variables and functions from zsh
 Transferring Bash functions to remote zsh works.
 Can parallel_bash_environment be used to import zsh functions?
 =head2 --rrs on remote using a perl wrapper
 ... | perl -pe '$/=$recend$recstart;BEGIN{ if(substr($_) eq $recstart) substr($_)="" } eof and substr($_) eq $recend) substr($_)="" 
 It ought to be possible to write a filter that removed rec sep on the
 fly instead of inside GNU B<parallel>. This could then use more cpus.
 Will that require 2x record size memory?
 Will that require 2x block size memory?
 =head1 Historical decisions
 =head2 --tollef
 You can read about the history of GNU B<parallel> on https://www.gnu.org/software/parallel/history.html
 B<--tollef> was included to make GNU B<parallel> switch compatible
 with the parallel from moreutils (which is made by Tollef Fog
 Heen). This was done so that users of that parallel easily could port
 their use to GNU B<parallel>: Simply set B<PARALLEL="--tollef"> and
 that would be it.
 But several distributions chose to make B<--tollef> global (by putting it
 into /etc/parallel/config), and that caused much confusion when people
 tried out the examples from GNU B<parallel>'s man page and these did
 not work.  The users became frustrated because the distribution did
 not make it clear to them that it has made B<--tollef> global.
 So to lessen the frustration and the resulting support, B<--tollef>
 was obsoleted 20130222 and removed one year later.
 =head2 Transferring of variables and functions
 Until 20150122 variables and functions were transferred by looking at
 $SHELL to see whether the shell was a B<*csh> shell. If so the
 variables would be set using B<setenv>. Otherwise they would be set
 using B<=>. The caused the content of the variable to be repeated:
 echo $SHELL | grep "/t\{0,1\}csh" > /dev/null && setenv VAR foo ||
 export VAR=foo
 =cut