parallel/src/niceload

484 lines
11 KiB
Plaintext
Raw Normal View History

#!/usr/bin/perl -w
2010-12-03 13:42:22 +00:00
=head1 NAME
niceload - slow down a program when the load average is above a certain limit
2010-12-03 13:42:22 +00:00
=head1 SYNOPSIS
B<niceload> [-v] [-n nice] [-l load] [-t time] [-s time|-f factor] command
2010-12-03 13:42:22 +00:00
B<niceload> [-v] [-n nice] [-l load] [-t time] [-s time|-f factor] -p=PID
2010-12-03 13:42:22 +00:00
=head1 DESCRIPTION
GNU B<niceload> will run a program when the load average is below a
certain limit. When the limit is reached the program will be suspended
for some time. Then resumed again for some time. Then the load load
average is checked again and we start over.
If the load is 3.00 then the default settings will run a program
like this:
run 1 second, suspend (3.00-1.00) seconds, run 1 second, suspend
(3.00-1.00) seconds, run 1 second, ...
=head1 OPTIONS
=over 9
=item B<-n> I<niceness>
2010-12-03 13:42:22 +00:00
Sets niceness. See B<nice>(1).
=item B<-l> I<maxload>
2010-12-03 13:42:22 +00:00
Max load. The maximal load average before suspending command. Default
is 1.00.
=item B<-t> I<SEC>
2010-12-03 13:42:22 +00:00
Recheck load time. Sleep SEC seconds before checking load
again. Default is 1 second.
=item B<-s> I<SEC>
2010-12-03 13:42:22 +00:00
Suspend time. Suspend the command this many seconds when the max load
average is reached.
=item B<-f> I<FACTOR>
2010-12-03 13:42:22 +00:00
Suspend time factor. Dynamically set B<-s> as max load average over limit * factor. Default is 1.
=item B<-p> I<PID>
2010-12-03 13:42:22 +00:00
Process ID of process to suspend.
=item B<-v>
Verbose. Print some extra output on what is happening. Use B<-v> until
you know what your are doing.
=back
=head1 EXAMPLE: See niceload in action
In terminal 1 run: top
In terminal 2 run:
B<niceload perl -e '$|=1;do{$l==$r or print "."; $l=$r}until(($r=time-$^T)>>B<50)'>
2010-12-03 13:42:22 +00:00
This will print a '.' every second for 50 seconds and eat a lot of
CPU. When the load rises to 1.0 the process is suspended.
=head1 EXAMPLE: Run updatedb
Running updatedb can often starve the system for disk I/O and thus result in a high load.
Run updatedb but suspend updatedb if the load is above 2.00:
B<niceload -l=2 updatedb>
=head1 EXAMPLE: Run rsync
rsync can just like updatedb starve the system for disk I/O and thus result in a high load.
Run rsync but keep load below 3.4. If load reaches 7 sleep for
(7-3.4)*12 seconds:
B<niceload -l=3.4 -f=12 rsync -Ha /home/ /backup/home/>
=head1 ENVIRONMENT VARIABLES
None. In future versions $NICELOAD will be able to contain default settings.
=head1 EXIT STATUS
Exit status should be the same as the command being run (untested).
=head1 REPORTING BUGS
Report bugs to <bug-parallel@gnu.org>.
=head1 AUTHOR
Copyright (C) 2004-11-19 Ole Tange, http://ole.tange.dk
Copyright (C) 2005,2006,2006,2008,2009,2010 Ole Tange, http://ole.tange.dk
Copyright (C) 2010 Ole Tange, http://ole.tange.dk and Free Software
Foundation, Inc.
=head1 LICENSE
Copyright (C) 2010 Free Software Foundation, Inc.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 3 of the License, or
at your option any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program. If not, see <http://www.gnu.org/licenses/>.
=head2 Documentation license I
Permission is granted to copy, distribute and/or modify this documentation
under the terms of the GNU Free Documentation License, Version 1.3 or
any later version published by the Free Software Foundation; with no
Invariant Sections, with no Front-Cover Texts, and with no Back-Cover
Texts. A copy of the license is included in the file fdl.txt.
=head2 Documentation license II
You are free:
=over 9
=item B<to Share>
to copy, distribute and transmit the work
=item B<to Remix>
to adapt the work
=back
Under the following conditions:
=over 9
=item B<Attribution>
You must attribute the work in the manner specified by the author or
licensor (but not in any way that suggests that they endorse you or
your use of the work).
=item B<Share Alike>
If you alter, transform, or build upon this work, you may distribute
the resulting work only under the same, similar or a compatible
license.
=back
With the understanding that:
=over 9
=item B<Waiver>
Any of the above conditions can be waived if you get permission from
the copyright holder.
=item B<Public Domain>
Where the work or any of its elements is in the public domain under
applicable law, that status is in no way affected by the license.
=item B<Other Rights>
In no way are any of the following rights affected by the license:
=over 2
=item *
Your fair dealing or fair use rights, or other applicable
copyright exceptions and limitations;
=item *
The author's moral rights;
=item *
Rights other persons may have either in the work itself or in
how the work is used, such as publicity or privacy rights.
=back
=back
=over 9
=item B<Notice>
For any reuse or distribution, you must make clear to others the
license terms of this work.
=back
A copy of the full license is included in the file as cc-by-sa.txt.
=head1 DEPENDENCIES
2010-12-03 14:22:01 +00:00
GNU B<niceload> uses Perl, and the Perl modules POSIX, and
Getopt::Long.
2010-12-03 13:42:22 +00:00
=head1 SEE ALSO
B<parallel>(1), B<nice>(1)
=cut
use strict;
use Getopt::Long;
$Global::progname="niceload";
$Global::version = 20110119;
Getopt::Long::Configure("bundling","require_order");
get_options_from_array(\@ARGV) || die_usage();
if($::opt_version) {
version();
exit 0;
2010-12-03 13:42:22 +00:00
}
if($::opt_help) {
help();
exit 0;
}
if($::opt_factor and $::opt_suspend) {
# You cannot have --suspend and --factor
2010-12-03 13:42:22 +00:00
help();
exit;
}
my $nice = $::opt_nice || 0; # -n=0 Nice level (Default: 0)
my $max_load = $::opt_load || 1; # -l=1 Max acceptable load average (Default: 1)
my $check_time = $::opt_recheck || 1; # -t=1 Seconds between checking load average (Default: 1)
2010-12-03 13:42:22 +00:00
my $wait_factor;
my $wait_time;
if($::opt_suspend) {
# --suspend=sec Seconds to suspend process when load average is too high
$wait_time = $::opt_suspend;
2010-12-03 13:42:22 +00:00
} else {
# --factor=1 compute wait_time dynamically as (load - limit) * factor
$wait_factor=$::opt_factor || 1;
2010-12-03 13:42:22 +00:00
}
my $processid = $::opt_pid; # Control this PID (Default: control the command)
my $verbose = $::opt_verbose || $::opt_debug;
my @program = @ARGV;
2010-12-03 13:42:22 +00:00
$SIG{CHLD} = \&REAPER;
if($processid) {
$Child::fork = $processid;
$::opt_verbose and print STDERR "Control $processid\n";
2010-12-03 13:42:22 +00:00
init_signal_handling_attached_child();
my $child_pgrp = getpgrp $Child::fork;
suspend_resume($max_load,$check_time,$wait_time,$wait_factor,$child_pgrp);
} elsif(@ARGV) {
if($Child::fork = fork) {
sleep 1; # Give child time to setpgrp(0,0);
init_signal_handling_my_child();
my $child_pgrp = getpgrp $Child::fork;
suspend_resume($max_load,$check_time,$wait_time,$wait_factor,$child_pgrp);
} else {
setpgrp(0,0);
debug("Child pid: $$, pgrp: ",getpgrp $$,"\n");
2010-12-03 13:42:22 +00:00
if($nice) {
unshift(@program,"nice","-n",$nice);
}
debug("@program\n");
2010-12-03 13:42:22 +00:00
system(@program);
debug("Child exit\n");
2010-12-03 13:42:22 +00:00
exit;
}
} else {
help();
exit;
}
sub get_options_from_array {
# Run GetOptions on @array
# Returns:
# true if parsing worked
# false if parsing failed
# @array is changed
my $array_ref = shift;
# A bit of shuffling of @ARGV needed as GetOptionsFromArray is not
# supported everywhere
my @save_argv;
my $this_is_ARGV = (\@::ARGV == $array_ref);
if(not $this_is_ARGV) {
@save_argv = @::ARGV;
@::ARGV = @{$array_ref};
}
my @retval = GetOptions
("debug|D" => \$::opt_debug,
"load|l=s" => \$::opt_load,
"factor|f=s" => \$::opt_factor,
"suspend|s=s" => \$::opt_suspend,
"recheck|t=s" => \$::opt_recheck,
"nice|n=i" => \$::opt_nice,
"help|h" => \$::opt_help,
"process|pid|p=s" => \$::opt_pid,
"verbose|v" => \$::opt_verbose,
"version|V" => \$::opt_version,
);
if(not $this_is_ARGV) {
@{$array_ref} = @::ARGV;
@::ARGV = @save_argv;
}
return @retval;
}
sub die_usage {
help();
exit 1;
}
sub help {
print q{
Usage:
niceload [-v] [-n=niceness] [-l=loadavg] [-t=recheck_sec] [-s=suspend_sec|-f=factor] command
niceload [-v] [-n=niceness] [-l=loadavg] [-t=recheck_sec] [-s=suspend_sec|-f=factor] command
};
}
2010-12-03 13:42:22 +00:00
sub debug {
if($::opt_debug) {
print STDERR @_;
}
2010-12-03 13:42:22 +00:00
}
sub version {
# Returns: N/A
print join("\n",
"GNU $Global::progname $Global::version",
"Copyright (C) 2004,2005,2006,2007,2008,2009 Ole Tange",
"Copyright (C) 2010 Ole Tange and Free Software Foundation, Inc.",
"License GPLv3+: GNU GPL version 3 or later <http://gnu.org/licenses/gpl.html>",
"This is free software: you are free to change and redistribute it.",
"GNU $Global::progname comes with no warranty.",
"",
"Web site: http://www.gnu.org/software/parallel\n"
);
}
2010-12-03 13:42:22 +00:00
sub init_signal_handling_attached_child {
$SIG{INT}=\&sigint_attached_child;
}
sub sigint_attached_child {
# Let the attached child continue when detaching
kill_child_CONT();
exit;
}
sub init_signal_handling_my_child {
$SIG{INT}=\&kill_child_INT;
$SIG{TSTP}=\&kill_child_TSTP;
$SIG{CONT}=\&kill_child_CONT;
}
use POSIX ":sys_wait_h";
sub REAPER {
my $stiff;
while (($stiff = waitpid(-1, &WNOHANG)) > 0) {
# do something with $stiff if you want
}
$SIG{CHLD} = \&REAPER; # install *after* calling waitpid
}
sub kill_child_CONT {
debug("SIGCONT received. Killing $Child::fork\n");
2010-12-03 13:42:22 +00:00
kill CONT => -getpgrp($Child::fork);
}
sub kill_child_TSTP {
debug("SIGTSTP received. Killing $Child::fork and self\n");
2010-12-03 13:42:22 +00:00
kill TSTP => -getpgrp($Child::fork);
kill STOP => -$$;
}
sub kill_child_INT {
debug("SIGINT received. Killing $Child::fork Exit\n");
2010-12-03 13:42:22 +00:00
kill INT => -getpgrp($Child::fork);
exit;
}
sub suspend_resume {
my ($max_load,$check_time,$wait_time,$wait_factor,@pids) = @_;
debug("suspend_resume these @pids\n");
2010-12-03 13:42:22 +00:00
resume_pids(@pids);
while (pids_exist(@pids)) {
if ( loadavg() > $max_load ) {
if($wait_factor) {
$wait_time = (loadavg()-$max_load) * $wait_factor;
}
$::opt_verbose and print STDERR "suspending for $wait_time seconds\n";
2010-12-03 13:42:22 +00:00
suspend_pids(@pids);
sleep 1; # for some reason this statement is skipped
sleep $wait_time;
resume_pids(@pids);
}
$::opt_verbose and print STDERR "running for $check_time second(s)\n";
2010-12-03 13:42:22 +00:00
sleep($check_time);
}
}
sub pids_exist {
my (@pids) = @_;
my ($exists) = 0;
for my $pid (@pids) {
2010-12-03 13:42:22 +00:00
if(-e "/proc/".$pid) { $exists++ }
#if(kill 0 => $Child::fork) { $exists++ }
}
return $exists;
}
sub loadavg {
my ($loadavg);
if(open(IN,"/proc/loadavg")) {
# Linux specific (but fast)
my $upString = <IN>;
if($upString =~ m/^(\d+\.\d+)/) {
$loadavg = $1;
} else {
die;
}
close IN;
} elsif (open(IN,"uptime|")) {
my $upString = <IN>;
if($upString =~ m/average.\s*(\d+\.\d+)/) {
$loadavg = $1;
} else {
die;
}
close IN;
}
return $loadavg;
}
sub suspend_pids {
my @pids = @_;
signal_pids("STOP",@pids);
}
sub resume_pids {
my @pids = @_;
signal_pids("CONT",@pids);
}
sub signal_pids {
my ($signal,@pids) = @_;
# local $SIG{$signal} = 'IGNORE';
for my $pid (@pids) {
2010-12-03 13:42:22 +00:00
kill $signal => -$pid; # stop PID group
}
}