2010-12-06 23:30:08 +00:00
|
|
|
#!/usr/bin/perl -w
|
2010-12-03 13:42:22 +00:00
|
|
|
|
|
|
|
=head1 NAME
|
|
|
|
|
2010-12-14 08:40:42 +00:00
|
|
|
niceload - slow down a program when the load average is above a certain limit
|
2010-12-03 13:42:22 +00:00
|
|
|
|
|
|
|
=head1 SYNOPSIS
|
|
|
|
|
2010-12-06 23:30:08 +00:00
|
|
|
B<niceload> [-v] [-n nice] [-l load] [-t time] [-s time|-f factor] command
|
2010-12-03 13:42:22 +00:00
|
|
|
|
2010-12-06 23:30:08 +00:00
|
|
|
B<niceload> [-v] [-n nice] [-l load] [-t time] [-s time|-f factor] -p=PID
|
2010-12-03 13:42:22 +00:00
|
|
|
|
|
|
|
=head1 DESCRIPTION
|
|
|
|
|
|
|
|
GNU B<niceload> will run a program when the load average is below a
|
|
|
|
certain limit. When the limit is reached the program will be suspended
|
|
|
|
for some time. Then resumed again for some time. Then the load
|
|
|
|
average is checked again and we start over.
|
|
|
|
|
|
|
|
If the load is 3.00 then the default settings will run a program
|
|
|
|
like this:
|
|
|
|
|
|
|
|
run 1 second, suspend (3.00-1.00) seconds, run 1 second, suspend
|
|
|
|
(3.00-1.00) seconds, run 1 second, ...
|
|
|
|
|
|
|
|
=head1 OPTIONS
|
|
|
|
|
|
|
|
=over 9
|
|
|
|
|
2010-12-06 23:30:08 +00:00
|
|
|
=item B<-n> I<niceness>
|
2010-12-03 13:42:22 +00:00
|
|
|
|
|
|
|
Sets niceness. See B<nice>(1).
|
|
|
|
|
2010-12-06 23:30:08 +00:00
|
|
|
=item B<-l> I<maxload>
|
2010-12-03 13:42:22 +00:00
|
|
|
|
|
|
|
Max load. The maximal load average before suspending command. Default
|
|
|
|
is 1.00.
|
|
|
|
|
2010-12-06 23:30:08 +00:00
|
|
|
=item B<-t> I<SEC>
|
2010-12-03 13:42:22 +00:00
|
|
|
|
|
|
|
Recheck load time. Sleep SEC seconds before checking load
|
|
|
|
again. Default is 1 second.
|
|
|
|
|
2010-12-06 23:30:08 +00:00
|
|
|
=item B<-s> I<SEC>
|
2010-12-03 13:42:22 +00:00
|
|
|
|
|
|
|
Suspend time. Suspend the command this many seconds when the max load
|
|
|
|
average is reached.
|
|
|
|
|
2010-12-06 23:30:08 +00:00
|
|
|
=item B<-f> I<FACTOR>
|
2010-12-03 13:42:22 +00:00
|
|
|
|
|
|
|
Suspend time factor. Dynamically set B<-s> as max load average over limit * factor. Default is 1.
|
|
|
|
|
2010-12-06 23:30:08 +00:00
|
|
|
=item B<-p> I<PID>
|
2010-12-03 13:42:22 +00:00
|
|
|
|
|
|
|
Process ID of process to suspend.
|
|
|
|
|
|
|
|
=item B<-v>
|
|
|
|
|
|
|
|
Verbose. Print some extra output on what is happening. Use B<-v> until
|
|
|
|
you know what you are doing.
|
|
|
|
|
|
|
|
=back
|
|
|
|
|
|
|
|
=head1 EXAMPLE: See niceload in action
|
|
|
|
|
|
|
|
In terminal 1 run: top
|
|
|
|
|
|
|
|
In terminal 2 run:
|
|
|
|
|
2010-12-06 23:30:08 +00:00
|
|
|
B<niceload perl -e '$|=1;do{$l==$r or print "."; $l=$r}until(($r=time-$^T)>>B<50)'>
|
2010-12-03 13:42:22 +00:00
|
|
|
|
|
|
|
This will print a '.' every second for 50 seconds and eat a lot of
|
|
|
|
CPU. When the load rises to 1.0 the process is suspended.
|
|
|
|
|
|
|
|
|
|
|
|
=head1 EXAMPLE: Run updatedb
|
|
|
|
|
|
|
|
Running updatedb can often starve the system for disk I/O and thus result in a high load.
|
|
|
|
|
|
|
|
Run updatedb but suspend updatedb if the load is above 2.00:
|
|
|
|
|
|
|
|
B<niceload -l=2 updatedb>
|
|
|
|
|
|
|
|
|
|
|
|
=head1 EXAMPLE: Run rsync
|
|
|
|
|
|
|
|
rsync can just like updatedb starve the system for disk I/O and thus result in a high load.
|
|
|
|
|
|
|
|
Run rsync but keep load below 3.4. If load reaches 7 sleep for
|
|
|
|
(7-3.4)*12 seconds:
|
|
|
|
|
|
|
|
B<niceload -l=3.4 -f=12 rsync -Ha /home/ /backup/home/>
|
|
|
|
|
|
|
|
|
|
|
|
=head1 ENVIRONMENT VARIABLES
|
|
|
|
|
|
|
|
None. In future versions $NICELOAD will be able to contain default settings.
|
|
|
|
|
|
|
|
=head1 EXIT STATUS
|
|
|
|
|
|
|
|
Exit status should be the same as the command being run (untested).
|
|
|
|
|
|
|
|
=head1 REPORTING BUGS
|
|
|
|
|
|
|
|
Report bugs to <bug-parallel@gnu.org>.
|
|
|
|
|
|
|
|
=head1 AUTHOR
|
|
|
|
|
|
|
|
Copyright (C) 2004-11-19 Ole Tange, http://ole.tange.dk
|
|
|
|
|
|
|
|
Copyright (C) 2005,2006,2006,2008,2009,2010 Ole Tange, http://ole.tange.dk
|
|
|
|
|
|
|
|
Copyright (C) 2010 Ole Tange, http://ole.tange.dk and Free Software
|
|
|
|
Foundation, Inc.
|
|
|
|
|
|
|
|
=head1 LICENSE
|
|
|
|
|
|
|
|
Copyright (C) 2010 Free Software Foundation, Inc.
|
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU General Public License as published by
|
|
|
|
the Free Software Foundation; either version 3 of the License, or
|
|
|
|
(at your option) any later version.
|
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
|
|
along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
|
|
|
=head2 Documentation license I
|
|
|
|
|
|
|
|
Permission is granted to copy, distribute and/or modify this documentation
|
|
|
|
under the terms of the GNU Free Documentation License, Version 1.3 or
|
|
|
|
any later version published by the Free Software Foundation; with no
|
|
|
|
Invariant Sections, with no Front-Cover Texts, and with no Back-Cover
|
|
|
|
Texts. A copy of the license is included in the file fdl.txt.
|
|
|
|
|
|
|
|
=head2 Documentation license II
|
|
|
|
|
|
|
|
You are free:
|
|
|
|
|
|
|
|
=over 9
|
|
|
|
|
|
|
|
=item B<to Share>
|
|
|
|
|
|
|
|
to copy, distribute and transmit the work
|
|
|
|
|
|
|
|
=item B<to Remix>
|
|
|
|
|
|
|
|
to adapt the work
|
|
|
|
|
|
|
|
=back
|
|
|
|
|
|
|
|
Under the following conditions:
|
|
|
|
|
|
|
|
=over 9
|
|
|
|
|
|
|
|
=item B<Attribution>
|
|
|
|
|
|
|
|
You must attribute the work in the manner specified by the author or
|
|
|
|
licensor (but not in any way that suggests that they endorse you or
|
|
|
|
your use of the work).
|
|
|
|
|
|
|
|
=item B<Share Alike>
|
|
|
|
|
|
|
|
If you alter, transform, or build upon this work, you may distribute
|
|
|
|
the resulting work only under the same, similar or a compatible
|
|
|
|
license.
|
|
|
|
|
|
|
|
=back
|
|
|
|
|
|
|
|
With the understanding that:
|
|
|
|
|
|
|
|
=over 9
|
|
|
|
|
|
|
|
=item B<Waiver>
|
|
|
|
|
|
|
|
Any of the above conditions can be waived if you get permission from
|
|
|
|
the copyright holder.
|
|
|
|
|
|
|
|
=item B<Public Domain>
|
|
|
|
|
|
|
|
Where the work or any of its elements is in the public domain under
|
|
|
|
applicable law, that status is in no way affected by the license.
|
|
|
|
|
|
|
|
=item B<Other Rights>
|
|
|
|
|
|
|
|
In no way are any of the following rights affected by the license:
|
|
|
|
|
|
|
|
=over 2
|
|
|
|
|
|
|
|
=item *
|
|
|
|
|
|
|
|
Your fair dealing or fair use rights, or other applicable
|
|
|
|
copyright exceptions and limitations;
|
|
|
|
|
|
|
|
=item *
|
|
|
|
|
|
|
|
The author's moral rights;
|
|
|
|
|
|
|
|
=item *
|
|
|
|
|
|
|
|
Rights other persons may have either in the work itself or in
|
|
|
|
how the work is used, such as publicity or privacy rights.
|
|
|
|
|
|
|
|
=back
|
|
|
|
|
|
|
|
=back
|
|
|
|
|
|
|
|
=over 9
|
|
|
|
|
|
|
|
=item B<Notice>
|
|
|
|
|
|
|
|
For any reuse or distribution, you must make clear to others the
|
|
|
|
license terms of this work.
|
|
|
|
|
|
|
|
=back
|
|
|
|
|
|
|
|
A copy of the full license is included in the file as cc-by-sa.txt.
|
|
|
|
|
|
|
|
=head1 DEPENDENCIES
|
|
|
|
|
2010-12-03 14:22:01 +00:00
|
|
|
GNU B<niceload> uses Perl, and the Perl modules POSIX, and
|
|
|
|
Getopt::Long.
|
2010-12-03 13:42:22 +00:00
|
|
|
|
|
|
|
=head1 SEE ALSO
|
|
|
|
|
|
|
|
B<parallel>(1), B<nice>(1)
|
|
|
|
|
|
|
|
|
|
|
|
=cut
|
|
|
|
|
2010-12-06 23:30:08 +00:00
|
|
|
use strict;
|
|
|
|
use Getopt::Long;
|
|
|
|
# Program identity; interpolated into the output of version().
$Global::progname = "niceload";
$Global::version = 20110101;

# "bundling" allows single-letter options to be combined; "require_order"
# stops option parsing at the first non-option argument, so the options of
# the wrapped command stay in @ARGV untouched.
Getopt::Long::Configure("bundling","require_order");
get_options_from_array(\@ARGV) || die_usage();
if($::opt_version) {
    version();
    exit 0;
}
if($::opt_help) {
    help();
    exit 0;
}
if($::opt_factor and $::opt_suspend) {
    # You cannot have --suspend and --factor: treat it as a usage error
    # (message on STDERR, non-zero exit status) instead of exiting 0.
    print STDERR "$Global::progname: --suspend and --factor cannot be used together\n";
    die_usage();
}

my $nice = $::opt_nice || 0; # -n=0 Nice level (Default: 0)
my $max_load = $::opt_load || 1; # -l=1 Max acceptable load average (Default: 1)
my $check_time = $::opt_recheck || 1; # -t=1 Seconds between checking load average (Default: 1)
# Exactly one of $wait_time / $wait_factor is set below; the other stays
# undef and suspend_resume() uses that to choose between fixed and dynamic
# suspend times.
my $wait_factor;
my $wait_time;
if($::opt_suspend) {
    # --suspend=sec Seconds to suspend process when load average is too high
    $wait_time = $::opt_suspend;
} else {
    # --factor=1 compute wait_time dynamically as (load - limit) * factor
    $wait_factor = $::opt_factor || 1;
}
my $processid = $::opt_pid; # Control this PID (Default: control the command)
my $verbose = $::opt_verbose || $::opt_debug;
# What is left in @ARGV after option parsing is the command to run.
my @program = @ARGV;
|
2010-12-03 13:42:22 +00:00
|
|
|
# Reap terminated children as soon as SIGCHLD arrives.
$SIG{CHLD} = \&REAPER;

if($processid) {
    # -p PID: attach to a process that is already running.
    $Child::fork = $processid;
    $::opt_verbose and print STDERR "Control $processid\n";
    init_signal_handling_attached_child();
    my $child_pgrp = getpgrp $Child::fork;
    suspend_resume($max_load,$check_time,$wait_time,$wait_factor,$child_pgrp);
} elsif(@ARGV) {
    # Run the command in a child with its own process group and
    # suspend/resume that whole group.
    $Child::fork = fork;
    if(not defined $Child::fork) {
        # Without this check a failed fork would fall into the child
        # branch below and run the command unsupervised in this process.
        die "$Global::progname: cannot fork: $!\n";
    }
    if($Child::fork) {
        # Parent. Put the child in its own process group from this side as
        # well, so the getpgrp below cannot return our own group if the
        # child has not yet been scheduled (likely under the high load
        # niceload is meant for). Failure is harmless: the child does the
        # same call itself.
        setpgrp($Child::fork,$Child::fork);
        sleep 1; # Give child time to setpgrp(0,0);
        init_signal_handling_my_child();
        my $child_pgrp = getpgrp $Child::fork;
        suspend_resume($max_load,$check_time,$wait_time,$wait_factor,$child_pgrp);
    } else {
        # Child: become process group leader, then run the command.
        setpgrp(0,0);
        debug("Child pid: $$, pgrp: ",getpgrp($$),"\n");
        if($nice) {
            unshift(@program,"nice","-n",$nice);
        }
        debug("@program\n");
        system(@program);
        debug("Child exit\n");
        exit;
    }
} else {
    # Neither a command nor a PID was given: usage error (exit status 1).
    die_usage();
}
|
|
|
|
|
2010-12-06 23:30:08 +00:00
|
|
|
sub get_options_from_array {
    # Run GetOptions on @array
    # Input:
    #   $array_ref = reference to the array to parse (e.g. \@ARGV)
    # Returns:
    #   true if parsing worked
    #   false if parsing failed
    #   @array is changed
    # Side effects:
    #   sets the $::opt_* variables for the options found
    my $array_ref = shift;
    # A bit of shuffling of @ARGV needed as GetOptionsFromArray is not
    # supported everywhere
    my @save_argv;
    my $this_is_ARGV = (\@::ARGV == $array_ref);
    if(not $this_is_ARGV) {
        @save_argv = @::ARGV;
        @::ARGV = @{$array_ref};
    }
    # Keep the result in a scalar. Storing it in an array and returning
    # the array made the sub return the element count (always 1) in scalar
    # context, so "get_options_from_array(...) || die_usage()" could never
    # detect a parse error.
    my $parsed_ok = GetOptions
        ("debug|D" => \$::opt_debug,
         "load|l=s" => \$::opt_load,
         "factor|f=s" => \$::opt_factor,
         "suspend|s=s" => \$::opt_suspend,
         "recheck|t=s" => \$::opt_recheck,
         "nice|n=i" => \$::opt_nice,
         "help|h" => \$::opt_help,
         "process|pid|p=s" => \$::opt_pid,
         "verbose|v" => \$::opt_verbose,
         "version|V" => \$::opt_version,
        );
    if(not $this_is_ARGV) {
        # Hand the unparsed remainder back and restore the real @ARGV
        @{$array_ref} = @::ARGV;
        @::ARGV = @save_argv;
    }
    return $parsed_ok;
}
|
|
|
|
|
|
|
|
sub die_usage {
    # Show the usage text, then terminate with exit status 1.
    # Returns: N/A (never returns)
    help();
    exit(1);
}
|
|
|
|
|
|
|
|
sub help {
    # Print the usage summary on STDOUT.
    # The two lines mirror the SYNOPSIS: one form runs a command, the
    # other attaches to an existing process with -p=PID. (The second line
    # used to be a copy of the first.)
    # Returns: N/A
    print join("\n",
               "",
               "Usage:",
               "niceload [-v] [-n=niceness] [-l=loadavg] [-t=recheck_sec] [-s=suspend_sec|-f=factor] command",
               "niceload [-v] [-n=niceness] [-l=loadavg] [-t=recheck_sec] [-s=suspend_sec|-f=factor] -p=PID",
               ""
        );
}
|
|
|
|
|
|
|
|
|
|
|
|
|
2010-12-03 13:42:22 +00:00
|
|
|
sub debug {
    # Print the arguments on STDERR, but only when --debug (-D) was given.
    # Input:
    #   @_ = strings to print (no newline is added)
    # Returns: N/A
    return if not $::opt_debug;
    print STDERR @_;
}
|
|
|
|
|
2010-12-06 23:30:08 +00:00
|
|
|
sub version {
    # Print program name, version, copyright and license on STDOUT.
    # Returns: N/A
    my @banner =
        ("GNU $Global::progname $Global::version",
         "Copyright (C) 2004,2005,2006,2007,2008,2009 Ole Tange",
         "Copyright (C) 2010 Ole Tange and Free Software Foundation, Inc.",
         "License GPLv3+: GNU GPL version 3 or later <http://gnu.org/licenses/gpl.html>",
         "This is free software: you are free to change and redistribute it.",
         "GNU $Global::progname comes with no warranty.",
         "",
         "Web site: http://www.gnu.org/software/parallel\n"
        );
    my $text = join("\n", @banner);
    print $text;
}
|
2010-12-03 13:42:22 +00:00
|
|
|
|
|
|
|
sub init_signal_handling_attached_child {
    # Signal setup used when controlling an already running process (-p):
    # SIGINT is routed to sigint_attached_child.
    # Returns: N/A
    $SIG{'INT'} = \&sigint_attached_child;
}
|
|
|
|
|
|
|
|
sub sigint_attached_child {
    # SIGINT handler for the attached (-p) case.
    # Send SIGCONT to the controlled process group before exiting, so it
    # keeps running once we have detached.
    # Returns: N/A (never returns)
    kill_child_CONT();
    exit();
}
|
|
|
|
|
|
|
|
sub init_signal_handling_my_child {
    # Signal setup used when niceload started the command itself:
    # INT, TSTP and CONT are each routed to the matching kill_child_*
    # handler, which passes the signal on to the child's process group.
    # Returns: N/A
    my %handler_for =
        (INT  => \&kill_child_INT,
         TSTP => \&kill_child_TSTP,
         CONT => \&kill_child_CONT,
        );
    for my $signame (keys %handler_for) {
        $SIG{$signame} = $handler_for{$signame};
    }
}
|
|
|
|
|
|
|
|
use POSIX ":sys_wait_h";
|
|
|
|
|
|
|
|
sub REAPER {
    # SIGCHLD handler: collect every child that has terminated, without
    # blocking.
    # Returns: N/A
    # The handler can run in the middle of any other code, so keep its
    # waitpid calls from overwriting that code's $! and $?.
    local ($!, $?);
    while (waitpid(-1, WNOHANG) > 0) {
        # Nothing is done with the reaped PID
    }
    $SIG{CHLD} = \&REAPER; # install *after* calling waitpid
}
|
|
|
|
|
|
|
|
sub kill_child_CONT {
    # Send SIGCONT to the process group of the controlled process
    # ($Child::fork).
    # Returns: the return value of kill
    debug("SIGCONT received. Killing $Child::fork\n");
    my $pgrp = getpgrp($Child::fork);
    # A negative ID makes kill address the whole process group
    kill 'CONT', -$pgrp;
}
|
|
|
|
|
|
|
|
sub kill_child_TSTP {
    # Send SIGTSTP to the process group of the controlled process
    # ($Child::fork), then SIGSTOP to process group $$.
    # NOTE(review): the second kill presumably stops niceload itself;
    # that only holds if niceload leads its own process group - confirm.
    # Returns: the return value of the last kill
    debug("SIGTSTP received. Killing $Child::fork and self\n");
    my $pgrp = getpgrp($Child::fork);
    kill 'TSTP', -$pgrp;
    kill 'STOP', -$$;
}
|
|
|
|
|
|
|
|
sub kill_child_INT {
    # Send SIGINT to the process group of the controlled process
    # ($Child::fork), then exit.
    # Returns: N/A (never returns)
    debug("SIGINT received. Killing $Child::fork Exit\n");
    my $pgrp = getpgrp($Child::fork);
    kill 'INT', -$pgrp;
    exit();
}
|
|
|
|
|
|
|
|
sub suspend_resume {
    # Main control loop: as long as any of @pids exists, let the process
    # groups run for $check_time seconds at a time, and suspend them
    # whenever the load average is above $max_load.
    # Input:
    #   $max_load = load average above which the processes are suspended
    #   $check_time = seconds to run between load checks
    #   $wait_time = seconds to stay suspended (used if $wait_factor is false)
    #   $wait_factor = if true: suspend for (load - $max_load) * $wait_factor
    #   @pids = process group IDs to control
    # Returns: N/A
    my ($max_load,$check_time,$wait_time,$wait_factor,@pids) = @_;
    debug("suspend_resume these @pids\n");
    resume_pids(@pids);
    while (pids_exist(@pids)) {
        # Sample the load once per round. Reading it a second time for the
        # wait computation could give a value below $max_load and thus a
        # negative sleep duration.
        my $load = loadavg();
        if ( defined $load and $load > $max_load ) {
            if($wait_factor) {
                $wait_time = ($load - $max_load) * $wait_factor;
            }
            $::opt_verbose and print STDERR "suspending for $wait_time seconds\n";
            suspend_pids(@pids);
            # NOTE(review): presumably this sleep is cut short by the
            # SIGCHLD raised when the child gets stopped - confirm.
            sleep 1; # for some reason this statement is skipped
            sleep $wait_time;
            resume_pids(@pids);
        }
        $::opt_verbose and print STDERR "running for $check_time second(s)\n";
        sleep($check_time);
    }
}
|
|
|
|
|
|
|
|
sub pids_exist {
    # Count how many of the given process IDs still exist.
    # Input:
    #   @pids = process IDs to look for
    # Returns:
    #   number of @pids that exist (0 = none left)
    my (@pids) = @_;
    my ($exists) = 0;
    # /proc/PID is only usable where a procfs is mounted; our own entry
    # tells whether it is. Elsewhere fall back to signal 0, which checks
    # for existence without delivering a signal. Without the fallback the
    # caller's loop would end at once on systems lacking /proc.
    my $have_procfs = -e "/proc/".$$;
    for my $pid (@pids) {
        if($have_procfs) {
            if(-e "/proc/".$pid) { $exists++ }
        } elsif(kill(0 => $pid) or $!{EPERM}) {
            # EPERM: the process exists but belongs to someone else
            $exists++;
        }
    }
    return $exists;
}
|
|
|
|
|
|
|
|
sub loadavg {
    # Read the current load average.
    # Tries /proc/loadavg first and falls back to the output of 'uptime'.
    # Returns:
    #   the first load average figure found (decimal number as a string)
    #   undef if neither source could be opened
    # Dies if a source could be opened but not parsed.
    my ($loadavg);
    if(open(my $proc_fh, "<", "/proc/loadavg")) {
        # Linux specific (but fast)
        my $upString = <$proc_fh>;
        close $proc_fh;
        if(defined $upString and $upString =~ m/^(\d+\.\d+)/) {
            $loadavg = $1;
        } else {
            die "Cannot parse load average from /proc/loadavg\n";
        }
    } elsif (open(my $uptime_fh, "-|", "uptime")) {
        my $upString = <$uptime_fh>;
        close $uptime_fh;
        # The figure is the first decimal number after the word "average"
        if(defined $upString and $upString =~ m/average.\s*(\d+\.\d+)/) {
            $loadavg = $1;
        } else {
            die "Cannot parse load average from the output of uptime\n";
        }
    }
    return $loadavg;
}
|
|
|
|
|
|
|
|
sub suspend_pids {
    # Suspend the given process groups by sending them SIGSTOP.
    # Input:
    #   @_ = process group IDs
    # Returns: N/A
    my @targets = @_;
    signal_pids("STOP", @targets);
}
|
|
|
|
|
|
|
|
sub resume_pids {
    # Resume the given process groups by sending them SIGCONT.
    # Input:
    #   @_ = process group IDs
    # Returns: N/A
    my @targets = @_;
    signal_pids("CONT", @targets);
}
|
|
|
|
|
|
|
|
sub signal_pids {
    # Send a signal to each of the given process groups.
    # Input:
    #   $signal = signal name, e.g. "STOP" or "CONT"
    #   remaining arguments = process group IDs
    # Returns: N/A
    my $signal = shift;
    my @groups = @_;

    # local $SIG{$signal} = 'IGNORE';
    foreach my $pgrp (@groups) {
        # The negated ID addresses the whole process group
        kill $signal, -$pgrp;
    }
}
|