feedgnuplot/feedGnuplot.pl

580 lines
16 KiB
Perl
Raw Normal View History

#!/usr/bin/perl -w
use strict;
use Getopt::Long;
use Time::HiRes qw( usleep );
use IO::Handle;
use List::MoreUtils qw( first_index );
use Data::Dumper;
use threads;
2010-06-07 11:24:41 +08:00
use threads::shared;
use Thread::Queue;
use Text::ParseWords;
open(GNUPLOT_VERSION, "gnuplot --version |");
2010-10-23 15:28:14 +08:00
my ($gnuplotVersion) = <GNUPLOT_VERSION> =~ /gnuplot\s*(\d*\.\d*)/;
if(!$gnuplotVersion)
{
print STDERR "Couldn't find the version of gnuplot. Does it work? Trying anyway...\n";
$gnuplotVersion = 0;
}
close(GNUPLOT_VERSION);
my $usage = <<OEF;
2010-02-06 06:33:46 +08:00
Usage: $0 [options] file1 file2 ...
any number of data files can be given on the cmdline. They will be processed
in sequence. If no data files are given, data will be read in from standard
input.
--[no]domain If enabled, the first element of each line is the
domain variable. If not, the point index is used
--[no]dataindex If enabled, each data point is preceded by the index
of the data set that point corresponds to. If not
enabled, the order of the point is used.
As an example, if line 3 of the input is "0 9 1 20"
'--nodomain --nodataindex' would parse the 4 numbers as points in 4
different curves at x=3
'--domain --nodataindex' would parse the 4 numbers as points in 3 different
curves at x=0. Here, 0 is the x-variable and 9,1,20 are the data values
'--nodomain --dataindex' would parse the 4 numbers as points in 2 different
curves at x=3. Here 0 and 1 are the data indices and 9 and 20 are the
data values
'--domain --dataindex' would parse the 4 numbers as a single point at
x=0. Here 9 is the data index and 1 is the data value. 20 is an extra
value, so it is ignored. If another value followed 20, we'd get another
point in curve number
--[no]stream Do [not] display the data a point at a time, as it
comes in
2010-01-15 06:34:58 +08:00
--[no]lines Do [not] draw lines to connect consecutive points
2010-01-15 06:34:58 +08:00
--[no]points Do [not] draw points
2010-01-15 06:34:58 +08:00
--xlabel xxx Set x-axis label
2010-01-15 06:34:58 +08:00
--ylabel xxx Set y-axis label
2010-01-15 06:34:58 +08:00
--y2label xxx Set y2-axis label
2010-01-15 06:34:58 +08:00
--title xxx Set the title of the plot
2010-01-15 06:34:58 +08:00
--legend xxx Set the label for a curve plot. Give this option multiple
times for multiple curves
2010-01-15 06:34:58 +08:00
--xlen xxx Set the size of the x-window to plot. Omit this or set it
to 0 to plot ALL the data
2010-01-15 06:34:58 +08:00
--xmin xxx Set the range for the x axis. These are ignored in a
streaming plot
2010-01-15 06:34:58 +08:00
--xmax xxx Set the range for the x axis. These are ignored in a
streaming plot
2010-01-15 06:34:58 +08:00
--ymin xxx Set the range for the y axis.
2010-01-15 06:34:58 +08:00
--ymax xxx Set the range for the y axis.
2010-01-15 06:34:58 +08:00
--y2min xxx Set the range for the y2 axis.
2010-01-15 06:34:58 +08:00
--y2max xxx Set the range for the y2 axis.
2010-01-15 06:34:58 +08:00
--y2 xxx Plot the data with this index on the y2 axis. These are
0-indexed
2010-01-15 06:34:58 +08:00
--curvestyle xxx Additional style per curve. Give this option multiple
times for multiple curves
--extracmds xxx Additional commands. These could contain extra global styles
for instance
2010-05-13 14:00:39 +08:00
--size xxx Gnuplot size option
--square Plot data with aspect ratio 1
--hardcopy xxx If not streaming, output to a file specified here. Format
inferred from filename
2010-01-15 06:34:58 +08:00
--maxcurves xxx The maximum allowed number of curves. This is 100 by default,
but can be reset with this option. This exists purely to
prevent perl from allocating all of the system's memory when
reading bogus data
--monotonic If --domain is given, checks to make sure that the x-
coordinate in the input data is monotonically increasing.
If a given x-variable is in the past, all data currently
cached for this curve is purged. Without --monotonic, all
data is kept. No --monotonic by default
--dump Instead of printing to gnuplot, print to STDOUT. For
debugging.
OEF
# if I'm using a self-plotting data file with a #! line, then $ARGV[0] will contain ALL of the
# options and $ARGV[1] will contain the data file to plot. In this case I need to split $ARGV[0] so
# that GetOptions() can parse it correctly. On the other hand, if I'm plotting normally (not with
# #!) a file with spaces in the filename, I don't want to split the filename. Hopefully this logic
# takes care of both those cases.
if(exists $ARGV[0] && !-r $ARGV[0])
{
unshift @ARGV, shellwords shift @ARGV;
}
# do not stream in the data by default
# point plotting by default.
# no monotonicity checks by default
my %options = ( "stream" => 0,
"domain" => 0,
"dataindex" => 0,
"points" => 0,
"lines" => 0,
"xlen" => 0,
"maxcurves" => 100);
GetOptions(\%options,
"stream!",
"domain!",
"dataindex!",
"lines!",
"points!",
"legend=s@",
"xlabel=s",
"ylabel=s",
"y2label=s",
"title=s",
"xlen=f",
"ymin=f",
"ymax=f",
"xmin=f",
"xmax=f",
"y2min=f",
"y2max=f",
"y2=i@",
"curvestyle=s@",
"extracmds=s@",
2010-05-13 14:00:39 +08:00
"size=s",
"square!",
"hardcopy=s",
"maxcurves=i",
"monotonic!",
"help",
"dump") or die($usage);
# set up plotting style
my $style = "";
if($options{"lines"}) { $style .= "lines";}
if($options{"points"}) { $style .= "points";}
if(!$style) { $style = "points"; }
if( defined $options{"help"} )
{
die($usage);
}
# list containing the plot data. Each element is a reference to a list, representing the data for
# one curve. The first "point" is a hash describing various curve parameters. The rest are all
# references to lists of (x,y) tuples
my @curves = ();
# now start the data acquisition and plotting threads
my $dataQueue;
my $xwindow;
2010-06-07 11:24:41 +08:00
my $streamingFinished : shared = undef;
if($options{"stream"})
{
if( defined $options{"hardcopy"})
{
$options{"stream"} = undef;
}
$dataQueue = Thread::Queue->new();
my $addThr = threads->create(\&mainThread);
my $plotThr = threads->create(\&plotThread);
while(<>)
{
chomp;
# place every line of input to the queue, so that the plotting thread can process it. if we are
# using an implicit domain (x = line number), then we send it on the data queue also, since
# $. is not meaningful in the plotting thread
if(!$options{domain})
{
$_ .= " $.";
}
$dataQueue->enqueue($_);
}
2010-06-07 11:24:41 +08:00
$streamingFinished = 1;
$plotThr->join();
2010-06-07 11:24:41 +08:00
$addThr->join();
}
else
{
mainThread();
}
sub plotThread
{
2010-06-07 11:24:41 +08:00
while(! $streamingFinished)
{
sleep(1);
$dataQueue->enqueue("Plot now");
}
2010-06-07 11:24:41 +08:00
$dataQueue->enqueue(undef);
}
sub mainThread {
local *PIPE;
my $dopersist = "";
if($gnuplotVersion >= 4.3)
{
$dopersist = "--persist" if(!$options{"stream"});
}
if(exists $options{"dump"})
{
*PIPE = *STDOUT;
}
else
{
open PIPE, "|gnuplot $dopersist" || die "Can't initialize gnuplot\n";
}
autoflush PIPE 1;
my $outputfile;
my $outputfileType;
if( defined $options{"hardcopy"})
{
$outputfile = $options{"hardcopy"};
($outputfileType) = $outputfile =~ /\.(ps|pdf|png)$/;
if(!$outputfileType) { die("Only .ps, .pdf and .png supported\n"); }
my %terminalOpts =
( ps => 'postscript solid color landscape 10',
pdf => 'pdfcairo solid color font ",10" size 11in,8.5in',
2010-05-12 17:30:51 +08:00
png => 'png size 1280,1024' );
print PIPE "set terminal $terminalOpts{$outputfileType}\n";
print PIPE "set output \"$outputfile\"\n";
}
else
{
print PIPE "set terminal x11\n";
}
# If a bound isn't given I want to set it to the empty string, so I can communicate it simply to
# gnuplot
$options{xmin} = "" unless defined $options{xmin};
$options{xmax} = "" unless defined $options{xmax};
$options{ymin} = "" unless defined $options{ymin};
$options{ymax} = "" unless defined $options{ymax};
$options{y2min} = "" unless defined $options{y2min};
$options{y2max} = "" unless defined $options{y2max};
print PIPE "set xtics\n";
if($options{"y2"})
{
print PIPE "set ytics nomirror\n";
print PIPE "set y2tics\n";
# if any of the ranges are given, set the range
print PIPE "set y2range [". $options{"y2min"} . ":" . $options{"y2max"} ."]\n" if length( $options{"y2min"} . $options{"y2max"} );
}
# if any of the ranges are given, set the range
print PIPE "set xrange [". $options{"xmin"} . ":" . $options{"xmax"} ."]\n" if length( $options{"xmin"} . $options{"xmax"} );
print PIPE "set yrange [". $options{"ymin"} . ":" . $options{"ymax"} ."]\n" if length( $options{"ymin"} . $options{"ymax"} );
print PIPE "set style data $style\n";
print PIPE "set grid\n";
print(PIPE "set xlabel \"" . $options{"xlabel" } . "\"\n") if defined $options{"xlabel"};
print(PIPE "set ylabel \"" . $options{"ylabel" } . "\"\n") if defined $options{"ylabel"};
print(PIPE "set y2label \"" . $options{"y2label"} . "\"\n") if defined $options{"y2label"};
print(PIPE "set title \"" . $options{"title" } . "\"\n") if defined $options{"title"};
if($options{square})
{
$options{size} = '' unless defined $options{size};
$options{size} .= " ratio -1";
}
print(PIPE "set size $options{size}\n") if defined $options{size};
2010-05-13 14:00:39 +08:00
# For the specified values, set the legend entries to 'title "blah blah"'
if($options{"legend"})
{
foreach (@{$options{"legend"}}) { newCurve($_, "") }
}
# For the values requested to be printed on the y2 axis, set that
foreach my $y2idx (@{$options{"y2"}})
{
addCurveOption($y2idx, 'axes x1y2 linewidth 3');
}
# add the extra curve options
if($options{"curvestyle"})
{
my $idx = 0;
foreach (@{$options{"curvestyle"}})
{
addCurveOption($idx, $_);
$idx++;
}
}
# add the extra global options
if($options{"extracmds"})
{
foreach (@{$options{"extracmds"}})
{
print(PIPE "$_\n");
}
}
# regexp for a possibly floating point, possibly scientific notation number, fully captured
2010-10-23 15:28:14 +08:00
my $numRE = qr/([-]?[\d\.]+(?:e[-+]?\d+)?)/io;
my $xlast;
my $haveNewData;
# I should be using the // operator, but I'd like to be compatible with perl 5.8
while( $_ = (defined $dataQueue ? $dataQueue->dequeue() : <>))
{
next if /^#/o;
if($_ ne "Plot now")
{
# parse the incoming data lines. The format is
# x idx0 dat0 idx1 dat1 ....
# where idxX is the index of the curve that datX corresponds to
#
# $options{domain} indicates whether the initial 'x' is given or not (if not, the line
# number is used)
# $options{dataindex} indicates whether idxX is given or not (if not, the point order in the
# line is used)
if($options{domain})
{
/$numRE/go or next;
$xlast = $1;
}
else
{
# since $. is not meaningful in the plotting thread if we're using the data queue, we pass
# $. on the data queue in that case
if(defined $dataQueue)
{
s/ ([\d]+)$//o;
$xlast = $1;
}
else
{
$xlast = $.;
}
}
if($options{dataindex})
{
2010-10-23 15:28:14 +08:00
while(/(\d+)\s+$numRE/go)
{
my $idx = $1;
my $point = $2;
2010-10-19 04:44:33 +08:00
$haveNewData = 1;
pushPoint($idx, [$xlast, $point]);
}
}
else
{
my $idx = 0;
foreach my $point (/$numRE/go)
{
2010-10-19 04:44:33 +08:00
$haveNewData = 1;
pushPoint($idx, [$xlast, $point]);
$idx++;
}
}
}
elsif($options{"stream"})
{
# only redraw a streaming plot if there's new data to plot
next unless $haveNewData;
$haveNewData = undef;
if( $options{"xlen"} )
{
2010-09-29 14:05:17 +08:00
pruneOldData($xlast - $options{"xlen"});
plotStoredData($xlast - $options{"xlen"}, $xlast);
}
else
{
plotStoredData();
}
}
}
2010-01-11 15:45:41 +08:00
# finished reading in all of the data
if($options{"stream"})
{
print PIPE "exit;\n";
close PIPE;
}
else
{
plotStoredData();
if( defined $options{"hardcopy"})
{
print PIPE "set output\n";
# sleep until the plot file exists, and it is closed. Sometimes the output is
# still being written at this point
usleep(100_000) until -e $outputfile;
usleep(100_000) until(system("fuser -s \"$outputfile\""));
print "Wrote output to $outputfile\n";
return;
}
# we persist gnuplot, so we shouldn't need this sleep. However, once
# gnuplot exist, but the persistent window sticks around, you can no
# longer interactively zoom the plot. So we still sleep
sleep(100000);
}
}
2010-09-29 14:05:17 +08:00
sub pruneOldData
{
my ($oldestx) = @_;
foreach my $xy (@curves)
{
if( @$xy > 1 )
{
my $firstInWindow = first_index {$_->[0] >= $oldestx} @{$xy}[1..$#$xy];
splice( @$xy, 1, $firstInWindow ) unless $firstInWindow == -1;
}
}
}
sub plotStoredData
{
my ($xmin, $xmax) = @_;
print PIPE "set xrange [$xmin:$xmax]\n" if defined $xmin;
# get the options for those curves that have any data
my @nonemptyCurves = grep {@$_ > 1} @curves;
my @extraopts = map {$_->[0]{"options"}} @nonemptyCurves;
print PIPE 'plot ' . join(', ' , map({ '"-"' . $_} @extraopts) ) . "\n";
foreach my $buf (@nonemptyCurves)
{
# send each point to gnuplot. Ignore the first "point" since it's the
# curve options
2010-09-24 14:02:35 +08:00
for my $elem (@{$buf}[1..$#$buf])
{
print PIPE "@$elem\n";
}
print PIPE "e\n";
}
}
sub newCurve
{
2010-07-23 10:52:28 +08:00
# I optionally pass in the title of this plot and any additional options separately. The title
# COULD be a part of $opts, but this raises an issue in the no-title case. When no title is
# specified, gnuplot will still add a legend entry with an unhelpful '-' label. I can still grep
# $opts to see if a title is given, but that's a bit ugly in its own way...
my ($title, $opts, $newpoint, $idx) = @_;
if(scalar @curves >= $options{maxcurves})
{
say STDERR "Tried to exceed the --maxcurves setting.";
say STDERR "Invoke with a higher --maxcurves limit if you really want to do this.";
return;
}
# if this curve index doesn't exist, create curve up-to this index
if(defined $idx)
{
while(!exists $curves[$idx])
{
pushNewEmptyCurve();
}
}
else
{
# if we're not given an index, create a new one at the end, and fill it in
pushNewEmptyCurve();
$idx = $#curves;
}
if(defined $title) { $opts = "title \"$title\" $opts" }
else { $opts = "notitle $opts" }
if( defined $newpoint )
{
$curves[$idx] = [{"options" => " $opts"}, $newpoint];
}
else
{
$curves[$idx] = [{"options" => " $opts"}];
}
}
sub addCurveOption
{
my ($idx, $str) = @_;
if(exists $curves[$idx])
{
$curves[$idx][0]{"options"} .= " $str";
}
else
{
newCurve('', $str, undef, $idx);
}
}
sub pushNewEmptyCurve
{
my $opts = "notitle ";
push @curves, [{"options" => " $opts"}];
}
sub pushPoint
{
my ($idx, $xy) = @_;
if ( !exists $curves[$idx] )
{
newCurve("", "", undef, $idx);
}
elsif($options{monotonic})
{
my $curve = $curves[$idx];
if( @$curve > 1 && $xy->[0] < $curve->[$#{$curve}][0] )
{
# the x-coordinate of the new point is in the past, so I wipe out all the data for this curve
# and start anew
splice( @$curve, 1, @$curve-1 );
}
}
push @{$curves[$idx]}, $xy;
}