#!/usr/bin/perl -CA
use 5.014;
use warnings;
use utf8;
use List::Util qw( min max sum );
use open qw( :std :utf8 );
use re '/msx';  # every pattern below is implicitly compiled with /m /s /x

# barcat: read lines from arguments, files or STDIN, extract one number
# per line, and print each line followed by a bar sized relative to the
# other values.  Options are collected in %opt; see the POD after __END__.

our $VERSION = '1.09';

my %opt;
if (@ARGV) {
    # Getopt::Long is only loaded when there is something to parse.
    require Getopt::Long;
    Getopt::Long->import('2.33', qw( :config gnu_getopt ));
    GetOptions(\%opt,
        'ascii|a!',
        'color|C!',
        'M' => sub { $opt{color} = 0 },
        'field|f=s' => sub {
            # Compile the value position into $opt{anchor}:
            # a plain number N skips N whitespace-separated words,
            # +N skips N numbers and stops just before the next digit,
            # anything else is taken as a regular expression verbatim.
            eval {
                local $_ = $_[1];
                s/\A[0-9]+\z/(?:\\S*\\h+){$_}\\K/;
                s{\A[+]([0-9]*)\z}{
                    (!!$1 && '(?:\d+\D+\b){'.$1.'}\K') . '\s* (?=\d)'
                }e;
                $opt{anchor} = qr/$_/;
            } or die $@ =~ s/(?:\ at\ \N+)?\Z/ for option $_[0]/r;
            # (the substitution swaps perl's " at FILE line N" suffix
            # for the name of the offending option)
        },
        'human-readable|H!',
        'sexagesimal!',
        'reformat!',
        'interval|t:i',
        'trim|length|l=s' => sub {
            my ($optname, $optval) = @_;
            # a trailing % marks the size as relative to the width
            $optval =~ s/%$// and $opt{trimpct}++;
            $optval =~ m/\A-?[0-9]+\z/ or die(
                "Value \"$optval\" invalid for option $optname",
                " (number or percentage expected)\n"
            );
            $opt{trim} = $optval;
        },
        'value-length=i',
        'hidemin=i',
        'hidemax=i',
        'minval=f',
        'maxval=f',
        'limit|L:s' => sub {
            my ($optname, $optval) = @_;
            $optval ||= 0;
            $optval =~ /\A-[0-9]+\z/ and $optval .= '-';  # tail shorthand
            # [START-]END range split into hidemin and hidemax
            ($opt{hidemin}, $opt{hidemax}) = $optval =~ m/\A
                (?: (-? [0-9]+)? - )?
                ([0-9]+)?
            \z/ or die(
                "Value \"$optval\" invalid for option limit",
                " (range expected)\n"
            );
        },
        'log|e!',
        'header!',
        'markers|m=s',
        'graph-format=s' => sub {
            # only the first character is used as bar glyph
            $opt{'graph-format'} = substr $_[1], 0, 1;
        },
        'spark|_!',
        'indicators:s',
        'palette=s' => sub {
            # either a preset name, or a list of SGR color codes
            # separated by anything other than digits and semicolons
            $opt{palette} = {
                ''      => [],
                fire    => [qw( 90 31 91 33 93 97 96 )],
                fire256 => [map {"38;5;$_"} qw(
                    235 52 88 124 160 196
                    202 208 214 220 226 227 228 229 230 231 159
                )],
                whites  => [qw( 1;30 0;37 1;37 )],
                greys   => [map {"38;5;$_"} 0, 232..255, 15],
                random  => [map {"38;5;$_"} List::Util::shuffle(17..231)],
                rainbow => [map {"38;5;$_"}
                    196,                            # r
                    (map { 196 + $_*6   } 0..4),    # +g
                    (map { 226 - $_*6*6 } 0..4),    # -r
                    (map {  46 + $_     } 0..4),    # +b
                    (map {  51 - $_*6   } 0..4),    # -g
                    (map {  21 + $_*6*6 } 0..4),    # +r
                    (map { 201 - $_     } 0..4),    # -b
                    196,
                ],
            }->{$_[1]} // do {
                my @vals = split /[^0-9;]/, $_[1]
                    or die "Empty palette resulting from \"$_[1]\"\n";
                \@vals;
            };
        },
        'stat|s!',
        'report=s',
        'signal-stat=s',
        'unmodified|u!',
        'width|w=i',
        'version|V' => sub {
            my $mascot = $opt{ascii} ? '=^,^=' : 'ฅ^•ﻌ•^ฅ';
            say "barcat $mascot version $VERSION";
            exit;
        },
        'usage|h' => sub {
            /^=/ ? last : print for readline *DATA;  # text between __END__ and pod
            exit;
        },
        'help|?' => sub {
            require Pod::Usage;
            Pod::Usage::pod2usage(
                -exitval => 0, -perldocopt => '-oman', -verbose => 2,
            );
        },
    ) or exit 64;  # EX_USAGE
}

# Defaults for everything not given explicitly.
$opt{width} ||= $ENV{COLUMNS} || qx(tput cols) || 80 unless $opt{spark};
$opt{color} //= $ENV{NO_COLOR} ? 0 : -t *STDOUT;  # enable on tty
$opt{'graph-format'} //= '-';
$opt{trim} *= $opt{width} / 100 if $opt{trimpct};
$opt{units} = [split //, ' kMGTPEZYRQqryzafpn'.($opt{ascii} ? 'u' : 'μ').'m']
    if $opt{'human-readable'};
$opt{anchor} //= qr/\A/;
$opt{'value-length'} = 4 if $opt{units};
$opt{'value-length'} = 1 if $opt{unmodified};
$opt{'signal-stat'} //= exists $SIG{INFO} ? 'INFO' : 'QUIT';
$opt{markers} //= '=avg >31.73v <68.27v +50v |0';
$opt{report} //= join(', ',
    '${min; color(31)} min',
    '${avg; $opt{reformat} or $_ = sprintf "%0.2f", $_; color(36)} avg',
    '${max; color(32)} max',
);
$opt{palette} //= $opt{color} && [31, 90, 32];
$opt{indicators} = [split //, $opt{indicators} ||
    ($opt{ascii} ? ' .oO' : $opt{spark} ? ' ▁▂▃▄▅▆▇█' : ' ▏▎▍▌▋▊▉█')
] if defined $opt{indicators} or $opt{spark};
$opt{hidemin} = ($opt{hidemin} || 1) - 1;  # first line number to 0-based index
# Arguments starting with a digit or dash are taken as the values
# themselves instead of file names; interval updates are then disabled.
$opt{input} = (@ARGV && $ARGV[0] =~ m/\A[-0-9]/) ? \@ARGV : undef
    and undef $opt{interval};

$opt{'calc-format'} = sub { sprintf '%*.*f', 0, 2, $_[0] };
# Value formatter: H:MM:SS for --sexagesimal, unit suffixes for
# --human-readable (both imply reformatting), otherwise plain %.8g.
$opt{'value-format'} = $opt{sexagesimal} ? sub {
    my $s = abs($_[0]) + .5;
    sprintf('%s%d:%02d:%02d', $_[0] < 0 && '-', $s/3600, $s/60%60, $s%60);
} : $opt{units} && sub {
    my $unit = (
        log(abs $_[0] || 1) / log(10)
        - 3 * (abs($_[0]) < .9995)  # shift to smaller unit if below 1
        + 1e-15  # float imprecision
    );
    my $decimal = ($unit % 3) == ($unit < 0);
    $unit -= log($decimal ? .995 : .9995) / log(10);  # rounded
    $decimal = ($unit % 3) == ($unit < 0);
    $decimal &&= $_[0] !~ /^-?0*[0-9]{1,3}$/;  # integer 0..999
    sprintf('%*.*f%1s',
        3 + ($_[0] < 0),  # digits plus optional negative sign
        $decimal,  # tenths
        $_[0] / 1000 ** int($unit/3),  # number
        $#{$opt{units}} * 1.5 < abs $unit ? sprintf('e%d', $unit) :
            $opt{units}->[$unit/3]  # suffix
    );
} and $opt{reformat}++;
$opt{'value-format'} ||= sub { sprintf '%.8g', $_[0] };

# @lines:  input lines with the value replaced by a "\n" placeholder
# @values: extracted value per line (empty if the line has none)
# @order:  all non-empty values, kept in descending order
my (@lines, @values, @order);

$SIG{$_} = \&show_stat for $opt{'signal-stat'} || ();
$SIG{ALRM} = sub {
    show_lines();
    alarm $opt{interval} if defined $opt{interval} and $opt{interval} > 0;
};
$SIG{INT} = \&show_exit;

if (defined $opt{interval}) {
    $opt{interval} ||= 1;
    alarm $opt{interval} if $opt{interval} > 0;

    # Optional module keeping @order sorted on insertion; without it
    # show_lines() has to sort again on every call.
    eval {
        require Tie::Array::Sorted;
        tie @order, 'Tie::Array::Sorted', sub { $_[1] <=> $_[0] };
    } or warn $@, "Expect slowdown with large datasets!\n";
}

my $float = qr<[0-9]* [.]? [0-9]+ (?: e[+-]?[0-9]+ )?>;  # positive numberish
my $valmatch = qr< $opt{anchor} ( \h* -? $float |) >x;
while (defined ($_ = $opt{input} ? shift @{ $opt{input} } : readline)) {
    s/\r?\n\z//;
    s/\A\h*// unless $opt{unmodified};
    # cut the value out of the line, leaving a newline as placeholder
    my $valnum = s/$valmatch/\n/ && $1;
    push @values, $valnum;
    push @order, $valnum if length $valnum;
    if (defined $opt{trim} and defined $valnum) {
        my $trimpos = abs $opt{trim};
        $trimpos -= length $valnum if $opt{unmodified};
        if ($trimpos <= 1) {
            $_ = substr $_, 0, 2;
        }
        elsif (length > $trimpos) {
            # cut and replace (intentional lvalue for speed, contrary to PBP)
            substr($_, $trimpos - 1) = $opt{ascii} ? '>' : '…';
        }
    }
    push @lines, $_;
    # a negative interval counts input lines instead of seconds
    show_lines() if defined $opt{interval} and $opt{interval} < 0
        and $. % $opt{interval} == 0;
}

$SIG{INT} = 'DEFAULT';

# color(CODE)
# Returns '' if color output is disabled or CODE is undefined.
# Otherwise, called for its value it returns the escape sequence
# "\e[CODEm"; called in void context it wraps a defined $_ in that
# sequence followed by a reset, so it can be applied as
# "color(36) for $string".
sub color {
    $opt{color} and defined $_[0] or return '';
    return "\e[$_[0]m" if defined wantarray;
    $_ = color(@_) . $_ . color(0) if defined;
}

# show_lines()
# Prints all lines collected since the previous call (within the range
# selected by --limit) with their bars, scaled to the values known so
# far.  The position is kept in a state variable, so repeated calls
# continue where the last one stopped.  Returns the index of the next
# line to print, or nothing if there are no new lines.
sub show_lines {
    state $nr = $opt{hidemin} < 0
        ? max(0, @lines + $opt{hidemin} + 1)
        : $opt{hidemin};
    @lines > $nr or return;

    my $limit = $#lines;
    if (defined $opt{hidemax}) {
        if ($opt{hidemin} and $opt{hidemin} < 0) {
            $limit -= $opt{hidemax} - 1;
        }
        elsif ($opt{hidemax} <= $limit) {
            $limit = $opt{hidemax} - 1;
        }
    }

    @order = sort { $b <=> $a } @order unless tied @order;
    my $maxval = $opt{maxval} // (
        $opt{hidemax} ? max grep { length } @values[$nr .. $limit] :
        $order[0]
    ) // 0;
    my $minval = $opt{minval} // min $order[-1] // (), 0;
    my $range = $maxval - $minval;
    $range &&= log $range if $opt{log};
    my $lenval = $opt{'value-length'} // max map { length } @order;
    my $len = defined $opt{trim} && $opt{trim} <= 0 ? -$opt{trim} + 1 :
        max map { length $values[$_] && length $lines[$_] }
            0 .. min $#lines, $opt{hidemax} || ();  # left padding
    my $size = defined $opt{width} && $range &&
        ($opt{width} - $lenval - $len - !!$opt{indicators});  # bar multiplication

    # @barmark maps bar columns to the marker glyph to show there.
    my @barmark;
    if ($opt{markers} and $size > 0) {
        for my $markspec (split /\h/, $opt{markers}) {
            # first character is the glyph, the remainder its position
            my ($char, $func) = split //, $markspec, 2;
            my @pos = eval {
                if ($func eq 'avg') {
                    return sum(@order) / @order;
                }
                elsif ($func =~ /\A([0-9.]+)v\z/) {
                    $1 <= 100 or die(
                        "Invalid marker $char: percentile $1 out of bounds\n"
                    );
                    # average of the two nearest ranks if in between
                    my $index = $#order * $1 / 100;
                    return ($order[$index] + $order[$index + .5]) / 2;
                }
                elsif ($func =~ /\A-?[0-9.]+\z/) {
                    return $func;
                }
                elsif ($func =~ /\A\/($float)\z/) {
                    my @range = my $multiple = my $next = $1;
                    while ($next < $maxval) {
                        $multiple *= 10 if $opt{log};
                        push @range, $next += $multiple;
                    }
                    return @range;
                }
                else {
                    die "Unknown marker $char: $func\n";
                }
            };
            @pos or do {
                warn $@ if $@;
                next;
            };
            for my $pos (@pos) {
                $pos -= $minval;
                $pos &&= log $pos if $opt{log};
                $pos >= 0 or next;
                color(36) for $barmark[$pos / $range * $size] = $char;
            }
        }

        # If the maximum grew since the previous call, print a ruler
        # showing how far the scale was extended.
        # NOTE(review): these positions are not log-scaled under --log.
        state $lastmax = $maxval;
        if ($maxval > $lastmax) {
            print ' ' x ($lenval + $len);
            print color(90);
            printf '%-*s',
                ($lastmax - $minval) * $size / $range + .5,
                '-' x (($values[$nr - 1] - $minval) * $size / $range);
            print color(92);
            # growth is the distance between old and new maximum;
            # $range would include the offset of a non-zero minimum
            say '+' x (($maxval - $lastmax) * $size / $range + .5);
            print color(0);
            $lastmax = $maxval;
        }
    }

    say(
        color(31), sprintf('%*s', $lenval, $minval),
        color(90), '-', color(36), '+',
        color(32), sprintf('%*s', $size - 3, $maxval),
        color(90), '-', color(36), '+',
        color(0),
    ) if $opt{header};

    while ($nr <= $limit) {
        my $val = $values[$nr];
        my $rel;
        if (length $val) {
            $rel = $val - $minval;
            $rel &&= log $rel if $opt{log};
            $rel = min(1, $rel / $range) if $range;  # 0..1
        }
        my $color = !length $val || !$opt{palette} ? undef :
            $val == $order[0]  ? $opt{palette}->[-1] :  # max
            $val == $order[-1] ? $opt{palette}->[0]  :  # min
            $opt{palette}->[ $rel * ($#{$opt{palette}} - 1) + 1 ];
        my $indicator = $opt{indicators} && $opt{indicators}->[
            !length($val) || !$#{$opt{indicators}} ? 0 :  # blank
            $#{$opt{indicators}} < 2 ? 1 :
            $val >= $order[0] ? -1 :
            $rel * ($#{$opt{indicators}} - 1e-14) + 1
        ];

        if ($opt{spark}) {
            # only the indicator glyph, wrapped at the given width
            say '' if $opt{width} and $nr and $nr % $opt{width} == 0;
            print color($color), $_ for $indicator;
            next;
        }
        print $indicator if defined $indicator;

        if (length $val) {
            $val = sprintf("%*s", $lenval,
                $opt{reformat} ? $opt{'value-format'}->($val) : $val
            );
            color($color) for $val;
        }
        # put the (formatted) value back at its placeholder
        my $line = $lines[$nr] =~ s/\n/$val/r;
        if (not length $val) {
            say $line;
            next;
        }
        printf '%-*s', $len + length($val), $line;
        if ($rel and $size) {
            print $barmark[$_] // $opt{'graph-format'}
                for 1 .. $rel * $size + .5;
        }
        say '';
    }
    continue {
        $nr++;
    }
    say $opt{palette} ? color(0) : '' if $opt{spark};

    return $nr;
}

# show_stat()
# Prints a one-line summary: the sum over the displayed range if output
# was limited, then the total, value count and the --report format.
# Also installed as handler for the --signal-stat signal.  Returns 1.
sub show_stat {
    if ($opt{hidemin} or $opt{hidemax}) {
        my $linemin = $opt{hidemin};
        my $linemax = ($opt{hidemax} || @lines) - 1;
        if ($linemin < 0) {
            $linemin += @lines;
            $linemax = @lines - $linemax;
        }
        print varfmt('${sum+} of ', {
            lines => $linemax - $linemin + 1,
            sum => sum(0, grep {length} @values[$linemin .. $linemax]),
        });
    }
    if (@order) {
        my $total = sum @order;
        my $fmt = '${sum+;color(1)} total in ${count#} values';
        $fmt .= ' over ${lines#} lines' if @order != @lines;
        $fmt .= " ($_)" for $opt{report} || ();
        print varfmt($fmt, {
            sum => $total,
            count => int @order,
            lines => int @lines,
            min => $order[-1],
            max => $order[0],
            avg => $total / @order,
        });
    }
    say '';
    return 1;
}

# varfmt(FORMAT, \%VARS)
# Returns FORMAT with each ${NAME} placeholder replaced by $VARS{NAME}.
# A "+" in NAME forces the value through the value formatter, a "#"
# prevents it; otherwise --reformat decides.  Text after a semicolon is
# evaluated as perl code with the value in $_, and may alter it.
# Unknown names and failing code are reported by warnings.
sub varfmt {
    my ($fmt, $vars) = @_;
    $fmt =~ s[\$\{ \h*+ ((?: [^{}]++ | \{(?1)\} )+) \}]{
        my ($name, $cmd) = split /\s*;/, $1, 2;
        my $format = $name =~ s/\+// || $name !~ s/\#// && $opt{reformat};
        local $_ = $vars->{$name};
        if (defined) {
            $_ = $opt{'value-format'}->($_) if $format;
            if ($cmd) {
                # NOTE: string eval of code taken from the format,
                # which the user can set by the --report option
                eval $cmd;
                warn "Error in \$$name report: $@" if $@;
            }
            $_;
        }
        else {
            warn "Unknown variable \$$name in report\n";
            "\$$name";
        }
    }eg;
    return $fmt;
}

# show_exit([SIGNAL])
# Prints the remaining lines, plus statistics if --stat was given, and
# terminates.  Exits with status 130 when given arguments (as happens
# when invoked as interrupt handler), 0 otherwise.
sub show_exit {
    show_lines();
    show_stat() if $opt{stat};
    exit 130 if @_;  # 0x80+signo
    exit;
}

show_exit();

__END__
Usage:                                               /\_/\
  barcat [OPTIONS] [FILES|NUMBERS]                  (=•.•=)
                                                    (u   u)
Options:
  -a, --[no-]ascii         Restrict user interface to ASCII characters
  -C, --[no-]color         Force colored output of values and bar markers
  -f, --field=([+]N|REGEXP)
                           Compare values after a given number of whitespace
                           separators
      --header             Prepend a chart axis with minimum and maximum
                           values labeled
  -H, --human-readable     Format values using SI unit prefixes
      --sexagesimal        Convert seconds to HH:MM:SS time format
  -t, --interval[=(N|-LINES)]
                           Output partial progress every given number of
                           seconds or input lines
  -l, --length=[-]SIZE[%]  Trim line contents (between number and bars)
  -L, --limit[=(N|-LAST|START-[END])]
                           Stop output after a number of lines
  -e, --log                Logarithmic (exponential) scale instead of linear
      --graph-format=CHAR  Glyph to repeat for the graph line
  -m, --markers=FORMAT     Statistical positions to indicate on bars
      --min=N, --max=N     Bars extend from 0 or the minimum value if lower
      --palette=(PRESET|COLORS)
                           Override colors of parsed numbers
  -_, --spark              Replace lines by sparklines
      --indicators[=CHARS] Prefix a
                           unicode character corresponding to each value
  -s, --stat               Total statistics after all data
  -u, --unmodified         Do not reformat values, keeping leading whitespace
      --value-length=SIZE  Reserved space for numbers
  -w, --width=COLUMNS      Override the maximum number of columns to use
  -h, --usage              Overview of available options
      --help               Full pod documentation
  -V, --version            Version information

=encoding utf8

=head1 NAME

barcat - concatenate texts with graph to visualize values

=head1 SYNOPSIS

B<barcat> [<options>] [<file>... | <numbers>]

=head1 DESCRIPTION

Visualizes relative sizes of values read from input
(parameters, file(s) or STDIN).
Contents are concatenated similar to I<cat>,
but numbers are reformatted and a bar graph is appended to each line.

Don't worry, barcat does not drink and divide.
It can has various options for input and output (re)formatting,
but remains limited to one-dimensional charts.
For more complex graphing needs
you'll need a larger animal like I<gnuplot>.

=head1 OPTIONS

=over

=item -a, --[no-]ascii

Restrict user interface to ASCII characters,
replacing default UTF-8 by their closest approximation.
Input is always interpreted as UTF-8 and shown as is.

=item -C, --[no-]color

Force colored output of values and bar markers.
Defaults on if output is a tty,
disabled otherwise such as when piped or redirected.
Can also be disabled by setting I<-M>
or the I<NO_COLOR> environment variable.

=item -f, --field=([+]<number> | <regexp>)

Compare values after a given number of whitespace separators,
or matching a regular expression.

Unspecified or I<-f0> means values are at the start of each line.
With I<-f1> the second word is taken instead.
A string can indicate the starting position of a value
(such as I<-f:> if preceded by colons),
or capture the numbers itself,
for example I<-f'(\d+)'> for the first digits anywhere.
A shorthand for this is I<+0>, or I<+N> to find the Nth number.

=item --header

Prepend a chart axis with minimum and maximum values labeled.

=item -H, --human-readable

Format values using SI unit prefixes,
turning long numbers like I<12356789> into I<12.4M>.
Also changes an exponent I<1.602176634e-19> to I<160.2z>.
Short integers are aligned but kept without decimal point.

=item --sexagesimal

Convert seconds to HH:MM:SS time format.

=item -t, --interval[=(<seconds> | -<lines>)]

Output partial progress every given number of seconds or input lines.
An update can also be forced by sending a I<SIGALRM> alarm signal.

=item -l, --length=[-]<size>[%]

Trim line contents (between number and bars)
to a maximum number of characters.
The exceeding part is replaced by an abbreviation sign,
unless C<--length=0>.

Prepend a dash (i.e. make negative) to enforce padding
regardless of encountered contents.

=item -L, --limit[=(<count> | -<last> | <start>-[<end>])]

Stop output after a number of lines.
A single value indicates the last line number (like C<head>),
or first line counting from the bottom if negative (like C<tail>).
A specific range can be given by two values.

All input is still counted and analyzed for statistics,
but disregarded for padding and bar size.

=item -e, --log

Logarithmic (I<e>xponential) scale instead of linear
to compare orders of magnitude.

=item --graph-format=<character>

Glyph to repeat for the graph line.
Defaults to a dash C<->.

=item -m, --markers=<format>

Statistical positions to indicate on bars.
A single indicator glyph precedes each position:

=over 2

=item <number>

Exact value to match on the axis.
A vertical bar at the zero crossing is displayed by I<|0>
for negative values.
For example I<π3.14> would locate pi.

=item I</><interval>

Repeated at every multiple of a number.
For example I<:/1> for a grid at every integer.

=item <percentage>I<v>

Ranked value at the given percentile.
The default shows I<+> at I<50v> for the mean or median;
the middle value or average between middle values.
One standard deviation right of the mean is at about I<68.3v>.
The default includes I<< >31.73v <68.27v >>
to encompass all I<normal> results, or 68% of all entries, by B<< <--> >>.

=item I<avg>

Matches the average;
the sum of all values divided by the number of counted lines.
Indicated by default as I<=>.

=back

=item --min=<minimum>, --max=<maximum>

Bars extend from 0 or the minimum value if lower,
to the largest value encountered.
These options can be set to customize this range.

=item --palette=(<preset> | <color>...)

Override colors of parsed numbers.
Can be any CSI escape, such as I<90> for default dark grey,
or alternatively I<1;30> for bright black.

In case of additional colors,
the last is used for values equal to the maximum, the first for minima.
If unspecified, these are green and red respectively (I<31 90 32>).
Multiple intermediate colors will be distributed
relative to the size of values.

Predefined color schemes are named I<whites> and I<fire>,
or I<greys> and I<fire256> for 256-color variants.

=item -_, --spark

Replace lines by I<sparklines>,
single characters (configured by C<--indicators>)
corresponding to input values.

=item --indicators[=<characters>]

Prefix a unicode character corresponding to each value.
The first specified character will be used for non-values,
the remaining sequence will be distributed over the range of values.
Unspecified, block fill glyphs U+2581-2588 will be used.

=item -s, --stat

Total statistics after all data.

=item -u, --unmodified

Do not reformat values, keeping leading whitespace.
Keep original value alignment, which may be significant in some programs.

=item --value-length=<size>

Reserved space for numbers.

=item -w, --width=<columns>

Override the maximum number of columns to use.
Appended graphics will extend to fill up the entire screen,
otherwise determined by the environment variable I<COLUMNS>
or by running the C<tput> command.

=item -h, --usage

Overview of available options.

=item --help

Full pod documentation
as rendered by perldoc.

=item -V, --version

Version information.

=back

=head1 EXAMPLES

Draw a sine wave:

    seq 30 | awk '{print sin($1/10)}' | barcat

Compare file sizes (with human-readable numbers):

    du -d0 -b * | barcat -H

Same from formatted results, selecting the first numeric value:

    tree -s --noreport | barcat -H -f+

Compare media metadata, like image size or play time:

    exiftool -T -p '$megapixels ($imagesize) $filename' * | barcat

    exiftool -T -p '$duration# $avgbitrate# $filename' * |
    barcat --sexagesimal

    find -type f -print0 | xargs -0 -L1 \
    ffprobe -show_format -of json -v error |
    jq -r '.format|.duration+" "+.bit_rate+" "+.filename' |
    barcat --sex

Memory usage of user processes with long names truncated:

    ps xo rss,pid,cmd | barcat -l40

Monitor network latency from prefixed results:

    ping google.com | barcat -f'time=\K' -t

Commonly used after counting, for example users on the current server:

    users | tr ' ' '\n' | sort | uniq -c | barcat

Letter frequencies in text files:

    cat /usr/share/games/fortunes/*.u8 |
    perl -CS -nE 'say for grep length, split /\PL*/, uc' |
    sort | uniq -c | barcat

Number of HTTP requests per day:

    cat httpd/access.log | cut -d\  -f4 | cut -d: -f1 | uniq -c | barcat

Any kind of database query results, preserving returned alignment:

    echo 'SELECT sin(value * .1) FROM generate_series(0, 30) value' |
    psql -t | barcat -u

In PostgreSQL from within the client; a fancy C<\dt+> perhaps:

    > SELECT schemaname, relname, pg_total_relation_size(relid)
      FROM pg_statio_user_tables ORDER BY idx_blks_hit
      \g |barcat -uHf+

Same thing in SQLite (requires the sqlite3 client):

    > .once |barcat -Hf+
    > SELECT name, sum(pgsize) FROM dbstat GROUP BY 1;

Earthquakes worldwide magnitude 1+ in the last 24 hours:

    curl https://earthquake.usgs.gov/earthquakes/feed/v1.0/summary/1.0_day.csv |
    column -ts, -n | barcat -f4 -u -l80%

External datasets, like movies per year:

    curl https://github.com/prust/wikipedia-movie-data/raw/master/movies.json -L |
    jq .[].year | uniq -c | barcat

Pokémon height comparison:

    curl https://github.com/Biuni/PokemonGO-Pokedex/raw/master/pokedex.json -L |
    jq -r '.pokemon[] | [.height,.num,.name] | join(" ")' | barcat

USD/EUR exchange rate from CSV provided by the ECB:

    curl https://sdw.ecb.europa.eu/export.do \
         -Gd 'node=SEARCHRESULTS&q=EXR.D.USD.EUR.SP00.A&exportType=csv' |
    barcat -f',\K' --value-length=7

Total population history in XML from the World Bank:

    curl http://api.worldbank.org/v2/country/1W/indicator/SP.POP.TOTL |
    xmlstarlet sel -t -m '*/*' -v wb:date -o ' ' -v wb:value -n |
    barcat -f1 -H --markers=+/1e9

Population and other information for all countries:

    curl http://download.geonames.org/export/dump/countryInfo.txt |
    grep -v '^#\s' | column -ts$'\t' -n |
    barcat -f+2 -e -u -l150 -s

And of course various Git statistics, such as commit count by year:

    git log --pretty=%ci | cut -b-4 | uniq -c | barcat

Or the top 3 most frequent authors with statistics over all:

    git shortlog -sn | barcat -L3 -s

Activity graph of the last days (substitute date C<-v-{}d> on BSD):

    ( git log --pretty=%ci --since=30day | cut -b-10
      seq 0 30 | xargs -i date +%F -d-{}day ) |
    sort | uniq -c | awk '$1--' | barcat --spark

Sparkline graphics of simple input given as inline parameters:

    barcat -_ 3 1 4 1 5 0 9 2 4

Misusing the spark functionality to draw a lolcat line:

    seq $(tput cols) | barcat --spark --indicator=- --palette=rainbow

=head1 AUTHOR

Mischa POSLAWSKY

=head1 LICENSE

GPL3+.