2017-03-28 13:22:32 +02:00
|
|
|
#!@PERL_PATH@
|
2010-12-28 19:57:23 +01:00
|
|
|
|
2017-03-28 13:22:32 +02:00
|
|
|
# Copyright (c) 2000, 2017, Oracle and/or its affiliates. All rights reserved.
|
2010-12-28 19:57:23 +01:00
|
|
|
#
|
|
|
|
# This program is free software; you can redistribute it and/or
|
|
|
|
# modify it under the terms of the GNU Library General Public
|
|
|
|
# License as published by the Free Software Foundation; version 2
|
|
|
|
# of the License.
|
|
|
|
#
|
|
|
|
# This program is distributed in the hope that it will be useful,
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
# Library General Public License for more details.
|
|
|
|
#
|
|
|
|
# You should have received a copy of the GNU Library General Public
|
|
|
|
# License along with this library; if not, write to the Free
|
2011-06-30 17:31:31 +02:00
|
|
|
# Software Foundation, Inc., 51 Franklin St, Fifth Floor, Boston,
|
2019-05-11 20:29:06 +02:00
|
|
|
# MA 02110-1335 USA
|
2010-12-28 19:57:23 +01:00
|
|
|
|
2000-11-21 17:28:46 +01:00
|
|
|
# mysqldumpslow - parse and summarize the MySQL slow query log
|
|
|
|
|
2001-03-08 20:49:15 +01:00
|
|
|
# Original version by Tim Bunce, sometime in 2000.
|
|
|
|
# Further changes by Tim Bunce, 8th March 2001.
|
2001-08-11 00:42:34 +02:00
|
|
|
# Handling of strings with \ and double '' by Monty 11 Aug 2001.
|
2001-03-08 20:49:15 +01:00
|
|
|
|
2000-11-21 17:28:46 +01:00
|
|
|
use strict;
|
|
|
|
use Getopt::Long;
|
|
|
|
|
2014-12-01 03:13:41 +01:00
|
|
|
# Sort keys understood by -s:
#   c = count, t = query time, l = lock time, r = rows sent,
#   e = rows examined, a = rows affected;
#   at, al, ar, ae and aa are the corresponding per-query averages.

# Defaults: sort by average query time, and match any host name when
# globbing for the *-slow.log file.
my %opt = (
    s => 'at',
    h => '*',
);

# Getopt::Long specifications for every supported command line option.
my @option_specs = (
    'v|verbose+',   # verbose
    'help+',        # write usage info
    'd|debug+',     # debug
    's=s',          # what to sort by (aa, ae, al, ar, at, a, c, e, l, r, t)
    'r!',           # reverse the sort order (largest last instead of first)
    't=i',          # just show the top n queries
    'a!',           # don't abstract all numbers to N and strings to 'S'
    'n=i',          # abstract numbers with at least n digits within names
    'g=s',          # grep: only consider stmts that include this string
    'h=s',          # hostname/basename of db server for *-slow.log filename (can be wildcard)
    'i=s',          # name of server instance (if using mysql.server startup script)
    'l!',           # don't subtract lock time from total time
);

# Parsed values land in %opt; an unparsable command line prints the usage
# text together with an error.
GetOptions(\%opt, @option_specs)
    or usage("bad option");

# --help prints the usage text and exits.
usage() if $opt{'help'};
|
2000-11-21 17:28:46 +01:00
|
|
|
|
2001-03-08 20:49:15 +01:00
|
|
|
# No log files were named on the command line: work out which file(s) to
# read from the output of my_print_defaults and store them in @ARGV.
unless (@ARGV) {
    my $defaults = `my_print_defaults --mysqld`;

    # Use the last --datadir=... entry found in the output.
    my $datadir = ($defaults =~ m/--datadir=(.*)/g)[-1];
    if (!$datadir or $opt{i}) {
        # determine the datadir from the instances section of /etc/my.cnf, if any
        my $instances = `my_print_defaults instances`;
        die "Can't determine datadir from 'my_print_defaults instances' output: $defaults"
            unless $instances;
        my @instances = ($instances =~ m/^--(\w+)-/mg);
        die "No -i 'instance_name' specified to select among known instances: @instances.\n"
            unless $opt{i};
        die "Instance '$opt{i}' is unknown (known instances: @instances)\n"
            unless grep { $_ eq $opt{i} } @instances;
        $datadir = ($instances =~ m/--$opt{i}-datadir=(.*)/g)[-1]
            or die "Can't determine --$opt{i}-datadir from 'my_print_defaults instances' output: $instances";
        warn "datadir=$datadir\n" if $opt{v};
    }

    # An explicitly configured slow log file takes precedence; both spellings
    # of the option are recognised.
    my $slowlog = ($defaults =~ m/--log[-_]slow[-_]queries=(.*)/g)[-1];
    if (!$slowlog)
    {
        $slowlog = ($defaults =~ m/--slow[-_]query[-_]log[-_]file=(.*)/g)[-1];
    }
    if ( $slowlog )
    {
        # A name that does not exist as given may be relative to the data
        # directory, so try it there before giving up.
        if (!-e $slowlog and $datadir and -e "$datadir/$slowlog") {
            $slowlog = "$datadir/$slowlog";
        }
        # Check the file itself: testing @ARGV after assigning a one-element
        # list to it could never fail.
        die "Can't find '$slowlog'\n" unless -e $slowlog;
        @ARGV = ($slowlog);
    }
    else
    {
        # Otherwise glob for <basename>-slow.log files in the data directory.
        if (!$opt{h})
        {
            $opt{h}= ($defaults =~ m/--log[-_]basename=(.*)/g)[-1];
        }
        @ARGV = <$datadir/$opt{h}-slow.log>;
        die "Can't find '$datadir/$opt{h}-slow.log'\n" unless @ARGV;
    }
}
|
2000-11-21 17:28:46 +01:00
|
|
|
|
2001-03-08 20:49:15 +01:00
|
|
|
warn "\nReading mysql slow query log from @ARGV\n";

my @pending;    # chunks split off a paragraph, still waiting to be processed
my %stmt;       # statement text (abstracted unless -a) => accumulated statistics
$/ = ";\n#"; # read entire statements using paragraph mode
while ( defined($_ = shift @pending) or defined($_ = <>) ) {
    warn "[[$_]]\n" if $opt{d}; # show raw paragraph being read

    # A server start banner inside the paragraph splits it into several
    # chunks; queue the non-empty ones and process them one at a time.
    my @chunks = split /^\/.*Version.*started with[\000-\377]*?Time.*Id.*Command.*Argument.*\n/m;
    if (@chunks > 1) {
        unshift @pending, map { length($_) ? $_ : () } @chunks;
        warn "<<".join(">>\n<<",@chunks).">>" if $opt{d};
        next;
    }

    # Strip the header lines, keeping the values they carry.  The leading
    # '#' is optional because the record separator consumes it.
    s/^#? Time: \d{6}\s+\d+:\d+:\d+.*\n//;
    my ($user,$host) = s/^#? User\@Host:\s+(\S+)\s+\@\s+(\S+).*\n// ? ($1,$2) : ('','');

    s/^# Thread_id: [0-9]+\s+Schema: .*\s+QC_hit:.*[^\n]+\n//;

    # Only read the capture variables when the substitution matched; after
    # a failed match they still hold values from an earlier pattern.
    my ($t, $l, $r, $e) =
        s/^# Query_time: ([0-9.]+)\s+Lock_time: ([0-9.]+)\s+Rows_sent: ([0-9.]+)\s+Rows_examined: ([0-9.]+).*\n//
            ? ($1, $2, $3, $4)
            : (0, 0, 0, 0);
    my ($affected) = s/^# Rows_affected: ([0-9.]+).*\n// ? ($1) : (0);

    $t -= $l unless $opt{l};

    # remove fluff that mysqld writes to log when it (re)starts:
    s!^/.*Version.*started with:.*\n!!mg;
    s!^Tcp port: \d+ Unix socket: \S+\n!!mg;
    s!^Time.*Id.*Command.*Argument.*\n!!mg;

    # Remove optimizer info
    s!^# QC_Hit: \S+\s+Full_scan: \S+\s+Full_join: \S+\s+Tmp_table: \S+\s+Tmp_table_on_disk: \S+[^\n]+\n!!mg;
    s!^# Filesort: \S+\s+Filesort_on_disk: \S+[^\n]+\n!!mg;
    s!^# Full_scan: \S+\s+Full_join: \S+[^\n]+\n!!mg;

    s/^use \w+;\n//; # not consistently added
    s/^SET timestamp=\d+;\n//;

    s/^[ ]*\n//mg; # delete blank lines
    s/^[ ]*/ /mg; # normalize leading whitespace
    s/\s*;\s*(#\s*)?$//; # remove trailing semicolon(+newline-hash)

    # -g: skip statements that do not match the given pattern
    next if $opt{g} and !m/$opt{g}/io;

    # Unless -a was given, replace literals so that statements differing
    # only in their constants are counted together.
    unless ($opt{a}) {
        s/\b\d+\b/N/g;
        s/\b0x[0-9A-Fa-f]+\b/N/g;
        s/''/'S'/g;
        s/""/"S"/g;
        s/(\\')//g;
        s/(\\")//g;
        s/'[^']+'/'S'/g;
        s/"[^"]+"/"S"/g;
        # -n=8: turn log_20001231 into log_NNNNNNNN
        s/([a-z_]+)(\d{$opt{n},})/$1.('N' x length($2))/ieg if $opt{n};
        # abbreviate massive "in (...)" statements and similar
        s!(([NS],){100,})!sprintf("$2,{repeated %d times}",length($1)/2)!eg;
    }

    # Accumulate totals per statement: c=count, t=time, l=lock time,
    # r=rows sent, e=rows examined, a=rows affected.
    my $s = $stmt{$_} ||= { users=>{}, hosts=>{} };
    $s->{c} += 1;
    $s->{t} += $t;
    $s->{l} += $l;
    $s->{r} += $r;
    $s->{e} += $e;
    $s->{a} += $affected;
    $s->{users}->{$user}++ if $user;
    $s->{hosts}->{$host}++ if $host;

    warn "{{$_}}\n\n" if $opt{d}; # show processed statement string
}
|
|
|
|
|
|
|
|
# Derive the per-occurrence averages (at, al, ar, ae, aa) from the totals
# collected for each statement.
for my $query (keys %stmt) {
    my $totals = $stmt{$query} || die;
    my $count  = $totals->{c};
    for my $key (qw(t l r e a)) {
        $totals->{"a$key"} = $totals->{$key} / $count;
    }
}
|
|
|
|
|
2001-03-08 20:49:15 +01:00
|
|
|
# Order the statements by the chosen key (-s), largest value first.
my @sorted = sort { $stmt{$b}->{$opt{s}} <=> $stmt{$a}->{$opt{s}} } keys %stmt;

# -t: keep only the top n statements.  The limit is clamped to the number
# of statements available; slicing past the end would pad the list with
# undef entries, which make the report loop die.
if ($opt{t}) {
    my $limit = $opt{t} < @sorted ? $opt{t} : scalar @sorted;
    @sorted = @sorted[0 .. $limit - 1];
}

# -r: largest last instead of first
@sorted = reverse @sorted if $opt{r};
|
2000-11-21 17:28:46 +01:00
|
|
|
|
|
|
|
# Print one summary entry per statement: the counters with their averages,
# who ran it, and the statement text itself.
foreach (@sorted) {
    my $v = $stmt{$_} || die;
    my ($c, $t, $at, $l, $al, $r, $ar, $e, $ae, $affected, $aa) = @{ $v }{qw(c t at l al r ar e ae a aa)};

    # Show the single user/host, or a count of them if there are several.
    my @users = keys %{$v->{users}};
    my $user = (@users==1) ? $users[0] : sprintf "%dusers",scalar @users;
    my @hosts = keys %{$v->{hosts}};
    my $host = (@hosts==1) ? $hosts[0] : sprintf "%dhosts",scalar @hosts;

    # User and host are passed as arguments instead of being interpolated
    # into the format, so a '%' in either is printed literally.
    printf "Count: %d Time=%.2fs (%ds) Lock=%.2fs (%ds) Rows_sent=%.1f (%d), Rows_examined=%.1f (%d), Rows_affected=%.1f (%d), %s\@%s\n%s\n\n",
        $c, $at,$t, $al,$l, $ar,$r, $ae, $e, $aa, $affected, $user, $host, $_;
}
|
2005-03-09 15:00:40 +01:00
|
|
|
|
|
|
|
# Print the usage text and exit.
#
# With an error message argument, the message and the usage text go to
# STDERR and the exit status is 1; without one, the usage text goes to
# STDOUT and the exit status is 0.
sub usage {
    my $str= shift;
    my $text= <<HERE;
Usage: mysqldumpslow [ OPTS... ] [ LOGS... ]

Parse and summarize the MySQL slow query log. Options are

--verbose verbose
--debug debug
--help write this text to standard output

-v verbose
-d debug
-s ORDER what to sort by (aa, ae, al, ar, at, a, c, e, l, r, t), 'at' is default
aa: average rows affected
ae: average rows examined
al: average lock time
ar: average rows sent
at: average query time
a: rows affected
c: count
e: rows examined
l: lock time
r: rows sent
t: query time
-r reverse the sort order (largest last instead of first)
-t NUM just show the top n queries
-a don't abstract all numbers to N and strings to 'S'
-n NUM abstract numbers with at least n digits within names
-g PATTERN grep: only consider stmts that include this string
-h HOSTNAME hostname of db server for *-slow.log filename (can be wildcard),
default is '*', i.e. match all
-i NAME name of server instance (if using mysql.server startup script)
-l don't subtract lock time from total time

HERE
    if ($str) {
        print STDERR "ERROR: $str\n\n";
        print STDERR $text;
        exit 1;
    } else {
        print $text;
        exit 0;
    }
}
|