home *** CD-ROM | disk | FTP | other *** search
#!/usr/bin/perl
# mysqldumpslow - parse and summarize the MySQL slow query log
#
# Reads one or more slow query logs (named on the command line, or located
# via `my_print_defaults` when none are given), groups statements that are
# identical after numbers and strings have been abstracted away, and prints
# one summary entry per distinct statement to STDOUT.  Diagnostics go to
# STDERR.

# Original version by Tim Bunce, sometime in 2000.
# Further changes by Tim Bunce, 8th March 2001.
# Handling of strings with \ and double '' by Monty 11 Aug 2001.

use strict;
use Getopt::Long;

# Sort keys understood by -s:
#   t=time, l=lock time, r=rows
#   at, al, and ar are the corresponding averages
# (the per-statement count is kept under the key 'c' in the same hash)

my %opt = (
    s => 'at',
    h => '*',
);

GetOptions(\%opt,
    'v+',   # verbose
    'd+',   # debug
    's=s',  # what to sort by (t, at, l, al, r, ar etc)
    'r!',   # reverse the sort order (largest last instead of first)
    't=i',  # just show the top n queries
    'a!',   # don't abstract all numbers to N and strings to 'S'
    'n=i',  # abstract numbers with at least n digits within names
    'g=s',  # grep: only consider stmts that include this string
    'h=s',  # hostname of db server for *-slow.log filename (can be wildcard)
    'i=s',  # name of server instance (if using mysql.server startup script)
    'l!',   # don't subtract lock time from total time
) or die "Bad option";


# No log files named on the command line: work out where the server keeps
# its slow log by asking my_print_defaults.
unless (@ARGV) {
    my $defaults = `my_print_defaults mysqld`;
    my $basedir  = ($defaults =~ m/--basedir=(.*)/)[0]
        or die "Can't determine basedir from 'my_print_defaults mysqld' output: $defaults";
    warn "basedir=$basedir\n" if $opt{v};

    my $datadir = ($defaults =~ m/--datadir=(.*)/)[0];
    if (!$datadir or $opt{i}) {
        # determine the datadir from the instances section of /etc/my.cnf, if any
        my $instances = `my_print_defaults instances`;
        die "Can't determine datadir from 'my_print_defaults mysqld' output: $defaults"
            unless $instances;
        my @instances = ($instances =~ m/^--(\w+)-/mg);
        die "No -i 'instance_name' specified to select among known instances: @instances.\n"
            unless $opt{i};
        die "Instance '$opt{i}' is unknown (known instances: @instances)\n"
            unless grep { $_ eq $opt{i} } @instances;
        $datadir = ($instances =~ m/--$opt{i}-datadir=(.*)/)[0]
            or die "Can't determine --$opt{i}-datadir from 'my_print_defaults instances' output: $instances";
        warn "datadir=$datadir\n" if $opt{v};
    }

    @ARGV = <$datadir/$opt{h}-slow.log>;
    die "Can't find '$datadir/$opt{h}-slow.log'\n" unless @ARGV;
}

warn "\nReading mysql slow query log from @ARGV\n";

my @pending;    # chunks split off a record that still have to be processed
my %stmt;       # abstracted statement text => accumulated statistics

# Custom record separator: each read returns one log entry, ending at the
# ";\n#" that closes a statement and opens the next entry's "# ..." header.
# The leading '#' of the following header is therefore consumed, which is
# why the header patterns below use '#?'.
$/ = ";\n#";
while ( defined($_ = shift @pending) or defined($_ = <>) ) {
    warn "[[$_]]\n" if $opt{d};    # show raw paragraph being read

    # A server (re)start banner in the middle of a record glues unrelated
    # pieces together; split there and queue the pieces for separate passes.
    my @chunks = split /^\/.*Version.*started with[\000-\377]*?Time.*Id.*Command.*Argument.*\n/m;
    if (@chunks > 1) {
        unshift @pending, grep { length($_) } @chunks;
        warn "<<".join(">>\n<<",@chunks).">>" if $opt{d};
        next;
    }

    s/^#? Time: \d{6}\s+\d+:\d+:\d+.*\n//;
    my ($user,$host) = s/^#? User\@Host:\s+(\S+)\s+\@\s+(\S+).*\n// ? ($1,$2) : ('','');

    # Only trust the capture variables when this substitution itself
    # succeeded; after a failed match they still hold the user/host captured
    # above.  Fractional values and variable spacing are accepted so that
    # newer log formats parse as well.
    my ($t, $l, $r) = (0, 0, 0);
    if (s/^# Query_time: ([0-9.]+)\s+Lock_time: ([0-9.]+)\s+Rows_sent: ([0-9.]+).*\n//) {
        ($t, $l, $r) = ($1, $2, $3);
    }
    $t -= $l unless $opt{l};

    # remove fluff that mysqld writes to log when it (re)starts:
    s!^/.*Version.*started with:.*\n!!mg;
    s!^Tcp port: \d+\s+Unix socket: \S+\n!!mg;
    s!^Time.*Id.*Command.*Argument.*\n!!mg;

    s/^use \w+;\n//;              # not consistently added
    s/^SET timestamp=\d+;\n//;

    s/^[ \t]*\n//mg;              # delete blank lines (spaces and/or tabs only)
    s/^[ \t]*/ /mg;               # normalize leading whitespace
    s/\s*;\s*(#\s*)?$//;          # remove trailing semicolon(+newline-hash)

    next if $opt{g} and !m/$opt{g}/io;

    unless ($opt{a}) {
        # The order of these substitutions matters: empty and escaped quotes
        # are dealt with before the generic quoted-string patterns run.
        s/\b\d+\b/N/g;
        s/\b0x[0-9A-Fa-f]+\b/N/g;
        s/''/'S'/g;
        s/""/"S"/g;
        s/(\\')//g;
        s/(\\")//g;
        s/'[^']+'/'S'/g;
        s/"[^"]+"/"S"/g;
        # -n=8: turn log_20001231 into log_NNNNNNNN
        s/([a-z_]+)(\d{$opt{n},})/$1.('N' x length($2))/ieg if $opt{n};
        # abbreviate massive "in (...)" statements and similar
        s!(([NS],){100,})!sprintf("$2,{repeated %d times}",length($1)/2)!eg;
    }

    # Accumulate totals under the (possibly abstracted) statement text.
    my $s = $stmt{$_} ||= { users=>{}, hosts=>{} };
    $s->{c} += 1;
    $s->{t} += $t;
    $s->{l} += $l;
    $s->{r} += $r;
    $s->{users}->{$user}++ if $user;
    $s->{hosts}->{$host}++ if $host;

    warn "{{$_}}\n\n" if $opt{d};  # show processed statement string
}

# Derive the per-statement averages; c is at least 1 for every entry.
foreach my $v (values %stmt) {
    my ($c, $t, $l, $r) = @{ $v }{qw(c t l r)};
    $v->{at} = $t / $c;
    $v->{al} = $l / $c;
    $v->{ar} = $r / $c;
}

my @sorted = sort { $stmt{$b}->{$opt{s}} <=> $stmt{$a}->{$opt{s}} } keys %stmt;
if ($opt{t}) {
    # Clamp the slice to the statements that actually exist; slicing past the
    # end would yield undef entries that abort the report loop below.
    my $last = $opt{t} - 1;
    $last = $#sorted if $last > $#sorted;
    @sorted = @sorted[0 .. $last];
}
@sorted = reverse @sorted if $opt{r};

foreach (@sorted) {
    my $v = $stmt{$_} || die;
    my ($c, $t,$at, $l,$al, $r,$ar) = @{ $v }{qw(c t at l al r ar)};
    my @users = keys %{$v->{users}};
    my $user  = (@users==1) ? $users[0] : sprintf "%dusers",scalar @users;
    my @hosts = keys %{$v->{hosts}};
    my $host  = (@hosts==1) ? $hosts[0] : sprintf "%dhosts",scalar @hosts;
    # user/host are passed as arguments, not interpolated into the format,
    # so a '%' in either cannot be misread as a conversion.
    printf "Count: %d Time=%.2fs (%ds) Lock=%.2fs (%ds) Rows=%.1f (%d), %s\@%s\n%s\n\n",
        $c, $at,$t, $al,$l, $ar,$r, $user, $host, $_;
}