test-select
上传用户:romrleung
上传日期:2022-05-23
资源大小:18897k
文件大小:14k
- #!/usr/bin/perl
- # Copyright (C) 2000 MySQL AB & MySQL Finland AB & TCX DataKonsult AB
- #
- # This library is free software; you can redistribute it and/or
- # modify it under the terms of the GNU Library General Public
- # License as published by the Free Software Foundation; either
- # version 2 of the License, or (at your option) any later version.
- #
- # This library is distributed in the hope that it will be useful,
- # but WITHOUT ANY WARRANTY; without even the implied warranty of
- # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- # Library General Public License for more details.
- #
- # You should have received a copy of the GNU Library General Public
- # License along with this library; if not, write to the Free
- # Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
- # MA 02111-1307, USA
- #
- # Test of selecting on keys that consist of many parts
- #
- ##################### Standard benchmark inits ##############################
- use Cwd;
- use DBI;
- use Getopt::Long;
- use Benchmark;
- $opt_loop_count=10000;
- $opt_medium_loop_count=1000;
- $opt_small_loop_count=10;
- $opt_regions=6;
- $opt_groups=100;
- $pwd = cwd(); $pwd = "." if ($pwd eq '');
- require "$pwd/bench-init.pl" || die "Can't read Configuration file: $!n";
- $columns=min($limits->{'max_columns'},500,($limits->{'query_size'}-50)/24,
- $limits->{'max_conditions'}/2-3);
- if ($opt_small_test)
- {
- $opt_loop_count/=10;
- $opt_medium_loop_count/=10;
- $opt_small_loop_count/=10;
- $opt_groups/=10;
- }
- print "Testing the speed of selecting on keys that consist of many partsn";
- print "The test-table has $opt_loop_count rows and the test is done with $columns ranges.nn";
- ####
- #### Connect and start timeing
- ####
- $dbh = $server->connect();
- $start_time=new Benchmark;
- ####
- #### Create needed tables
- ####
- goto select_test if ($opt_skip_create);
- print "Creating tablen";
- $dbh->do("drop table bench1" . $server->{'drop_attr'});
- do_many($dbh,$server->create("bench1",
- ["region char(1) NOT NULL",
- "idn integer(6) NOT NULL",
- "rev_idn integer(6) NOT NULL",
- "grp integer(6) NOT NULL"],
- ["primary key (region,idn)",
- "unique (region,rev_idn)",
- "unique (region,grp,idn)"]));
- if ($opt_lock_tables)
- {
- do_query($dbh,"LOCK TABLES bench1 WRITE");
- }
- if ($opt_fast && defined($server->{vacuum}))
- {
- $server->vacuum(1,$dbh);
- }
- ####
- #### Insert $opt_loop_count records with
- #### region: "A" -> "E"
- #### idn: 0 -> count
- #### rev_idn: count -> 0,
- #### grp: distributed values 0 - > count/100
- ####
- print "Inserting $opt_loop_count rowsn";
- $loop_time=new Benchmark;
- if ($opt_fast && $server->{transactions})
- {
- $dbh->{AutoCommit} = 0;
- }
- $query="insert into bench1 values (";
- $half_done=$opt_loop_count/2;
- for ($id=0,$rev_id=$opt_loop_count-1 ; $id < $opt_loop_count ; $id++,$rev_id--)
- {
- $grp=$id*3 % $opt_groups;
- $region=chr(65+$id%$opt_regions);
- do_query($dbh,"$query'$region',$id,$rev_id,$grp)");
- if ($id == $half_done)
- { # Test with different insert
- $query="insert into bench1 (region,idn,rev_idn,grp) values (";
- }
- }
- if ($opt_fast && $server->{transactions})
- {
- $dbh->commit;
- $dbh->{AutoCommit} = 1;
- }
- $end_time=new Benchmark;
- print "Time to insert ($opt_loop_count): " .
- timestr(timediff($end_time, $loop_time),"all") . "nn";
- if ($opt_lock_tables)
- {
- do_query($dbh,"UNLOCK TABLES");
- }
- if ($opt_fast && defined($server->{vacuum}))
- {
- $server->vacuum(0,$dbh,"bench1");
- }
- if ($opt_lock_tables)
- {
- do_query($dbh,"LOCK TABLES bench1 WRITE");
- }
- ####
- #### Do some selects on the table
- ####
- select_test:
- if ($limits->{'group_functions'})
- {
- my ($tmp); $tmp=1000;
- print "Test if the database has a query cachen";
- # First ensure that the table is read into memory
- fetch_all_rows($dbh,"select sum(idn+$tmp),sum(rev_idn-$tmp) from bench1");
- $loop_time=new Benchmark;
- for ($tests=0 ; $tests < $opt_loop_count ; $tests++)
- {
- fetch_all_rows($dbh,"select sum(idn+100),sum(rev_idn-100) from bench1");
- }
- $end_time=new Benchmark;
- print "Time for select_cache ($opt_loop_count): " .
- timestr(timediff($end_time, $loop_time),"all") . "nn";
- # If the database has a query cache, the following loop should be much
- # slower than the previous loop
- $loop_time=new Benchmark;
- for ($tests=0 ; $tests < $opt_loop_count ; $tests++)
- {
- fetch_all_rows($dbh,"select sum(idn+$tests),sum(rev_idn-$tests) from bench1");
- }
- $end_time=new Benchmark;
- print "Time for select_cache2 ($opt_loop_count): " .
- timestr(timediff($end_time, $loop_time),"all") . "nn";
- }
- print "Testing big selects on the tablen";
- $loop_time=new Benchmark;
- $rows=0;
- for ($i=0 ; $i < $opt_small_loop_count ; $i++)
- {
- $grp=$i*11 % $opt_groups;
- $region=chr(65+$i%($opt_regions+1)); # One larger to test misses
- $rows+=fetch_all_rows($dbh,"select idn from bench1 where region='$region'");
- $rows+=fetch_all_rows($dbh,"select idn from bench1 where region='$region' and idn=$i");
- $rows+=fetch_all_rows($dbh,"select idn from bench1 where region='$region' and rev_idn=$i");
- $rows+=fetch_all_rows($dbh,"select idn from bench1 where region='$region' and grp=$grp");
- $rows+=fetch_all_rows($dbh,"select idn from bench1 where region>='B' and region<='C' and grp=$grp");
- $rows+=fetch_all_rows($dbh,"select idn from bench1 where region>='B' and region<='E' and grp=$grp");
- $rows+=fetch_all_rows($dbh,"select idn from bench1 where grp=$grp"); # This is hard
- }
- $count=$opt_small_loop_count*7;
- $end_time=new Benchmark;
- print "Time for select_big ($count:$rows): " .
- timestr(timediff($end_time, $loop_time),"all") . "n";
- # Test select with many OR's
- $loop_time=new Benchmark;
- $tmpvar=0;
- $count=0;
- $estimated=0;
- $max_and_conditions=$limits->{'max_conditions'}/2;
- $rows=0;
- for ($i=0 ; $i < $opt_small_loop_count ; $i++)
- {
- $region=chr(65+$i%($opt_regions+1)); # One larger to test out-of-regions
- $query="select * from bench1 where ";
- $or_part="grp = 1";
- $or_part2="region='A' and grp=1";
- for ($j=1 ; $j < $columns; $j++)
- {
- $tmpvar^= ((($tmpvar + 63) + $j)*3 % 100000);
- $tmp=$tmpvar % $opt_groups;
- $tmp_region=chr(65+$tmpvar%$opt_regions);
- $or_part.=" or grp=$tmp";
- if ($j < $max_and_conditions)
- {
- $or_part2.=" or region='$tmp_region' and grp=$tmp";
- }
- }
- $or_part="region='$region' and ($or_part)";
- # Same query, but use 'func_extra_in_num' instead.
- if ($limits->{'func_extra_in_num'})
- {
- $in_part=$or_part;
- $in_part=~ s/ = / IN (/;
- $in_part=~ s/ or grp=/,/g;
- $in_part.= ")";
- defined($found=fetch_all_rows($dbh,$query . $in_part)) || die $DBI::errstr;
- $rows+=$found;
- $count++;
- }
- for ($j=0; $j < 10 ; $j++)
- {
- $rows+=fetch_all_rows($dbh,$query . $or_part);
- $rows+=fetch_all_rows($dbh,$query . $or_part2);
- # Do it a little harder by setting a extra range
- $rows+=fetch_all_rows($dbh,"$query ($or_part) and idn < 50");
- $rows+=fetch_all_rows($dbh,"$query (($or_part) or (region='A' and grp < 10)) and region <='B'")
- }
- $count+=$j*4;
- $end_time=new Benchmark;
- last if ($estimated=predict_query_time($loop_time,$end_time,$count,$i+1,
- $opt_small_loop_count));
- }
- print_time($estimated);
- print " for select_range ($count:$rows): " .
- timestr(timediff($end_time, $loop_time),"all") . "n";
- #
- # Testing MIN() and MAX() on keys
- #
- if ($limits->{'group_functions'} && $limits->{'order_by_unused'})
- {
- $loop_time=new Benchmark;
- $count=0;
- $estimated=0;
- for ($tests=0 ; $tests < $opt_loop_count ; $tests++)
- {
- $count+=7;
- $grp=$tests*3 % $opt_groups;
- $region=chr(65+$tests % $opt_regions);
- if ($limits->{'group_func_sql_min_str'})
- {
- fetch_all_rows($dbh,"select min(region) from bench1");
- fetch_all_rows($dbh,"select max(region) from bench1");
- fetch_all_rows($dbh,"select min(region),max(region) from bench1");
- }
- fetch_all_rows($dbh,"select min(rev_idn) from bench1 where region='$region'");
- fetch_all_rows($dbh,"select max(grp) from bench1 where region='$region'");
- fetch_all_rows($dbh,"select max(idn) from bench1 where region='$region' and grp=$grp");
- if ($limits->{'group_func_sql_min_str'})
- {
- fetch_all_rows($dbh,"select max(region) from bench1 where region<'$region'");
- }
- $end_time=new Benchmark;
- last if ($estimated=predict_query_time($loop_time,$end_time,$count,
- $tests+1, $opt_loop_count));
- }
- print_time($estimated);
- print " for min_max_on_key ($count): " .
- timestr(timediff($end_time, $loop_time),"all") . "n";
- $loop_time=new Benchmark;
- $count=0;
- $estimated=0;
- for ($tests=0 ; $tests < $opt_loop_count ; $tests++)
- {
- $count+=5;
- $grp=$tests*3 % $opt_groups;
- $region=chr(65+$tests % $opt_regions);
- fetch_all_rows($dbh,"select count(*) from bench1 where region='$region'");
- fetch_all_rows($dbh,"select count(*) from bench1 where region='$region' and grp=$grp");
- fetch_all_rows($dbh,"select count(*) from bench1 where region>'$region'");
- fetch_all_rows($dbh,"select count(*) from bench1 where region<='$region'");
- fetch_all_rows($dbh,"select count(*) from bench1 where region='$region' and grp>$grp");
- $end_time=new Benchmark;
- last if ($estimated=predict_query_time($loop_time,$end_time,$count,
- $tests+1, $opt_loop_count));
- }
- print_time($estimated);
- print " for count_on_key ($count): " .
- timestr(timediff($end_time, $loop_time),"all") . "nn";
-
- }
- if ($limits->{'group_functions'})
- {
- $loop_time=new Benchmark;
- $rows=0;
- for ($i=0 ; $i < $opt_medium_loop_count ; $i++)
- {
- $rows+=fetch_all_rows($dbh,"select grp,count(*) from bench1 group by grp");
- }
- $end_time=new Benchmark;
- print "Time for count_group_on_key_parts ($i:$rows): " .
- timestr(timediff($end_time, $loop_time),"all") . "n";
- }
- if ($limits->{'group_distinct_functions'})
- {
- print "Testing count(distinct) on the tablen";
- $loop_time=new Benchmark;
- $rows=$estimated=$count=0;
- for ($i=0 ; $i < $opt_medium_loop_count ; $i++)
- {
- $count++;
- $rows+=fetch_all_rows($dbh,"select count(distinct region) from bench1");
- $end_time=new Benchmark;
- last if ($estimated=predict_query_time($loop_time,$end_time,$count,$i+1,
- $opt_medium_loop_count));
- }
- print_time($estimated);
- print " for count_distinct_key_prefix ($count:$rows): " .
- timestr(timediff($end_time, $loop_time),"all") . "n";
- $loop_time=new Benchmark;
- $rows=$estimated=$count=0;
- for ($i=0 ; $i < $opt_medium_loop_count ; $i++)
- {
- $count++;
- $rows+=fetch_all_rows($dbh,"select count(distinct grp) from bench1");
- $end_time=new Benchmark;
- last if ($estimated=predict_query_time($loop_time,$end_time,$count,$i+1,
- $opt_medium_loop_count));
- }
- print_time($estimated);
- print " for count_distinct ($count:$rows): " .
- timestr(timediff($end_time, $loop_time),"all") . "n";
- # Workaround mimer's behavior
- if ($limits->{'multi_distinct'})
- {
- $loop_time=new Benchmark;
- $rows=$estimated=$count=0;
- for ($i=0 ; $i < $opt_medium_loop_count ; $i++)
- {
- $count++;
- $rows+=fetch_all_rows($dbh,"select count(distinct grp),count(distinct rev_idn) from bench1");
- $end_time=new Benchmark;
- last if ($estimated=predict_query_time($loop_time,$end_time,$count,$i+1,
- $opt_medium_loop_count));
- }
- print_time($estimated);
- print " for count_distinct_2 ($count:$rows): " .
- timestr(timediff($end_time, $loop_time),"all") . "n";
- }
- $loop_time=new Benchmark;
- $rows=$estimated=$count=0;
- for ($i=0 ; $i < $opt_medium_loop_count ; $i++)
- {
- $count++;
- $rows+=fetch_all_rows($dbh,"select region,count(distinct idn) from bench1 group by region");
- $end_time=new Benchmark;
- last if ($estimated=predict_query_time($loop_time,$end_time,$count,$i+1,
- $opt_medium_loop_count));
- }
- print_time($estimated);
- print " for count_distinct_group_on_key ($count:$rows): " .
- timestr(timediff($end_time, $loop_time),"all") . "n";
- $loop_time=new Benchmark;
- $rows=$estimated=$count=0;
- for ($i=0 ; $i < $opt_medium_loop_count ; $i++)
- {
- $count++;
- $rows+=fetch_all_rows($dbh,"select grp,count(distinct idn) from bench1 group by grp");
- $end_time=new Benchmark;
- last if ($estimated=predict_query_time($loop_time,$end_time,$count,$i+1,
- $opt_medium_loop_count));
- }
- print_time($estimated);
- print " for count_distinct_group_on_key_parts ($count:$rows): " .
- timestr(timediff($end_time, $loop_time),"all") . "n";
- $loop_time=new Benchmark;
- $rows=$estimated=$count=0;
- for ($i=0 ; $i < $opt_medium_loop_count ; $i++)
- {
- $count++;
- $rows+=fetch_all_rows($dbh,"select grp,count(distinct rev_idn) from bench1 group by grp");
- $end_time=new Benchmark;
- last if ($estimated=predict_query_time($loop_time,$end_time,$count,$i+1,
- $opt_medium_loop_count));
- }
- print_time($estimated);
- print " for count_distinct_group ($count:$rows): " .
- timestr(timediff($end_time, $loop_time),"all") . "n";
- $loop_time=new Benchmark;
- $rows=$estimated=$count=0;
- $test_count=$opt_medium_loop_count/10;
- for ($i=0 ; $i < $test_count ; $i++)
- {
- $count++;
- $rows+=fetch_all_rows($dbh,"select idn,count(distinct region) from bench1 group by idn");
- $end_time=new Benchmark;
- last if ($estimated=predict_query_time($loop_time,$end_time,$count,$i+1,
- $test_count));
- }
- print_time($estimated);
- print " for count_distinct_big ($count:$rows): " .
- timestr(timediff($end_time, $loop_time),"all") . "n";
- }
- ####
- #### End of benchmark
- ####
- if ($opt_lock_tables)
- {
- do_query($dbh,"UNLOCK TABLES");
- }
- if (!$opt_skip_delete)
- {
- do_query($dbh,"drop table bench1" . $server->{'drop_attr'});
- }
- if ($opt_fast && defined($server->{vacuum}))
- {
- $server->vacuum(0,$dbh);
- }
- $dbh->disconnect; # close connection
- end_benchmark($start_time);