Home | History | Annotate | Download | only in test
      1 # 2011 January 19
      2 #
      3 # The author disclaims copyright to this source code.  In place of
      4 # a legal notice, here is a blessing:
      5 #
      6 #    May you do good and not evil.
      7 #    May you find forgiveness for yourself and forgive others.
      8 #    May you share freely, never taking more than you give.
      9 #
     10 #***********************************************************************
     11 #
     12 # This file implements tests for SQLite library.  The focus of the tests
     13 # in this file is the use of the sqlite_stat2 histogram data on tables
     14 # with many repeated values and only a few distinct values.
     15 #
     16 
     17 set testdir [file dirname $argv0]
     18 source $testdir/tester.tcl
     19 
     20 ifcapable !stat2 {
     21   finish_test
     22   return
     23 }
     24 
     25 set testprefix analyze5
     26 
     27 proc eqp {sql {db db}} {
     28   uplevel execsql [list "EXPLAIN QUERY PLAN $sql"] $db
     29 }
     30 
     31 unset -nocomplain i t u v w x y z
     32 do_test analyze5-1.0 {
     33   db eval {CREATE TABLE t1(t,u,v TEXT COLLATE nocase,w,x,y,z)}
     34   for {set i 0} {$i < 1000} {incr i} {
     35     set y [expr {$i>=25 && $i<=50}]
     36     set z [expr {($i>=400) + ($i>=700) + ($i>=875)}]
     37     set x $z
     38     set w $z
     39     set t [expr {$z+0.5}]
     40     switch $z {
     41       0 {set u "alpha"; unset x}
     42       1 {set u "bravo"}
     43       2 {set u "charlie"}
     44       3 {set u "delta"; unset w}
     45     }
     46     if {$i%2} {set v $u} {set v [string toupper $u]}
     47     db eval {INSERT INTO t1 VALUES($t,$u,$v,$w,$x,$y,$z)}
     48   }
     49   db eval { 
     50     CREATE INDEX t1t ON t1(t);  -- 0.5, 1.5, 2.5, and 3.5
     51     CREATE INDEX t1u ON t1(u);  -- text
     52     CREATE INDEX t1v ON t1(v);  -- mixed case text
     53     CREATE INDEX t1w ON t1(w);  -- integers 0, 1, 2 and a few NULLs
     54     CREATE INDEX t1x ON t1(x);  -- integers 1, 2, 3 and many NULLs
     55     CREATE INDEX t1y ON t1(y);  -- integers 0 and very few 1s
     56     CREATE INDEX t1z ON t1(z);  -- integers 0, 1, 2, and 3
     57     ANALYZE;
     58     SELECT sample FROM sqlite_stat2 WHERE idx='t1u' ORDER BY sampleno;
     59   }
     60 } {alpha alpha alpha alpha bravo bravo bravo charlie charlie delta}
     61 do_test analyze5-1.1 {
     62   string tolower \
     63    [db eval {SELECT sample from sqlite_stat2 WHERE idx='t1v' ORDER BY sampleno}]
     64 } {alpha alpha alpha alpha bravo bravo bravo charlie charlie delta}
     65 do_test analyze5-1.2 {
     66   db eval {SELECT sample from sqlite_stat2 WHERE idx='t1w' ORDER BY sampleno}
     67 } {{} 0 0 0 0 1 1 1 2 2}
     68 do_test analyze5-1.3 {
     69   db eval {SELECT sample from sqlite_stat2 WHERE idx='t1x' ORDER BY sampleno}
     70 } {{} {} {} {} 1 1 1 2 2 3}
     71 do_test analyze5-1.4 {
     72   db eval {SELECT sample from sqlite_stat2 WHERE idx='t1y' ORDER BY sampleno}
     73 } {0 0 0 0 0 0 0 0 0 0}
     74 do_test analyze5-1.5 {
     75   db eval {SELECT sample from sqlite_stat2 WHERE idx='t1z' ORDER BY sampleno}
     76 } {0 0 0 0 1 1 1 2 2 3}
     77 do_test analyze5-1.6 {
     78   db eval {SELECT sample from sqlite_stat2 WHERE idx='t1t' ORDER BY sampleno}
     79 } {0.5 0.5 0.5 0.5 1.5 1.5 1.5 2.5 2.5 3.5}
     80 
     81 
     82 # Verify that range queries generate the correct row count estimates
     83 #
     84 foreach {testid where index rows} {
     85     1  {z>=0 AND z<=0}       t1z  400
     86     2  {z>=1 AND z<=1}       t1z  300
     87     3  {z>=2 AND z<=2}       t1z  200
     88     4  {z>=3 AND z<=3}       t1z  100
     89     5  {z>=4 AND z<=4}       t1z   50
     90     6  {z>=-1 AND z<=-1}     t1z   50
     91     7  {z>1 AND z<3}         t1z  200
     92     8  {z>0 AND z<100}       t1z  600
     93     9  {z>=1 AND z<100}      t1z  600
     94    10  {z>1 AND z<100}       t1z  300
     95    11  {z>=2 AND z<100}      t1z  300
     96    12  {z>2 AND z<100}       t1z  100
     97    13  {z>=3 AND z<100}      t1z  100
     98    14  {z>3 AND z<100}       t1z   50
     99    15  {z>=4 AND z<100}      t1z   50
    100    16  {z>=-100 AND z<=-1}   t1z   50
    101    17  {z>=-100 AND z<=0}    t1z  400
    102    18  {z>=-100 AND z<0}     t1z   50
    103    19  {z>=-100 AND z<=1}    t1z  700
    104    20  {z>=-100 AND z<2}     t1z  700
    105    21  {z>=-100 AND z<=2}    t1z  900
    106    22  {z>=-100 AND z<3}     t1z  900
    107   
    108    31  {z>=0.0 AND z<=0.0}   t1z  400
    109    32  {z>=1.0 AND z<=1.0}   t1z  300
    110    33  {z>=2.0 AND z<=2.0}   t1z  200
    111    34  {z>=3.0 AND z<=3.0}   t1z  100
    112    35  {z>=4.0 AND z<=4.0}   t1z   50
    113    36  {z>=-1.0 AND z<=-1.0} t1z   50
    114    37  {z>1.5 AND z<3.0}     t1z  200
    115    38  {z>0.5 AND z<100}     t1z  600
    116    39  {z>=1.0 AND z<100}    t1z  600
    117    40  {z>1.5 AND z<100}     t1z  300
    118    41  {z>=2.0 AND z<100}    t1z  300
    119    42  {z>2.1 AND z<100}     t1z  100
    120    43  {z>=3.0 AND z<100}    t1z  100
    121    44  {z>3.2 AND z<100}     t1z   50
    122    45  {z>=4.0 AND z<100}    t1z   50
    123    46  {z>=-100 AND z<=-1.0} t1z   50
    124    47  {z>=-100 AND z<=0.0}  t1z  400
    125    48  {z>=-100 AND z<0.0}   t1z   50
    126    49  {z>=-100 AND z<=1.0}  t1z  700
    127    50  {z>=-100 AND z<2.0}   t1z  700
    128    51  {z>=-100 AND z<=2.0}  t1z  900
    129    52  {z>=-100 AND z<3.0}   t1z  900
    130   
    131   101  {z=-1}                t1z   50
    132   102  {z=0}                 t1z  400
    133   103  {z=1}                 t1z  300
    134   104  {z=2}                 t1z  200
    135   105  {z=3}                 t1z  100
    136   106  {z=4}                 t1z   50
    137   107  {z=-10.0}             t1z   50
    138   108  {z=0.0}               t1z  400
    139   109  {z=1.0}               t1z  300
    140   110  {z=2.0}               t1z  200
    141   111  {z=3.0}               t1z  100
    142   112  {z=4.0}               t1z   50
    143   113  {z=1.5}               t1z   50
    144   114  {z=2.5}               t1z   50
    145   
    146   201  {z IN (-1)}           t1z   50
    147   202  {z IN (0)}            t1z  400
    148   203  {z IN (1)}            t1z  300
    149   204  {z IN (2)}            t1z  200
    150   205  {z IN (3)}            t1z  100
    151   206  {z IN (4)}            t1z   50
    152   207  {z IN (0.5)}          t1z   50
    153   208  {z IN (0,1)}          t1z  700
    154   209  {z IN (0,1,2)}        t1z  900
    155   210  {z IN (0,1,2,3)}      {}   100
    156   211  {z IN (0,1,2,3,4,5)}  {}   100
    157   212  {z IN (1,2)}          t1z  500
    158   213  {z IN (2,3)}          t1z  300
    159   214  {z=3 OR z=2}          t1z  300
    160   215  {z IN (-1,3)}         t1z  150
    161   216  {z=-1 OR z=3}         t1z  150
    162 
    163   300  {y=0}                 {}   100
    164   301  {y=1}                 t1y   50
    165   302  {y=0.1}               t1y   50
    166 
    167   400  {x IS NULL}           t1x  400
    168 
    169 } {
    170   # Verify that the expected index is used with the expected row count
    171   do_test analyze5-1.${testid}a {
    172     set x [lindex [eqp "SELECT * FROM t1 WHERE $where"] 3]
    173     set idx {}
    174     regexp {INDEX (t1.) } $x all idx
    175     regexp {~([0-9]+) rows} $x all nrow
    176     list $idx $nrow
    177   } [list $index $rows]
    178 
    179   # Verify that the same result is achieved regardless of whether or not
    180   # the index is used
    181   do_test analyze5-1.${testid}b {
    182     set w2 [string map {y +y z +z} $where]
    183     set a1 [db eval "SELECT rowid FROM t1 NOT INDEXED WHERE $w2\
    184                      ORDER BY +rowid"]
    185     set a2 [db eval "SELECT rowid FROM t1 WHERE $where ORDER BY +rowid"]
    186     if {$a1==$a2} {
    187       set res ok
    188     } else {
    189       set res "a1=\[$a1\] a2=\[$a2\]"
    190     }
    191     set res
    192   } {ok}
    193 }
    194 
    195 # Increase the number of NULLs in column x
    196 #
    197 db eval {
    198    UPDATE t1 SET x=NULL;
    199    UPDATE t1 SET x=rowid
    200     WHERE rowid IN (SELECT rowid FROM t1 ORDER BY random() LIMIT 5);
    201    ANALYZE;
    202 }
    203 
    204 # Verify that range queries generate the correct row count estimates
    205 #
    206 foreach {testid where index rows} {
    207   500  {x IS NULL AND u='charlie'}         t1u  20
    208   501  {x=1 AND u='charlie'}               t1x   5
    209   502  {x IS NULL}                          {} 100
    210   503  {x=1}                               t1x  50
    211   504  {x IS NOT NULL}                     t1x  25
    212   505  {+x IS NOT NULL}                     {} 500
    213   506  {upper(x) IS NOT NULL}               {} 500
    214 
    215 } {
    216   # Verify that the expected index is used with the expected row count
    217   do_test analyze5-1.${testid}a {
    218     set x [lindex [eqp "SELECT * FROM t1 WHERE $where"] 3]
    219     set idx {}
    220     regexp {INDEX (t1.) } $x all idx
    221     regexp {~([0-9]+) rows} $x all nrow
    222     list $idx $nrow
    223   } [list $index $rows]
    224 
    225   # Verify that the same result is achieved regardless of whether or not
    226   # the index is used
    227   do_test analyze5-1.${testid}b {
    228     set w2 [string map {y +y z +z} $where]
    229     set a1 [db eval "SELECT rowid FROM t1 NOT INDEXED WHERE $w2\
    230                      ORDER BY +rowid"]
    231     set a2 [db eval "SELECT rowid FROM t1 WHERE $where ORDER BY +rowid"]
    232     if {$a1==$a2} {
    233       set res ok
    234     } else {
    235       set res "a1=\[$a1\] a2=\[$a2\]"
    236     }
    237     set res
    238   } {ok}
    239 }
    240 
    241 finish_test
    242