1 # 2007 April 26 2 # 3 # The author disclaims copyright to this source code. 4 # 5 #************************************************************************* 6 # This file implements tests for prefix-searching in the fts3 7 # component of the SQLite library. 8 # 9 # $Id: fts3an.test,v 1.2 2007/12/13 21:54:11 drh Exp $ 10 # 11 12 set testdir [file dirname $argv0] 13 source $testdir/tester.tcl 14 15 # If SQLITE_ENABLE_FTS3 is defined, omit this file. 16 ifcapable !fts3 { 17 finish_test 18 return 19 } 20 21 # A large string to prime the pump with. 22 set text { 23 Lorem ipsum dolor sit amet, consectetuer adipiscing elit. Maecenas 24 iaculis mollis ipsum. Praesent rhoncus placerat justo. Duis non quam 25 sed turpis posuere placerat. Curabitur et lorem in lorem porttitor 26 aliquet. Pellentesque bibendum tincidunt diam. Vestibulum blandit 27 ante nec elit. In sapien diam, facilisis eget, dictum sed, viverra 28 at, felis. Vestibulum magna. Sed magna dolor, vestibulum rhoncus, 29 ornare vel, vulputate sit amet, felis. Integer malesuada, tellus at 30 luctus gravida, diam nunc porta nibh, nec imperdiet massa metus eu 31 lectus. Aliquam nisi. Nunc fringilla nulla at lectus. Suspendisse 32 potenti. Cum sociis natoque penatibus et magnis dis parturient 33 montes, nascetur ridiculus mus. Pellentesque odio nulla, feugiat eu, 34 suscipit nec, consequat quis, risus. 35 } 36 37 db eval { 38 CREATE VIRTUAL TABLE t1 USING fts3(c); 39 40 INSERT INTO t1(rowid, c) VALUES(1, $text); 41 INSERT INTO t1(rowid, c) VALUES(2, 'Another lovely row'); 42 } 43 44 # Exact match 45 do_test fts3an-1.1 { 46 execsql "SELECT rowid FROM t1 WHERE t1 MATCH 'lorem'" 47 } {1} 48 49 # And a prefix 50 do_test fts3an-1.2 { 51 execsql "SELECT rowid FROM t1 WHERE t1 MATCH 'lore*'" 52 } {1} 53 54 # Prefix includes exact match 55 do_test fts3an-1.3 { 56 execsql "SELECT rowid FROM t1 WHERE t1 MATCH 'lorem*'" 57 } {1} 58 59 # Make certain everything isn't considered a prefix! 60 do_test fts3an-1.4 { 61 execsql "SELECT rowid FROM t1 WHERE t1 MATCH 'lore'" 62 } {} 63 64 # Prefix across multiple rows. 65 do_test fts3an-1.5 { 66 execsql "SELECT rowid FROM t1 WHERE t1 MATCH 'lo*'" 67 } {1 2} 68 69 # Likewise, with multiple hits in one document. 70 do_test fts3an-1.6 { 71 execsql "SELECT rowid FROM t1 WHERE t1 MATCH 'l*'" 72 } {1 2} 73 74 # Prefix which should only hit one document. 75 do_test fts3an-1.7 { 76 execsql "SELECT rowid FROM t1 WHERE t1 MATCH 'lov*'" 77 } {2} 78 79 # * not at end is dropped. 80 do_test fts3an-1.8 { 81 execsql "SELECT rowid FROM t1 WHERE t1 MATCH 'lo *'" 82 } {} 83 84 # Stand-alone * is dropped. 85 do_test fts3an-1.9 { 86 execsql "SELECT rowid FROM t1 WHERE t1 MATCH '*'" 87 } {} 88 89 # Phrase-query prefix. 90 do_test fts3an-1.10 { 91 execsql "SELECT rowid FROM t1 WHERE t1 MATCH '\"lovely r*\"'" 92 } {2} 93 do_test fts3an-1.11 { 94 execsql "SELECT rowid FROM t1 WHERE t1 MATCH '\"lovely r\"'" 95 } {} 96 97 # Phrase query with multiple prefix matches. 98 do_test fts3an-1.12 { 99 execsql "SELECT rowid FROM t1 WHERE t1 MATCH '\"a* l*\"'" 100 } {1 2} 101 102 # Phrase query with multiple prefix matches. 103 do_test fts3an-1.13 { 104 execsql "SELECT rowid FROM t1 WHERE t1 MATCH '\"a* l* row\"'" 105 } {2} 106 107 108 109 110 # Test across updates (and, by implication, deletes). 111 112 # Version of text without "lorem". 113 regsub -all {[Ll]orem} $text '' ntext 114 115 db eval { 116 CREATE VIRTUAL TABLE t2 USING fts3(c); 117 118 INSERT INTO t2(rowid, c) VALUES(1, $text); 119 INSERT INTO t2(rowid, c) VALUES(2, 'Another lovely row'); 120 UPDATE t2 SET c = $ntext WHERE rowid = 1; 121 } 122 123 # Can't see lorem as an exact match. 124 do_test fts3an-2.1 { 125 execsql "SELECT rowid FROM t2 WHERE t2 MATCH 'lorem'" 126 } {} 127 128 # Can't see a prefix of lorem, either. 129 do_test fts3an-2.2 { 130 execsql "SELECT rowid FROM t2 WHERE t2 MATCH 'lore*'" 131 } {} 132 133 # Can see lovely in the other document. 134 do_test fts3an-2.3 { 135 execsql "SELECT rowid FROM t2 WHERE t2 MATCH 'lo*'" 136 } {2} 137 138 # Can still see other hits. 139 do_test fts3an-2.4 { 140 execsql "SELECT rowid FROM t2 WHERE t2 MATCH 'l*'" 141 } {1 2} 142 143 # Prefix which should only hit one document. 144 do_test fts3an-2.5 { 145 execsql "SELECT rowid FROM t2 WHERE t2 MATCH 'lov*'" 146 } {2} 147 148 149 150 # Test with a segment which will have multiple levels in the tree. 151 152 # Build a big document with lots of unique terms. 153 set bigtext $text 154 foreach c {a b c d e} { 155 regsub -all {[A-Za-z]+} $bigtext "&$c" t 156 append bigtext $t 157 } 158 159 # Populate a table with many copies of the big document, so that we 160 # can test the number of hits found. Populate $ret with the expected 161 # hit counts for each row. offsets() returns 4 elements for every 162 # hit. We'll have 6 hits for row 1, 1 for row 2, and 6*(2^5)==192 for 163 # $bigtext. 164 set ret {6 1} 165 db eval { 166 BEGIN; 167 CREATE VIRTUAL TABLE t3 USING fts3(c); 168 169 INSERT INTO t3(rowid, c) VALUES(1, $text); 170 INSERT INTO t3(rowid, c) VALUES(2, 'Another lovely row'); 171 } 172 for {set i 0} {$i<68} {incr i} { 173 db eval {INSERT INTO t3(rowid, c) VALUES(3+$i, $bigtext)} 174 lappend ret 192 175 } 176 db eval {COMMIT;} 177 178 # Test that we get the expected number of hits. 179 do_test fts3an-3.1 { 180 set t {} 181 db eval {SELECT offsets(t3) as o FROM t3 WHERE t3 MATCH 'l*'} { 182 set l [llength $o] 183 lappend t [expr {$l/4}] 184 } 185 set t 186 } $ret 187 188 # Test a boundary condition: More than 2^16 terms that match a searched for 189 # prefix in a single segment. 190 # 191 puts "This next test can take a little while (~ 30 seconds)..." 192 do_test fts3an-4.1 { 193 execsql { CREATE VIRTUAL TABLE ft USING fts3(x) } 194 execsql BEGIN 195 execsql { INSERT INTO ft VALUES(NULL) } 196 execsql { INSERT INTO ft SELECT * FROM ft } ;# 2 197 execsql { INSERT INTO ft SELECT * FROM ft } ;# 4 198 execsql { INSERT INTO ft SELECT * FROM ft } ;# 8 199 execsql { INSERT INTO ft SELECT * FROM ft } ;# 16 200 execsql { INSERT INTO ft SELECT * FROM ft } ;# 32 201 execsql { INSERT INTO ft SELECT * FROM ft } ;# 64 202 execsql { INSERT INTO ft SELECT * FROM ft } ;# 128 203 execsql { INSERT INTO ft SELECT * FROM ft } ;# 256 204 execsql { INSERT INTO ft SELECT * FROM ft } ;# 512 205 execsql { INSERT INTO ft SELECT * FROM ft } ;# 1024 206 execsql { INSERT INTO ft SELECT * FROM ft } ;# 2048 207 execsql { INSERT INTO ft SELECT * FROM ft } ;# 4096 208 execsql { INSERT INTO ft SELECT * FROM ft } ;# 8192 209 execsql { INSERT INTO ft SELECT * FROM ft } ;# 16384 210 execsql { INSERT INTO ft SELECT * FROM ft } ;# 32768 211 execsql { INSERT INTO ft SELECT * FROM ft } ;# 65536 212 execsql { INSERT INTO ft SELECT * FROM ft } ;# 131072 213 execsql COMMIT 214 execsql { UPDATE ft SET x = 'abc' || rowid } 215 execsql { SELECT count(*) FROM ft WHERE x MATCH 'abc*' } 216 } {131072} 217 218 finish_test 219