# 2008 June 26
#
# The author disclaims copyright to this source code.  In place of
# a legal notice, here is a blessing:
#
#    May you do good and not evil.
#    May you find forgiveness for yourself and forgive others.
#    May you share freely, never taking more than you give.
#
#*************************************************************************
# This file implements regression tests for SQLite library.  The focus
# of this script is testing the FTS2 module's optimize() function.
#
# $Id: fts2q.test,v 1.2 2008/07/22 23:49:44 shess Exp $
#

set testdir [file dirname $argv0]
source $testdir/tester.tcl

# Skip the whole file unless the fts2 capability is available
# (i.e. SQLITE_ENABLE_FTS2 was defined).
ifcapable !fts2 {
  finish_test
  return
}

#*************************************************************************
# Probe for the FTS2 dump_* functions by calling dump_terms() on a
# throw-away table.  If the call fails with the "unable to use
# function" error, the remaining tests cannot run and the file is
# skipped.
# TODO(shess): Change main.mk to do the right thing and remove this test.
db eval {
  DROP TABLE IF EXISTS t1;
  CREATE VIRTUAL TABLE t1 USING fts2(c);
  INSERT INTO t1 (rowid, c) VALUES (1, 'x');
}

set s {SELECT dump_terms(t1, 1) FROM t1 LIMIT 1}
set r {1 {unable to use function dump_terms in the requested context}}
if {[string equal [catchsql $s] $r]} {
  finish_test
  return
}

#*************************************************************************
# check_terms TEST LEVEL INDEX TERMS
#
# Runs test "TEST.terms", which passes when dump_terms() for the
# segment at LEVEL/INDEX of t1 yields exactly TERMS.
proc check_terms {test level index terms} {
  # The SQL refers to globals rather than to this proc's arguments.
  # TODO(shess): Figure out why uplevel in do_test can't catch
  # $level and $index directly.
  # NOTE(review): presumably do_test evaluates its script outside this
  # proc's frame -- confirm against tester.tcl.
  set ::index $index
  set ::level $level
  set expected [list $terms]
  do_test $test.terms {
    execsql {
      SELECT dump_terms(t1, $::level, $::index) FROM t1 LIMIT 1;
    }
  } $expected
}

# check_terms_all TEST TERMS
#
# Same as check_terms, but dump_terms() is called without a level/index
# so the terms of the entire index are compared against TERMS.
proc check_terms_all {test terms} {
  set expected [list $terms]
  do_test $test.terms {
    execsql {
      SELECT dump_terms(t1) FROM t1 LIMIT 1;
    }
  } $expected
}

# check_doclist TEST LEVEL INDEX TERM DOCLIST
#
# Runs test TEST, which passes when dump_doclist() for TERM in the
# segment at LEVEL/INDEX of t1 yields exactly DOCLIST.
proc check_doclist {test level index term doclist} {
  # TODO(shess): Again, why can't the non-:: versions work?
  set ::index $index
  set ::level $level
  set ::term $term
  set expected [list $doclist]
  do_test $test {
    execsql {
      SELECT dump_doclist(t1, $::term, $::level, $::index) FROM t1 LIMIT 1;
    }
  } $expected
}

# check_doclist_all TEST TERM DOCLIST
#
# Same as check_doclist, but dump_doclist() is called without a
# level/index so the doclist for TERM covers the entire index.
proc check_doclist_all {test term doclist} {
  set ::term $term
  set expected [list $doclist]
  do_test $test {
    execsql {
      SELECT dump_doclist(t1, $::term) FROM t1 LIMIT 1;
    }
  } $expected
}

#*************************************************************************
# Test results when all rows are deleted and one is added back.
# Previously older segments would continue to exist, but now the index
# should be dropped when the table is empty.  The results should look
# exactly like we never added the earlier rows in the first place.
db eval {
  DROP TABLE IF EXISTS t1;
  CREATE VIRTUAL TABLE t1 USING fts2(c);
  INSERT INTO t1 (rowid, c) VALUES (1, 'This is a test');
  INSERT INTO t1 (rowid, c) VALUES (2, 'That was a test');
  INSERT INTO t1 (rowid, c) VALUES (3, 'This is a test');
  DELETE FROM t1 WHERE 1=1; -- Delete each row rather than dropping table.
  INSERT INTO t1 (rowid, c) VALUES (1, 'This is a test');
}

# Should be a single initial segment.
do_test fts2q-1.segments {
  execsql {
    SELECT level, idx FROM t1_segdir ORDER BY level, idx;
  }
} {0 0}
do_test fts2q-1.matches {
  execsql {
    SELECT OFFSETS(t1) FROM t1
     WHERE t1 MATCH 'this OR that OR was OR a OR is OR test' ORDER BY rowid;
  }
} {{0 0 0 4 0 4 5 2 0 3 8 1 0 5 10 4}}

# Terms and per-term doclists over the entire index.
check_terms_all fts2q-1.1 {a is test this}
foreach {tnum tword tlist} {
  1 a    {[1 0[2]]}
  2 is   {[1 0[1]]}
  3 test {[1 0[3]]}
  4 this {[1 0[0]]}
} {
  check_doclist_all fts2q-1.1.$tnum $tword $tlist
}

# The same expectations, read from the segment at level 0, index 0.
check_terms fts2q-1.2 0 0 {a is test this}
foreach {tnum tword tlist} {
  1 a    {[1 0[2]]}
  2 is   {[1 0[1]]}
  3 test {[1 0[3]]}
  4 this {[1 0[0]]}
} {
  check_doclist fts2q-1.2.$tnum 0 0 $tword $tlist
}

#*************************************************************************
# Test results when everything is optimized manually, by renaming the
# table aside and copying the surviving row into a fresh table.
# NOTE(shess): This is a copy of fts2c-1.3.  I've pulled a copy here
# because fts2q-2 and fts2q-3 should have identical results.
db eval {
  DROP TABLE IF EXISTS t1;
  CREATE VIRTUAL TABLE t1 USING fts2(c);
  INSERT INTO t1 (rowid, c) VALUES (1, 'This is a test');
  INSERT INTO t1 (rowid, c) VALUES (2, 'That was a test');
  INSERT INTO t1 (rowid, c) VALUES (3, 'This is a test');
  DELETE FROM t1 WHERE rowid IN (1,3);
  DROP TABLE IF EXISTS t1old;
  ALTER TABLE t1 RENAME TO t1old;
  CREATE VIRTUAL TABLE t1 USING fts2(c);
  INSERT INTO t1 (rowid, c) SELECT rowid, c FROM t1old;
  DROP TABLE t1old;
}

# Should be a single optimal segment with the same logical results.
do_test fts2q-2.segments {
  execsql {
    SELECT level, idx FROM t1_segdir ORDER BY level, idx;
  }
} {0 0}
do_test fts2q-2.matches {
  execsql {
    SELECT OFFSETS(t1) FROM t1
     WHERE t1 MATCH 'this OR that OR was OR a OR is OR test' ORDER BY rowid;
  }
} {{0 1 0 4 0 2 5 3 0 3 9 1 0 5 11 4}}

# Only rowid 2 remains, so every doclist names document 2 alone.
check_terms_all fts2q-2.1 {a test that was}
foreach {tnum tword tlist} {
  1 a    {[2 0[2]]}
  2 test {[2 0[3]]}
  3 that {[2 0[0]]}
  4 was  {[2 0[1]]}
} {
  check_doclist_all fts2q-2.1.$tnum $tword $tlist
}

# The same expectations, read from the segment at level 0, index 0.
check_terms fts2q-2.2 0 0 {a test that was}
foreach {tnum tword tlist} {
  1 a    {[2 0[2]]}
  2 test {[2 0[3]]}
  3 that {[2 0[0]]}
  4 was  {[2 0[1]]}
} {
  check_doclist fts2q-2.2.$tnum 0 0 $tword $tlist
}

#*************************************************************************
# Test results when everything is optimized via optimize().
db eval {
  DROP TABLE IF EXISTS t1;
  CREATE VIRTUAL TABLE t1 USING fts2(c);
  INSERT INTO t1 (rowid, c) VALUES (1, 'This is a test');
  INSERT INTO t1 (rowid, c) VALUES (2, 'That was a test');
  INSERT INTO t1 (rowid, c) VALUES (3, 'This is a test');
  DELETE FROM t1 WHERE rowid IN (1,3);
  SELECT OPTIMIZE(t1) FROM t1 LIMIT 1;
}

# Should be a single optimal segment with the same logical results.
do_test fts2q-3.segments {
  execsql {
    SELECT level, idx FROM t1_segdir ORDER BY level, idx;
  }
} {0 0}
do_test fts2q-3.matches {
  execsql {
    SELECT OFFSETS(t1) FROM t1
     WHERE t1 MATCH 'this OR that OR was OR a OR is OR test' ORDER BY rowid;
  }
} {{0 1 0 4 0 2 5 3 0 3 9 1 0 5 11 4}}

# Expected values are the same as in the fts2q-2 checks.
check_terms_all fts2q-3.1 {a test that was}
foreach {tnum tword tlist} {
  1 a    {[2 0[2]]}
  2 test {[2 0[3]]}
  3 that {[2 0[0]]}
  4 was  {[2 0[1]]}
} {
  check_doclist_all fts2q-3.1.$tnum $tword $tlist
}

# The same expectations, read from the segment at level 0, index 0.
check_terms fts2q-3.2 0 0 {a test that was}
foreach {tnum tword tlist} {
  1 a    {[2 0[2]]}
  2 test {[2 0[3]]}
  3 that {[2 0[0]]}
  4 was  {[2 0[1]]}
} {
  check_doclist fts2q-3.2.$tnum 0 0 $tword $tlist
}

#*************************************************************************
# Test optimize() against a table involving segment merges.
# NOTE(shess): Since there's no transaction, each of the INSERT/UPDATE
# statements generates a segment.
# Fixture for the fts2q-4 tests: 3 INSERTs followed by 15 UPDATEs,
# 18 statements in all.  The statements are deliberately left outside
# any explicit transaction.
db eval {
  DROP TABLE IF EXISTS t1;
  CREATE VIRTUAL TABLE t1 USING fts2(c);

  INSERT INTO t1 (rowid, c) VALUES (1, 'This is a test');
  INSERT INTO t1 (rowid, c) VALUES (2, 'That was a test');
  INSERT INTO t1 (rowid, c) VALUES (3, 'This is a test');

  UPDATE t1 SET c = 'This is a test one' WHERE rowid = 1;
  UPDATE t1 SET c = 'That was a test one' WHERE rowid = 2;
  UPDATE t1 SET c = 'This is a test one' WHERE rowid = 3;

  UPDATE t1 SET c = 'This is a test two' WHERE rowid = 1;
  UPDATE t1 SET c = 'That was a test two' WHERE rowid = 2;
  UPDATE t1 SET c = 'This is a test two' WHERE rowid = 3;

  UPDATE t1 SET c = 'This is a test three' WHERE rowid = 1;
  UPDATE t1 SET c = 'That was a test three' WHERE rowid = 2;
  UPDATE t1 SET c = 'This is a test three' WHERE rowid = 3;

  UPDATE t1 SET c = 'This is a test four' WHERE rowid = 1;
  UPDATE t1 SET c = 'That was a test four' WHERE rowid = 2;
  UPDATE t1 SET c = 'This is a test four' WHERE rowid = 3;

  UPDATE t1 SET c = 'This is a test' WHERE rowid = 1;
  UPDATE t1 SET c = 'That was a test' WHERE rowid = 2;
  UPDATE t1 SET c = 'This is a test' WHERE rowid = 3;
}

# 2 segments in level 0, 1 in level 1 (18 segments created, 16
# merged).
do_test fts2q-4.segments {
  execsql {
    SELECT level, idx FROM t1_segdir ORDER BY level, idx;
  }
} {0 0 0 1 1 0}

do_test fts2q-4.matches {
  execsql {
    SELECT OFFSETS(t1) FROM t1
     WHERE t1 MATCH 'this OR that OR was OR a OR is OR test' ORDER BY rowid;
  }
} [list {0 0 0 4 0 4 5 2 0 3 8 1 0 5 10 4} \
        {0 1 0 4 0 2 5 3 0 3 9 1 0 5 11 4} \
        {0 0 0 4 0 4 5 2 0 3 8 1 0 5 10 4}]

# Entire index.  The terms from the intermediate updates (one, two,
# three, four) are still listed, but their doclists are empty.
check_terms_all fts2q-4.1 {a four is one test that this three two was}
foreach {tnum tword tlist} {
  1  a     {[1 0[2]] [2 0[2]] [3 0[2]]}
  2  four  {}
  3  is    {[1 0[1]] [3 0[1]]}
  4  one   {}
  5  test  {[1 0[3]] [2 0[3]] [3 0[3]]}
  6  that  {[2 0[0]]}
  7  this  {[1 0[0]] [3 0[0]]}
  8  three {}
  9  two   {}
  10 was   {[2 0[1]]}
} {
  check_doclist_all fts2q-4.1.$tnum $tword $tlist
}

# Segment at level 0, index 0.
check_terms fts2q-4.2 0 0 {a four test that was}
foreach {tnum tword tlist} {
  1 a    {[2 0[2]]}
  2 four {[2]}
  3 test {[2 0[3]]}
  4 that {[2 0[0]]}
  5 was  {[2 0[1]]}
} {
  check_doclist fts2q-4.2.$tnum 0 0 $tword $tlist
}

# Segment at level 0, index 1.
check_terms fts2q-4.3 0 1 {a four is test this}
foreach {tnum tword tlist} {
  1 a    {[3 0[2]]}
  2 four {[3]}
  3 is   {[3 0[1]]}
  4 test {[3 0[3]]}
  5 this {[3 0[0]]}
} {
  check_doclist fts2q-4.3.$tnum 0 1 $tword $tlist
}

# Segment at level 1, index 0.
check_terms fts2q-4.4 1 0 {a four is one test that this three two was}
foreach {tnum tword tlist} {
  1  a     {[1 0[2]] [2 0[2]] [3 0[2]]}
  2  four  {[1] [2 0[4]] [3 0[4]]}
  3  is    {[1 0[1]] [3 0[1]]}
  4  one   {[1] [2] [3]}
  5  test  {[1 0[3]] [2 0[3]] [3 0[3]]}
  6  that  {[2 0[0]]}
  7  this  {[1 0[0]] [3 0[0]]}
  8  three {[1] [2] [3]}
  9  two   {[1] [2] [3]}
  10 was   {[2 0[1]]}
} {
  check_doclist fts2q-4.4.$tnum 1 0 $tword $tlist
}

# Optimize should leave the result in the level of the highest-level
# prior segment.
do_test fts2q-4.5 {
  execsql {
    SELECT OPTIMIZE(t1) FROM t1 LIMIT 1;
    SELECT level, idx FROM t1_segdir ORDER BY level, idx;
  }
} {{Index optimized} 1 0}

# Identical to fts2q-4.matches.
do_test fts2q-4.5.matches {
  execsql {
    SELECT OFFSETS(t1) FROM t1
     WHERE t1 MATCH 'this OR that OR was OR a OR is OR test' ORDER BY rowid;
  }
} [list {0 0 0 4 0 4 5 2 0 3 8 1 0 5 10 4} \
        {0 1 0 4 0 2 5 3 0 3 9 1 0 5 11 4} \
        {0 0 0 4 0 4 5 2 0 3 8 1 0 5 10 4}]

# Entire index after optimize(): the terms with empty doclists are gone.
check_terms_all fts2q-4.5.1 {a is test that this was}
foreach {tnum tword tlist} {
  1 a    {[1 0[2]] [2 0[2]] [3 0[2]]}
  2 is   {[1 0[1]] [3 0[1]]}
  3 test {[1 0[3]] [2 0[3]] [3 0[3]]}
  4 that {[2 0[0]]}
  5 this {[1 0[0]] [3 0[0]]}
  6 was  {[2 0[1]]}
} {
  check_doclist_all fts2q-4.5.1.$tnum $tword $tlist
}

# The same expectations, read from the segment at level 1, index 0.
check_terms fts2q-4.5.2 1 0 {a is test that this was}
foreach {tnum tword tlist} {
  1 a    {[1 0[2]] [2 0[2]] [3 0[2]]}
  2 is   {[1 0[1]] [3 0[1]]}
  3 test {[1 0[3]] [2 0[3]] [3 0[3]]}
  4 that {[2 0[0]]}
  5 this {[1 0[0]] [3 0[0]]}
  6 was  {[2 0[1]]}
} {
  check_doclist fts2q-4.5.2.$tnum 1 0 $tword $tlist
}

# Re-optimizing does nothing.
do_test fts2q-5.0 {
  execsql {
    SELECT OPTIMIZE(t1) FROM t1 LIMIT 1;
    SELECT level, idx FROM t1_segdir ORDER BY level, idx;
  }
} {{Index already optimal} 1 0}

# Even if we move things around, still does nothing.
# Move the segment from level 1 to level 2 by editing t1_segdir
# directly; optimize() is expected to report the index as already
# optimal and to leave the segment at level 2.
do_test fts2q-5.1 {
  execsql {
    UPDATE t1_segdir SET level = 2 WHERE level = 1 AND idx = 0;
    SELECT OPTIMIZE(t1) FROM t1 LIMIT 1;
    SELECT level, idx FROM t1_segdir ORDER BY level, idx;
  }
} {{Index already optimal} 2 0}

finish_test