OLD | NEW |
(Empty) | |
| 1 # 2010 November 02 |
| 2 # |
| 3 # The author disclaims copyright to this source code. In place of |
| 4 # a legal notice, here is a blessing: |
| 5 # |
| 6 # May you do good and not evil. |
| 7 # May you find forgiveness for yourself and forgive others. |
| 8 # May you share freely, never taking more than you give. |
| 9 # |
| 10 #*********************************************************************** |
| 11 # This file implements regression tests for the FTS3 module. The focus |
| 12 # of this file is tables created with the "matchinfo=fts3" option. |
| 13 # |
| 14 |
| 15 set testdir [file dirname $argv0] |
| 16 source $testdir/tester.tcl |
| 17 |
| 18 # If SQLITE_ENABLE_FTS3 is not defined, omit this file. |
| 19 ifcapable !fts3 { finish_test ; return } |
| 20 |
| 21 set testprefix fts3matchinfo |
| 22 |
| 23 proc mit {blob} { |
| 24 set scan(littleEndian) i* |
| 25 set scan(bigEndian) I* |
| 26 binary scan $blob $scan($::tcl_platform(byteOrder)) r |
| 27 return $r |
| 28 } |
| 29 db func mit mit |
| 30 |
| 31 do_execsql_test 1.0 { |
| 32 CREATE VIRTUAL TABLE t1 USING fts4(matchinfo=fts3); |
| 33 SELECT name FROM sqlite_master WHERE type = 'table'; |
| 34 } {t1 t1_content t1_segments t1_segdir t1_stat} |
| 35 |
| 36 do_execsql_test 1.1 { |
| 37 INSERT INTO t1(content) VALUES('I wandered lonely as a cloud'); |
| 38 INSERT INTO t1(content) VALUES('That floats on high o''er vales and hills,'); |
| 39 INSERT INTO t1(content) VALUES('When all at once I saw a crowd,'); |
| 40 INSERT INTO t1(content) VALUES('A host, of golden daffodils,'); |
| 41 SELECT mit(matchinfo(t1)) FROM t1 WHERE t1 MATCH 'I'; |
| 42 } {{1 1 1 2 2} {1 1 1 2 2}} |
| 43 |
| 44 # Now create an FTS4 table that does not specify matchinfo=fts3. |
| 45 # |
| 46 do_execsql_test 1.2 { |
| 47 CREATE VIRTUAL TABLE t2 USING fts4; |
| 48 INSERT INTO t2 SELECT * FROM t1; |
| 49 SELECT mit(matchinfo(t2)) FROM t2 WHERE t2 MATCH 'I'; |
| 50 } {{1 1 1 2 2} {1 1 1 2 2}} |
| 51 |
| 52 # Test some syntax-error handling. |
| 53 # |
| 54 do_catchsql_test 2.0 { |
| 55 CREATE VIRTUAL TABLE x1 USING fts4(matchinfo=fs3); |
| 56 } {1 {unrecognized matchinfo: fs3}} |
| 57 do_catchsql_test 2.1 { |
| 58 CREATE VIRTUAL TABLE x2 USING fts4(mtchinfo=fts3); |
| 59 } {1 {unrecognized parameter: mtchinfo=fts3}} |
| 60 |
| 61 # Check that with fts3, the "=" character is permitted in column definitions. |
| 62 # |
| 63 do_execsql_test 3.1 { |
| 64 CREATE VIRTUAL TABLE t3 USING fts3(mtchinfo=fts3); |
| 65 INSERT INTO t3(mtchinfo) VALUES('Beside the lake, beneath the trees'); |
| 66 SELECT mtchinfo FROM t3; |
| 67 } {{Beside the lake, beneath the trees}} |
| 68 |
| 69 do_execsql_test 3.2 { |
| 70 CREATE VIRTUAL TABLE xx USING FTS4; |
| 71 SELECT * FROM xx WHERE xx MATCH 'abc'; |
| 72 SELECT * FROM xx WHERE xx MATCH 'a b c'; |
| 73 } |
| 74 |
| 75 |
| 76 #-------------------------------------------------------------------------- |
| 77 # Proc [do_matchinfo_test] is used to test the FTSX matchinfo() function. |
| 78 # |
| 79 # The first argument - $tn - is a test identifier. This may be either a |
| 80 # full identifier (i.e. "fts3matchinfo-1.1") or, if global var $testprefix |
| 81 # is set, just the numeric component (i.e. "1.1"). |
| 82 # |
| 83 # The second argument is the name of an FTSX table. The third is the |
| 84 # full text of a WHERE/MATCH expression to query the table for |
| 85 # (i.e. "t1 MATCH 'abc'"). The final argument - $results - should be a |
| 86 # key-value list (serialized array) with matchinfo() format specifiers |
| 87 # as keys, and the results of executing the statement: |
| 88 # |
| 89 # SELECT matchinfo($tbl, '$key') FROM $tbl WHERE $expr |
| 90 # |
| 91 # For example: |
| 92 # |
| 93 # CREATE VIRTUAL TABLE t1 USING fts4; |
| 94 # INSERT INTO t1 VALUES('abc'); |
| 95 # INSERT INTO t1 VALUES('def'); |
| 96 # INSERT INTO t1 VALUES('abc abc'); |
| 97 # |
| 98 # do_matchinfo_test 1.1 t1 "t1 MATCH 'abc'" { |
| 99 # n {3 3} |
| 100 # p {1 1} |
| 101 # c {1 1} |
| 102 # x {{1 3 2} {2 3 2}} |
| 103 # } |
| 104 # |
| 105 # If the $results list contains keys mapped to "-" instead of a matchinfo() |
| 106 # result, then this command computes the expected results based on other |
| 107 # mappings to test the matchinfo() function. For example, the command above |
| 108 # could be changed to: |
| 109 # |
| 110 # do_matchinfo_test 1.1 t1 "t1 MATCH 'abc'" { |
| 111 # n {3 3} p {1 1} c {1 1} x {{1 3 2} {2 3 2}} |
| 112 # pcx - |
| 113 # } |
| 114 # |
| 115 # And this command would compute the expected results for matchinfo(t1, 'pcx') |
| 116 # based on the results of matchinfo(t1, 'p'), matchinfo(t1, 'c') and |
| 117 # matchinfo(t1, 'x') in order to test 'pcx'. |
| 118 # |
| 119 proc do_matchinfo_test {tn tbl expr results} { |
| 120 |
| 121 foreach {fmt res} $results { |
| 122 if {$res == "-"} continue |
| 123 set resarray($fmt) $res |
| 124 } |
| 125 |
| 126 set nRow 0 |
| 127 foreach {fmt res} [array get resarray] { |
| 128 if {[llength $res]>$nRow} { set nRow [llength $res] } |
| 129 } |
| 130 |
| 131 # Construct expected results for any formats for which the caller |
| 132 # supplied result is "-". |
| 133 # |
| 134 foreach {fmt res} $results { |
| 135 if {$res == "-"} { |
| 136 set res [list] |
| 137 for {set iRow 0} {$iRow<$nRow} {incr iRow} { |
| 138 set rowres [list] |
| 139 foreach c [split $fmt ""] { |
| 140 set rowres [concat $rowres [lindex $resarray($c) $iRow]] |
| 141 } |
| 142 lappend res $rowres |
| 143 } |
| 144 set resarray($fmt) $res |
| 145 } |
| 146 } |
| 147 |
| 148 # Test each matchinfo() request individually. |
| 149 # |
| 150 foreach {fmt res} [array get resarray] { |
| 151 set sql "SELECT mit(matchinfo($tbl, '$fmt')) FROM $tbl WHERE $expr" |
| 152 do_execsql_test $tn.$fmt $sql [normalize2 $res] |
| 153 } |
| 154 |
| 155 # Test them all executed together (multiple invocations of matchinfo()). |
| 156 # |
| 157 set exprlist [list] |
| 158 foreach {format res} [array get resarray] { |
| 159 lappend exprlist "mit(matchinfo($tbl, '$format'))" |
| 160 } |
| 161 set allres [list] |
| 162 for {set iRow 0} {$iRow<$nRow} {incr iRow} { |
| 163 foreach {format res} [array get resarray] { |
| 164 lappend allres [lindex $res $iRow] |
| 165 } |
| 166 } |
| 167 set sql "SELECT [join $exprlist ,] FROM $tbl WHERE $expr" |
| 168 do_execsql_test $tn.multi $sql [normalize2 $allres] |
| 169 } |
| 170 proc normalize2 {list_of_lists} { |
| 171 set res [list] |
| 172 foreach elem $list_of_lists { |
| 173 lappend res [list {*}$elem] |
| 174 } |
| 175 return $res |
| 176 } |
| 177 |
| 178 |
| 179 do_execsql_test 4.1.0 { |
| 180 CREATE VIRTUAL TABLE t4 USING fts4(x, y); |
| 181 INSERT INTO t4 VALUES('a b c d e', 'f g h i j'); |
| 182 INSERT INTO t4 VALUES('f g h i j', 'a b c d e'); |
| 183 } |
| 184 |
| 185 do_matchinfo_test 4.1.1 t4 {t4 MATCH 'a b c'} { |
| 186 p {3 3} |
| 187 c {2 2} |
| 188 x { |
| 189 {1 1 1 0 1 1 1 1 1 0 1 1 1 1 1 0 1 1} |
| 190 {0 1 1 1 1 1 0 1 1 1 1 1 0 1 1 1 1 1} |
| 191 } |
| 192 n {2 2} |
| 193 l {{5 5} {5 5}} |
| 194 a {{5 5} {5 5}} |
| 195 |
| 196 s {{3 0} {0 3}} |
| 197 |
| 198 xxxxxxxxxxxxxxxxxx - pcx - xpc - ccc - pppxpcpcx - laxnpc - |
| 199 xpxsscplax - |
| 200 } |
| 201 |
| 202 do_matchinfo_test 4.1.2 t4 {t4 MATCH '"g h i"'} { |
| 203 p {1 1} |
| 204 c {2 2} |
| 205 x { |
| 206 {0 1 1 1 1 1} |
| 207 {1 1 1 0 1 1} |
| 208 } |
| 209 n {2 2} |
| 210 l {{5 5} {5 5}} |
| 211 a {{5 5} {5 5}} |
| 212 |
| 213 s {{0 1} {1 0}} |
| 214 |
| 215 xxxxxxxxxxxxxxxxxx - pcx - xpc - ccc - pppxpcpcx - laxnpc - |
| 216 sxsxs - |
| 217 } |
| 218 |
| 219 do_matchinfo_test 4.1.3 t4 {t4 MATCH 'a b'} { s {{2 0} {0 2}} } |
| 220 do_matchinfo_test 4.1.4 t4 {t4 MATCH '"a b" c'} { s {{2 0} {0 2}} } |
| 221 do_matchinfo_test 4.1.5 t4 {t4 MATCH 'a "b c"'} { s {{2 0} {0 2}} } |
| 222 do_matchinfo_test 4.1.6 t4 {t4 MATCH 'd d'} { s {{1 0} {0 1}} } |
| 223 |
| 224 do_execsql_test 4.2.0 { |
| 225 CREATE VIRTUAL TABLE t5 USING fts4; |
| 226 INSERT INTO t5 VALUES('a a a a a'); |
| 227 INSERT INTO t5 VALUES('a b a b a'); |
| 228 INSERT INTO t5 VALUES('c b c b c'); |
| 229 INSERT INTO t5 VALUES('x x x x x'); |
| 230 } |
| 231 do_matchinfo_test 4.2.1 t5 {t5 MATCH 'a a'} { |
| 232 x {{5 8 2 5 8 2} {3 8 2 3 8 2}} |
| 233 s {2 1} |
| 234 } |
| 235 do_matchinfo_test 4.2.2 t5 {t5 MATCH 'a b'} { s {2} } |
| 236 do_matchinfo_test 4.2.3 t5 {t5 MATCH 'a b a'} { s {3} } |
| 237 do_matchinfo_test 4.2.4 t5 {t5 MATCH 'a a a'} { s {3 1} } |
| 238 do_matchinfo_test 4.2.5 t5 {t5 MATCH '"a b" "a b"'} { s {2} } |
| 239 do_matchinfo_test 4.2.6 t5 {t5 MATCH 'a OR b'} { s {1 2 1} } |
| 240 |
| 241 do_execsql_test 4.3.0 "INSERT INTO t5 VALUES('x y [string repeat {b } 50000]')"; |
| 242 |
| 243 do_matchinfo_test 4.3.1 t5 {t5 MATCH 'a a'} { |
| 244 x {{5 8 2 5 5 5} {3 8 2 3 5 5}} |
| 245 s {2 1} |
| 246 } |
| 247 |
| 248 do_matchinfo_test 4.3.2 t5 {t5 MATCH 'a b'} { s {2} } |
| 249 do_matchinfo_test 4.3.3 t5 {t5 MATCH 'a b a'} { s {3} } |
| 250 do_matchinfo_test 4.3.4 t5 {t5 MATCH 'a a a'} { s {3 1} } |
| 251 do_matchinfo_test 4.3.5 t5 {t5 MATCH '"a b" "a b"'} { s {2} } |
| 252 do_matchinfo_test 4.3.6 t5 {t5 MATCH 'a OR b'} { s {1 2 1 1} } |
| 253 |
| 254 do_execsql_test 4.4.0 { |
| 255 INSERT INTO t5(t5) VALUES('optimize'); |
| 256 UPDATE t5_segments |
| 257 SET block = zeroblob(length(block)) |
| 258 WHERE length(block)>10000; |
| 259 } |
| 260 |
| 261 do_matchinfo_test 4.4.2 t5 {t5 MATCH 'a b'} { s {2} } |
| 262 do_matchinfo_test 4.4.1 t5 {t5 MATCH 'a a'} { s {2 1} } |
| 263 do_matchinfo_test 4.4.2 t5 {t5 MATCH 'a b'} { s {2} } |
| 264 do_matchinfo_test 4.4.3 t5 {t5 MATCH 'a b a'} { s {3} } |
| 265 do_matchinfo_test 4.4.4 t5 {t5 MATCH 'a a a'} { s {3 1} } |
| 266 do_matchinfo_test 4.4.5 t5 {t5 MATCH '"a b" "a b"'} { s {2} } |
| 267 |
| 268 do_execsql_test 4.5.0 { |
| 269 CREATE VIRTUAL TABLE t6 USING fts4(a, b, c); |
| 270 INSERT INTO t6 VALUES('a', 'b', 'c'); |
| 271 } |
| 272 do_matchinfo_test 4.5.1 t6 {t6 MATCH 'a b c'} { s {{1 1 1}} } |
| 273 |
| 274 |
| 275 #------------------------------------------------------------------------- |
| 276 # Check the following restrictions: |
| 277 # |
| 278 # + Matchinfo flags 'a', 'l' and 'n' can only be used with fts4, not fts3. |
| 279 # + Matchinfo flag 'l' cannot be used with matchinfo=fts3. |
| 280 # |
| 281 do_execsql_test 5.1 { |
| 282 CREATE VIRTUAL TABLE t7 USING fts3(a, b); |
| 283 INSERT INTO t7 VALUES('u v w', 'x y z'); |
| 284 |
| 285 CREATE VIRTUAL TABLE t8 USING fts4(a, b, matchinfo=fts3); |
| 286 INSERT INTO t8 VALUES('u v w', 'x y z'); |
| 287 } |
| 288 |
| 289 do_catchsql_test 5.2.1 { |
| 290 SELECT matchinfo(t7, 'a') FROM t7 WHERE t7 MATCH 'x y' |
| 291 } {1 {unrecognized matchinfo request: a}} |
| 292 do_catchsql_test 5.2.2 { |
| 293 SELECT matchinfo(t7, 'l') FROM t7 WHERE t7 MATCH 'x y' |
| 294 } {1 {unrecognized matchinfo request: l}} |
| 295 do_catchsql_test 5.2.3 { |
| 296 SELECT matchinfo(t7, 'n') FROM t7 WHERE t7 MATCH 'x y' |
| 297 } {1 {unrecognized matchinfo request: n}} |
| 298 |
| 299 do_catchsql_test 5.3.1 { |
| 300 SELECT matchinfo(t8, 'l') FROM t8 WHERE t8 MATCH 'x y' |
| 301 } {1 {unrecognized matchinfo request: l}} |
| 302 |
| 303 #------------------------------------------------------------------------- |
| 304 # Test that the offsets() function handles corruption in the %_content |
| 305 # table correctly. |
| 306 # |
| 307 do_execsql_test 6.1 { |
| 308 CREATE VIRTUAL TABLE t9 USING fts4; |
| 309 INSERT INTO t9 VALUES( |
| 310 'this record is used to try to dectect corruption' |
| 311 ); |
| 312 SELECT offsets(t9) FROM t9 WHERE t9 MATCH 'to'; |
| 313 } {{0 0 20 2 0 0 27 2}} |
| 314 |
| 315 do_catchsql_test 6.2 { |
| 316 UPDATE t9_content SET c0content = 'this record is used to'; |
| 317 SELECT offsets(t9) FROM t9 WHERE t9 MATCH 'to'; |
| 318 } {1 {database disk image is malformed}} |
| 319 |
| 320 #------------------------------------------------------------------------- |
| 321 # Test the outcome of matchinfo() when used within a query that does not |
| 322 # use the full-text index (i.e. lookup by rowid or full-table scan). |
| 323 # |
| 324 do_execsql_test 7.1 { |
| 325 CREATE VIRTUAL TABLE t10 USING fts4; |
| 326 INSERT INTO t10 VALUES('first record'); |
| 327 INSERT INTO t10 VALUES('second record'); |
| 328 } |
| 329 do_execsql_test 7.2 { |
| 330 SELECT typeof(matchinfo(t10)), length(matchinfo(t10)) FROM t10; |
| 331 } {blob 0 blob 0} |
| 332 do_execsql_test 7.3 { |
| 333 SELECT typeof(matchinfo(t10)), length(matchinfo(t10)) FROM t10 WHERE docid=1; |
| 334 } {blob 0} |
| 335 do_execsql_test 7.4 { |
| 336 SELECT typeof(matchinfo(t10)), length(matchinfo(t10)) |
| 337 FROM t10 WHERE t10 MATCH 'record' |
| 338 } {blob 20 blob 20} |
| 339 |
| 340 #------------------------------------------------------------------------- |
| 341 # Test a special case - matchinfo('nxa') with many zero length documents. |
| 342 # Special because "x" internally uses a statement used by both "n" and "a". |
| 343 # This was causing a problem at one point in the obscure case where the |
| 344 # total number of bytes of data stored in an fts3 table was greater than |
| 345 # the number of rows. i.e. when the following query returns true: |
| 346 # |
| 347 # SELECT sum(length(content)) < count(*) FROM fts4table; |
| 348 # |
| 349 do_execsql_test 8.1 { |
| 350 CREATE VIRTUAL TABLE t11 USING fts4; |
| 351 INSERT INTO t11(t11) VALUES('nodesize=24'); |
| 352 INSERT INTO t11 VALUES('quitealongstringoftext'); |
| 353 INSERT INTO t11 VALUES('anotherquitealongstringoftext'); |
| 354 INSERT INTO t11 VALUES('athirdlongstringoftext'); |
| 355 INSERT INTO t11 VALUES('andonemoreforgoodluck'); |
| 356 } |
| 357 do_test 8.2 { |
| 358 for {set i 0} {$i < 200} {incr i} { |
| 359 execsql { INSERT INTO t11 VALUES('') } |
| 360 } |
| 361 execsql { INSERT INTO t11(t11) VALUES('optimize') } |
| 362 } {} |
| 363 do_execsql_test 8.3 { |
| 364 SELECT mit(matchinfo(t11, 'nxa')) FROM t11 WHERE t11 MATCH 'a*' |
| 365 } {{204 1 3 3 0} {204 1 3 3 0} {204 1 3 3 0}} |
| 366 |
| 367 # Corruption related tests. |
| 368 do_execsql_test 8.4.1.1 { UPDATE t11_stat SET value = X'0000'; } |
| 369 do_catchsql_test 8.5.1.2 { |
| 370 SELECT mit(matchinfo(t11, 'nxa')) FROM t11 WHERE t11 MATCH 'a*' |
| 371 } {1 {database disk image is malformed}} |
| 372 |
| 373 do_execsql_test 8.4.2.1 { UPDATE t11_stat SET value = X'00'; } |
| 374 do_catchsql_test 8.5.2.2 { |
| 375 SELECT mit(matchinfo(t11, 'nxa')) FROM t11 WHERE t11 MATCH 'a*' |
| 376 } {1 {database disk image is malformed}} |
| 377 |
| 378 do_execsql_test 8.4.3.1 { UPDATE t11_stat SET value = NULL; } |
| 379 do_catchsql_test 8.5.3.2 { |
| 380 SELECT mit(matchinfo(t11, 'nxa')) FROM t11 WHERE t11 MATCH 'a*' |
| 381 } {1 {database disk image is malformed}} |
| 382 |
| 383 finish_test |
| 384 |
OLD | NEW |