modernc.org/cc@v1.0.1/v2/testdata/_sqlite/ext/fts5/test/fts5matchinfo.test (about) 1 # 2015 August 05 2 # 3 # The author disclaims copyright to this source code. In place of 4 # a legal notice, here is a blessing: 5 # 6 # May you do good and not evil. 7 # May you find forgiveness for yourself and forgive others. 8 # May you share freely, never taking more than you give. 9 # 10 #*********************************************************************** 11 # 12 13 source [file join [file dirname [info script]] fts5_common.tcl] 14 set testprefix fts5matchinfo 15 16 # If SQLITE_ENABLE_FTS5 is not defined, omit this file. 17 ifcapable !fts5 { finish_test ; return } 18 19 foreach_detail_mode $testprefix { 20 21 proc mit {blob} { 22 set scan(littleEndian) i* 23 set scan(bigEndian) I* 24 binary scan $blob $scan($::tcl_platform(byteOrder)) r 25 return $r 26 } 27 db func mit mit 28 29 sqlite3_fts5_register_matchinfo db 30 31 do_execsql_test 1.0 { 32 CREATE VIRTUAL TABLE t1 USING fts5(content, detail=%DETAIL%); 33 } 34 35 do_execsql_test 1.1 { 36 INSERT INTO t1(content) VALUES('I wandered lonely as a cloud'); 37 INSERT INTO t1(content) VALUES('That floats on high o''er vales and hills,'); 38 INSERT INTO t1(content) VALUES('When all at once I saw a crowd,'); 39 INSERT INTO t1(content) VALUES('A host, of golden daffodils,'); 40 SELECT mit(matchinfo(t1)) FROM t1 WHERE t1 MATCH 'I'; 41 } {{1 1 1 2 2} {1 1 1 2 2}} 42 43 # Now create an FTS4 table that does not specify matchinfo=fts3. 44 # 45 do_execsql_test 1.2 { 46 CREATE VIRTUAL TABLE t2 USING fts5(content, detail=%DETAIL%); 47 INSERT INTO t2 SELECT * FROM t1; 48 SELECT mit(matchinfo(t2)) FROM t2 WHERE t2 MATCH 'I'; 49 } {{1 1 1 2 2} {1 1 1 2 2}} 50 51 52 #-------------------------------------------------------------------------- 53 # Proc [do_matchinfo_test] is used to test the FTSX matchinfo() function. 54 # 55 # The first argument - $tn - is a test identifier. This may be either a 56 # full identifier (i.e. "fts3matchinfo-1.1") or, if global var $testprefix 57 # is set, just the numeric component (i.e. "1.1"). 58 # 59 # The second argument is the name of an FTSX table. The third is the 60 # full text of a WHERE/MATCH expression to query the table for 61 # (i.e. "t1 MATCH 'abc'"). The final argument - $results - should be a 62 # key-value list (serialized array) with matchinfo() format specifiers 63 # as keys, and the results of executing the statement: 64 # 65 # SELECT matchinfo($tbl, '$key') FROM $tbl WHERE $expr 66 # 67 # For example: 68 # 69 # CREATE VIRTUAL TABLE t1 USING fts4; 70 # INSERT INTO t1 VALUES('abc'); 71 # INSERT INTO t1 VALUES('def'); 72 # INSERT INTO t1 VALUES('abc abc'); 73 # 74 # do_matchinfo_test 1.1 t1 "t1 MATCH 'abc'" { 75 # n {3 3} 76 # p {1 1} 77 # c {1 1} 78 # x {{1 3 2} {2 3 2}} 79 # } 80 # 81 # If the $results list contains keys mapped to "-" instead of a matchinfo() 82 # result, then this command computes the expected results based on other 83 # mappings to test the matchinfo() function. For example, the command above 84 # could be changed to: 85 # 86 # do_matchinfo_test 1.1 t1 "t1 MATCH 'abc'" { 87 # n {3 3} p {1 1} c {1 1} x {{1 3 2} {2 3 2}} 88 # pcx - 89 # } 90 # 91 # And this command would compute the expected results for matchinfo(t1, 'pcx') 92 # based on the results of matchinfo(t1, 'p'), matchinfo(t1, 'c') and 93 # matchinfo(t1, 'x') in order to test 'pcx'. 94 # 95 proc do_matchinfo_test {tn tbl expr results} { 96 97 foreach {fmt res} $results { 98 if {$res == "-"} continue 99 set resarray($fmt) $res 100 } 101 102 set nRow 0 103 foreach {fmt res} [array get resarray] { 104 if {[llength $res]>$nRow} { set nRow [llength $res] } 105 } 106 107 # Construct expected results for any formats for which the caller 108 # supplied result is "-". 109 # 110 foreach {fmt res} $results { 111 if {$res == "-"} { 112 set res [list] 113 for {set iRow 0} {$iRow<$nRow} {incr iRow} { 114 set rowres [list] 115 foreach c [split $fmt ""] { 116 set rowres [concat $rowres [lindex $resarray($c) $iRow]] 117 } 118 lappend res $rowres 119 } 120 set resarray($fmt) $res 121 } 122 } 123 124 # Test each matchinfo() request individually. 125 # 126 foreach {fmt res} [array get resarray] { 127 set sql "SELECT mit(matchinfo($tbl, '$fmt')) FROM $tbl WHERE $expr" 128 do_execsql_test $tn.$fmt $sql [normalize2 $res] 129 } 130 131 # Test them all executed together (multiple invocations of matchinfo()). 132 # 133 set exprlist [list] 134 foreach {format res} [array get resarray] { 135 lappend exprlist "mit(matchinfo($tbl, '$format'))" 136 } 137 set allres [list] 138 for {set iRow 0} {$iRow<$nRow} {incr iRow} { 139 foreach {format res} [array get resarray] { 140 lappend allres [lindex $res $iRow] 141 } 142 } 143 set sql "SELECT [join $exprlist ,] FROM $tbl WHERE $expr" 144 do_execsql_test $tn.multi $sql [normalize2 $allres] 145 } 146 proc normalize2 {list_of_lists} { 147 set res [list] 148 foreach elem $list_of_lists { 149 lappend res [list {*}$elem] 150 } 151 return $res 152 } 153 154 # Similar to [do_matchinfo_test], except that this is a no-op if the FTS5 155 # mode is not detail=full. 156 # 157 proc do_matchinfo_p_test {tn tbl expr results} { 158 if {[detail_is_full]} { 159 uplevel [list do_matchinfo_test $tn $tbl $expr $results] 160 } 161 } 162 163 do_execsql_test 4.1.0 { 164 CREATE VIRTUAL TABLE t4 USING fts5(x, y, detail=%DETAIL%); 165 INSERT INTO t4 VALUES('a b c d e', 'f g h i j'); 166 INSERT INTO t4 VALUES('f g h i j', 'a b c d e'); 167 } 168 169 do_matchinfo_test 4.1.1 t4 {t4 MATCH 'a b c'} { 170 s {{3 0} {0 3}} 171 } 172 173 do_matchinfo_test 4.1.1 t4 {t4 MATCH 'a b c'} { 174 p {3 3} 175 x { 176 {1 1 1 0 1 1 1 1 1 0 1 1 1 1 1 0 1 1} 177 {0 1 1 1 1 1 0 1 1 1 1 1 0 1 1 1 1 1} 178 } 179 } 180 181 do_matchinfo_test 4.1.1 t4 {t4 MATCH 'a b c'} { 182 p {3 3} 183 c {2 2} 184 x { 185 {1 1 1 0 1 1 1 1 1 0 1 1 1 1 1 0 1 1} 186 {0 1 1 1 1 1 0 1 1 1 1 1 0 1 1 1 1 1} 187 } 188 n {2 2} 189 l {{5 5} {5 5}} 190 a {{5 5} {5 5}} 191 192 s {{3 0} {0 3}} 193 194 xxxxxxxxxxxxxxxxxx - pcx - xpc - ccc - pppxpcpcx - laxnpc - 195 xpxsscplax - 196 } 197 198 do_matchinfo_p_test 4.1.2 t4 {t4 MATCH '"g h i"'} { 199 p {1 1} 200 c {2 2} 201 x { 202 {0 1 1 1 1 1} 203 {1 1 1 0 1 1} 204 } 205 n {2 2} 206 l {{5 5} {5 5}} 207 a {{5 5} {5 5}} 208 209 s {{0 1} {1 0}} 210 211 xxxxxxxxxxxxxxxxxx - pcx - xpc - ccc - pppxpcpcx - laxnpc - 212 sxsxs - 213 } 214 215 do_matchinfo_test 4.1.3 t4 {t4 MATCH 'a b'} { s {{2 0} {0 2}} } 216 do_matchinfo_p_test 4.1.4 t4 {t4 MATCH '"a b" c'} { s {{2 0} {0 2}} } 217 do_matchinfo_p_test 4.1.5 t4 {t4 MATCH 'a "b c"'} { s {{2 0} {0 2}} } 218 do_matchinfo_test 4.1.6 t4 {t4 MATCH 'd d'} { s {{1 0} {0 1}} } 219 do_matchinfo_test 4.1.7 t4 {t4 MATCH 'f OR abcd'} { 220 x { 221 {0 1 1 1 1 1 0 0 0 0 0 0} 222 {1 1 1 0 1 1 0 0 0 0 0 0} 223 } 224 } 225 do_matchinfo_test 4.1.8 t4 {t4 MATCH 'f NOT abcd'} { 226 x { 227 {0 1 1 1 1 1 0 0 0 0 0 0} 228 {1 1 1 0 1 1 0 0 0 0 0 0} 229 } 230 } 231 232 do_execsql_test 4.2.0 { 233 CREATE VIRTUAL TABLE t5 USING fts5(content, detail=%DETAIL%); 234 INSERT INTO t5 VALUES('a a a a a'); 235 INSERT INTO t5 VALUES('a b a b a'); 236 INSERT INTO t5 VALUES('c b c b c'); 237 INSERT INTO t5 VALUES('x x x x x'); 238 } 239 do_matchinfo_test 4.2.1 t5 {t5 MATCH 'a a'} { 240 x {{5 8 2 5 8 2} {3 8 2 3 8 2}} 241 s {2 1} 242 } 243 do_matchinfo_test 4.2.2 t5 {t5 MATCH 'a b'} { s {2} } 244 do_matchinfo_test 4.2.3 t5 {t5 MATCH 'a b a'} { s {3} } 245 do_matchinfo_test 4.2.4 t5 {t5 MATCH 'a a a'} { s {3 1} } 246 do_matchinfo_p_test 4.2.5 t5 {t5 MATCH '"a b" "a b"'} { s {2} } 247 do_matchinfo_test 4.2.6 t5 {t5 MATCH 'a OR b'} { s {1 2 1} } 248 249 do_execsql_test 4.3.0 "INSERT INTO t5 VALUES('x y [string repeat {b } 50000]')"; 250 251 # It used to be that the second 'a' token would be deferred. That doesn't 252 # work any longer. 253 if 0 { 254 do_matchinfo_test 4.3.1 t5 {t5 MATCH 'a a'} { 255 x {{5 8 2 5 5 5} {3 8 2 3 5 5}} 256 s {2 1} 257 } 258 } 259 260 do_matchinfo_test 4.3.2 t5 {t5 MATCH 'a b'} { s {2} } 261 do_matchinfo_test 4.3.3 t5 {t5 MATCH 'a b a'} { s {3} } 262 do_matchinfo_test 4.3.4 t5 {t5 MATCH 'a a a'} { s {3 1} } 263 do_matchinfo_p_test 4.3.5 t5 {t5 MATCH '"a b" "a b"'} { s {2} } 264 do_matchinfo_test 4.3.6 t5 {t5 MATCH 'a OR b'} { s {1 2 1 1} } 265 266 do_execsql_test 4.4.0.1 { INSERT INTO t5(t5) VALUES('optimize') } 267 268 do_matchinfo_test 4.4.2 t5 {t5 MATCH 'a b'} { s {2} } 269 do_matchinfo_test 4.4.1 t5 {t5 MATCH 'a a'} { s {2 1} } 270 do_matchinfo_test 4.4.2 t5 {t5 MATCH 'a b'} { s {2} } 271 do_matchinfo_test 4.4.3 t5 {t5 MATCH 'a b a'} { s {3} } 272 do_matchinfo_test 4.4.4 t5 {t5 MATCH 'a a a'} { s {3 1} } 273 do_matchinfo_p_test 4.4.5 t5 {t5 MATCH '"a b" "a b"'} { s {2} } 274 275 do_execsql_test 4.5.0 { 276 CREATE VIRTUAL TABLE t6 USING fts5(a, b, c, detail=%DETAIL%); 277 INSERT INTO t6 VALUES('a', 'b', 'c'); 278 } 279 do_matchinfo_test 4.5.1 t6 {t6 MATCH 'a b c'} { s {{1 1 1}} } 280 281 282 #------------------------------------------------------------------------- 283 # Test the outcome of matchinfo() when used within a query that does not 284 # use the full-text index (i.e. lookup by rowid or full-table scan). 285 # 286 do_execsql_test 7.1 { 287 CREATE VIRTUAL TABLE t10 USING fts5(content, detail=%DETAIL%); 288 INSERT INTO t10 VALUES('first record'); 289 INSERT INTO t10 VALUES('second record'); 290 } 291 do_execsql_test 7.2 { 292 SELECT typeof(matchinfo(t10)), length(matchinfo(t10)) FROM t10; 293 } {blob 8 blob 8} 294 do_execsql_test 7.3 { 295 SELECT typeof(matchinfo(t10)), length(matchinfo(t10)) FROM t10 WHERE rowid=1; 296 } {blob 8} 297 do_execsql_test 7.4 { 298 SELECT typeof(matchinfo(t10)), length(matchinfo(t10)) 299 FROM t10 WHERE t10 MATCH 'record' 300 } {blob 20 blob 20} 301 302 #------------------------------------------------------------------------- 303 # Test a special case - matchinfo('nxa') with many zero length documents. 304 # Special because "x" internally uses a statement used by both "n" and "a". 305 # This was causing a problem at one point in the obscure case where the 306 # total number of bytes of data stored in an fts3 table was greater than 307 # the number of rows. i.e. when the following query returns true: 308 # 309 # SELECT sum(length(content)) < count(*) FROM fts4table; 310 # 311 do_execsql_test 8.1 { 312 CREATE VIRTUAL TABLE t11 USING fts5(content, detail=%DETAIL%); 313 INSERT INTO t11(t11, rank) VALUES('pgsz', 32); 314 INSERT INTO t11 VALUES('quitealongstringoftext'); 315 INSERT INTO t11 VALUES('anotherquitealongstringoftext'); 316 INSERT INTO t11 VALUES('athirdlongstringoftext'); 317 INSERT INTO t11 VALUES('andonemoreforgoodluck'); 318 } 319 do_test 8.2 { 320 for {set i 0} {$i < 200} {incr i} { 321 execsql { INSERT INTO t11 VALUES('') } 322 } 323 execsql { INSERT INTO t11(t11) VALUES('optimize') } 324 } {} 325 do_execsql_test 8.3 { 326 SELECT mit(matchinfo(t11, 'nxa')) FROM t11 WHERE t11 MATCH 'a*' 327 } {{204 1 3 3 0} {204 1 3 3 0} {204 1 3 3 0}} 328 329 #------------------------------------------------------------------------- 330 331 if {[detail_is_full]} { 332 do_execsql_test 9.1 { 333 CREATE VIRTUAL TABLE t12 USING fts5(content, detail=%DETAIL%); 334 INSERT INTO t12 VALUES('a b c d'); 335 SELECT mit(matchinfo(t12,'x')) FROM t12 WHERE t12 MATCH 'NEAR(a d, 1) OR a'; 336 } {{0 1 1 0 1 1 1 1 1}} 337 do_execsql_test 9.2 { 338 INSERT INTO t12 VALUES('a d c d'); 339 SELECT mit(matchinfo(t12,'x')) FROM t12 WHERE t12 MATCH 'NEAR(a d, 1) OR a'; 340 } { 341 {0 2 2 0 3 2 1 2 2} {1 2 2 1 3 2 1 2 2} 342 } 343 do_execsql_test 9.3 { 344 INSERT INTO t12 VALUES('a d d a'); 345 SELECT mit(matchinfo(t12,'x')) FROM t12 WHERE t12 MATCH 'NEAR(a d, 1) OR a'; 346 } { 347 {0 4 3 0 5 3 1 4 3} {1 4 3 1 5 3 1 4 3} {2 4 3 2 5 3 2 4 3} 348 } 349 } 350 351 #--------------------------------------------------------------------------- 352 # Test for a memory leak 353 # 354 do_execsql_test 10.1 { 355 DROP TABLE t10; 356 CREATE VIRTUAL TABLE t10 USING fts5(idx, value, detail=%DETAIL%); 357 INSERT INTO t10 values (1, 'one'),(2, 'two'),(3, 'three'); 358 SELECT t10.rowid, t10.* 359 FROM t10 360 JOIN (SELECT 1 AS idx UNION SELECT 2 UNION SELECT 3) AS x 361 WHERE t10 MATCH x.idx 362 AND matchinfo(t10) not null 363 GROUP BY t10.rowid 364 ORDER BY 1; 365 } {1 1 one 2 2 two 3 3 three} 366 367 #--------------------------------------------------------------------------- 368 # Test the 'y' matchinfo flag 369 # 370 reset_db 371 sqlite3_fts5_register_matchinfo db 372 do_execsql_test 11.0 { 373 CREATE VIRTUAL TABLE tt USING fts5(x, y, detail=%DETAIL%); 374 INSERT INTO tt VALUES('c d a c d d', 'e a g b d a'); -- 1 375 INSERT INTO tt VALUES('c c g a e b', 'c g d g e c'); -- 2 376 INSERT INTO tt VALUES('b e f d e g', 'b a c b c g'); -- 3 377 INSERT INTO tt VALUES('a c f f g d', 'd b f d e g'); -- 4 378 INSERT INTO tt VALUES('g a c f c f', 'd g g b c c'); -- 5 379 INSERT INTO tt VALUES('g a c e b b', 'd b f b g g'); -- 6 380 INSERT INTO tt VALUES('f d a a f c', 'e e a d c f'); -- 7 381 INSERT INTO tt VALUES('a c b b g f', 'a b a e d f'); -- 8 382 INSERT INTO tt VALUES('b a f e c c', 'f d b b a b'); -- 9 383 INSERT INTO tt VALUES('f d c e a c', 'f a f a a f'); -- 10 384 } 385 386 db func mit mit 387 foreach {tn expr res} { 388 1 "a" { 389 1 {1 2} 2 {1 0} 3 {0 1} 4 {1 0} 5 {1 0} 390 6 {1 0} 7 {2 1} 8 {1 2} 9 {1 1} 10 {1 3} 391 } 392 393 2 "b" { 394 1 {0 1} 2 {1 0} 3 {1 2} 4 {0 1} 5 {0 1} 395 6 {2 2} 8 {2 1} 9 {1 3} 396 } 397 398 3 "y:a" { 399 1 {0 2} 3 {0 1} 400 7 {0 1} 8 {0 2} 9 {0 1} 10 {0 3} 401 } 402 403 4 "x:a" { 404 1 {1 0} 2 {1 0} 4 {1 0} 5 {1 0} 405 6 {1 0} 7 {2 0} 8 {1 0} 9 {1 0} 10 {1 0} 406 } 407 408 5 "a OR b" { 409 1 {1 2 0 1} 2 {1 0 1 0} 3 {0 1 1 2} 4 {1 0 0 1} 5 {1 0 0 1} 410 6 {1 0 2 2} 7 {2 1 0 0} 8 {1 2 2 1} 9 {1 1 1 3} 10 {1 3 0 0} 411 } 412 413 6 "a AND b" { 414 1 {1 2 0 1} 2 {1 0 1 0} 3 {0 1 1 2} 4 {1 0 0 1} 5 {1 0 0 1} 415 6 {1 0 2 2} 8 {1 2 2 1} 9 {1 1 1 3} 416 } 417 418 7 "a OR (a AND b)" { 419 1 {1 2 1 2 0 1} 2 {1 0 1 0 1 0} 3 {0 1 0 1 1 2} 4 {1 0 1 0 0 1} 420 5 {1 0 1 0 0 1} 6 {1 0 1 0 2 2} 7 {2 1 0 0 0 0} 8 {1 2 1 2 2 1} 421 9 {1 1 1 1 1 3} 10 {1 3 0 0 0 0} 422 } 423 424 } { 425 426 if {[string match *:* $expr] && [detail_is_none]} continue 427 do_execsql_test 11.1.$tn.1 { 428 SELECT rowid, mit(matchinfo(tt, 'y')) FROM tt WHERE tt MATCH $expr 429 } $res 430 431 set r2 [list] 432 foreach {rowid L} $res { 433 lappend r2 $rowid 434 set M [list] 435 foreach {a b} $L { 436 lappend M [expr ($a ? 1 : 0) + ($b ? 2 : 0)] 437 } 438 lappend r2 $M 439 } 440 441 do_execsql_test 11.1.$tn.2 { 442 SELECT rowid, mit(matchinfo(tt, 'b')) FROM tt WHERE tt MATCH $expr 443 } $r2 444 445 do_execsql_test 11.1.$tn.2 { 446 SELECT rowid, mit(matchinfo(tt, 'b')) FROM tt WHERE tt MATCH $expr 447 } $r2 448 } 449 450 #--------------------------------------------------------------------------- 451 # Test the 'b' matchinfo flag 452 # 453 reset_db 454 sqlite3_fts5_register_matchinfo db 455 db func mit mit 456 457 do_test 12.0 { 458 set cols [list] 459 for {set i 0} {$i < 50} {incr i} { lappend cols "c$i" } 460 execsql "CREATE VIRTUAL TABLE tt USING fts5([join $cols ,], detail=%DETAIL%)" 461 } {} 462 463 do_execsql_test 12.1 { 464 INSERT INTO tt (rowid, c4, c45) VALUES(1, 'abc', 'abc'); 465 SELECT mit(matchinfo(tt, 'b')) FROM tt WHERE tt MATCH 'abc'; 466 } [list [list [expr 1<<4] [expr 1<<(45-32)]]] 467 468 } ;# foreach_detail_mode 469 470 #------------------------------------------------------------------------- 471 # Test that a bad fts5() return is detected 472 # 473 reset_db 474 proc xyz {} {} 475 db func fts5 -argcount 1 xyz 476 do_test 13.1 { 477 list [catch { sqlite3_fts5_register_matchinfo db } msg] $msg 478 } {1 SQLITE_ERROR} 479 480 #------------------------------------------------------------------------- 481 # Test that an invalid matchinfo() flag is detected 482 # 483 reset_db 484 sqlite3_fts5_register_matchinfo db 485 do_execsql_test 14.1 { 486 CREATE VIRTUAL TABLE x1 USING fts5(z); 487 INSERT INTO x1 VALUES('a b c a b c a b c'); 488 } {} 489 490 do_catchsql_test 14.2 { 491 SELECT matchinfo(x1, 'd') FROM x1('a b c'); 492 } {1 {unrecognized matchinfo flag: d}} 493 494 finish_test