# Source: modernc.org/cc@v1.0.1/v2/testdata/_sqlite/ext/fts5/test/fts5hash.test
#
# 2015 April 21
#
# The author disclaims copyright to this source code.  In place of
# a legal notice, here is a blessing:
#
#    May you do good and not evil.
#    May you find forgiveness for yourself and forgive others.
#    May you share freely, never taking more than you give.
#
#***********************************************************************
#
# The tests in this file are focused on the code in fts5_hash.c.
#

source [file join [file dirname [info script]] fts5_common.tcl]
set testprefix fts5hash

# If SQLITE_ENABLE_FTS5 is not defined, omit this file.
ifcapable !fts5 {
  finish_test
  return
}

#-------------------------------------------------------------------------
# Return a list of tokens (a vocabulary) that all share the same hash
# key value. This can be used to test hash collisions.
#
# Options (passed as "-name value" pairs):
#
#   -nslot   Slot count passed to sqlite3_fts5_token_hash (default 1024).
#   -nword   Number of tokens to return (default 20).
#   -hash    Hash value every returned token must have (default 88).
#   -prefix  String prepended to each random token (default "").
#
# Raises "bad args" if the argument list has odd length and
# "bad option: NAME" for an option not listed above.
#
# Tokens are found by trial and error: random candidates are generated
# until enough of them hash to the requested value.
#
proc build_vocab1 {args} {

  set O(-nslot) 1024
  set O(-nword) 20
  set O(-hash)  88
  set O(-prefix) ""

  if {[llength $args] % 2} { error "bad args" }
  foreach {k v} $args {
    if {[info exists O($k)]==0} { error "bad option: $k" }
    set O($k) $v
  }

  set L [list]
  while {[llength $L] < $O(-nword)} {
    set t "$O(-prefix)[random_token]"
    set h [sqlite3_fts5_token_hash $O(-nslot) $t]
    if {$O(-hash)==$h} { lappend L $t }
  }
  return $L
}

# Return a random token made of the letters a-j. The token is the decimal
# representation of a random integer in the range 0..1999999 with each
# digit mapped to a letter (0->a, 1->b, ... 9->j).
#
proc random_token {} {
  set map [list 0 a 1 b 2 c 3 d 4 e 5 f 6 g 7 h 8 i 9 j]
  set iVal [expr {int(rand() * 2000000)}]
  return [string map $map $iVal]
}

# Return a document (a Tcl list) of nWord tokens, each selected at random
# from the list vocab. The same token may be selected more than once.
#
proc random_doc {vocab nWord} {
  set doc [list]
  set nVocab [llength $vocab]
  for {set i 0} {$i<$nWord} {incr i} {
    set j [expr {int(rand() * $nVocab)}]
    lappend doc [lindex $vocab $j]
  }
  return $doc
}

foreach_detail_mode $testprefix {

  # Expose random_doc as SQL function r() so that documents can be
  # generated from within INSERT statements.
  set vocab [build_vocab1]
  db func r random_doc

  # Populate the table with 100 rows built entirely from tokens that
  # share a single hash value, checking integrity both before and after
  # the transaction is committed.
  do_execsql_test 1.0 {
    CREATE VIRTUAL TABLE eee USING fts5(e, ee, detail=%DETAIL%);
    BEGIN;
      WITH ii(i) AS (SELECT 1 UNION ALL SELECT i+1 FROM ii WHERE i<100)
      INSERT INTO eee SELECT r($vocab, 5), r($vocab, 7) FROM ii;
      INSERT INTO eee(eee) VALUES('integrity-check');
    COMMIT;
    INSERT INTO eee(eee) VALUES('integrity-check');
  }

  # Build a second vocabulary in which every token begins with "xyz" and
  # has the same hash value as the token "xyz" itself, then add "xyz".
  set hash [sqlite3_fts5_token_hash 1024 xyz]
  set vocab [build_vocab1 -prefix xyz -hash $hash]
  lappend vocab xyz

  # The transaction opened here stays open until test 1.4, so tests 1.2
  # and 1.3 run against uncommitted data.
  do_execsql_test 1.1 {
    CREATE VIRTUAL TABLE vocab USING fts5vocab(eee, 'row');
    BEGIN;
  }
  do_test 1.2 {
    for {set i 1} {$i <= 100} {incr i} {
      execsql { INSERT INTO eee VALUES( r($vocab, 5), r($vocab, 7) ) }
    }
  } {}

  # For each term reported by the fts5vocab table, check that its "doc"
  # column agrees with the number of rows matched by a query for the term.
  do_test 1.3 {
    db eval { SELECT term, doc FROM vocab } {
      set nRow [db one {SELECT count(*) FROM eee WHERE eee MATCH $term}]
      if {$nRow != $doc} {
        error "term=$term fts5vocab=$doc cnt=$nRow"
      }
    }
    set {} {}
  } {}

  do_execsql_test 1.4 {
    COMMIT;
    INSERT INTO eee(eee) VALUES('integrity-check');
  }

  #-----------------------------------------------------------------------
  # Add a small and very large token with the same hash value to an
  # empty table. At one point this would provoke an asan error.
  #
  do_test 2.0 {
    set big [string repeat 12345 40]
    set hash [sqlite3_fts5_token_hash 1024 $big]
    # Generate random tokens until one collides with the large token.
    while {1} {
      set small [random_token]
      if {[sqlite3_fts5_token_hash 1024 $small]==$hash} break
    }

    execsql { CREATE VIRTUAL TABLE t2 USING fts5(x, detail=%DETAIL%) }
    execsql {
      INSERT INTO t2 VALUES($small || ' ' || $big);
    }
  } {}

} ;# foreach_detail_mode

finish_test