Annotation of embedaddon/sqlite3/test/fts3matchinfo.test, revision 1.1
1.1 ! misho 1: # 2010 November 02
! 2: #
! 3: # The author disclaims copyright to this source code. In place of
! 4: # a legal notice, here is a blessing:
! 5: #
! 6: # May you do good and not evil.
! 7: # May you find forgiveness for yourself and forgive others.
! 8: # May you share freely, never taking more than you give.
! 9: #
! 10: #***********************************************************************
! 11: # This file implements regression tests for the FTS3 module. The focus
! 12: # of this file is tables created with the "matchinfo=fts3" option.
! 13: #
! 14:
! 15: set testdir [file dirname $argv0]
! 16: source $testdir/tester.tcl
! 17:
! 18: # If SQLITE_ENABLE_FTS3 is not defined, omit this file.
! 19: ifcapable !fts3 { finish_test ; return }
! 20:
! 21: set testprefix fts3matchinfo
! 22: set sqlite_fts3_enable_parentheses 0
! 23: # mit: decode a blob (e.g. matchinfo() output) into a list of 32-bit integers read in host byte order; registered as SQL function mit().
! 24: proc mit {blob} {
! 25: set scan(littleEndian) i*
! 26: set scan(bigEndian) I*
! 27: binary scan $blob $scan($::tcl_platform(byteOrder)) r
! 28: return $r
! 29: }
! 30: db func mit mit
! 31:
! 32: do_execsql_test 1.0 {
! 33: CREATE VIRTUAL TABLE t1 USING fts4(matchinfo=fts3);
! 34: SELECT name FROM sqlite_master WHERE type = 'table';
! 35: } {t1 t1_content t1_segments t1_segdir t1_stat}
! 36:
! 37: do_execsql_test 1.1 {
! 38: INSERT INTO t1(content) VALUES('I wandered lonely as a cloud');
! 39: INSERT INTO t1(content) VALUES('That floats on high o''er vales and hills,');
! 40: INSERT INTO t1(content) VALUES('When all at once I saw a crowd,');
! 41: INSERT INTO t1(content) VALUES('A host, of golden daffodils,');
! 42: SELECT mit(matchinfo(t1)) FROM t1 WHERE t1 MATCH 'I';
! 43: } {{1 1 1 2 2} {1 1 1 2 2}}
! 44:
! 45: # Now create an FTS4 table that does not specify matchinfo=fts3.
! 46: #
! 47: do_execsql_test 1.2 {
! 48: CREATE VIRTUAL TABLE t2 USING fts4;
! 49: INSERT INTO t2 SELECT * FROM t1;
! 50: SELECT mit(matchinfo(t2)) FROM t2 WHERE t2 MATCH 'I';
! 51: } {{1 1 1 2 2} {1 1 1 2 2}}
! 52:
! 53: # Test some syntax-error handling.
! 54: #
! 55: do_catchsql_test 2.0 {
! 56: CREATE VIRTUAL TABLE x1 USING fts4(matchinfo=fs3);
! 57: } {1 {unrecognized matchinfo: fs3}}
! 58: do_catchsql_test 2.1 {
! 59: CREATE VIRTUAL TABLE x2 USING fts4(mtchinfo=fts3);
! 60: } {1 {unrecognized parameter: mtchinfo=fts3}}
! 61: do_catchsql_test 2.2 {
! 62: CREATE VIRTUAL TABLE x2 USING fts4(matchinfo=fts5);
! 63: } {1 {unrecognized matchinfo: fts5}}
! 64:
! 65: # Check that with fts3, the "=" character is permitted in column definitions.
! 66: #
! 67: do_execsql_test 3.1 {
! 68: CREATE VIRTUAL TABLE t3 USING fts3(mtchinfo=fts3);
! 69: INSERT INTO t3(mtchinfo) VALUES('Beside the lake, beneath the trees');
! 70: SELECT mtchinfo FROM t3;
! 71: } {{Beside the lake, beneath the trees}}
! 72:
! 73: do_execsql_test 3.2 {
! 74: CREATE VIRTUAL TABLE xx USING FTS4;
! 75: }
! 76: do_execsql_test 3.3 {
! 77: SELECT * FROM xx WHERE xx MATCH 'abc';
! 78: }
! 79: do_execsql_test 3.4 {
! 80: SELECT * FROM xx WHERE xx MATCH 'a b c';
! 81: }
! 82:
! 83:
! 84: #--------------------------------------------------------------------------
! 85: # Proc [do_matchinfo_test] is used to test the FTSX matchinfo() function.
! 86: #
! 87: # The first argument - $tn - is a test identifier. This may be either a
! 88: # full identifier (e.g. "fts3matchinfo-1.1") or, if global var $testprefix
! 89: # is set, just the numeric component (e.g. "1.1").
! 90: #
! 91: # The second argument is the name of an FTSX table. The third is the
! 92: # full text of a WHERE/MATCH expression to query the table with
! 93: # (e.g. "t1 MATCH 'abc'"). The final argument - $results - should be a
! 94: # key-value list (serialized array) with matchinfo() format specifiers
! 95: # as keys and, as values, the expected results of executing the statement:
! 96: #
! 97: # SELECT matchinfo($tbl, '$key') FROM $tbl WHERE $expr
! 98: #
! 99: # For example:
! 100: #
! 101: # CREATE VIRTUAL TABLE t1 USING fts4;
! 102: # INSERT INTO t1 VALUES('abc');
! 103: # INSERT INTO t1 VALUES('def');
! 104: # INSERT INTO t1 VALUES('abc abc');
! 105: #
! 106: # do_matchinfo_test 1.1 t1 "t1 MATCH 'abc'" {
! 107: # n {3 3}
! 108: # p {1 1}
! 109: # c {1 1}
! 110: # x {{1 3 2} {2 3 2}}
! 111: # }
! 112: #
! 113: # If the $results list contains keys mapped to "-" instead of a matchinfo()
! 114: # result, then this command computes the expected results based on other
! 115: # mappings to test the matchinfo() function. For example, the command above
! 116: # could be changed to:
! 117: #
! 118: # do_matchinfo_test 1.1 t1 "t1 MATCH 'abc'" {
! 119: # n {3 3} p {1 1} c {1 1} x {{1 3 2} {2 3 2}}
! 120: # pcx -
! 121: # }
! 122: #
! 123: # And this command would compute the expected results for matchinfo(t1, 'pcx')
! 124: # based on the results of matchinfo(t1, 'p'), matchinfo(t1, 'c') and
! 125: # matchinfo(t1, 'x') in order to test 'pcx'.
! 126: #
! 127: proc do_matchinfo_test {tn tbl expr results} {
! 128: # Copy the caller-supplied results into resarray, skipping "-" placeholders.
! 129: foreach {fmt res} $results {
! 130: if {$res == "-"} continue
! 131: set resarray($fmt) $res
! 132: }
! 133: # nRow is the largest row count found among the supplied results.
! 134: set nRow 0
! 135: foreach {fmt res} [array get resarray] {
! 136: if {[llength $res]>$nRow} { set nRow [llength $res] }
! 137: }
! 138:
! 139: # Construct expected results for any format whose caller-supplied result
! 140: # is "-": row i is the concatenation of row i of each character's result,
! 141: # so every character of the format needs its own entry in $results.
! 142: foreach {fmt res} $results {
! 143: if {$res == "-"} {
! 144: set res [list]
! 145: for {set iRow 0} {$iRow<$nRow} {incr iRow} {
! 146: set rowres [list]
! 147: foreach c [split $fmt ""] {
! 148: set rowres [concat $rowres [lindex $resarray($c) $iRow]]
! 149: }
! 150: lappend res $rowres
! 151: }
! 152: set resarray($fmt) $res
! 153: }
! 154: }
! 155:
! 156: # Test each matchinfo() request individually. normalize2 (defined below)
! 157: # rebuilds each expected row as a list, discarding layout whitespace.
! 158: foreach {fmt res} [array get resarray] {
! 159: set sql "SELECT mit(matchinfo($tbl, '$fmt')) FROM $tbl WHERE $expr"
! 160: do_execsql_test $tn.$fmt $sql [normalize2 $res]
! 161: }
! 162:
! 163: # Test them all executed together (multiple invocations of matchinfo()).
! 164: # Expected values are interleaved row by row, in [array get] order.
! 165: set exprlist [list]
! 166: foreach {format res} [array get resarray] {
! 167: lappend exprlist "mit(matchinfo($tbl, '$format'))"
! 168: }
! 169: set allres [list]
! 170: for {set iRow 0} {$iRow<$nRow} {incr iRow} {
! 171: foreach {format res} [array get resarray] {
! 172: lappend allres [lindex $res $iRow]
! 173: }
! 174: }
! 175: set sql "SELECT [join $exprlist ,] FROM $tbl WHERE $expr"
! 176: do_execsql_test $tn.multi $sql [normalize2 $allres]
! 177: }
! 178: proc normalize2 {list_of_lists} {
! 179: set res [list]
! 180: foreach elem $list_of_lists {
! 181: lappend res [list {*}$elem]
! 182: }
! 183: return $res
! 184: }
! 185:
! 186:
! 187: do_execsql_test 4.1.0 {
! 188: CREATE VIRTUAL TABLE t4 USING fts4(x, y);
! 189: INSERT INTO t4 VALUES('a b c d e', 'f g h i j');
! 190: INSERT INTO t4 VALUES('f g h i j', 'a b c d e');
! 191: }
! 192:
! 193: do_matchinfo_test 4.1.1 t4 {t4 MATCH 'a b c'} {
! 194: p {3 3}
! 195: c {2 2}
! 196: x {
! 197: {1 1 1 0 1 1 1 1 1 0 1 1 1 1 1 0 1 1}
! 198: {0 1 1 1 1 1 0 1 1 1 1 1 0 1 1 1 1 1}
! 199: }
! 200: n {2 2}
! 201: l {{5 5} {5 5}}
! 202: a {{5 5} {5 5}}
! 203:
! 204: s {{3 0} {0 3}}
! 205:
! 206: xxxxxxxxxxxxxxxxxx - pcx - xpc - ccc - pppxpcpcx - laxnpc -
! 207: xpxsscplax -
! 208: }
! 209:
! 210: do_matchinfo_test 4.1.2 t4 {t4 MATCH '"g h i"'} {
! 211: p {1 1}
! 212: c {2 2}
! 213: x {
! 214: {0 1 1 1 1 1}
! 215: {1 1 1 0 1 1}
! 216: }
! 217: n {2 2}
! 218: l {{5 5} {5 5}}
! 219: a {{5 5} {5 5}}
! 220:
! 221: s {{0 1} {1 0}}
! 222:
! 223: xxxxxxxxxxxxxxxxxx - pcx - xpc - ccc - pppxpcpcx - laxnpc -
! 224: sxsxs -
! 225: }
! 226:
! 227: do_matchinfo_test 4.1.3 t4 {t4 MATCH 'a b'} { s {{2 0} {0 2}} }
! 228: do_matchinfo_test 4.1.4 t4 {t4 MATCH '"a b" c'} { s {{2 0} {0 2}} }
! 229: do_matchinfo_test 4.1.5 t4 {t4 MATCH 'a "b c"'} { s {{2 0} {0 2}} }
! 230: do_matchinfo_test 4.1.6 t4 {t4 MATCH 'd d'} { s {{1 0} {0 1}} }
! 231: do_matchinfo_test 4.1.7 t4 {t4 MATCH 'f OR abcd'} {
! 232: x {
! 233: {0 1 1 1 1 1 0 0 0 0 0 0}
! 234: {1 1 1 0 1 1 0 0 0 0 0 0}
! 235: }
! 236: }
! 237: do_matchinfo_test 4.1.8 t4 {t4 MATCH 'f -abcd'} {
! 238: x {
! 239: {0 1 1 1 1 1}
! 240: {1 1 1 0 1 1}
! 241: }
! 242: }
! 243:
! 244: do_execsql_test 4.2.0 {
! 245: CREATE VIRTUAL TABLE t5 USING fts4;
! 246: INSERT INTO t5 VALUES('a a a a a');
! 247: INSERT INTO t5 VALUES('a b a b a');
! 248: INSERT INTO t5 VALUES('c b c b c');
! 249: INSERT INTO t5 VALUES('x x x x x');
! 250: }
! 251: do_matchinfo_test 4.2.1 t5 {t5 MATCH 'a a'} {
! 252: x {{5 8 2 5 8 2} {3 8 2 3 8 2}}
! 253: s {2 1}
! 254: }
! 255: do_matchinfo_test 4.2.2 t5 {t5 MATCH 'a b'} { s {2} }
! 256: do_matchinfo_test 4.2.3 t5 {t5 MATCH 'a b a'} { s {3} }
! 257: do_matchinfo_test 4.2.4 t5 {t5 MATCH 'a a a'} { s {3 1} }
! 258: do_matchinfo_test 4.2.5 t5 {t5 MATCH '"a b" "a b"'} { s {2} }
! 259: do_matchinfo_test 4.2.6 t5 {t5 MATCH 'a OR b'} { s {1 2 1} }
! 260:
! 261: do_execsql_test 4.3.0 "INSERT INTO t5 VALUES('x y [string repeat {b } 50000]')";
! 262:
! 263: # It used to be that the second 'a' token would be deferred. That doesn't
! 264: # work any longer.
! 265: if 0 {
! 266: do_matchinfo_test 4.3.1 t5 {t5 MATCH 'a a'} {
! 267: x {{5 8 2 5 5 5} {3 8 2 3 5 5}}
! 268: s {2 1}
! 269: }
! 270: }
! 271:
! 272: do_matchinfo_test 4.3.2 t5 {t5 MATCH 'a b'} { s {2} }
! 273: do_matchinfo_test 4.3.3 t5 {t5 MATCH 'a b a'} { s {3} }
! 274: do_matchinfo_test 4.3.4 t5 {t5 MATCH 'a a a'} { s {3 1} }
! 275: do_matchinfo_test 4.3.5 t5 {t5 MATCH '"a b" "a b"'} { s {2} }
! 276: do_matchinfo_test 4.3.6 t5 {t5 MATCH 'a OR b'} { s {1 2 1 1} }
! 277:
! 278: do_execsql_test 4.4.0 {
! 279: INSERT INTO t5(t5) VALUES('optimize');
! 280: UPDATE t5_segments
! 281: SET block = zeroblob(length(block))
! 282: WHERE length(block)>10000;
! 283: }
! 284: # 'a b' is queried first and again after 'a a'; the first run has its own test id so failures are unambiguous.
! 285: do_matchinfo_test 4.4.0.1 t5 {t5 MATCH 'a b'} { s {2} }
! 286: do_matchinfo_test 4.4.1 t5 {t5 MATCH 'a a'} { s {2 1} }
! 287: do_matchinfo_test 4.4.2 t5 {t5 MATCH 'a b'} { s {2} }
! 288: do_matchinfo_test 4.4.3 t5 {t5 MATCH 'a b a'} { s {3} }
! 289: do_matchinfo_test 4.4.4 t5 {t5 MATCH 'a a a'} { s {3 1} }
! 290: do_matchinfo_test 4.4.5 t5 {t5 MATCH '"a b" "a b"'} { s {2} }
! 291:
! 292: do_execsql_test 4.5.0 {
! 293: CREATE VIRTUAL TABLE t6 USING fts4(a, b, c);
! 294: INSERT INTO t6 VALUES('a', 'b', 'c');
! 295: }
! 296: do_matchinfo_test 4.5.1 t6 {t6 MATCH 'a b c'} { s {{1 1 1}} }
! 297:
! 298:
! 299: #-------------------------------------------------------------------------
! 300: # Check the following restrictions:
! 301: #
! 302: # + Matchinfo flags 'a', 'l' and 'n' can only be used with fts4, not fts3.
! 303: # + Matchinfo flag 'l' cannot be used with matchinfo=fts3.
! 304: #
! 305: do_execsql_test 5.1 {
! 306: CREATE VIRTUAL TABLE t7 USING fts3(a, b);
! 307: INSERT INTO t7 VALUES('u v w', 'x y z');
! 308:
! 309: CREATE VIRTUAL TABLE t8 USING fts4(a, b, matchinfo=fts3);
! 310: INSERT INTO t8 VALUES('u v w', 'x y z');
! 311: }
! 312:
! 313: do_catchsql_test 5.2.1 {
! 314: SELECT matchinfo(t7, 'a') FROM t7 WHERE t7 MATCH 'x y'
! 315: } {1 {unrecognized matchinfo request: a}}
! 316: do_catchsql_test 5.2.2 {
! 317: SELECT matchinfo(t7, 'l') FROM t7 WHERE t7 MATCH 'x y'
! 318: } {1 {unrecognized matchinfo request: l}}
! 319: do_catchsql_test 5.2.3 {
! 320: SELECT matchinfo(t7, 'n') FROM t7 WHERE t7 MATCH 'x y'
! 321: } {1 {unrecognized matchinfo request: n}}
! 322:
! 323: do_catchsql_test 5.3.1 {
! 324: SELECT matchinfo(t8, 'l') FROM t8 WHERE t8 MATCH 'x y'
! 325: } {1 {unrecognized matchinfo request: l}}
! 326:
! 327: #-------------------------------------------------------------------------
! 328: # Test that the offsets() function handles corruption in the %_content
! 329: # table correctly.
! 330: #
! 331: do_execsql_test 6.1 {
! 332: CREATE VIRTUAL TABLE t9 USING fts4;
! 333: INSERT INTO t9 VALUES(
! 334: 'this record is used to try to dectect corruption'
! 335: );
! 336: SELECT offsets(t9) FROM t9 WHERE t9 MATCH 'to';
! 337: } {{0 0 20 2 0 0 27 2}}
! 338:
! 339: do_catchsql_test 6.2 {
! 340: UPDATE t9_content SET c0content = 'this record is used to';
! 341: SELECT offsets(t9) FROM t9 WHERE t9 MATCH 'to';
! 342: } {1 {database disk image is malformed}}
! 343:
! 344: #-------------------------------------------------------------------------
! 345: # Test the outcome of matchinfo() when used within a query that does not
! 346: # use the full-text index (i.e. lookup by rowid or full-table scan).
! 347: #
! 348: do_execsql_test 7.1 {
! 349: CREATE VIRTUAL TABLE t10 USING fts4;
! 350: INSERT INTO t10 VALUES('first record');
! 351: INSERT INTO t10 VALUES('second record');
! 352: }
! 353: do_execsql_test 7.2 {
! 354: SELECT typeof(matchinfo(t10)), length(matchinfo(t10)) FROM t10;
! 355: } {blob 0 blob 0}
! 356: do_execsql_test 7.3 {
! 357: SELECT typeof(matchinfo(t10)), length(matchinfo(t10)) FROM t10 WHERE docid=1;
! 358: } {blob 0}
! 359: do_execsql_test 7.4 {
! 360: SELECT typeof(matchinfo(t10)), length(matchinfo(t10))
! 361: FROM t10 WHERE t10 MATCH 'record'
! 362: } {blob 20 blob 20}
! 363:
! 364: #-------------------------------------------------------------------------
! 365: # Test a special case - matchinfo('nxa') with many zero length documents.
! 366: # Special because "x" internally uses a statement used by both "n" and "a".
! 367: # This was causing a problem at one point in the obscure case where the
! 368: # total number of bytes of data stored in an fts3 table was less than
! 369: # the number of rows, i.e. when the following query returns true:
! 370: #
! 371: # SELECT sum(length(content)) < count(*) FROM fts4table;
! 372: #
! 373: do_execsql_test 8.1 {
! 374: CREATE VIRTUAL TABLE t11 USING fts4;
! 375: INSERT INTO t11(t11) VALUES('nodesize=24');
! 376: INSERT INTO t11 VALUES('quitealongstringoftext');
! 377: INSERT INTO t11 VALUES('anotherquitealongstringoftext');
! 378: INSERT INTO t11 VALUES('athirdlongstringoftext');
! 379: INSERT INTO t11 VALUES('andonemoreforgoodluck');
! 380: }
! 381: do_test 8.2 {
! 382: for {set i 0} {$i < 200} {incr i} {
! 383: execsql { INSERT INTO t11 VALUES('') }
! 384: }
! 385: execsql { INSERT INTO t11(t11) VALUES('optimize') }
! 386: } {}
! 387: do_execsql_test 8.3 {
! 388: SELECT mit(matchinfo(t11, 'nxa')) FROM t11 WHERE t11 MATCH 'a*'
! 389: } {{204 1 3 3 0} {204 1 3 3 0} {204 1 3 3 0}}
! 390:
! 391: # Corruption related tests.
! 392: do_execsql_test 8.4.1.1 { UPDATE t11_stat SET value = X'0000'; }
! 393: do_catchsql_test 8.5.1.2 {
! 394: SELECT mit(matchinfo(t11, 'nxa')) FROM t11 WHERE t11 MATCH 'a*'
! 395: } {1 {database disk image is malformed}}
! 396:
! 397: do_execsql_test 8.4.2.1 { UPDATE t11_stat SET value = X'00'; }
! 398: do_catchsql_test 8.5.2.2 {
! 399: SELECT mit(matchinfo(t11, 'nxa')) FROM t11 WHERE t11 MATCH 'a*'
! 400: } {1 {database disk image is malformed}}
! 401:
! 402: do_execsql_test 8.4.3.1 { UPDATE t11_stat SET value = NULL; }
! 403: do_catchsql_test 8.5.3.2 {
! 404: SELECT mit(matchinfo(t11, 'nxa')) FROM t11 WHERE t11 MATCH 'a*'
! 405: } {1 {database disk image is malformed}}
! 406:
! 407: finish_test
! 408:
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>