First public contribution.
3 # The author disclaims copyright to this source code. In place of
4 # a legal notice, here is a blessing:
6 # May you do good and not evil.
7 # May you find forgiveness for yourself and forgive others.
8 # May you share freely, never taking more than you give.
10 #***********************************************************************
11 # This file implements regression tests for SQLite library. The
12 # focus of this file is testing the LIKE and GLOB operators and
13 # in particular the optimizations that occur to help those operators
16 # $Id: like.test,v 1.10 2008/09/09 12:31:34 drh Exp $
18 set testdir [file dirname $argv0]
19 source $testdir/tester.tcl
21 # Create some sample data to work with.
25 CREATE TABLE t1(x TEXT);
43 db eval {INSERT INTO t1 VALUES(:str)}
46 SELECT count(*) FROM t1;
50 # Test that both case sensitive and insensitive version of LIKE work.
54 SELECT x FROM t1 WHERE x LIKE 'abc' ORDER BY 1;
59 SELECT x FROM t1 WHERE x GLOB 'abc' ORDER BY 1;
64 SELECT x FROM t1 WHERE x LIKE 'ABC' ORDER BY 1;
69 SELECT x FROM t1 WHERE x LIKE 'aBc' ORDER BY 1;
74 PRAGMA case_sensitive_like=on;
75 SELECT x FROM t1 WHERE x LIKE 'abc' ORDER BY 1;
80 SELECT x FROM t1 WHERE x GLOB 'abc' ORDER BY 1;
85 SELECT x FROM t1 WHERE x LIKE 'ABC' ORDER BY 1;
90 SELECT x FROM t1 WHERE x LIKE 'aBc' ORDER BY 1;
95 PRAGMA case_sensitive_like=off;
96 SELECT x FROM t1 WHERE x LIKE 'abc' ORDER BY 1;
100 # Tests of the REGEXP operator
103 proc test_regexp {a b} {
104 return [regexp $a $b]
106 db function regexp test_regexp
108 SELECT x FROM t1 WHERE x REGEXP 'abc' ORDER BY 1;
110 } {{ABC abc xyz} abc abcd}
113 SELECT x FROM t1 WHERE x REGEXP '^abc' ORDER BY 1;
117 # Tests of the MATCH operator
120 proc test_match {a b} {
121 return [string match $a $b]
123 db function match -argcount 2 test_match
125 SELECT x FROM t1 WHERE x MATCH '*abc*' ORDER BY 1;
127 } {{ABC abc xyz} abc abcd}
130 SELECT x FROM t1 WHERE x MATCH 'abc*' ORDER BY 1;
134 # For the remaining tests, we need to have the like optimizations
137 ifcapable !like_opt {
142 # This procedure executes the SQL. Then it appends to the result the
143 # "sort" or "nosort" keyword (as in the cksort procedure above) then
144 # it appends the ::sqlite_query_plan variable.
146 proc queryplan {sql} {
147 set ::sqlite_sort_count 0
148 set data [execsql $sql]
149 if {$::sqlite_sort_count} {set x sort} {set x nosort}
151 return [concat $data $::sqlite_query_plan]
154 # Perform tests on the like optimization.
156 # With no index on t1.x and with case sensitivity turned off, no optimization
160 set sqlite_like_count 0
162 SELECT x FROM t1 WHERE x LIKE 'abc%' ORDER BY 1;
164 } {ABC {ABC abc xyz} abc abcd sort t1 {}}
166 set sqlite_like_count
169 # With an index on t1.x and case sensitivity on, optimize completely.
172 set sqlite_like_count 0
174 PRAGMA case_sensitive_like=on;
175 CREATE INDEX i1 ON t1(x);
178 SELECT x FROM t1 WHERE x LIKE 'abc%' ORDER BY 1;
180 } {abc abcd nosort {} i1}
182 set sqlite_like_count
185 # Partial optimization when the pattern does not end in '%'
188 set sqlite_like_count 0
190 SELECT x FROM t1 WHERE x LIKE 'a_c' ORDER BY 1;
194 set sqlite_like_count
197 set sqlite_like_count 0
199 SELECT x FROM t1 WHERE x LIKE 'ab%d' ORDER BY 1;
201 } {abcd abd nosort {} i1}
203 set sqlite_like_count
206 set sqlite_like_count 0
208 SELECT x FROM t1 WHERE x LIKE 'a_c%' ORDER BY 1;
210 } {abc abcd nosort {} i1}
212 set sqlite_like_count
215 # No optimization when the pattern begins with a wildcard.
216 # Note that the index is still used but only for sorting.
219 set sqlite_like_count 0
221 SELECT x FROM t1 WHERE x LIKE '%bcd' ORDER BY 1;
223 } {abcd bcd nosort {} i1}
225 set sqlite_like_count
228 # No optimization for case insensitive LIKE
231 set sqlite_like_count 0
233 PRAGMA case_sensitive_like=off;
234 SELECT x FROM t1 WHERE x LIKE 'abc%' ORDER BY 1;
236 } {ABC {ABC abc xyz} abc abcd nosort {} i1}
238 set sqlite_like_count
241 # No optimization without an index.
244 set sqlite_like_count 0
246 PRAGMA case_sensitive_like=on;
248 SELECT x FROM t1 WHERE x LIKE 'abc%' ORDER BY 1;
250 } {abc abcd sort t1 {}}
252 set sqlite_like_count
255 # No GLOB optimization without an index.
258 set sqlite_like_count 0
260 SELECT x FROM t1 WHERE x GLOB 'abc*' ORDER BY 1;
262 } {abc abcd sort t1 {}}
264 set sqlite_like_count
267 # GLOB is optimized regardless of the case_sensitive_like setting.
270 set sqlite_like_count 0
272 CREATE INDEX i1 ON t1(x);
273 SELECT x FROM t1 WHERE x GLOB 'abc*' ORDER BY 1;
275 } {abc abcd nosort {} i1}
277 set sqlite_like_count
280 set sqlite_like_count 0
282 PRAGMA case_sensitive_like=on;
283 SELECT x FROM t1 WHERE x GLOB 'abc*' ORDER BY 1;
285 } {abc abcd nosort {} i1}
287 set sqlite_like_count
290 set sqlite_like_count 0
292 PRAGMA case_sensitive_like=off;
293 SELECT x FROM t1 WHERE x GLOB 'a[bc]d' ORDER BY 1;
295 } {abd acd nosort {} i1}
297 set sqlite_like_count
300 # No optimization if the LHS of the LIKE is not a column name or
301 # if the RHS is not a string.
304 execsql {PRAGMA case_sensitive_like=on}
305 set sqlite_like_count 0
307 SELECT x FROM t1 WHERE x LIKE 'abc%' ORDER BY 1
309 } {abc abcd nosort {} i1}
311 set sqlite_like_count
314 set sqlite_like_count 0
316 SELECT x FROM t1 WHERE +x LIKE 'abc%' ORDER BY 1
318 } {abc abcd nosort {} i1}
320 set sqlite_like_count
323 set sqlite_like_count 0
325 SELECT x FROM t1 WHERE x LIKE ('ab' || 'c%') ORDER BY 1
327 } {abc abcd nosort {} i1}
329 set sqlite_like_count
332 # Collating sequences on the index disable the LIKE optimization.
333 # Or if the NOCASE collating sequence is used, the LIKE optimization
334 # is enabled when case_sensitive_like is OFF.
337 execsql {PRAGMA case_sensitive_like=off}
338 set sqlite_like_count 0
340 SELECT x FROM t1 WHERE x LIKE 'abc%' ORDER BY 1
342 } {ABC {ABC abc xyz} abc abcd nosort {} i1}
344 set sqlite_like_count
348 CREATE TABLE t2(x COLLATE NOCASE);
349 INSERT INTO t2 SELECT * FROM t1;
350 CREATE INDEX i2 ON t2(x COLLATE NOCASE);
352 set sqlite_like_count 0
354 SELECT x FROM t2 WHERE x LIKE 'abc%' ORDER BY 1
356 } {abc ABC {ABC abc xyz} abcd nosort {} i2}
358 set sqlite_like_count
362 PRAGMA case_sensitive_like=on;
364 set sqlite_like_count 0
366 SELECT x FROM t2 WHERE x LIKE 'abc%' ORDER BY 1
368 } {abc abcd nosort {} i2}
370 set sqlite_like_count
374 PRAGMA case_sensitive_like=off;
376 set sqlite_like_count 0
378 SELECT x FROM t2 WHERE x GLOB 'abc*' ORDER BY 1
380 } {abc abcd nosort {} i2}
382 set sqlite_like_count
385 execsql {PRAGMA case_sensitive_like=off}
386 set sqlite_like_count 0
388 SELECT x FROM t1 WHERE x LIKE 'ABC%' ORDER BY 1
390 } {ABC {ABC abc xyz} abc abcd nosort {} i1}
392 set sqlite_like_count
395 set sqlite_like_count 0
397 SELECT x FROM t2 WHERE x LIKE 'ABC%' ORDER BY 1
399 } {abc ABC {ABC abc xyz} abcd nosort {} i2}
401 set sqlite_like_count
405 PRAGMA case_sensitive_like=on;
407 set sqlite_like_count 0
409 SELECT x FROM t2 WHERE x LIKE 'ABC%' ORDER BY 1
411 } {ABC {ABC abc xyz} nosort {} i2}
413 set sqlite_like_count
417 PRAGMA case_sensitive_like=off;
419 set sqlite_like_count 0
421 SELECT x FROM t2 WHERE x GLOB 'ABC*' ORDER BY 1
423 } {ABC {ABC abc xyz} nosort {} i2}
425 set sqlite_like_count
428 # Boundary case. The prefix for a LIKE comparison is rounded up
429 # when constructing the comparison. Example: "ab" becomes "ac".
430 # In other words, the last character is increased by one.
432 # Make sure this happens correctly when the last character is a
433 # "z" and we are doing case-insensitive comparisons.
439 PRAGMA case_sensitive_like=off;
440 INSERT INTO t2 VALUES('ZZ-upper-upper');
441 INSERT INTO t2 VALUES('zZ-lower-upper');
442 INSERT INTO t2 VALUES('Zz-upper-lower');
443 INSERT INTO t2 VALUES('zz-lower-lower');
446 SELECT x FROM t2 WHERE x LIKE 'zz%';
448 } {zz-lower-lower zZ-lower-upper Zz-upper-lower ZZ-upper-upper nosort {} i2}
451 SELECT x FROM t2 WHERE x LIKE 'zZ%';
453 } {zz-lower-lower zZ-lower-upper Zz-upper-lower ZZ-upper-upper nosort {} i2}
456 SELECT x FROM t2 WHERE x LIKE 'Zz%';
458 } {zz-lower-lower zZ-lower-upper Zz-upper-lower ZZ-upper-upper nosort {} i2}
461 SELECT x FROM t2 WHERE x LIKE 'ZZ%';
463 } {zz-lower-lower zZ-lower-upper Zz-upper-lower ZZ-upper-upper nosort {} i2}
466 PRAGMA case_sensitive_like=on;
468 CREATE INDEX i3 ON t3(x);
469 INSERT INTO t3 VALUES('ZZ-upper-upper');
470 INSERT INTO t3 VALUES('zZ-lower-upper');
471 INSERT INTO t3 VALUES('Zz-upper-lower');
472 INSERT INTO t3 VALUES('zz-lower-lower');
473 SELECT x FROM t3 WHERE x LIKE 'zz%';
475 } {zz-lower-lower nosort {} i3}
478 SELECT x FROM t3 WHERE x LIKE 'zZ%';
480 } {zZ-lower-upper nosort {} i3}
483 SELECT x FROM t3 WHERE x LIKE 'Zz%';
485 } {Zz-upper-lower nosort {} i3}
488 SELECT x FROM t3 WHERE x LIKE 'ZZ%';
490 } {ZZ-upper-upper nosort {} i3}
495 # Make sure the LIKE prefix optimization does not strip off leading
496 # characters of the like pattern that happen to be quote characters.
499 foreach x { 'abc 'bcd 'def 'ax } {
500 set x2 '[string map {' ''} $x]'
501 db eval "INSERT INTO t2 VALUES($x2)"
504 SELECT * FROM t2 WHERE x LIKE '''a%'
510 SELECT * FROM t1 WHERE rowid GLOB '1*';
516 # Overloading the LIKE function with -1 for the number of arguments
517 # will overload both the 2-argument and the 3-argument LIKE.
522 INSERT INTO t8 VALUES('abcdef');
523 INSERT INTO t8 VALUES('ghijkl');
524 INSERT INTO t8 VALUES('mnopqr');
525 SELECT 1, x FROM t8 WHERE x LIKE '%h%';
526 SELECT 2, x FROM t8 WHERE x LIKE '%h%' ESCAPE 'x';
528 } {1 ghijkl 2 ghijkl}
530 proc newlike {args} {return 1} ;# Alternative LIKE is always return TRUE
531 db function like newlike ;# Uses -1 for nArg in sqlite3_create_function
534 SELECT 1, x FROM t8 WHERE x LIKE '%h%';
535 SELECT 2, x FROM t8 WHERE x LIKE '%h%' ESCAPE 'x';
537 } {1 ghijkl 2 ghijkl}
539 db function like -argcount 2 newlike
541 SELECT 1, x FROM t8 WHERE x LIKE '%h%';
542 SELECT 2, x FROM t8 WHERE x LIKE '%h%' ESCAPE 'x';
544 } {1 abcdef 1 ghijkl 1 mnopqr 2 ghijkl}
546 db function like -argcount 3 newlike
548 SELECT 1, x FROM t8 WHERE x LIKE '%h%';
549 SELECT 2, x FROM t8 WHERE x LIKE '%h%' ESCAPE 'x';
551 } {1 abcdef 1 ghijkl 1 mnopqr 2 abcdef 2 ghijkl 2 mnopqr}