# # Tests with the utf8mb4 character set # # Tests will be skipped for the view protocol because the view protocol uses # an additional util connection and don't use for this nessesary configurations # Also need to resolve MDEV-27871 -- source include/no_view_protocol.inc --source include/default_optimizer_switch.inc --disable_warnings drop table if exists t1,t2; --enable_warnings --echo # --echo # Start of 5.5 tests --echo # set names utf8mb4; select left(_utf8mb4 0xD0B0D0B1D0B2,1); select right(_utf8mb4 0xD0B0D0B2D0B2,1); select locate('he','hello'); select locate('he','hello',2); select locate('lo','hello',2); select locate('HE','hello'); select locate('HE','hello',2); select locate('LO','hello',2); select locate('HE','hello' collate utf8mb4_bin); select locate('HE','hello' collate utf8mb4_bin,2); select locate('LO','hello' collate utf8mb4_bin,2); select locate(_utf8mb4 0xD0B1, _utf8mb4 0xD0B0D0B1D0B2); select locate(_utf8mb4 0xD091, _utf8mb4 0xD0B0D0B1D0B2); select locate(_utf8mb4 0xD0B1, _utf8mb4 0xD0B0D091D0B2); select locate(_utf8mb4 0xD091, _utf8mb4 0xD0B0D0B1D0B2 collate utf8mb4_bin); select locate(_utf8mb4 0xD0B1, _utf8mb4 0xD0B0D091D0B2 collate utf8mb4_bin); select length(_utf8mb4 0xD0B1), bit_length(_utf8mb4 0xD0B1), char_length(_utf8mb4 0xD0B1); select 'a' like 'a'; select 'A' like 'a'; select 'A' like 'a' collate utf8mb4_bin; select _utf8mb4 0xD0B0D0B1D0B2 like concat(_utf8mb4'%',_utf8mb4 0xD0B1,_utf8mb4 '%'); # Bug #6040: can't retrieve records with umlaut # characters in case insensitive manner. # Case insensitive search LIKE comparison # was broken for multibyte characters: select convert(_latin1'Günter André' using utf8mb4) like CONVERT(_latin1'GÜNTER%' USING utf8mb4); select CONVERT(_koi8r'×ÁÓÑ' USING utf8mb4) LIKE CONVERT(_koi8r'÷áóñ' USING utf8mb4); select CONVERT(_koi8r'÷áóñ' USING utf8mb4) LIKE CONVERT(_koi8r'×ÁÓÑ' USING utf8mb4); # # Check the following: # "a" == "a " # "a\0" < "a" # "a\0" < "a " SELECT 'a' = 'a '; SELECT 'a\0' < 'a'; SELECT 'a\0' < 'a '; SELECT 'a\t' < 'a'; SELECT 'a\t' < 'a '; # # The same for binary collation # SELECT 'a' = 'a ' collate utf8mb4_bin; SELECT 'a\0' < 'a' collate utf8mb4_bin; SELECT 'a\0' < 'a ' collate utf8mb4_bin; SELECT 'a\t' < 'a' collate utf8mb4_bin; SELECT 'a\t' < 'a ' collate utf8mb4_bin; eval CREATE TABLE t1 (a char(10) character set utf8mb4 not null) ENGINE $engine; INSERT INTO t1 VALUES ('a'),('a\0'),('a\t'),('a '); --sorted_result SELECT hex(a),STRCMP(a,'a'), STRCMP(a,'a ') FROM t1; DROP TABLE t1; # # Fix this, it should return 1: # #select _utf8mb4 0xD0B0D0B1D0B2 like concat(_utf8mb4'%',_utf8mb4 0xD091,_utf8mb4 '%'); # # # Bug 2367: INSERT() behaviour is different for different charsets. # select insert('txs',2,1,'hi'),insert('is ',4,0,'a'),insert('txxxxt',2,4,'es'); select insert("aa",100,1,"b"),insert("aa",1,3,"b"); # # LELF() didn't work well with utf8mb4 in some cases too. # select char_length(left(@a:='теÑÑ‚',5)), length(@a), @a; # # CREATE ... SELECT # eval create table t1 ENGINE $engine select date_format("2004-01-19 10:10:10", "%Y-%m-%d"); show create table t1; select * from t1; drop table t1; # # Bug#22646 LC_TIME_NAMES: Assignment to non-UTF8 target fails # set names utf8mb4; set LC_TIME_NAMES='fr_FR'; eval create table t1 (s1 char(20) character set latin1) engine $engine; insert into t1 values (date_format('2004-02-02','%M')); select hex(s1) from t1; drop table t1; eval create table t1 (s1 char(20) character set koi8r) engine $engine; set LC_TIME_NAMES='ru_RU'; insert into t1 values (date_format('2004-02-02','%M')); insert into t1 values (date_format('2004-02-02','%b')); insert into t1 values (date_format('2004-02-02','%W')); insert into t1 values (date_format('2004-02-02','%a')); --sorted_result select hex(s1), s1 from t1; drop table t1; set LC_TIME_NAMES='en_US'; # # Bug #2366 Wrong utf8mb4 behaviour when data is truncated # set names koi8r; eval create table t1 (s1 char(1) character set utf8mb4) engine $engine; insert ignore into t1 values (_koi8r'ÁÂ'); select s1,hex(s1),char_length(s1),octet_length(s1) from t1; drop table t1; if (!$is_heap) { eval create table t1 (s1 tinytext character set utf8mb4) engine $engine; } if ($is_heap) { eval create table t1 (s1 varchar(255) character set utf8mb4) engine $engine; } insert ignore into t1 select repeat('a',300); insert ignore into t1 select repeat('Ñ',300); insert ignore into t1 select repeat('aÑ',300); insert ignore into t1 select repeat('Ña',300); insert ignore into t1 select repeat('ÑÑ',300); --sorted_result select hex(s1) from t1; --sorted_result select length(s1),char_length(s1) from t1; drop table t1; if (!$is_heap) { eval create table t1 (s1 text character set utf8mb4) engine $engine; } if ($is_heap) { eval create table t1 (s1 varchar(255) character set utf8mb4) engine $engine; } insert ignore into t1 select repeat('a',66000); insert ignore into t1 select repeat('Ñ',66000); insert ignore into t1 select repeat('aÑ',66000); insert ignore into t1 select repeat('Ña',66000); insert ignore into t1 select repeat('ÑÑ',66000); --sorted_result select length(s1),char_length(s1) from t1; drop table t1; # # Bug #2368 Multibyte charsets do not check that incoming data is well-formed # eval create table t1 (s1 char(10) character set utf8mb4) engine $engine; insert ignore into t1 values (0x41FF); select hex(s1) from t1; drop table t1; eval create table t1 (s1 varchar(10) character set utf8mb4) engine $engine; insert ignore into t1 values (0x41FF); select hex(s1) from t1; drop table t1; if (!$is_heap) { eval create table t1 (s1 text character set utf8mb4) engine $engine; insert ignore into t1 values (0x41FF); select hex(s1) from t1; drop table t1; } # # Bug 2699 # UTF8 breaks primary keys for cols > 333 characters # if(!$is_heap) { --error 0,ER_TOO_LONG_KEY eval create table t1 (a text character set utf8mb4, primary key(a(371))) engine $engine; show warnings; drop table if exists t1; } # # Bug 2959 # UTF8 charset breaks joins with mixed column/string constant # eval CREATE TABLE t1 ( a varchar(10) ) CHARACTER SET utf8mb4 ENGINE $engine; INSERT INTO t1 VALUES ( 'test' ); SELECT a.a, b.a FROM t1 a, t1 b WHERE a.a = b.a; SELECT a.a, b.a FROM t1 a, t1 b WHERE a.a = 'test' and b.a = 'test'; SELECT a.a, b.a FROM t1 a, t1 b WHERE a.a = b.a and a.a = 'test'; DROP TABLE t1; eval create table t1 (a char(255) character set utf8mb4) engine $engine; insert into t1 values('b'),('b'); select * from t1 where a = 'b'; select * from t1 where a = 'b' and a = 'b'; select * from t1 where a = 'b' and a != 'b'; drop table t1; # # Testing regexp # set names utf8mb4; --source include/ctype_regex.inc --source include/ctype_regex_utf8.inc # # Bug #4555 # ALTER TABLE crashes mysqld with enum column collated utf8mb4_unicode_ci # eval CREATE TABLE t1 (a enum ('Y', 'N') DEFAULT 'N' COLLATE utf8mb4_unicode_ci) ENGINE $engine; ALTER TABLE t1 ADD COLUMN b CHAR(20); DROP TABLE t1; # Customer Support Center issue # 3299 # ENUM and SET multibyte fields computed their length wronly # when converted into a char field set names utf8mb4; eval create table t1 (a enum('aaaa','проба') character set utf8mb4) engine $engine; show create table t1; insert into t1 values ('проба'); select * from t1; eval create table t2 engine $engine select ifnull(a,a) from t1; show create table t2; select * from t2; drop table t1; drop table t2; # # Bug 4521: unique key prefix interacts poorly with utf8mb4 # MYISAM: keys with prefix compression, case insensitive collation. # eval create table t1 (c varchar(30) character set utf8mb4, unique(c(10))) engine $engine; insert into t1 values ('1'),('2'),('3'),('x'),('y'),('z'); insert into t1 values ('aaaaaaaaaa'); --error ER_DUP_ENTRY insert into t1 values ('aaaaaaaaaaa'); --error ER_DUP_ENTRY insert into t1 values ('aaaaaaaaaaaa'); insert into t1 values (repeat('b',20)); select c c1 from t1 where c='1'; select c c2 from t1 where c='2'; select c c3 from t1 where c='3'; select c cx from t1 where c='x'; select c cy from t1 where c='y'; select c cz from t1 where c='z'; select c ca10 from t1 where c='aaaaaaaaaa'; select c cb20 from t1 where c=repeat('b',20); drop table t1; # # Bug 4521: unique key prefix interacts poorly with utf8mb4 # InnoDB: keys with prefix compression, case insensitive collation. # --disable_warnings eval create table t1 (c varchar(30) character set utf8mb4, unique(c(10))) engine=$engine; --enable_warnings insert into t1 values ('1'),('2'),('3'),('x'),('y'),('z'); insert into t1 values ('aaaaaaaaaa'); --error ER_DUP_ENTRY insert into t1 values ('aaaaaaaaaaa'); --error ER_DUP_ENTRY insert into t1 values ('aaaaaaaaaaaa'); insert into t1 values (repeat('b',20)); select c c1 from t1 where c='1'; select c c2 from t1 where c='2'; select c c3 from t1 where c='3'; select c cx from t1 where c='x'; select c cy from t1 where c='y'; select c cz from t1 where c='z'; select c ca10 from t1 where c='aaaaaaaaaa'; select c cb20 from t1 where c=repeat('b',20); drop table t1; # # Bug 4521: unique key prefix interacts poorly with utf8mb4 # MYISAM: fixed length keys, case insensitive collation # eval create table t1 (c char(3) character set utf8mb4, unique (c(2))) engine $engine; insert into t1 values ('1'),('2'),('3'),('4'),('x'),('y'),('z'); insert into t1 values ('a'); insert into t1 values ('aa'); --error ER_DUP_ENTRY insert into t1 values ('aaa'); insert into t1 values ('b'); insert into t1 values ('bb'); --error ER_DUP_ENTRY insert into t1 values ('bbb'); insert into t1 values ('а'); insert into t1 values ('аа'); --error ER_DUP_ENTRY insert into t1 values ('ааа'); insert into t1 values ('б'); insert into t1 values ('бб'); --error ER_DUP_ENTRY insert into t1 values ('ббб'); insert into t1 values ('ꪪ'); insert into t1 values ('ꪪꪪ'); --error ER_DUP_ENTRY insert into t1 values ('ꪪꪪꪪ'); drop table t1; # # Bug 4521: unique key prefix interacts poorly with utf8mb4 # InnoDB: fixed length keys, case insensitive collation # --disable_warnings eval create table t1 (c char(3) character set utf8mb4, unique (c(2))) engine=$engine; --enable_warnings insert into t1 values ('1'),('2'),('3'),('4'),('x'),('y'),('z'); insert into t1 values ('a'); insert into t1 values ('aa'); --error ER_DUP_ENTRY insert into t1 values ('aaa'); insert into t1 values ('b'); insert into t1 values ('bb'); --error ER_DUP_ENTRY insert into t1 values ('bbb'); insert into t1 values ('а'); insert into t1 values ('аа'); --error ER_DUP_ENTRY insert into t1 values ('ааа'); insert into t1 values ('б'); insert into t1 values ('бб'); --error ER_DUP_ENTRY insert into t1 values ('ббб'); insert into t1 values ('ꪪ'); insert into t1 values ('ꪪꪪ'); --error ER_DUP_ENTRY insert into t1 values ('ꪪꪪꪪ'); drop table t1; # # Bug 4531: unique key prefix interacts poorly with utf8mb4 # Check HEAP+HASH, case insensitive collation # eval create table t1 ( c char(10) character set utf8mb4, unique key a using hash (c(1)) ) engine=$engine; show create table t1; insert into t1 values ('a'),('b'),('c'),('d'),('e'),('f'); --error ER_DUP_ENTRY insert into t1 values ('aa'); --error ER_DUP_ENTRY insert into t1 values ('aaa'); insert into t1 values ('б'); --error ER_DUP_ENTRY insert into t1 values ('бб'); --error ER_DUP_ENTRY insert into t1 values ('ббб'); select c as c_all from t1 order by c; select c as c_a from t1 where c='a'; select c as c_a from t1 where c='б'; drop table t1; # # Bug 4531: unique key prefix interacts poorly with utf8mb4 # Check HEAP+BTREE, case insensitive collation # eval create table t1 ( c char(10) character set utf8mb4, unique key a using btree (c(1)) ) engine=$engine; show create table t1; insert into t1 values ('a'),('b'),('c'),('d'),('e'),('f'); --error ER_DUP_ENTRY insert into t1 values ('aa'); --error ER_DUP_ENTRY insert into t1 values ('aaa'); insert into t1 values ('б'); --error ER_DUP_ENTRY insert into t1 values ('бб'); --error ER_DUP_ENTRY insert into t1 values ('ббб'); select c as c_all from t1 order by c; select c as c_a from t1 where c='a'; select c as c_a from t1 where c='б'; drop table t1; # # Bug 4531: unique key prefix interacts poorly with utf8mb4 # Check BDB, case insensitive collation # --disable_warnings eval create table t1 ( c char(10) character set utf8mb4, unique key a (c(1)) ) engine=$engine; --enable_warnings insert into t1 values ('a'),('b'),('c'),('d'),('e'),('f'); --error ER_DUP_ENTRY insert into t1 values ('aa'); --error ER_DUP_ENTRY insert into t1 values ('aaa'); insert into t1 values ('б'); --error ER_DUP_ENTRY insert into t1 values ('бб'); --error ER_DUP_ENTRY insert into t1 values ('ббб'); select c as c_all from t1 order by c; select c as c_a from t1 where c='a'; select c as c_a from t1 where c='б'; drop table t1; # # Bug 4521: unique key prefix interacts poorly with utf8mb4 # MYISAM: keys with prefix compression, binary collation. # eval create table t1 (c varchar(30) character set utf8mb4 collate utf8mb4_bin, unique(c(10))) engine $engine; insert into t1 values ('1'),('2'),('3'),('x'),('y'),('z'); insert into t1 values ('aaaaaaaaaa'); --error ER_DUP_ENTRY insert into t1 values ('aaaaaaaaaaa'); --error ER_DUP_ENTRY insert into t1 values ('aaaaaaaaaaaa'); insert into t1 values (repeat('b',20)); select c c1 from t1 where c='1'; select c c2 from t1 where c='2'; select c c3 from t1 where c='3'; select c cx from t1 where c='x'; select c cy from t1 where c='y'; select c cz from t1 where c='z'; select c ca10 from t1 where c='aaaaaaaaaa'; select c cb20 from t1 where c=repeat('b',20); drop table t1; # # Bug 4521: unique key prefix interacts poorly with utf8mb4 # MYISAM: fixed length keys, binary collation # eval create table t1 (c char(3) character set utf8mb4 collate utf8mb4_bin, unique (c(2))) engine $engine; insert into t1 values ('1'),('2'),('3'),('4'),('x'),('y'),('z'); insert into t1 values ('a'); insert into t1 values ('aa'); --error ER_DUP_ENTRY insert into t1 values ('aaa'); insert into t1 values ('b'); insert into t1 values ('bb'); --error ER_DUP_ENTRY insert into t1 values ('bbb'); insert into t1 values ('а'); insert into t1 values ('аа'); --error ER_DUP_ENTRY insert into t1 values ('ааа'); insert into t1 values ('б'); insert into t1 values ('бб'); --error ER_DUP_ENTRY insert into t1 values ('ббб'); insert into t1 values ('ꪪ'); insert into t1 values ('ꪪꪪ'); --error ER_DUP_ENTRY insert into t1 values ('ꪪꪪꪪ'); drop table t1; # # Bug 4531: unique key prefix interacts poorly with utf8mb4 # Check HEAP+HASH, binary collation # eval create table t1 ( c char(10) character set utf8mb4 collate utf8mb4_bin, unique key a using hash (c(1)) ) engine=$engine; show create table t1; insert into t1 values ('a'),('b'),('c'),('d'),('e'),('f'); --error ER_DUP_ENTRY insert into t1 values ('aa'); --error ER_DUP_ENTRY insert into t1 values ('aaa'); insert into t1 values ('б'); --error ER_DUP_ENTRY insert into t1 values ('бб'); --error ER_DUP_ENTRY insert into t1 values ('ббб'); select c as c_all from t1 order by c; select c as c_a from t1 where c='a'; select c as c_a from t1 where c='б'; drop table t1; # # Bug 4531: unique key prefix interacts poorly with utf8mb4 # Check HEAP+BTREE, binary collation # eval create table t1 ( c char(10) character set utf8mb4 collate utf8mb4_bin, unique key a using btree (c(1)) ) engine=$engine; show create table t1; insert into t1 values ('a'),('b'),('c'),('d'),('e'),('f'); --error ER_DUP_ENTRY insert into t1 values ('aa'); --error ER_DUP_ENTRY insert into t1 values ('aaa'); insert into t1 values ('б'); --error ER_DUP_ENTRY insert into t1 values ('бб'); --error ER_DUP_ENTRY insert into t1 values ('ббб'); select c as c_all from t1 order by c; select c as c_a from t1 where c='a'; select c as c_a from t1 where c='б'; drop table t1; # # Bug 4531: unique key prefix interacts poorly with utf8mb4 # Check BDB, binary collation # --disable_warnings eval create table t1 ( c char(10) character set utf8mb4 collate utf8mb4_bin, unique key a (c(1)) ) engine=$engine; --enable_warnings insert into t1 values ('a'),('b'),('c'),('d'),('e'),('f'); --error ER_DUP_ENTRY insert into t1 values ('aa'); --error ER_DUP_ENTRY insert into t1 values ('aaa'); insert into t1 values ('б'); --error ER_DUP_ENTRY insert into t1 values ('бб'); --error ER_DUP_ENTRY insert into t1 values ('ббб'); select c as c_all from t1 order by c; select c as c_a from t1 where c='a'; select c as c_a from t1 where c='б'; drop table t1; # Bug#4594: column index make = failed for gbk, but like works # Check MYISAM # eval create table t1 ( str varchar(255) character set utf8mb4 not null, key str (str(2)) ) engine=$engine; INSERT INTO t1 VALUES ('str'); INSERT INTO t1 VALUES ('str2'); select * from t1 where str='str'; drop table t1; # Bug#4594: column index make = failed for gbk, but like works # Check InnoDB # --disable_warnings eval create table t1 ( str varchar(255) character set utf8mb4 not null, key str (str(2)) ) engine=$engine; --enable_warnings INSERT INTO t1 VALUES ('str'); INSERT INTO t1 VALUES ('str2'); select * from t1 where str='str'; drop table t1; # the same for HEAP+BTREE # eval create table t1 ( str varchar(255) character set utf8mb4 not null, key str using btree (str(2)) ) engine=$engine; INSERT INTO t1 VALUES ('str'); INSERT INTO t1 VALUES ('str2'); select * from t1 where str='str'; drop table t1; # the same for HEAP+HASH # eval create table t1 ( str varchar(255) character set utf8mb4 not null, key str using hash (str(2)) ) engine=$engine; INSERT INTO t1 VALUES ('str'); INSERT INTO t1 VALUES ('str2'); select * from t1 where str='str'; drop table t1; # the same for BDB # #hh --disable_warnings eval create table t1 ( str varchar(255) character set utf8mb4 not null, key str (str(2)) ) engine= $engine; --enable_warnings INSERT INTO t1 VALUES ('str'); INSERT INTO t1 VALUES ('str2'); select * from t1 where str='str'; drop table t1; # # Bug #5397: Crash with varchar binary and LIKE # eval CREATE TABLE t1 (a varchar(32) BINARY) CHARACTER SET utf8mb4 ENGINE $engine; INSERT INTO t1 VALUES ('test'); SELECT a FROM t1 WHERE a LIKE '%te'; DROP TABLE t1; # # Bug #5723: length() returns varying results # --disable_warnings SET NAMES utf8mb4; --disable_warnings eval CREATE TABLE t1 ( subject varchar(255) character set utf8mb4 collate utf8mb4_unicode_ci, p varchar(15) character set utf8mb4 ) ENGINE= $engine DEFAULT CHARSET=latin1; --enable_warnings INSERT INTO t1 VALUES ('è°·å·ä¿ŠäºŒã¨ç”³ã—ã¾ã™ãŒã€ã‚¤ãƒ³ã‚¿ãƒ¼ãƒãƒƒãƒˆäºˆç´„ã®ä¼šå“¡ç™»éŒ²ã‚’ã—ã¾ã—ãŸã¨ã“ã‚ã€ãƒ¡ãƒ¼ãƒ«ã‚¢ãƒ‰ãƒ¬ã‚¹ã‚’é–“é•ãˆã¦ã—ã¾ã„会員IDãŒå—ã‘å–ã‚‹ã“ã¨ãŒå‡ºæ¥ã¾ã›ã‚“ã§ã—ãŸã€‚é–“é•ãˆã‚¢ãƒ‰ãƒ¬ã‚¹ã¯tani-shun@n.vodafone.ne.jpを書ãè¾¼ã¿ã¾ã—ãŸã€‚ã©ã†ã™ã‚Œã°ã‚ˆã„ã§ã™ã‹ï¼Ÿ ãã®ä»–ã€ä½æ‰€ç­‰ã¯é–“é•ãˆã‚ã‚Šã¾ã›ã‚“。連絡ãã ã•ã„。よã‚ã—ããŠé¡˜ã„ã—ã¾ã™ã€‚m(__)m','040312-000057'); INSERT INTO t1 VALUES ('aaa','bbb'); --sorted_result SELECT length(subject) FROM t1; SELECT length(subject) FROM t1 ORDER BY 1; DROP TABLE t1; # # Bug #5832 SELECT doesn't return records in some cases # if (!$is_heap) { eval CREATE TABLE t1 ( id int unsigned NOT NULL auto_increment, list_id smallint unsigned NOT NULL, term TEXT NOT NULL, PRIMARY KEY(id), INDEX(list_id, term(4)) ) ENGINE=$engine CHARSET=utf8mb4; INSERT INTO t1 SET list_id = 1, term = "letterc"; INSERT INTO t1 SET list_id = 1, term = "letterb"; INSERT INTO t1 SET list_id = 1, term = "lettera"; INSERT INTO t1 SET list_id = 1, term = "letterd"; SELECT id FROM t1 WHERE (list_id = 1) AND (term = "letterc"); SELECT id FROM t1 WHERE (list_id = 1) AND (term = "letterb"); SELECT id FROM t1 WHERE (list_id = 1) AND (term = "lettera"); SELECT id FROM t1 WHERE (list_id = 1) AND (term = "letterd"); DROP TABLE t1; # # Bug #6043 erratic searching for diacriticals in indexed MyISAM UTF-8 table # SET NAMES latin1; eval CREATE TABLE t1 ( id int unsigned NOT NULL auto_increment, list_id smallint unsigned NOT NULL, term text NOT NULL, PRIMARY KEY(id), INDEX(list_id, term(19)) ) ENGINE=$engine CHARSET=utf8mb4; INSERT INTO t1 set list_id = 1, term = "testétest"; INSERT INTO t1 set list_id = 1, term = "testetest"; INSERT INTO t1 set list_id = 1, term = "testètest"; SELECT id, term FROM t1 where (list_id = 1) AND (term = "testétest"); SELECT id, term FROM t1 where (list_id = 1) AND (term = "testetest"); SELECT id, term FROM t1 where (list_id = 1) AND (term = "testètest"); DROP TABLE t1; } # # Bug #6019 SELECT tries to use too short prefix index on utf8mb4 data # set names utf8mb4; --disable_warnings eval create table t1 ( a int primary key, b varchar(6), index b3(b(3)) ) engine=$engine character set=utf8mb4; --enable_warnings insert into t1 values(1,'foo'),(2,'foobar'); --sorted_result select * from t1 where b like 'foob%'; --disable_query_log set @ctype_save_sql_mode=@@sql_mode; set sql_mode=""; --enable_query_log --disable_warnings alter table t1 engine=innodb; --enable_warnings --disable_query_log set sql_mode=@ctype_save_sql_mode; --enable_query_log --sorted_result select * from t1 where b like 'foob%'; drop table t1; # # Test for calculate_interval_lengths() function # eval create table t1 ( a enum('петÑ','ваÑÑ','анюта') character set utf8mb4 not null default 'анюта', b set('петÑ','ваÑÑ','анюта') character set utf8mb4 not null default 'анюта' ) engine $engine; eval create table t2 engine $engine select concat(a,_utf8mb4'') as a, concat(b,_utf8mb4'')as b from t1; show create table t2; drop table t2; drop table t1; # # Bug #6787 LIKE not working properly with _ and utf8mb4 data # select 'c' like '\_' as want0; # # SUBSTR with negative offset didn't work with multi-byte strings # SELECT SUBSTR('ваÑÑ',-2); # # Bug #7730 Server crash using soundex on an utf8mb4 table # eval create table t1 (id integer, a varchar(100) character set utf8mb4 collate utf8mb4_unicode_ci) engine $engine; insert into t1 values (1, 'Test'); select * from t1 where soundex(a) = soundex('Test'); select * from t1 where soundex(a) = soundex('TEST'); select * from t1 where soundex(a) = soundex('test'); drop table t1; # # Bug#22638 SOUNDEX broken for international characters # select soundex(_utf8mb4 0xE99885E8A788E99A8FE697B6E69BB4E696B0E79A84E696B0E997BB); select hex(soundex(_utf8mb4 0xE99885E8A788E99A8FE697B6E69BB4E696B0E79A84E696B0E997BB)); select soundex(_utf8mb4 0xD091D092D093); select hex(soundex(_utf8mb4 0xD091D092D093)); SET collation_connection='utf8mb4_general_ci'; -- source include/ctype_filesort.inc -- source include/ctype_like_escape.inc -- source include/ctype_german.inc SET collation_connection='utf8mb4_bin'; -- source include/ctype_filesort.inc -- source include/ctype_like_escape.inc # # Bug #7874 CONCAT() gives wrong results mixing # latin1 field and utf8mb4 string literals # eval CREATE TABLE t1 ( user varchar(255) NOT NULL default '' ) ENGINE=$engine DEFAULT CHARSET=latin1; INSERT INTO t1 VALUES ('one'),('two'); SELECT CHARSET('a'); --sorted_result SELECT user, CONCAT('<', user, '>') AS c FROM t1; DROP TABLE t1; # # Bug#8785 # the same problem with the above, but with nested CONCATs # eval create table t1 (f1 varchar(1) not null) default charset utf8mb4 engine $engine; insert into t1 values (''), (''); select concat(concat(_latin1'->',f1),_latin1'<-') from t1; drop table t1; # # Bug#8385: utf8mb4_general_ci treats Cyrillic letters I and SHORT I as the same # select convert(_koi8r'É' using utf8mb4) < convert(_koi8r'Ê' using utf8mb4); # # Bugs#5980: NULL requires a characterset in a union # set names latin1; eval create table t1 (a varchar(10)) character set utf8mb4 engine $engine; insert into t1 values ('test'); select ifnull(a,'') from t1; drop table t1; select repeat(_utf8mb4'+',3) as h union select NULL; select ifnull(NULL, _utf8mb4'string'); # # Bug#9509 Optimizer: wrong result after AND with comparisons # set names utf8mb4; eval create table t1 (s1 char(5) character set utf8mb4 collate utf8mb4_lithuanian_ci) engine $engine; insert into t1 values ('I'),('K'),('Y'); --sorted_result select * from t1 where s1 < 'K' and s1 = 'Y'; --sorted_result select * from t1 where 'K' > s1 and s1 = 'Y'; drop table t1; eval create table t1 (s1 char(5) character set utf8mb4 collate utf8mb4_czech_ci) engine $engine; insert into t1 values ('c'),('d'),('h'),('ch'),('CH'),('cH'),('Ch'),('i'); --sorted_result select * from t1 where s1 > 'd' and s1 = 'CH'; --sorted_result select * from t1 where 'd' < s1 and s1 = 'CH'; --sorted_result select * from t1 where s1 = 'cH' and s1 <> 'ch'; --sorted_result select * from t1 where 'cH' = s1 and s1 <> 'ch'; drop table t1; # # Bug#10714: Inserting double value into utf8mb4 column crashes server # eval create table t1 (a varchar(255)) default character set utf8mb4 engine $engine; insert into t1 values (1.0); drop table t1; # # Bug#10253 compound index length and utf8mb4 char set # produces invalid query results # eval create table t1 ( id int not null, city varchar(20) not null, key (city(7),id) ) character set=utf8mb4 engine $engine; insert into t1 values (1,'Durban North'); insert into t1 values (2,'Durban'); select * from t1 where city = 'Durban'; select * from t1 where city = 'Durban '; drop table t1; # # Bug #11819 CREATE TABLE with a SET DEFAULT 0 and UTF8 crashes server. # --error 1067 eval create table t1 (x set('A', 'B') default 0) character set utf8mb4 engine $engine; --error 1067 eval create table t1 (x enum('A', 'B') default 0) character set utf8mb4 engine $engine; # # Test for bug #11167: join for utf8mb4 varchar value longer than 255 bytes # SET NAMES UTF8; eval CREATE TABLE t1 ( `id` int(20) NOT NULL auto_increment, `country` varchar(100) NOT NULL default '', `shortcode` varchar(100) NOT NULL default '', `operator` varchar(100) NOT NULL default '', `momid` varchar(30) NOT NULL default '', `keyword` varchar(160) NOT NULL default '', `content` varchar(160) NOT NULL default '', `second_token` varchar(160) default NULL, `gateway_id` int(11) NOT NULL default '0', `created` datetime NOT NULL default '0000-00-00 00:00:00', `msisdn` varchar(15) NOT NULL default '', PRIMARY KEY (`id`), UNIQUE KEY `MSCCSPK_20030521130957121` (`momid`), KEY `IX_mobile_originated_message_keyword` (`keyword`), KEY `IX_mobile_originated_message_created` (`created`), KEY `IX_mobile_originated_message_support` (`msisdn`,`momid`,`keyword`,`gateway_id`,`created`) ) ENGINE=$engine DEFAULT CHARSET=utf8mb4; INSERT INTO t1 VALUES (1,'blah','464','aaa','fkc1c9ilc20x0hgae7lx6j09','ERR','ERR Имри.Ðфимим.Ðеимимримдмримрмрирор имримримримр имридм ирбднримрфмририримрфмфмим.Ðд.Д имдимримрад.Ðдимримримрмдиримримримр м.Дадимфшьмримд им.Ðдимимрн имадми','ИМРИ.ÐФИМИМ.ÐЕИМИМРИМДМРИМРМРИРОР',3,'2005-06-01 17:30:43','1234567890'), (2,'blah','464','aaa','haxpl2ilc20x00bj4tt2m5ti','11','11 g','G',3,'2005-06-02 22:43:10','1234567890'); --disable_warnings eval CREATE TABLE t2 ( `msisdn` varchar(15) NOT NULL default '', `operator_id` int(11) NOT NULL default '0', `created` datetime NOT NULL default '0000-00-00 00:00:00', UNIQUE KEY `PK_user` (`msisdn`) ) ENGINE=$engine DEFAULT CHARSET=utf8mb4; --enable_warnings INSERT INTO t2 VALUES ('1234567890',2,'2005-05-24 13:53:25'); SELECT content, t2.msisdn FROM t1, t2 WHERE t1.msisdn = '1234567890'; DROP TABLE t1,t2; # # Bug#11591: CHAR column with utf8mb4 does not work properly # (more chars than expected) # eval create table t1 (a char(20) character set utf8mb4) engine $engine; insert into t1 values ('123456'),('андрей'); SET STATEMENT sql_mode = 'NO_ENGINE_SUBSTITUTION' FOR alter table t1 modify a char(2) character set utf8mb4; select char_length(a), length(a), a from t1 order by a; drop table t1; # # Bugs#12611 # ESCAPE + LIKE do not work when the escape char is a multibyte one # set names utf8mb4; select 'andre%' like 'andreñ%' escape 'ñ'; # # Bugs#11754: SET NAMES utf8mb4 followed by SELECT "A\\" LIKE "A\\" returns 0 # set names utf8mb4; select 'a\\' like 'a\\'; select 'aa\\' like 'a%\\'; eval create table t1 (a char(10), key(a)) character set utf8mb4 engine $engine; insert into t1 values ("a"),("abc"),("abcd"),("hello"),("test"); --sorted_result select * from t1 where a like "abc%"; --sorted_result select * from t1 where a like concat("abc","%"); --sorted_result select * from t1 where a like "ABC%"; select * from t1 where a like "test%"; select * from t1 where a like "te_t"; --sorted_result select * from t1 where a like "%a%"; --sorted_result select * from t1 where a like "%abcd%"; select * from t1 where a like "%abc\d%"; drop table t1; # # Bug#9557 MyISAM utf8mb4 table crash # eval CREATE TABLE t1 ( a varchar(255) NOT NULL default '', KEY a (a) ) ENGINE=$engine DEFAULT CHARSET=utf8mb4 COLLATE utf8mb4_general_ci; insert into t1 values (_utf8mb4 0xe880bd); insert into t1 values (_utf8mb4 0x5b); --sorted_result select hex(a) from t1; drop table t1; # # Bug#13751 find_in_set: Illegal mix of collations # set names 'latin1'; eval create table t1 (a varchar(255)) default charset=utf8mb4 engine $engine; select * from t1 where find_in_set('-1', a); drop table t1; # # Bug#13233: select distinct char(column) fails with utf8mb4 # eval create table t1 (a int) engine $engine; insert into t1 values (48),(49),(50); set names utf8mb4; --sorted_result select distinct char(a) from t1; drop table t1; if (!$is_heap) { # # Bug#15581: COALESCE function truncates mutli-byte TINYTEXT values # eval CREATE TABLE t1 (t TINYTEXT CHARACTER SET utf8mb4) ENGINE $engine; INSERT INTO t1 VALUES(REPEAT('a', 100)); eval CREATE TEMPORARY TABLE t2 ENGINE $engine SELECT COALESCE(t) AS bug FROM t1; SELECT LENGTH(bug) FROM t2; DROP TABLE t2; DROP TABLE t1; } # # Bug#17313: N'xxx' and _utf8mb4'xxx' are not equivalent # eval CREATE TABLE t1 (item varchar(255)) default character set utf8mb4 ENGINE $engine; INSERT INTO t1 VALUES (N'\\'); INSERT INTO t1 VALUES (_utf8mb4'\\'); INSERT INTO t1 VALUES (N'Cote d\'Ivoire'); INSERT INTO t1 VALUES (_utf8mb4'Cote d\'Ivoire'); SELECT item FROM t1 ORDER BY item; DROP TABLE t1; # # Bug#17705: Corruption of compressed index when index length changes between # 254 and 256 # SET NAMES utf8mb4; DROP TABLE IF EXISTS t1; eval CREATE TABLE t1(a VARCHAR(255), KEY(a)) ENGINE=$engine DEFAULT CHARSET=utf8mb4; INSERT INTO t1 VALUES('uuABCDEFGHIGKLMNOPRSTUVWXYZ̈bbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbb'); INSERT INTO t1 VALUES('uu'); check table t1; INSERT INTO t1 VALUES('uU'); check table t1; INSERT INTO t1 VALUES('uu'); check table t1; INSERT INTO t1 VALUES('uuABC'); check table t1; INSERT INTO t1 VALUES('UuABC'); check table t1; INSERT INTO t1 VALUES('uuABC'); check table t1; alter table t1 add b int; INSERT INTO t1 VALUES('uuABCDEFGHIGKLMNOPRSTUVWXYZ̈bbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbb',1); INSERT INTO t1 VALUES('uuABCDEFGHIGKLMNOPRSTUVWXYZ̈bbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbb',2); delete from t1 where b=1; INSERT INTO t1 VALUES('UUABCDEFGHIGKLMNOPRSTUVWXYZ̈bbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbb',1); check table t1; INSERT INTO t1 VALUES('uuABCDEFGHIGKLMNOPRSTUVWXYZ̈bbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbb',3); INSERT INTO t1 VALUES('uuABCDEFGHIGKLMNOPRSTUVWXYZ̈bbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbb',4); delete from t1 where b=3; INSERT INTO t1 VALUES('uUABCDEFGHIGKLMNOPRSTUVWXYZ̈bbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbb',3); check table t1; drop table t1; # # Bug#20471 LIKE search fails with indexed utf8mb4 char column # set names utf8mb4; eval create table t1 (s1 char(5) character set utf8mb4) engine $engine; insert into t1 values ('a'),('b'),(null),('ペテルグル'),('ü'),('Y'); create index it1 on t1 (s1); select s1 as before_delete_general_ci from t1 where s1 like 'ペテ%'; delete from t1 where s1 = 'Y'; select s1 as after_delete_general_ci from t1 where s1 like 'ペテ%'; drop table t1; set names utf8mb4; eval create table t1 (s1 char(5) character set utf8mb4 collate utf8mb4_unicode_ci) engine $engine; insert into t1 values ('a'),('b'),(null),('ペテルグル'),('ü'),('Y'); create index it1 on t1 (s1); select s1 as before_delete_unicode_ci from t1 where s1 like 'ペテ%'; delete from t1 where s1 = 'Y'; select s1 as after_delete_unicode_ci from t1 where s1 like 'ペテ%'; drop table t1; set names utf8mb4; eval create table t1 (s1 char(5) character set utf8mb4 collate utf8mb4_bin) engine $engine; insert into t1 values ('a'),('b'),(null),('ペテルグル'),('ü'),('Y'); create index it1 on t1 (s1); select s1 as before_delete_bin from t1 where s1 like 'ペテ%'; delete from t1 where s1 = 'Y'; select s1 as after_delete_bin from t1 where s1 like 'ペテ%'; drop table t1; # additional tests from duplicate bug#20744 MySQL return no result set names utf8mb4; --disable_warnings eval create table t1 (a varchar(30) not null primary key) engine=$engine default character set utf8mb4 collate utf8mb4_general_ci; --enable_warnings insert into t1 values ('ã‚ã„ã†ãˆãŠã‹ããã‘ã“ã•ã—ã™ã›ã'); insert into t1 values ('ã•ã—ã™ã›ãã‹ããã‘ã“ã‚ã„ã†ãˆãŠ'); select a as gci1 from t1 where a like 'ã•ã—ã™ã›ãã‹ããã‘ã“ã‚ã„ã†ãˆãŠ%'; select a as gci2 from t1 where a like 'ã‚ã„ã†ãˆãŠã‹ããã‘ã“ã•ã—ã™ã›ã'; drop table t1; set names utf8mb4; --disable_warnings eval create table t1 (a varchar(30) not null primary key) engine=$engine default character set utf8mb4 collate utf8mb4_unicode_ci; --enable_warnings insert into t1 values ('ã‚ã„ã†ãˆãŠã‹ããã‘ã“ã•ã—ã™ã›ã'); insert into t1 values ('ã•ã—ã™ã›ãã‹ããã‘ã“ã‚ã„ã†ãˆãŠ'); select a as uci1 from t1 where a like 'ã•ã—ã™ã›ãã‹ããã‘ã“ã‚ã„ã†ãˆãŠ%'; select a as uci2 from t1 where a like 'ã‚ã„ã†ãˆãŠã‹ããã‘ã“ã•ã—ã™ã›ã'; drop table t1; set names utf8mb4; --disable_warnings eval create table t1 (a varchar(30) not null primary key) engine=$engine default character set utf8mb4 collate utf8mb4_bin; --enable_warnings insert into t1 values ('ã‚ã„ã†ãˆãŠã‹ããã‘ã“ã•ã—ã™ã›ã'); insert into t1 values ('ã•ã—ã™ã›ãã‹ããã‘ã“ã‚ã„ã†ãˆãŠ'); select a as bin1 from t1 where a like 'ã•ã—ã™ã›ãã‹ããã‘ã“ã‚ã„ã†ãˆãŠ%'; select a as bin2 from t1 where a like 'ã‚ã„ã†ãˆãŠã‹ããã‘ã“ã•ã—ã™ã›ã'; drop table t1; # # Bug#14896: Comparison with a key in a partial index over mb chararacter field # SET NAMES utf8mb4; eval CREATE TABLE t1 (id int PRIMARY KEY, a varchar(16) collate utf8mb4_unicode_ci NOT NULL default '', b int, f varchar(128) default 'XXX', INDEX (a(4)) ) ENGINE=$engine DEFAULT CHARSET=utf8mb4 COLLATE=utf8mb4_unicode_ci; INSERT INTO t1(id, a, b) VALUES (1, 'cccc', 50), (2, 'cccc', 70), (3, 'cccc', 30), (4, 'cccc', 30), (5, 'cccc', 20), (6, 'bbbbbb', 40), (7, 'dddd', 30), (8, 'aaaa', 10), (9, 'aaaa', 50), (10, 'eeeee', 40), (11, 'bbbbbb', 60); --sorted_result SELECT id, a, b FROM t1; --sorted_result SELECT id, a, b FROM t1 WHERE a BETWEEN 'aaaa' AND 'bbbbbb'; --sorted_result SELECT id, a FROM t1 WHERE a='bbbbbb'; SELECT id, a FROM t1 WHERE a='bbbbbb' ORDER BY b; DROP TABLE t1; # # Bug#16674: LIKE predicate for a utf8mb4 character set column # SET NAMES utf8mb4; eval CREATE TABLE t1 ( a CHAR(13) DEFAULT '', INDEX(a) ) ENGINE=$engine DEFAULT CHARSET=utf8mb4 COLLATE=utf8mb4_general_ci; INSERT INTO t1 VALUES ('Käli Käli 2-4'), ('Käli Käli 2-4'), ('Käli Käli 2+4'), ('Käli Käli 2+4'), ('Käli Käli 2-6'), ('Käli Käli 2-6'); INSERT INTO t1 SELECT * FROM t1; eval CREATE TABLE t2 ( a CHAR(13) DEFAULT '', INDEX(a) ) ENGINE=$engine DEFAULT CHARSET=latin1 COLLATE=latin1_general_ci; INSERT INTO t2 VALUES ('Kali Kali 2-4'), ('Kali Kali 2-4'), ('Kali Kali 2+4'), ('Kali Kali 2+4'), ('Kali Kali 2-6'), ('Kali Kali 2-6'); INSERT INTO t2 SELECT * FROM t2; SELECT a FROM t1 WHERE a LIKE 'Käli Käli 2+4'; SELECT a FROM t2 WHERE a LIKE 'Kali Kali 2+4'; EXPLAIN SELECT a FROM t1 WHERE a LIKE 'Käli Käli 2+4'; EXPLAIN SELECT a FROM t1 WHERE a = 'Käli Käli 2+4'; EXPLAIN SELECT a FROM t2 WHERE a LIKE 'Kali Kali 2+4'; EXPLAIN SELECT a FROM t2 WHERE a = 'Kali Kali 2+4'; DROP TABLE t1,t2; eval CREATE TABLE t1 ( a char(255) DEFAULT '', KEY(a(10)) ) ENGINE=$engine DEFAULT CHARSET=utf8mb4 COLLATE=utf8mb4_general_ci; INSERT INTO t1 VALUES ('Käli Käli 2-4'); SELECT * FROM t1 WHERE a LIKE 'Käli Käli 2%'; INSERT INTO t1 VALUES ('Käli Käli 2-4'); SELECT * FROM t1 WHERE a LIKE 'Käli Käli 2%'; DROP TABLE t1; eval CREATE TABLE t1 ( a char(255) DEFAULT '' ) ENGINE=$engine DEFAULT CHARSET=utf8mb4 COLLATE=utf8mb4_general_ci; INSERT INTO t1 VALUES ('Käli Käli 2-4'); INSERT INTO t1 VALUES ('Käli Käli 2-4'); SELECT * FROM t1 WHERE a LIKE 'Käli Käli 2%'; ALTER TABLE t1 ADD KEY (a(10)); SELECT * FROM t1 WHERE a LIKE 'Käli Käli 2%'; DROP TABLE t1; # # Bug#18359: LIKE predicate for a 'utf8mb4' text column with a partial index # (see bug #16674 as well) # SET NAMES latin2; if (!$is_heap) { eval CREATE TABLE t1 ( id int(11) NOT NULL default '0', tid int(11) NOT NULL default '0', val text NOT NULL, INDEX idx(tid, val(10)) ) ENGINE=$engine DEFAULT CHARSET=utf8mb4; INSERT INTO t1 VALUES (40988,72,'VOLNÝ ADSL'),(41009,72,'VOLNÝ ADSL'), (41032,72,'VOLNÝ ADSL'),(41038,72,'VOLNÝ ADSL'), (41063,72,'VOLNÝ ADSL'),(41537,72,'VOLNÝ ADSL Office'), (42141,72,'VOLNÝ ADSL'),(42565,72,'VOLNÝ ADSL Combi'), (42749,72,'VOLNÝ ADSL'),(44205,72,'VOLNÝ ADSL'); SELECT * FROM t1 WHERE tid=72 and val LIKE 'VOLNY ADSL'; SELECT * FROM t1 WHERE tid=72 and val LIKE 'VOLNÝ ADSL'; SELECT * FROM t1 WHERE tid=72 and val LIKE '%VOLNÝ ADSL'; ALTER TABLE t1 DROP KEY idx; ALTER TABLE t1 ADD KEY idx (tid,val(11)); SELECT * FROM t1 WHERE tid=72 and val LIKE 'VOLNÝ ADSL'; DROP TABLE t1; } # # Bug 20709: problem with utf8mb4 fields in temporary tables # eval create table t1(a char(200) collate utf8mb4_unicode_ci NOT NULL default '') default charset=utf8mb4 collate=utf8mb4_unicode_ci engine $engine; insert into t1 values (unhex('65')), (unhex('C3A9')), (unhex('65')); explain select distinct a from t1; SELECT COUNT(*) FROM (SELECT DISTINCT a FROM t1) AS t2; explain select a from t1 group by a; SELECT COUNT(*) FROM (SELECT a FROM t1 GROUP BY a) AS t2; drop table t1; # # Bug #20204: "order by" changes the results returned # eval create table t1(a char(10)) default charset utf8mb4 engine $engine; insert into t1 values ('123'), ('456'); explain select substr(Z.a,-1), Z.a from t1 as Y join t1 as Z on Y.a=Z.a order by 1; select substr(Z.a,-1), Z.a from t1 as Y join t1 as Z on Y.a=Z.a order by 1; drop table t1; # # Bug #34349: Passing invalid parameter to CHAR() in an ORDER BY causes # MySQL to hang # SET CHARACTER SET utf8mb4; --source include/default_charset.inc SHOW VARIABLES LIKE 'character\_set\_%'; SET @@character_set_server=@save_character_set_server; CREATE DATABASE crashtest DEFAULT CHARACTER SET utf8mb4 COLLATE utf8mb4_bin; USE crashtest; eval CREATE TABLE crashtest (crash char(10)) DEFAULT CHARSET=utf8mb4 ENGINE $engine; INSERT INTO crashtest VALUES ('35'), ('36'), ('37'); SELECT * FROM crashtest ORDER BY CHAR(crash USING utf8mb4); INSERT INTO crashtest VALUES ('-1000'); EXPLAIN SELECT * FROM crashtest ORDER BY CHAR(crash USING utf8mb4); SELECT * FROM crashtest ORDER BY CHAR(crash USING utf8mb4); DROP TABLE crashtest; DROP DATABASE crashtest; USE test; SET CHARACTER SET default; # End of 4.1 tests # # Test for bug #11484: wrong results for a DISTINCT varchar column in uft8. # eval CREATE TABLE t1(id varchar(20) NOT NULL) DEFAULT CHARSET=utf8mb4 ENGINE $engine; INSERT INTO t1 VALUES ('xxx'), ('aa'), ('yyy'), ('aa'); --sorted_result SELECT id FROM t1; --sorted_result SELECT DISTINCT id FROM t1; SELECT DISTINCT id FROM t1 ORDER BY id; DROP TABLE t1; # # Bug#20095 Changing length of VARCHAR field with UTF8 # collation does not truncate values # eval create table t1 ( a varchar(26) not null ) default character set utf8mb4 ENGINE $engine; insert into t1 (a) values ('abcdefghijklmnopqrstuvwxyz'); select * from t1; # varchar to varchar SET STATEMENT sql_mode = 'NO_ENGINE_SUBSTITUTION' FOR alter table t1 change a a varchar(20) character set utf8mb4 not null; select * from t1; # varchar to char SET STATEMENT sql_mode = 'NO_ENGINE_SUBSTITUTION' FOR alter table t1 change a a char(15) character set utf8mb4 not null; select * from t1; # char to char SET STATEMENT sql_mode = 'NO_ENGINE_SUBSTITUTION' FOR alter table t1 change a a char(10) character set utf8mb4 not null; select * from t1; # char to varchar SET STATEMENT sql_mode = 'NO_ENGINE_SUBSTITUTION' FOR alter table t1 change a a varchar(5) character set utf8mb4 not null; select * from t1; drop table t1; # # Check that do_varstring2_mb produces a warning # eval create table t1 ( a varchar(4000) not null ) default character set utf8mb4 engine $engine; insert into t1 values (repeat('a',4000)); SET STATEMENT sql_mode = 'NO_ENGINE_SUBSTITUTION' FOR alter table t1 change a a varchar(3000) character set utf8mb4 not null; select length(a) from t1; drop table t1; # # Bug#10504: Character set does not support traditional mode # Bug#14146: CHAR(...USING ...) and CONVERT(CHAR(...) USING...) # produce different results # set names utf8mb4; # correct value select hex(char(1 using utf8mb4)); select char(0xd1,0x8f using utf8mb4); select char(0xd18f using utf8mb4); select char(53647 using utf8mb4); # incorrect value: return with warning select char(0xff,0x8f using utf8mb4); select convert(char(0xff,0x8f) using utf8mb4); # incorrect value in strict mode: return NULL with "Error" level warning set sql_mode=traditional; select char(0xff,0x8f using utf8mb4); select char(195 using utf8mb4); select char(196 using utf8mb4); select char(2557 using utf8mb4); select convert(char(0xff,0x8f) using utf8mb4); # # Check convert + char + using # select hex(convert(char(2557 using latin1) using utf8mb4)); # # char() without USING returns "binary" by default, any argument is ok # select hex(char(195)); select hex(char(196)); select hex(char(2557)); # # Bug#12891: UNION doesn't return DISTINCT result for multi-byte characters # set names utf8mb4; eval create table t1 (a char(1)) default character set utf8mb4 engine $engine; eval create table t2 (a char(1)) default character set utf8mb4 engine $engine; insert into t1 values('a'),('a'),(0xE38182),(0xE38182); insert into t1 values('i'),('i'),(0xE38184),(0xE38184); --sorted_result select * from t1 union distinct select * from t2; drop table t1,t2; # # Bug#12371: executing prepared statement fails (illegal mix of collations) # set names utf8mb4; eval create table t1 (a char(10), b varchar(10)) engine $engine; insert into t1 values ('bar','kostja'); insert into t1 values ('kostja','bar'); prepare my_stmt from "select * from t1 where a=?"; set @a:='bar'; execute my_stmt using @a; set @a:='kostja'; execute my_stmt using @a; set @a:=null; execute my_stmt using @a; drop table if exists t1; # # Bug#21505 Create view - illegal mix of collation for operation 'UNION' # --disable_warnings drop table if exists t1; drop view if exists v1, v2; --enable_warnings set names utf8mb4; eval create table t1(col1 varchar(12) character set utf8mb4 collate utf8mb4_unicode_ci) engine $engine; insert into t1 values('t1_val'); create view v1 as select 'v1_val' as col1; select coercibility(col1), collation(col1) from v1; create view v2 as select col1 from v1 union select col1 from t1; select coercibility(col1), collation(col1)from v2; drop view v1, v2; create view v1 as select 'v1_val' collate utf8mb4_swedish_ci as col1; select coercibility(col1), collation(col1) from v1; create view v2 as select col1 from v1 union select col1 from t1; select coercibility(col1), collation(col1) from v2; drop view v1, v2; drop table t1; # # Check conversion of NCHAR strings to subset (e.g. latin1). # Conversion is possible if string repertoire is ASCII. # Conversion is not possible if the string have extended characters # set names utf8mb4; eval create table t1 (a varchar(10) character set latin1, b int) engine $engine; insert into t1 values ('a',1); select concat(a, if(b>10, N'x', N'y')) from t1; --error 1267 select concat(a, if(b>10, N'æ', N'ß')) from t1; drop table t1; # Conversion tests for character set introducers set names utf8mb4; eval create table t1 (a varchar(10) character set latin1, b int) engine $engine; insert into t1 values ('a',1); select concat(a, if(b>10, _utf8mb4'x', _utf8mb4'y')) from t1; --error 1267 select concat(a, if(b>10, _utf8mb4'æ', _utf8mb4'ß')) from t1; drop table t1; # Conversion tests for introducer + HEX string set names utf8mb4; eval create table t1 (a varchar(10) character set latin1, b int) engine $engine; insert into t1 values ('a',1); select concat(a, if(b>10, _utf8mb4 0x78, _utf8mb4 0x79)) from t1; --error 1267 select concat(a, if(b>10, _utf8mb4 0xC3A6, _utf8mb4 0xC3AF)) from t1; drop table t1; # Conversion tests for "text_literal TEXT_STRING_literal" syntax structure set names utf8mb4; eval create table t1 (a varchar(10) character set latin1, b int) engine $engine; insert into t1 values ('a',1); select concat(a, if(b>10, 'x' 'x', 'y' 'y')) from t1; --error 1267 select concat(a, if(b>10, 'x' 'æ', 'y' 'ß')) from t1; drop table t1; # # Bug#19960: Inconsistent results when joining # InnoDB tables using partial UTF8 indexes # --disable_warnings eval CREATE TABLE t1 ( colA int(11) NOT NULL, colB varchar(255) character set utf8mb4 NOT NULL, PRIMARY KEY (colA) ) ENGINE=$engine DEFAULT CHARSET=latin1; --enable_warnings INSERT INTO t1 (colA, colB) VALUES (1, 'foo'), (2, 'foo bar'); --disable_warnings eval CREATE TABLE t2 ( colA int(11) NOT NULL, colB varchar(255) character set utf8mb4 NOT NULL, KEY bad (colA,colB(3)) ) ENGINE=$engine DEFAULT CHARSET=latin1; --enable_warnings INSERT INTO t2 (colA, colB) VALUES (1, 'foo'),(2, 'foo bar'); SELECT * FROM t1 JOIN t2 ON t1.colA=t2.colA AND t1.colB=t2.colB WHERE t1.colA < 3; DROP TABLE t1, t2; # # Bug#29205: truncation of UTF8 values when the UNION statement # forces collation to the binary charset # SELECT 'н1234567890' UNION SELECT _binary '1'; SELECT 'н1234567890' UNION SELECT 1; SELECT '1' UNION SELECT 'н1234567890'; SELECT 1 UNION SELECT 'н1234567890'; eval CREATE TABLE t1 (c VARCHAR(11)) CHARACTER SET utf8mb4 ENGINE $engine; eval CREATE TABLE t2 (b CHAR(1) CHARACTER SET binary, i INT) ENGINE $engine; INSERT INTO t1 (c) VALUES ('н1234567890'); INSERT INTO t2 (b, i) VALUES ('1', 1); SELECT c FROM t1 UNION SELECT b FROM t2; SELECT c FROM t1 UNION SELECT i FROM t2; SELECT b FROM t2 UNION SELECT c FROM t1; SELECT i FROM t2 UNION SELECT c FROM t1; DROP TABLE t1, t2; # # Bug#30982: CHAR(..USING..) can return a not-well-formed string # Bug #30986: Character set introducer followed by a HEX string can return bad result # set sql_mode=traditional; select hex(char(0xFF using utf8mb4)); select hex(convert(0xFF using utf8mb4)); --error ER_INVALID_CHARACTER_STRING select hex(_utf8mb4 0x616263FF); --error ER_INVALID_CHARACTER_STRING select hex(_utf8mb4 X'616263FF'); --error ER_INVALID_CHARACTER_STRING select hex(_utf8mb4 B'001111111111'); --error ER_INVALID_CHARACTER_STRING select (_utf8mb4 X'616263FF'); set sql_mode=default; select hex(char(0xFF using utf8mb4)); select hex(convert(0xFF using utf8mb4)); --error ER_INVALID_CHARACTER_STRING select hex(_utf8mb4 0x616263FF); --error ER_INVALID_CHARACTER_STRING select hex(_utf8mb4 X'616263FF'); --error ER_INVALID_CHARACTER_STRING select hex(_utf8mb4 B'001111111111'); --error ER_INVALID_CHARACTER_STRING select (_utf8mb4 X'616263FF'); # # Bug #36772: When using UTF8, CONVERT with GROUP BY returns truncated results # eval CREATE TABLE t1 (a INT NOT NULL, b INT NOT NULL) ENGINE $engine; INSERT INTO t1 VALUES (70000, 1092), (70001, 1085), (70002, 1065); --sorted_result SELECT CONVERT(a, CHAR), CONVERT(b, CHAR) FROM t1 GROUP BY b; --sorted_result SELECT CONVERT(a, CHAR), CONVERT(b, CHAR) FROM t1; ALTER TABLE t1 ADD UNIQUE (b); --sorted_result SELECT CONVERT(a, CHAR), CONVERT(b, CHAR) FROM t1 GROUP BY b; DROP INDEX b ON t1; --sorted_result SELECT CONVERT(a, CHAR), CONVERT(b, CHAR) FROM t1 GROUP BY b; ALTER TABLE t1 ADD INDEX (b); --sorted_result SELECT CONVERT(a, CHAR), CONVERT(b, CHAR) from t1 GROUP BY b; DROP TABLE t1; --echo # --echo # Bug#26474: Add Sinhala script (Sri Lanka) collation to MySQL --echo # --disable_warnings DROP TABLE IF EXISTS t1; --enable_warnings eval CREATE TABLE t1 ( predicted_order int NOT NULL, utf8mb4_encoding VARCHAR(10) NOT NULL ) CHARACTER SET utf8mb4 ENGINE $engine; INSERT INTO t1 VALUES (19, x'E0B696'), (30, x'E0B69AE0B798'), (61, x'E0B6AF'), (93, x'E0B799'), (52, x'E0B6A6'), (73, x'E0B6BBE0B78AE2808D'), (3, x'E0B686'), (56, x'E0B6AA'), (55, x'E0B6A9'), (70, x'E0B6B9'), (94, x'E0B79A'), (80, x'E0B785'), (25, x'E0B69AE0B791'), (48, x'E0B6A2'), (13, x'E0B690'), (86, x'E0B793'), (91, x'E0B79F'), (81, x'E0B786'), (79, x'E0B784'), (14, x'E0B691'), (99, x'E0B78A'), (8, x'E0B68B'), (68, x'E0B6B7'), (22, x'E0B69A'), (16, x'E0B693'), (33, x'E0B69AE0B7B3'), (38, x'E0B69AE0B79D'), (21, x'E0B683'), (11, x'E0B68E'), (77, x'E0B782'), (40, x'E0B69AE0B78A'), (101, x'E0B78AE2808DE0B6BB'), (35, x'E0B69AE0B79A'), (1, x'E0B7B4'), (9, x'E0B68C'), (96, x'E0B79C'), (6, x'E0B689'), (95, x'E0B79B'), (88, x'E0B796'), (64, x'E0B6B3'), (26, x'E0B69AE0B792'), (82, x'E0B78F'), (28, x'E0B69AE0B794'), (39, x'E0B69AE0B79E'), (97, x'E0B79D'), (2, x'E0B685'), (75, x'E0B780'), (34, x'E0B69AE0B799'), (69, x'E0B6B8'), (83, x'E0B790'), (18, x'E0B695'), (90, x'E0B7B2'), (17, x'E0B694'), (72, x'E0B6BB'), (66, x'E0B6B5'), (59, x'E0B6AD'), (44, x'E0B69E'), (15, x'E0B692'), (23, x'E0B69AE0B78F'), (65, x'E0B6B4'), (42, x'E0B69C'), (63, x'E0B6B1'), (85, x'E0B792'), (47, x'E0B6A1'), (49, x'E0B6A3'), (92, x'E0B7B3'), (78, x'E0B783'), (36, x'E0B69AE0B79B'), (4, x'E0B687'), (24, x'E0B69AE0B790'), (87, x'E0B794'), (37, x'E0B69AE0B79C'), (32, x'E0B69AE0B79F'), (29, x'E0B69AE0B796'), (43, x'E0B69D'), (62, x'E0B6B0'), (100, x'E0B78AE2808DE0B6BA'), (60, x'E0B6AE'), (45, x'E0B69F'), (12, x'E0B68F'), (46, x'E0B6A0'), (50, x'E0B6A5'), (51, x'E0B6A4'), (5, x'E0B688'), (76, x'E0B781'), (89, x'E0B798'), (74, x'E0B6BD'), (10, x'E0B68D'), (57, x'E0B6AB'), (71, x'E0B6BA'), (58, x'E0B6AC'), (27, x'E0B69AE0B793'), (54, x'E0B6A8'), (84, x'E0B791'), (31, x'E0B69AE0B7B2'), (98, x'E0B79E'), (53, x'E0B6A7'), (41, x'E0B69B'), (67, x'E0B6B6'), (7, x'E0B68A'), (20, x'E0B682'); SELECT predicted_order, hex(utf8mb4_encoding) FROM t1 ORDER BY utf8mb4_encoding COLLATE utf8mb4_sinhala_ci; DROP TABLE t1; --echo # --echo # Bug#32914 Character sets: illegal characters in utf8mb4 and utf32 columns --echo # eval create table t1 (utf8mb4 char(1) character set utf8mb4) engine $engine; --echo Testing [F0][90..BF][80..BF][80..BF] insert into t1 values (0xF0908080); insert into t1 values (0xF0BFBFBF); insert ignore into t1 values (0xF08F8080); --sorted_result select hex(utf8mb4) from t1; delete from t1; --echo Testing [F2..F3][80..BF][80..BF][80..BF] insert into t1 values (0xF2808080); insert into t1 values (0xF2BFBFBF); --sorted_result select hex(utf8mb4) from t1; delete from t1; --echo Testing [F4][80..8F][80..BF][80..BF] insert into t1 values (0xF4808080); insert into t1 values (0xF48F8080); insert ignore into t1 values (0xF4908080); --sorted_result select hex(utf8mb4) from t1; drop table t1; --echo # --echo # Check strnxfrm() with odd length --echo # set max_sort_length=65; select @@max_sort_length; eval create table t1 (a varchar(128) character set utf8mb4 collate utf8mb4_general_ci) engine $engine; insert into t1 values ('a'),('b'),('c'); select * from t1 order by a; alter table t1 modify a varchar(128) character set utf8mb4 collate utf8mb4_bin; select * from t1 order by a; drop table t1; set max_sort_length=default; --echo # --echo # Bug#26180: Can't add columns to tables created with utf8mb4 text indexes --echo # if (!$is_heap) { eval CREATE TABLE t1 ( clipid INT NOT NULL, Tape TINYTEXT, PRIMARY KEY (clipid), KEY tape(Tape(255)) ) CHARACTER SET=utf8mb4 ENGINE $engine; ALTER TABLE t1 ADD mos TINYINT DEFAULT 0 AFTER clipid; SHOW CREATE TABLE t1; DROP TABLE t1; } #--echo # #--echo # Check that supplementary characters are not allowed in identifiers #--echo # # TODO: activate this when system_charset_info is changed to utf8mb4 #--error 1300 #CREATE DATABASE `ð€€`; #--error 1300 #CREATE TABLE `ð€€` (a int); #--error 1166 #CREATE TABLE test.t1 SELECT 'ð€€'; #--error 1300 #CREATE USER `ð€€`; --echo # --echo # Testing 4-byte values. --echo # --disable_warnings DROP TABLE IF EXISTS t1; --enable_warnings eval CREATE TABLE t1 ( u_decimal int NOT NULL, utf8mb4_encoding VARCHAR(10) NOT NULL ) CHARACTER SET utf8mb4 ENGINE $engine; # Source of the following values: http://www.fileformat.info/info/unicode/block/index.htm # SINGLE BARLINE INSERT INTO t1 VALUES (119040, x'f09d8480'), # G CLEF (119070, x'f09d849e'), # HALF NOTE (119134, x'f09d859e'), # MUSICAL SYMBOL CROIX (119247, x'f09d878f'), # MATHEMATICAL BOLD ITALIC CAPITAL DELTA (120607, x'f09d9c9f'), # SANS-SERIF BOLD ITALIC CAPITAL PI (120735, x'f09d9e9f'), # (last 4 byte character) (1114111, x'f48fbfbf'), # VARIATION SELECTOR-256 (917999, x'f3a087af'); # All from musical chars INSERT INTO t1 VALUES (119070, x'f09d849ef09d859ef09d859ef09d8480f09d859ff09d859ff09d859ff09d85a0f09d85a0f09d8480'); # Mix of 3-byte and 4-byte chars INSERT INTO t1 VALUES (65131, x'efb9abf09d849ef09d859ef09d859ef09d8480f09d859fefb9abefb9abf09d85a0efb9ab'); # All from musical chars, but 11 instead of 10 chars. truncated INSERT IGNORE INTO t1 VALUES (119070, x'f09d849ef09d859ef09d859ef09d8480f09d859ff09d859ff09d859ff09d85a0f09d85a0f09d8480f09d85a0'); --sorted_result SELECT u_decimal, hex(utf8mb4_encoding) FROM t1 ORDER BY utf8mb4_encoding COLLATE utf8mb4_general_ci, BINARY utf8mb4_encoding; # First invalid 4 byte value INSERT IGNORE INTO t1 VALUES (1114111, x'f5808080'); --sorted_result SELECT character_maximum_length, character_octet_length FROM information_schema.columns WHERE table_name= 't1' AND column_name= 'utf8mb4_encoding'; --disable_warnings DROP TABLE IF EXISTS t2; --enable_warnings eval CREATE TABLE t2 ( u_decimal int NOT NULL, utf8mb3_encoding VARCHAR(10) NOT NULL ) CHARACTER SET utf8mb3 ENGINE $engine; # LATIN CAPITAL LETTER VEND INSERT INTO t2 VALUES (42856, x'ea9da8'); # SMALL COMMERCIAL AT INSERT INTO t2 VALUES (65131, x'efb9ab'); # (last 4 byte character) INSERT IGNORE INTO t2 VALUES (1114111, x'f48fbfbf'); --sorted_result SELECT character_maximum_length, character_octet_length FROM information_schema.columns WHERE table_name= 't2' AND column_name= 'utf8mb3_encoding'; # Update a 3-byte char col with a 4-byte char, error UPDATE IGNORE t2 SET utf8mb3_encoding= x'f48fbfbd' where u_decimal= 42856; # Update to a 3-byte char casted to 4-byte, error? UPDATE t2 SET utf8mb3_encoding= _utf8mb4 x'ea9da8' where u_decimal= 42856; # Returns utfmb4 --sorted_result SELECT HEX(CONCAT(utf8mb4_encoding, _utf8 x'ea9da8')) FROM t1; --sorted_result SELECT HEX(CONCAT(utf8mb4_encoding, utf8mb3_encoding)) FROM t1,t2; #--error ER_INVALID_CHARACTER_STRING #SELECT CONCAT(_utf8 utf8mb4_encoding, _utf8 '|') FROM t1; #--error ER_INVALID_CHARACTER_STRING #SELECT CONCAT(_utf8mb3 utf8mb4_encoding, _utf8 '|') FROM t1; SELECT count(*) FROM t1, t2 WHERE t1.utf8mb4_encoding > t2.utf8mb3_encoding; # Alter from 4-byte charset to 3-byte charset, error --disable_warnings SET STATEMENT sql_mode = 'NO_ENGINE_SUBSTITUTION' FOR ALTER TABLE t1 CONVERT TO CHARACTER SET utf8; --enable_warnings SHOW CREATE TABLE t1; --sorted_result SELECT u_decimal,hex(utf8mb4_encoding),utf8mb4_encoding FROM t1; # Alter table from utf8 to utf8mb4 ALTER TABLE t2 CONVERT TO CHARACTER SET utf8mb4; SHOW CREATE TABLE t2; --sorted_result SELECT u_decimal,hex(utf8mb3_encoding) FROM t2; # Alter table back from utf8mb4 to utf8 ALTER TABLE t2 CONVERT TO CHARACTER SET utf8mb3; SHOW CREATE TABLE t2; --sorted_result SELECT u_decimal,hex(utf8mb3_encoding) FROM t2; # ALter of utf8mb4 column to utf8 --disable_warnings ALTER TABLE t1 MODIFY utf8mb4_encoding VARCHAR(10) CHARACTER SET utf8mb3; --enable_warnings SHOW CREATE TABLE t1; --sorted_result SELECT u_decimal,hex(utf8mb4_encoding) FROM t1; # ALter of utf8 column to utf8mb4 ALTER TABLE t1 MODIFY utf8mb4_encoding VARCHAR(10) CHARACTER SET utf8mb4; SHOW CREATE TABLE t1; --sorted_result SELECT u_decimal,hex(utf8mb4_encoding) FROM t1; # ALter of utf8 column to utf8mb4 ALTER TABLE t2 MODIFY utf8mb3_encoding VARCHAR(10) CHARACTER SET utf8mb4; SHOW CREATE TABLE t2; --sorted_result SELECT u_decimal,hex(utf8mb3_encoding) FROM t2; --disable_warnings DROP TABLE IF EXISTS t3; --enable_warnings eval CREATE TABLE t3 ( u_decimal int NOT NULL, utf8mb3_encoding VARCHAR(10) NOT NULL ) CHARACTER SET utf8 ENGINE $engine; # Insert select utf8mb4 (4-byte) into utf8 (3-byte), error #--error ER_INVALID_CHARACTER_STRING INSERT INTO t3 SELECT * FROM t1; --disable_warnings DROP TABLE IF EXISTS t4; --enable_warnings eval CREATE TABLE t4 ( u_decimal int NOT NULL, utf8mb4_encoding VARCHAR(10) NOT NULL ) CHARACTER SET utf8mb4 ENGINE $engine; # Insert select utf8 (3-byte) into utf8mb4 (4-byte) INSERT INTO t3 SELECT * FROM t2; DROP TABLE t1; DROP TABLE t2; DROP TABLE t3; DROP TABLE t4; --echo # --echo # Testing that mixing utf8 and utf8mb4 collations returns utf8mb4 --echo # SELECT CHARSET(CONCAT(_utf8mb4'a',_utf8'b')); eval CREATE TABLE t1 (utf8mb4 VARCHAR(10) CHARACTER SET utf8mb4 NOT NULL) ENGINE $engine; INSERT INTO t1 VALUES (x'ea9da8'),(x'f48fbfbf'); SELECT CONCAT(utf8mb4, _utf8 x'ea9da8') FROM t1 LIMIT 0; eval CREATE TABLE t2 (utf8mb3 VARCHAR(10) CHARACTER SET utf8mb3 NOT NULL) ENGINE $engine; INSERT INTO t2 VALUES (x'ea9da8'); SELECT HEX(CONCAT(utf8mb4, utf8mb3)) FROM t1,t2 ORDER BY 1; SELECT CHARSET(CONCAT(utf8mb4, utf8mb3)) FROM t1, t2 LIMIT 1; eval CREATE TEMPORARY TABLE t3 ENGINE $engine AS SELECT *, concat(utf8mb4,utf8mb3) FROM t1, t2; SHOW CREATE TABLE t3; DROP TEMPORARY TABLE t3; SELECT * FROM t1, t2 WHERE t1.utf8mb4 > t2.utf8mb3; SELECT * FROM t1, t2 WHERE t1.utf8mb4 = t2.utf8mb3; SELECT * FROM t1, t2 WHERE t1.utf8mb4 < t2.utf8mb3; DROP TABLE t1; DROP TABLE t2; --echo # --echo # Check that mixing utf8mb4 with an invalid utf8 constant returns error --echo # # This should perhaps be changed to return ER_INVALID_CHARACTER_STRING eval CREATE TABLE t1 (utf8mb4 VARCHAR(10) CHARACTER SET utf8mb4) ENGINE $engine; INSERT INTO t1 VALUES (x'f48fbfbf'); --error ER_CANT_AGGREGATE_2COLLATIONS SELECT CONCAT(utf8mb4, _utf8 '¿') FROM t1; --error ER_CANT_AGGREGATE_2COLLATIONS SELECT CONCAT('a', _utf8 '¿') FROM t1; DROP TABLE t1; --echo # --echo # End of 5.5 tests --echo # --echo # --echo # ctype_utf8mb4.inc: Start of 10.1 tests --echo # --echo # --echo # MDEV-8417 utf8mb4: compare broken bytes as "greater than any non-broken character" --echo # CREATE TABLE t1 ( id INT NOT NULL AUTO_INCREMENT PRIMARY KEY, a VARCHAR(10) CHARACTER SET utf8mb4, KEY(a,id) ); INSERT INTO t1 (a) VALUES (0x61); INSERT INTO t1 (a) VALUES (0xC280),(0xDFBF); INSERT INTO t1 (a) VALUES (0xE0A080),(0xEFBFBF); INSERT INTO t1 (a) VALUES (0xF0908080),(0xF48FBFBF); SELECT id,HEX(a) FROM t1 ORDER BY a,id; SELECT id,HEX(a) FROM t1 ORDER BY a DESC,id DESC; SELECT COUNT(DISTINCT a) FROM t1; ALTER TABLE t1 MODIFY a VARCHAR(10) CHARACTER SET utf8mb4 COLLATE utf8mb4_bin; SELECT id,HEX(a) FROM t1 ORDER BY a; SELECT id,HEX(a) FROM t1 ORDER BY a DESC,id DESC; SELECT COUNT(DISTINCT a) FROM t1; DROP TABLE t1; --echo # --echo # ctype_utf8mb4.inc: End of 10.1 tests --echo # --echo # --echo # End of ctype_utf8mb4.inc --echo #