From b8f8d0a3798e5b2bd7a056396499baabe162f656 Mon Sep 17 00:00:00 2001 From: Socrates Date: Wed, 20 Nov 2024 23:43:46 +0800 Subject: [PATCH 1/3] fix refreshOnlyCatalogCache when use_meta_cache = false --- .../main/java/org/apache/doris/datasource/ExternalCatalog.java | 1 + 1 file changed, 1 insertion(+) diff --git a/fe/fe-core/src/main/java/org/apache/doris/datasource/ExternalCatalog.java b/fe/fe-core/src/main/java/org/apache/doris/datasource/ExternalCatalog.java index 34525410834506..23e6d68954edfb 100644 --- a/fe/fe-core/src/main/java/org/apache/doris/datasource/ExternalCatalog.java +++ b/fe/fe-core/src/main/java/org/apache/doris/datasource/ExternalCatalog.java @@ -418,6 +418,7 @@ private void refreshOnlyCatalogCache(boolean invalidCache) { if (useMetaCache.get() && metaCache != null) { metaCache.invalidateAll(); } else if (!useMetaCache.get()) { + this.initialized = false; for (ExternalDatabase db : idToDb.values()) { db.setUnInitialized(invalidCache); } From 9ad7cdcdd6b855c9a4004b516cf0209bf796f90b Mon Sep 17 00:00:00 2001 From: Socrates Date: Thu, 21 Nov 2024 16:17:55 +0800 Subject: [PATCH 2/3] add regression --- .../hive/test_hive_use_meta_cache.out | 122 +++++++++++- .../hive/test_hive_use_meta_cache.groovy | 174 +++++++++++------- 2 files changed, 225 insertions(+), 71 deletions(-) diff --git a/regression-test/data/external_table_p0/hive/test_hive_use_meta_cache.out b/regression-test/data/external_table_p0/hive/test_hive_use_meta_cache.out index a5fc7ede82b8be..9db486e2066f17 100644 --- a/regression-test/data/external_table_p0/hive/test_hive_use_meta_cache.out +++ b/regression-test/data/external_table_p0/hive/test_hive_use_meta_cache.out @@ -28,15 +28,24 @@ test_use_meta_cache_db_hive test_use_meta_cache_tbl_hive -- !sql08 -- -test_use_meta_cache_tbl_hive -- !sql09 -- +p1=part1 +p1=part2 -- !sql10 -- -test_use_meta_cache_db_hive +p1=part1 +p1=part2 -- !sql11 -- +-- !sql12 -- + +-- !sql13 -- +test_use_meta_cache_db_hive + +-- !sql14 -- + -- !sql01 -- -- !sql02 -- @@ -61,17 +70,126 @@ test_use_meta_cache_db_hive -- !sql05 -- -- !sql06 -- +test_use_meta_cache_tbl_hive -- !sql07 -- test_use_meta_cache_tbl_hive -- !sql08 -- + +-- !sql09 -- +p1=part1 +p1=part2 + +-- !sql10 -- +p1=part1 +p1=part2 + +-- !sql11 -- +test_use_meta_cache_partitioned_tbl_hive +test_use_meta_cache_tbl_hive + +-- !sql12 -- + +-- !sql13 -- +test_use_meta_cache_db_hive + +-- !sql14 -- + +-- !sql01 -- + +-- !sql02 -- +test_use_meta_cache_db + +-- !sql03 -- +test_use_meta_cache_tbl + +-- !sql04 -- + +-- !sql05 -- + +-- !sql01 -- + +-- !sql02 -- + +-- !sql03 -- +test_use_meta_cache_db_hive + +-- !sql04 -- + +-- !sql05 -- + +-- !sql06 -- + +-- !sql07 -- test_use_meta_cache_tbl_hive +-- !sql08 -- + -- !sql09 -- +p1=part1 +p1=part2 -- !sql10 -- +p1=part1 +p1=part2 + +-- !sql11 -- + +-- !sql12 -- + +-- !sql13 -- +test_use_meta_cache_db_hive + +-- !sql14 -- + +-- !sql01 -- + +-- !sql02 -- +test_use_meta_cache_db + +-- !sql03 -- +test_use_meta_cache_tbl + +-- !sql04 -- + +-- !sql05 -- + +-- !sql01 -- + +-- !sql02 -- + +-- !sql03 -- test_use_meta_cache_db_hive +-- !sql04 -- + +-- !sql05 -- + +-- !sql06 -- +test_use_meta_cache_tbl_hive + +-- !sql07 -- +test_use_meta_cache_tbl_hive + +-- !sql08 -- + +-- !sql09 -- +p1=part1 +p1=part2 + +-- !sql10 -- +p1=part1 +p1=part2 + -- !sql11 -- +test_use_meta_cache_partitioned_tbl_hive +test_use_meta_cache_tbl_hive + +-- !sql12 -- + +-- !sql13 -- +test_use_meta_cache_db_hive + +-- !sql14 -- diff --git a/regression-test/suites/external_table_p0/hive/test_hive_use_meta_cache.groovy b/regression-test/suites/external_table_p0/hive/test_hive_use_meta_cache.groovy index 3562ce3126725d..ed7bf20d807ee7 100644 --- a/regression-test/suites/external_table_p0/hive/test_hive_use_meta_cache.groovy +++ b/regression-test/suites/external_table_p0/hive/test_hive_use_meta_cache.groovy @@ -23,80 +23,116 @@ suite("test_hive_use_meta_cache", "p0,external,hive,external_docker,external_doc return; } - for (String hivePrefix : ["hive3", "hive3"]) { + for (String hivePrefix : ["hive2", "hive3"]) { setHivePrefix(hivePrefix) try { - String hms_port = context.config.otherConfigs.get(hivePrefix + "HmsPort") - String hdfs_port = context.config.otherConfigs.get(hivePrefix + "HdfsPort") - String catalog = "test_${hivePrefix}_use_meta_cache" - String externalEnvIp = context.config.otherConfigs.get("externalEnvIp") + def test_use_meta_cache = { Boolean use_meta_cache -> + String hms_port = context.config.otherConfigs.get(hivePrefix + "HmsPort") + String hdfs_port = context.config.otherConfigs.get(hivePrefix + "HdfsPort") + String use_meta_cache_string = use_meta_cache ? "true" : "false" + String catalog = "test_${hivePrefix}_use_meta_cache_${use_meta_cache}" + String externalEnvIp = context.config.otherConfigs.get("externalEnvIp") - sql """drop catalog if exists ${catalog}""" - sql """create catalog if not exists ${catalog} properties ( - 'type'='hms', - 'hive.metastore.uris' = 'thrift://${externalEnvIp}:${hms_port}', - 'fs.defaultFS' = 'hdfs://${externalEnvIp}:${hdfs_port}', - 'use_meta_cache' = 'true' - );""" + sql """drop catalog if exists ${catalog}""" + sql """create catalog if not exists ${catalog} properties ( + 'type'='hms', + 'hive.metastore.uris' = 'thrift://${externalEnvIp}:${hms_port}', + 'fs.defaultFS' = 'hdfs://${externalEnvIp}:${hdfs_port}', + 'use_meta_cache' = '${use_meta_cache_string}' + );""" + + // create from Doris, the cache will be filled immediately + String database= "test_use_meta_cache_db" + String table = "test_use_meta_cache_tbl" + String database_hive = "test_use_meta_cache_db_hive" + String table_hive = "test_use_meta_cache_tbl_hive" + String partitioned_table_hive = "test_use_meta_cache_partitioned_tbl_hive" + + sql "switch ${catalog}" + sql "drop database if exists ${database}" + sql "drop database if exists ${database_hive}" + order_qt_sql01 "show databases like '%${database}%'"; + sql "drop database if exists ${database}" + sql "create database ${database}" + order_qt_sql02 "show databases like '%${database}%'"; + sql "use ${database}" + sql "create table ${table} (k1 int)" + order_qt_sql03 "show tables" + sql "drop table ${table}" + order_qt_sql04 "show tables" + sql "drop database ${database}" + order_qt_sql05 "show databases like '%${database}%'"; - // create from Doris, the cache will be filled immediately - String database= "test_use_meta_cache_db" - String table = "test_use_meta_cache_tbl" - String database_hive = "test_use_meta_cache_db_hive" - String table_hive = "test_use_meta_cache_tbl_hive" - sql "switch ${catalog}" - sql "drop database if exists ${database}" - sql "drop database if exists ${database_hive}" - order_qt_sql01 "show databases like '%${database}%'"; - sql "drop database if exists ${database}" - sql "create database ${database}" - order_qt_sql02 "show databases like '%${database}%'"; - sql "use ${database}" - sql "create table ${table} (k1 int)" - order_qt_sql03 "show tables" - sql "drop table ${table}" - order_qt_sql04 "show tables" - sql "drop database ${database}" - order_qt_sql05 "show databases like '%${database}%'"; - - // create from Hive, the cache has different behavior - order_qt_sql01 "show databases like '%${database_hive}%'"; - hive_docker "drop database if exists ${database_hive}" - hive_docker "create database ${database_hive}" - // not see - order_qt_sql02 "show databases like '%${database_hive}%'"; - // but can use - sql "use ${database_hive}" - sql "refresh catalog ${catalog}" - // can see - order_qt_sql03 "show databases like '%${database_hive}%'"; - // show tables first to fill cache - order_qt_sql04 "show tables" - hive_docker "create table ${database_hive}.${table_hive} (k1 int)" - // not see - order_qt_sql05 "show tables" - // but can select - sql "select * from ${table_hive}" - // still not see - order_qt_sql06 "show tables" - sql "refresh database ${database_hive}" - // can see - order_qt_sql07 "show tables" - hive_docker "drop table ${database_hive}.${table_hive}" - // still can see - order_qt_sql08 "show tables" - sql "refresh database ${database_hive}" - // can not see - order_qt_sql09 "show tables" - hive_docker "drop database ${database_hive}" - // still can see - order_qt_sql10 "show databases like '%${database_hive}%'"; - sql "refresh catalog ${catalog}" - // can not see - order_qt_sql11 "show databases like '%${database_hive}%'"; + // create from Hive, the cache has different behavior + order_qt_sql01 "show databases like '%${database_hive}%'"; + hive_docker "drop database if exists ${database_hive}" + hive_docker "create database ${database_hive}" + // not see + order_qt_sql02 "show databases like '%${database_hive}%'"; + if (use_meta_cache) { + // if use meta cache, can use + sql "use ${database_hive}" + sql "refresh catalog ${catalog}" + } else { + // if not use meta cache, can not use + sql "refresh catalog ${catalog}" + sql "use ${database_hive}" + } + + // can see + order_qt_sql03 "show databases like '%${database_hive}%'"; + // show tables first to fill cache + order_qt_sql04 "show tables" + hive_docker "create table ${database_hive}.${table_hive} (k1 int)" + // not see + order_qt_sql05 "show tables" + if (use_meta_cache) { + // but can select + sql "select * from ${table_hive}" + // still not see + order_qt_sql06 "show tables" + sql "refresh database ${database_hive}" + } else { + // if not use meta cache, can not select + sql "refresh database ${database_hive}" + sql "select * from ${table_hive}" + order_qt_sql06 "show tables" + } + // can see + order_qt_sql07 "show tables" + + // test Hive Metastore table partition file listing + hive_docker "create table ${database_hive}.${partitioned_table_hive} (k1 int) partitioned by (p1 string)" + sql "refresh catalog ${catalog}" + order_qt_sql08 "show partitions from ${partitioned_table_hive}" + hive_docker "alter table ${database_hive}.${partitioned_table_hive} add partition (p1='part1')" + hive_docker "alter table ${database_hive}.${partitioned_table_hive} add partition (p1='part2')" + // cant not see + order_qt_sql09 "show partitions from ${partitioned_table_hive}" + sql "refresh database ${database_hive}" + // can see + order_qt_sql10 "show partitions from ${partitioned_table_hive}" + + // drop tables + hive_docker "drop table ${database_hive}.${partitioned_table_hive}" + hive_docker "drop table ${database_hive}.${table_hive}" + // still can see + order_qt_sql11 "show tables" + sql "refresh database ${database_hive}" + // can not see + order_qt_sql12 "show tables" + + // drop database + hive_docker "drop database ${database_hive}" + // still can see + order_qt_sql13 "show databases like '%${database_hive}%'"; + sql "refresh catalog ${catalog}" + // can not see + order_qt_sql14 "show databases like '%${database_hive}%'"; + } + test_use_meta_cache(true) + test_use_meta_cache(false) } finally { } } } - - From d08e68f725392a6e6b88cb70de9e32fbc17a7a92 Mon Sep 17 00:00:00 2001 From: Socrates Date: Thu, 21 Nov 2024 16:27:38 +0800 Subject: [PATCH 3/3] fix --- .../hive/test_hive_use_meta_cache.out | 32 +++++-------------- .../hive/test_hive_use_meta_cache.groovy | 13 +++----- 2 files changed, 13 insertions(+), 32 deletions(-) diff --git a/regression-test/data/external_table_p0/hive/test_hive_use_meta_cache.out b/regression-test/data/external_table_p0/hive/test_hive_use_meta_cache.out index 9db486e2066f17..4d54c601c876a2 100644 --- a/regression-test/data/external_table_p0/hive/test_hive_use_meta_cache.out +++ b/regression-test/data/external_table_p0/hive/test_hive_use_meta_cache.out @@ -34,17 +34,13 @@ p1=part1 p1=part2 -- !sql10 -- -p1=part1 -p1=part2 -- !sql11 -- -- !sql12 -- - --- !sql13 -- test_use_meta_cache_db_hive --- !sql14 -- +-- !sql13 -- -- !sql01 -- @@ -82,19 +78,15 @@ p1=part1 p1=part2 -- !sql10 -- -p1=part1 -p1=part2 - --- !sql11 -- test_use_meta_cache_partitioned_tbl_hive test_use_meta_cache_tbl_hive --- !sql12 -- +-- !sql11 -- --- !sql13 -- +-- !sql12 -- test_use_meta_cache_db_hive --- !sql14 -- +-- !sql13 -- -- !sql01 -- @@ -131,17 +123,13 @@ p1=part1 p1=part2 -- !sql10 -- -p1=part1 -p1=part2 -- !sql11 -- -- !sql12 -- - --- !sql13 -- test_use_meta_cache_db_hive --- !sql14 -- +-- !sql13 -- -- !sql01 -- @@ -179,17 +167,13 @@ p1=part1 p1=part2 -- !sql10 -- -p1=part1 -p1=part2 - --- !sql11 -- test_use_meta_cache_partitioned_tbl_hive test_use_meta_cache_tbl_hive --- !sql12 -- +-- !sql11 -- --- !sql13 -- +-- !sql12 -- test_use_meta_cache_db_hive --- !sql14 -- +-- !sql13 -- diff --git a/regression-test/suites/external_table_p0/hive/test_hive_use_meta_cache.groovy b/regression-test/suites/external_table_p0/hive/test_hive_use_meta_cache.groovy index ed7bf20d807ee7..df12fc74898f06 100644 --- a/regression-test/suites/external_table_p0/hive/test_hive_use_meta_cache.groovy +++ b/regression-test/suites/external_table_p0/hive/test_hive_use_meta_cache.groovy @@ -107,28 +107,25 @@ suite("test_hive_use_meta_cache", "p0,external,hive,external_docker,external_doc order_qt_sql08 "show partitions from ${partitioned_table_hive}" hive_docker "alter table ${database_hive}.${partitioned_table_hive} add partition (p1='part1')" hive_docker "alter table ${database_hive}.${partitioned_table_hive} add partition (p1='part2')" - // cant not see + // can see because partition file listing is not cached order_qt_sql09 "show partitions from ${partitioned_table_hive}" - sql "refresh database ${database_hive}" - // can see - order_qt_sql10 "show partitions from ${partitioned_table_hive}" // drop tables hive_docker "drop table ${database_hive}.${partitioned_table_hive}" hive_docker "drop table ${database_hive}.${table_hive}" // still can see - order_qt_sql11 "show tables" + order_qt_sql10 "show tables" sql "refresh database ${database_hive}" // can not see - order_qt_sql12 "show tables" + order_qt_sql11 "show tables" // drop database hive_docker "drop database ${database_hive}" // still can see - order_qt_sql13 "show databases like '%${database_hive}%'"; + order_qt_sql12 "show databases like '%${database_hive}%'"; sql "refresh catalog ${catalog}" // can not see - order_qt_sql14 "show databases like '%${database_hive}%'"; + order_qt_sql13 "show databases like '%${database_hive}%'"; } test_use_meta_cache(true) test_use_meta_cache(false)