Skip to content

Commit

Permalink
[fix](outfile) add regression test for outfile (#44734)
Browse files Browse the repository at this point in the history
### What problem does this PR solve?
Problem Summary:

add regression test for this pr: #43929

TODO:
Support to export data of doris NULL type to orc file format.
  • Loading branch information
BePPPower authored and Your Name committed Nov 30, 2024
1 parent 88926d2 commit 4ecd550
Show file tree
Hide file tree
Showing 2 changed files with 148 additions and 0 deletions.
37 changes: 37 additions & 0 deletions regression-test/data/export_p0/outfile/test_outfile_null_type.out
Original file line number Diff line number Diff line change
@@ -0,0 +1,37 @@
-- This file is automatically generated. You should know what you did if you want to edit this
-- !select_export --
1 ftw-1 19
2 ftw-2 20
3 ftw-3 21
4 ftw-4 22
5 ftw-5 23
6 ftw-6 24
7 ftw-7 25
8 ftw-8 26
9 ftw-9 27
10 \N \N

-- !select_load_parquet --
1 ftw-1 19 \N
10 \N \N \N
2 ftw-2 20 \N
3 ftw-3 21 \N
4 ftw-4 22 \N
5 ftw-5 23 \N
6 ftw-6 24 \N
7 ftw-7 25 \N
8 ftw-8 26 \N
9 ftw-9 27 \N

-- !select_load_csv --
1 ftw-1 19 \N
10 \N \N \N
2 ftw-2 20 \N
3 ftw-3 21 \N
4 ftw-4 22 \N
5 ftw-5 23 \N
6 ftw-6 24 \N
7 ftw-7 25 \N
8 ftw-8 26 \N
9 ftw-9 27 \N

111 changes: 111 additions & 0 deletions regression-test/suites/export_p0/outfile/test_outfile_null_type.groovy
Original file line number Diff line number Diff line change
@@ -0,0 +1,111 @@
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.

suite("test_outfile_null_type", "p0") {
String ak = getS3AK()
String sk = getS3SK()
String s3_endpoint = getS3Endpoint()
String region = getS3Region()
String bucket = context.config.otherConfigs.get("s3BucketName");

def export_table_name = "test_outfile_null_type"
def outFilePath = "${bucket}/outfile/null_type/exp_"

def outfile_to_S3 = { format ->
// select ... into outfile ...
def res = sql """
SELECT *, NULL AS null_col FROM ${export_table_name} t
INTO OUTFILE "s3://${outFilePath}"
FORMAT AS ${format}
PROPERTIES (
"s3.endpoint" = "${s3_endpoint}",
"s3.region" = "${region}",
"s3.secret_key"="${sk}",
"s3.access_key" = "${ak}"
);
"""

return res[0][3]
}

sql """ DROP TABLE IF EXISTS ${export_table_name} """
sql """
CREATE TABLE `${export_table_name}` (
`id` int(11) NULL,
`Name` string NULL,
`age` int(11) NULL
) ENGINE=OLAP
DISTRIBUTED BY HASH(`id`)
PROPERTIES (
"replication_num" = "1"
);
"""

StringBuilder sb = new StringBuilder()
int i = 1
for (; i < 10; i ++) {
sb.append("""
(${i}, 'ftw-${i}', ${i + 18}),
""")
}
sb.append("""
(${i}, NULL, NULL)
""")
sql """ INSERT INTO ${export_table_name} VALUES
${sb.toString()}
"""
def insert_res = sql "show last insert;"
logger.info("insert result: " + insert_res.toString())
qt_select_export """ SELECT * FROM ${export_table_name} t ORDER BY id; """

// parquet file format
def format = "parquet"
def outfile_url = outfile_to_S3("${format}")
order_qt_select_load_parquet """ SELECT * FROM S3 (
"uri" = "http://${bucket}.${s3_endpoint}${outfile_url.substring(5 + bucket.length(), outfile_url.length() - 1)}0.${format}",
"ACCESS_KEY"= "${ak}",
"SECRET_KEY" = "${sk}",
"format" = "${format}",
"region" = "${region}"
);
"""

// TODO(ftw): orc supports to export data of NULL type.
// orc file foramt
// format = "orc"
// outfile_url = outfile_to_S3("${format}")
// qt_select_load_orc """ SELECT * FROM S3 (
// "uri" = "http://${bucket}.${s3_endpoint}${outfile_url.substring(5 + bucket.length(), outfile_url.length() - 1)}0.${format}",
// "ACCESS_KEY"= "${ak}",
// "SECRET_KEY" = "${sk}",
// "format" = "${format}",
// "region" = "${region}"
// );
// """

// csv file foramt
format = "csv"
outfile_url = outfile_to_S3("${format}")
order_qt_select_load_csv """ SELECT * FROM S3 (
"uri" = "http://${bucket}.${s3_endpoint}${outfile_url.substring(5 + bucket.length(), outfile_url.length() - 1)}0.${format}",
"ACCESS_KEY"= "${ak}",
"SECRET_KEY" = "${sk}",
"format" = "${format}",
"region" = "${region}"
);
"""
}

0 comments on commit 4ecd550

Please sign in to comment.