io.prestosql.tests.hive.TestHiveStorageFormats Maven / Gradle / Ivy
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package io.prestosql.tests.hive;
import com.google.common.collect.ImmutableMap;
import io.prestosql.tempto.ProductTest;
import io.prestosql.tempto.assertions.QueryAssert.Row;
import io.prestosql.tempto.query.QueryResult;
import io.prestosql.tests.utils.JdbcDriverUtils;
import org.testng.annotations.DataProvider;
import org.testng.annotations.Test;
import java.sql.Connection;
import java.sql.SQLException;
import java.util.List;
import java.util.Locale;
import java.util.Map;
import static com.google.common.base.MoreObjects.toStringHelper;
import static com.google.common.collect.ImmutableList.toImmutableList;
import static io.prestosql.tempto.assertions.QueryAssert.Row.row;
import static io.prestosql.tempto.assertions.QueryAssert.assertThat;
import static io.prestosql.tempto.query.QueryExecutor.defaultQueryExecutor;
import static io.prestosql.tempto.query.QueryExecutor.query;
import static io.prestosql.tests.TestGroups.STORAGE_FORMATS;
import static io.prestosql.tests.utils.JdbcDriverUtils.setSessionProperty;
import static io.prestosql.tests.utils.QueryExecutors.onHive;
import static java.lang.String.format;
import static java.util.Objects.requireNonNull;
public class TestHiveStorageFormats
extends ProductTest
{
private static final String TPCH_SCHEMA = "tiny";
@DataProvider(name = "storage_formats")
public static Object[][] storageFormats()
{
return new StorageFormat[][] {
{storageFormat("ORC", ImmutableMap.of("hive.orc_optimized_writer_validate", "true"))},
{storageFormat("PARQUET")},
{storageFormat("RCBINARY", ImmutableMap.of("hive.rcfile_optimized_writer_validate", "true"))},
{storageFormat("RCTEXT", ImmutableMap.of("hive.rcfile_optimized_writer_validate", "true"))},
{storageFormat("SEQUENCEFILE")},
{storageFormat("TEXTFILE")},
{storageFormat("AVRO")}
};
}
@Test(dataProvider = "storage_formats", groups = {STORAGE_FORMATS})
public void testInsertIntoTable(StorageFormat storageFormat)
{
// only admin user is allowed to change session properties
setRole("admin");
setSessionProperties(storageFormat);
String tableName = "storage_formats_test_insert_into_" + storageFormat.getName().toLowerCase(Locale.ENGLISH);
query(format("DROP TABLE IF EXISTS %s", tableName));
String createTable = format(
"CREATE TABLE %s(" +
" orderkey BIGINT," +
" partkey BIGINT," +
" suppkey BIGINT," +
" linenumber INTEGER," +
" quantity DOUBLE," +
" extendedprice DOUBLE," +
" discount DOUBLE," +
" tax DOUBLE," +
" linestatus VARCHAR," +
" shipinstruct VARCHAR," +
" shipmode VARCHAR," +
" comment VARCHAR," +
" returnflag VARCHAR" +
") WITH (format='%s')",
tableName,
storageFormat.getName());
query(createTable);
String insertInto = format("INSERT INTO %s " +
"SELECT " +
"orderkey, partkey, suppkey, linenumber, quantity, extendedprice, discount, tax, " +
"linestatus, shipinstruct, shipmode, comment, returnflag " +
"FROM tpch.%s.lineitem", tableName, TPCH_SCHEMA);
query(insertInto);
assertSelect("select sum(tax), sum(discount), sum(linenumber) from %s", tableName);
query(format("DROP TABLE %s", tableName));
}
@Test(dataProvider = "storage_formats", groups = {STORAGE_FORMATS})
public void testCreateTableAs(StorageFormat storageFormat)
{
// only admin user is allowed to change session properties
setRole("admin");
setSessionProperties(storageFormat);
String tableName = "storage_formats_test_create_table_as_select_" + storageFormat.getName().toLowerCase(Locale.ENGLISH);
query(format("DROP TABLE IF EXISTS %s", tableName));
String createTableAsSelect = format(
"CREATE TABLE %s WITH (format='%s') AS " +
"SELECT " +
"partkey, suppkey, extendedprice " +
"FROM tpch.%s.lineitem",
tableName,
storageFormat.getName(),
TPCH_SCHEMA);
query(createTableAsSelect);
assertSelect("select sum(extendedprice), sum(suppkey), count(partkey) from %s", tableName);
query(format("DROP TABLE %s", tableName));
}
@Test(dataProvider = "storage_formats", groups = {STORAGE_FORMATS})
public void testInsertIntoPartitionedTable(StorageFormat storageFormat)
{
// only admin user is allowed to change session properties
setRole("admin");
setSessionProperties(storageFormat);
String tableName = "storage_formats_test_insert_into_partitioned_" + storageFormat.getName().toLowerCase(Locale.ENGLISH);
query(format("DROP TABLE IF EXISTS %s", tableName));
String createTable = format(
"CREATE TABLE %s(" +
" orderkey BIGINT," +
" partkey BIGINT," +
" suppkey BIGINT," +
" linenumber INTEGER," +
" quantity DOUBLE," +
" extendedprice DOUBLE," +
" discount DOUBLE," +
" tax DOUBLE," +
" linestatus VARCHAR," +
" shipinstruct VARCHAR," +
" shipmode VARCHAR," +
" comment VARCHAR," +
" returnflag VARCHAR" +
") WITH (format='%s', partitioned_by = ARRAY['returnflag'])",
tableName,
storageFormat.getName());
query(createTable);
String insertInto = format("INSERT INTO %s " +
"SELECT " +
"orderkey, partkey, suppkey, linenumber, quantity, extendedprice, discount, tax, " +
"linestatus, shipinstruct, shipmode, comment, returnflag " +
"FROM tpch.%s.lineitem", tableName, TPCH_SCHEMA);
query(insertInto);
assertSelect("select sum(tax), sum(discount), sum(length(returnflag)) from %s", tableName);
query(format("DROP TABLE %s", tableName));
}
@Test(dataProvider = "storage_formats", groups = {STORAGE_FORMATS})
public void testCreatePartitionedTableAs(StorageFormat storageFormat)
{
// only admin user is allowed to change session properties
setRole("admin");
setSessionProperties(storageFormat);
String tableName = "storage_formats_test_create_table_as_select_partitioned_" + storageFormat.getName().toLowerCase(Locale.ENGLISH);
query(format("DROP TABLE IF EXISTS %s", tableName));
String createTableAsSelect = format(
"CREATE TABLE %s WITH (format='%s', partitioned_by = ARRAY['returnflag']) AS " +
"SELECT " +
"tax, discount, returnflag " +
"FROM tpch.%s.lineitem",
tableName,
storageFormat.getName(),
TPCH_SCHEMA);
query(createTableAsSelect);
assertSelect("select sum(tax), sum(discount), sum(length(returnflag)) from %s", tableName);
query(format("DROP TABLE %s", tableName));
}
@Test(groups = {STORAGE_FORMATS})
public void testSnappyCompressedParquetTableCreatedInHive()
{
String tableName = "table_created_in_hive_parquet";
onHive().executeQuery("DROP TABLE IF EXISTS " + tableName);
onHive().executeQuery(format(
"CREATE TABLE %s (" +
" c_bigint BIGINT," +
" c_varchar VARCHAR(255))" +
"STORED AS PARQUET " +
"TBLPROPERTIES(\"parquet.compression\"=\"SNAPPY\")",
tableName));
onHive().executeQuery(format("INSERT INTO %s VALUES(1, 'test data')", tableName));
assertThat(query("SELECT * FROM " + tableName)).containsExactly(row(1, "test data"));
onHive().executeQuery("DROP TABLE " + tableName);
}
private static void assertSelect(String query, String tableName)
{
QueryResult expected = query(format(query, "tpch." + TPCH_SCHEMA + ".lineitem"));
List expectedRows = expected.rows().stream()
.map((columns) -> row(columns.toArray()))
.collect(toImmutableList());
QueryResult actual = query(format(query, tableName));
assertThat(actual)
.hasColumns(expected.getColumnTypes())
.containsExactly(expectedRows);
}
private static void setRole(String role)
{
Connection connection = defaultQueryExecutor().getConnection();
try {
JdbcDriverUtils.setRole(connection, role);
}
catch (SQLException e) {
throw new RuntimeException(e);
}
}
private static void setSessionProperties(StorageFormat storageFormat)
{
setSessionProperties(storageFormat.getSessionProperties());
}
private static void setSessionProperties(Map sessionProperties)
{
Connection connection = defaultQueryExecutor().getConnection();
try {
// create more than one split
setSessionProperty(connection, "task_writer_count", "4");
setSessionProperty(connection, "redistribute_writes", "false");
for (Map.Entry sessionProperty : sessionProperties.entrySet()) {
setSessionProperty(connection, sessionProperty.getKey(), sessionProperty.getValue());
}
}
catch (SQLException e) {
throw new RuntimeException(e);
}
}
private static StorageFormat storageFormat(String name)
{
return storageFormat(name, ImmutableMap.of());
}
private static StorageFormat storageFormat(String name, Map sessionProperties)
{
return new StorageFormat(name, sessionProperties);
}
private static class StorageFormat
{
private final String name;
private final Map sessionProperties;
private StorageFormat(String name, Map sessionProperties)
{
this.name = requireNonNull(name, "name is null");
this.sessionProperties = requireNonNull(sessionProperties, "sessionProperties is null");
}
public String getName()
{
return name;
}
public Map getSessionProperties()
{
return sessionProperties;
}
@Override
public String toString()
{
return toStringHelper(this)
.add("name", name)
.add("sessionProperties", sessionProperties)
.toString();
}
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy