[HUDI-1762] Added HiveStylePartitionExtractor to support Hive style partitions (#2769)
This commit is contained in:
committed by
GitHub
parent
cf3d2e21eb
commit
08e82c469c
@@ -0,0 +1,42 @@
|
|||||||
|
/*
|
||||||
|
* Licensed to the Apache Software Foundation (ASF) under one
|
||||||
|
* or more contributor license agreements. See the NOTICE file
|
||||||
|
* distributed with this work for additional information
|
||||||
|
* regarding copyright ownership. The ASF licenses this file
|
||||||
|
* to you under the Apache License, Version 2.0 (the
|
||||||
|
* "License"); you may not use this file except in compliance
|
||||||
|
* with the License. You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
|
||||||
|
package org.apache.hudi.hive;
|
||||||
|
|
||||||
|
import java.util.Collections;
|
||||||
|
import java.util.List;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Extractor for Hive Style Partitioned tables, when the parition folders are key value pairs.
|
||||||
|
*
|
||||||
|
* <p>This implementation extracts the partition value of yyyy-mm-dd from the path of type datestr=yyyy-mm-dd.
|
||||||
|
*/
|
||||||
|
public class HiveStylePartitionValueExtractor implements PartitionValueExtractor {
|
||||||
|
private static final long serialVersionUID = 1L;
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public List<String> extractPartitionValuesInPath(String partitionPath) {
|
||||||
|
// partition path is expected to be in this format partition_key=partition_value.
|
||||||
|
String[] splits = partitionPath.split("=");
|
||||||
|
if (splits.length != 2) {
|
||||||
|
throw new IllegalArgumentException(
|
||||||
|
"Partition path " + partitionPath + " is not in the form partition_key=partition_value.");
|
||||||
|
}
|
||||||
|
return Collections.singletonList(splits[1]);
|
||||||
|
}
|
||||||
|
}
|
||||||
@@ -35,4 +35,15 @@ public class TestPartitionValueExtractor {
|
|||||||
assertThrows(IllegalArgumentException.class, () -> hourPartition.extractPartitionValuesInPath("2020/12/20"));
|
assertThrows(IllegalArgumentException.class, () -> hourPartition.extractPartitionValuesInPath("2020/12/20"));
|
||||||
assertEquals(hourPartition.extractPartitionValuesInPath("update_time=2020/12/20/01"), list);
|
assertEquals(hourPartition.extractPartitionValuesInPath("update_time=2020/12/20/01"), list);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void testHiveStylePartition() {
|
||||||
|
HiveStylePartitionValueExtractor hiveStylePartition = new HiveStylePartitionValueExtractor();
|
||||||
|
List<String> list = new ArrayList<>();
|
||||||
|
list.add("2021-04-02");
|
||||||
|
assertEquals(hiveStylePartition.extractPartitionValuesInPath("datestr=2021-04-02"), list);
|
||||||
|
assertThrows(
|
||||||
|
IllegalArgumentException.class,
|
||||||
|
() -> hiveStylePartition.extractPartitionValuesInPath("2021/04/02"));
|
||||||
|
}
|
||||||
}
|
}
|
||||||
Reference in New Issue
Block a user