Sergey Shelukhin created HIVE-14931:
---------------------------------------
Summary: Merge + Union + DP + (Mini?)Tez/LLAP fails
Key: HIVE-14931
URL: https://issues.apache.org/jira/browse/HIVE-14931
Project: Hive
Issue Type: Bug
Reporter: Sergey Shelukhin
Running the following on the MiniLlap or MiniTez CLI driver on master:
{noformat}
set hive.mapred.mode=nonstrict;
set hive.exec.dynamic.partition.mode=nonstrict;
set hive.fetch.task.conversion=none;
set tez.grouping.min-size=1;
set tez.grouping.max-size=2;
set hive.tez.auto.reducer.parallelism=false;
set hive.merge.orcfile.stripe.level=true;
set hive.merge.tezfiles=true;
set hive.merge.mapfiles=true;
set hive.merge.mapredfiles=true;
drop table intermediate;
create table intermediate(key int) partitioned by (p int) stored as orc;
insert into table intermediate partition(p='455') select distinct key from src
where key >= 0 order by key desc limit 2;
insert into table intermediate partition(p='456') select distinct key from src
where key is not null order by key asc limit 2;
create table merge_union_dp (id int) partitioned by (key int) stored as orc;
insert into table merge_union_dp partition (key)
select key as k0, key as k1 from intermediate
union all
select key as k0, key as k1 from intermediate;
drop table merge_union_dp;
drop table intermediate;
{noformat}
fails:
{noformat}
2016-10-11T15:41:16,393 ERROR [TezChild] OrcFileMergeOperator: Closing operator..Exception: java.io.IOException: Multiple partitions for one merge mapper: hdfs://localhost:51206/build/ql/test/data/warehouse/merge_union_dp/.hive-staging_hive_2016-10-11_15-41-13_220_2560937429066666042-1/-ext-10002/key=0/1 NOT EQUAL TO hdfs://localhost:51206/build/ql/test/data/warehouse/merge_union_dp/.hive-staging_hive_2016-10-11_15-41-13_220_2560937429066666042-1/-ext-10002/key=0/2
at org.apache.hadoop.hive.ql.exec.AbstractFileMergeOperator.checkPartitionsMatch(AbstractFileMergeOperator.java:180)
at org.apache.hadoop.hive.ql.exec.AbstractFileMergeOperator.fixTmpPath(AbstractFileMergeOperator.java:197)
at org.apache.hadoop.hive.ql.exec.OrcFileMergeOperator.processKeyValuePairs(OrcFileMergeOperator.java:96)
at org.apache.hadoop.hive.ql.exec.OrcFileMergeOperator.process(OrcFileMergeOperator.java:72)
at org.apache.hadoop.hive.ql.exec.tez.MergeFileRecordProcessor.processRow(MergeFileRecordProcessor.java:216)
at org.apache.hadoop.hive.ql.exec.tez.MergeFileRecordProcessor.run(MergeFileRecordProcessor.java:154)
at org.apache.hadoop.hive.ql.exec.tez.TezProcessor.initializeAndRunProcessor(TezProcessor.java:185)
at org.apache.hadoop.hive.ql.exec.tez.MergeFileTezProcessor.run(MergeFileTezProcessor.java:42)
at org.apache.tez.runtime.LogicalIOProcessorRuntimeTask.run(LogicalIOProcessorRuntimeTask.java:370)
at org.apache.tez.runtime.task.TaskRunner2Callable$1.run(TaskRunner2Callable.java:73)
at org.apache.tez.runtime.task.TaskRunner2Callable$1.run(TaskRunner2Callable.java:61)
at java.security.AccessController.doPrivileged(Native Method)
at javax.security.auth.Subject.doAs(Subject.java:422)
at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1657)
at org.apache.tez.runtime.task.TaskRunner2Callable.callInternal(TaskRunner2Callable.java:61)
at org.apache.tez.runtime.task.TaskRunner2Callable.callInternal(TaskRunner2Callable.java:37)
at org.apache.tez.common.CallableWithNdc.call(CallableWithNdc.java:36)
at java.util.concurrent.FutureTask.run(FutureTask.java:266)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)
at java.lang.Thread.run(Thread.java:745)
{noformat}
--
This message was sent by Atlassian JIRA
(v6.3.4#6332)