Sergey Shelukhin created HIVE-14931:
---------------------------------------

             Summary: Merge + Union + DP + (Mini?)Tez/LLAP fails 
                 Key: HIVE-14931
                 URL: https://issues.apache.org/jira/browse/HIVE-14931
             Project: Hive
          Issue Type: Bug
            Reporter: Sergey Shelukhin


Running the following script on the MiniLlap or MiniTez CLI driver on master:
{noformat}
set hive.mapred.mode=nonstrict;
set hive.exec.dynamic.partition.mode=nonstrict;
set hive.fetch.task.conversion=none;
set tez.grouping.min-size=1;
set tez.grouping.max-size=2;
set hive.tez.auto.reducer.parallelism=false;
set hive.merge.orcfile.stripe.level=true;
set hive.merge.tezfiles=true;
set hive.merge.mapfiles=true;
set hive.merge.mapredfiles=true;

drop table intermediate;
create table intermediate(key int) partitioned by (p int) stored as orc;
insert into table intermediate partition(p='455') select distinct key from src 
where key >= 0 order by key desc limit 2;
insert into table intermediate partition(p='456') select distinct key from src 
where key is not null order by key asc limit 2;

create table merge_union_dp (id int) partitioned by (key int) stored as orc;

insert into table merge_union_dp partition (key)
select key as k0, key as k1 from intermediate
union all
select key as k0, key as k1 from intermediate;

drop table merge_union_dp;
drop table intermediate;
{noformat}

fails with the following error:
{noformat}
2016-10-11T15:41:16,393 ERROR [TezChild] OrcFileMergeOperator: Closing operator..Exception: java.io.IOException: Multiple partitions for one merge mapper: 
hdfs://localhost:51206/build/ql/test/data/warehouse/merge_union_dp/.hive-staging_hive_2016-10-11_15-41-13_220_2560937429066666042-1/-ext-10002/key=0/1
 NOT EQUAL TO 
hdfs://localhost:51206/build/ql/test/data/warehouse/merge_union_dp/.hive-staging_hive_2016-10-11_15-41-13_220_2560937429066666042-1/-ext-10002/key=0/2
        at org.apache.hadoop.hive.ql.exec.AbstractFileMergeOperator.checkPartitionsMatch(AbstractFileMergeOperator.java:180)
        at org.apache.hadoop.hive.ql.exec.AbstractFileMergeOperator.fixTmpPath(AbstractFileMergeOperator.java:197)
        at org.apache.hadoop.hive.ql.exec.OrcFileMergeOperator.processKeyValuePairs(OrcFileMergeOperator.java:96)
        at org.apache.hadoop.hive.ql.exec.OrcFileMergeOperator.process(OrcFileMergeOperator.java:72)
        at org.apache.hadoop.hive.ql.exec.tez.MergeFileRecordProcessor.processRow(MergeFileRecordProcessor.java:216)
        at org.apache.hadoop.hive.ql.exec.tez.MergeFileRecordProcessor.run(MergeFileRecordProcessor.java:154)
        at org.apache.hadoop.hive.ql.exec.tez.TezProcessor.initializeAndRunProcessor(TezProcessor.java:185)
        at org.apache.hadoop.hive.ql.exec.tez.MergeFileTezProcessor.run(MergeFileTezProcessor.java:42)
        at org.apache.tez.runtime.LogicalIOProcessorRuntimeTask.run(LogicalIOProcessorRuntimeTask.java:370)
        at org.apache.tez.runtime.task.TaskRunner2Callable$1.run(TaskRunner2Callable.java:73)
        at org.apache.tez.runtime.task.TaskRunner2Callable$1.run(TaskRunner2Callable.java:61)
        at java.security.AccessController.doPrivileged(Native Method)
        at javax.security.auth.Subject.doAs(Subject.java:422)
        at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1657)
        at org.apache.tez.runtime.task.TaskRunner2Callable.callInternal(TaskRunner2Callable.java:61)
        at org.apache.tez.runtime.task.TaskRunner2Callable.callInternal(TaskRunner2Callable.java:37)
        at org.apache.tez.common.CallableWithNdc.call(CallableWithNdc.java:36)
        at java.util.concurrent.FutureTask.run(FutureTask.java:266)
        at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)
        at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)
        at java.lang.Thread.run(Thread.java:745)
{noformat}



--
This message was sent by Atlassian JIRA
(v6.3.4#6332)

Reply via email to