[ 
https://issues.apache.org/jira/browse/HIVE-25404?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
 ]

Zoltan Haindrich updated HIVE-25404:
------------------------------------
    Description: 

{code}
drop table u;drop table t;

create table t(value string default 'def') partitioned by (id integer);
create table u(id integer);
{code}

Right now, a merge statement with an insert clause on the partitioned table t causes an exception like:
{code}
See ./ql/target/tmp/log/hive.log or ./itests/qtest/target/tmp/log/hive.log, or 
check ./ql/target/surefire-reports or ./itests/qtest/target/surefire-reports/ 
for specific test cases logs.
 org.apache.hadoop.hive.ql.parse.SemanticException: Encountered parse error 
while parsing rewritten merge/update or delete query
        at 
org.apache.hadoop.hive.ql.parse.RewriteSemanticAnalyzer.parseRewrittenQuery(RewriteSemanticAnalyzer.java:277)
        at 
org.apache.hadoop.hive.ql.parse.MergeSemanticAnalyzer.analyzeMerge(MergeSemanticAnalyzer.java:272)
        at 
org.apache.hadoop.hive.ql.parse.MergeSemanticAnalyzer.analyze(MergeSemanticAnalyzer.java:63)
        at 
org.apache.hadoop.hive.ql.parse.RewriteSemanticAnalyzer.analyzeInternal(RewriteSemanticAnalyzer.java:72)
        at 
org.apache.hadoop.hive.ql.parse.BaseSemanticAnalyzer.analyze(BaseSemanticAnalyzer.java:317)
        at org.apache.hadoop.hive.ql.Compiler.analyze(Compiler.java:223)
[...]
Caused by: org.apache.hadoop.hive.ql.parse.ParseException: line 6:34 cannot 
recognize input near 'partition' '(' 'id' in select clause
        at 
org.apache.hadoop.hive.ql.parse.ParseDriver.parse(ParseDriver.java:125)
        at org.apache.hadoop.hive.ql.parse.ParseUtils.parse(ParseUtils.java:93)
        at org.apache.hadoop.hive.ql.parse.ParseUtils.parse(ParseUtils.java:85)
        at 
org.apache.hadoop.hive.ql.parse.RewriteSemanticAnalyzer.parseRewrittenQuery(RewriteSemanticAnalyzer.java:275)
{code}

because the query is rewritten to:

#1 when both id and value are specified

rewritten query:
{code}
FROM
  `default`.`t`
  RIGHT OUTER JOIN
  `default`.`u`
  ON `t`.`id`=`u`.`id`
INSERT INTO `default`.`t` (`id`,`value`) partition (`id`)    -- insert clause
  SELECT `u`.`id`,'x'
   WHERE `t`.`id` IS NULL
{code}

#2 when value is not specified

{code}
merge into t using u on t.id=u.id when not matched then insert (id) values 
(u.id);
{code}

rewritten query:
{code}
FROM
  `default`.`t`
  RIGHT OUTER JOIN
  `default`.`u`
  ON `t`.`id`=`u`.`id`
INSERT INTO `default`.`t` (`id`) partition (`id`)    -- insert clause
  SELECT `u`.`id`
   WHERE `t`.`id` IS NULL
{code}



  was:
{code}
drop table u;drop table t;

create table t(value string default 'def') partitioned by (id integer);
create table u(id integer);
{code}

#1 id&value specified
rewritten
{code}
FROM
  `default`.`t`
  RIGHT OUTER JOIN
  `default`.`u`
  ON `t`.`id`=`u`.`id`
INSERT INTO `default`.`t` (`id`,`value`) partition (`id`)    -- insert clause
  SELECT `u`.`id`,'x'
   WHERE `t`.`id` IS NULL
{code}

#2 when values is not specified

{code}
merge into t using u on t.id=u.id when not matched then insert (id) values 
(u.id);
{code}

rewritten query:
{code}
FROM
  `default`.`t`
  RIGHT OUTER JOIN
  `default`.`u`
  ON `t`.`id`=`u`.`id`
INSERT INTO `default`.`t` (`id`) partition (`id`)    -- insert clause
  SELECT `u`.`id`
   WHERE `t`.`id` IS NULL
{code}




> Inserts inside merge statements are rewritten incorrectly for partitioned 
> tables
> --------------------------------------------------------------------------------
>
>                 Key: HIVE-25404
>                 URL: https://issues.apache.org/jira/browse/HIVE-25404
>             Project: Hive
>          Issue Type: Bug
>            Reporter: Zoltan Haindrich
>            Assignee: Zoltan Haindrich
>            Priority: Major
>              Labels: pull-request-available
>          Time Spent: 50m
>  Remaining Estimate: 0h
>
> {code}
> drop table u;drop table t;
> create table t(value string default 'def') partitioned by (id integer);
> create table u(id integer);
> {code}
> Right now, a merge statement with an insert clause on the partitioned table t 
> causes an exception like:
> {code}
> See ./ql/target/tmp/log/hive.log or ./itests/qtest/target/tmp/log/hive.log, 
> or check ./ql/target/surefire-reports or 
> ./itests/qtest/target/surefire-reports/ for specific test cases logs.
>  org.apache.hadoop.hive.ql.parse.SemanticException: Encountered parse error 
> while parsing rewritten merge/update or delete query
>       at 
> org.apache.hadoop.hive.ql.parse.RewriteSemanticAnalyzer.parseRewrittenQuery(RewriteSemanticAnalyzer.java:277)
>       at 
> org.apache.hadoop.hive.ql.parse.MergeSemanticAnalyzer.analyzeMerge(MergeSemanticAnalyzer.java:272)
>       at 
> org.apache.hadoop.hive.ql.parse.MergeSemanticAnalyzer.analyze(MergeSemanticAnalyzer.java:63)
>       at 
> org.apache.hadoop.hive.ql.parse.RewriteSemanticAnalyzer.analyzeInternal(RewriteSemanticAnalyzer.java:72)
>       at 
> org.apache.hadoop.hive.ql.parse.BaseSemanticAnalyzer.analyze(BaseSemanticAnalyzer.java:317)
>       at org.apache.hadoop.hive.ql.Compiler.analyze(Compiler.java:223)
> [...]
> Caused by: org.apache.hadoop.hive.ql.parse.ParseException: line 6:34 cannot 
> recognize input near 'partition' '(' 'id' in select clause
>       at 
> org.apache.hadoop.hive.ql.parse.ParseDriver.parse(ParseDriver.java:125)
>       at org.apache.hadoop.hive.ql.parse.ParseUtils.parse(ParseUtils.java:93)
>       at org.apache.hadoop.hive.ql.parse.ParseUtils.parse(ParseUtils.java:85)
>       at 
> org.apache.hadoop.hive.ql.parse.RewriteSemanticAnalyzer.parseRewrittenQuery(RewriteSemanticAnalyzer.java:275)
> {code}
> because the query is rewritten to:
> #1 when both id and value are specified
> rewritten query:
> {code}
> FROM
>   `default`.`t`
>   RIGHT OUTER JOIN
>   `default`.`u`
>   ON `t`.`id`=`u`.`id`
> INSERT INTO `default`.`t` (`id`,`value`) partition (`id`)    -- insert clause
>   SELECT `u`.`id`,'x'
>    WHERE `t`.`id` IS NULL
> {code}
> #2 when value is not specified
> {code}
> merge into t using u on t.id=u.id when not matched then insert (id) values 
> (u.id);
> {code}
> rewritten query:
> {code}
> FROM
>   `default`.`t`
>   RIGHT OUTER JOIN
>   `default`.`u`
>   ON `t`.`id`=`u`.`id`
> INSERT INTO `default`.`t` (`id`) partition (`id`)    -- insert clause
>   SELECT `u`.`id`
>    WHERE `t`.`id` IS NULL
> {code}



--
This message was sent by Atlassian Jira
(v8.3.4#803005)

Reply via email to