[ https://issues.apache.org/jira/browse/HIVE-25947?focusedWorklogId=727235&page=com.atlassian.jira.plugin.system.issuetabpanels:worklog-tabpanel#worklog-727235 ]
ASF GitHub Bot logged work on HIVE-25947: ----------------------------------------- Author: ASF GitHub Bot Created on: 15/Feb/22 18:33 Start Date: 15/Feb/22 18:33 Worklog Time Spent: 10m Work Description: zabetak commented on a change in pull request #3027: URL: https://github.com/apache/hive/pull/3027#discussion_r806672446 ########## File path: ql/src/java/org/apache/hadoop/hive/ql/txn/compactor/CompactorUtil.java ########## @@ -22,16 +22,29 @@ import org.apache.hadoop.hive.metastore.api.Table; import org.apache.hadoop.hive.metastore.txn.CompactionInfo; +import java.util.ArrayList; +import java.util.Arrays; +import java.util.List; import java.util.concurrent.ExecutorService; import java.util.concurrent.ForkJoinPool; import java.util.concurrent.ForkJoinWorkerThread; +import java.util.function.Function; import static java.lang.String.format; public class CompactorUtil { public static final String COMPACTOR = "compactor"; - static final String COMPACTOR_PREFIX = "compactor."; - static final String MAPRED_QUEUE_NAME = "mapred.job.queue.name"; + /** + * List of accepted properties for defining the compactor's job queue. + * + * The order is important and defines which property has precedence over the other if multiple properties are defined + * at the same time. + */ + private static final List<String> QUEUE_PROPERTIES = Arrays.asList( Review comment: They are MR specific properties so they are not in `HiveConf`. Moreover, I am not sure if we want these to change transparently during a refactoring cause that will probably create backward compatibility problems. What exactly do you have in mind? ########## File path: ql/src/test/org/apache/hadoop/hive/ql/txn/compactor/TestCompactorMRJobQueueConfiguration.java ########## @@ -0,0 +1,262 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. 
The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ +package org.apache.hadoop.hive.ql.txn.compactor; + +import org.apache.hadoop.hive.common.StringableMap; +import org.apache.hadoop.hive.common.ValidReaderWriteIdList; +import org.apache.hadoop.hive.common.ValidWriteIdList; +import org.apache.hadoop.hive.conf.HiveConf; +import org.apache.hadoop.hive.metastore.api.CompactionType; +import org.apache.hadoop.hive.metastore.api.FieldSchema; +import org.apache.hadoop.hive.metastore.api.StorageDescriptor; +import org.apache.hadoop.hive.metastore.api.Table; +import org.apache.hadoop.hive.metastore.txn.CompactionInfo; +import org.apache.hadoop.mapred.JobConf; +import org.junit.jupiter.params.ParameterizedTest; +import org.junit.jupiter.params.provider.MethodSource; + +import java.time.LocalDate; +import java.time.ZoneOffset; +import java.util.ArrayList; +import java.util.Arrays; +import java.util.Collections; +import java.util.HashMap; +import java.util.List; +import java.util.Map; +import java.util.stream.Stream; + +import static org.junit.jupiter.api.Assertions.assertEquals; + +/** + * Tests for {@link CompactorMR#createBaseJobConf(HiveConf, String, Table, StorageDescriptor, ValidWriteIdList, CompactionInfo)}. 
+ */ +public class TestCompactorMRJobQueueConfiguration { + + @ParameterizedTest + @MethodSource("generateBaseJobConfSetup") + void testCreateBaseJobConfHasCorrectJobQueue(ConfSetup input) { + Table tbl = createPersonTable(); + tbl.setParameters(input.tableProperties); + CompactorMR compactor = new CompactorMR(); + CompactionInfo ci = new CompactionInfo(tbl.getDbName(), tbl.getTableName(), null, CompactionType.MAJOR); + ci.properties = new StringableMap(input.compactionProperties).toString(); + HiveConf conf = new HiveConf(); + input.confProperties.forEach(conf::set); + JobConf c = compactor.createBaseJobConf(conf, "test-job", tbl, tbl.getSd(), new ValidReaderWriteIdList(), ci); + assertEquals(input.expectedQueue, c.getQueueName(), "Test failed for the following input:" + input); + } + + private static Stream<ConfSetup> generateBaseJobConfSetup() { + List<ConfSetup> inputs = new ArrayList<>(); + String mrProperty = "mapreduce.job.queuename"; Review comment: This mimics the way users pass properties to the compactor APIs. If the APIs change and don't accept these properties anymore ideally I would like these tests to break. In other words, I don't want these tests to continue working after a refactoring to avoid having backward compatibility problems left unnoticed. WDYT? -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. 
To unsubscribe, e-mail: gitbox-unsubscr...@hive.apache.org For queries about this service, please contact Infrastructure at: us...@infra.apache.org Issue Time Tracking ------------------- Worklog Id: (was: 727235) Time Spent: 1h 20m (was: 1h 10m) > Compactor job queue cannot be set per table via > compactor.mapred.job.queue.name > ------------------------------------------------------------------------------- > > Key: HIVE-25947 > URL: https://issues.apache.org/jira/browse/HIVE-25947 > Project: Hive > Issue Type: Bug > Components: HiveServer2 > Reporter: Stamatis Zampetakis > Assignee: Stamatis Zampetakis > Priority: Major > Labels: pull-request-available > Time Spent: 1h 20m > Remaining Estimate: 0h > > Before HIVE-20723 it was possible to schedule the compaction for each table > on specific job queues by putting {{compactor.mapred.job.queue.name}} in the > table properties. > {code:sql} > CREATE TABLE person (name STRING, age INT) STORED AS ORC TBLPROPERTIES( > 'transactional'='true', > 'compactor.mapred.job.queue.name'='root.user2'); > ALTER TABLE person COMPACT 'major' WITH OVERWRITE > TBLPROPERTIES('compactor.mapred.job.queue.name'='root.user2') > {code} > This is no longer possible (after HIVE-20723) and in order to achieve the > same effect someone needs to use the {{compactor.hive.compactor.job.queue}} > property instead. > {code:sql} > CREATE TABLE person (name STRING, age INT) STORED AS ORC TBLPROPERTIES( > 'transactional'='true', > 'compactor.hive.compactor.job.queue'='root.user2'); > ALTER TABLE person COMPACT 'major' WITH OVERWRITE > TBLPROPERTIES('compactor.hive.compactor.job.queue'='root.user2') > {code} -- This message was sent by Atlassian Jira (v8.20.1#820001)