[ https://issues.apache.org/jira/browse/HIVE-22893?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=17045890#comment-17045890 ]
Hive QA commented on HIVE-22893: -------------------------------- Here are the results of testing the latest attachment: https://issues.apache.org/jira/secure/attachment/12994641/HIVE-22893.13.patch {color:green}SUCCESS:{color} +1 due to 1 test(s) being added or modified. {color:red}ERROR:{color} -1 due to 47 failed/errored test(s), 18073 tests executed *Failed tests:* {noformat} org.apache.hadoop.hive.cli.TestCliDriver.testCliDriver[timestamptz_2] (batchId=92) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testAlterPartition (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testAlterTable (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testAlterTableCascade (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testAlterViewParititon (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testColumnStatistics (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testComplexTable (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testComplexTypeApi (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testConcurrentMetastores (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testCreateAndGetTableWithDriver (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testCreateTableSettingId (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testDBLocationChange (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testDBOwner (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testDBOwnerChange (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testDatabase (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testDatabaseLocation (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testDatabaseLocationWithPermissionProblems (batchId=234) 
org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testDropDatabaseCascadeMVMultiDB (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testDropTable (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testFilterLastPartition (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testFilterSinglePartition (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testFunctionWithResources (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testGetConfigValue (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testGetMetastoreUuid (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testGetPartitionsWithSpec (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testGetSchemaWithNoClassDefFoundError (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testGetTableObjects (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testGetUUIDInParallel (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testJDOPersistanceManagerCleanup (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testListPartitionNames (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testListPartitions (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testListPartitionsWihtLimitEnabled (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testNameMethods (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testPartition (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testPartitionFilter (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testRenamePartition (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testRetriableClientWithConnLifetime (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testSimpleFunction (batchId=234) 
org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testSimpleTable (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testSimpleTypeApi (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testStatsFastTrivial (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testSynchronized (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testTableDatabase (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testTableFilter (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testUpdatePartitionStat_doesNotUpdateStats (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testValidateTableCols (batchId=234) org.apache.hadoop.hive.metastore.TestRemoteHiveMetaStore.testVersion (batchId=234) {noformat} Test results: https://builds.apache.org/job/PreCommit-HIVE-Build/20840/testReport Console output: https://builds.apache.org/job/PreCommit-HIVE-Build/20840/console Test logs: http://104.198.109.242/logs/PreCommit-HIVE-Build-20840/ Messages: {noformat} Executing org.apache.hive.ptest.execution.TestCheckPhase Executing org.apache.hive.ptest.execution.PrepPhase Executing org.apache.hive.ptest.execution.YetusPhase Executing org.apache.hive.ptest.execution.ExecutionPhase Executing org.apache.hive.ptest.execution.ReportingPhase Tests exited with: TestsFailedException: 47 tests failed {noformat} This message is automatically generated. 
ATTACHMENT ID: 12994641 - PreCommit-HIVE-Build > Enhance data size estimation for fields computed by UDFs > -------------------------------------------------------- > > Key: HIVE-22893 > URL: https://issues.apache.org/jira/browse/HIVE-22893 > Project: Hive > Issue Type: Improvement > Components: Statistics > Reporter: Zoltan Haindrich > Assignee: Zoltan Haindrich > Priority: Major > Labels: pull-request-available > Attachments: HIVE-22893.01.patch, HIVE-22893.02.patch, > HIVE-22893.03.patch, HIVE-22893.04.patch, HIVE-22893.05.patch, > HIVE-22893.06.patch, HIVE-22893.07.patch, HIVE-22893.08.patch, > HIVE-22893.09.patch, HIVE-22893.10.patch, HIVE-22893.11.patch, > HIVE-22893.12.patch, HIVE-22893.13.patch > > Time Spent: 1h 50m > Remaining Estimate: 0h > > Right now, if we have column statistics on a column, we use them to estimate things > about the column; however, if a UDF is executed on a column, the resulting > column is treated as an unknown and defaults are assumed. > An improvement could be to give wide estimation(s) in the case of frequently used > UDFs. > For example, consider {{substr(c,1,1)}}: no matter what the input is, the > output is a string of length at most 1. -- This message was sent by Atlassian Jira (v8.3.4#803005)