This is an automated email from the ASF dual-hosted git repository. stigahuang pushed a commit to branch branch-4.4.1 in repository https://gitbox.apache.org/repos/asf/impala.git
commit b02e3c8439a9f0f7a5a886305f47fa720336b29f Author: Fang-Yu Rao <[email protected]> AuthorDate: Mon Aug 5 16:44:16 2024 -0700 IMPALA-13250: [DOCS] Document ENABLED_RUNTIME_FILTER_TYPES query option This patch documents the ENABLED_RUNTIME_FILTER_TYPES query option based on the respective code comments in ImpalaService.thrift and query-options.cc. Change-Id: Ib7a34782bed6f812fedf717d8a076e2706f0bba9 Reviewed-on: http://gerrit.cloudera.org:8080/21645 Tested-by: Impala Public Jenkins <[email protected]> Reviewed-by: Quanlong Huang <[email protected]> --- docs/impala.ditamap | 1 + docs/shared/ImpalaVariables.xml | 1 + docs/shared/impala_common.xml | 19 ++++- .../topics/impala_enabled_runtime_filter_types.xml | 89 ++++++++++++++++++++++ 4 files changed, 109 insertions(+), 1 deletion(-) diff --git a/docs/impala.ditamap b/docs/impala.ditamap index cf4d2e728..4747f9a3d 100644 --- a/docs/impala.ditamap +++ b/docs/impala.ditamap @@ -237,6 +237,7 @@ under the License. <topicref href="topics/impala_request_pool.xml"/> <topicref href="topics/impala_resource_trace_ratio.xml"/> <topicref rev="4.0.0" href="topics/impala_retry_failed_queries.xml"/> + <topicref rev="4.0.0" href="topics/impala_enabled_runtime_filter_types.xml"/> <topicref rev="2.5.0" href="topics/impala_runtime_bloom_filter_size.xml"/> <topicref rev="2.6.0" href="topics/impala_runtime_filter_max_size.xml"/> <topicref rev="2.6.0" href="topics/impala_runtime_filter_min_size.xml"/> diff --git a/docs/shared/ImpalaVariables.xml b/docs/shared/ImpalaVariables.xml index 5caf28907..d7236f06d 100644 --- a/docs/shared/ImpalaVariables.xml +++ b/docs/shared/ImpalaVariables.xml @@ -42,6 +42,7 @@ under the License. The docs included with a distro can refer to the distro release number by editing the values here. 
<ul> + <li><ph id="impala40">Impala 4.0</ph></li> <li><ph id="impala34">Impala 3.4</ph></li> <li><ph id="impala33">Impala 3.3</ph></li> <li><ph id="impala32">Impala 3.2</ph></li> diff --git a/docs/shared/impala_common.xml b/docs/shared/impala_common.xml index 27eca96a7..091f6c85d 100644 --- a/docs/shared/impala_common.xml +++ b/docs/shared/impala_common.xml @@ -1524,7 +1524,20 @@ alter table partitioned_data set tblproperties ('numRows'='1030000', 'STATS_GENE <xref href="https://asciinema.org/a/1rv7qippo0fe7h5k1b6k4nexk" scope="external" format="html">this animated demo</xref>. </p> - + + <p id="comma_separated_values_blurb"> + The Impala backend expects comma-separated values to be in quotes when executing the + <codeph>SET</codeph> statement. + This is usually the case when running a <codeph>SET</codeph> statement like + <codeph>SET ENABLED_RUNTIME_FILTER_TYPES="value1,value2"</codeph> using a JDBC + driver. When using the Impala-shell client, the <codeph>SET</codeph> statement is not + executed immediately; instead, query options are updated in the client and applied as + part of the following statement, so no quotes are required for Impala-shell. That + is, use a <codeph>SET</codeph> statement like + <codeph>SET ENABLED_RUNTIME_FILTER_TYPES=value1,value2</codeph> when + submitting the query to the Impala backend via the Impala-shell client. + </p> + <p rev="2.5.0" id="runtime_filter_mode_blurb"> Because the runtime filtering feature is enabled by default only for local processing, the other filtering-related query options have @@ -3419,6 +3432,10 @@ flight_num: INT32 SNAPPY DO:83456393 FPO:83488603 SZ:10216514/11474301 needed to represent each value. 
</p> + <p rev="4.0.0" id="added_in_400"> + <b>Added in:</b> <keyword keyref="impala40"/> + </p> + <p rev="3.0" id="added_in_30"> <b>Added in:</b> <keyword keyref="impala30_full"/> </p> diff --git a/docs/topics/impala_enabled_runtime_filter_types.xml b/docs/topics/impala_enabled_runtime_filter_types.xml new file mode 100644 index 000000000..8faf6fbf4 --- /dev/null +++ b/docs/topics/impala_enabled_runtime_filter_types.xml @@ -0,0 +1,89 @@ +<?xml version="1.0" encoding="UTF-8"?> +<!-- +Licensed to the Apache Software Foundation (ASF) under one +or more contributor license agreements. See the NOTICE file +distributed with this work for additional information +regarding copyright ownership. The ASF licenses this file +to you under the Apache License, Version 2.0 (the +"License"); you may not use this file except in compliance +with the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, +software distributed under the License is distributed on an +"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +KIND, either express or implied. See the License for the +specific language governing permissions and limitations +under the License. 
+--> +<!DOCTYPE concept PUBLIC "-//OASIS//DTD DITA Concept//EN" "concept.dtd"> +<concept id="enabled_runtime_filter_types" rev="4.0.0"> + + <title>ENABLED_RUNTIME_FILTER_TYPES Query Option (<keyword keyref="impala40"/> or higher only)</title> + <titlealts audience="PDF"><navtitle>ENABLED RUNTIME FILTER TYPES</navtitle></titlealts> + <prolog> + <metadata> + <data name="Category" value="Impala"/> + <data name="Category" value="Impala Query Options"/> + <data name="Category" value="Performance"/> + <data name="Category" value="Developers"/> + <data name="Category" value="Data Analysts"/> + </metadata> + </prolog> + + <conbody> + + <p rev="4.0.0"> + <indexterm audience="hidden">ENABLED_RUNTIME_FILTER_TYPES query option</indexterm> + The <codeph>ENABLED_RUNTIME_FILTER_TYPES</codeph> query option + specifies which runtime filter types can be applied to scanners. + This option only applies to HDFS scan nodes and Kudu scan nodes. + The following types are supported. + Specify the enabled types as a comma-separated list of the following values, + or enable all types with "<codeph>ALL</codeph>". + <ul> + <li> + <codeph>BLOOM</codeph> + </li> + <li> + <codeph>MIN_MAX</codeph> + </li> + <li> + <codeph>IN_LIST</codeph> + </li> + </ul> + </p> + + <p> + <b>Default:</b> <codeph>"BLOOM,MIN_MAX"</codeph> + </p> + <p conref="../shared/impala_common.xml#common/type_string"/> + + <p conref="../shared/impala_common.xml#common/added_in_400"/> + + <p conref="../shared/impala_common.xml#common/usage_notes_blurb"/> + + <p conref="../shared/impala_common.xml#common/comma_separated_values_blurb"/> + + <p> + Depending on the scan node type, the Planner can schedule compatible runtime filter + types as follows. 
+ <ul> + <li>Kudu scan: <codeph>BLOOM</codeph>, <codeph>MIN_MAX</codeph></li> + <li> + HDFS scan on Parquet files: <codeph>BLOOM</codeph>, <codeph>MIN_MAX</codeph> + </li> + <li>HDFS scan on ORC files: <codeph>BLOOM</codeph>, <codeph>IN_LIST</codeph></li> + <li>HDFS scan on other kinds of files: <codeph>BLOOM</codeph></li> + </ul> + </p> + + <p conref="../shared/impala_common.xml#common/related_info"/> + <p> + <xref href="impala_runtime_filtering.xml"/>, + <xref href="impala_runtime_filter_mode.xml#runtime_filter_mode"/> + </p> + + </conbody> +</concept>
