This is an automated email from the ASF dual-hosted git repository. dockerzhang pushed a commit to branch master in repository https://gitbox.apache.org/repos/asf/inlong.git
The following commit(s) were added to refs/heads/master by this push: new bb000828f2 [INLONG-10764][SDK] Transform SQL support temporal functions(Including year, quarter, month, week, dayofyear and dayofmonth) (#10766) bb000828f2 is described below commit bb000828f2dd7c106d5e17331d13ca17c6025566 Author: yfsn666 <61183968+yfsn...@users.noreply.github.com> AuthorDate: Sun Aug 11 15:46:06 2024 +0800 [INLONG-10764][SDK] Transform SQL support temporal functions(Including year, quarter, month, week, dayofyear and dayofmonth) (#10766) --- .../process/function/DateExtractFunction.java | 89 ++++++++++++++++++++++ .../transform/process/operator/OperatorTools.java | 21 +++++ .../sdk/transform/process/parser/DateParser.java | 43 +++++++++++ .../TestTransformTemporalFunctionsProcessor.java | 65 +++++++++++++++- 4 files changed, 217 insertions(+), 1 deletion(-) diff --git a/inlong-sdk/transform-sdk/src/main/java/org/apache/inlong/sdk/transform/process/function/DateExtractFunction.java b/inlong-sdk/transform-sdk/src/main/java/org/apache/inlong/sdk/transform/process/function/DateExtractFunction.java new file mode 100644 index 0000000000..47061c4dcf --- /dev/null +++ b/inlong-sdk/transform-sdk/src/main/java/org/apache/inlong/sdk/transform/process/function/DateExtractFunction.java @@ -0,0 +1,89 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.inlong.sdk.transform.process.function; + +import org.apache.inlong.sdk.transform.decode.SourceData; +import org.apache.inlong.sdk.transform.process.Context; +import org.apache.inlong.sdk.transform.process.operator.OperatorTools; +import org.apache.inlong.sdk.transform.process.parser.ValueParser; + +import net.sf.jsqlparser.expression.Expression; +import net.sf.jsqlparser.expression.Function; + +import java.sql.Date; +import java.time.LocalDate; +import java.time.temporal.TemporalField; +import java.time.temporal.WeekFields; +import java.util.List; +import java.util.Locale; + +/** + * DateExtractFunction + * description: + * - year(date)--returns the year from SQL date date + * - quarter(date)--returns the quarter of a year (an integer between 1 and 4) from SQL date date + * - month(date)--returns the month of a year (an integer between 1 and 12) from SQL date date + * - week(date)--returns the week of a year (an integer between 1 and 53) from SQL date date + * - dayofyear(date)--returns the day of a year (an integer between 1 and 366) from SQL date date + * - dayofmonth(date)--returns the day of a month (an integer between 1 and 31) from SQL date date + */ +public class DateExtractFunction implements ValueParser { + + private DateExtractFunctionType type; + private ValueParser dateParser; + private static final TemporalField weekOfYearField = WeekFields.of(Locale.getDefault()).weekOfWeekBasedYear(); + + public enum DateExtractFunctionType { + YEAR, QUARTER, MONTH, WEEK, DAY_OF_YEAR, DAY_OF_MONTH + } + + public DateExtractFunction(DateExtractFunctionType type, Function expr) { + this.type = type; + List<Expression> expressions = expr.getParameters().getExpressions(); + dateParser = OperatorTools.buildParser(expressions.get(0)); + } + + @Override + public Object parse(SourceData sourceData, int rowIndex, Context context) { + Object dateObj = dateParser.parse(sourceData, rowIndex, context); + Date date = OperatorTools.parseDate(dateObj); + LocalDate localDate = date.toLocalDate(); + switch (type) { + // year + case YEAR: + return localDate.getYear(); + // quarter(between 1 and 4) + case QUARTER: + return (localDate.getMonthValue() - 1) / 3 + 1; + // month(between 1 and 12) + case MONTH: + return localDate.getMonthValue(); + // week(between 1 and 53) + case WEEK: + return localDate.get(weekOfYearField); + // dayofyear(between 1 and 366) + case DAY_OF_YEAR: + return localDate.getDayOfYear(); + // dayofmonth(between 1 and 31) + case DAY_OF_MONTH: + return localDate.getDayOfMonth(); + default: + return null; + } + } +} diff --git a/inlong-sdk/transform-sdk/src/main/java/org/apache/inlong/sdk/transform/process/operator/OperatorTools.java b/inlong-sdk/transform-sdk/src/main/java/org/apache/inlong/sdk/transform/process/operator/OperatorTools.java index dbfa4b93c8..b1c950720e 100644 --- a/inlong-sdk/transform-sdk/src/main/java/org/apache/inlong/sdk/transform/process/operator/OperatorTools.java +++ b/inlong-sdk/transform-sdk/src/main/java/org/apache/inlong/sdk/transform/process/operator/OperatorTools.java @@ -20,6 +20,8 @@ package org.apache.inlong.sdk.transform.process.operator; import org.apache.inlong.sdk.transform.process.function.AbsFunction; import org.apache.inlong.sdk.transform.process.function.CeilFunction; import org.apache.inlong.sdk.transform.process.function.ConcatFunction; +import org.apache.inlong.sdk.transform.process.function.DateExtractFunction; +import org.apache.inlong.sdk.transform.process.function.DateExtractFunction.DateExtractFunctionType; import org.apache.inlong.sdk.transform.process.function.DateFormatFunction; import org.apache.inlong.sdk.transform.process.function.ExpFunction; import org.apache.inlong.sdk.transform.process.function.FloorFunction; @@ -37,6 +39,7 @@ import org.apache.inlong.sdk.transform.process.function.SubstringFunction; import org.apache.inlong.sdk.transform.process.function.ToDateFunction; import org.apache.inlong.sdk.transform.process.parser.AdditionParser; import org.apache.inlong.sdk.transform.process.parser.ColumnParser; +import org.apache.inlong.sdk.transform.process.parser.DateParser; import org.apache.inlong.sdk.transform.process.parser.DivisionParser; import org.apache.inlong.sdk.transform.process.parser.LongParser; import org.apache.inlong.sdk.transform.process.parser.MultiplicationParser; @@ -45,6 +48,7 @@ import org.apache.inlong.sdk.transform.process.parser.StringParser; import org.apache.inlong.sdk.transform.process.parser.SubtractionParser; import org.apache.inlong.sdk.transform.process.parser.ValueParser; +import net.sf.jsqlparser.expression.DateValue; import net.sf.jsqlparser.expression.Expression; import net.sf.jsqlparser.expression.Function; import net.sf.jsqlparser.expression.LongValue; @@ -67,6 +71,7 @@ import net.sf.jsqlparser.schema.Column; import org.apache.commons.lang.ObjectUtils; import java.math.BigDecimal; +import java.sql.Date; import java.util.HashMap; import java.util.Map; @@ -101,6 +106,12 @@ public class OperatorTools { functionMap.put("floor", FloorFunction::new); functionMap.put("sin", SinFunction::new); functionMap.put("sinh", SinhFunction::new); + functionMap.put("year", func -> new DateExtractFunction(DateExtractFunctionType.YEAR, func)); + functionMap.put("quarter", func -> new DateExtractFunction(DateExtractFunctionType.QUARTER, func)); + functionMap.put("month", func -> new DateExtractFunction(DateExtractFunctionType.MONTH, func)); + functionMap.put("week", func -> new DateExtractFunction(DateExtractFunctionType.WEEK, func)); + functionMap.put("dayofyear", func -> new DateExtractFunction(DateExtractFunctionType.DAY_OF_YEAR, func)); + functionMap.put("dayofmonth", func -> new DateExtractFunction(DateExtractFunctionType.DAY_OF_MONTH, func)); } public static ExpressionOperator buildOperator(Expression expr) { @@ -145,6 +156,8 @@ public class OperatorTools { return new MultiplicationParser((Multiplication) expr); } else if (expr instanceof Division) { return new DivisionParser((Division) expr); + } else if (expr instanceof DateValue) { + return new DateParser((DateValue) expr); } else if (expr instanceof Function) { String exprString = expr.toString(); if (exprString.startsWith(ROOT_KEY) || exprString.startsWith(CHILD_KEY)) { @@ -181,6 +194,14 @@ public class OperatorTools { return value.toString(); } + public static Date parseDate(Object value) { + if (value instanceof Date) { + return (Date) value; + } else { + return Date.valueOf(String.valueOf(value)); + } + } + /** * compareValue * @param left diff --git a/inlong-sdk/transform-sdk/src/main/java/org/apache/inlong/sdk/transform/process/parser/DateParser.java b/inlong-sdk/transform-sdk/src/main/java/org/apache/inlong/sdk/transform/process/parser/DateParser.java new file mode 100644 index 0000000000..0f0da4345d --- /dev/null +++ b/inlong-sdk/transform-sdk/src/main/java/org/apache/inlong/sdk/transform/process/parser/DateParser.java @@ -0,0 +1,43 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.inlong.sdk.transform.process.parser; + +import org.apache.inlong.sdk.transform.decode.SourceData; +import org.apache.inlong.sdk.transform.process.Context; + +import net.sf.jsqlparser.expression.DateValue; + +import java.sql.Date; + +/** + * DateParser + * description: parse the sql expression to a java.sql.Date object + */ +public class DateParser implements ValueParser { + + private final Date dateValue; + + public DateParser(DateValue expr) { + this.dateValue = Date.valueOf(expr.getValue().toLocalDate()); + } + + @Override + public Object parse(SourceData sourceData, int rowIndex, Context context) { + return dateValue; + } +} diff --git a/inlong-sdk/transform-sdk/src/test/java/org/apache/inlong/sdk/transform/process/TestTransformTemporalFunctionsProcessor.java b/inlong-sdk/transform-sdk/src/test/java/org/apache/inlong/sdk/transform/process/TestTransformTemporalFunctionsProcessor.java index 25675b25f3..0e847160f3 100644 --- a/inlong-sdk/transform-sdk/src/test/java/org/apache/inlong/sdk/transform/process/TestTransformTemporalFunctionsProcessor.java +++ b/inlong-sdk/transform-sdk/src/test/java/org/apache/inlong/sdk/transform/process/TestTransformTemporalFunctionsProcessor.java @@ -115,9 +115,72 @@ public class TestTransformTemporalFunctionsProcessor { List<String> output3 = processor1.transform("yyyyMMddHHmmss|apple|cloud|1722524216|1|3", new HashMap<>()); Assert.assertEquals(1, output3.size()); Assert.assertEquals(output3.get(0), "result=20240801225656"); - // case1: date_format(1722524216, 'yyyy/MM/dd HH:mm:ss') + // case4: date_format(1722524216, 'yyyy/MM/dd HH:mm:ss') List<String> output4 = processor1.transform("yyyy/MM/dd HH:mm:ss|apple|cloud|1722524216|1|3", new HashMap<>()); Assert.assertEquals(1, output4.size()); Assert.assertEquals(output4.get(0), "result=2024/08/01 22:56:56"); } + + @Test + public void testDateExtractFunction() throws Exception { + String transformSql1 = "select year(string1) from source"; + TransformConfig config1 = new TransformConfig(transformSql1); + TransformProcessor<String, String> processor1 = TransformProcessor + .create(config1, SourceDecoderFactory.createCsvDecoder(csvSource), + SinkEncoderFactory.createKvEncoder(kvSink)); + // case1: year(2024-08-08) + List<String> output1 = processor1.transform("2024-08-08", new HashMap<>()); + Assert.assertEquals(1, output1.size()); + Assert.assertEquals(output1.get(0), "result=2024"); + + String transformSql2 = "select quarter(string1) from source"; + TransformConfig config2 = new TransformConfig(transformSql2); + TransformProcessor<String, String> processor2 = TransformProcessor + .create(config2, SourceDecoderFactory.createCsvDecoder(csvSource), + SinkEncoderFactory.createKvEncoder(kvSink)); + // case2: quarter(2024-08-08) + List<String> output2 = processor2.transform("2024-08-08", new HashMap<>()); + Assert.assertEquals(1, output2.size()); + Assert.assertEquals(output2.get(0), "result=3"); + + String transformSql3 = "select month(string1) from source"; + TransformConfig config3 = new TransformConfig(transformSql3); + TransformProcessor<String, String> processor3 = TransformProcessor + .create(config3, SourceDecoderFactory.createCsvDecoder(csvSource), + SinkEncoderFactory.createKvEncoder(kvSink)); + // case3: month(2024-08-08) + List<String> output3 = processor3.transform("2024-08-08", new HashMap<>()); + Assert.assertEquals(1, output3.size()); + Assert.assertEquals(output3.get(0), "result=8"); + + String transformSql4 = "select week(string1) from source"; + TransformConfig config4 = new TransformConfig(transformSql4); + TransformProcessor<String, String> processor4 = TransformProcessor + .create(config4, SourceDecoderFactory.createCsvDecoder(csvSource), + SinkEncoderFactory.createKvEncoder(kvSink)); + // case4: week(2024-02-29) + List<String> output4 = processor4.transform("2024-02-29", new HashMap<>()); + Assert.assertEquals(1, output4.size()); + Assert.assertEquals(output4.get(0), "result=9"); + + String transformSql5 = "select dayofyear(string1) from source"; + TransformConfig config5 = new TransformConfig(transformSql5); + TransformProcessor<String, String> processor5 = TransformProcessor + .create(config5, SourceDecoderFactory.createCsvDecoder(csvSource), + SinkEncoderFactory.createKvEncoder(kvSink)); + // case5: dayofyear(2024-02-29) + List<String> output5 = processor5.transform("2024-02-29", new HashMap<>()); + Assert.assertEquals(1, output5.size()); + Assert.assertEquals(output5.get(0), "result=60"); + + String transformSql6 = "select dayofmonth(string1) from source"; + TransformConfig config6 = new TransformConfig(transformSql6); + TransformProcessor<String, String> processor6 = TransformProcessor + .create(config6, SourceDecoderFactory.createCsvDecoder(csvSource), + SinkEncoderFactory.createKvEncoder(kvSink)); + // case6: dayofmonth(2024-02-29) + List<String> output6 = processor6.transform("2024-02-29", new HashMap<>()); + Assert.assertEquals(1, output6.size()); + Assert.assertEquals(output6.get(0), "result=29"); + } }