[ https://issues.apache.org/jira/browse/HIVE-26957?focusedWorklogId=844624&page=com.atlassian.jira.plugin.system.issuetabpanels:worklog-tabpanel#worklog-844624 ]
ASF GitHub Bot logged work on HIVE-26957: ----------------------------------------- Author: ASF GitHub Bot Created on: 09/Feb/23 17:47 Start Date: 09/Feb/23 17:47 Worklog Time Spent: 10m Work Description: TaoZex commented on code in PR #3982: URL: https://github.com/apache/hive/pull/3982#discussion_r1101827061 ########## ql/src/java/org/apache/hadoop/hive/ql/udf/generic/GenericUDFConvertCharset.java: ########## @@ -0,0 +1,126 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.hadoop.hive.ql.udf.generic; + +import java.nio.ByteBuffer; +import java.nio.CharBuffer; +import java.nio.charset.CharacterCodingException; +import java.nio.charset.Charset; +import java.nio.charset.CharsetDecoder; +import java.nio.charset.CharsetEncoder; +import java.nio.charset.CodingErrorAction; + +import org.apache.hadoop.hive.ql.exec.Description; +import org.apache.hadoop.hive.ql.exec.UDFArgumentException; +import org.apache.hadoop.hive.ql.exec.UDFArgumentLengthException; +import org.apache.hadoop.hive.ql.exec.UDFArgumentTypeException; +import org.apache.hadoop.hive.ql.metadata.HiveException; +import org.apache.hadoop.hive.serde2.objectinspector.ConstantObjectInspector; +import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspector; +import org.apache.hadoop.hive.serde2.objectinspector.PrimitiveObjectInspector; +import org.apache.hadoop.hive.serde2.objectinspector.primitive.PrimitiveObjectInspectorFactory; +import org.apache.hadoop.hive.serde2.objectinspector.primitive.PrimitiveObjectInspectorUtils; + +@Description(name = "convertCharset", value = "_FUNC_(str, str, str) - Converts the first argument from the second argument character set to the third argument character set", extended = + "Possible options for the character set are 'US-ASCII', 'ISO-8859-1',\n" + + "'UTF-8', 'UTF-16BE', 'UTF-16LE', and 'UTF-16'. 
If either argument\n" + + "is null, the result will also be null") public class GenericUDFConvertCharset extends GenericUDF { + private transient CharsetEncoder encoder = null; + private transient CharsetDecoder decoder = null; + private transient PrimitiveObjectInspector stringOI = null; + private transient PrimitiveObjectInspector fromCharsetOI = null; + private transient PrimitiveObjectInspector toCharsetOI = null; + + @Override public ObjectInspector initialize(ObjectInspector[] arguments) throws UDFArgumentException { + if (arguments.length != 3) { + throw new UDFArgumentLengthException("ConvertCharset() requires exactly three arguments"); + } + + checkInputArgument(arguments, 0); + stringOI = (PrimitiveObjectInspector) arguments[0]; + + checkInputArgument(arguments, 1); + fromCharsetOI = (PrimitiveObjectInspector) arguments[1]; Review Comment: Thanks for your suggestion. Issue Time Tracking ------------------- Worklog Id: (was: 844624) Time Spent: 4h 10m (was: 4h) > Add convertCharset(s, from, to) function > ---------------------------------------- > > Key: HIVE-26957 > URL: https://issues.apache.org/jira/browse/HIVE-26957 > Project: Hive > Issue Type: New Feature > Reporter: Bingye Chen > Assignee: Bingye Chen > Priority: Major > Labels: pull-request-available > Time Spent: 4h 10m > Remaining Estimate: 0h > > Add convertCharset(s, from, to) function. > The function converts the string `s` from the `from` charset to the `to` > charset. It is already implemented in ClickHouse. -- This message was sent by Atlassian Jira (v8.20.10#820010)