maksaska commented on code in PR #311:
URL: https://github.com/apache/ignite-extensions/pull/311#discussion_r2247303016


##########
modules/cdc-ext/src/main/java/org/apache/ignite/cdc/postgresql/IgniteToPostgreSqlCdcApplier.java:
##########
@@ -0,0 +1,670 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *      http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.ignite.cdc.postgresql;
+
+import java.math.BigDecimal;
+import java.nio.ByteBuffer;
+import java.nio.ByteOrder;
+import java.sql.Connection;
+import java.sql.PreparedStatement;
+import java.sql.SQLException;
+import java.sql.Statement;
+import java.sql.Types;
+import java.util.Collections;
+import java.util.HashMap;
+import java.util.HashSet;
+import java.util.Iterator;
+import java.util.Map;
+import java.util.Set;
+import java.util.UUID;
+import javax.sql.DataSource;
+import org.apache.ignite.IgniteException;
+import org.apache.ignite.IgniteLogger;
+import org.apache.ignite.binary.BinaryObject;
+import org.apache.ignite.cache.CacheEntryVersion;
+import org.apache.ignite.cache.QueryEntity;
+import org.apache.ignite.cdc.CdcCacheEvent;
+import org.apache.ignite.cdc.CdcEvent;
+import org.apache.ignite.internal.util.typedef.F;
+
+import static 
org.apache.ignite.internal.processors.cache.GridCacheUtils.UNDEFINED_CACHE_ID;
+
+/** */
+public class IgniteToPostgreSqlCdcApplier {
+    /** */
+    public static final String DFLT_SQL_TYPE = "OTHER";
+
+    /** */
+    public static final Map<String, String> JAVA_TO_SQL_TYPES;
+
+    /** */
+    public static final Set<String> SQL_TYPES_WITH_PRECISION_ONLY;
+
+    /** */
+    public static final Set<String> SQL_TYPES_WITH_PRECISION_AND_SCALE;
+
+    static {
+        // Pairs of {Java type name, SQL column type name}; primitives and their wrappers share one SQL type.
+        String[][] typePairs = {
+            {"java.lang.String", "VARCHAR"},
+            {"java.lang.Integer", "INT"},
+            {"int", "INT"},
+            {"java.lang.Long", "BIGINT"},
+            {"long", "BIGINT"},
+            {"java.lang.Boolean", "BOOLEAN"},
+            {"boolean", "BOOLEAN"},
+            {"java.lang.Double", "DOUBLE PRECISION"},
+            {"double", "DOUBLE PRECISION"},
+            {"java.lang.Float", "REAL"},
+            {"float", "REAL"},
+            {"java.math.BigDecimal", "DECIMAL"},
+            {"java.lang.Short", "SMALLINT"},
+            {"short", "SMALLINT"},
+            {"java.lang.Byte", "SMALLINT"},
+            {"byte", "SMALLINT"},
+            {"java.util.UUID", "UUID"},
+            {"[B", "BYTEA"},
+            {"java.lang.Object", "OTHER"}
+        };
+
+        Map<String, String> typeMapping = new HashMap<>();
+
+        for (String[] pair : typePairs)
+            typeMapping.put(pair[0], pair[1]);
+
+        JAVA_TO_SQL_TYPES = Collections.unmodifiableMap(typeMapping);
+
+        // SQL types listed as taking a precision only.
+        Set<String> precisionOnly = new HashSet<>();
+
+        Collections.addAll(precisionOnly, "VARCHAR", "DOUBLE PRECISION");
+
+        SQL_TYPES_WITH_PRECISION_ONLY = Collections.unmodifiableSet(precisionOnly);
+
+        // SQL types listed as taking both a precision and a scale.
+        Set<String> precisionAndScale = new HashSet<>();
+
+        Collections.addAll(precisionAndScale, "DECIMAL", "REAL");
+
+        SQL_TYPES_WITH_PRECISION_AND_SCALE = Collections.unmodifiableSet(precisionAndScale);
+    }
+
+    /** */
+    private static final boolean DFLT_AUTO_COMMIT = false;
+
+    /** */
+    private final DataSource dataSrc;
+
+    /** */
+    private final long batchSize;
+
+    /** */
+    private final IgniteLogger log;
+
+    /** */
+    private final Map<Integer, String> cacheIdToUpsertQry = new HashMap<>();
+
+    /** */
+    private final Map<Integer, String> cacheIdToDeleteQry = new HashMap<>();
+
+    /** */
+    private final Map<Integer, Set<String>> cacheIdToPrimaryKeys = new 
HashMap<>();
+
+    /** */
+    private final Map<Integer, Set<String>> cacheIdToFields = new HashMap<>();
+
+    /** */
+    private final Set<Object> curKeys = new HashSet<>();
+
+    /**
+     * Creates an applier that writes CDC events through connections obtained from the given data source.
+     *
+     * @param dataSrc {@link DataSource} that supplies connections to PostgreSql.
+     * @param batchSize Number of CDC events to accumulate before the pending batch is executed.
+     * @param log {@link IgniteLogger} used to report CDC processing events and failures.
+     */
+    public IgniteToPostgreSqlCdcApplier(DataSource dataSrc, long batchSize, IgniteLogger log) {
+        this.log = log;
+        this.batchSize = batchSize;
+        this.dataSrc = dataSrc;
+    }
+
+    /**
+     * @param evts an {@link Iterator} of {@link CdcEvent} objects to be 
applied
+     * @return the total number of events successfully batched and executed
+     */
+    public long applyEvents(Iterator<CdcEvent> evts) {
+        try (Connection conn = dataSrc.getConnection()) {
+            conn.setAutoCommit(DFLT_AUTO_COMMIT);
+
+            long res = applyEvents(conn, evts);
+
+            conn.commit();
+
+            return res;
+        }
+        catch (Throwable e) {
+            log.error(e.getMessage(), e);
+
+            throw new IgniteException("CDC failure", e);
+        }
+    }
+
+    /**
+     * Groups consecutive events with the same cache and the same operation kind (upsert or delete) into
+     * JDBC batches and executes them. A pending batch is executed when:
+     * <ul>
+     *     <li>the cache or the operation kind changes (a new statement is prepared);</li>
+     *     <li>the number of pending keys reaches {@code batchSize};</li>
+     *     <li>the next event has a key that is already pending in the current batch;</li>
+     *     <li>the iterator is exhausted and keys are still pending.</li>
+     * </ul>
+     * Every statement prepared here is closed before the method returns, and the pending key set is
+     * always reset, so a failed run leaves no stale state for the next invocation.
+     *
+     * @param conn connection to PostgreSql
+     * @param evts an {@link Iterator} of {@link CdcEvent} objects to be applied
+     * @return the total number of events successfully batched and executed
+     * @throws SQLException if a replaced statement cannot be closed
+     */
+    private long applyEvents(Connection conn, Iterator<CdcEvent> evts) throws SQLException {
+        long evtsApplied = 0;
+
+        int currCacheId = UNDEFINED_CACHE_ID;
+        boolean prevOpIsDelete = false;
+
+        PreparedStatement curPrepStmt = null;
+
+        try {
+            while (evts.hasNext()) {
+                CdcEvent evt = evts.next();
+
+                if (log.isDebugEnabled())
+                    log.debug("Event received [evt=" + evt + ']');
+
+                boolean opIsDelete = evt.value() == null;
+
+                // The null check guarantees a statement exists even if the very first event happens to
+                // match the initial (undefined cache id, upsert) state.
+                if (curPrepStmt == null || currCacheId != evt.cacheId() || prevOpIsDelete != opIsDelete) {
+                    if (curPrepStmt != null) {
+                        evtsApplied += executeBatch(conn, curPrepStmt);
+
+                        // The replaced statement has been executed and committed; release it.
+                        curPrepStmt.close();
+
+                        curPrepStmt = null;
+                    }
+
+                    currCacheId = evt.cacheId();
+                    prevOpIsDelete = opIsDelete;
+
+                    curPrepStmt = prepareStatement(conn, evt);
+                }
+
+                // Flush first when the batch is full or the key is already pending in this batch.
+                if (curKeys.size() >= batchSize || curKeys.contains(evt.key()))
+                    evtsApplied += executeBatch(conn, curPrepStmt);
+
+                addEvent(curPrepStmt, evt);
+            }
+
+            if (curPrepStmt != null && !curKeys.isEmpty())
+                evtsApplied += executeBatch(conn, curPrepStmt);
+
+            return evtsApplied;
+        }
+        finally {
+            // Pending keys belong to this run only; after a failure they must not leak into the next call.
+            curKeys.clear();
+
+            if (curPrepStmt != null) {
+                try {
+                    curPrepStmt.close();
+                }
+                catch (SQLException e) {
+                    // Do not mask the primary outcome of the run with a cleanup failure.
+                    log.warning("Failed to close prepared statement", e);
+                }
+            }
+        }
+    }
+
+    /**
+     * Executes the batch accumulated in the given statement and commits the connection.
+     * The set of pending keys is reset before the batch is sent.
+     *
+     * @param conn connection to PostgreSql
+     * @param curPrepStmt {@link PreparedStatement} holding the pending batch
+     * @return the number of batch entries executed (one entry is added per CdcEvent)
+     */
+    private int executeBatch(Connection conn, PreparedStatement curPrepStmt) {
+        try {
+            curKeys.clear();
+
+            if (log.isDebugEnabled())
+                log.debug("Applying batch " + curPrepStmt.toString());
+
+            if (curPrepStmt.isClosed())
+                throw new IgniteException("Tried to execute on closed prepared statement!");
+
+            int[] updateCnts = curPrepStmt.executeBatch();
+
+            // The applier works with autoCommit = false, so the executed batch is committed manually here
+            // for improved performance and clearer transaction boundaries.
+            conn.commit();
+
+            return updateCnts.length;
+        }
+        catch (SQLException e) {
+            log.error(e.getMessage(), e);
+
+            throw new IgniteException(e);
+        }
+    }
+
+    /**
+     * Prepares the statement matching the event: the delete query of the event's cache when the event
+     * carries no value, the upsert query otherwise.
+     *
+     * @param conn connection to PostgreSql
+     * @param evt {@link CdcEvent}
+     * @return relevant {@link PreparedStatement}
+     */
+    private PreparedStatement prepareStatement(Connection conn, CdcEvent evt) {
+        Map<Integer, String> qryByCacheId = evt.value() == null ? cacheIdToDeleteQry : cacheIdToUpsertQry;
+
+        int cacheId = evt.cacheId();
+
+        String sqlQry = qryByCacheId.get(cacheId);
+
+        if (sqlQry == null)
+            throw new IgniteException("No SQL query is found for cacheId=" + cacheId);
+
+        if (log.isDebugEnabled())
+            log.debug("Statement updated [cacheId=" + cacheId + ", sqlQry=" + sqlQry + ']');
+
+        try {
+            return conn.prepareStatement(sqlQry);
+        }
+        catch (SQLException e) {
+            log.error(e.getMessage(), e);
+
+            throw new IgniteException(e);
+        }
+    }
+
+    /**
+     * Binds the event to the statement and adds it to the pending batch. For a delete (no value) only
+     * the primary key fields are bound; otherwise every registered field is bound in iteration order,
+     * followed by the encoded entry version as the last parameter. The event key is remembered as pending.
+     *
+     * @param curPrepStmt current {@link PreparedStatement}
+     * @param evt {@link CdcEvent}
+     */
+    private void addEvent(PreparedStatement curPrepStmt, CdcEvent evt) {
+        try {
+            boolean isDelete = evt.value() == null;
+
+            Set<String> pkFields = cacheIdToPrimaryKeys.get(evt.cacheId());
+            Set<String> boundFields = isDelete ? pkFields : cacheIdToFields.get(evt.cacheId());
+
+            // Binary objects are read field by field; any other key/value is bound as a whole.
+            BinaryObject binKey = null;
+            BinaryObject binVal = null;
+
+            if (evt.key() instanceof BinaryObject)
+                binKey = (BinaryObject)evt.key();
+
+            if (evt.value() instanceof BinaryObject)
+                binVal = (BinaryObject)evt.value();
+
+            // JDBC parameters are 1-based; the counter holds the index of the last bound parameter.
+            int paramIdx = 0;
+
+            for (String fieldName : boundFields) {
+                Object fieldVal;
+
+                if (pkFields.contains(fieldName))
+                    fieldVal = binKey == null ? evt.key() : binKey.field(fieldName);
+                else
+                    fieldVal = binVal == null ? evt.value() : binVal.field(fieldName);
+
+                addObject(curPrepStmt, ++paramIdx, fieldVal);
+            }
+
+            if (!isDelete)
+                curPrepStmt.setBytes(paramIdx + 1, encodeVersion(evt.version()));
+
+            curKeys.add(evt.key());
+
+            curPrepStmt.addBatch();
+        }
+        catch (Throwable e) {
+            log.error(e.getMessage(), e);
+
+            throw new IgniteException(e);
+        }
+    }
+
+    /**
+     * Binds a value to the statement parameter, choosing the typed setter by the runtime class of the
+     * value. Values of any other class, as well as {@code null}, are passed to
+     * {@link PreparedStatement#setObject(int, Object)}.
+     *
+     * @param curPrepStmt {@link PreparedStatement}
+     * @param idx value index in {@link PreparedStatement}
+     * @param obj value
+     * @throws SQLException if the driver rejects the value
+     */
+    private void addObject(PreparedStatement curPrepStmt, int idx, Object obj) throws SQLException {
+        // Integral types.
+        if (obj instanceof Byte)
+            curPrepStmt.setByte(idx, (Byte)obj);
+        else if (obj instanceof Short)
+            curPrepStmt.setShort(idx, (Short)obj);
+        else if (obj instanceof Integer)
+            curPrepStmt.setInt(idx, (Integer)obj);
+        else if (obj instanceof Long)
+            curPrepStmt.setLong(idx, (Long)obj);
+        // Floating point and decimal types.
+        else if (obj instanceof Float)
+            curPrepStmt.setFloat(idx, (Float)obj);
+        else if (obj instanceof Double)
+            curPrepStmt.setDouble(idx, (Double)obj);
+        else if (obj instanceof BigDecimal)
+            curPrepStmt.setBigDecimal(idx, (BigDecimal)obj);
+        // Remaining explicitly supported types.
+        else if (obj instanceof Boolean)
+            curPrepStmt.setBoolean(idx, (Boolean)obj);
+        else if (obj instanceof String)
+            curPrepStmt.setString(idx, (String)obj);
+        else if (obj instanceof byte[])
+            curPrepStmt.setBytes(idx, (byte[])obj);
+        else if (obj instanceof UUID)
+            curPrepStmt.setObject(idx, obj, Types.OTHER); // PostgreSQL expects UUID as OTHER
+        else {
+            // A null value matches none of the checks above and is bound here as setObject(idx, null).
+            curPrepStmt.setObject(idx, obj);
+        }
+    }
+
+    /**
+     * @param evts an {@link Iterator} of {@link CdcCacheEvent} objects to 
apply
+     * @param createTables tables creation flag. If true - attempt to create 
tables will be made.
+     * @return Number of applied events.
+     */
+    public long applyCacheEvents(Iterator<CdcCacheEvent> evts, boolean 
createTables) {
+        CdcCacheEvent evt;
+        QueryEntity entity;
+
+        long cnt = 0;
+
+        while (evts.hasNext()) {
+            evt = evts.next();
+
+            if (evt.queryEntities().size() != 1)
+                throw new IgniteException("There should be exactly 1 
QueryEntity for cacheId: " + evt.cacheId());
+
+            entity = evt.queryEntities().iterator().next();
+
+            if (createTables)
+                createTableIfNotExists(entity);
+
+            cacheIdToUpsertQry.put(evt.cacheId(), getUpsertSqlQry(entity));
+
+            cacheIdToDeleteQry.put(evt.cacheId(), getDeleteSqlQry(entity));
+
+            cacheIdToPrimaryKeys.put(evt.cacheId(), getPrimaryKeys(entity));
+
+            cacheIdToFields.put(evt.cacheId(), entity.getFields().keySet());
+
+            if (log.isInfoEnabled())
+                log.info("Cache table created [tableName=" + 
entity.getTableName() +

Review Comment:
   Done!



-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: notifications-unsubscr...@ignite.apache.org

For queries about this service, please contact Infrastructure at:
us...@infra.apache.org

Reply via email to