/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package gobblin.writer.commands;
import java.sql.Connection;
import java.sql.PreparedStatement;
import java.sql.SQLException;
import java.util.List;
import java.util.concurrent.Callable;
import java.util.concurrent.TimeUnit;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import com.github.rholder.retry.Retryer;
import com.github.rholder.retry.RetryerBuilder;
import com.github.rholder.retry.StopStrategies;
import com.github.rholder.retry.WaitStrategies;
import com.google.common.base.Joiner;
import com.google.common.collect.Lists;
import gobblin.configuration.State;
import gobblin.converter.jdbc.JdbcEntryData;
import gobblin.converter.jdbc.JdbcEntryDatum;
import lombok.ToString;
/**
* Base implementation of JdbcBufferedInserter.
* Concrete DB specific implementations are expected to subclass this class.
*
*/
@ToString
public abstract class BaseJdbcBufferedInserter implements JdbcBufferedInserter {
private static final Logger LOG = LoggerFactory.getLogger(BaseJdbcBufferedInserter.class);
protected static final String INSERT_STATEMENT_PREFIX_FORMAT = "INSERT INTO %s.%s (%s) VALUES ";
protected static final Joiner JOINER_ON_COMMA = Joiner.on(',');
protected final Connection conn;
// Rows that are inserted at once in one batch cycle
protected final List<JdbcEntryData> pendingInserts = Lists.newArrayList();
protected final List<String> columnNames = Lists.newArrayList();
protected int batchSize;
protected String insertStmtPrefix;
protected PreparedStatement insertPstmtForFixedBatch;
private final Retryer<Boolean> retryer;
public BaseJdbcBufferedInserter(State state, Connection conn) {
this.conn = conn;
this.batchSize = state.getPropAsInt(WRITER_JDBC_INSERT_BATCH_SIZE, DEFAULT_WRITER_JDBC_INSERT_BATCH_SIZE);
if (this.batchSize < 1) {
throw new IllegalArgumentException(WRITER_JDBC_INSERT_BATCH_SIZE + " should be a positive number");
}
int maxWait = state.getPropAsInt(WRITER_JDBC_INSERT_RETRY_TIMEOUT, DEFAULT_WRITER_JDBC_INSERT_RETRY_TIMEOUT);
int maxAttempts =
state.getPropAsInt(WRITER_JDBC_INSERT_RETRY_MAX_ATTEMPT, DEFAULT_WRITER_JDBC_INSERT_RETRY_MAX_ATTEMPT);
//retry after 2, 4, 8, 16... sec, allow at most maxWait sec delay
this.retryer = RetryerBuilder.<Boolean> newBuilder().retryIfException()
.withWaitStrategy(WaitStrategies.exponentialWait(1000, maxWait, TimeUnit.SECONDS))
.withStopStrategy(StopStrategies.stopAfterAttempt(maxAttempts)).build();
}
/**
* Adds all the records from {@link #pendingInserts} to the PreparedStatement and executes the
* batch insert.
*
* @param pstmt PreparedStatement object
* @return true if the insert was successful
*/
protected abstract boolean insertBatch(final PreparedStatement pstmt) throws SQLException;
/**
* Constructs the SQL insert statement for the batch inserts, using the {@link #INSERT_STATEMENT_PREFIX_FORMAT}
*
* @param batchSize size of one batch
* @return the constructed SQL string for batch inserts
*/
protected abstract String createPrepareStatementStr(int batchSize);
/**
* <p>
* Inserts entry into buffer. If current # of entries filled batch size or it overflowed the buffer,
* it will call underlying JDBC to actually insert it.
* </p>
*
* {@inheritDoc}
* @see gobblin.writer.commands.JdbcBufferedInserter#insert(java.lang.String, java.lang.String, gobblin.converter.jdbc.JdbcEntryData)
*/
@Override
public void insert(String databaseName, String table, JdbcEntryData jdbcEntryData) throws SQLException {
if (this.columnNames.isEmpty()) {
for (JdbcEntryDatum datum : jdbcEntryData) {
this.columnNames.add(datum.getColumnName());
}
initializeBatch(databaseName, table);
}
this.pendingInserts.add(jdbcEntryData);
if (this.pendingInserts.size() == this.batchSize) {
executeBatchInsert(this.insertPstmtForFixedBatch); // Reuse pre-computed Preparedstatement.
}
}
/**
* Initializes variables for batch insert and pre-compute PreparedStatement based on requested batch size and parameter size.
* @param databaseName
* @param table
* @throws SQLException
*/
protected void initializeBatch(String databaseName, String table)
throws SQLException {
this.insertStmtPrefix = createInsertStatementStr(databaseName, table);
this.insertPstmtForFixedBatch =
this.conn.prepareStatement(createPrepareStatementStr(this.batchSize));
LOG.info(String.format("Initialized for %s insert " + this, (this.batchSize > 1) ? "batch" : ""));
}
/**
* Submits the user defined {@link #insertBatch(PreparedStatement)} call to the {@link Retryer} which takes care
* of resubmitting the records according to {@link #WRITER_JDBC_INSERT_RETRY_TIMEOUT} and {@link #WRITER_JDBC_INSERT_RETRY_MAX_ATTEMPT}
* when failure happens.
*
* @param pstmt PreparedStatement object
*/
protected void executeBatchInsert(final PreparedStatement pstmt) {
try {
// Need a Callable interface to be wrapped by Retryer.
this.retryer.wrap(new Callable<Boolean>() {
@Override
public Boolean call() throws Exception {
return insertBatch(pstmt);
}
}).call();
} catch (Exception e) {
throw new RuntimeException("Failed to insert.", e);
}
resetBatch();
}
/**
* Resets the list of rows after the batch insert
*/
protected void resetBatch() {
this.pendingInserts.clear();
}
/**
* Populates the placeholders and constructs the prefix of batch insert statement
* @param databaseName name of the database
* @param table name of the table
* @return {@link #INSERT_STATEMENT_PREFIX_FORMAT} with all its resolved placeholders
*/
protected String createInsertStatementStr(String databaseName, String table) {
return String.format(INSERT_STATEMENT_PREFIX_FORMAT, databaseName, table, JOINER_ON_COMMA.join(this.columnNames));
}
@Override
public void flush() throws SQLException {
if (this.pendingInserts == null || this.pendingInserts.isEmpty()) {
return;
}
try (PreparedStatement pstmt = this.conn.prepareStatement(createPrepareStatementStr(this.pendingInserts.size()));) {
insertBatch(pstmt);
}
}
}