|
/*
 * Copyright 2018 Confluent Inc.
 *
 * Licensed under the Confluent Community License (the "License"); you may not use
 * this file except in compliance with the License. You may obtain a copy of the
 * License at
 *
 * http://www.confluent.io/confluent-community-license
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
 * WARRANTIES OF ANY KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations under the License.
 */

package io.confluent.connect.elasticsearch;

import java.util.Collection;
import java.util.HashMap;
import java.util.Iterator;
import java.util.LinkedHashMap;
import java.util.Map;
import java.util.concurrent.atomic.AtomicLong;

import org.apache.kafka.clients.consumer.OffsetAndMetadata;
import org.apache.kafka.common.TopicPartition;
import org.apache.kafka.connect.errors.ConnectException;
import org.apache.kafka.connect.sink.SinkRecord;
import org.apache.kafka.connect.sink.SinkTaskContext;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import static java.util.stream.Collectors.toMap;

/**
 * An asynchronous implementation of <code>OffsetTracker</code>.
 *
 * <p>Since ElasticsearchClient can potentially process multiple batches asynchronously for the
 * same partition, if we don't want to wait for all in-flight batches at the end of the put call
 * (or flush/preCommit), we need to keep track of the highest offset that is safe to commit.
 * For now, we do that at the individual record level because batching is handled by BulkProcessor,
 * and we don't have control over grouping/ordering.
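 *
 * <p>A minimal usage sketch (illustrative only; the real call sites live in the sink task, and
 * {@code context}, {@code record}, and {@code currentOffsets} are assumed to be in scope):
 * <pre>{@code
 * OffsetTracker tracker = new AsyncOffsetTracker(context);
 * OffsetState state = tracker.addPendingRecord(record);   // during put()
 * // ... hand the record to the async client; on successful indexing:
 * state.markProcessed();
 * tracker.updateOffsets();                                // advance the committable watermark
 * Map<TopicPartition, OffsetAndMetadata> committable = tracker.offsets(currentOffsets);
 * }</pre>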
 */
class AsyncOffsetTracker implements OffsetTracker {

  private static final Logger log = LoggerFactory.getLogger(AsyncOffsetTracker.class);

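  // Pending, not-yet-processed offset states per partition, kept in offset (insertion) order.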
  private final Map<TopicPartition, Map<Long, OffsetState>> offsetsByPartition = new HashMap<>();
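  // Highest offset per partition known to be fully processed and therefore safe to commit.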
  private final Map<TopicPartition, Long> maxOffsetByPartition = new HashMap<>();

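  // Total number of pending offset states across all partitions.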
  private final AtomicLong numEntries = new AtomicLong();
  private final SinkTaskContext context;

  public AsyncOffsetTracker(SinkTaskContext context) {
    this.context = context;
  }

  static class AsyncOffsetState implements OffsetState {

    private final long offset;
    private volatile boolean processed;

    AsyncOffsetState(long offset) {
      this.offset = offset;
    }

    @Override
    public void markProcessed() {
      processed = true;
    }

    @Override
    public boolean isProcessed() {
      return processed;
    }

    @Override
    public long offset() {
      return offset;
    }
  }

  /**
   * Releases all resources related to partitions that are no longer owned by this task.
   * @param topicPartitions partitions to close
   */
  @Override
  public synchronized void closePartitions(Collection<TopicPartition> topicPartitions) {
    topicPartitions.forEach(tp -> {
      Map<Long, OffsetState> offsets = offsetsByPartition.remove(tp);
      if (offsets != null) {
        numEntries.getAndAdd(-offsets.size());
      }
      maxOffsetByPartition.remove(tp);
    });
  }

  /**
   * This method assumes that new records are added in offset order.
   * Older records can be re-added, and the same {@code OffsetState} object will be returned
   * if its offset hasn't been reported as safe to commit yet.
   * @param sinkRecord record to add
   * @return offset state that can be used to mark the record as processed
   */
  @Override
  public synchronized OffsetState addPendingRecord(
      SinkRecord sinkRecord
  ) {
    log.trace("Adding pending record");
    TopicPartition tp = new TopicPartition(sinkRecord.topic(), sinkRecord.kafkaPartition());
    if (!context.assignment().contains(tp)) {
      String msg = String.format("Found a topic name '%s' that doesn't match assigned partitions."
          + " Connector doesn't support topic mutating SMTs", sinkRecord.topic());
      throw new ConnectException(msg);
    }
    Long partitionMax = maxOffsetByPartition.get(tp);
    if (partitionMax == null || sinkRecord.kafkaOffset() > partitionMax) {
      numEntries.incrementAndGet();
      return offsetsByPartition
          // Insertion order needs to be maintained
          .computeIfAbsent(tp, key -> new LinkedHashMap<>())
          .computeIfAbsent(sinkRecord.kafkaOffset(), AsyncOffsetState::new);
    } else {
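      // This offset is at or below the committed maximum, so it has already been accounted
      // for; return a detached state that doesn't need to be tracked.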
      return new AsyncOffsetState(sinkRecord.kafkaOffset());
    }
  }

  /**
   * @return overall number of entries currently in memory.
   */
  @Override
  public long numOffsetStateEntries() {
    return numEntries.get();
  }

  /**
   * Advances each partition's committable offset as far as the contiguous prefix of
   * processed records allows.
   */
  @Override
  public synchronized void updateOffsets() {
    log.trace("Updating offsets");
    offsetsByPartition.forEach((topicPartition, offsets) -> {
      Long max = maxOffsetByPartition.get(topicPartition);
      boolean newMaxFound = false;
      Iterator<OffsetState> iterator = offsets.values().iterator();
      while (iterator.hasNext()) {
        OffsetState offsetState = iterator.next();
        if (offsetState.isProcessed()) {
          iterator.remove();
          numEntries.decrementAndGet();
          if (max == null || offsetState.offset() > max) {
            max = offsetState.offset();
            newMaxFound = true;
          }
        } else {
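          // Stop at the first unprocessed record: offsets past a gap are not yet safe to commit.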
          break;
        }
      }
      if (newMaxFound) {
        maxOffsetByPartition.put(topicPartition, max);
      }
    });
    log.trace("Updated offsets, num entries: {}", numEntries);
  }

  /**
   * @param currentOffsets current offsets from a task (currently unused)
   * @return offsets to commit
   */
  @Override
  public synchronized Map<TopicPartition, OffsetAndMetadata> offsets(
      Map<TopicPartition, OffsetAndMetadata> currentOffsets
  ) {
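    // Only the tracker's own per-partition maxima determine what is safe to commit.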
    return maxOffsetByPartition.entrySet().stream()
        .collect(toMap(
            Map.Entry::getKey,
            // The offsets you commit are the offsets of the messages you want to read next
            // (not the offsets of the messages you did read last)
            e -> new OffsetAndMetadata(e.getValue() + 1)));
  }
}