
Commit b8e5ba8

FLOW-7464 Direct mapping from SinkRecord to Map
1 parent b31c9b8 commit b8e5ba8

37 files changed, +1834 -2507 lines changed

src/main/java/com/snowflake/kafka/connector/internal/SnowflakeErrors.java

Lines changed: 1 addition & 3 deletions
@@ -210,9 +210,7 @@ public enum SnowflakeErrors {
       "Failed to put records",
       "SinkTask hasn't been initialized before calling PUT function"),
   ERROR_5015(
-      "5015",
-      "Invalid SinkRecord received",
-      "Error parsing SinkRecord of native converter or SinkRecord header"),
+      "5015", "Invalid SinkRecord received", "Error parsing SinkRecord value or SinkRecord header"),
   ERROR_5020("5020", "Failed to register MBean in MbeanServer", "Object Name is invalid"),
   ERROR_5022("5022", "Invalid column name", "Failed to find column in the schema"),
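Not part of this commit: a minimal sketch of how ERROR_5015 might be raised and checked. It assumes SnowflakeErrors exposes a getException(Exception) helper; the checkErrorCode(...) pattern is taken from the code removed from StreamingRecordService later in this diff, and parseOrThrow is a hypothetical call site.

import com.snowflake.kafka.connector.internal.SnowflakeErrors;
import com.snowflake.kafka.connector.internal.SnowflakeKafkaConnectorException;
import org.apache.kafka.connect.sink.SinkRecord;

class Error5015Sketch {
  // Hypothetical call site: wrap a value/header parsing failure in the connector's
  // exception type. getException(Exception) is assumed to exist on SnowflakeErrors.
  static Object parseOrThrow(SinkRecord record) {
    try {
      return record.value(); // placeholder for the real value/header parsing
    } catch (RuntimeException e) {
      throw SnowflakeErrors.ERROR_5015.getException(e);
    }
  }

  // Callers can branch on the error code, mirroring the ERROR_0010 check removed below.
  static boolean isInvalidSinkRecord(SnowflakeKafkaConnectorException ex) {
    return ex.checkErrorCode(SnowflakeErrors.ERROR_5015);
  }
}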

src/main/java/com/snowflake/kafka/connector/internal/streaming/SnowflakeSinkServiceV2.java

Lines changed: 20 additions & 8 deletions
@@ -3,7 +3,6 @@
 import static com.google.common.base.Strings.isNullOrEmpty;
 import static com.snowflake.kafka.connector.Constants.KafkaConnectorConfigParams.NAME;
 import static com.snowflake.kafka.connector.Utils.getTableName;
-import static com.snowflake.kafka.connector.Utils.isIcebergEnabled;
 import static com.snowflake.kafka.connector.internal.streaming.channel.TopicPartitionChannel.NO_OFFSET_TOKEN_REGISTERED_IN_SNOWFLAKE;
 import static com.snowflake.kafka.connector.internal.streaming.v2.PipeNameProvider.buildDefaultPipeName;
 import static com.snowflake.kafka.connector.internal.streaming.v2.PipeNameProvider.buildPipeName;
@@ -22,8 +21,7 @@
 import com.snowflake.kafka.connector.internal.streaming.channel.TopicPartitionChannel;
 import com.snowflake.kafka.connector.internal.streaming.v2.SnowpipeStreamingPartitionChannel;
 import com.snowflake.kafka.connector.internal.streaming.v2.StreamingClientManager;
-import com.snowflake.kafka.connector.records.RecordService;
-import com.snowflake.kafka.connector.records.RecordServiceFactory;
+import com.snowflake.kafka.connector.records.SnowflakeMetadataConfig;
 import java.util.Collection;
 import java.util.HashMap;
 import java.util.HashSet;
@@ -58,7 +56,7 @@ public class SnowflakeSinkServiceV2 implements SnowflakeSinkService {
   // Used to connect to Snowflake, could be null during testing
   private final SnowflakeConnectionService conn;
 
-  private final RecordService recordService;
+  private final SnowflakeMetadataConfig metadataConfig;
 
   private final Map<String, String> topicToTableMap;
 
@@ -101,8 +99,7 @@ public SnowflakeSinkServiceV2(
     this.sinkTaskContext = sinkTaskContext;
     this.enableCustomJMXMonitoring = enableCustomJMXMonitoring;
     this.topicToTableMap = topicToTableMap;
-    this.recordService =
-        RecordServiceFactory.createRecordService(isIcebergEnabled(connectorConfig));
+    this.metadataConfig = new SnowflakeMetadataConfig(connectorConfig);
     this.behaviorOnNullValues = behaviorOnNullValues;
     this.partitionsToChannel = new HashMap<>();
 
@@ -214,7 +211,7 @@ private void createStreamingChannelForTopicPartition(
         channelName);
 
     StreamingRecordService streamingRecordService =
-        new StreamingRecordService(this.recordService, this.kafkaRecordErrorReporter);
+        new StreamingRecordService(this.kafkaRecordErrorReporter, this.metadataConfig);
 
     StreamingErrorHandler streamingErrorHandler =
         new StreamingErrorHandler(
@@ -269,7 +266,7 @@ public void insert(final Collection<SinkRecord> records) {
     channelsVisitedPerBatch.clear();
     for (SinkRecord record : records) {
       // check if it needs to handle null value records
-      if (recordService.shouldSkipNullValue(record, behaviorOnNullValues)) {
+      if (shouldSkipNullValue(record)) {
        continue;
      }
 
@@ -305,6 +302,21 @@ public void insert(SinkRecord record) {
     channelPartition.insertRecord(record, isFirstRowPerPartitionInBatch);
   }
 
+  private boolean shouldSkipNullValue(SinkRecord record) {
+    if (behaviorOnNullValues == ConnectorConfigTools.BehaviorOnNullValues.DEFAULT) {
+      return false;
+    }
+    if (record.value() == null) {
+      LOGGER.debug(
+          "Null valued record from topic '{}', partition {} and offset {} was skipped.",
+          record.topic(),
+          record.kafkaPartition(),
+          record.kafkaOffset());
+      return true;
+    }
+    return false;
+  }
+
   @Override
   public long getOffset(TopicPartition topicPartition) {
     String partitionChannelKey =
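Not part of this commit: a self-contained sketch of the tombstone rule that the new shouldSkipNullValue helper encodes. Under the default behavior.on.null.values setting a null-valued record flows through; otherwise it is skipped. The BehaviorOnNullValues enum below is a stand-in for the connector's ConnectorConfigTools.BehaviorOnNullValues.

import org.apache.kafka.connect.data.Schema;
import org.apache.kafka.connect.sink.SinkRecord;

class NullValueSkipSketch {
  // Stand-in for ConnectorConfigTools.BehaviorOnNullValues in the connector.
  enum BehaviorOnNullValues { DEFAULT, IGNORE }

  // Mirrors the logic added to SnowflakeSinkServiceV2 above (minus the debug log).
  static boolean shouldSkip(SinkRecord record, BehaviorOnNullValues behavior) {
    if (behavior == BehaviorOnNullValues.DEFAULT) {
      return false; // DEFAULT: tombstones flow through and are ingested downstream
    }
    return record.value() == null; // otherwise: drop null-valued (tombstone) records
  }

  public static void main(String[] args) {
    SinkRecord tombstone =
        new SinkRecord("topic", 0, Schema.STRING_SCHEMA, "key", null, null, 42L);
    System.out.println(shouldSkip(tombstone, BehaviorOnNullValues.DEFAULT)); // false
    System.out.println(shouldSkip(tombstone, BehaviorOnNullValues.IGNORE)); // true
  }
}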
src/main/java/com/snowflake/kafka/connector/internal/streaming/StreamingRecordService.java

Lines changed: 17 additions & 133 deletions
@@ -1,160 +1,44 @@
 package com.snowflake.kafka.connector.internal.streaming;
 
-import static org.apache.kafka.common.record.TimestampType.NO_TIMESTAMP_TYPE;
-
-import com.fasterxml.jackson.core.JsonProcessingException;
-import com.google.common.collect.ImmutableMap;
 import com.snowflake.kafka.connector.dlq.KafkaRecordErrorReporter;
 import com.snowflake.kafka.connector.internal.KCLogger;
-import com.snowflake.kafka.connector.internal.SnowflakeErrors;
-import com.snowflake.kafka.connector.internal.SnowflakeKafkaConnectorException;
-import com.snowflake.kafka.connector.records.RecordService;
-import com.snowflake.kafka.connector.records.SnowflakeJsonSchema;
-import com.snowflake.kafka.connector.records.SnowflakeRecordContent;
-import java.io.ByteArrayOutputStream;
-import java.io.ObjectOutputStream;
+import com.snowflake.kafka.connector.records.SnowflakeMetadataConfig;
+import com.snowflake.kafka.connector.records.SnowflakeSinkRecord;
 import java.util.Map;
-import org.apache.kafka.connect.data.Schema;
 import org.apache.kafka.connect.errors.DataException;
 import org.apache.kafka.connect.sink.SinkRecord;
 
-/** Service to transform data from Kafka format into a map that is accepted by ingest sdk. */
+/**
+ * Service to transform data from Kafka format into a map that is accepted by the Snowflake
+ * Streaming Ingest SDK.
+ */
 public class StreamingRecordService {
+
   private static final KCLogger LOGGER = new KCLogger(StreamingRecordService.class.getName());
 
-  private final RecordService recordService;
   private final KafkaRecordErrorReporter kafkaRecordErrorReporter;
+  private final SnowflakeMetadataConfig metadataConfig;
 
   public StreamingRecordService(
-      RecordService recordService, KafkaRecordErrorReporter kafkaRecordErrorReporter) {
-    this.recordService = recordService;
+      KafkaRecordErrorReporter kafkaRecordErrorReporter, SnowflakeMetadataConfig metadataConfig) {
     this.kafkaRecordErrorReporter = kafkaRecordErrorReporter;
+    this.metadataConfig = metadataConfig;
   }
 
-  /**
-   * @param kafkaSinkRecord a record in Kafka format
-   * @return a map that format depends on the schematization settings
-   */
   public Map<String, Object> transformData(SinkRecord kafkaSinkRecord) {
-    SinkRecord snowflakeSinkRecord = getSnowflakeSinkRecordFromKafkaRecord(kafkaSinkRecord);
-    // broken record
-    if (isRecordBroken(snowflakeSinkRecord)) {
-      // check for error tolerance and log tolerance values
-      // errors.log.enable and errors.tolerance
+    SnowflakeSinkRecord record = SnowflakeSinkRecord.from(kafkaSinkRecord, metadataConfig);
+
+    if (record.isBroken()) {
       LOGGER.debug(
           "Broken record offset:{}, topic:{}",
           kafkaSinkRecord.kafkaOffset(),
           kafkaSinkRecord.topic());
       kafkaRecordErrorReporter.reportError(kafkaSinkRecord, new DataException("Broken Record"));
-    } else {
-      // lag telemetry, note that sink record timestamp might be null
-      if (kafkaSinkRecord.timestamp() != null
-          && kafkaSinkRecord.timestampType() != NO_TIMESTAMP_TYPE) {
-        // TODO:SNOW-529751 telemetry
-      }
-
-      // Convert this records into Json Schema which has content and metadata, add it to DLQ if
-      // there is an exception
-      try {
-        return recordService.getProcessedRecordForStreamingIngest(snowflakeSinkRecord);
-      } catch (JsonProcessingException e) {
-        LOGGER.warn(
-            "Record has JsonProcessingException offset:{}, topic:{}",
-            kafkaSinkRecord.kafkaOffset(),
-            kafkaSinkRecord.topic());
-        kafkaRecordErrorReporter.reportError(kafkaSinkRecord, e);
-      } catch (SnowflakeKafkaConnectorException e) {
-        if (e.checkErrorCode(SnowflakeErrors.ERROR_0010)) {
-          LOGGER.warn(
-              "Cannot parse record offset:{}, topic:{}. Sending to DLQ.",
-              kafkaSinkRecord.kafkaOffset(),
-              kafkaSinkRecord.topic());
-          kafkaRecordErrorReporter.reportError(kafkaSinkRecord, e);
-        } else {
-          throw e;
-        }
-      }
-    }
-
-    // return empty
-    return ImmutableMap.of();
-  }
-
-  /**
-   * Converts the original kafka sink record into a Json Record. i.e key and values are converted
-   * into Json so that it can be used to insert into variant column of Snowflake Table.
-   *
-   * <p>TODO: SNOW-630885 - When schematization is enabled, we should create the map directly from
-   * the SinkRecord instead of first turning it into json
-   */
-  private SinkRecord getSnowflakeSinkRecordFromKafkaRecord(final SinkRecord kafkaSinkRecord) {
-    SinkRecord snowflakeRecord = kafkaSinkRecord;
-    if (shouldConvertContent(kafkaSinkRecord.value())) {
-      snowflakeRecord = handleNativeRecord(kafkaSinkRecord, false);
-    }
-    if (shouldConvertContent(kafkaSinkRecord.key())) {
-      snowflakeRecord = handleNativeRecord(snowflakeRecord, true);
+      return Map.of();
     }
 
-    return snowflakeRecord;
-  }
-
-  private boolean shouldConvertContent(final Object content) {
-    return content != null && !(content instanceof SnowflakeRecordContent);
-  }
-
-  /**
-   * This would always return false for streaming ingest use case since isBroken field is never set.
-   * isBroken is set only when using Custom snowflake converters and the content was not json
-   * serializable.
-   *
-   * <p>For Community converters, the kafka record will not be sent to Kafka connector if the record
-   * is not serializable.
-   */
-  private boolean isRecordBroken(final SinkRecord record) {
-    return isContentBroken(record.value()) || isContentBroken(record.key());
-  }
-
-  private boolean isContentBroken(final Object content) {
-    return content != null && ((SnowflakeRecordContent) content).isBroken();
-  }
-
-  private SinkRecord handleNativeRecord(SinkRecord record, boolean isKey) {
-    SnowflakeRecordContent newSFContent;
-    Schema schema = isKey ? record.keySchema() : record.valueSchema();
-    Object content = isKey ? record.key() : record.value();
-    try {
-      newSFContent = new SnowflakeRecordContent(schema, content);
-    } catch (Exception e) {
-      LOGGER.error("Native content parser error:\n{}", e.getMessage());
-      try {
-        // try to serialize this object and send that as broken record
-        ByteArrayOutputStream out = new ByteArrayOutputStream();
-        ObjectOutputStream os = new ObjectOutputStream(out);
-        os.writeObject(content);
-        newSFContent = new SnowflakeRecordContent(out.toByteArray());
-      } catch (Exception serializeError) {
-        LOGGER.error(
-            "Failed to convert broken native record to byte data:\n{}",
-            serializeError.getMessage());
-        throw e;
-      }
-    }
-    // create new sinkRecord
-    Schema keySchema = isKey ? new SnowflakeJsonSchema() : record.keySchema();
-    Object keyContent = isKey ? newSFContent : record.key();
-    Schema valueSchema = isKey ? record.valueSchema() : new SnowflakeJsonSchema();
-    Object valueContent = isKey ? record.value() : newSFContent;
-    return new SinkRecord(
-        record.topic(),
-        record.kafkaPartition(),
-        keySchema,
-        keyContent,
-        valueSchema,
-        valueContent,
-        record.kafkaOffset(),
-        record.timestamp(),
-        record.timestampType(),
-        record.headers());
+    // Tombstone records are handled by the caller (shouldSkipNullValue check)
+    // If we reach here, it means we should ingest an empty record
+    return record.getContentWithMetadata(metadataConfig.shouldIncludeAllMetadata());
   }
 }
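Not part of this commit: a hedged usage sketch of the new wiring. It assumes KafkaRecordErrorReporter is a single-method interface (reportError(SinkRecord, Exception), as called in transformData above) implementable as a lambda, and that connectorConfig is the connector's Map<String, String> configuration passed to new SnowflakeMetadataConfig(...) as in SnowflakeSinkServiceV2.

import com.snowflake.kafka.connector.dlq.KafkaRecordErrorReporter;
import com.snowflake.kafka.connector.internal.streaming.StreamingRecordService;
import com.snowflake.kafka.connector.records.SnowflakeMetadataConfig;
import java.util.Map;
import org.apache.kafka.connect.sink.SinkRecord;

class StreamingRecordServiceUsageSketch {
  static Map<String, Object> toRow(Map<String, String> connectorConfig, SinkRecord record) {
    // DLQ hook: here it only logs; assumes reportError(SinkRecord, Exception) is the
    // interface's single method, matching the calls in transformData above.
    KafkaRecordErrorReporter reporter =
        (failedRecord, error) ->
            System.err.printf(
                "DLQ offset=%d topic=%s: %s%n",
                failedRecord.kafkaOffset(), failedRecord.topic(), error.getMessage());

    // Metadata settings are derived from the connector config, mirroring
    // new SnowflakeMetadataConfig(connectorConfig) in SnowflakeSinkServiceV2.
    SnowflakeMetadataConfig metadataConfig = new SnowflakeMetadataConfig(connectorConfig);

    StreamingRecordService service = new StreamingRecordService(reporter, metadataConfig);

    // An empty map means the record was broken and has already been sent to the DLQ hook.
    return service.transformData(record);
  }
}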

src/main/java/com/snowflake/kafka/connector/internal/streaming/schemaevolution/iceberg/IcebergColumnJsonValuePair.java

Lines changed: 0 additions & 26 deletions
This file was deleted.

src/main/java/com/snowflake/kafka/connector/internal/streaming/v2/SnowpipeStreamingPartitionChannel.java

Lines changed: 4 additions & 2 deletions
@@ -224,9 +224,11 @@ private void transformAndSend(SinkRecord kafkaSinkRecord) {
       Map<String, Object> transformedRecord = streamingRecordService.transformData(kafkaSinkRecord);
       if (!transformedRecord.isEmpty()) {
         insertRowWithFallback(transformedRecord, kafkaOffset);
-        this.processedOffset.set(kafkaOffset);
-        LOGGER.trace("Setting processedOffset=[{}], channel=[{}]", kafkaOffset, channelName);
       }
+      // Always update processedOffset after transformData, even for empty/broken records
+      // Empty records are already reported to DLQ in transformData if needed
+      this.processedOffset.set(kafkaOffset);
+      LOGGER.trace("Setting processedOffset=[{}], channel=[{}]", kafkaOffset, channelName);
     } catch (TopicPartitionChannelInsertionException ex) {
       // Suppressing the exception because other channels might still continue to ingest
       LOGGER.warn(
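Not part of this commit: a minimal sketch of the changed offset bookkeeping. processedOffset now advances for every record returned by transformData, including broken records that come back as an empty map after being reported to the DLQ, so the channel does not re-read them. The AtomicLong and the insert stub below are stand-ins for the channel's internals.

import java.util.Map;
import java.util.concurrent.atomic.AtomicLong;

class OffsetAdvanceSketch {
  private final AtomicLong processedOffset = new AtomicLong(-1L);

  // Stand-in for insertRowWithFallback(...) in SnowpipeStreamingPartitionChannel.
  private void insertRow(Map<String, Object> row, long offset) {
    // ... hand the row to the streaming ingest SDK ...
  }

  void transformAndSend(Map<String, Object> transformedRecord, long kafkaOffset) {
    if (!transformedRecord.isEmpty()) {
      insertRow(transformedRecord, kafkaOffset);
    }
    // Advance even for empty/broken records (already reported to the DLQ upstream),
    // matching the hunk above: the offset is no longer gated on a successful insert.
    processedOffset.set(kafkaOffset);
  }
}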

src/main/java/com/snowflake/kafka/connector/records/IcebergTableStreamingRecordMapper.java

Lines changed: 0 additions & 44 deletions
This file was deleted.
