From 5de6c598d663ab1baa476030faf5c4312b0dd5d2 Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Wed, 19 Nov 2025 12:35:30 +0000 Subject: [PATCH 01/19] complete build success # Conflicts: # commons/src/main/java/io/aiven/commons/collections/Scale.java # commons/src/main/java/io/aiven/kafka/connect/common/config/BackoffPolicyFragment.java # commons/src/main/java/io/aiven/kafka/connect/common/config/CommonConfig.java # commons/src/main/java/io/aiven/kafka/connect/common/config/FragmentDataAccess.java # commons/src/main/java/io/aiven/kafka/connect/common/config/OutputFormatFragment.java # commons/src/main/java/io/aiven/kafka/connect/common/config/SinkCommonConfig.java # commons/src/main/java/io/aiven/kafka/connect/common/config/SourceCommonConfig.java # commons/src/main/java/io/aiven/kafka/connect/common/config/validators/FilenameTemplateValidator.java # commons/src/main/java/io/aiven/kafka/connect/common/source/input/utils/FilePatternUtils.java # commons/src/test/java/io/aiven/kafka/connect/common/config/FileNameFragmentTest.java # commons/src/test/java/io/aiven/kafka/connect/common/config/validators/FilenameTemplateValidatorTest.java # commons/src/test/java/io/aiven/kafka/connect/common/source/input/ExampleSourceRecordIteratorTest.java # gcs-sink-connector/src/main/java/io/aiven/kafka/connect/gcs/GcsSinkConfig.java # s3-commons/src/main/java/io/aiven/kafka/connect/config/s3/S3ConfigFragment.java --- .../common/config/CompressionType.java | 17 -- .../common/output/avro/AvroOutputWriter.java | 122 +++---------- .../common/output/parquet/ParquetConfig.java | 12 +- .../source/AbstractSourceRecordIterator.java | 19 +- .../AbstractSourceRecordIteratorTest.java | 162 +----------------- 5 files changed, 37 insertions(+), 295 deletions(-) diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java b/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java index 2de5216cb..669aca3fd 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java @@ -30,7 +30,6 @@ import com.github.luben.zstd.ZstdInputStream; import com.github.luben.zstd.ZstdOutputStream; import org.apache.commons.io.function.IOFunction; -import org.apache.commons.io.function.IOSupplier; import org.xerial.snappy.SnappyInputStream; import org.xerial.snappy.SnappyOutputStream; @@ -139,22 +138,6 @@ public final InputStream decompress(final InputStream input) throws IOException return decompressor.apply(input); } - /** - * Decompresses an input stream wrapped in an IOSupplier - * - * @param input - * the input stream to read compressed data from. - * @return An input stream that returns decompressed data. - */ - public final IOSupplier decompress(final IOSupplier input) { - return new IOSupplier() { - @Override - public InputStream get() throws IOException { - return decompress(input.get()); - } - }; - } - /** * Compresses an output stream. 
* diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java b/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java index f320a34cd..f9380b4c4 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java @@ -19,6 +19,7 @@ import java.io.IOException; import java.io.OutputStream; import java.util.Collection; +import java.util.List; import java.util.Map; import org.apache.kafka.connect.sink.SinkRecord; @@ -34,120 +35,49 @@ import org.apache.avro.file.DataFileWriter; import org.apache.avro.generic.GenericDatumWriter; import org.apache.avro.generic.GenericRecord; -import org.apache.commons.io.output.CloseShieldOutputStream; import org.slf4j.Logger; import org.slf4j.LoggerFactory; -/** - * An instance of OutputWriter that writes to Avro files. - */ public final class AvroOutputWriter extends OutputWriter { private static final Logger LOGGER = LoggerFactory.getLogger(AvroOutputWriter.class); + private final AvroSchemaBuilder avroSchemaBuilder; + private final SinkRecordConverter sinkRecordConverter; + public AvroOutputWriter(final Collection fields, final OutputStream out, final Map externalConfig, final boolean envelopeEnabled) { - super(out, new AvroOutputStreamWriter(fields, externalConfig, envelopeEnabled), externalConfig); + super(out, new OutputStreamWriterStub(), externalConfig); + final AvroData avroData = new AvroData(new AvroDataConfig(externalConfig)); + this.sinkRecordConverter = new SinkRecordConverter(fields, avroData, envelopeEnabled); + this.avroSchemaBuilder = new AvroSchemaBuilder(fields, avroData, envelopeEnabled); } - /** - * An instance of OutputStreamWriter that handles writing the Avro format - */ - private static final class AvroOutputStreamWriter implements OutputStreamWriter { - /** - * The sink record converter for Avro. - */ - private final SinkRecordConverter sinkRecordConverter; - /** - * The Avro schema builder. - */ - private final AvroSchemaBuilder avroSchemaBuilder; - /** - * The Avro configuration. - */ - private final AvroConfig avroConfiguration; + @Override + public void writeRecords(final Collection sinkRecords) throws IOException { + final AvroConfig avroConfiguration = AvroConfig.createAvroConfiguration(externalConfiguration); + final Schema avroSchema = avroSchemaBuilder.buildSchema(sinkRecords.iterator().next()); + LOGGER.debug("Record schema is: {}", avroSchema); - /** - * Lazily constructed Avro schema used in the output stream. - */ - private Schema avroSchema; - /** - * Lazily constructed Avro DataFileWriter. - */ - private DataFileWriter dataFileWriter; - - /** - * Constructor. - * - * @param fields - * the fields to output. - * @param externalConfig - * the configuration data for the Avro configuration. - * @param envelopeEnabled - * {@code true if the envelope is enabled} - */ - AvroOutputStreamWriter(final Collection fields, final Map externalConfig, - final boolean envelopeEnabled) { - final AvroData avroData = new AvroData(new AvroDataConfig(externalConfig)); - this.sinkRecordConverter = new SinkRecordConverter(fields, avroData, envelopeEnabled); - this.avroSchemaBuilder = new AvroSchemaBuilder(fields, avroData, envelopeEnabled); - this.avroConfiguration = AvroConfig.createAvroConfiguration(externalConfig); - } - - /** - * Create the data file writer if it does not exist. 
Requires that {@link #getAvroSchema(SinkRecord)} be called - * at least once prior. - * - * @return the DataFileWriter. - * @throws IOException - * if the writer can not be created. - */ - private DataFileWriter getDataFileWriter(final OutputStream outputStream) throws IOException { - if (dataFileWriter == null) { - final GenericDatumWriter writer = new GenericDatumWriter<>(avroSchema); - dataFileWriter = new DataFileWriter<>(writer); - dataFileWriter.setCodec(avroConfiguration.codecFactory()); - // create with output stream that does not close the underlying stream. - dataFileWriter.create(avroSchema, CloseShieldOutputStream.wrap(outputStream)); + final GenericDatumWriter writer = new GenericDatumWriter<>(avroSchema); + try (DataFileWriter dataFileWriter = new DataFileWriter<>(writer)) { + dataFileWriter.setCodec(avroConfiguration.codecFactory()); + dataFileWriter.create(avroSchema, outputStream); + for (final SinkRecord record : sinkRecords) { + final GenericRecord datum = sinkRecordConverter.convert(record, avroSchema); + dataFileWriter.append(datum); } - return dataFileWriter; } + } - /** - * Creates the Avro schema if necessary. Will throw an exception if the record schema does not match the output - * Avro schema. - * - * @param sinkRecord - * the record to be written. - * @return the file Avro schema. - * @throws IOException - * if the record schema does not match the file schema. - */ - private Schema getAvroSchema(final SinkRecord sinkRecord) throws IOException { - if (avroSchema == null) { - avroSchema = avroSchemaBuilder.buildSchema(sinkRecord); - LOGGER.debug("Record schema is: {}", avroSchema); - } else { - final Schema otherSchema = avroSchemaBuilder.buildSchema(sinkRecord); - if (!avroSchema.equals(otherSchema)) { - LOGGER.error("Illegal Schema Change. 
{}", otherSchema); - throw new IOException("Illegal schema change"); - } - } - return avroSchema; - } + @Override + public void writeRecord(final SinkRecord record) throws IOException { + writeRecords(List.of(record)); + } + private static final class OutputStreamWriterStub implements OutputStreamWriter { @Override public void writeOneRecord(final OutputStream outputStream, final SinkRecord record) throws IOException { - final GenericRecord datum = sinkRecordConverter.convert(record, getAvroSchema(record)); - getDataFileWriter(outputStream).append(datum); - } - - @Override - public void stopWriting(final OutputStream outputStream) throws IOException { - if (dataFileWriter != null) { - dataFileWriter.close(); - } } } } diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java b/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java index 6d1fa5f55..eaa692214 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java @@ -27,7 +27,7 @@ import org.apache.hadoop.conf.Configuration; import org.apache.parquet.hadoop.metadata.CompressionCodecName; -public final class ParquetConfig extends AbstractConfig { +final class ParquetConfig extends AbstractConfig { public ParquetConfig(final Map originals) { super(new ConfigDef(), originals); @@ -50,13 +50,10 @@ public Configuration parquetConfiguration() { } public CompressionCodecName compressionCodecName() { - return compressionCodecName(CompressionType.forName( + final var connectorCompressionType = CompressionType.forName( originals().getOrDefault(FileNameFragment.FILE_COMPRESSION_TYPE_CONFIG, CompressionType.NONE.name) - .toString())); - } - - public static CompressionCodecName compressionCodecName(final CompressionType compressionType) { - switch (compressionType) { + .toString()); + switch (connectorCompressionType) { case GZIP : return CompressionCodecName.GZIP; case SNAPPY : @@ -67,4 +64,5 @@ public static CompressionCodecName compressionCodecName(final CompressionType co return CompressionCodecName.UNCOMPRESSED; } } + } diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java b/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java index 0abb5565c..6c88ca1cf 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java @@ -27,17 +27,14 @@ import org.apache.kafka.connect.data.SchemaAndValue; import io.aiven.commons.collections.RingBuffer; -import io.aiven.kafka.connect.common.config.CompressionType; import io.aiven.kafka.connect.common.config.SourceCommonConfig; import io.aiven.kafka.connect.common.config.SourceConfigFragment; -import io.aiven.kafka.connect.common.source.input.ParquetTransformer; import io.aiven.kafka.connect.common.source.input.Transformer; import io.aiven.kafka.connect.common.source.input.utils.FilePatternUtils; import io.aiven.kafka.connect.common.source.task.Context; import io.aiven.kafka.connect.common.source.task.DistributionStrategy; import io.aiven.kafka.connect.common.source.task.DistributionType; -import com.google.common.annotations.VisibleForTesting; import edu.umd.cs.findbugs.annotations.SuppressFBWarnings; import org.apache.commons.io.function.IOSupplier; import 
org.apache.commons.lang3.ObjectUtils; @@ -239,25 +236,17 @@ final public void remove() { * the SourceRecord that drives the creation of source records with values. * @return a stream of T created from the input stream of the native item. */ - @VisibleForTesting - Stream convert(final T sourceRecord) { + private Stream convert(final T sourceRecord) { sourceRecord .setKeyData(transformer.getKeyData(sourceRecord.getNativeKey(), sourceRecord.getTopic(), sourceConfig)); lastSeenNativeKey = sourceRecord.getNativeKey(); - // parquet handles compression internally. - final CompressionType compressionType = transformer instanceof ParquetTransformer - ? CompressionType.NONE - : sourceConfig.getCompressionType(); - // create an IOSupplier with the specified compression - final IOSupplier inputStream = transformer instanceof ParquetTransformer - ? getInputStream(sourceRecord) - : compressionType.decompress(getInputStream(sourceRecord)); return transformer - .getRecords(inputStream, sourceRecord.getNativeItemSize(), sourceRecord.getContext(), sourceConfig, - sourceRecord.getRecordCount()) + .getRecords(getInputStream(sourceRecord), sourceRecord.getNativeItemSize(), sourceRecord.getContext(), + sourceConfig, sourceRecord.getRecordCount()) .map(new Mapper(sourceRecord)); + } /** diff --git a/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java b/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java index 7a913ab81..7d3ac0fde 100644 --- a/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java +++ b/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java @@ -25,7 +25,6 @@ import static org.mockito.Mockito.verify; import static org.mockito.Mockito.when; -import java.io.ByteArrayOutputStream; import java.io.IOException; import java.nio.ByteBuffer; import java.nio.charset.StandardCharsets; @@ -39,31 +38,18 @@ import java.util.NoSuchElementException; import java.util.Queue; -import org.apache.kafka.connect.data.Field; -import org.apache.kafka.connect.data.Schema; -import org.apache.kafka.connect.data.SchemaBuilder; -import org.apache.kafka.connect.data.Struct; -import org.apache.kafka.connect.json.JsonDeserializer; -import org.apache.kafka.connect.sink.SinkRecord; import org.apache.kafka.connect.source.SourceTaskContext; import org.apache.kafka.connect.storage.OffsetStorageReader; -import io.aiven.kafka.connect.common.config.CompressionType; -import io.aiven.kafka.connect.common.config.FormatType; -import io.aiven.kafka.connect.common.config.OutputField; -import io.aiven.kafka.connect.common.config.OutputFieldEncodingType; -import io.aiven.kafka.connect.common.config.OutputFieldType; import io.aiven.kafka.connect.common.config.SourceCommonConfig; import io.aiven.kafka.connect.common.format.AvroTestDataFixture; import io.aiven.kafka.connect.common.format.JsonTestDataFixture; import io.aiven.kafka.connect.common.format.ParquetTestDataFixture; -import io.aiven.kafka.connect.common.output.OutputWriter; import io.aiven.kafka.connect.common.source.input.InputFormat; import io.aiven.kafka.connect.common.source.input.Transformer; import io.aiven.kafka.connect.common.source.input.TransformerFactory; import io.aiven.kafka.connect.common.source.task.DistributionType; -import com.fasterxml.jackson.databind.node.ArrayNode; import org.apache.commons.lang3.tuple.Pair; import org.junit.jupiter.api.BeforeEach; import 
org.junit.jupiter.api.Test; @@ -83,7 +69,6 @@ * @param * The concrete implementation of the {@link AbstractSourceRecord} . */ -@SuppressWarnings("PMD.ExcessiveImports") public abstract class AbstractSourceRecordIteratorTest, N, O extends OffsetManager.OffsetManagerEntry, T extends AbstractSourceRecord> { /** The offset manager */ private OffsetManager offsetManager; @@ -115,7 +100,7 @@ public abstract class AbstractSourceRecordIteratorTest, * @param offsetManager * A mock offset manager. * @param transformer - * The transformer to use for the test. + * The trnasformer to use for the test. * @return A configured AbstractSourceRecordIterator. */ abstract protected AbstractSourceRecordIterator createSourceRecordIterator( @@ -150,7 +135,7 @@ public void setUp() { } /** - * Create a mock SourceConfig with our necessary items added. + * Create a mock SourceCOnfig with our necessary items added. * * @param filePattern * The file pattern to match. @@ -195,7 +180,6 @@ void testOneObjectReturnsOneObject(final InputFormat format, final byte[] data) final Transformer transformer = TransformerFactory.getTransformer(format); final SourceCommonConfig mockConfig = mockSourceConfig(FILE_PATTERN, 0, 1, null); when(mockConfig.getInputFormat()).thenReturn(format); - when(mockConfig.getCompressionType()).thenReturn(CompressionType.NONE); // verify one data has one data createClientMutator().reset().addObject(key, ByteBuffer.wrap(data)).endOfBlock().build(); @@ -261,8 +245,6 @@ void testMultipleRecordsReturned(final InputFormat format, final byte[] data) { final SourceCommonConfig config = mockSourceConfig(FILE_PATTERN, 0, 1, null); when(config.getTransformerMaxBufferSize()).thenReturn(4096); when(config.getInputFormat()).thenReturn(format); - when(config.getCompressionType()).thenReturn(CompressionType.NONE); - final AbstractSourceRecordIterator iterator = createSourceRecordIterator(config, offsetManager, transformer); @@ -333,8 +315,6 @@ void testIteratorProcessesMultipleObjectsFromByteArrayTransformer() { final SourceCommonConfig config = mockSourceConfig(FILE_PATTERN, 0, 1, null); when(config.getTransformerMaxBufferSize()).thenReturn(4096); when(config.getInputFormat()).thenReturn(InputFormat.BYTES); - when(config.getCompressionType()).thenReturn(CompressionType.NONE); - final AbstractSourceRecordIterator iterator = createSourceRecordIterator(config, offsetManager, transformer); @@ -388,144 +368,6 @@ static List parameterizedNativeStartKey() { return List.of(Arguments.of("startKeyOne", 2), Arguments.of("startKeyOne", 2), Arguments.of(null, 1)); } - /** - * Gets a configured Transformer. - * - * @param formatType - * The input format for the transformer. - * @return the Transformer for the specified input format. 
- */ - private static InputFormat formatTypeConversion(final FormatType formatType) { - switch (formatType) { - case AVRO : - return InputFormat.AVRO; - case PARQUET : - return InputFormat.PARQUET; - case JSONL : - return InputFormat.JSONL; - case CSV : - case JSON : - return InputFormat.BYTES; - default : - throw new IllegalArgumentException("Unknown format type in configuration: " + formatType); - } - } - @ParameterizedTest - @MethodSource("testDecompressionData") - @SuppressWarnings("PMD.NcssCount") - void testDecompression(final FormatType formatType, final CompressionType compressionType) throws IOException { - // setup the data - final SourceCommonConfig config = mockSourceConfig(FILE_PATTERN, 0, 1, null); - when(config.getTransformerMaxBufferSize()).thenReturn(4096); - when(config.getCompressionType()).thenReturn(compressionType); - when(config.getInputFormat()).thenReturn(formatTypeConversion(formatType)); - - final ByteArrayOutputStream byteArrayOutputStream = new ByteArrayOutputStream(); - Object value = null; - Schema valueSchema = null; - try (OutputWriter outputWriter = OutputWriter.builder() - .withCompressionType(compressionType) - .withOutputFields( - Collections.singletonList(new OutputField(OutputFieldType.VALUE, OutputFieldEncodingType.NONE))) - .build(byteArrayOutputStream, formatType)) { - - switch (formatType) { - case AVRO : - valueSchema = SchemaBuilder.struct() - .field("message", SchemaBuilder.STRING_SCHEMA) - .field("id", SchemaBuilder.INT32_SCHEMA); - value = new Struct(valueSchema).put("message", "Hello").put("id", 1); - break; - case PARQUET : - valueSchema = ParquetTestDataFixture.PARQUET_SCHEMA; - value = new Struct(valueSchema).put("name", "TheDude") - .put("age", 32) - .put("email", "thedude@example.com"); - break; - case JSONL : - valueSchema = SchemaBuilder.struct() - .field("message", SchemaBuilder.STRING_SCHEMA) - .field("id", SchemaBuilder.INT32_SCHEMA); - value = new Struct(valueSchema).put("message", "Hello").put("id", 2); - break; - case CSV : - valueSchema = SchemaBuilder.BYTES_SCHEMA; - value = "'test','one'".getBytes(StandardCharsets.UTF_8); - break; - case JSON : - valueSchema = SchemaBuilder.STRING_SCHEMA; - value = "json is here"; - break; - default : - throw new IllegalArgumentException("Unknown format type: " + formatType); - } - - final SinkRecord sinkRecord = new SinkRecord("testTopic", 0, Schema.STRING_SCHEMA, "testRecord", - valueSchema, value, 0); - outputWriter.writeRecord(sinkRecord); - } - createClientMutator().addObject(key, ByteBuffer.wrap(byteArrayOutputStream.toByteArray())).endOfBlock().build(); - final Transformer transformer = TransformerFactory.getTransformer(formatTypeConversion(formatType)); - - // Start the test - final AbstractSourceRecordIterator iterator = createSourceRecordIterator(config, offsetManager, - transformer); - assertThat(iterator).hasNext(); - final T sourceRecord = iterator.next(); - assertThat(sourceRecord).isNotNull(); - switch (formatType) { - case AVRO : - case PARQUET : - Struct struct = (Struct) sourceRecord.getValue().value(); - struct = (Struct) struct.get("value"); - assertEquivalent(valueSchema, struct.schema()); - for (final Field field : valueSchema.fields()) { - assertThat(struct.get(field)).describedAs("field: " + field).isEqualTo(((Struct) value).get(field)); - } - break; - case CSV : - assertThat(sourceRecord.getValue().schema()).isNull(); - assertThat(sourceRecord.getValue().value()).isEqualTo(value); - break; - case JSON : - assertThat(sourceRecord.getValue().schema()).isNull(); - try 
(JsonDeserializer jsonDeserializer = new JsonDeserializer()) { - final ArrayNode arrayNode = (ArrayNode) jsonDeserializer.deserialize("topic", - (byte[]) sourceRecord.getValue().value()); - assertThat(arrayNode.size()).isEqualTo(1); - assertThat(arrayNode.get(0).get("value").asText()) - .describedAs(new String((byte[]) sourceRecord.getValue().value(), StandardCharsets.UTF_8) - + " == " + String.format("[%n{\"value\":\"%s\"}%n]", value)) - .isEqualTo(value); - } - break; - case JSONL : - assertThat(sourceRecord.getValue().schema()).isNull(); - Map values = (Map) sourceRecord.getValue().value(); - values = (Map) values.get("value"); - assertThat(values.get("id")).isEqualTo(2L); - assertThat(values.get("message")).isEqualTo("Hello"); - break; - default : - throw new IllegalArgumentException("Unknown format type: " + formatType); - } - } - - private void assertEquivalent(final Schema expected, final Schema actual) { - assertThat(actual.type()).isEqualTo(expected.type()); - assertThat(actual.fields()).containsExactlyElementsOf(expected.fields()); - } - - static List testDecompressionData() { - final List result = new ArrayList<>(); - for (final FormatType formatType : FormatType.values()) { - for (final CompressionType compressionType : CompressionType.values()) { - result.add(Arguments.of(formatType, compressionType)); - } - } - return result; - } - /** * A mutator of the mocked client used by the iterator under test. *

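Note for reviewers (illustration only, not part of the patch series): the decompress(IOSupplier) helper that the next patch restores to CompressionType follows a lazy-wrapping pattern — the supplier of the raw object stream is wrapped so that decompression only happens when the stream is actually opened. The sketch below shows that pattern in a self-contained form; it hard-codes GZIP and invents the class name, whereas the real enum dispatches on the configured compression codec.

import java.io.ByteArrayInputStream;
import java.io.ByteArrayOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.nio.charset.StandardCharsets;
import java.util.zip.GZIPInputStream;
import java.util.zip.GZIPOutputStream;

import org.apache.commons.io.function.IOSupplier;

public final class LazyDecompressionSketch {

    // Wraps a supplier of compressed streams; nothing is opened or decompressed
    // until get() is called, i.e. until the transformer actually reads records.
    static IOSupplier<InputStream> decompress(final IOSupplier<InputStream> compressed) {
        return () -> new GZIPInputStream(compressed.get());
    }

    public static void main(final String[] args) throws IOException {
        // Build a small gzip payload to stand in for a compressed object from storage.
        final ByteArrayOutputStream buffer = new ByteArrayOutputStream();
        try (GZIPOutputStream gzip = new GZIPOutputStream(buffer)) {
            gzip.write("hello, world".getBytes(StandardCharsets.UTF_8));
        }
        final byte[] payload = buffer.toByteArray();

        // The supplier plays the role of getInputStream(sourceRecord) in the iterator.
        final IOSupplier<InputStream> raw = () -> new ByteArrayInputStream(payload);
        try (InputStream in = decompress(raw).get()) {
            System.out.println(new String(in.readAllBytes(), StandardCharsets.UTF_8));
        }
    }
}

The reason for wrapping the supplier rather than the stream itself is visible in the sketch: no stream exists until get() is invoked, so queued-but-unread objects never get opened or decompressed.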
From bc89fc079b3b5642cff255850c8a29ea8e7405a4 Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Wed, 19 Nov 2025 13:51:47 +0000 Subject: [PATCH 02/19] cleaned up PR --- .../common/config/CompressionType.java | 17 ++ .../common/config/SinkCommonConfig.java | 5 - .../common/output/avro/AvroOutputWriter.java | 122 ++++++++++--- .../common/output/parquet/ParquetConfig.java | 12 +- .../source/AbstractSourceRecordIterator.java | 19 +- .../AbstractSourceRecordIteratorTest.java | 162 +++++++++++++++++- 6 files changed, 295 insertions(+), 42 deletions(-) diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java b/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java index 669aca3fd..2de5216cb 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java @@ -30,6 +30,7 @@ import com.github.luben.zstd.ZstdInputStream; import com.github.luben.zstd.ZstdOutputStream; import org.apache.commons.io.function.IOFunction; +import org.apache.commons.io.function.IOSupplier; import org.xerial.snappy.SnappyInputStream; import org.xerial.snappy.SnappyOutputStream; @@ -138,6 +139,22 @@ public final InputStream decompress(final InputStream input) throws IOException return decompressor.apply(input); } + /** + * Decompresses an input stream wrapped in an IOSupplier + * + * @param input + * the input stream to read compressed data from. + * @return An input stream that returns decompressed data. + */ + public final IOSupplier decompress(final IOSupplier input) { + return new IOSupplier() { + @Override + public InputStream get() throws IOException { + return decompress(input.get()); + } + }; + } + /** * Compresses an output stream. * diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/config/SinkCommonConfig.java b/commons/src/main/java/io/aiven/kafka/connect/common/config/SinkCommonConfig.java index 956c2093f..7fb68a2b2 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/config/SinkCommonConfig.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/config/SinkCommonConfig.java @@ -142,11 +142,6 @@ public final TimestampSource getFilenameTimestampSource() { return fileNameFragment.getFilenameTimestampSource(); } - /** - * Gets the maximum records allowed in a single file. - * - * @return the maximum records allowed in a single file. - */ public final int getMaxRecordsPerFile() { return fileNameFragment.getMaxRecordsPerFile(); } diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java b/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java index f9380b4c4..f320a34cd 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java @@ -19,7 +19,6 @@ import java.io.IOException; import java.io.OutputStream; import java.util.Collection; -import java.util.List; import java.util.Map; import org.apache.kafka.connect.sink.SinkRecord; @@ -35,49 +34,120 @@ import org.apache.avro.file.DataFileWriter; import org.apache.avro.generic.GenericDatumWriter; import org.apache.avro.generic.GenericRecord; +import org.apache.commons.io.output.CloseShieldOutputStream; import org.slf4j.Logger; import org.slf4j.LoggerFactory; +/** + * An instance of OutputWriter that writes to Avro files. 
+ */ public final class AvroOutputWriter extends OutputWriter { private static final Logger LOGGER = LoggerFactory.getLogger(AvroOutputWriter.class); - private final AvroSchemaBuilder avroSchemaBuilder; - private final SinkRecordConverter sinkRecordConverter; - public AvroOutputWriter(final Collection fields, final OutputStream out, final Map externalConfig, final boolean envelopeEnabled) { - super(out, new OutputStreamWriterStub(), externalConfig); - final AvroData avroData = new AvroData(new AvroDataConfig(externalConfig)); - this.sinkRecordConverter = new SinkRecordConverter(fields, avroData, envelopeEnabled); - this.avroSchemaBuilder = new AvroSchemaBuilder(fields, avroData, envelopeEnabled); + super(out, new AvroOutputStreamWriter(fields, externalConfig, envelopeEnabled), externalConfig); } - @Override - public void writeRecords(final Collection sinkRecords) throws IOException { - final AvroConfig avroConfiguration = AvroConfig.createAvroConfiguration(externalConfiguration); - final Schema avroSchema = avroSchemaBuilder.buildSchema(sinkRecords.iterator().next()); - LOGGER.debug("Record schema is: {}", avroSchema); + /** + * An instance of OutputStreamWriter that handles writing the Avro format + */ + private static final class AvroOutputStreamWriter implements OutputStreamWriter { + /** + * The sink record converter for Avro. + */ + private final SinkRecordConverter sinkRecordConverter; + /** + * The Avro schema builder. + */ + private final AvroSchemaBuilder avroSchemaBuilder; + /** + * The Avro configuration. + */ + private final AvroConfig avroConfiguration; - final GenericDatumWriter writer = new GenericDatumWriter<>(avroSchema); - try (DataFileWriter dataFileWriter = new DataFileWriter<>(writer)) { - dataFileWriter.setCodec(avroConfiguration.codecFactory()); - dataFileWriter.create(avroSchema, outputStream); - for (final SinkRecord record : sinkRecords) { - final GenericRecord datum = sinkRecordConverter.convert(record, avroSchema); - dataFileWriter.append(datum); + /** + * Lazily constructed Avro schema used in the output stream. + */ + private Schema avroSchema; + /** + * Lazily constructed Avro DataFileWriter. + */ + private DataFileWriter dataFileWriter; + + /** + * Constructor. + * + * @param fields + * the fields to output. + * @param externalConfig + * the configuration data for the Avro configuration. + * @param envelopeEnabled + * {@code true if the envelope is enabled} + */ + AvroOutputStreamWriter(final Collection fields, final Map externalConfig, + final boolean envelopeEnabled) { + final AvroData avroData = new AvroData(new AvroDataConfig(externalConfig)); + this.sinkRecordConverter = new SinkRecordConverter(fields, avroData, envelopeEnabled); + this.avroSchemaBuilder = new AvroSchemaBuilder(fields, avroData, envelopeEnabled); + this.avroConfiguration = AvroConfig.createAvroConfiguration(externalConfig); + } + + /** + * Create the data file writer if it does not exist. Requires that {@link #getAvroSchema(SinkRecord)} be called + * at least once prior. + * + * @return the DataFileWriter. + * @throws IOException + * if the writer can not be created. + */ + private DataFileWriter getDataFileWriter(final OutputStream outputStream) throws IOException { + if (dataFileWriter == null) { + final GenericDatumWriter writer = new GenericDatumWriter<>(avroSchema); + dataFileWriter = new DataFileWriter<>(writer); + dataFileWriter.setCodec(avroConfiguration.codecFactory()); + // create with output stream that does not close the underlying stream. 
+ dataFileWriter.create(avroSchema, CloseShieldOutputStream.wrap(outputStream)); } + return dataFileWriter; } - } - @Override - public void writeRecord(final SinkRecord record) throws IOException { - writeRecords(List.of(record)); - } + /** + * Creates the Avro schema if necessary. Will throw an exception if the record schema does not match the output + * Avro schema. + * + * @param sinkRecord + * the record to be written. + * @return the file Avro schema. + * @throws IOException + * if the record schema does not match the file schema. + */ + private Schema getAvroSchema(final SinkRecord sinkRecord) throws IOException { + if (avroSchema == null) { + avroSchema = avroSchemaBuilder.buildSchema(sinkRecord); + LOGGER.debug("Record schema is: {}", avroSchema); + } else { + final Schema otherSchema = avroSchemaBuilder.buildSchema(sinkRecord); + if (!avroSchema.equals(otherSchema)) { + LOGGER.error("Illegal Schema Change. {}", otherSchema); + throw new IOException("Illegal schema change"); + } + } + return avroSchema; + } - private static final class OutputStreamWriterStub implements OutputStreamWriter { @Override public void writeOneRecord(final OutputStream outputStream, final SinkRecord record) throws IOException { + final GenericRecord datum = sinkRecordConverter.convert(record, getAvroSchema(record)); + getDataFileWriter(outputStream).append(datum); + } + + @Override + public void stopWriting(final OutputStream outputStream) throws IOException { + if (dataFileWriter != null) { + dataFileWriter.close(); + } } } } diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java b/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java index eaa692214..6d1fa5f55 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java @@ -27,7 +27,7 @@ import org.apache.hadoop.conf.Configuration; import org.apache.parquet.hadoop.metadata.CompressionCodecName; -final class ParquetConfig extends AbstractConfig { +public final class ParquetConfig extends AbstractConfig { public ParquetConfig(final Map originals) { super(new ConfigDef(), originals); @@ -50,10 +50,13 @@ public Configuration parquetConfiguration() { } public CompressionCodecName compressionCodecName() { - final var connectorCompressionType = CompressionType.forName( + return compressionCodecName(CompressionType.forName( originals().getOrDefault(FileNameFragment.FILE_COMPRESSION_TYPE_CONFIG, CompressionType.NONE.name) - .toString()); - switch (connectorCompressionType) { + .toString())); + } + + public static CompressionCodecName compressionCodecName(final CompressionType compressionType) { + switch (compressionType) { case GZIP : return CompressionCodecName.GZIP; case SNAPPY : @@ -64,5 +67,4 @@ public CompressionCodecName compressionCodecName() { return CompressionCodecName.UNCOMPRESSED; } } - } diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java b/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java index 6c88ca1cf..0abb5565c 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java @@ -27,14 +27,17 @@ import org.apache.kafka.connect.data.SchemaAndValue; import io.aiven.commons.collections.RingBuffer; +import 
io.aiven.kafka.connect.common.config.CompressionType; import io.aiven.kafka.connect.common.config.SourceCommonConfig; import io.aiven.kafka.connect.common.config.SourceConfigFragment; +import io.aiven.kafka.connect.common.source.input.ParquetTransformer; import io.aiven.kafka.connect.common.source.input.Transformer; import io.aiven.kafka.connect.common.source.input.utils.FilePatternUtils; import io.aiven.kafka.connect.common.source.task.Context; import io.aiven.kafka.connect.common.source.task.DistributionStrategy; import io.aiven.kafka.connect.common.source.task.DistributionType; +import com.google.common.annotations.VisibleForTesting; import edu.umd.cs.findbugs.annotations.SuppressFBWarnings; import org.apache.commons.io.function.IOSupplier; import org.apache.commons.lang3.ObjectUtils; @@ -236,17 +239,25 @@ final public void remove() { * the SourceRecord that drives the creation of source records with values. * @return a stream of T created from the input stream of the native item. */ - private Stream convert(final T sourceRecord) { + @VisibleForTesting + Stream convert(final T sourceRecord) { sourceRecord .setKeyData(transformer.getKeyData(sourceRecord.getNativeKey(), sourceRecord.getTopic(), sourceConfig)); lastSeenNativeKey = sourceRecord.getNativeKey(); + // parquet handles compression internally. + final CompressionType compressionType = transformer instanceof ParquetTransformer + ? CompressionType.NONE + : sourceConfig.getCompressionType(); + // create an IOSupplier with the specified compression + final IOSupplier inputStream = transformer instanceof ParquetTransformer + ? getInputStream(sourceRecord) + : compressionType.decompress(getInputStream(sourceRecord)); return transformer - .getRecords(getInputStream(sourceRecord), sourceRecord.getNativeItemSize(), sourceRecord.getContext(), - sourceConfig, sourceRecord.getRecordCount()) + .getRecords(inputStream, sourceRecord.getNativeItemSize(), sourceRecord.getContext(), sourceConfig, + sourceRecord.getRecordCount()) .map(new Mapper(sourceRecord)); - } /** diff --git a/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java b/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java index 7d3ac0fde..7a913ab81 100644 --- a/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java +++ b/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java @@ -25,6 +25,7 @@ import static org.mockito.Mockito.verify; import static org.mockito.Mockito.when; +import java.io.ByteArrayOutputStream; import java.io.IOException; import java.nio.ByteBuffer; import java.nio.charset.StandardCharsets; @@ -38,18 +39,31 @@ import java.util.NoSuchElementException; import java.util.Queue; +import org.apache.kafka.connect.data.Field; +import org.apache.kafka.connect.data.Schema; +import org.apache.kafka.connect.data.SchemaBuilder; +import org.apache.kafka.connect.data.Struct; +import org.apache.kafka.connect.json.JsonDeserializer; +import org.apache.kafka.connect.sink.SinkRecord; import org.apache.kafka.connect.source.SourceTaskContext; import org.apache.kafka.connect.storage.OffsetStorageReader; +import io.aiven.kafka.connect.common.config.CompressionType; +import io.aiven.kafka.connect.common.config.FormatType; +import io.aiven.kafka.connect.common.config.OutputField; +import io.aiven.kafka.connect.common.config.OutputFieldEncodingType; +import 
io.aiven.kafka.connect.common.config.OutputFieldType; import io.aiven.kafka.connect.common.config.SourceCommonConfig; import io.aiven.kafka.connect.common.format.AvroTestDataFixture; import io.aiven.kafka.connect.common.format.JsonTestDataFixture; import io.aiven.kafka.connect.common.format.ParquetTestDataFixture; +import io.aiven.kafka.connect.common.output.OutputWriter; import io.aiven.kafka.connect.common.source.input.InputFormat; import io.aiven.kafka.connect.common.source.input.Transformer; import io.aiven.kafka.connect.common.source.input.TransformerFactory; import io.aiven.kafka.connect.common.source.task.DistributionType; +import com.fasterxml.jackson.databind.node.ArrayNode; import org.apache.commons.lang3.tuple.Pair; import org.junit.jupiter.api.BeforeEach; import org.junit.jupiter.api.Test; @@ -69,6 +83,7 @@ * @param * The concrete implementation of the {@link AbstractSourceRecord} . */ +@SuppressWarnings("PMD.ExcessiveImports") public abstract class AbstractSourceRecordIteratorTest, N, O extends OffsetManager.OffsetManagerEntry, T extends AbstractSourceRecord> { /** The offset manager */ private OffsetManager offsetManager; @@ -100,7 +115,7 @@ public abstract class AbstractSourceRecordIteratorTest, * @param offsetManager * A mock offset manager. * @param transformer - * The trnasformer to use for the test. + * The transformer to use for the test. * @return A configured AbstractSourceRecordIterator. */ abstract protected AbstractSourceRecordIterator createSourceRecordIterator( @@ -135,7 +150,7 @@ public void setUp() { } /** - * Create a mock SourceCOnfig with our necessary items added. + * Create a mock SourceConfig with our necessary items added. * * @param filePattern * The file pattern to match. @@ -180,6 +195,7 @@ void testOneObjectReturnsOneObject(final InputFormat format, final byte[] data) final Transformer transformer = TransformerFactory.getTransformer(format); final SourceCommonConfig mockConfig = mockSourceConfig(FILE_PATTERN, 0, 1, null); when(mockConfig.getInputFormat()).thenReturn(format); + when(mockConfig.getCompressionType()).thenReturn(CompressionType.NONE); // verify one data has one data createClientMutator().reset().addObject(key, ByteBuffer.wrap(data)).endOfBlock().build(); @@ -245,6 +261,8 @@ void testMultipleRecordsReturned(final InputFormat format, final byte[] data) { final SourceCommonConfig config = mockSourceConfig(FILE_PATTERN, 0, 1, null); when(config.getTransformerMaxBufferSize()).thenReturn(4096); when(config.getInputFormat()).thenReturn(format); + when(config.getCompressionType()).thenReturn(CompressionType.NONE); + final AbstractSourceRecordIterator iterator = createSourceRecordIterator(config, offsetManager, transformer); @@ -315,6 +333,8 @@ void testIteratorProcessesMultipleObjectsFromByteArrayTransformer() { final SourceCommonConfig config = mockSourceConfig(FILE_PATTERN, 0, 1, null); when(config.getTransformerMaxBufferSize()).thenReturn(4096); when(config.getInputFormat()).thenReturn(InputFormat.BYTES); + when(config.getCompressionType()).thenReturn(CompressionType.NONE); + final AbstractSourceRecordIterator iterator = createSourceRecordIterator(config, offsetManager, transformer); @@ -368,6 +388,144 @@ static List parameterizedNativeStartKey() { return List.of(Arguments.of("startKeyOne", 2), Arguments.of("startKeyOne", 2), Arguments.of(null, 1)); } + /** + * Gets a configured Transformer. + * + * @param formatType + * The input format for the transformer. + * @return the Transformer for the specified input format. 
+ */ + private static InputFormat formatTypeConversion(final FormatType formatType) { + switch (formatType) { + case AVRO : + return InputFormat.AVRO; + case PARQUET : + return InputFormat.PARQUET; + case JSONL : + return InputFormat.JSONL; + case CSV : + case JSON : + return InputFormat.BYTES; + default : + throw new IllegalArgumentException("Unknown format type in configuration: " + formatType); + } + } + @ParameterizedTest + @MethodSource("testDecompressionData") + @SuppressWarnings("PMD.NcssCount") + void testDecompression(final FormatType formatType, final CompressionType compressionType) throws IOException { + // setup the data + final SourceCommonConfig config = mockSourceConfig(FILE_PATTERN, 0, 1, null); + when(config.getTransformerMaxBufferSize()).thenReturn(4096); + when(config.getCompressionType()).thenReturn(compressionType); + when(config.getInputFormat()).thenReturn(formatTypeConversion(formatType)); + + final ByteArrayOutputStream byteArrayOutputStream = new ByteArrayOutputStream(); + Object value = null; + Schema valueSchema = null; + try (OutputWriter outputWriter = OutputWriter.builder() + .withCompressionType(compressionType) + .withOutputFields( + Collections.singletonList(new OutputField(OutputFieldType.VALUE, OutputFieldEncodingType.NONE))) + .build(byteArrayOutputStream, formatType)) { + + switch (formatType) { + case AVRO : + valueSchema = SchemaBuilder.struct() + .field("message", SchemaBuilder.STRING_SCHEMA) + .field("id", SchemaBuilder.INT32_SCHEMA); + value = new Struct(valueSchema).put("message", "Hello").put("id", 1); + break; + case PARQUET : + valueSchema = ParquetTestDataFixture.PARQUET_SCHEMA; + value = new Struct(valueSchema).put("name", "TheDude") + .put("age", 32) + .put("email", "thedude@example.com"); + break; + case JSONL : + valueSchema = SchemaBuilder.struct() + .field("message", SchemaBuilder.STRING_SCHEMA) + .field("id", SchemaBuilder.INT32_SCHEMA); + value = new Struct(valueSchema).put("message", "Hello").put("id", 2); + break; + case CSV : + valueSchema = SchemaBuilder.BYTES_SCHEMA; + value = "'test','one'".getBytes(StandardCharsets.UTF_8); + break; + case JSON : + valueSchema = SchemaBuilder.STRING_SCHEMA; + value = "json is here"; + break; + default : + throw new IllegalArgumentException("Unknown format type: " + formatType); + } + + final SinkRecord sinkRecord = new SinkRecord("testTopic", 0, Schema.STRING_SCHEMA, "testRecord", + valueSchema, value, 0); + outputWriter.writeRecord(sinkRecord); + } + createClientMutator().addObject(key, ByteBuffer.wrap(byteArrayOutputStream.toByteArray())).endOfBlock().build(); + final Transformer transformer = TransformerFactory.getTransformer(formatTypeConversion(formatType)); + + // Start the test + final AbstractSourceRecordIterator iterator = createSourceRecordIterator(config, offsetManager, + transformer); + assertThat(iterator).hasNext(); + final T sourceRecord = iterator.next(); + assertThat(sourceRecord).isNotNull(); + switch (formatType) { + case AVRO : + case PARQUET : + Struct struct = (Struct) sourceRecord.getValue().value(); + struct = (Struct) struct.get("value"); + assertEquivalent(valueSchema, struct.schema()); + for (final Field field : valueSchema.fields()) { + assertThat(struct.get(field)).describedAs("field: " + field).isEqualTo(((Struct) value).get(field)); + } + break; + case CSV : + assertThat(sourceRecord.getValue().schema()).isNull(); + assertThat(sourceRecord.getValue().value()).isEqualTo(value); + break; + case JSON : + assertThat(sourceRecord.getValue().schema()).isNull(); + try 
(JsonDeserializer jsonDeserializer = new JsonDeserializer()) { + final ArrayNode arrayNode = (ArrayNode) jsonDeserializer.deserialize("topic", + (byte[]) sourceRecord.getValue().value()); + assertThat(arrayNode.size()).isEqualTo(1); + assertThat(arrayNode.get(0).get("value").asText()) + .describedAs(new String((byte[]) sourceRecord.getValue().value(), StandardCharsets.UTF_8) + + " == " + String.format("[%n{\"value\":\"%s\"}%n]", value)) + .isEqualTo(value); + } + break; + case JSONL : + assertThat(sourceRecord.getValue().schema()).isNull(); + Map values = (Map) sourceRecord.getValue().value(); + values = (Map) values.get("value"); + assertThat(values.get("id")).isEqualTo(2L); + assertThat(values.get("message")).isEqualTo("Hello"); + break; + default : + throw new IllegalArgumentException("Unknown format type: " + formatType); + } + } + + private void assertEquivalent(final Schema expected, final Schema actual) { + assertThat(actual.type()).isEqualTo(expected.type()); + assertThat(actual.fields()).containsExactlyElementsOf(expected.fields()); + } + + static List testDecompressionData() { + final List result = new ArrayList<>(); + for (final FormatType formatType : FormatType.values()) { + for (final CompressionType compressionType : CompressionType.values()) { + result.add(Arguments.of(formatType, compressionType)); + } + } + return result; + } + /** * A mutator of the mocked client used by the iterator under test. *

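Note for reviewers (illustration only, not part of the patch series): the AvroOutputStreamWriter restored above creates its DataFileWriter against a CloseShieldOutputStream, so closing the Avro container flushes the file format but leaves the connector's underlying stream open. The following minimal, self-contained sketch shows that behaviour; the schema, field names, and class name are invented for the example.

import java.io.ByteArrayOutputStream;
import java.io.IOException;

import org.apache.avro.Schema;
import org.apache.avro.file.CodecFactory;
import org.apache.avro.file.DataFileWriter;
import org.apache.avro.generic.GenericData;
import org.apache.avro.generic.GenericDatumWriter;
import org.apache.avro.generic.GenericRecord;
import org.apache.commons.io.output.CloseShieldOutputStream;

public final class AvroCloseShieldSketch {
    public static void main(final String[] args) throws IOException {
        final Schema schema = new Schema.Parser().parse(
                "{\"type\":\"record\",\"name\":\"Example\",\"fields\":"
                        + "[{\"name\":\"message\",\"type\":\"string\"}]}");

        final ByteArrayOutputStream out = new ByteArrayOutputStream();
        final GenericDatumWriter<GenericRecord> datumWriter = new GenericDatumWriter<>(schema);
        try (DataFileWriter<GenericRecord> fileWriter = new DataFileWriter<>(datumWriter)) {
            fileWriter.setCodec(CodecFactory.nullCodec());
            // The shield keeps fileWriter.close() from closing 'out'.
            fileWriter.create(schema, CloseShieldOutputStream.wrap(out));
            final GenericRecord record = new GenericData.Record(schema);
            record.put("message", "hello");
            fileWriter.append(record);
        }
        // 'out' is still usable here and now holds the complete Avro container bytes.
        System.out.println("wrote " + out.size() + " bytes");
    }
}

With a ByteArrayOutputStream the shield is not strictly needed, but with a real file or network stream it is what keeps the sink's stream writable after the Avro container has been closed and flushed.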
From e04e37bb629361a80ae0e90697f9002102bdc076 Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Wed, 19 Nov 2025 14:09:09 +0000 Subject: [PATCH 03/19] clean up spotless --- .../aiven/kafka/connect/common/config/SinkCommonConfig.java | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/config/SinkCommonConfig.java b/commons/src/main/java/io/aiven/kafka/connect/common/config/SinkCommonConfig.java index 7fb68a2b2..956c2093f 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/config/SinkCommonConfig.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/config/SinkCommonConfig.java @@ -142,6 +142,11 @@ public final TimestampSource getFilenameTimestampSource() { return fileNameFragment.getFilenameTimestampSource(); } + /** + * Gets the maximum records allowed in a single file. + * + * @return the maximum records allowed in a single file. + */ public final int getMaxRecordsPerFile() { return fileNameFragment.getMaxRecordsPerFile(); } From 50e436ddade5c083478c3271f1769f85d0915c42 Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Mon, 10 Nov 2025 15:47:31 +0000 Subject: [PATCH 04/19] updated S3SinkConfig and tests --- .../src/main/java/io/aiven/kafka/connect/s3/S3OutputStream.java | 2 ++ 1 file changed, 2 insertions(+) diff --git a/s3-sink-connector/src/main/java/io/aiven/kafka/connect/s3/S3OutputStream.java b/s3-sink-connector/src/main/java/io/aiven/kafka/connect/s3/S3OutputStream.java index cc89e9296..82ef9645e 100644 --- a/s3-sink-connector/src/main/java/io/aiven/kafka/connect/s3/S3OutputStream.java +++ b/s3-sink-connector/src/main/java/io/aiven/kafka/connect/s3/S3OutputStream.java @@ -25,6 +25,8 @@ import java.util.List; import java.util.Objects; +import io.aiven.commons.collections.Scale; + import com.amazonaws.services.s3.AmazonS3; import com.amazonaws.services.s3.model.AbortMultipartUploadRequest; import com.amazonaws.services.s3.model.CompleteMultipartUploadRequest; From b8e4d08bf217f5e9ec2e2e3439dacbd63b3aacfd Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Thu, 20 Nov 2025 12:16:48 +0000 Subject: [PATCH 05/19] cleaned up s3 configuration --- .../src/main/java/io/aiven/kafka/connect/s3/S3OutputStream.java | 2 -- 1 file changed, 2 deletions(-) diff --git a/s3-sink-connector/src/main/java/io/aiven/kafka/connect/s3/S3OutputStream.java b/s3-sink-connector/src/main/java/io/aiven/kafka/connect/s3/S3OutputStream.java index 82ef9645e..cc89e9296 100644 --- a/s3-sink-connector/src/main/java/io/aiven/kafka/connect/s3/S3OutputStream.java +++ b/s3-sink-connector/src/main/java/io/aiven/kafka/connect/s3/S3OutputStream.java @@ -25,8 +25,6 @@ import java.util.List; import java.util.Objects; -import io.aiven.commons.collections.Scale; - import com.amazonaws.services.s3.AmazonS3; import com.amazonaws.services.s3.model.AbortMultipartUploadRequest; import com.amazonaws.services.s3.model.CompleteMultipartUploadRequest; From 363375e39bf2919f2be7ce8d1bb29442cd8fdddd Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Thu, 20 Nov 2025 15:46:27 +0000 Subject: [PATCH 06/19] spotless changes --- .../aiven/kafka/connect/s3/source/config/S3SourceConfigDef.java | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/s3-source-connector/src/main/java/io/aiven/kafka/connect/s3/source/config/S3SourceConfigDef.java b/s3-source-connector/src/main/java/io/aiven/kafka/connect/s3/source/config/S3SourceConfigDef.java index 126979cce..7b0b00e7a 100644 --- 
a/s3-source-connector/src/main/java/io/aiven/kafka/connect/s3/source/config/S3SourceConfigDef.java +++ b/s3-source-connector/src/main/java/io/aiven/kafka/connect/s3/source/config/S3SourceConfigDef.java @@ -26,7 +26,7 @@ public final class S3SourceConfigDef extends SourceCommonConfig.SourceCommonConfigDef { - public S3SourceConfigDef() { + public S3SourceConfigDef() { super(); S3ConfigFragment.update(this, false); } From 2f2eed3389c26e88d3c0b7a66846011e03ebacb1 Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Thu, 20 Nov 2025 15:55:31 +0000 Subject: [PATCH 07/19] spotless changes --- .../aiven/kafka/connect/s3/source/config/S3SourceConfigDef.java | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/s3-source-connector/src/main/java/io/aiven/kafka/connect/s3/source/config/S3SourceConfigDef.java b/s3-source-connector/src/main/java/io/aiven/kafka/connect/s3/source/config/S3SourceConfigDef.java index 7b0b00e7a..126979cce 100644 --- a/s3-source-connector/src/main/java/io/aiven/kafka/connect/s3/source/config/S3SourceConfigDef.java +++ b/s3-source-connector/src/main/java/io/aiven/kafka/connect/s3/source/config/S3SourceConfigDef.java @@ -26,7 +26,7 @@ public final class S3SourceConfigDef extends SourceCommonConfig.SourceCommonConfigDef { - public S3SourceConfigDef() { + public S3SourceConfigDef() { super(); S3ConfigFragment.update(this, false); } From a274eb8cf6b90a60f9ee091caa95c4fbc025937b Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Fri, 21 Nov 2025 13:12:27 +0000 Subject: [PATCH 08/19] updated timescales --- .../java/io/aiven/kafka/connect/config/s3/S3ConfigFragment.java | 1 + 1 file changed, 1 insertion(+) diff --git a/s3-commons/src/main/java/io/aiven/kafka/connect/config/s3/S3ConfigFragment.java b/s3-commons/src/main/java/io/aiven/kafka/connect/config/s3/S3ConfigFragment.java index dc365e13f..40980411a 100644 --- a/s3-commons/src/main/java/io/aiven/kafka/connect/config/s3/S3ConfigFragment.java +++ b/s3-commons/src/main/java/io/aiven/kafka/connect/config/s3/S3ConfigFragment.java @@ -24,6 +24,7 @@ import java.util.Objects; import java.util.stream.Collectors; +import io.aiven.kafka.connect.common.config.validators.TimeScaleValidator; import org.apache.kafka.common.config.ConfigDef; import org.apache.kafka.common.config.ConfigException; import org.apache.kafka.common.config.ConfigValue; From fbacae201d91c836961145730559b32e084bfe4e Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Fri, 21 Nov 2025 14:22:14 +0000 Subject: [PATCH 09/19] updated validators --- .../java/io/aiven/kafka/connect/config/s3/S3ConfigFragment.java | 1 - 1 file changed, 1 deletion(-) diff --git a/s3-commons/src/main/java/io/aiven/kafka/connect/config/s3/S3ConfigFragment.java b/s3-commons/src/main/java/io/aiven/kafka/connect/config/s3/S3ConfigFragment.java index 40980411a..dc365e13f 100644 --- a/s3-commons/src/main/java/io/aiven/kafka/connect/config/s3/S3ConfigFragment.java +++ b/s3-commons/src/main/java/io/aiven/kafka/connect/config/s3/S3ConfigFragment.java @@ -24,7 +24,6 @@ import java.util.Objects; import java.util.stream.Collectors; -import io.aiven.kafka.connect.common.config.validators.TimeScaleValidator; import org.apache.kafka.common.config.ConfigDef; import org.apache.kafka.common.config.ConfigException; import org.apache.kafka.common.config.ConfigValue; From a28ee17fcef835068f4776ac089d89769543f455 Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Wed, 19 Nov 2025 12:35:30 +0000 Subject: [PATCH 10/19] complete build success # Conflicts: # 
commons/src/main/java/io/aiven/commons/collections/Scale.java # commons/src/main/java/io/aiven/kafka/connect/common/config/BackoffPolicyFragment.java # commons/src/main/java/io/aiven/kafka/connect/common/config/CommonConfig.java # commons/src/main/java/io/aiven/kafka/connect/common/config/FileNameFragment.java # commons/src/main/java/io/aiven/kafka/connect/common/config/FragmentDataAccess.java # commons/src/main/java/io/aiven/kafka/connect/common/config/OutputFormatFragment.java # commons/src/main/java/io/aiven/kafka/connect/common/config/SinkCommonConfig.java # commons/src/main/java/io/aiven/kafka/connect/common/config/SourceCommonConfig.java # commons/src/main/java/io/aiven/kafka/connect/common/config/validators/FilenameTemplateValidator.java # commons/src/main/java/io/aiven/kafka/connect/common/source/input/utils/FilePatternUtils.java # commons/src/test/java/io/aiven/kafka/connect/common/config/FileNameFragmentTest.java # commons/src/test/java/io/aiven/kafka/connect/common/config/validators/FilenameTemplateValidatorTest.java # commons/src/test/java/io/aiven/kafka/connect/common/source/input/ExampleSourceRecordIteratorTest.java # gcs-sink-connector/src/main/java/io/aiven/kafka/connect/gcs/GcsSinkConfig.java # s3-commons/src/main/java/io/aiven/kafka/connect/config/s3/S3ConfigFragment.java # s3-commons/src/main/java/io/aiven/kafka/connect/config/s3/S3SinkBaseConfig.java # s3-commons/src/test/java/io/aiven/kafka/connect/tools/AwsCredentialBaseConfig.java # s3-sink-connector/src/main/java/io/aiven/kafka/connect/s3/config/S3SinkConfig.java # s3-sink-connector/src/main/java/io/aiven/kafka/connect/s3/config/S3SinkConfigDef.java # s3-source-connector/src/main/java/io/aiven/kafka/connect/s3/source/config/S3SourceConfig.java # s3-source-connector/src/main/java/io/aiven/kafka/connect/s3/source/config/S3SourceConfigDef.java --- .../common/config/CompressionType.java | 17 -- .../common/output/avro/AvroOutputWriter.java | 122 +++---------- .../common/output/parquet/ParquetConfig.java | 12 +- .../source/AbstractSourceRecordIterator.java | 19 +- .../AbstractSourceRecordIteratorTest.java | 162 +----------------- 5 files changed, 37 insertions(+), 295 deletions(-) diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java b/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java index 2de5216cb..669aca3fd 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java @@ -30,7 +30,6 @@ import com.github.luben.zstd.ZstdInputStream; import com.github.luben.zstd.ZstdOutputStream; import org.apache.commons.io.function.IOFunction; -import org.apache.commons.io.function.IOSupplier; import org.xerial.snappy.SnappyInputStream; import org.xerial.snappy.SnappyOutputStream; @@ -139,22 +138,6 @@ public final InputStream decompress(final InputStream input) throws IOException return decompressor.apply(input); } - /** - * Decompresses an input stream wrapped in an IOSupplier - * - * @param input - * the input stream to read compressed data from. - * @return An input stream that returns decompressed data. - */ - public final IOSupplier decompress(final IOSupplier input) { - return new IOSupplier() { - @Override - public InputStream get() throws IOException { - return decompress(input.get()); - } - }; - } - /** * Compresses an output stream. 
* diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java b/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java index f320a34cd..f9380b4c4 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java @@ -19,6 +19,7 @@ import java.io.IOException; import java.io.OutputStream; import java.util.Collection; +import java.util.List; import java.util.Map; import org.apache.kafka.connect.sink.SinkRecord; @@ -34,120 +35,49 @@ import org.apache.avro.file.DataFileWriter; import org.apache.avro.generic.GenericDatumWriter; import org.apache.avro.generic.GenericRecord; -import org.apache.commons.io.output.CloseShieldOutputStream; import org.slf4j.Logger; import org.slf4j.LoggerFactory; -/** - * An instance of OutputWriter that writes to Avro files. - */ public final class AvroOutputWriter extends OutputWriter { private static final Logger LOGGER = LoggerFactory.getLogger(AvroOutputWriter.class); + private final AvroSchemaBuilder avroSchemaBuilder; + private final SinkRecordConverter sinkRecordConverter; + public AvroOutputWriter(final Collection fields, final OutputStream out, final Map externalConfig, final boolean envelopeEnabled) { - super(out, new AvroOutputStreamWriter(fields, externalConfig, envelopeEnabled), externalConfig); + super(out, new OutputStreamWriterStub(), externalConfig); + final AvroData avroData = new AvroData(new AvroDataConfig(externalConfig)); + this.sinkRecordConverter = new SinkRecordConverter(fields, avroData, envelopeEnabled); + this.avroSchemaBuilder = new AvroSchemaBuilder(fields, avroData, envelopeEnabled); } - /** - * An instance of OutputStreamWriter that handles writing the Avro format - */ - private static final class AvroOutputStreamWriter implements OutputStreamWriter { - /** - * The sink record converter for Avro. - */ - private final SinkRecordConverter sinkRecordConverter; - /** - * The Avro schema builder. - */ - private final AvroSchemaBuilder avroSchemaBuilder; - /** - * The Avro configuration. - */ - private final AvroConfig avroConfiguration; + @Override + public void writeRecords(final Collection sinkRecords) throws IOException { + final AvroConfig avroConfiguration = AvroConfig.createAvroConfiguration(externalConfiguration); + final Schema avroSchema = avroSchemaBuilder.buildSchema(sinkRecords.iterator().next()); + LOGGER.debug("Record schema is: {}", avroSchema); - /** - * Lazily constructed Avro schema used in the output stream. - */ - private Schema avroSchema; - /** - * Lazily constructed Avro DataFileWriter. - */ - private DataFileWriter dataFileWriter; - - /** - * Constructor. - * - * @param fields - * the fields to output. - * @param externalConfig - * the configuration data for the Avro configuration. - * @param envelopeEnabled - * {@code true if the envelope is enabled} - */ - AvroOutputStreamWriter(final Collection fields, final Map externalConfig, - final boolean envelopeEnabled) { - final AvroData avroData = new AvroData(new AvroDataConfig(externalConfig)); - this.sinkRecordConverter = new SinkRecordConverter(fields, avroData, envelopeEnabled); - this.avroSchemaBuilder = new AvroSchemaBuilder(fields, avroData, envelopeEnabled); - this.avroConfiguration = AvroConfig.createAvroConfiguration(externalConfig); - } - - /** - * Create the data file writer if it does not exist. 
Requires that {@link #getAvroSchema(SinkRecord)} be called - * at least once prior. - * - * @return the DataFileWriter. - * @throws IOException - * if the writer can not be created. - */ - private DataFileWriter getDataFileWriter(final OutputStream outputStream) throws IOException { - if (dataFileWriter == null) { - final GenericDatumWriter writer = new GenericDatumWriter<>(avroSchema); - dataFileWriter = new DataFileWriter<>(writer); - dataFileWriter.setCodec(avroConfiguration.codecFactory()); - // create with output stream that does not close the underlying stream. - dataFileWriter.create(avroSchema, CloseShieldOutputStream.wrap(outputStream)); + final GenericDatumWriter writer = new GenericDatumWriter<>(avroSchema); + try (DataFileWriter dataFileWriter = new DataFileWriter<>(writer)) { + dataFileWriter.setCodec(avroConfiguration.codecFactory()); + dataFileWriter.create(avroSchema, outputStream); + for (final SinkRecord record : sinkRecords) { + final GenericRecord datum = sinkRecordConverter.convert(record, avroSchema); + dataFileWriter.append(datum); } - return dataFileWriter; } + } - /** - * Creates the Avro schema if necessary. Will throw an exception if the record schema does not match the output - * Avro schema. - * - * @param sinkRecord - * the record to be written. - * @return the file Avro schema. - * @throws IOException - * if the record schema does not match the file schema. - */ - private Schema getAvroSchema(final SinkRecord sinkRecord) throws IOException { - if (avroSchema == null) { - avroSchema = avroSchemaBuilder.buildSchema(sinkRecord); - LOGGER.debug("Record schema is: {}", avroSchema); - } else { - final Schema otherSchema = avroSchemaBuilder.buildSchema(sinkRecord); - if (!avroSchema.equals(otherSchema)) { - LOGGER.error("Illegal Schema Change. 
{}", otherSchema); - throw new IOException("Illegal schema change"); - } - } - return avroSchema; - } + @Override + public void writeRecord(final SinkRecord record) throws IOException { + writeRecords(List.of(record)); + } + private static final class OutputStreamWriterStub implements OutputStreamWriter { @Override public void writeOneRecord(final OutputStream outputStream, final SinkRecord record) throws IOException { - final GenericRecord datum = sinkRecordConverter.convert(record, getAvroSchema(record)); - getDataFileWriter(outputStream).append(datum); - } - - @Override - public void stopWriting(final OutputStream outputStream) throws IOException { - if (dataFileWriter != null) { - dataFileWriter.close(); - } } } } diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java b/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java index 6d1fa5f55..eaa692214 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java @@ -27,7 +27,7 @@ import org.apache.hadoop.conf.Configuration; import org.apache.parquet.hadoop.metadata.CompressionCodecName; -public final class ParquetConfig extends AbstractConfig { +final class ParquetConfig extends AbstractConfig { public ParquetConfig(final Map originals) { super(new ConfigDef(), originals); @@ -50,13 +50,10 @@ public Configuration parquetConfiguration() { } public CompressionCodecName compressionCodecName() { - return compressionCodecName(CompressionType.forName( + final var connectorCompressionType = CompressionType.forName( originals().getOrDefault(FileNameFragment.FILE_COMPRESSION_TYPE_CONFIG, CompressionType.NONE.name) - .toString())); - } - - public static CompressionCodecName compressionCodecName(final CompressionType compressionType) { - switch (compressionType) { + .toString()); + switch (connectorCompressionType) { case GZIP : return CompressionCodecName.GZIP; case SNAPPY : @@ -67,4 +64,5 @@ public static CompressionCodecName compressionCodecName(final CompressionType co return CompressionCodecName.UNCOMPRESSED; } } + } diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java b/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java index 0abb5565c..6c88ca1cf 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java @@ -27,17 +27,14 @@ import org.apache.kafka.connect.data.SchemaAndValue; import io.aiven.commons.collections.RingBuffer; -import io.aiven.kafka.connect.common.config.CompressionType; import io.aiven.kafka.connect.common.config.SourceCommonConfig; import io.aiven.kafka.connect.common.config.SourceConfigFragment; -import io.aiven.kafka.connect.common.source.input.ParquetTransformer; import io.aiven.kafka.connect.common.source.input.Transformer; import io.aiven.kafka.connect.common.source.input.utils.FilePatternUtils; import io.aiven.kafka.connect.common.source.task.Context; import io.aiven.kafka.connect.common.source.task.DistributionStrategy; import io.aiven.kafka.connect.common.source.task.DistributionType; -import com.google.common.annotations.VisibleForTesting; import edu.umd.cs.findbugs.annotations.SuppressFBWarnings; import org.apache.commons.io.function.IOSupplier; import 
org.apache.commons.lang3.ObjectUtils; @@ -239,25 +236,17 @@ final public void remove() { * the SourceRecord that drives the creation of source records with values. * @return a stream of T created from the input stream of the native item. */ - @VisibleForTesting - Stream convert(final T sourceRecord) { + private Stream convert(final T sourceRecord) { sourceRecord .setKeyData(transformer.getKeyData(sourceRecord.getNativeKey(), sourceRecord.getTopic(), sourceConfig)); lastSeenNativeKey = sourceRecord.getNativeKey(); - // parquet handles compression internally. - final CompressionType compressionType = transformer instanceof ParquetTransformer - ? CompressionType.NONE - : sourceConfig.getCompressionType(); - // create an IOSupplier with the specified compression - final IOSupplier inputStream = transformer instanceof ParquetTransformer - ? getInputStream(sourceRecord) - : compressionType.decompress(getInputStream(sourceRecord)); return transformer - .getRecords(inputStream, sourceRecord.getNativeItemSize(), sourceRecord.getContext(), sourceConfig, - sourceRecord.getRecordCount()) + .getRecords(getInputStream(sourceRecord), sourceRecord.getNativeItemSize(), sourceRecord.getContext(), + sourceConfig, sourceRecord.getRecordCount()) .map(new Mapper(sourceRecord)); + } /** diff --git a/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java b/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java index 7a913ab81..7d3ac0fde 100644 --- a/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java +++ b/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java @@ -25,7 +25,6 @@ import static org.mockito.Mockito.verify; import static org.mockito.Mockito.when; -import java.io.ByteArrayOutputStream; import java.io.IOException; import java.nio.ByteBuffer; import java.nio.charset.StandardCharsets; @@ -39,31 +38,18 @@ import java.util.NoSuchElementException; import java.util.Queue; -import org.apache.kafka.connect.data.Field; -import org.apache.kafka.connect.data.Schema; -import org.apache.kafka.connect.data.SchemaBuilder; -import org.apache.kafka.connect.data.Struct; -import org.apache.kafka.connect.json.JsonDeserializer; -import org.apache.kafka.connect.sink.SinkRecord; import org.apache.kafka.connect.source.SourceTaskContext; import org.apache.kafka.connect.storage.OffsetStorageReader; -import io.aiven.kafka.connect.common.config.CompressionType; -import io.aiven.kafka.connect.common.config.FormatType; -import io.aiven.kafka.connect.common.config.OutputField; -import io.aiven.kafka.connect.common.config.OutputFieldEncodingType; -import io.aiven.kafka.connect.common.config.OutputFieldType; import io.aiven.kafka.connect.common.config.SourceCommonConfig; import io.aiven.kafka.connect.common.format.AvroTestDataFixture; import io.aiven.kafka.connect.common.format.JsonTestDataFixture; import io.aiven.kafka.connect.common.format.ParquetTestDataFixture; -import io.aiven.kafka.connect.common.output.OutputWriter; import io.aiven.kafka.connect.common.source.input.InputFormat; import io.aiven.kafka.connect.common.source.input.Transformer; import io.aiven.kafka.connect.common.source.input.TransformerFactory; import io.aiven.kafka.connect.common.source.task.DistributionType; -import com.fasterxml.jackson.databind.node.ArrayNode; import org.apache.commons.lang3.tuple.Pair; import org.junit.jupiter.api.BeforeEach; import 
org.junit.jupiter.api.Test; @@ -83,7 +69,6 @@ * @param * The concrete implementation of the {@link AbstractSourceRecord} . */ -@SuppressWarnings("PMD.ExcessiveImports") public abstract class AbstractSourceRecordIteratorTest, N, O extends OffsetManager.OffsetManagerEntry, T extends AbstractSourceRecord> { /** The offset manager */ private OffsetManager offsetManager; @@ -115,7 +100,7 @@ public abstract class AbstractSourceRecordIteratorTest, * @param offsetManager * A mock offset manager. * @param transformer - * The transformer to use for the test. + * The trnasformer to use for the test. * @return A configured AbstractSourceRecordIterator. */ abstract protected AbstractSourceRecordIterator createSourceRecordIterator( @@ -150,7 +135,7 @@ public void setUp() { } /** - * Create a mock SourceConfig with our necessary items added. + * Create a mock SourceCOnfig with our necessary items added. * * @param filePattern * The file pattern to match. @@ -195,7 +180,6 @@ void testOneObjectReturnsOneObject(final InputFormat format, final byte[] data) final Transformer transformer = TransformerFactory.getTransformer(format); final SourceCommonConfig mockConfig = mockSourceConfig(FILE_PATTERN, 0, 1, null); when(mockConfig.getInputFormat()).thenReturn(format); - when(mockConfig.getCompressionType()).thenReturn(CompressionType.NONE); // verify one data has one data createClientMutator().reset().addObject(key, ByteBuffer.wrap(data)).endOfBlock().build(); @@ -261,8 +245,6 @@ void testMultipleRecordsReturned(final InputFormat format, final byte[] data) { final SourceCommonConfig config = mockSourceConfig(FILE_PATTERN, 0, 1, null); when(config.getTransformerMaxBufferSize()).thenReturn(4096); when(config.getInputFormat()).thenReturn(format); - when(config.getCompressionType()).thenReturn(CompressionType.NONE); - final AbstractSourceRecordIterator iterator = createSourceRecordIterator(config, offsetManager, transformer); @@ -333,8 +315,6 @@ void testIteratorProcessesMultipleObjectsFromByteArrayTransformer() { final SourceCommonConfig config = mockSourceConfig(FILE_PATTERN, 0, 1, null); when(config.getTransformerMaxBufferSize()).thenReturn(4096); when(config.getInputFormat()).thenReturn(InputFormat.BYTES); - when(config.getCompressionType()).thenReturn(CompressionType.NONE); - final AbstractSourceRecordIterator iterator = createSourceRecordIterator(config, offsetManager, transformer); @@ -388,144 +368,6 @@ static List parameterizedNativeStartKey() { return List.of(Arguments.of("startKeyOne", 2), Arguments.of("startKeyOne", 2), Arguments.of(null, 1)); } - /** - * Gets a configured Transformer. - * - * @param formatType - * The input format for the transformer. - * @return the Transformer for the specified input format. 
- */ - private static InputFormat formatTypeConversion(final FormatType formatType) { - switch (formatType) { - case AVRO : - return InputFormat.AVRO; - case PARQUET : - return InputFormat.PARQUET; - case JSONL : - return InputFormat.JSONL; - case CSV : - case JSON : - return InputFormat.BYTES; - default : - throw new IllegalArgumentException("Unknown format type in configuration: " + formatType); - } - } - @ParameterizedTest - @MethodSource("testDecompressionData") - @SuppressWarnings("PMD.NcssCount") - void testDecompression(final FormatType formatType, final CompressionType compressionType) throws IOException { - // setup the data - final SourceCommonConfig config = mockSourceConfig(FILE_PATTERN, 0, 1, null); - when(config.getTransformerMaxBufferSize()).thenReturn(4096); - when(config.getCompressionType()).thenReturn(compressionType); - when(config.getInputFormat()).thenReturn(formatTypeConversion(formatType)); - - final ByteArrayOutputStream byteArrayOutputStream = new ByteArrayOutputStream(); - Object value = null; - Schema valueSchema = null; - try (OutputWriter outputWriter = OutputWriter.builder() - .withCompressionType(compressionType) - .withOutputFields( - Collections.singletonList(new OutputField(OutputFieldType.VALUE, OutputFieldEncodingType.NONE))) - .build(byteArrayOutputStream, formatType)) { - - switch (formatType) { - case AVRO : - valueSchema = SchemaBuilder.struct() - .field("message", SchemaBuilder.STRING_SCHEMA) - .field("id", SchemaBuilder.INT32_SCHEMA); - value = new Struct(valueSchema).put("message", "Hello").put("id", 1); - break; - case PARQUET : - valueSchema = ParquetTestDataFixture.PARQUET_SCHEMA; - value = new Struct(valueSchema).put("name", "TheDude") - .put("age", 32) - .put("email", "thedude@example.com"); - break; - case JSONL : - valueSchema = SchemaBuilder.struct() - .field("message", SchemaBuilder.STRING_SCHEMA) - .field("id", SchemaBuilder.INT32_SCHEMA); - value = new Struct(valueSchema).put("message", "Hello").put("id", 2); - break; - case CSV : - valueSchema = SchemaBuilder.BYTES_SCHEMA; - value = "'test','one'".getBytes(StandardCharsets.UTF_8); - break; - case JSON : - valueSchema = SchemaBuilder.STRING_SCHEMA; - value = "json is here"; - break; - default : - throw new IllegalArgumentException("Unknown format type: " + formatType); - } - - final SinkRecord sinkRecord = new SinkRecord("testTopic", 0, Schema.STRING_SCHEMA, "testRecord", - valueSchema, value, 0); - outputWriter.writeRecord(sinkRecord); - } - createClientMutator().addObject(key, ByteBuffer.wrap(byteArrayOutputStream.toByteArray())).endOfBlock().build(); - final Transformer transformer = TransformerFactory.getTransformer(formatTypeConversion(formatType)); - - // Start the test - final AbstractSourceRecordIterator iterator = createSourceRecordIterator(config, offsetManager, - transformer); - assertThat(iterator).hasNext(); - final T sourceRecord = iterator.next(); - assertThat(sourceRecord).isNotNull(); - switch (formatType) { - case AVRO : - case PARQUET : - Struct struct = (Struct) sourceRecord.getValue().value(); - struct = (Struct) struct.get("value"); - assertEquivalent(valueSchema, struct.schema()); - for (final Field field : valueSchema.fields()) { - assertThat(struct.get(field)).describedAs("field: " + field).isEqualTo(((Struct) value).get(field)); - } - break; - case CSV : - assertThat(sourceRecord.getValue().schema()).isNull(); - assertThat(sourceRecord.getValue().value()).isEqualTo(value); - break; - case JSON : - assertThat(sourceRecord.getValue().schema()).isNull(); - try 
(JsonDeserializer jsonDeserializer = new JsonDeserializer()) { - final ArrayNode arrayNode = (ArrayNode) jsonDeserializer.deserialize("topic", - (byte[]) sourceRecord.getValue().value()); - assertThat(arrayNode.size()).isEqualTo(1); - assertThat(arrayNode.get(0).get("value").asText()) - .describedAs(new String((byte[]) sourceRecord.getValue().value(), StandardCharsets.UTF_8) - + " == " + String.format("[%n{\"value\":\"%s\"}%n]", value)) - .isEqualTo(value); - } - break; - case JSONL : - assertThat(sourceRecord.getValue().schema()).isNull(); - Map values = (Map) sourceRecord.getValue().value(); - values = (Map) values.get("value"); - assertThat(values.get("id")).isEqualTo(2L); - assertThat(values.get("message")).isEqualTo("Hello"); - break; - default : - throw new IllegalArgumentException("Unknown format type: " + formatType); - } - } - - private void assertEquivalent(final Schema expected, final Schema actual) { - assertThat(actual.type()).isEqualTo(expected.type()); - assertThat(actual.fields()).containsExactlyElementsOf(expected.fields()); - } - - static List testDecompressionData() { - final List result = new ArrayList<>(); - for (final FormatType formatType : FormatType.values()) { - for (final CompressionType compressionType : CompressionType.values()) { - result.add(Arguments.of(formatType, compressionType)); - } - } - return result; - } - /** * A mutator of the mocked client used by the iterator under test. *

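The rewritten AvroOutputWriter above drops the lazily created schema and DataFileWriter in favour of a single-pass write: the schema is built from the first record in the batch, and the DataFileWriter is opened, filled and closed inside writeRecords, so CloseShieldOutputStream is no longer needed. A minimal sketch of that single-pass pattern against the plain Avro API follows; the schema, codec and class name below are illustrative and not taken from the connector code.

import java.io.ByteArrayOutputStream;
import java.io.IOException;
import java.io.OutputStream;
import java.util.List;

import org.apache.avro.Schema;
import org.apache.avro.SchemaBuilder;
import org.apache.avro.file.CodecFactory;
import org.apache.avro.file.DataFileWriter;
import org.apache.avro.generic.GenericData;
import org.apache.avro.generic.GenericDatumWriter;
import org.apache.avro.generic.GenericRecord;

public class AvroBatchWriteSketch {

    // Writes all records in one pass: the DataFileWriter owns the container
    // header and footer, and closing it also closes the underlying stream.
    static void writeAll(final Schema schema, final List<GenericRecord> records, final OutputStream out)
            throws IOException {
        final GenericDatumWriter<GenericRecord> datumWriter = new GenericDatumWriter<>(schema);
        try (DataFileWriter<GenericRecord> fileWriter = new DataFileWriter<>(datumWriter)) {
            fileWriter.setCodec(CodecFactory.deflateCodec(6)); // stands in for the configured codec factory
            fileWriter.create(schema, out);                    // writes the Avro container header
            for (final GenericRecord record : records) {
                fileWriter.append(record);
            }
        } // close() flushes the footer and closes 'out'
    }

    public static void main(final String[] args) throws IOException {
        final Schema schema = SchemaBuilder.record("value")
                .fields()
                .requiredString("message")
                .requiredInt("id")
                .endRecord();
        final GenericRecord record = new GenericData.Record(schema);
        record.put("message", "Hello");
        record.put("id", 1);

        final ByteArrayOutputStream out = new ByteArrayOutputStream();
        writeAll(schema, List.of(record), out);
        System.out.println("Avro container bytes written: " + out.size());
    }
}

Because closing the DataFileWriter also closes the stream it was created on, this batch form only works when the whole object is produced in one call; the lazy variant restored in the following patch keeps the stream open across writeOneRecord calls, which is why it wraps the output stream in a close shield instead.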
From b8345713ca7a25f7dcea264fa85b04e73389fefc Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Wed, 19 Nov 2025 13:51:47 +0000 Subject: [PATCH 11/19] cleaned up PR --- .../common/config/CompressionType.java | 17 ++ .../common/output/avro/AvroOutputWriter.java | 122 ++++++++++--- .../common/output/parquet/ParquetConfig.java | 12 +- .../source/AbstractSourceRecordIterator.java | 19 +- .../AbstractSourceRecordIteratorTest.java | 162 +++++++++++++++++- 5 files changed, 295 insertions(+), 37 deletions(-) diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java b/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java index 669aca3fd..2de5216cb 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/config/CompressionType.java @@ -30,6 +30,7 @@ import com.github.luben.zstd.ZstdInputStream; import com.github.luben.zstd.ZstdOutputStream; import org.apache.commons.io.function.IOFunction; +import org.apache.commons.io.function.IOSupplier; import org.xerial.snappy.SnappyInputStream; import org.xerial.snappy.SnappyOutputStream; @@ -138,6 +139,22 @@ public final InputStream decompress(final InputStream input) throws IOException return decompressor.apply(input); } + /** + * Decompresses an input stream wrapped in an IOSupplier + * + * @param input + * the input stream to read compressed data from. + * @return An input stream that returns decompressed data. + */ + public final IOSupplier decompress(final IOSupplier input) { + return new IOSupplier() { + @Override + public InputStream get() throws IOException { + return decompress(input.get()); + } + }; + } + /** * Compresses an output stream. * diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java b/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java index f9380b4c4..f320a34cd 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/output/avro/AvroOutputWriter.java @@ -19,7 +19,6 @@ import java.io.IOException; import java.io.OutputStream; import java.util.Collection; -import java.util.List; import java.util.Map; import org.apache.kafka.connect.sink.SinkRecord; @@ -35,49 +34,120 @@ import org.apache.avro.file.DataFileWriter; import org.apache.avro.generic.GenericDatumWriter; import org.apache.avro.generic.GenericRecord; +import org.apache.commons.io.output.CloseShieldOutputStream; import org.slf4j.Logger; import org.slf4j.LoggerFactory; +/** + * An instance of OutputWriter that writes to Avro files. 
+ */ public final class AvroOutputWriter extends OutputWriter { private static final Logger LOGGER = LoggerFactory.getLogger(AvroOutputWriter.class); - private final AvroSchemaBuilder avroSchemaBuilder; - private final SinkRecordConverter sinkRecordConverter; - public AvroOutputWriter(final Collection fields, final OutputStream out, final Map externalConfig, final boolean envelopeEnabled) { - super(out, new OutputStreamWriterStub(), externalConfig); - final AvroData avroData = new AvroData(new AvroDataConfig(externalConfig)); - this.sinkRecordConverter = new SinkRecordConverter(fields, avroData, envelopeEnabled); - this.avroSchemaBuilder = new AvroSchemaBuilder(fields, avroData, envelopeEnabled); + super(out, new AvroOutputStreamWriter(fields, externalConfig, envelopeEnabled), externalConfig); } - @Override - public void writeRecords(final Collection sinkRecords) throws IOException { - final AvroConfig avroConfiguration = AvroConfig.createAvroConfiguration(externalConfiguration); - final Schema avroSchema = avroSchemaBuilder.buildSchema(sinkRecords.iterator().next()); - LOGGER.debug("Record schema is: {}", avroSchema); + /** + * An instance of OutputStreamWriter that handles writing the Avro format + */ + private static final class AvroOutputStreamWriter implements OutputStreamWriter { + /** + * The sink record converter for Avro. + */ + private final SinkRecordConverter sinkRecordConverter; + /** + * The Avro schema builder. + */ + private final AvroSchemaBuilder avroSchemaBuilder; + /** + * The Avro configuration. + */ + private final AvroConfig avroConfiguration; - final GenericDatumWriter writer = new GenericDatumWriter<>(avroSchema); - try (DataFileWriter dataFileWriter = new DataFileWriter<>(writer)) { - dataFileWriter.setCodec(avroConfiguration.codecFactory()); - dataFileWriter.create(avroSchema, outputStream); - for (final SinkRecord record : sinkRecords) { - final GenericRecord datum = sinkRecordConverter.convert(record, avroSchema); - dataFileWriter.append(datum); + /** + * Lazily constructed Avro schema used in the output stream. + */ + private Schema avroSchema; + /** + * Lazily constructed Avro DataFileWriter. + */ + private DataFileWriter dataFileWriter; + + /** + * Constructor. + * + * @param fields + * the fields to output. + * @param externalConfig + * the configuration data for the Avro configuration. + * @param envelopeEnabled + * {@code true if the envelope is enabled} + */ + AvroOutputStreamWriter(final Collection fields, final Map externalConfig, + final boolean envelopeEnabled) { + final AvroData avroData = new AvroData(new AvroDataConfig(externalConfig)); + this.sinkRecordConverter = new SinkRecordConverter(fields, avroData, envelopeEnabled); + this.avroSchemaBuilder = new AvroSchemaBuilder(fields, avroData, envelopeEnabled); + this.avroConfiguration = AvroConfig.createAvroConfiguration(externalConfig); + } + + /** + * Create the data file writer if it does not exist. Requires that {@link #getAvroSchema(SinkRecord)} be called + * at least once prior. + * + * @return the DataFileWriter. + * @throws IOException + * if the writer can not be created. + */ + private DataFileWriter getDataFileWriter(final OutputStream outputStream) throws IOException { + if (dataFileWriter == null) { + final GenericDatumWriter writer = new GenericDatumWriter<>(avroSchema); + dataFileWriter = new DataFileWriter<>(writer); + dataFileWriter.setCodec(avroConfiguration.codecFactory()); + // create with output stream that does not close the underlying stream. 
+ dataFileWriter.create(avroSchema, CloseShieldOutputStream.wrap(outputStream)); } + return dataFileWriter; } - } - @Override - public void writeRecord(final SinkRecord record) throws IOException { - writeRecords(List.of(record)); - } + /** + * Creates the Avro schema if necessary. Will throw an exception if the record schema does not match the output + * Avro schema. + * + * @param sinkRecord + * the record to be written. + * @return the file Avro schema. + * @throws IOException + * if the record schema does not match the file schema. + */ + private Schema getAvroSchema(final SinkRecord sinkRecord) throws IOException { + if (avroSchema == null) { + avroSchema = avroSchemaBuilder.buildSchema(sinkRecord); + LOGGER.debug("Record schema is: {}", avroSchema); + } else { + final Schema otherSchema = avroSchemaBuilder.buildSchema(sinkRecord); + if (!avroSchema.equals(otherSchema)) { + LOGGER.error("Illegal Schema Change. {}", otherSchema); + throw new IOException("Illegal schema change"); + } + } + return avroSchema; + } - private static final class OutputStreamWriterStub implements OutputStreamWriter { @Override public void writeOneRecord(final OutputStream outputStream, final SinkRecord record) throws IOException { + final GenericRecord datum = sinkRecordConverter.convert(record, getAvroSchema(record)); + getDataFileWriter(outputStream).append(datum); + } + + @Override + public void stopWriting(final OutputStream outputStream) throws IOException { + if (dataFileWriter != null) { + dataFileWriter.close(); + } } } } diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java b/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java index eaa692214..6d1fa5f55 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/output/parquet/ParquetConfig.java @@ -27,7 +27,7 @@ import org.apache.hadoop.conf.Configuration; import org.apache.parquet.hadoop.metadata.CompressionCodecName; -final class ParquetConfig extends AbstractConfig { +public final class ParquetConfig extends AbstractConfig { public ParquetConfig(final Map originals) { super(new ConfigDef(), originals); @@ -50,10 +50,13 @@ public Configuration parquetConfiguration() { } public CompressionCodecName compressionCodecName() { - final var connectorCompressionType = CompressionType.forName( + return compressionCodecName(CompressionType.forName( originals().getOrDefault(FileNameFragment.FILE_COMPRESSION_TYPE_CONFIG, CompressionType.NONE.name) - .toString()); - switch (connectorCompressionType) { + .toString())); + } + + public static CompressionCodecName compressionCodecName(final CompressionType compressionType) { + switch (compressionType) { case GZIP : return CompressionCodecName.GZIP; case SNAPPY : @@ -64,5 +67,4 @@ public CompressionCodecName compressionCodecName() { return CompressionCodecName.UNCOMPRESSED; } } - } diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java b/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java index 6c88ca1cf..0abb5565c 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIterator.java @@ -27,14 +27,17 @@ import org.apache.kafka.connect.data.SchemaAndValue; import io.aiven.commons.collections.RingBuffer; +import 
io.aiven.kafka.connect.common.config.CompressionType; import io.aiven.kafka.connect.common.config.SourceCommonConfig; import io.aiven.kafka.connect.common.config.SourceConfigFragment; +import io.aiven.kafka.connect.common.source.input.ParquetTransformer; import io.aiven.kafka.connect.common.source.input.Transformer; import io.aiven.kafka.connect.common.source.input.utils.FilePatternUtils; import io.aiven.kafka.connect.common.source.task.Context; import io.aiven.kafka.connect.common.source.task.DistributionStrategy; import io.aiven.kafka.connect.common.source.task.DistributionType; +import com.google.common.annotations.VisibleForTesting; import edu.umd.cs.findbugs.annotations.SuppressFBWarnings; import org.apache.commons.io.function.IOSupplier; import org.apache.commons.lang3.ObjectUtils; @@ -236,17 +239,25 @@ final public void remove() { * the SourceRecord that drives the creation of source records with values. * @return a stream of T created from the input stream of the native item. */ - private Stream convert(final T sourceRecord) { + @VisibleForTesting + Stream convert(final T sourceRecord) { sourceRecord .setKeyData(transformer.getKeyData(sourceRecord.getNativeKey(), sourceRecord.getTopic(), sourceConfig)); lastSeenNativeKey = sourceRecord.getNativeKey(); + // parquet handles compression internally. + final CompressionType compressionType = transformer instanceof ParquetTransformer + ? CompressionType.NONE + : sourceConfig.getCompressionType(); + // create an IOSupplier with the specified compression + final IOSupplier inputStream = transformer instanceof ParquetTransformer + ? getInputStream(sourceRecord) + : compressionType.decompress(getInputStream(sourceRecord)); return transformer - .getRecords(getInputStream(sourceRecord), sourceRecord.getNativeItemSize(), sourceRecord.getContext(), - sourceConfig, sourceRecord.getRecordCount()) + .getRecords(inputStream, sourceRecord.getNativeItemSize(), sourceRecord.getContext(), sourceConfig, + sourceRecord.getRecordCount()) .map(new Mapper(sourceRecord)); - } /** diff --git a/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java b/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java index 7d3ac0fde..7a913ab81 100644 --- a/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java +++ b/commons/src/testFixtures/java/io/aiven/kafka/connect/common/source/AbstractSourceRecordIteratorTest.java @@ -25,6 +25,7 @@ import static org.mockito.Mockito.verify; import static org.mockito.Mockito.when; +import java.io.ByteArrayOutputStream; import java.io.IOException; import java.nio.ByteBuffer; import java.nio.charset.StandardCharsets; @@ -38,18 +39,31 @@ import java.util.NoSuchElementException; import java.util.Queue; +import org.apache.kafka.connect.data.Field; +import org.apache.kafka.connect.data.Schema; +import org.apache.kafka.connect.data.SchemaBuilder; +import org.apache.kafka.connect.data.Struct; +import org.apache.kafka.connect.json.JsonDeserializer; +import org.apache.kafka.connect.sink.SinkRecord; import org.apache.kafka.connect.source.SourceTaskContext; import org.apache.kafka.connect.storage.OffsetStorageReader; +import io.aiven.kafka.connect.common.config.CompressionType; +import io.aiven.kafka.connect.common.config.FormatType; +import io.aiven.kafka.connect.common.config.OutputField; +import io.aiven.kafka.connect.common.config.OutputFieldEncodingType; +import 
io.aiven.kafka.connect.common.config.OutputFieldType; import io.aiven.kafka.connect.common.config.SourceCommonConfig; import io.aiven.kafka.connect.common.format.AvroTestDataFixture; import io.aiven.kafka.connect.common.format.JsonTestDataFixture; import io.aiven.kafka.connect.common.format.ParquetTestDataFixture; +import io.aiven.kafka.connect.common.output.OutputWriter; import io.aiven.kafka.connect.common.source.input.InputFormat; import io.aiven.kafka.connect.common.source.input.Transformer; import io.aiven.kafka.connect.common.source.input.TransformerFactory; import io.aiven.kafka.connect.common.source.task.DistributionType; +import com.fasterxml.jackson.databind.node.ArrayNode; import org.apache.commons.lang3.tuple.Pair; import org.junit.jupiter.api.BeforeEach; import org.junit.jupiter.api.Test; @@ -69,6 +83,7 @@ * @param * The concrete implementation of the {@link AbstractSourceRecord} . */ +@SuppressWarnings("PMD.ExcessiveImports") public abstract class AbstractSourceRecordIteratorTest, N, O extends OffsetManager.OffsetManagerEntry, T extends AbstractSourceRecord> { /** The offset manager */ private OffsetManager offsetManager; @@ -100,7 +115,7 @@ public abstract class AbstractSourceRecordIteratorTest, * @param offsetManager * A mock offset manager. * @param transformer - * The trnasformer to use for the test. + * The transformer to use for the test. * @return A configured AbstractSourceRecordIterator. */ abstract protected AbstractSourceRecordIterator createSourceRecordIterator( @@ -135,7 +150,7 @@ public void setUp() { } /** - * Create a mock SourceCOnfig with our necessary items added. + * Create a mock SourceConfig with our necessary items added. * * @param filePattern * The file pattern to match. @@ -180,6 +195,7 @@ void testOneObjectReturnsOneObject(final InputFormat format, final byte[] data) final Transformer transformer = TransformerFactory.getTransformer(format); final SourceCommonConfig mockConfig = mockSourceConfig(FILE_PATTERN, 0, 1, null); when(mockConfig.getInputFormat()).thenReturn(format); + when(mockConfig.getCompressionType()).thenReturn(CompressionType.NONE); // verify one data has one data createClientMutator().reset().addObject(key, ByteBuffer.wrap(data)).endOfBlock().build(); @@ -245,6 +261,8 @@ void testMultipleRecordsReturned(final InputFormat format, final byte[] data) { final SourceCommonConfig config = mockSourceConfig(FILE_PATTERN, 0, 1, null); when(config.getTransformerMaxBufferSize()).thenReturn(4096); when(config.getInputFormat()).thenReturn(format); + when(config.getCompressionType()).thenReturn(CompressionType.NONE); + final AbstractSourceRecordIterator iterator = createSourceRecordIterator(config, offsetManager, transformer); @@ -315,6 +333,8 @@ void testIteratorProcessesMultipleObjectsFromByteArrayTransformer() { final SourceCommonConfig config = mockSourceConfig(FILE_PATTERN, 0, 1, null); when(config.getTransformerMaxBufferSize()).thenReturn(4096); when(config.getInputFormat()).thenReturn(InputFormat.BYTES); + when(config.getCompressionType()).thenReturn(CompressionType.NONE); + final AbstractSourceRecordIterator iterator = createSourceRecordIterator(config, offsetManager, transformer); @@ -368,6 +388,144 @@ static List parameterizedNativeStartKey() { return List.of(Arguments.of("startKeyOne", 2), Arguments.of("startKeyOne", 2), Arguments.of(null, 1)); } + /** + * Gets a configured Transformer. + * + * @param formatType + * The input format for the transformer. + * @return the Transformer for the specified input format. 
+ */ + private static InputFormat formatTypeConversion(final FormatType formatType) { + switch (formatType) { + case AVRO : + return InputFormat.AVRO; + case PARQUET : + return InputFormat.PARQUET; + case JSONL : + return InputFormat.JSONL; + case CSV : + case JSON : + return InputFormat.BYTES; + default : + throw new IllegalArgumentException("Unknown format type in configuration: " + formatType); + } + } + @ParameterizedTest + @MethodSource("testDecompressionData") + @SuppressWarnings("PMD.NcssCount") + void testDecompression(final FormatType formatType, final CompressionType compressionType) throws IOException { + // setup the data + final SourceCommonConfig config = mockSourceConfig(FILE_PATTERN, 0, 1, null); + when(config.getTransformerMaxBufferSize()).thenReturn(4096); + when(config.getCompressionType()).thenReturn(compressionType); + when(config.getInputFormat()).thenReturn(formatTypeConversion(formatType)); + + final ByteArrayOutputStream byteArrayOutputStream = new ByteArrayOutputStream(); + Object value = null; + Schema valueSchema = null; + try (OutputWriter outputWriter = OutputWriter.builder() + .withCompressionType(compressionType) + .withOutputFields( + Collections.singletonList(new OutputField(OutputFieldType.VALUE, OutputFieldEncodingType.NONE))) + .build(byteArrayOutputStream, formatType)) { + + switch (formatType) { + case AVRO : + valueSchema = SchemaBuilder.struct() + .field("message", SchemaBuilder.STRING_SCHEMA) + .field("id", SchemaBuilder.INT32_SCHEMA); + value = new Struct(valueSchema).put("message", "Hello").put("id", 1); + break; + case PARQUET : + valueSchema = ParquetTestDataFixture.PARQUET_SCHEMA; + value = new Struct(valueSchema).put("name", "TheDude") + .put("age", 32) + .put("email", "thedude@example.com"); + break; + case JSONL : + valueSchema = SchemaBuilder.struct() + .field("message", SchemaBuilder.STRING_SCHEMA) + .field("id", SchemaBuilder.INT32_SCHEMA); + value = new Struct(valueSchema).put("message", "Hello").put("id", 2); + break; + case CSV : + valueSchema = SchemaBuilder.BYTES_SCHEMA; + value = "'test','one'".getBytes(StandardCharsets.UTF_8); + break; + case JSON : + valueSchema = SchemaBuilder.STRING_SCHEMA; + value = "json is here"; + break; + default : + throw new IllegalArgumentException("Unknown format type: " + formatType); + } + + final SinkRecord sinkRecord = new SinkRecord("testTopic", 0, Schema.STRING_SCHEMA, "testRecord", + valueSchema, value, 0); + outputWriter.writeRecord(sinkRecord); + } + createClientMutator().addObject(key, ByteBuffer.wrap(byteArrayOutputStream.toByteArray())).endOfBlock().build(); + final Transformer transformer = TransformerFactory.getTransformer(formatTypeConversion(formatType)); + + // Start the test + final AbstractSourceRecordIterator iterator = createSourceRecordIterator(config, offsetManager, + transformer); + assertThat(iterator).hasNext(); + final T sourceRecord = iterator.next(); + assertThat(sourceRecord).isNotNull(); + switch (formatType) { + case AVRO : + case PARQUET : + Struct struct = (Struct) sourceRecord.getValue().value(); + struct = (Struct) struct.get("value"); + assertEquivalent(valueSchema, struct.schema()); + for (final Field field : valueSchema.fields()) { + assertThat(struct.get(field)).describedAs("field: " + field).isEqualTo(((Struct) value).get(field)); + } + break; + case CSV : + assertThat(sourceRecord.getValue().schema()).isNull(); + assertThat(sourceRecord.getValue().value()).isEqualTo(value); + break; + case JSON : + assertThat(sourceRecord.getValue().schema()).isNull(); + try 
(JsonDeserializer jsonDeserializer = new JsonDeserializer()) { + final ArrayNode arrayNode = (ArrayNode) jsonDeserializer.deserialize("topic", + (byte[]) sourceRecord.getValue().value()); + assertThat(arrayNode.size()).isEqualTo(1); + assertThat(arrayNode.get(0).get("value").asText()) + .describedAs(new String((byte[]) sourceRecord.getValue().value(), StandardCharsets.UTF_8) + + " == " + String.format("[%n{\"value\":\"%s\"}%n]", value)) + .isEqualTo(value); + } + break; + case JSONL : + assertThat(sourceRecord.getValue().schema()).isNull(); + Map values = (Map) sourceRecord.getValue().value(); + values = (Map) values.get("value"); + assertThat(values.get("id")).isEqualTo(2L); + assertThat(values.get("message")).isEqualTo("Hello"); + break; + default : + throw new IllegalArgumentException("Unknown format type: " + formatType); + } + } + + private void assertEquivalent(final Schema expected, final Schema actual) { + assertThat(actual.type()).isEqualTo(expected.type()); + assertThat(actual.fields()).containsExactlyElementsOf(expected.fields()); + } + + static List testDecompressionData() { + final List result = new ArrayList<>(); + for (final FormatType formatType : FormatType.values()) { + for (final CompressionType compressionType : CompressionType.values()) { + result.add(Arguments.of(formatType, compressionType)); + } + } + return result; + } + /** * A mutator of the mocked client used by the iterator under test. *

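The patch above reinstates the IOSupplier overload of decompress and the ParquetTransformer special case in convert, so the source iterator wraps the object's stream lazily and only for formats that do not handle compression themselves (Parquet compresses internally). A rough sketch of that lazy-wrapping idea is shown below, written against commons-io's IOSupplier with a plain GZIPInputStream standing in for the connector's CompressionType; the class and helper names are invented for illustration.

import java.io.ByteArrayInputStream;
import java.io.ByteArrayOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.nio.charset.StandardCharsets;
import java.util.zip.GZIPInputStream;
import java.util.zip.GZIPOutputStream;

import org.apache.commons.io.IOUtils;
import org.apache.commons.io.function.IOSupplier;

public class LazyDecompressSketch {

    // Wraps a supplier of compressed streams so that decompression is only
    // set up when the stream is actually opened, mirroring the IOSupplier
    // overload of CompressionType.decompress restored in this patch.
    static IOSupplier<InputStream> gunzip(final IOSupplier<InputStream> compressed) {
        return () -> new GZIPInputStream(compressed.get());
    }

    public static void main(final String[] args) throws IOException {
        // Produce some gzip-compressed bytes to stand in for a stored object.
        final ByteArrayOutputStream buffer = new ByteArrayOutputStream();
        try (GZIPOutputStream gzip = new GZIPOutputStream(buffer)) {
            gzip.write("hello, lazily decompressed world".getBytes(StandardCharsets.UTF_8));
        }

        // Nothing is fetched or decompressed until get() is called by the consumer.
        final IOSupplier<InputStream> lazy = gunzip(() -> new ByteArrayInputStream(buffer.toByteArray()));
        try (InputStream in = lazy.get()) {
            System.out.println(IOUtils.toString(in, StandardCharsets.UTF_8));
        }
    }
}

Returning another IOSupplier rather than an InputStream means no bytes are opened or decompressed until the transformer calls get(), which keeps the convert method cheap for records that are never actually read.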
From 0c57361ba0b22e520a394cc35bf5397579145ff4 Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Fri, 21 Nov 2025 15:27:37 +0000 Subject: [PATCH 12/19] updated to new commons --- azure-sink-connector/build.gradle.kts | 49 +++- .../azure/sink/AvroIntegrationTest.java | 43 ++-- .../sink/AvroParquetIntegrationTest.java | 27 ++- .../connect/azure/sink/IntegrationTest.java | 55 +++-- .../azure/sink/ParquetIntegrationTest.java | 35 ++- .../azure/sink/AzureBlobConfigFragment.java | 224 ++++++++++++++++++ .../azure/sink/AzureBlobSinkConfig.java | 177 ++------------ .../azure/sink/AzureBlobSinkConfigDef.java | 74 +++++- .../azure/sink/AzureBlobSinkConnector.java | 2 +- .../src/templates/configData.md.vm | 15 ++ .../src/templates/configData.yml.vm | 10 + .../azure/sink/AzureBlobSinkTaskTest.java | 3 +- .../sink/config/AzureSinkConfigTest.java | 171 +++++++------ azure-source-connector/build.gradle.kts | 6 +- .../source/AzureBlobSourceConnector.java | 4 +- .../config/AzureBlobConfigFragment.java | 108 +++++---- .../source/config/AzureBlobSourceConfig.java | 22 +- .../config/AzureBlobSourceConfigDef.java | 19 +- settings.gradle.kts | 2 +- 19 files changed, 672 insertions(+), 374 deletions(-) create mode 100644 azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobConfigFragment.java create mode 100644 azure-sink-connector/src/templates/configData.md.vm create mode 100644 azure-sink-connector/src/templates/configData.yml.vm diff --git a/azure-sink-connector/build.gradle.kts b/azure-sink-connector/build.gradle.kts index e0a2f78cd..85804c2de 100644 --- a/azure-sink-connector/build.gradle.kts +++ b/azure-sink-connector/build.gradle.kts @@ -71,6 +71,9 @@ idea { dependencies { compileOnly(apache.kafka.connect.api) + compileOnly(project(":site")) + compileOnly(apache.velocity.engine.core) + compileOnly(apache.velocity.tools) implementation(project(":commons")) @@ -189,7 +192,7 @@ publishing { licenses { license { name = "Apache 2.0" - url = "http://www.apache.org/licenses/LICENSE-2.0" + url = "https://www.apache.org/licenses/LICENSE-2.0" distribution = "repo" } } @@ -249,3 +252,47 @@ signing { } signatureTypes = ASCSignatureProvider() } + +/** ******************************* */ +/* Documentation building section */ +/** ******************************* */ +tasks.register("buildDocs") { + dependsOn("buildConfigMd") + dependsOn("buildConfigYml") +} + +tasks.register("buildConfigMd") { + mainClass = "io.aiven.kafka.connect.tools.ConfigDoc" + classpath = + sourceSets.main + .get() + .compileClasspath + .plus(files(tasks.jar)) + .plus(sourceSets.main.get().runtimeClasspath) + args = + listOf( + "io.aiven.kafka.connect.azure.sink.AzureBlobSinkConfig", + "configDef", + "src/templates/configData.md.vm", + "build/site/markdown/azure-sink-connector/AzureSinkConfig.md") +} + +tasks.register("buildConfigYml") { + mainClass = "io.aiven.kafka.connect.tools.ConfigDoc" + classpath = + sourceSets.main + .get() + .compileClasspath + .plus(files(tasks.jar)) + .plus(sourceSets.main.get().runtimeClasspath) + args = + listOf( + "io.aiven.kafka.connect.azure.sink.AzureBlobSinkConfig", + "configDef", + "src/templates/configData.yml.vm", + "build/site/azure-sink-connector/AzureSinkConfig.yml") +} + +/** ****************************** */ +/* End of documentation section */ +/** ****************************** */ diff --git a/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/AvroIntegrationTest.java 
b/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/AvroIntegrationTest.java index ba4ada4f5..779911e64 100644 --- a/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/AvroIntegrationTest.java +++ b/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/AvroIntegrationTest.java @@ -35,6 +35,11 @@ import org.apache.kafka.clients.producer.RecordMetadata; import io.aiven.kafka.connect.common.config.CompressionType; +import io.aiven.kafka.connect.common.config.FileNameFragment; +import io.aiven.kafka.connect.common.config.FormatType; +import io.aiven.kafka.connect.common.config.OutputFieldEncodingType; +import io.aiven.kafka.connect.common.config.OutputFieldType; +import io.aiven.kafka.connect.common.config.OutputFormatFragment; import org.apache.avro.Schema; import org.apache.avro.file.DataFileReader; @@ -95,8 +100,9 @@ private void produceRecords(final int recordCountPerPartition) throws ExecutionE @Test void avroOutput() throws ExecutionException, InterruptedException, IOException { final Map connectorConfig = basicConnectorConfig(); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "key,value"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_TYPE_CONFIG, "avro"); + OutputFormatFragment.setter(connectorConfig) + .withFormatType(FormatType.AVRO) + .withOutputFields(OutputFieldType.KEY, OutputFieldType.VALUE); createConnector(connectorConfig); final int recordCountPerPartition = 10; @@ -161,10 +167,11 @@ private byte[] getBlobBytes(final byte[] blobBytes, final String compression) th void avroOutputPlainValueWithoutEnvelope(final String avroCodec, final String compression) throws ExecutionException, InterruptedException, IOException { final Map connectorConfig = basicConnectorConfig(); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_ENVELOPE_CONFIG, "false"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "value"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_TYPE_CONFIG, "avro"); - connectorConfig.put(AzureBlobSinkConfig.FILE_COMPRESSION_TYPE_CONFIG, compression); + OutputFormatFragment.setter(connectorConfig) + .withFormatType(FormatType.AVRO) + .withOutputFields(OutputFieldType.VALUE) + .envelopeEnabled(false); + FileNameFragment.setter(connectorConfig).fileCompression(CompressionType.forName(compression)); connectorConfig.put("avro.codec", avroCodec); createConnector(connectorConfig); @@ -223,10 +230,12 @@ void avroOutputPlainValueWithoutEnvelope(final String avroCodec, final String co @Test void schemaChanged() throws ExecutionException, InterruptedException, IOException { final Map connectorConfig = basicConnectorConfig(); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_ENVELOPE_CONFIG, "false"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "value"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG, "none"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_TYPE_CONFIG, "avro"); + OutputFormatFragment.setter(connectorConfig) + .withFormatType(FormatType.AVRO) + .withOutputFields(OutputFieldType.VALUE) + .envelopeEnabled(false) + .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); + createConnector(connectorConfig); final Schema evolvedAvroInputDataSchema = new Schema.Parser() @@ -279,10 +288,12 @@ void schemaChanged() throws ExecutionException, InterruptedException, IOExceptio void jsonlOutput() throws ExecutionException, InterruptedException { 
final Map connectorConfig = basicConnectorConfig(); final String compression = "none"; - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "key,value"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG, "none"); - connectorConfig.put(AzureBlobSinkConfig.FILE_COMPRESSION_TYPE_CONFIG, compression); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_TYPE_CONFIG, "jsonl"); + OutputFormatFragment.setter(connectorConfig) + .withFormatType(FormatType.JSONL) + .withOutputFields(OutputFieldType.KEY, OutputFieldType.VALUE) + .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); + FileNameFragment.setter(connectorConfig).fileCompression(CompressionType.NONE); + createConnector(connectorConfig); final int recordCountPerPartition = 10; @@ -334,12 +345,12 @@ private Map basicConnectorConfig() { return config; } - protected String getAvroBlobName(final int partition, final int startOffset, final String compression) { + String getAvroBlobName(final int partition, final int startOffset, final String compression) { return super.getBaseBlobName(partition, startOffset) + ".avro" + CompressionType.forName(compression).extension(); } - protected String getAvroBlobName(final int partition, final int startOffset) { + String getAvroBlobName(final int partition, final int startOffset) { return super.getBaseBlobName(partition, startOffset) + ".avro"; } } diff --git a/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/AvroParquetIntegrationTest.java b/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/AvroParquetIntegrationTest.java index dd4875a9a..6df416edf 100644 --- a/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/AvroParquetIntegrationTest.java +++ b/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/AvroParquetIntegrationTest.java @@ -33,6 +33,12 @@ import org.apache.kafka.clients.producer.ProducerConfig; import org.apache.kafka.clients.producer.RecordMetadata; +import io.aiven.kafka.connect.common.config.CompressionType; +import io.aiven.kafka.connect.common.config.FileNameFragment; +import io.aiven.kafka.connect.common.config.FormatType; +import io.aiven.kafka.connect.common.config.OutputFieldEncodingType; +import io.aiven.kafka.connect.common.config.OutputFieldType; +import io.aiven.kafka.connect.common.config.OutputFormatFragment; import io.aiven.kafka.connect.common.format.ParquetTestDataFixture; import org.apache.avro.Schema; @@ -66,8 +72,10 @@ void setUp() throws ExecutionException, InterruptedException { void allOutputFields(@TempDir final Path tmpDir) throws ExecutionException, InterruptedException, IOException { final var compression = "none"; final Map connectorConfig = basicConnectorConfig(compression); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "key,value,offset,timestamp,headers"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG, "none"); + OutputFormatFragment.setter(connectorConfig) + .withOutputFields(OutputFieldType.KEY, OutputFieldType.VALUE, OutputFieldType.OFFSET, + OutputFieldType.TIMESTAMP, OutputFieldType.HEADERS) + .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); createConnector(connectorConfig); final Schema valueSchema = SchemaBuilder.record("value") @@ -134,8 +142,9 @@ void allOutputFields(@TempDir final Path tmpDir) throws ExecutionException, Inte void valueComplexType(@TempDir final Path tmpDir) throws 
ExecutionException, InterruptedException, IOException { final String compression = "none"; final Map connectorConfig = basicConnectorConfig(compression); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "value"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG, "none"); + OutputFormatFragment.setter(connectorConfig) + .withOutputFields(OutputFieldType.VALUE) + .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); createConnector(connectorConfig); final Schema valueSchema = SchemaBuilder.record("value") @@ -198,8 +207,9 @@ void valueComplexType(@TempDir final Path tmpDir) throws ExecutionException, Int void schemaChanged(@TempDir final Path tmpDir) throws ExecutionException, InterruptedException, IOException { final String compression = "none"; final Map connectorConfig = basicConnectorConfig(compression); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "value"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG, "none"); + OutputFormatFragment.setter(connectorConfig) + .withOutputFields(OutputFieldType.VALUE) + .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); createConnector(connectorConfig); final Schema valueSchema = SchemaBuilder.record("value") @@ -290,8 +300,9 @@ private Map basicConnectorConfig(final String compression) { config.put(AzureBlobSinkConfig.AZURE_STORAGE_CONTAINER_NAME_CONFIG, testContainerName); config.put(AzureBlobSinkConfig.FILE_NAME_PREFIX_CONFIG, azurePrefix); config.put("topics", testTopic0 + "," + testTopic1); - config.put(AzureBlobSinkConfig.FILE_COMPRESSION_TYPE_CONFIG, compression); - config.put(AzureBlobSinkConfig.FORMAT_OUTPUT_TYPE_CONFIG, "parquet"); + + FileNameFragment.setter(config).fileCompression(CompressionType.forName(compression)); + OutputFormatFragment.setter(config).withFormatType(FormatType.PARQUET); return config; } } diff --git a/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/IntegrationTest.java b/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/IntegrationTest.java index 5646d4ab9..a12dc33cb 100644 --- a/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/IntegrationTest.java +++ b/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/IntegrationTest.java @@ -36,6 +36,11 @@ import org.apache.kafka.common.TopicPartition; import io.aiven.kafka.connect.common.config.CompressionType; +import io.aiven.kafka.connect.common.config.FileNameFragment; +import io.aiven.kafka.connect.common.config.FormatType; +import io.aiven.kafka.connect.common.config.OutputFieldEncodingType; +import io.aiven.kafka.connect.common.config.OutputFieldType; +import io.aiven.kafka.connect.common.config.OutputFormatFragment; import org.junit.jupiter.api.BeforeEach; import org.junit.jupiter.api.Test; @@ -63,8 +68,8 @@ void setUp() throws ExecutionException, InterruptedException { @ValueSource(strings = { "none", "gzip", "snappy", "zstd" }) void basicTest(final String compression) throws ExecutionException, InterruptedException { final Map connectorConfig = basicConnectorConfig(); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "key,value"); - connectorConfig.put(AzureBlobSinkConfig.FILE_COMPRESSION_TYPE_CONFIG, compression); + OutputFormatFragment.setter(connectorConfig).withOutputFields(OutputFieldType.VALUE, OutputFieldType.KEY); + 
FileNameFragment.setter(connectorConfig).fileCompression(CompressionType.forName(compression)); createConnector(connectorConfig); final List> sendFutures = new ArrayList<>(); @@ -118,10 +123,11 @@ void basicTest(final String compression) throws ExecutionException, InterruptedE @ValueSource(strings = { "none", "gzip", "snappy", "zstd" }) void groupByTimestampVariable(final String compression) throws ExecutionException, InterruptedException { final Map connectorConfig = basicConnectorConfig(); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "key,value"); - connectorConfig.put(AzureBlobSinkConfig.FILE_COMPRESSION_TYPE_CONFIG, compression); - connectorConfig.put(AzureBlobSinkConfig.FILE_NAME_TEMPLATE_CONFIG, "{{topic}}-{{partition}}-{{start_offset}}-" - + "{{timestamp:unit=yyyy}}-{{timestamp:unit=MM}}-{{timestamp:unit=dd}}"); + OutputFormatFragment.setter(connectorConfig).withOutputFields(OutputFieldType.VALUE, OutputFieldType.KEY); + FileNameFragment.setter(connectorConfig) + .fileCompression(CompressionType.forName(compression)) + .template("{{topic}}-{{partition}}-{{start_offset}}-" + + "{{timestamp:unit=yyyy}}-{{timestamp:unit=MM}}-{{timestamp:unit=dd}}"); createConnector(connectorConfig); final List> sendFutures = new ArrayList<>(); @@ -176,10 +182,12 @@ private String getTimestampBlobName(final int partition, final int startOffset) @ValueSource(strings = { "none", "gzip", "snappy", "zstd" }) void oneFilePerRecordWithPlainValues(final String compression) throws ExecutionException, InterruptedException { final Map connectorConfig = basicConnectorConfig(); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "value"); - connectorConfig.put(AzureBlobSinkConfig.FILE_COMPRESSION_TYPE_CONFIG, compression); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG, "none"); - connectorConfig.put(AzureBlobSinkConfig.FILE_MAX_RECORDS, "1"); + FileNameFragment.setter(connectorConfig) + .maxRecordsPerFile(1) + .fileCompression(CompressionType.forName(compression)); + OutputFormatFragment.setter(connectorConfig) + .withOutputFields(OutputFieldType.VALUE) + .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); createConnector(connectorConfig); final List> sendFutures = new ArrayList<>(); @@ -226,9 +234,10 @@ void groupByKey(final String compression) throws ExecutionException, Interrupted final Map connectorConfig = basicConnectorConfig(); final CompressionType compressionType = CompressionType.forName(compression); connectorConfig.put("key.converter", "org.apache.kafka.connect.storage.StringConverter"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "key,value"); - connectorConfig.put(AzureBlobSinkConfig.FILE_COMPRESSION_TYPE_CONFIG, compression); - connectorConfig.put(AzureBlobSinkConfig.FILE_NAME_TEMPLATE_CONFIG, "{{key}}" + compressionType.extension()); + OutputFormatFragment.setter(connectorConfig).withOutputFields(OutputFieldType.VALUE, OutputFieldType.KEY); + FileNameFragment.setter(connectorConfig) + .fileCompression(CompressionType.forName(compression)) + .template("{{key}}" + compressionType.extension()); createConnector(connectorConfig); final Map> keysPerTopicPartition = new HashMap<>(); @@ -292,14 +301,14 @@ void groupByKey(final String compression) throws ExecutionException, Interrupted void jsonlOutput() throws ExecutionException, InterruptedException { final Map connectorConfig = basicConnectorConfig(); final String compression = "none"; - final String contentType = "jsonl"; - 
connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "key,value"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG, "none"); connectorConfig.put("key.converter", "org.apache.kafka.connect.storage.StringConverter"); connectorConfig.put("value.converter", "org.apache.kafka.connect.json.JsonConverter"); connectorConfig.put("value.converter.schemas.enable", "false"); - connectorConfig.put(AzureBlobSinkConfig.FILE_COMPRESSION_TYPE_CONFIG, compression); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_TYPE_CONFIG, contentType); + FileNameFragment.setter(connectorConfig).fileCompression(CompressionType.NONE); + OutputFormatFragment.setter(connectorConfig) + .withFormatType(FormatType.JSONL) + .withOutputFields(OutputFieldType.VALUE, OutputFieldType.KEY) + .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); createConnector(connectorConfig); final List> sendFutures = new ArrayList<>(); @@ -353,16 +362,16 @@ void jsonlOutput() throws ExecutionException, InterruptedException { void jsonOutput() throws ExecutionException, InterruptedException { final Map connectorConfig = basicConnectorConfig(); final String compression = "none"; - final String contentType = "json"; connectorConfig.put("azure.storage.connection.string", azureEndpoint != null ? azureEndpoint : azureConnectionString); // NOPMD - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "key,value"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG, "none"); connectorConfig.put("key.converter", "org.apache.kafka.connect.storage.StringConverter"); connectorConfig.put("value.converter", "org.apache.kafka.connect.json.JsonConverter"); connectorConfig.put("value.converter.schemas.enable", "false"); - connectorConfig.put(AzureBlobSinkConfig.FILE_COMPRESSION_TYPE_CONFIG, compression); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_TYPE_CONFIG, contentType); + FileNameFragment.setter(connectorConfig).fileCompression(CompressionType.NONE); + OutputFormatFragment.setter(connectorConfig) + .withFormatType(FormatType.JSONL) + .withOutputFields(OutputFieldType.VALUE, OutputFieldType.KEY) + .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); createConnector(connectorConfig); final int numEpochs = 10; diff --git a/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/ParquetIntegrationTest.java b/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/ParquetIntegrationTest.java index 0110dda06..0d8d6ca05 100644 --- a/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/ParquetIntegrationTest.java +++ b/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/ParquetIntegrationTest.java @@ -34,6 +34,12 @@ import org.apache.kafka.clients.producer.ProducerConfig; import org.apache.kafka.clients.producer.RecordMetadata; +import io.aiven.kafka.connect.common.config.CompressionType; +import io.aiven.kafka.connect.common.config.FileNameFragment; +import io.aiven.kafka.connect.common.config.FormatType; +import io.aiven.kafka.connect.common.config.OutputFieldEncodingType; +import io.aiven.kafka.connect.common.config.OutputFieldType; +import io.aiven.kafka.connect.common.config.OutputFormatFragment; import io.aiven.kafka.connect.common.format.ParquetTestDataFixture; import org.apache.avro.generic.GenericRecord; @@ -68,8 +74,10 @@ void setUp() throws ExecutionException, InterruptedException { void allOutputFields() throws 
ExecutionException, InterruptedException, IOException { final var compression = "none"; final Map connectorConfig = basicConnectorConfig(compression); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "key,value,offset,timestamp,headers"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG, "none"); + OutputFormatFragment.setter(connectorConfig) + .withOutputFields(OutputFieldType.KEY, OutputFieldType.VALUE, OutputFieldType.OFFSET, + OutputFieldType.TIMESTAMP, OutputFieldType.HEADERS) + .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); connectorConfig.put("key.converter", "org.apache.kafka.connect.storage.StringConverter"); connectorConfig.put("value.converter", "org.apache.kafka.connect.storage.StringConverter"); createConnector(connectorConfig); @@ -123,8 +131,10 @@ final var record = blobContents.get(blobName).get(i); void allOutputFieldsJsonValueAsString() throws ExecutionException, InterruptedException, IOException { final var compression = "none"; final Map connectorConfig = basicConnectorConfig(compression); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "key,value,offset,timestamp,headers"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG, "none"); + OutputFormatFragment.setter(connectorConfig) + .withOutputFields(OutputFieldType.KEY, OutputFieldType.VALUE, OutputFieldType.OFFSET, + OutputFieldType.TIMESTAMP, OutputFieldType.HEADERS) + .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); connectorConfig.put("key.converter", "org.apache.kafka.connect.storage.StringConverter"); connectorConfig.put("value.converter", "org.apache.kafka.connect.storage.StringConverter"); createConnector(connectorConfig); @@ -180,9 +190,10 @@ void jsonValue(final String envelopeEnabled, final String expectedOutput) throws ExecutionException, InterruptedException, IOException { final var compression = "none"; final Map connectorConfig = basicConnectorConfig(compression); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "value"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_ENVELOPE_CONFIG, envelopeEnabled); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG, "none"); + OutputFormatFragment.setter(connectorConfig) + .withOutputFields(OutputFieldType.VALUE) + .envelopeEnabled(Boolean.getBoolean(envelopeEnabled)) + .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); connectorConfig.put("key.converter", "org.apache.kafka.connect.storage.StringConverter"); connectorConfig.put("value.converter", "org.apache.kafka.connect.json.JsonConverter"); createConnector(connectorConfig); @@ -237,8 +248,9 @@ final var record = blobContents.get(blobName).get(i); void schemaChanged() throws ExecutionException, InterruptedException, IOException { final var compression = "none"; final Map connectorConfig = basicConnectorConfig(compression); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_CONFIG, "value"); - connectorConfig.put(AzureBlobSinkConfig.FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG, "none"); + OutputFormatFragment.setter(connectorConfig) + .withOutputFields(OutputFieldType.VALUE) + .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); connectorConfig.put("key.converter", "org.apache.kafka.connect.storage.StringConverter"); connectorConfig.put("value.converter", "org.apache.kafka.connect.json.JsonConverter"); createConnector(connectorConfig); @@ -306,8 +318,9 @@ private Map 
basicConnectorConfig(final String compression) { config.put(AzureBlobSinkConfig.FILE_NAME_PREFIX_CONFIG, azurePrefix); config.put("topics", testTopic0 + "," + testTopic1); - config.put(AzureBlobSinkConfig.FILE_COMPRESSION_TYPE_CONFIG, compression); - config.put(AzureBlobSinkConfig.FORMAT_OUTPUT_TYPE_CONFIG, "parquet"); + FileNameFragment.setter(config).fileCompression(CompressionType.forName(compression)); + OutputFormatFragment.setter(config).withFormatType(FormatType.PARQUET); + return config; } diff --git a/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobConfigFragment.java b/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobConfigFragment.java new file mode 100644 index 000000000..26fc310eb --- /dev/null +++ b/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobConfigFragment.java @@ -0,0 +1,224 @@ +/* + * Copyright 2025 Aiven Oy + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package io.aiven.kafka.connect.azure.sink; + +import java.time.Duration; +import java.util.regex.Pattern; + +import org.apache.kafka.common.config.ConfigDef; +import org.apache.kafka.common.config.ConfigException; + +import io.aiven.kafka.connect.common.config.ConfigFragment; +import io.aiven.kafka.connect.common.config.FragmentDataAccess; + +import com.azure.core.http.policy.ExponentialBackoffOptions; +import com.azure.core.http.policy.HttpLogDetailLevel; +import com.azure.core.http.policy.HttpLogOptions; +import com.azure.core.http.policy.RetryOptions; +import com.azure.core.http.policy.UserAgentPolicy; +import com.azure.storage.blob.BlobServiceAsyncClient; +import com.azure.storage.blob.BlobServiceClientBuilder; + +/** + * The configuration fragment that defines the Azure specific characteristics. TODO merge this with the Azure source + * version. 
+ */ +public final class AzureBlobConfigFragment extends ConfigFragment { + + public static final String AZURE_PREFIX_CONFIG = "azure.blob.prefix"; + public static final String AZURE_FETCH_PAGE_SIZE = "azure.blob.fetch.page.size"; + private static final String USER_AGENT_HEADER_FORMAT = "Azure Blob Source/%s (GPN: Aiven;)"; + public static final String USER_AGENT_HEADER_VALUE = String.format(USER_AGENT_HEADER_FORMAT, Version.VERSION); + private static final String GROUP_AZURE = "Azure"; + public static final String AZURE_STORAGE_CONNECTION_STRING_CONFIG = "azure.storage.connection.string"; + public static final String AZURE_STORAGE_CONTAINER_NAME_CONFIG = "azure.storage.container.name"; + public static final String AZURE_USER_AGENT = "azure.user.agent"; + + private static final String GROUP_AZURE_RETRY_BACKOFF_POLICY = "Azure retry backoff policy"; + private static final String AZURE_FETCH_BUFFER_SIZE = "azure.blob.fetch.buffer.size"; + public static final String AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG = "azure.retry.backoff.initial.delay.ms"; + public static final String AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG = "azure.retry.backoff.max.delay.ms"; + public static final String AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_CONFIG = "azure.retry.backoff.max.attempts"; + + public static final long AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_DEFAULT = 1_000L; + public static final long AZURE_RETRY_BACKOFF_MAX_DELAY_MS_DEFAULT = 32_000L; + public static final int AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_DEFAULT = 6; + + private final static Pattern CONTAINER_NAME_PATTERN = Pattern.compile("[0-9a-z][0-9a-z\\-]+[0-9a-z]"); + + /** + * From Azure documentation: + *

    + *
+ * <ul>
+ * <li>Container names must start or end with a letter or number, and can contain only letters, numbers, and the
+ * hyphen/minus (-) character.</li>
+ * <li>Every hyphen/minus (-) character must be immediately preceded and followed by a letter or number; consecutive
+ * hyphens aren't permitted in container names.</li>
+ * <li>All letters in a container name must be lowercase.</li>
+ * <li>Container names must be from 3 through 63 characters long.</li>
+ * </ul>
+ */ + private static final ConfigDef.Validator CONTAINER_NAME_VALIDATOR = ConfigDef.CompositeValidator + .of(ConfigDef.LambdaValidator.with((name, value) -> { + final int len = value == null ? 0 : value.toString().length(); + if (len < 3 || len > 63) { + throw new ConfigException(name, value, "names must be from 3 through 63 characters long."); + } + }, () -> "must be from 3 through 63 characters long"), ConfigDef.LambdaValidator.with((name, value) -> { + if (value.toString().contains("--")) { + throw new ConfigException(name, value, + "Every hyphen/minus (-) character must be immediately preceded and followed by a letter or number; consecutive hyphens aren't permitted in container names."); + } + }, () -> "consecutive hyphens aren't permitted in container names"), + // regex last for speed + ConfigDef.LambdaValidator.with((name, value) -> { + if (!CONTAINER_NAME_PATTERN.matcher(value.toString()).matches()) { + throw new ConfigException(name, value, + "must start or end with a letter or number, and can contain only lower case letters, numbers, and the hyphen/minus (-) character."); + } + }, () -> "start or end with a letter or number, and can contain only lower case letters, numbers, and the hyphen/minus (-) character")); + + /** + * Construct the Azure Blob ConfigFragment.. + * + * @param dataAccess + * the configuration that this fragment is associated with. + */ + public AzureBlobConfigFragment(final FragmentDataAccess dataAccess) { + super(dataAccess); + } + + /** + * Adds the configuration options for the azure client to the configuration definition. + * + * @param configDef + * the Configuration definition. + * @return the update configuration definition + */ + public static ConfigDef update(final ConfigDef configDef, final boolean isSink) { + addUserAgentConfig(configDef); + addAzureConfigGroup(configDef, isSink); + addAzureRetryPolicies(configDef); + return configDef; + } + + private static void addUserAgentConfig(final ConfigDef configDef) { + configDef.define(AZURE_USER_AGENT, ConfigDef.Type.STRING, USER_AGENT_HEADER_VALUE, ConfigDef.Importance.LOW, + "A custom user agent used while contacting Azure"); + } + + private static void addAzureConfigGroup(final ConfigDef configDef, final boolean isSink) { + int azureGroupCounter = 0; + configDef.define(AZURE_STORAGE_CONNECTION_STRING_CONFIG, ConfigDef.Type.STRING, ConfigDef.NO_DEFAULT_VALUE, + ConfigDef.Importance.HIGH, "Azure Storage connection string.", GROUP_AZURE, ++azureGroupCounter, + ConfigDef.Width.NONE, AZURE_STORAGE_CONNECTION_STRING_CONFIG); + + configDef.define(AZURE_STORAGE_CONTAINER_NAME_CONFIG, ConfigDef.Type.STRING, ConfigDef.NO_DEFAULT_VALUE, + CONTAINER_NAME_VALIDATOR, ConfigDef.Importance.HIGH, + "The Azure Blob container that files will be written to or read from.", GROUP_AZURE, + ++azureGroupCounter, ConfigDef.Width.NONE, AZURE_STORAGE_CONTAINER_NAME_CONFIG); + + configDef.define(AZURE_PREFIX_CONFIG, ConfigDef.Type.STRING, null, new ConfigDef.NonEmptyString(), + ConfigDef.Importance.MEDIUM, + "Prefix for storage file names, generally specifies directory like" + + " structures that do not contain any templated fields.", + GROUP_AZURE, ++azureGroupCounter, ConfigDef.Width.NONE, AZURE_PREFIX_CONFIG); + if (!isSink) { + configDef.define(AZURE_FETCH_PAGE_SIZE, ConfigDef.Type.INT, 10, ConfigDef.Range.atLeast(1), + ConfigDef.Importance.MEDIUM, "Azure fetch page size", GROUP_AZURE, ++azureGroupCounter, + ConfigDef.Width.NONE, AZURE_FETCH_PAGE_SIZE); + + configDef.define(AZURE_FETCH_BUFFER_SIZE, ConfigDef.Type.INT, 1000, 
ConfigDef.Range.atLeast(1), + ConfigDef.Importance.MEDIUM, + "Azure fetch buffer size. This is the number of object keys kept in a buffer to ensure lexically older objet keys aren't skipped for processing if they are slower to upload.", + GROUP_AZURE, ++azureGroupCounter, ConfigDef.Width.NONE, AZURE_FETCH_BUFFER_SIZE); + } + } + + static void addAzureRetryPolicies(final ConfigDef configDef) { + int retryPolicyGroupCounter = 0; + configDef.define(AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG, ConfigDef.Type.LONG, + AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_DEFAULT, ConfigDef.Range.atLeast(0L), ConfigDef.Importance.MEDIUM, + "Initial retry delay in milliseconds.", GROUP_AZURE_RETRY_BACKOFF_POLICY, ++retryPolicyGroupCounter, + ConfigDef.Width.NONE, AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG); + configDef.define(AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG, ConfigDef.Type.LONG, + AZURE_RETRY_BACKOFF_MAX_DELAY_MS_DEFAULT, ConfigDef.Range.atLeast(0L), ConfigDef.Importance.MEDIUM, + "Maximum retry delay in milliseconds.", GROUP_AZURE_RETRY_BACKOFF_POLICY, ++retryPolicyGroupCounter, + ConfigDef.Width.NONE, AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG); + configDef.define(AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_CONFIG, ConfigDef.Type.INT, + AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_DEFAULT, ConfigDef.Range.atLeast(0L), ConfigDef.Importance.MEDIUM, + "Retry max attempts. The default value is " + AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_DEFAULT, + GROUP_AZURE_RETRY_BACKOFF_POLICY, ++retryPolicyGroupCounter, ConfigDef.Width.NONE, + AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_CONFIG); + } + + public int getAzureFetchPageSize() { + return getInt(AZURE_FETCH_PAGE_SIZE); + } + + public String getAzurePrefix() { + return getString(AZURE_PREFIX_CONFIG); + } + + public String getConnectionString() { + return getString(AZURE_STORAGE_CONNECTION_STRING_CONFIG); + } + + public String getContainerName() { + return getString(AZURE_STORAGE_CONTAINER_NAME_CONFIG); + } + + public int getAzureRetryBackoffMaxAttempts() { + return getInt(AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_CONFIG); + } + + public Duration getAzureRetryBackoffInitialDelay() { + return Duration.ofMillis(getLong(AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG)); + } + + public Duration getAzureRetryBackoffMaxDelay() { + return Duration.ofMillis(getLong(AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG)); + } + + public String getUserAgent() { + return getString(AZURE_USER_AGENT); + } + + public int getFetchBufferSize() { + return getInt(AZURE_FETCH_BUFFER_SIZE); + } + + public RetryOptions getAzureRetryOptions() { + return new RetryOptions(new ExponentialBackoffOptions().setMaxRetries(getAzureRetryBackoffMaxAttempts()) + .setBaseDelay(Duration.ofMillis(getAzureRetryBackoffInitialDelay().toMillis())) + .setMaxDelay(Duration.ofMillis(getAzureRetryBackoffMaxDelay().toMillis()))); + } + + /** + * Creates an async Service Client which can be used to create async container and blob clients, which can list and + * download blobs respectively. 
+ * + * @return A configured instance of BlobServiceAsyncClient + */ + public BlobServiceAsyncClient getAzureServiceAsyncClient() { + return new BlobServiceClientBuilder().connectionString(getConnectionString()) + .httpLogOptions(new HttpLogOptions().setLogLevel(HttpLogDetailLevel.BODY_AND_HEADERS)) + .addPolicy(new UserAgentPolicy(getUserAgent())) + .retryOptions(getAzureRetryOptions()) + .buildAsyncClient(); + } + +} diff --git a/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkConfig.java b/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkConfig.java index 5159f2c78..7f78fb8d1 100644 --- a/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkConfig.java +++ b/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkConfig.java @@ -17,49 +17,26 @@ package io.aiven.kafka.connect.azure.sink; import java.time.Duration; -import java.util.ArrayList; -import java.util.HashMap; import java.util.List; import java.util.Map; -import java.util.regex.Pattern; +import java.util.stream.Collectors; import org.apache.kafka.common.config.ConfigDef; -import org.apache.kafka.common.config.ConfigException; -import io.aiven.kafka.connect.common.config.AivenCommonConfig; -import io.aiven.kafka.connect.common.config.CompressionType; +import io.aiven.kafka.connect.common.config.FragmentDataAccess; import io.aiven.kafka.connect.common.config.OutputField; import io.aiven.kafka.connect.common.config.OutputFieldEncodingType; import io.aiven.kafka.connect.common.config.OutputFieldType; +import io.aiven.kafka.connect.common.config.SinkCommonConfig; -import org.slf4j.Logger; -import org.slf4j.LoggerFactory; - -@SuppressWarnings("PMD.UnusedPrivateMethod") -public final class AzureBlobSinkConfig extends AivenCommonConfig { - private static final Logger LOG = LoggerFactory.getLogger(AzureBlobSinkConfig.class); - private static final String USER_AGENT_HEADER_FORMAT = "Azure Blob Sink/%s (GPN: Aiven;)"; - public static final String USER_AGENT_HEADER_VALUE = String.format(USER_AGENT_HEADER_FORMAT, Version.VERSION); - private static final String GROUP_AZURE = "Azure"; +public final class AzureBlobSinkConfig extends SinkCommonConfig { public static final String AZURE_STORAGE_CONNECTION_STRING_CONFIG = "azure.storage.connection.string"; public static final String AZURE_STORAGE_CONTAINER_NAME_CONFIG = "azure.storage.container.name"; - public static final String AZURE_USER_AGENT = "azure.user.agent"; - private static final String GROUP_FILE = "File"; - public static final String FILE_NAME_PREFIX_CONFIG = "file.name.prefix"; - public static final String FILE_NAME_TEMPLATE_CONFIG = "file.name.template"; - public static final String FILE_COMPRESSION_TYPE_CONFIG = "file.compression.type"; - public static final String FILE_MAX_RECORDS = "file.max.records"; - public static final String FILE_NAME_TIMESTAMP_TIMEZONE = "file.name.timestamp.timezone"; - public static final String FILE_NAME_TIMESTAMP_SOURCE = "file.name.timestamp.source"; - - public static final String FORMAT_OUTPUT_FIELDS_CONFIG = "format.output.fields"; - public static final String FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG = "format.output.fields.value.encoding"; - - private static final String GROUP_AZURE_RETRY_BACKOFF_POLICY = "Azure retry backoff policy"; - public static final String AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG = "azure.retry.backoff.initial.delay.ms"; - public static final String AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG = 
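getAzureRetryOptions() and getAzureServiceAsyncClient() above are what tie the azure.retry.backoff.* settings into the Azure SDK client. A hedged sketch of how a caller might use the resulting client to list blob names (the fragment accessors are those declared above; the Azure SDK calls are the standard azure-storage-blob 12.x API, and the blocking collect is only to keep the example short):

    import java.util.List;

    import io.aiven.kafka.connect.azure.sink.AzureBlobConfigFragment;

    import com.azure.storage.blob.BlobServiceAsyncClient;
    import com.azure.storage.blob.models.BlobItem;

    public class AsyncClientSketch {
        static List<String> listBlobNames(final AzureBlobConfigFragment fragment) {
            // Client built with the user agent, log options and retry options from the fragment.
            final BlobServiceAsyncClient client = fragment.getAzureServiceAsyncClient();
            return client.getBlobContainerAsyncClient(fragment.getContainerName())
                    .listBlobs()                 // PagedFlux<BlobItem>
                    .map(BlobItem::getName)
                    .collectList()
                    .block();                    // blocking only for the sake of the sketch
        }
    }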
"azure.retry.backoff.max.delay.ms"; - public static final String AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_CONFIG = "azure.retry.backoff.max.attempts"; + /** + * TODO move this to FileNameFragment and handle it in the grouper code. + */ + public static final String FILE_NAME_PREFIX_CONFIG = "file.name.prefix"; public static final long AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_DEFAULT = 1_000L; public static final long AZURE_RETRY_BACKOFF_MAX_DELAY_MS_DEFAULT = 32_000L; @@ -67,138 +44,34 @@ public final class AzureBlobSinkConfig extends AivenCommonConfig { public static final String NAME_CONFIG = "name"; - public static SinkCommonConfigDef configDef() { - final SinkCommonConfigDef configDef = new SinkCommonConfigDef(OutputFieldType.VALUE, CompressionType.NONE); - addAzureConfigGroup(configDef); - addFileConfigGroup(configDef); - addAzureRetryPolicies(configDef); - addUserAgentConfig(configDef); - return configDef; - } - - private static void addUserAgentConfig(final ConfigDef configDef) { - configDef.define(AZURE_USER_AGENT, ConfigDef.Type.STRING, USER_AGENT_HEADER_VALUE, ConfigDef.Importance.LOW, - "A custom user agent used while contacting Azure"); - } - - private static void addAzureConfigGroup(final ConfigDef configDef) { - int azureGroupCounter = 0; - configDef.define(AZURE_STORAGE_CONNECTION_STRING_CONFIG, ConfigDef.Type.STRING, null, ConfigDef.Importance.HIGH, - "Azure Storage connection string.", GROUP_AZURE, azureGroupCounter++, ConfigDef.Width.NONE, - AZURE_STORAGE_CONNECTION_STRING_CONFIG); - - configDef.define(AZURE_STORAGE_CONTAINER_NAME_CONFIG, ConfigDef.Type.STRING, ConfigDef.NO_DEFAULT_VALUE, - new ConfigDef.NonEmptyString(), ConfigDef.Importance.HIGH, - "The Azure Blob container name to store output files in.", GROUP_AZURE, azureGroupCounter++, // NOPMD - ConfigDef.Width.NONE, AZURE_STORAGE_CONTAINER_NAME_CONFIG); - } - - private static void addAzureRetryPolicies(final ConfigDef configDef) { - int retryPolicyGroupCounter = 0; - configDef.define(AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG, ConfigDef.Type.LONG, - AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_DEFAULT, ConfigDef.Range.atLeast(0L), ConfigDef.Importance.MEDIUM, - "Initial retry delay in milliseconds. The default value is " - + AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_DEFAULT, - GROUP_AZURE_RETRY_BACKOFF_POLICY, retryPolicyGroupCounter++, ConfigDef.Width.NONE, - AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG); - configDef.define(AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG, ConfigDef.Type.LONG, - AZURE_RETRY_BACKOFF_MAX_DELAY_MS_DEFAULT, ConfigDef.Range.atLeast(0L), ConfigDef.Importance.MEDIUM, - "Maximum retry delay in milliseconds. The default value is " + AZURE_RETRY_BACKOFF_MAX_DELAY_MS_DEFAULT, - GROUP_AZURE_RETRY_BACKOFF_POLICY, retryPolicyGroupCounter++, ConfigDef.Width.NONE, - AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG); - configDef.define(AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_CONFIG, ConfigDef.Type.INT, - AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_DEFAULT, ConfigDef.Range.atLeast(0L), ConfigDef.Importance.MEDIUM, - "Retry max attempts. 
The default value is " + AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_DEFAULT, - GROUP_AZURE_RETRY_BACKOFF_POLICY, retryPolicyGroupCounter++, ConfigDef.Width.NONE, // NOPMD - // retryPolicyGroupCounter - // updated value - // never - // used - AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_CONFIG); - } + private final AzureBlobConfigFragment azureFragment; - private static void addFileConfigGroup(final ConfigDef configDef) { - configDef.define(FILE_NAME_PREFIX_CONFIG, ConfigDef.Type.STRING, "", new ConfigDef.Validator() { - @Override - public void ensureValid(final String name, final Object value) { - assert value instanceof String; - final String valueStr = (String) value; - if (valueStr.length() > 1024) { // NOPMD avoid literal - throw new ConfigException(AZURE_STORAGE_CONTAINER_NAME_CONFIG, value, - "cannot be longer than 1024 characters"); - } - } - }, ConfigDef.Importance.MEDIUM, "The prefix to be added to the name of each file put on Azure Blob.", - GROUP_FILE, 50, ConfigDef.Width.NONE, FILE_NAME_PREFIX_CONFIG); + public static ConfigDef configDef() { + return new AzureBlobSinkConfigDef(); } public AzureBlobSinkConfig(final Map properties) { - super(configDef(), handleDeprecatedYyyyUppercase(properties)); - validate(); - } - - static Map handleDeprecatedYyyyUppercase(final Map properties) { - if (properties.containsKey(FILE_NAME_TEMPLATE_CONFIG)) { - final var result = new HashMap<>(properties); - - String template = properties.get(FILE_NAME_TEMPLATE_CONFIG); - final String originalTemplate = template; - - final var unitYyyyPattern = Pattern.compile("\\{\\{\\s*timestamp\\s*:\\s*unit\\s*=\\s*YYYY\\s*}}"); - template = unitYyyyPattern.matcher(template) - .replaceAll(matchResult -> matchResult.group().replace("YYYY", "yyyy")); - - if (!template.equals(originalTemplate)) { - LOG.warn( - "{{timestamp:unit=YYYY}} is no longer supported, " - + "please use {{timestamp:unit=yyyy}} instead. 
" + "It was automatically replaced: {}", - template); - } - - result.put(FILE_NAME_TEMPLATE_CONFIG, template); - - return result; - } else { - return properties; - } - } - - private void validate() { - final String connectionString = getString(AZURE_STORAGE_CONNECTION_STRING_CONFIG); - - if (connectionString == null) { - throw new ConfigException( - String.format("The configuration %s cannot be null.", AZURE_STORAGE_CONNECTION_STRING_CONFIG)); - } + super(new AzureBlobSinkConfigDef(), properties); + final FragmentDataAccess dataAccess = FragmentDataAccess.from(this); + azureFragment = new AzureBlobConfigFragment(dataAccess); } public String getConnectionString() { - return getString(AZURE_STORAGE_CONNECTION_STRING_CONFIG); + return azureFragment.getConnectionString(); } public String getContainerName() { return getString(AZURE_STORAGE_CONTAINER_NAME_CONFIG); } - @Override - public CompressionType getCompressionType() { - return CompressionType.forName(getString(FILE_COMPRESSION_TYPE_CONFIG)); - } - @Override public List getOutputFields() { - final List result = new ArrayList<>(); - for (final String outputFieldTypeStr : getList(FORMAT_OUTPUT_FIELDS_CONFIG)) { - final OutputFieldType fieldType = OutputFieldType.forName(outputFieldTypeStr); - final OutputFieldEncodingType encodingType; - if (fieldType == OutputFieldType.VALUE) { - encodingType = OutputFieldEncodingType.forName(getString(FORMAT_OUTPUT_FIELDS_VALUE_ENCODING_CONFIG)); - } else { - encodingType = OutputFieldEncodingType.NONE; - } - result.add(new OutputField(fieldType, encodingType)); - } - return result; + return outputFormatFragment.getOutputFieldTypes() + .stream() + .map(fieldType -> fieldType == OutputFieldType.VALUE + ? new OutputField(fieldType, outputFormatFragment.getOutputFieldEncodingType()) + : new OutputField(fieldType, OutputFieldEncodingType.NONE)) + .collect(Collectors.toList()); } public String getPrefix() { @@ -210,18 +83,18 @@ public String getConnectorName() { } public int getAzureRetryBackoffMaxAttempts() { - return getInt(AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_CONFIG); + return azureFragment.getAzureRetryBackoffMaxAttempts(); } public Duration getAzureRetryBackoffInitialDelay() { - return Duration.ofMillis(getLong(AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG)); + return azureFragment.getAzureRetryBackoffInitialDelay(); } public Duration getAzureRetryBackoffMaxDelay() { - return Duration.ofMillis(getLong(AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG)); + return azureFragment.getAzureRetryBackoffMaxDelay(); } public String getUserAgent() { - return getString(AZURE_USER_AGENT); + return azureFragment.getUserAgent(); } } diff --git a/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkConfigDef.java b/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkConfigDef.java index 27971a281..b9f2db4d4 100644 --- a/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkConfigDef.java +++ b/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkConfigDef.java @@ -16,15 +16,81 @@ package io.aiven.kafka.connect.azure.sink; -import java.util.List; import java.util.Map; +import java.util.regex.Pattern; import org.apache.kafka.common.config.ConfigDef; +import org.apache.kafka.common.config.ConfigException; import org.apache.kafka.common.config.ConfigValue; -public class AzureBlobSinkConfigDef extends ConfigDef { +import io.aiven.kafka.connect.common.config.CompressionType; +import 
io.aiven.kafka.connect.common.config.FileNameFragment; +import io.aiven.kafka.connect.common.config.FragmentDataAccess; +import io.aiven.kafka.connect.common.config.OutputFieldType; +import io.aiven.kafka.connect.common.config.SinkCommonConfig; + +public final class AzureBlobSinkConfigDef extends SinkCommonConfig.SinkCommonConfigDef { + + private final static Pattern CONTAINER_NAME_PATTERN = Pattern.compile("[0-9a-z][0-9a-z\\-]+[0-9a-z]"); + + /** + * From Azure documentation: + *
    + *
+ * <ul>
+ * <li>Container names must start or end with a letter or number, and can contain only letters, numbers, and the
+ * hyphen/minus (-) character.</li>
+ * <li>Every hyphen/minus (-) character must be immediately preceded and followed by a letter or number; consecutive
+ * hyphens aren't permitted in container names.</li>
+ * <li>All letters in a container name must be lowercase.</li>
+ * <li>Container names must be from 3 through 63 characters long.</li>
+ * </ul>
+ */ + public static final ConfigDef.Validator CONTAINER_NAME_VALIDATOR = ConfigDef.CompositeValidator + .of(ConfigDef.LambdaValidator.with((name, value) -> { + final int len = value == null ? 0 : value.toString().length(); + if (len < 3 || len > 63) { + throw new ConfigException(name, value, "names must be from 3 through 63 characters long."); + } + }, () -> "must be from 3 through 63 characters long"), ConfigDef.LambdaValidator.with((name, value) -> { + if (value.toString().contains("--")) { + throw new ConfigException(name, value, + "Every hyphen/minus (-) character must be immediately preceded and followed by a letter or number; consecutive hyphens aren't permitted in container names."); + } + }, () -> "consecutive hyphens aren't permitted in container names"), + // regex last for speed + ConfigDef.LambdaValidator.with((name, value) -> { + if (!CONTAINER_NAME_PATTERN.matcher(value.toString()).matches()) { + throw new ConfigException(name, value, + "must start or end with a letter or number, and can contain only lower case letters, numbers, and the hyphen/minus (-) character."); + } + }, () -> "start or end with a letter or number, and can contain only lower case letters, numbers, and the hyphen/minus (-) character")); + + AzureBlobSinkConfigDef() { + super(OutputFieldType.VALUE, CompressionType.NONE); + AzureBlobConfigFragment.update(this, true); + addFileConfigGroup(this); + } + + static void addFileConfigGroup(final ConfigDef configDef) { + + configDef.define(AzureBlobSinkConfig.FILE_NAME_PREFIX_CONFIG, ConfigDef.Type.STRING, "", + ConfigDef.LambdaValidator.with((name, value) -> { + assert value instanceof String; + final String valueStr = (String) value; + if (valueStr.length() > 1024) { // NOPMD avoid literal + throw new ConfigException(AzureBlobSinkConfig.AZURE_STORAGE_CONTAINER_NAME_CONFIG, value, + "cannot be longer than 1024 characters"); + } + }, () -> ""), ConfigDef.Importance.MEDIUM, + "The prefix to be added to the name of each file put on Azure Blob.", FileNameFragment.GROUP_NAME, 10, + ConfigDef.Width.NONE, AzureBlobSinkConfig.FILE_NAME_PREFIX_CONFIG); + + } + @Override - public List validate(final Map props) { - return super.validate(AzureBlobSinkConfig.handleDeprecatedYyyyUppercase(props)); + public Map multiValidate(final Map valueMap) { + final Map result = super.multiValidate(valueMap); + final FragmentDataAccess dataAccess = FragmentDataAccess.from(result); + new AzureBlobConfigFragment(dataAccess).validate(result); + return result; } } diff --git a/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkConnector.java b/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkConnector.java index 7fcd4ce93..538465408 100644 --- a/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkConnector.java +++ b/azure-sink-connector/src/main/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkConnector.java @@ -49,8 +49,8 @@ public String version() { @Override public void start(final Map props) { Objects.requireNonNull(props, "props cannot be null"); - this.configProps = Collections.unmodifiableMap(props); + AzureBlobSinkConfig.configDef().validate(props); this.config = new AzureBlobSinkConfig(props); LOG.info("Starting connector {}", config.getConnectorName()); } diff --git a/azure-sink-connector/src/templates/configData.md.vm b/azure-sink-connector/src/templates/configData.md.vm new file mode 100644 index 000000000..65f05c9c4 --- /dev/null +++ 
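CONTAINER_NAME_VALIDATOR above encodes the documented Azure naming rules as a composite of three checks (length, consecutive hyphens, character set and case). A small sketch of the behaviour those rules imply, assuming the constant remains public as declared in AzureBlobSinkConfigDef:

    import org.apache.kafka.common.config.ConfigDef;
    import org.apache.kafka.common.config.ConfigException;

    import io.aiven.kafka.connect.azure.sink.AzureBlobSinkConfigDef;

    public class ContainerNameValidatorSketch {
        public static void main(final String[] args) {
            final ConfigDef.Validator validator = AzureBlobSinkConfigDef.CONTAINER_NAME_VALIDATOR;

            // Valid: lower case letters, digits and single hyphens, 3 through 63 characters.
            validator.ensureValid("azure.storage.container.name", "my-container-1");

            // Each of these breaks one documented rule: "ab" is too short, "my--container"
            // has consecutive hyphens, "My-Container" contains upper case letters.
            for (final String bad : new String[] { "ab", "my--container", "My-Container" }) {
                try {
                    validator.ensureValid("azure.storage.container.name", bad);
                } catch (final ConfigException expected) {
                    // expected: the validator rejects every name that violates a rule
                }
            }
        }
    }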
b/azure-sink-connector/src/templates/configData.md.vm @@ -0,0 +1,15 @@ + +# Azure Blob Sink Configuration + +The complete Azure Blob source configuration file + +#foreach ($section in $sections) +${esc.hash}${esc.hash} ${section.displayName} + - Default value: ${section.getDefaultValue()|"none"} + - Type: $section.type + - Valid values: ${section.validator|"no restrictions"} + - Importance: $section.importance + + $section.documentation + +#end \ No newline at end of file diff --git a/azure-sink-connector/src/templates/configData.yml.vm b/azure-sink-connector/src/templates/configData.yml.vm new file mode 100644 index 000000000..5c3803439 --- /dev/null +++ b/azure-sink-connector/src/templates/configData.yml.vm @@ -0,0 +1,10 @@ +AzureBlobSinkConfigDef: +#foreach ($section in $sections) +- + name: ${section.displayName} + documentation: $section.documentation + type: $section.type + default: ${section.getDefaultValue()|"none"} + validValues: ${section.validator|"no restrictions"} + importance: $section.importance +#end \ No newline at end of file diff --git a/azure-sink-connector/src/test/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkTaskTest.java b/azure-sink-connector/src/test/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkTaskTest.java index dc463ac5b..86d31ebbb 100644 --- a/azure-sink-connector/src/test/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkTaskTest.java +++ b/azure-sink-connector/src/test/java/io/aiven/kafka/connect/azure/sink/AzureBlobSinkTaskTest.java @@ -40,6 +40,7 @@ import io.aiven.kafka.connect.azure.sink.testutils.AzureBlobAccessor; import io.aiven.kafka.connect.common.config.CompressionType; +import io.aiven.kafka.connect.common.config.FileNameFragment; import com.azure.core.http.rest.PagedIterable; import com.azure.storage.blob.BlobClient; @@ -118,7 +119,7 @@ void basic(final String compression) { final List blobItems = generateTestBlobItems(compression); when(pagedIterable.spliterator()).thenReturn(blobItems.spliterator()); when(blobContainerClient.listBlobs()).thenReturn(pagedIterable); - properties.put(AzureBlobSinkConfig.FILE_COMPRESSION_TYPE_CONFIG, compression); + FileNameFragment.setter(properties).fileCompression(CompressionType.forName(compression)); task = new AzureBlobSinkTask(properties, blobServiceClient); final List records = createBasicRecords(); diff --git a/azure-sink-connector/src/test/java/io/aiven/kafka/connect/azure/sink/config/AzureSinkConfigTest.java b/azure-sink-connector/src/test/java/io/aiven/kafka/connect/azure/sink/config/AzureSinkConfigTest.java index 17fca719f..2afea2b54 100644 --- a/azure-sink-connector/src/test/java/io/aiven/kafka/connect/azure/sink/config/AzureSinkConfigTest.java +++ b/azure-sink-connector/src/test/java/io/aiven/kafka/connect/azure/sink/config/AzureSinkConfigTest.java @@ -23,8 +23,11 @@ import java.time.Duration; import java.time.ZoneId; import java.time.ZoneOffset; +import java.util.ArrayList; import java.util.HashMap; +import java.util.List; import java.util.Map; +import java.util.Optional; import java.util.stream.Collectors; import java.util.stream.Stream; @@ -33,6 +36,7 @@ import io.aiven.kafka.connect.azure.sink.AzureBlobSinkConfig; import io.aiven.kafka.connect.common.config.CompressionType; +import io.aiven.kafka.connect.common.config.FileNameFragment; import io.aiven.kafka.connect.common.config.FormatType; import io.aiven.kafka.connect.common.config.OutputField; import io.aiven.kafka.connect.common.config.OutputFieldEncodingType; @@ -41,6 +45,7 @@ import 
io.aiven.kafka.connect.common.templating.Template; import io.aiven.kafka.connect.common.templating.VariableTemplatePart; +import org.junit.jupiter.api.Disabled; import org.junit.jupiter.api.Test; import org.junit.jupiter.params.ParameterizedTest; import org.junit.jupiter.params.provider.NullSource; @@ -60,18 +65,18 @@ final class AzureSinkConfigTest { "{{topic}}-{{partition}}-{{start_offset}}-{{unknown}}" }) void incorrectFilenameTemplates(final String template) { final Map properties = Map.of("file.name.template", template, "azure.storage.container.name", - "some-container"); + "some-container", "azure.storage.connection.string", "somestring"); final ConfigValue configValue = AzureBlobSinkConfig.configDef() .validate(properties) .stream() - .filter(x -> AzureBlobSinkConfig.FILE_NAME_TEMPLATE_CONFIG.equals(x.name())) + .filter(x -> FileNameFragment.FILE_NAME_TEMPLATE_CONFIG.equals(x.name())) .findFirst() .orElseThrow(); assertThat(configValue.errorMessages()).isNotEmpty(); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - .hasMessageStartingWith("There are errors in the configuration:\n" + "Invalid value "); + .hasMessageContaining("for configuration file.name.template: "); } @Test @@ -97,26 +102,30 @@ void acceptMultipleParametersWithTheSameName() { void requiredConfigurations() { final Map properties = Map.of(); - final var expectedErrorMessage = "Missing required configuration \"azure.storage.container.name\" which has no default value."; + final String[] expectedErrorMessage = { + "Missing required configuration \"azure.storage.container.name\" which has no default value.", + "Missing required configuration \"azure.storage.connection.string\" which has no default value.", + "Invalid value null for configuration azure.storage.container.name: names must be from 3 through 63 characters long." 
}; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "azure.storage.container.name", - expectedErrorMessage); + assertValidationContainsMessage(properties, "azure.storage.container.name", expectedErrorMessage); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - .hasMessage(expectedErrorMessage); + .hasMessageContaining( + "Missing required configuration \"azure.storage.connection.string\" which has no default value."); } @Test void emptyAzureContainerName() { final Map properties = Map.of("azure.storage.container.name", ""); - final var expectedErrorMessage = "Invalid value for configuration azure.storage.container.name: String must be non-empty"; + final var expectedErrorMessage = "Missing required configuration \"azure.storage.connection.string\" which has no default value."; + final var expectedErrorMessage2 = "Invalid value for configuration azure.storage.container.name: names must be from 3 through 63 characters long."; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "azure.storage.container.name", - expectedErrorMessage); + assertValidationContainsMessage(properties, "azure.storage.container.name", expectedErrorMessage, + expectedErrorMessage2); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - .hasMessage(expectedErrorMessage); + .hasMessageContainingAll(expectedErrorMessage); } @Test @@ -228,12 +237,11 @@ void unsupportedCompressionType() { final var expectedErrorMessage = "Invalid value unsupported for configuration file.compression.type: " + "String must be one of (case insensitive): ZSTD, GZIP, NONE, SNAPPY"; - final var configValue = expectErrorMessageForConfigurationInConfigDefValidation(properties, - "file.compression.type", expectedErrorMessage); + final var configValue = AzureBlobSinkConfig.configDef().validateAll(properties).get("file.compression.type"); assertThat(configValue.recommendedValues()).containsExactly("none", "gzip", "snappy", "zstd"); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - .hasMessageContaining(expectedErrorMessage); + .hasMessage(expectedErrorMessage); } @Test @@ -243,8 +251,8 @@ void emptyOutputField() { final var expectedErrorMessage = "Invalid value [] for configuration format.output.fields: cannot be empty"; - final var configValue = expectErrorMessageForConfigurationInConfigDefValidation(properties, - "format.output.fields", expectedErrorMessage); + final var configValue = assertValidationContainsMessage(properties, "format.output.fields", + expectedErrorMessage); assertThat(configValue.recommendedValues()).containsExactly("key", "value", "offset", "timestamp", "headers"); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) @@ -261,12 +269,12 @@ void unsupportedOutputField() { + "for configuration format.output.fields: " + "supported values are (case insensitive): key, value, offset, timestamp, headers"; - final var configValue = expectErrorMessageForConfigurationInConfigDefValidation(properties, - "format.output.fields", expectedErrorMessage); + final var configValue = assertValidationContainsMessage(properties, "format.output.fields", + expectedErrorMessage); assertThat(configValue.recommendedValues()).containsExactly("key", "value", "offset", "timestamp", "headers"); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - 
.hasMessageContaining(expectedErrorMessage); + .hasMessage(expectedErrorMessage); } @Test @@ -281,6 +289,7 @@ void connectorName() { } @Test + @Disabled("need validation of entire fname not just the prefix.") void fileNamePrefixTooLong() { final Map properties = new HashMap<>(); properties.put("azure.storage.container.name", "test-container"); @@ -290,7 +299,7 @@ void fileNamePrefixTooLong() { final var expectedErrorMessage = "Invalid value " + longString + " for configuration azure.storage.container.name: " + "cannot be longer than 1024 characters"; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.prefix", expectedErrorMessage); + assertValidationContainsMessage(properties, "file.name.prefix", expectedErrorMessage); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) .hasMessage(expectedErrorMessage); @@ -321,15 +330,14 @@ void maxRecordsPerFileSetCorrect() { @Test void maxRecordsPerFileSetIncorrect() { final Map properties = Map.of("azure.storage.container.name", "test-container", - "file.max.records", "-42"); + "file.max.records", "-42", AzureBlobSinkConfig.AZURE_STORAGE_CONNECTION_STRING_CONFIG, "test"); - final var expectedErrorMessage = "Invalid value -42 for configuration file.max.records: " - + "Value must be at least 0"; + final var expectedErrorMessage = "Invalid value -42 for configuration file.max.records: Value must be at least 0"; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.max.records", expectedErrorMessage); + assertValidationContainsMessage(properties, "file.max.records", expectedErrorMessage); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - .hasMessageContaining(expectedErrorMessage); + .hasMessage(expectedErrorMessage); } @ParameterizedTest @@ -437,10 +445,8 @@ void emptyFilenameTemplate() { final var expectedErrorMessage = "Invalid value for configuration file.name.template: RecordGrouper requires that the template [] has variables defined. 
Supported variables are: " + TEMPLATE_VARIABLES + "."; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", expectedErrorMessage); + assertValidationContainsMessage(properties, "file.name.template", expectedErrorMessage); - assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - .hasMessageContaining(expectedErrorMessage); } @Test @@ -449,18 +455,19 @@ void filenameTemplateUnknownVariable() { "azure.storage.connection.string", "test", "file.name.template", "{{ aaa }}{{ topic }}{{ partition }}{{ start_offset }}"); - final String errMsg1 = "Invalid value {{ aaa }}{{ topic }}{{ partition }}{{ start_offset }} for configuration " - + "file.name.template: unsupported template variable used ({{aaa}}), supported values are: {{key}}, {{partition}}, " - + "{{start_offset}}, {{timestamp}}, {{topic}}."; + final String errorPfx = "Invalid value {{ aaa }}{{ topic }}{{ partition }}{{ start_offset }} " + + "for configuration file.name.template: "; - final String errMsg2 = "Invalid value {{ aaa }}{{ topic }}{{ partition }}{{ start_offset }} for configuration " - + "file.name.template: unsupported set of template variables, supported sets are: topic,partition,start_offset,timestamp; " - + "topic,partition,key,start_offset,timestamp; key; key,topic,partition."; + final var expectedErrorMessage1 = errorPfx + "unsupported template variable used ({{aaa}}), " + + "supported values are: {{key}}, {{partition}}, {{start_offset}}, {{timestamp}}, {{topic}}."; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", errMsg1, errMsg2); + final var expectedErrorMessage2 = errorPfx + "unsupported set of template variables, supported sets are: " + + TEMPLATE_VARIABLES + "."; + + assertValidationContainsMessage(properties, "file.name.template", expectedErrorMessage1, expectedErrorMessage2); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - .hasMessageContaining(errMsg1, errMsg2); + .hasMessageContaining(expectedErrorMessage1, expectedErrorMessage2); } @Test @@ -471,10 +478,7 @@ void filenameTemplateNoTopic() { final var expectedErrorMessage = "Invalid value {{ partition }}{{ start_offset }} for configuration file.name.template: " + "unsupported set of template variables, supported sets are: " + TEMPLATE_VARIABLES + "."; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", expectedErrorMessage); - - assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - .hasMessageContaining(expectedErrorMessage); + assertValidationContainsMessage(properties, "file.name.template", expectedErrorMessage); } @Test @@ -483,11 +487,10 @@ void wrongVariableParameterValue() { "azure.storage.connection.string", "test", "file.name.template", "{{start_offset:padding=FALSE}}-{{partition}}-{{topic}}"); - final var expectedErrorMessage = "Invalid value {{start_offset:padding=FALSE}}-{{partition}}-{{topic}} for " - + "configuration file.name.template: FALSE is not a valid value for parameter padding, " - + "supported values are: true|false."; + final var expectedErrorMessage = "Invalid value {{start_offset:padding=FALSE}}-{{partition}}-{{topic}} " + + "for configuration file.name.template: FALSE is not a valid value for parameter padding, supported values are: true|false."; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", expectedErrorMessage); + 
assertValidationContainsMessage(properties, "file.name.template", expectedErrorMessage); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) .hasMessageContaining(expectedErrorMessage); @@ -503,7 +506,7 @@ void variableWithoutRequiredParameterValue() { + "for configuration file.name.template: parameter unit is required for the the variable timestamp, " + "supported values are: yyyy|MM|dd|HH."; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", expectedErrorMessage); + assertValidationContainsMessage(properties, "file.name.template", expectedErrorMessage); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) .hasMessageContaining(expectedErrorMessage); @@ -518,7 +521,8 @@ void wrongVariableWithoutParameter() { final var expectedErrorMessage = "Invalid value {{start_offset:}}-{{partition}}-{{topic}} " + "for configuration file.name.template: Wrong variable with parameter definition"; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", expectedErrorMessage); + // expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", + // expectedErrorMessage); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) .hasMessage(expectedErrorMessage); @@ -533,7 +537,8 @@ void noVariableWithParameter() { final var expectedErrorMessage = "Invalid value {{:padding=true}}-{{partition}}-{{topic}} " + "for configuration file.name.template: Variable name hasn't been set for template: {{:padding=true}}-{{partition}}-{{topic}}"; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", expectedErrorMessage); + // expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", + // expectedErrorMessage); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) .hasMessage(expectedErrorMessage); @@ -548,7 +553,7 @@ void wrongVariableWithoutParameterValue() { final var expectedErrorMessage = "Invalid value {{start_offset:padding=}}-{{partition}}-{{topic}} " + "for configuration file.name.template: Parameter value for variable `start_offset` and parameter `padding` has not been set"; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", expectedErrorMessage); + assertValidationContainsMessage(properties, "file.name.template", expectedErrorMessage); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) .hasMessage(expectedErrorMessage); @@ -563,8 +568,6 @@ void wrongVariableWithoutParameterName() { final var expectedErrorMessage = "Invalid value {{start_offset:=true}}-{{partition}}-{{topic}} " + "for configuration file.name.template: Parameter name for variable `start_offset` has not been set"; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", expectedErrorMessage); - assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) .hasMessage(expectedErrorMessage); } @@ -577,7 +580,7 @@ void filenameTemplateNoPartition() { final var expectedErrorMessage = "Invalid value {{ topic }}{{ start_offset }} for configuration file.name.template: " + "unsupported set of template variables, supported sets are: " + TEMPLATE_VARIABLES + "."; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", 
expectedErrorMessage); + assertValidationContainsMessage(properties, "file.name.template", expectedErrorMessage); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) .hasMessageContaining(expectedErrorMessage); @@ -591,7 +594,7 @@ void filenameTemplateNoStartOffset() { final var expectedErrorMessage = "Invalid value {{ topic }}{{ partition }} for configuration file.name.template: " + "unsupported set of template variables, supported sets are: " + TEMPLATE_VARIABLES + "."; - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", expectedErrorMessage); + assertValidationContainsMessage(properties, "file.name.template", expectedErrorMessage); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) .hasMessageContaining(expectedErrorMessage); @@ -620,13 +623,9 @@ void keyFilenameTemplateAndLimitedRecordsPerFileMoreThan1() { final Map properties = Map.of("azure.storage.container.name", "test-container", "azure.storage.connection.string", "test", "file.name.template", "{{key}}", "file.max.records", "42"); - final var expectedErrorMessage = "Invalid value 42 for configuration file.max.records: " - + "When file.name.template is {{key}}, file.max.records must be either 1 or not set."; - - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.max.records", expectedErrorMessage); + final String expectedErrorMessage = "Invalid value 42 for configuration file.max.records: When file.name.template is {{key}}, file.max.records must be either 1 or not set."; - assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - .hasMessageContaining(expectedErrorMessage); + assertValidationContainsMessage(properties, "file.max.records", expectedErrorMessage); } @Test @@ -657,14 +656,11 @@ void wrongFilenameTimestampSource() { "azure.storage.connection.string", "test", "file.name.timestamp.timezone", "Europe/Berlin", "file.name.timestamp.source", "UNKNOWN_TIMESTAMP_SOURCE"); - final var expectedErrorMessage = "Invalid value UNKNOWN_TIMESTAMP_SOURCE for configuration file.name.timestamp.source: " - + "String must be one of (case insensitive): EVENT, WALLCLOCK"; - - expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.timestamp.source", - expectedErrorMessage); + final var expectedErrorMessage = "Invalid value UNKNOWN_TIMESTAMP_SOURCE for configuration " + + "file.name.timestamp.source: String must be one of (case insensitive): EVENT, WALLCLOCK"; assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - .hasMessageContaining(expectedErrorMessage); + .hasMessage(expectedErrorMessage); } @Test @@ -702,24 +698,27 @@ void wrongFormatTypeConfig() { final var expectedErrorMessage = "Invalid value unknown for configuration format.output.type: " + "String must be one of (case insensitive): PARQUET, CSV, JSON, AVRO, JSONL"; - final var configValue = expectErrorMessageForConfigurationInConfigDefValidation(properties, - "format.output.type", expectedErrorMessage); + final var configValue = assertValidationContainsMessage(properties, "format.output.type", expectedErrorMessage); + assertThat(configValue.recommendedValues()).containsExactly("avro", "csv", "json", "jsonl", "parquet"); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - .hasMessageContaining(expectedErrorMessage); + .hasMessage(expectedErrorMessage); } @ParameterizedTest 
@ValueSource(strings = { "{{key}}", "{{topic}}/{{partition}}/{{key}}" }) void notSupportedFileMaxRecords(final String fileNameTemplate) { - final Map properties = Map.of(AzureBlobSinkConfig.FILE_NAME_TEMPLATE_CONFIG, fileNameTemplate, - AzureBlobSinkConfig.FILE_MAX_RECORDS, "2", AzureBlobSinkConfig.AZURE_STORAGE_CONTAINER_NAME_CONFIG, - "any_container"); - assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) - .hasMessageContaining( - String.format("When file.name.template is %s, file.max.records must be either 1 or not set", - fileNameTemplate)); + final Map properties = new HashMap<>(); + FileNameFragment.setter(properties).template(fileNameTemplate).maxRecordsPerFile(2); + properties.put(AzureBlobSinkConfig.AZURE_STORAGE_CONTAINER_NAME_CONFIG, "any-container"); + properties.put(AzureBlobSinkConfig.AZURE_STORAGE_CONNECTION_STRING_CONFIG, "test"); + + final String expectedErrorMessage = String.format( + "Invalid value 2 for configuration file.max.records: When file.name.template is %s, file.max.records must be either 1 or not set.", + fileNameTemplate); + + assertValidationContainsMessage(properties, "file.max.records", expectedErrorMessage); } private void assertConfigDefValidationPasses(final Map properties) { @@ -728,18 +727,18 @@ private void assertConfigDefValidationPasses(final Map propertie } } - private ConfigValue expectErrorMessageForConfigurationInConfigDefValidation(final Map properties, + private ConfigValue assertValidationContainsMessage(final Map properties, final String configuration, final String... expectedErrorMessages) { - ConfigValue result = null; - for (final ConfigValue configValue : AzureBlobSinkConfig.configDef().validate(properties)) { - if (configValue.name().equals(configuration)) { - assertThat(configValue.errorMessages()).containsExactlyInAnyOrder(expectedErrorMessages); - result = configValue; - } else { - assertThat(configValue.errorMessages()).isEmpty(); - } - } - assertThat(result).withFailMessage("Config value not found").isNotNull(); - return result; + + final List errorMsgs = new ArrayList<>(); + final List configValues = AzureBlobSinkConfig.configDef().validate(properties); + configValues.stream().map(ConfigValue::errorMessages).forEach(errorMsgs::addAll); + assertThat(errorMsgs).containsExactlyInAnyOrder(expectedErrorMessages); + + final Optional result = configValues.stream() + .filter(cv -> cv.name().equals(configuration)) + .findAny(); + assertThat(result).withFailMessage("Config value not found").isNotEmpty(); + return result.get(); } } diff --git a/azure-source-connector/build.gradle.kts b/azure-source-connector/build.gradle.kts index b766eab46..6b6b44a49 100644 --- a/azure-source-connector/build.gradle.kts +++ b/azure-source-connector/build.gradle.kts @@ -59,8 +59,8 @@ dependencies { compileOnly("org.apache.velocity:velocity-engine-core:2.4.1") compileOnly("org.apache.velocity.tools:velocity-tools-generic:3.1") - implementation(apache.commons.io) - implementation(apache.commons.lang3) + implementation("commons-io:commons-io:2.18.0") + implementation("org.apache.commons:commons-lang3:3.17.0") implementation(project(":commons")) implementation(apache.commons.collection4) implementation("com.azure:azure-storage-blob:12.30.0") @@ -176,7 +176,7 @@ publishing { licenses { license { name = "Apache 2.0" - url = "https://www.apache.org/licenses/LICENSE-2.0" + url = "http://www.apache.org/licenses/LICENSE-2.0" distribution = "repo" } } diff --git 
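The assertValidationContainsMessage helper above asserts against the full set of error messages returned by configDef().validate(...), not only the messages attached to a single key. Roughly the same aggregation can be written inline; a sketch whose property values mirror the maxRecordsPerFileSetIncorrect test above:

    import java.util.List;
    import java.util.Map;
    import java.util.stream.Collectors;

    import org.apache.kafka.common.config.ConfigValue;

    import io.aiven.kafka.connect.azure.sink.AzureBlobSinkConfig;

    public class ValidationMessagesSketch {
        static List<String> allErrorMessages() {
            // Expected, per the test above: a single message saying that
            // file.max.records must be at least 0.
            return AzureBlobSinkConfig.configDef()
                    .validate(Map.of("azure.storage.container.name", "test-container",
                            "azure.storage.connection.string", "test",
                            "file.max.records", "-42"))
                    .stream()
                    .map(ConfigValue::errorMessages)
                    .flatMap(List::stream)
                    .collect(Collectors.toList());
        }
    }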
a/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/AzureBlobSourceConnector.java b/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/AzureBlobSourceConnector.java index 82ef42c16..97876c4ab 100644 --- a/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/AzureBlobSourceConnector.java +++ b/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/AzureBlobSourceConnector.java @@ -28,7 +28,7 @@ import org.apache.kafka.connect.connector.Task; import org.apache.kafka.connect.source.SourceConnector; -import io.aiven.kafka.connect.azure.source.config.AzureBlobSourceConfig; +import io.aiven.kafka.connect.azure.source.config.AzureBlobSourceConfigDef; import io.aiven.kafka.connect.azure.source.utils.VersionInfo; import org.slf4j.Logger; @@ -46,7 +46,7 @@ public class AzureBlobSourceConnector extends SourceConnector { @Override public ConfigDef config() { - return AzureBlobSourceConfig.configDef(); + return new AzureBlobSourceConfigDef(); } @Override diff --git a/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobConfigFragment.java b/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobConfigFragment.java index 9973832bc..6509cab67 100644 --- a/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobConfigFragment.java +++ b/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobConfigFragment.java @@ -17,8 +17,8 @@ package io.aiven.kafka.connect.azure.source.config; import java.time.Duration; +import java.util.regex.Pattern; -import org.apache.kafka.common.config.AbstractConfig; import org.apache.kafka.common.config.ConfigDef; import org.apache.kafka.common.config.ConfigException; @@ -33,6 +33,7 @@ import com.azure.core.http.policy.UserAgentPolicy; import com.azure.storage.blob.BlobServiceAsyncClient; import com.azure.storage.blob.BlobServiceClientBuilder; + /** * The configuration fragment that defines the Azure specific characteristics. */ @@ -58,14 +59,47 @@ public class AzureBlobConfigFragment extends ConfigFragment { public static final long AZURE_RETRY_BACKOFF_MAX_DELAY_MS_DEFAULT = 32_000L; public static final int AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_DEFAULT = 6; + private final static Pattern CONTAINER_NAME_PATTERN = Pattern.compile("[0-9a-z][0-9a-z\\-]+[0-9a-z]"); + + /** + * From Azure documentation: + *
+ * <ul>
+ * <li>Container names must start or end with a letter or number, and can contain only letters, numbers, and the
+ * hyphen/minus (-) character.</li>
+ * <li>Every hyphen/minus (-) character must be immediately preceded and followed by a letter or number; consecutive
+ * hyphens aren't permitted in container names.</li>
+ * <li>All letters in a container name must be lowercase.</li>
+ * <li>Container names must be from 3 through 63 characters long.</li>
+ * </ul>
+ */ + private static final ConfigDef.Validator CONTAINER_NAME_VALIDATOR = ConfigDef.CompositeValidator + .of(ConfigDef.LambdaValidator.with((name, value) -> { + final int len = value == null ? 0 : value.toString().length(); + if (len < 3 || len > 63) { + throw new ConfigException(name, value, "names must be from 3 through 63 characters long."); + } + }, () -> "must be from 3 through 63 characters long"), ConfigDef.LambdaValidator.with((name, value) -> { + if (value.toString().contains("--")) { + throw new ConfigException(name, value, + "Every hyphen/minus (-) character must be immediately preceded and followed by a letter or number; consecutive hyphens aren't permitted in container names."); + } + }, () -> "consecutive hyphens aren't permitted in container names"), + // regex last for speed + ConfigDef.LambdaValidator.with((name, value) -> { + if (!CONTAINER_NAME_PATTERN.matcher(value.toString()).matches()) { + throw new ConfigException(name, value, + "must start or end with a letter or number, and can contain only lower case letters, numbers, and the hyphen/minus (-) character."); + } + }, () -> "start or end with a letter or number, and can contain only lower case letters, numbers, and the hyphen/minus (-) character")); + /** * Construct the Azure Blob ConfigFragment.. * - * @param cfg + * @param dataAccess * the configuration that this fragment is associated with. */ - protected AzureBlobConfigFragment(final AbstractConfig cfg) { - super(FragmentDataAccess.from(cfg)); + protected AzureBlobConfigFragment(final FragmentDataAccess dataAccess) { + super(dataAccess); } /** @@ -75,9 +109,9 @@ protected AzureBlobConfigFragment(final AbstractConfig cfg) { * the Configuration definition. * @return the update configuration definition */ - public static ConfigDef update(final ConfigDef configDef) { + public static ConfigDef update(final ConfigDef configDef, final boolean isSink) { addUserAgentConfig(configDef); - addAzureConfigGroup(configDef); + addAzureConfigGroup(configDef, isSink); addAzureRetryPolicies(configDef); return configDef; } @@ -87,67 +121,51 @@ private static void addUserAgentConfig(final ConfigDef configDef) { "A custom user agent used while contacting Azure"); } - private static void addAzureConfigGroup(final ConfigDef configDef) { + private static void addAzureConfigGroup(final ConfigDef configDef, final boolean isSink) { int azureGroupCounter = 0; - configDef.define(AZURE_STORAGE_CONNECTION_STRING_CONFIG, ConfigDef.Type.STRING, null, ConfigDef.Importance.HIGH, - "Azure Storage connection string.", GROUP_AZURE, azureGroupCounter++, ConfigDef.Width.NONE, - AZURE_STORAGE_CONNECTION_STRING_CONFIG); + configDef.define(AZURE_STORAGE_CONNECTION_STRING_CONFIG, ConfigDef.Type.STRING, ConfigDef.NO_DEFAULT_VALUE, + ConfigDef.Importance.HIGH, "Azure Storage connection string.", GROUP_AZURE, ++azureGroupCounter, + ConfigDef.Width.NONE, AZURE_STORAGE_CONNECTION_STRING_CONFIG); configDef.define(AZURE_STORAGE_CONTAINER_NAME_CONFIG, ConfigDef.Type.STRING, ConfigDef.NO_DEFAULT_VALUE, - new ConfigDef.NonEmptyString(), ConfigDef.Importance.HIGH, + CONTAINER_NAME_VALIDATOR, ConfigDef.Importance.HIGH, "The Azure Blob container that files will be written to or read from.", GROUP_AZURE, - azureGroupCounter++, ConfigDef.Width.NONE, AZURE_STORAGE_CONTAINER_NAME_CONFIG); - configDef.define(AZURE_FETCH_PAGE_SIZE, ConfigDef.Type.INT, 10, ConfigDef.Range.atLeast(1), - ConfigDef.Importance.MEDIUM, "Azure fetch page size", GROUP_AZURE, azureGroupCounter++, - ConfigDef.Width.NONE, AZURE_FETCH_PAGE_SIZE); + 
++azureGroupCounter, ConfigDef.Width.NONE, AZURE_STORAGE_CONTAINER_NAME_CONFIG); + configDef.define(AZURE_PREFIX_CONFIG, ConfigDef.Type.STRING, null, new ConfigDef.NonEmptyString(), ConfigDef.Importance.MEDIUM, "Prefix for storage file names, generally specifies directory like" + " structures that do not contain any templated fields.", - GROUP_AZURE, azureGroupCounter++, ConfigDef.Width.NONE, AZURE_PREFIX_CONFIG); // NOPMD increment value - // never used - - configDef.define(AZURE_FETCH_BUFFER_SIZE, ConfigDef.Type.INT, 1000, ConfigDef.Range.atLeast(1), - ConfigDef.Importance.MEDIUM, - "Azure fetch buffer size. This is the number of object keys kept in a buffer to ensure lexically older objet keys aren't skipped for processing if they are slower to upload.", - GROUP_AZURE, azureGroupCounter++, // NOPMD - // UnusedAssignment - ConfigDef.Width.NONE, AZURE_FETCH_BUFFER_SIZE); + GROUP_AZURE, ++azureGroupCounter, ConfigDef.Width.NONE, AZURE_PREFIX_CONFIG); + if (!isSink) { + configDef.define(AZURE_FETCH_PAGE_SIZE, ConfigDef.Type.INT, 10, ConfigDef.Range.atLeast(1), + ConfigDef.Importance.MEDIUM, "Azure fetch page size", GROUP_AZURE, ++azureGroupCounter, + ConfigDef.Width.NONE, AZURE_FETCH_PAGE_SIZE); + + configDef.define(AZURE_FETCH_BUFFER_SIZE, ConfigDef.Type.INT, 1000, ConfigDef.Range.atLeast(1), + ConfigDef.Importance.MEDIUM, + "Azure fetch buffer size. This is the number of object keys kept in a buffer to ensure lexically older objet keys aren't skipped for processing if they are slower to upload.", + GROUP_AZURE, ++azureGroupCounter, ConfigDef.Width.NONE, AZURE_FETCH_BUFFER_SIZE); + } } private static void addAzureRetryPolicies(final ConfigDef configDef) { int retryPolicyGroupCounter = 0; configDef.define(AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG, ConfigDef.Type.LONG, AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_DEFAULT, ConfigDef.Range.atLeast(0L), ConfigDef.Importance.MEDIUM, - "Initial retry delay in milliseconds. The default value is " - + AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_DEFAULT, - GROUP_AZURE_RETRY_BACKOFF_POLICY, retryPolicyGroupCounter++, ConfigDef.Width.NONE, - AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG); + "Initial retry delay in milliseconds.", GROUP_AZURE_RETRY_BACKOFF_POLICY, ++retryPolicyGroupCounter, + ConfigDef.Width.NONE, AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG); configDef.define(AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG, ConfigDef.Type.LONG, AZURE_RETRY_BACKOFF_MAX_DELAY_MS_DEFAULT, ConfigDef.Range.atLeast(0L), ConfigDef.Importance.MEDIUM, - "Maximum retry delay in milliseconds. The default value is " + AZURE_RETRY_BACKOFF_MAX_DELAY_MS_DEFAULT, - GROUP_AZURE_RETRY_BACKOFF_POLICY, retryPolicyGroupCounter++, ConfigDef.Width.NONE, - AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG); + "Maximum retry delay in milliseconds.", GROUP_AZURE_RETRY_BACKOFF_POLICY, ++retryPolicyGroupCounter, + ConfigDef.Width.NONE, AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG); configDef.define(AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_CONFIG, ConfigDef.Type.INT, AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_DEFAULT, ConfigDef.Range.atLeast(0L), ConfigDef.Importance.MEDIUM, "Retry max attempts. 
The default value is " + AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_DEFAULT, - GROUP_AZURE_RETRY_BACKOFF_POLICY, retryPolicyGroupCounter++, ConfigDef.Width.NONE, // NOPMD - // retryPolicyGroupCounter - // updated value - // never - // used + GROUP_AZURE_RETRY_BACKOFF_POLICY, ++retryPolicyGroupCounter, ConfigDef.Width.NONE, AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_CONFIG); } - @Override - public void validate() { - final String connectionString = getString(AZURE_STORAGE_CONNECTION_STRING_CONFIG); - - if (connectionString == null) { - throw new ConfigException( - String.format("The configuration %s cannot be null.", AZURE_STORAGE_CONNECTION_STRING_CONFIG)); - } - } public int getAzureFetchPageSize() { return getInt(AZURE_FETCH_PAGE_SIZE); } diff --git a/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobSourceConfig.java b/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobSourceConfig.java index 2449481e2..9ba402b45 100644 --- a/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobSourceConfig.java +++ b/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobSourceConfig.java @@ -18,10 +18,8 @@ import java.util.Map; -import io.aiven.kafka.connect.common.config.FileNameFragment; +import io.aiven.kafka.connect.common.config.FragmentDataAccess; import io.aiven.kafka.connect.common.config.SourceCommonConfig; -import io.aiven.kafka.connect.common.config.SourceConfigFragment; -import io.aiven.kafka.connect.common.config.TransformerFragment; import com.azure.storage.blob.BlobServiceAsyncClient; @@ -30,22 +28,8 @@ public class AzureBlobSourceConfig extends SourceCommonConfig { // TODO AzureBlobFragment needs to be extracted from Azure Sink. 
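The AzureBlobConfigFragment hunk above replaces the hand-written validate() override with CONTAINER_NAME_VALIDATOR, a ConfigDef.CompositeValidator assembled from ConfigDef.LambdaValidator checks, so invalid container names are reported during ConfigDef validation rather than at config construction time. Below is a minimal, self-contained sketch of that pattern; the class name, property key, and the reduced rule set are illustrative only, not the connector's actual code.

import java.util.regex.Pattern;

import org.apache.kafka.common.config.ConfigDef;
import org.apache.kafka.common.config.ConfigException;

public final class ContainerNameValidatorSketch {
    // Same shape as the fragment's regex: lower case letters, digits and hyphens,
    // starting and ending with a letter or digit.
    private static final Pattern NAME_PATTERN = Pattern.compile("[0-9a-z][0-9a-z\\-]+[0-9a-z]");

    // Compose several small checks; each throws ConfigException with its own message.
    static final ConfigDef.Validator VALIDATOR = ConfigDef.CompositeValidator.of(
            ConfigDef.LambdaValidator.with((name, value) -> {
                final int len = value == null ? 0 : value.toString().length();
                if (len < 3 || len > 63) {
                    throw new ConfigException(name, value, "names must be from 3 through 63 characters long.");
                }
            }, () -> "must be from 3 through 63 characters long"),
            ConfigDef.LambdaValidator.with((name, value) -> {
                if (!NAME_PATTERN.matcher(value.toString()).matches()) {
                    throw new ConfigException(name, value,
                            "must contain only lower case letters, numbers, and the hyphen/minus (-) character.");
                }
            }, () -> "lower case letters, numbers and hyphens only"));

    public static void main(final String[] args) {
        VALIDATOR.ensureValid("azure.storage.container.name", "my-container"); // passes both checks
        try {
            VALIDATOR.ensureValid("azure.storage.container.name", "ab"); // too short, first check throws
        } catch (final ConfigException expected) {
            System.out.println(expected.getMessage());
        }
    }
}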
private final AzureBlobConfigFragment azureBlobConfigFragment; public AzureBlobSourceConfig(final Map properties) { - super(configDef(), properties); - azureBlobConfigFragment = new AzureBlobConfigFragment(this); - validate(); - } - - public static AzureBlobSourceConfigDef configDef() { - - final var configDef = new AzureBlobSourceConfigDef(); - - FileNameFragment.update(configDef); - SourceConfigFragment.update(configDef); - TransformerFragment.update(configDef); - AzureBlobConfigFragment.update(configDef); - return configDef; - } - private void validate() { + super(new AzureBlobSourceConfigDef(), properties); + azureBlobConfigFragment = new AzureBlobConfigFragment(FragmentDataAccess.from(this)); } public int getAzureFetchPageSize() { diff --git a/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobSourceConfigDef.java b/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobSourceConfigDef.java index 0699125a9..6dac67b59 100644 --- a/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobSourceConfigDef.java +++ b/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobSourceConfigDef.java @@ -16,8 +16,25 @@ package io.aiven.kafka.connect.azure.source.config; +import java.util.Map; + +import org.apache.kafka.common.config.ConfigValue; + +import io.aiven.kafka.connect.common.config.FragmentDataAccess; import io.aiven.kafka.connect.common.config.SourceCommonConfig; -public class AzureBlobSourceConfigDef extends SourceCommonConfig.SourceCommonConfigDef { +public final class AzureBlobSourceConfigDef extends SourceCommonConfig.SourceCommonConfigDef { + + public AzureBlobSourceConfigDef() { + super(); + AzureBlobConfigFragment.update(this, false); + } + @Override + public Map multiValidate(final Map valueMap) { + final Map result = super.multiValidate(valueMap); + final FragmentDataAccess dataAccess = FragmentDataAccess.from(result); + new AzureBlobConfigFragment(dataAccess).validate(result); + return result; + } } diff --git a/settings.gradle.kts b/settings.gradle.kts index 1d1a8826d..2567b6ade 100644 --- a/settings.gradle.kts +++ b/settings.gradle.kts @@ -43,7 +43,7 @@ dependencyResolutionManagement { "org.apache.commons:commons-collections4:$commonsCollections4Version") library("commons-io", "commons-io:commons-io:$commonsIOVersion") library("commons-lang3", "org.apache.commons:commons-lang3:$commonsLang3Version") - library("kafka-connect-api", "org.apache.kafka:connect-api:$kafkaAPIVersion") + library("kafka-connect-api", "org.apache.kafka:connect-api:$kafkaVersion") library("kafka-connect-json", "org.apache.kafka:connect-json:$kafkaVersion") library("kafka-connect-runtime", "org.apache.kafka:connect-runtime:$kafkaVersion") library("kafka-connect-transforms", "org.apache.kafka:connect-transforms:$kafkaVersion") From 5a6d41df6b29f02642ebfc55639d73dc30811ffe Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Fri, 21 Nov 2025 16:05:55 +0000 Subject: [PATCH 13/19] cleaned up reporting --- .../src/templates/configData.md.vm | 2 +- .../config/AzureBlobConfigFragment.java | 9 +-- .../common/config/CommonConfigFragment.java | 16 +++-- .../aiven/kafka/connect/tools/ConfigDoc.java | 69 ++++++++++++++++++- 4 files changed, 82 insertions(+), 14 deletions(-) diff --git a/azure-sink-connector/src/templates/configData.md.vm b/azure-sink-connector/src/templates/configData.md.vm index 65f05c9c4..a747a741f 100644 --- a/azure-sink-connector/src/templates/configData.md.vm 
+++ b/azure-sink-connector/src/templates/configData.md.vm @@ -10,6 +10,6 @@ ${esc.hash}${esc.hash} ${section.displayName} - Valid values: ${section.validator|"no restrictions"} - Importance: $section.importance - $section.documentation + ${esc.markdown($section.documentation)} #end \ No newline at end of file diff --git a/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobConfigFragment.java b/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobConfigFragment.java index 6509cab67..4a45e46c4 100644 --- a/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobConfigFragment.java +++ b/azure-source-connector/src/main/java/io/aiven/kafka/connect/azure/source/config/AzureBlobConfigFragment.java @@ -25,6 +25,7 @@ import io.aiven.kafka.connect.azure.source.utils.VersionInfo; import io.aiven.kafka.connect.common.config.ConfigFragment; import io.aiven.kafka.connect.common.config.FragmentDataAccess; +import io.aiven.kafka.connect.common.config.validators.TimeScaleValidator; import com.azure.core.http.policy.ExponentialBackoffOptions; import com.azure.core.http.policy.HttpLogDetailLevel; @@ -152,11 +153,11 @@ private static void addAzureConfigGroup(final ConfigDef configDef, final boolean private static void addAzureRetryPolicies(final ConfigDef configDef) { int retryPolicyGroupCounter = 0; configDef.define(AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG, ConfigDef.Type.LONG, - AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_DEFAULT, ConfigDef.Range.atLeast(0L), ConfigDef.Importance.MEDIUM, - "Initial retry delay in milliseconds.", GROUP_AZURE_RETRY_BACKOFF_POLICY, ++retryPolicyGroupCounter, - ConfigDef.Width.NONE, AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG); + AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_DEFAULT, TimeScaleValidator.atLeast(0), + ConfigDef.Importance.MEDIUM, "Initial retry delay in milliseconds.", GROUP_AZURE_RETRY_BACKOFF_POLICY, + ++retryPolicyGroupCounter, ConfigDef.Width.NONE, AZURE_RETRY_BACKOFF_INITIAL_DELAY_MS_CONFIG); configDef.define(AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG, ConfigDef.Type.LONG, - AZURE_RETRY_BACKOFF_MAX_DELAY_MS_DEFAULT, ConfigDef.Range.atLeast(0L), ConfigDef.Importance.MEDIUM, + AZURE_RETRY_BACKOFF_MAX_DELAY_MS_DEFAULT, TimeScaleValidator.atLeast(0), ConfigDef.Importance.MEDIUM, "Maximum retry delay in milliseconds.", GROUP_AZURE_RETRY_BACKOFF_POLICY, ++retryPolicyGroupCounter, ConfigDef.Width.NONE, AZURE_RETRY_BACKOFF_MAX_DELAY_MS_CONFIG); configDef.define(AZURE_RETRY_BACKOFF_MAX_ATTEMPTS_CONFIG, ConfigDef.Type.INT, diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/config/CommonConfigFragment.java b/commons/src/main/java/io/aiven/kafka/connect/common/config/CommonConfigFragment.java index 82bb28e80..50aa635da 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/config/CommonConfigFragment.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/config/CommonConfigFragment.java @@ -18,6 +18,7 @@ import static org.apache.kafka.common.config.ConfigDef.Range.atLeast; +import java.util.Collections; import java.util.Map; import org.apache.kafka.common.config.ConfigDef; @@ -52,13 +53,14 @@ public static ConfigDef update(final ConfigDef configDef) { int orderInGroup = 0; final String commonGroup = "commons"; - return configDef - .define(ConnectorConfig.TASKS_MAX_CONFIG, ConfigDef.Type.INT, 1, atLeast(1), ConfigDef.Importance.HIGH, - "Maximum number of tasks to use for this connector.", commonGroup, ++orderInGroup, - ConfigDef.Width.SHORT, 
ConnectorConfig.TASKS_MAX_CONFIG) - .define(TASK_ID, ConfigDef.Type.INT, 1, atLeast(0), ConfigDef.Importance.HIGH, - "The task ID that this connector is working with.", commonGroup, ++orderInGroup, - ConfigDef.Width.SHORT, TASK_ID); + configDef.define(ConnectorConfig.TASKS_MAX_CONFIG, ConfigDef.Type.INT, 1, atLeast(1), ConfigDef.Importance.HIGH, + "Maximum number of tasks to use for this connector.", commonGroup, ++orderInGroup, + ConfigDef.Width.SHORT, ConnectorConfig.TASKS_MAX_CONFIG); + + final ConfigDef.ConfigKey key = new ConfigDef.ConfigKey(TASK_ID, ConfigDef.Type.INT, 0, atLeast(0), + ConfigDef.Importance.HIGH, "The task ID that this connector is working with.", commonGroup, + ++orderInGroup, ConfigDef.Width.SHORT, TASK_ID, Collections.emptyList(), null, true); + return configDef.define(key); } /** diff --git a/site/src/main/java/io/aiven/kafka/connect/tools/ConfigDoc.java b/site/src/main/java/io/aiven/kafka/connect/tools/ConfigDoc.java index 1b421a23d..6a7b8338c 100644 --- a/site/src/main/java/io/aiven/kafka/connect/tools/ConfigDoc.java +++ b/site/src/main/java/io/aiven/kafka/connect/tools/ConfigDoc.java @@ -74,11 +74,13 @@ public static void execute(final ConfigDef configDef, final String templateFile, final Collection keys = configDef.configKeys().values(); final Map sections = new TreeMap<>(); for (final ConfigDef.ConfigKey key : keys) { - sections.put(key.name, new ConfigData(key)); + if (!key.internalConfig) { + sections.put(key.name, new ConfigData(key)); + } } context.put("sections", sections.values()); - context.put("esc", new EscapeTool()); + context.put("esc", new Escaper()); final File file = new File(output); if (!file.getParentFile().exists() && !file.getParentFile().mkdirs()) { @@ -138,4 +140,67 @@ public static void main(final String[] args) throws IOException, ClassNotFoundEx } } + public static class Escaper extends EscapeTool { + + private static String[] charParser(final String charText) { + char[] chars = charText.toCharArray(); + String[] result = new String[chars.length]; + for (int i = 0; i < chars.length; i++) { + result[i] = String.valueOf(chars[i]); + } + return result; + } + + /** + * The characters to escape for markdown. + */ + private static final String[] MARKDOWN_CHARS = charParser("\\`*_{}[]<>()#+-.!|"); + /** + * The characters to escape for APT (Almost Plain Text). + */ + private static final String[] APT_CHARS = charParser("\\~=-+*[]<>{}"); + + /** + * Escapes a text string. + * + * @param text + * the text to escape. + * @param chars + * the characters to escape. + * @return the escaped string. + */ + private String escape(final String text, final String[] chars) { + if (text == null) { + return ""; + } + String result = text; + for (String c : chars) { + result = result.replace(c, "\\" + c); + } + return result; + } + + /** + * Escapes a string for markdown. + * + * @param text + * the text to escape. + * @return the text with the markdown specific characters escaped. + */ + public String markdown(final String text) { + return escape(text, MARKDOWN_CHARS); + } + + /** + * Escapes a string for APT (almost plain text). + * + * @param text + * the text to escape. + * @return the text with the APT specific characters escaped. 
+ */ + public String apt(final String text) { + return escape(text, APT_CHARS); + } + + } } From ff67e8ae01167738e369234d6f0191beacfb40af Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Mon, 24 Nov 2025 08:59:49 +0000 Subject: [PATCH 14/19] updated configdoc --- .../aiven/kafka/connect/tools/ConfigDoc.java | 22 +++++++++---------- 1 file changed, 11 insertions(+), 11 deletions(-) diff --git a/site/src/main/java/io/aiven/kafka/connect/tools/ConfigDoc.java b/site/src/main/java/io/aiven/kafka/connect/tools/ConfigDoc.java index 6a7b8338c..df0d8f567 100644 --- a/site/src/main/java/io/aiven/kafka/connect/tools/ConfigDoc.java +++ b/site/src/main/java/io/aiven/kafka/connect/tools/ConfigDoc.java @@ -142,15 +142,6 @@ public static void main(final String[] args) throws IOException, ClassNotFoundEx public static class Escaper extends EscapeTool { - private static String[] charParser(final String charText) { - char[] chars = charText.toCharArray(); - String[] result = new String[chars.length]; - for (int i = 0; i < chars.length; i++) { - result[i] = String.valueOf(chars[i]); - } - return result; - } - /** * The characters to escape for markdown. */ @@ -160,6 +151,15 @@ private static String[] charParser(final String charText) { */ private static final String[] APT_CHARS = charParser("\\~=-+*[]<>{}"); + private static String[] charParser(final String charText) { + final char[] chars = charText.toCharArray(); + final String[] result = new String[chars.length]; + for (int i = 0; i < chars.length; i++) { + result[i] = String.valueOf(chars[i]); + } + return result; + } + /** * Escapes a text string. * @@ -174,8 +174,8 @@ private String escape(final String text, final String[] chars) { return ""; } String result = text; - for (String c : chars) { - result = result.replace(c, "\\" + c); + for (final String chrStr : chars) { + result = result.replace(chrStr, "\\" + chrStr); } return result; } From ef469081f84fb0eba57cb9884c7ae3666c7f6d1a Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Tue, 25 Nov 2025 13:44:53 +0000 Subject: [PATCH 15/19] documented change --- .../aiven/kafka/connect/common/config/CommonConfigFragment.java | 1 + 1 file changed, 1 insertion(+) diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/config/CommonConfigFragment.java b/commons/src/main/java/io/aiven/kafka/connect/common/config/CommonConfigFragment.java index 50aa635da..87054a2b8 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/config/CommonConfigFragment.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/config/CommonConfigFragment.java @@ -57,6 +57,7 @@ public static ConfigDef update(final ConfigDef configDef) { "Maximum number of tasks to use for this connector.", commonGroup, ++orderInGroup, ConfigDef.Width.SHORT, ConnectorConfig.TASKS_MAX_CONFIG); + // make TASK_ID an internal configuration (not visible to users) final ConfigDef.ConfigKey key = new ConfigDef.ConfigKey(TASK_ID, ConfigDef.Type.INT, 0, atLeast(0), ConfigDef.Importance.HIGH, "The task ID that this connector is working with.", commonGroup, ++orderInGroup, ConfigDef.Width.SHORT, TASK_ID, Collections.emptyList(), null, true); From 9bc40505b420892b654b964a2ef25fd77a817e06 Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Tue, 25 Nov 2025 13:56:26 +0000 Subject: [PATCH 16/19] fixed source configData template --- azure-source-connector/src/templates/configData.md.vm | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/azure-source-connector/src/templates/configData.md.vm 
b/azure-source-connector/src/templates/configData.md.vm index 8c81ec487..6e5d1e8cb 100644 --- a/azure-source-connector/src/templates/configData.md.vm +++ b/azure-source-connector/src/templates/configData.md.vm @@ -10,6 +10,6 @@ ${esc.hash}${esc.hash} ${section.displayName} - Valid values: ${section.validator|"no restrictions"} - Importance: $section.importance - $section.documentation + ${esc.markdown($section.documentation)} #end \ No newline at end of file From aa5205fcd4f845606ad82259a2b73fa7e17fb681 Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Wed, 26 Nov 2025 12:11:44 +0000 Subject: [PATCH 17/19] fixed integration tests --- .../kafka/connect/azure/sink/IntegrationTest.java | 12 ++++++------ .../connect/azure/sink/ParquetIntegrationTest.java | 2 +- .../connect/common/config/OutputFormatFragment.java | 4 ++-- 3 files changed, 9 insertions(+), 9 deletions(-) diff --git a/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/IntegrationTest.java b/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/IntegrationTest.java index a12dc33cb..b13eaad42 100644 --- a/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/IntegrationTest.java +++ b/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/IntegrationTest.java @@ -68,7 +68,7 @@ void setUp() throws ExecutionException, InterruptedException { @ValueSource(strings = { "none", "gzip", "snappy", "zstd" }) void basicTest(final String compression) throws ExecutionException, InterruptedException { final Map connectorConfig = basicConnectorConfig(); - OutputFormatFragment.setter(connectorConfig).withOutputFields(OutputFieldType.VALUE, OutputFieldType.KEY); + OutputFormatFragment.setter(connectorConfig).withOutputFields(OutputFieldType.KEY, OutputFieldType.VALUE); FileNameFragment.setter(connectorConfig).fileCompression(CompressionType.forName(compression)); createConnector(connectorConfig); @@ -123,7 +123,7 @@ void basicTest(final String compression) throws ExecutionException, InterruptedE @ValueSource(strings = { "none", "gzip", "snappy", "zstd" }) void groupByTimestampVariable(final String compression) throws ExecutionException, InterruptedException { final Map connectorConfig = basicConnectorConfig(); - OutputFormatFragment.setter(connectorConfig).withOutputFields(OutputFieldType.VALUE, OutputFieldType.KEY); + OutputFormatFragment.setter(connectorConfig).withOutputFields(OutputFieldType.KEY, OutputFieldType.VALUE); FileNameFragment.setter(connectorConfig) .fileCompression(CompressionType.forName(compression)) .template("{{topic}}-{{partition}}-{{start_offset}}-" @@ -234,7 +234,7 @@ void groupByKey(final String compression) throws ExecutionException, Interrupted final Map connectorConfig = basicConnectorConfig(); final CompressionType compressionType = CompressionType.forName(compression); connectorConfig.put("key.converter", "org.apache.kafka.connect.storage.StringConverter"); - OutputFormatFragment.setter(connectorConfig).withOutputFields(OutputFieldType.VALUE, OutputFieldType.KEY); + OutputFormatFragment.setter(connectorConfig).withOutputFields(OutputFieldType.KEY, OutputFieldType.VALUE); FileNameFragment.setter(connectorConfig) .fileCompression(CompressionType.forName(compression)) .template("{{key}}" + compressionType.extension()); @@ -307,7 +307,7 @@ void jsonlOutput() throws ExecutionException, InterruptedException { FileNameFragment.setter(connectorConfig).fileCompression(CompressionType.NONE); 
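The integration-test hunks in this patch consistently reorder withOutputFields(...) to pass KEY before VALUE, in line with the OutputFormatFragment Javadoc added later in the series: output fields are written in the order they are added. The sketch below shows how the setter records that order in the raw property map, as the tests in this patch do; the printed property key and serialized value mentioned in the comment are assumptions, not verified output.

import java.util.HashMap;
import java.util.Map;

import io.aiven.kafka.connect.common.config.OutputFieldType;
import io.aiven.kafka.connect.common.config.OutputFormatFragment;

public final class OutputFieldOrderSketch {
    public static void main(final String[] args) {
        final Map<String, String> props = new HashMap<>();
        // The setter writes directly into the backing map, mirroring the test setup above.
        OutputFormatFragment.setter(props).withOutputFields(OutputFieldType.KEY, OutputFieldType.VALUE);
        // Expected to contain an entry along the lines of format.output.fields=key,value,
        // i.e. the key field is emitted before the value field in each written record.
        System.out.println(props);
    }
}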
OutputFormatFragment.setter(connectorConfig) .withFormatType(FormatType.JSONL) - .withOutputFields(OutputFieldType.VALUE, OutputFieldType.KEY) + .withOutputFields(OutputFieldType.KEY, OutputFieldType.VALUE) .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); createConnector(connectorConfig); @@ -369,8 +369,8 @@ void jsonOutput() throws ExecutionException, InterruptedException { connectorConfig.put("value.converter.schemas.enable", "false"); FileNameFragment.setter(connectorConfig).fileCompression(CompressionType.NONE); OutputFormatFragment.setter(connectorConfig) - .withFormatType(FormatType.JSONL) - .withOutputFields(OutputFieldType.VALUE, OutputFieldType.KEY) + .withFormatType(FormatType.JSON) + .withOutputFields(OutputFieldType.KEY, OutputFieldType.VALUE) .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); createConnector(connectorConfig); diff --git a/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/ParquetIntegrationTest.java b/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/ParquetIntegrationTest.java index 0d8d6ca05..2a702cd80 100644 --- a/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/ParquetIntegrationTest.java +++ b/azure-sink-connector/src/integration-test/java/io/aiven/kafka/connect/azure/sink/ParquetIntegrationTest.java @@ -192,7 +192,7 @@ void jsonValue(final String envelopeEnabled, final String expectedOutput) final Map connectorConfig = basicConnectorConfig(compression); OutputFormatFragment.setter(connectorConfig) .withOutputFields(OutputFieldType.VALUE) - .envelopeEnabled(Boolean.getBoolean(envelopeEnabled)) + .envelopeEnabled(Boolean.parseBoolean(envelopeEnabled)) .withOutputFieldEncodingType(OutputFieldEncodingType.NONE); connectorConfig.put("key.converter", "org.apache.kafka.connect.storage.StringConverter"); connectorConfig.put("value.converter", "org.apache.kafka.connect.json.JsonConverter"); diff --git a/commons/src/main/java/io/aiven/kafka/connect/common/config/OutputFormatFragment.java b/commons/src/main/java/io/aiven/kafka/connect/common/config/OutputFormatFragment.java index 7c00b0362..a6f7711d3 100644 --- a/commons/src/main/java/io/aiven/kafka/connect/common/config/OutputFormatFragment.java +++ b/commons/src/main/java/io/aiven/kafka/connect/common/config/OutputFormatFragment.java @@ -255,7 +255,7 @@ public Setter withOutputFieldEncodingType(final OutputFieldEncodingType encoding } /** - * Sets the list of output fields. + * Sets the list of output fields. The order of output fields will match the order they are added. * * @param outputFields * the list of output fields @@ -267,7 +267,7 @@ public Setter withOutputFields(final List outputFields) { } /** - * Sets the list of output fields. + * Sets the list of output fields. The order of output fields will match the order they are added. 
* * @param outputFields * the list of output fields From 53b4bc636c1167ab0ad5b234807f252ed8ff4d53 Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Thu, 27 Nov 2025 09:52:33 +0000 Subject: [PATCH 18/19] updated as per review --- .../connect/azure/sink/config/AzureSinkConfigTest.java | 6 ++---- azure-source-connector/build.gradle.kts | 4 ++-- 2 files changed, 4 insertions(+), 6 deletions(-) diff --git a/azure-sink-connector/src/test/java/io/aiven/kafka/connect/azure/sink/config/AzureSinkConfigTest.java b/azure-sink-connector/src/test/java/io/aiven/kafka/connect/azure/sink/config/AzureSinkConfigTest.java index 2afea2b54..235b14b7f 100644 --- a/azure-sink-connector/src/test/java/io/aiven/kafka/connect/azure/sink/config/AzureSinkConfigTest.java +++ b/azure-sink-connector/src/test/java/io/aiven/kafka/connect/azure/sink/config/AzureSinkConfigTest.java @@ -521,8 +521,7 @@ void wrongVariableWithoutParameter() { final var expectedErrorMessage = "Invalid value {{start_offset:}}-{{partition}}-{{topic}} " + "for configuration file.name.template: Wrong variable with parameter definition"; - // expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", - // expectedErrorMessage); + assertValidationContainsMessage(properties, "file.name.template", expectedErrorMessage); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) .hasMessage(expectedErrorMessage); @@ -537,8 +536,7 @@ void noVariableWithParameter() { final var expectedErrorMessage = "Invalid value {{:padding=true}}-{{partition}}-{{topic}} " + "for configuration file.name.template: Variable name hasn't been set for template: {{:padding=true}}-{{partition}}-{{topic}}"; - // expectErrorMessageForConfigurationInConfigDefValidation(properties, "file.name.template", - // expectedErrorMessage); + assertValidationContainsMessage(properties, "file.name.template", expectedErrorMessage); assertThatThrownBy(() -> new AzureBlobSinkConfig(properties)).isInstanceOf(ConfigException.class) .hasMessage(expectedErrorMessage); diff --git a/azure-source-connector/build.gradle.kts b/azure-source-connector/build.gradle.kts index 6b6b44a49..a196fccbe 100644 --- a/azure-source-connector/build.gradle.kts +++ b/azure-source-connector/build.gradle.kts @@ -59,8 +59,8 @@ dependencies { compileOnly("org.apache.velocity:velocity-engine-core:2.4.1") compileOnly("org.apache.velocity.tools:velocity-tools-generic:3.1") - implementation("commons-io:commons-io:2.18.0") - implementation("org.apache.commons:commons-lang3:3.17.0") + implementation(apache.commons.io) + implementation(apache.commons.lang3) implementation(project(":commons")) implementation(apache.commons.collection4) implementation("com.azure:azure-storage-blob:12.30.0") From b66a6b97859944a910d8d4d3cd26267af475fe91 Mon Sep 17 00:00:00 2001 From: Claude Warren Date: Thu, 27 Nov 2025 10:00:39 +0000 Subject: [PATCH 19/19] changed http -> https --- azure-source-connector/build.gradle.kts | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/azure-source-connector/build.gradle.kts b/azure-source-connector/build.gradle.kts index a196fccbe..b766eab46 100644 --- a/azure-source-connector/build.gradle.kts +++ b/azure-source-connector/build.gradle.kts @@ -176,7 +176,7 @@ publishing { licenses { license { name = "Apache 2.0" - url = "http://www.apache.org/licenses/LICENSE-2.0" + url = "https://www.apache.org/licenses/LICENSE-2.0" distribution = "repo" } }
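The AzureSinkConfigTest changes above re-enable assertions through the assertValidationContainsMessage helper, which walks the ConfigValue objects returned by ConfigDef.validate(Map) and collects their error messages. A minimal standalone sketch of that reporting mechanism, independent of the connector classes, follows; the property name, range, and the resulting message are illustrative.

import java.util.List;
import java.util.Map;

import org.apache.kafka.common.config.ConfigDef;
import org.apache.kafka.common.config.ConfigValue;

public final class ConfigDefValidationSketch {
    public static void main(final String[] args) {
        final ConfigDef configDef = new ConfigDef()
                .define("file.max.records", ConfigDef.Type.INT, 0, ConfigDef.Range.atLeast(0),
                        ConfigDef.Importance.MEDIUM, "Maximum records per file.");

        // validate() does not throw for per-key problems; it attaches the error text
        // to the matching ConfigValue, which is what the test helper iterates over.
        final List<ConfigValue> values = configDef.validate(Map.of("file.max.records", "-1"));
        for (final ConfigValue value : values) {
            System.out.println(value.name() + " -> " + value.errorMessages());
        }
    }
}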