diff --git a/.editorconfig b/.editorconfig
new file mode 100644
index 000000000..7dda17caa
--- /dev/null
+++ b/.editorconfig
@@ -0,0 +1,285 @@
+[*]
+charset = utf-8
+end_of_line = lf
+indent_size = 2
+indent_style = space
+insert_final_newline = false
+max_line_length = 120
+tab_width = 2
+ij_continuation_indent_size = 8
+ij_formatter_off_tag = @formatter:off
+ij_formatter_on_tag = @formatter:on
+ij_formatter_tags_enabled = false
+ij_smart_tabs = false
+ij_visual_guides = none
+ij_wrap_on_typing = false
+
+[*.java]
+indent_size = 4
+tab_width = 4
+ij_java_align_consecutive_assignments = false
+ij_java_align_consecutive_variable_declarations = false
+ij_java_align_group_field_declarations = false
+ij_java_align_multiline_annotation_parameters = false
+ij_java_align_multiline_array_initializer_expression = false
+ij_java_align_multiline_assignment = false
+ij_java_align_multiline_binary_operation = false
+ij_java_align_multiline_chained_methods = false
+ij_java_align_multiline_extends_list = false
+ij_java_align_multiline_for = true
+ij_java_align_multiline_method_parentheses = false
+ij_java_align_multiline_parameters = true
+ij_java_align_multiline_parameters_in_calls = false
+ij_java_align_multiline_parenthesized_expression = false
+ij_java_align_multiline_records = true
+ij_java_align_multiline_resources = true
+ij_java_align_multiline_ternary_operation = false
+ij_java_align_multiline_text_blocks = false
+ij_java_align_multiline_throws_list = false
+ij_java_align_subsequent_simple_methods = false
+ij_java_align_throws_keyword = false
+ij_java_annotation_parameter_wrap = off
+ij_java_array_initializer_new_line_after_left_brace = false
+ij_java_array_initializer_right_brace_on_new_line = false
+ij_java_array_initializer_wrap = off
+ij_java_assert_statement_colon_on_next_line = false
+ij_java_assert_statement_wrap = off
+ij_java_assignment_wrap = off
+ij_java_binary_operation_sign_on_next_line = false
+ij_java_binary_operation_wrap = off
+ij_java_blank_lines_after_anonymous_class_header = 0
+ij_java_blank_lines_after_class_header = 0
+ij_java_blank_lines_after_imports = 1
+ij_java_blank_lines_after_package = 1
+ij_java_blank_lines_around_class = 1
+ij_java_blank_lines_around_field = 0
+ij_java_blank_lines_around_field_in_interface = 0
+ij_java_blank_lines_around_initializer = 1
+ij_java_blank_lines_around_method = 1
+ij_java_blank_lines_around_method_in_interface = 1
+ij_java_blank_lines_before_class_end = 0
+ij_java_blank_lines_before_imports = 1
+ij_java_blank_lines_before_method_body = 0
+ij_java_blank_lines_before_package = 0
+ij_java_block_brace_style = end_of_line
+ij_java_block_comment_at_first_column = true
+ij_java_builder_methods = none
+ij_java_call_parameters_new_line_after_left_paren = false
+ij_java_call_parameters_right_paren_on_new_line = false
+ij_java_call_parameters_wrap = off
+ij_java_case_statement_on_separate_line = true
+ij_java_catch_on_new_line = false
+ij_java_class_annotation_wrap = split_into_lines
+ij_java_class_brace_style = end_of_line
+ij_java_class_count_to_use_import_on_demand = 5
+ij_java_class_names_in_javadoc = 1
+ij_java_do_not_indent_top_level_class_members = false
+ij_java_do_not_wrap_after_single_annotation = false
+ij_java_do_while_brace_force = never
+ij_java_doc_add_blank_line_after_description = true
+ij_java_doc_add_blank_line_after_param_comments = false
+ij_java_doc_add_blank_line_after_return = false
+ij_java_doc_add_p_tag_on_empty_lines = true
+ij_java_doc_align_exception_comments = true
+ij_java_doc_align_param_comments = true
+ij_java_doc_do_not_wrap_if_one_line = false
+ij_java_doc_enable_formatting = true
+ij_java_doc_enable_leading_asterisks = true
+ij_java_doc_indent_on_continuation = true
+ij_java_doc_keep_empty_lines = true
+ij_java_doc_keep_empty_parameter_tag = true
+ij_java_doc_keep_empty_return_tag = true
+ij_java_doc_keep_empty_throws_tag = true
+ij_java_doc_keep_invalid_tags = true
+ij_java_doc_param_description_on_new_line = false
+ij_java_doc_preserve_line_breaks = false
+ij_java_doc_use_throws_not_exception_tag = true
+ij_java_else_on_new_line = false
+ij_java_enum_constants_wrap = off
+ij_java_extends_keyword_wrap = off
+ij_java_extends_list_wrap = off
+ij_java_field_annotation_wrap = split_into_lines
+ij_java_finally_on_new_line = false
+ij_java_for_brace_force = never
+ij_java_for_statement_new_line_after_left_paren = false
+ij_java_for_statement_right_paren_on_new_line = false
+ij_java_for_statement_wrap = off
+ij_java_generate_final_locals = true
+ij_java_generate_final_parameters = true
+ij_java_if_brace_force = never
+ij_java_imports_layout = *, |, javax.**, java.**, |, $*
+ij_java_indent_case_from_switch = true
+ij_java_insert_inner_class_imports = false
+ij_java_insert_override_annotation = true
+ij_java_keep_blank_lines_before_right_brace = 2
+ij_java_keep_blank_lines_between_package_declaration_and_header = 2
+ij_java_keep_blank_lines_in_code = 2
+ij_java_keep_blank_lines_in_declarations = 2
+ij_java_keep_builder_methods_indents = false
+ij_java_keep_control_statement_in_one_line = true
+ij_java_keep_first_column_comment = true
+ij_java_keep_indents_on_empty_lines = false
+ij_java_keep_line_breaks = true
+ij_java_keep_multiple_expressions_in_one_line = false
+ij_java_keep_simple_blocks_in_one_line = false
+ij_java_keep_simple_classes_in_one_line = false
+ij_java_keep_simple_lambdas_in_one_line = false
+ij_java_keep_simple_methods_in_one_line = false
+ij_java_label_indent_absolute = false
+ij_java_label_indent_size = 0
+ij_java_lambda_brace_style = end_of_line
+ij_java_layout_static_imports_separately = true
+ij_java_line_comment_add_space = false
+ij_java_line_comment_at_first_column = true
+ij_java_method_annotation_wrap = split_into_lines
+ij_java_method_brace_style = end_of_line
+ij_java_method_call_chain_wrap = off
+ij_java_method_parameters_new_line_after_left_paren = false
+ij_java_method_parameters_right_paren_on_new_line = false
+ij_java_method_parameters_wrap = off
+ij_java_modifier_list_wrap = false
+ij_java_names_count_to_use_import_on_demand = 3
+ij_java_new_line_after_lparen_in_record_header = false
+ij_java_packages_to_use_import_on_demand = java.awt.*, javax.swing.*
+ij_java_parameter_annotation_wrap = off
+ij_java_parentheses_expression_new_line_after_left_paren = false
+ij_java_parentheses_expression_right_paren_on_new_line = false
+ij_java_place_assignment_sign_on_next_line = false
+ij_java_prefer_longer_names = true
+ij_java_prefer_parameters_wrap = false
+ij_java_record_components_wrap = normal
+ij_java_repeat_synchronized = true
+ij_java_replace_instanceof_and_cast = false
+ij_java_replace_null_check = true
+ij_java_replace_sum_lambda_with_method_ref = true
+ij_java_resource_list_new_line_after_left_paren = false
+ij_java_resource_list_right_paren_on_new_line = false
+ij_java_resource_list_wrap = off
+ij_java_rparen_on_new_line_in_record_header = false
+ij_java_space_after_closing_angle_bracket_in_type_argument = false
+ij_java_space_after_colon = true
+ij_java_space_after_comma = true
+ij_java_space_after_comma_in_type_arguments = true
+ij_java_space_after_for_semicolon = true
+ij_java_space_after_quest = true
+ij_java_space_after_type_cast = true
+ij_java_space_before_annotation_array_initializer_left_brace = false
+ij_java_space_before_annotation_parameter_list = false
+ij_java_space_before_array_initializer_left_brace = false
+ij_java_space_before_catch_keyword = true
+ij_java_space_before_catch_left_brace = true
+ij_java_space_before_catch_parentheses = true
+ij_java_space_before_class_left_brace = true
+ij_java_space_before_colon = true
+ij_java_space_before_colon_in_foreach = true
+ij_java_space_before_comma = false
+ij_java_space_before_do_left_brace = true
+ij_java_space_before_else_keyword = true
+ij_java_space_before_else_left_brace = true
+ij_java_space_before_finally_keyword = true
+ij_java_space_before_finally_left_brace = true
+ij_java_space_before_for_left_brace = true
+ij_java_space_before_for_parentheses = true
+ij_java_space_before_for_semicolon = false
+ij_java_space_before_if_left_brace = true
+ij_java_space_before_if_parentheses = true
+ij_java_space_before_method_call_parentheses = false
+ij_java_space_before_method_left_brace = true
+ij_java_space_before_method_parentheses = false
+ij_java_space_before_opening_angle_bracket_in_type_parameter = false
+ij_java_space_before_quest = true
+ij_java_space_before_switch_left_brace = true
+ij_java_space_before_switch_parentheses = true
+ij_java_space_before_synchronized_left_brace = true
+ij_java_space_before_synchronized_parentheses = true
+ij_java_space_before_try_left_brace = true
+ij_java_space_before_try_parentheses = true
+ij_java_space_before_type_parameter_list = false
+ij_java_space_before_while_keyword = true
+ij_java_space_before_while_left_brace = true
+ij_java_space_before_while_parentheses = true
+ij_java_space_inside_one_line_enum_braces = false
+ij_java_space_within_empty_array_initializer_braces = false
+ij_java_space_within_empty_method_call_parentheses = false
+ij_java_space_within_empty_method_parentheses = false
+ij_java_spaces_around_additive_operators = true
+ij_java_spaces_around_assignment_operators = true
+ij_java_spaces_around_bitwise_operators = true
+ij_java_spaces_around_equality_operators = true
+ij_java_spaces_around_lambda_arrow = true
+ij_java_spaces_around_logical_operators = true
+ij_java_spaces_around_method_ref_dbl_colon = false
+ij_java_spaces_around_multiplicative_operators = true
+ij_java_spaces_around_relational_operators = true
+ij_java_spaces_around_shift_operators = true
+ij_java_spaces_around_type_bounds_in_type_parameters = true
+ij_java_spaces_around_unary_operator = false
+ij_java_spaces_within_angle_brackets = false
+ij_java_spaces_within_annotation_parentheses = false
+ij_java_spaces_within_array_initializer_braces = false
+ij_java_spaces_within_braces = false
+ij_java_spaces_within_brackets = false
+ij_java_spaces_within_cast_parentheses = false
+ij_java_spaces_within_catch_parentheses = false
+ij_java_spaces_within_for_parentheses = false
+ij_java_spaces_within_if_parentheses = false
+ij_java_spaces_within_method_call_parentheses = false
+ij_java_spaces_within_method_parentheses = false
+ij_java_spaces_within_parentheses = false
+ij_java_spaces_within_record_header = false
+ij_java_spaces_within_switch_parentheses = false
+ij_java_spaces_within_synchronized_parentheses = false
+ij_java_spaces_within_try_parentheses = false
+ij_java_spaces_within_while_parentheses = false
+ij_java_special_else_if_treatment = true
+ij_java_subclass_name_suffix = Impl
+ij_java_ternary_operation_signs_on_next_line = false
+ij_java_ternary_operation_wrap = off
+ij_java_test_name_suffix = Test
+ij_java_throws_keyword_wrap = off
+ij_java_throws_list_wrap = off
+ij_java_use_external_annotations = false
+ij_java_use_fq_class_names = false
+ij_java_use_relative_indents = false
+ij_java_use_single_class_imports = true
+ij_java_variable_annotation_wrap = off
+ij_java_visibility = public
+ij_java_while_brace_force = never
+ij_java_while_on_new_line = false
+ij_java_wrap_comments = true
+ij_java_wrap_first_method_in_call_chain = false
+ij_java_wrap_long_lines = false
+
+[.editorconfig]
+ij_editorconfig_align_group_field_declarations = false
+ij_editorconfig_space_after_colon = false
+ij_editorconfig_space_after_comma = true
+ij_editorconfig_space_before_colon = false
+ij_editorconfig_space_before_comma = false
+ij_editorconfig_spaces_around_assignment_operators = true
+
+[{*.ad,*.adoc,*.asciidoc,.asciidoctorconfig}]
+ij_asciidoc_blank_lines_after_header = 1
+ij_asciidoc_blank_lines_keep_after_header = 1
+ij_asciidoc_formatting_enabled = true
+ij_asciidoc_one_sentence_per_line = true
+
+[{*.pom,*.xml}]
+indent_size = 4
+tab_width = 4
+ij_xml_align_attributes = true
+ij_xml_align_text = false
+ij_xml_attribute_wrap = normal
+ij_xml_block_comment_at_first_column = true
+ij_xml_keep_blank_lines = 2
+ij_xml_keep_indents_on_empty_lines = false
+ij_xml_keep_line_breaks = true
+ij_xml_keep_line_breaks_in_text = false
+ij_xml_keep_whitespaces = false
+ij_xml_keep_whitespaces_around_cdata = preserve
+ij_xml_keep_whitespaces_inside_cdata = false
+ij_xml_line_comment_at_first_column = true
+ij_xml_space_after_tag_name = false
+ij_xml_space_around_equals_in_attribute = false
+ij_xml_space_inside_empty_tag = false
+ij_xml_text_wrap = off
diff --git a/.github/CODEOWNERS b/.github/CODEOWNERS
new file mode 100644
index 000000000..b5b1656cf
--- /dev/null
+++ b/.github/CODEOWNERS
@@ -0,0 +1 @@
+* astubbs
\ No newline at end of file
diff --git a/.github/dependabot.yml b/.github/dependabot.yml
new file mode 100644
index 000000000..ac73c3ed4
--- /dev/null
+++ b/.github/dependabot.yml
@@ -0,0 +1,14 @@
+# Please see the documentation for all configuration options:
+# https://docs.github.com/github/administering-a-repository/configuration-options-for-dependency-updates
+
+version: 2
+updates:
+ - package-ecosystem: "maven" # See documentation for possible values
+ directory: "/" # Location of package manifests
+ schedule:
+ interval: "daily"
+# Don't use any github-actions anymore
+# - package-ecosystem: "github-actions"
+# directory: "/"
+# schedule:
+# interval: "daily"
diff --git a/.github/pull_request_template.md b/.github/pull_request_template.md
new file mode 100644
index 000000000..803d20097
--- /dev/null
+++ b/.github/pull_request_template.md
@@ -0,0 +1,6 @@
+Description...
+
+### Checklist
+
+- [ ] Documentation (if applicable)
+- [ ] Changelog
\ No newline at end of file
diff --git a/.github/workflows/maven.yml b/.github/workflows/maven.yml
new file mode 100644
index 000000000..0a4cde6a1
--- /dev/null
+++ b/.github/workflows/maven.yml
@@ -0,0 +1,113 @@
+# This workflow will build a Java project with Maven
+# For more information see: https://help.github.com/actions/language-and-framework-guides/building-and-testing-java-with-maven
+
+# Tests disabled due to flakiness with under-resourced GitHub test machines. Confluent Jira works fine. Will fix later.
+name: Unit tests only
+
+on:
+ push:
+ branches: [ master ]
+ pull_request:
+ branches: [ master ]
+
+jobs:
+ build:
+ strategy:
+ fail-fast: false
+ matrix:
+ # Why not? because we can.
+ # 2.0.1, 2.1.1, 2.2.2, 2.3.1, 2.4.1 don't work - needs zstd and some kafka client libs.
+ # Doesn't mean it couldn't be modified slightly to work...
+ #ak: [ 2.5.1, 2.6.1, 2.7.0, 2.8.1, 3.0.1, 3.1.0 ]
+ # 25 and 26 include a dep with a vulnerability which ossindex fails the build for
+ ak: [ 2.7.0, 2.8.1, 3.0.1, 3.1.0 ]
+ #ak: [ 2.7.0 ]
+ #jdk: [ '-P jvm8-release -Djvm8.location=/opt/hostedtoolcache/Java_Zulu_jdk/8.0.332-9/x64', '' ]
+ # TG currently targets 11, so can't run the tests on 8 https://github.com/astubbs/truth-generator/issues/114
+ jdk: [ '' ]
+ experimental: [ false ]
+ name: [ "Stable AK version" ]
+ include:
+ # AK 2.4 not supported
+ # - ak: "'[2.4.1,2.5)'" # currently failing
+ # experimental: true
+ # name: "Oldest AK breaking version 2.4.1+ (below 2.5.0) expected to fail"
+ - ak: "'[2.7.0,4)'" # currently failing
+ experimental: true
+ name: "Newest AK version 2.7.0+?"
+
+ continue-on-error: ${{ matrix.experimental }}
+ name: "AK: ${{ matrix.ak }} JDK: ${{ matrix.jdk }}"
+ runs-on: ubuntu-latest
+
+ steps:
+ - uses: actions/checkout@v3
+
+ - name: Setup JDK 1.8
+ uses: actions/setup-java@v3
+ with:
+ java-version: '8'
+ distribution: 'zulu'
+ cache: 'maven'
+
+ # the patch version will be upgraded silently causing the build to eventually start failing - need to store this as a var - possible?
+ - name: Show java 1.8 home
+ # /opt/hostedtoolcache/Java_Zulu_jdk/8.0.332-9/x64/bin/java
+ run: which java
+
+ # - name: Setup JDK 1.9
+ # uses: actions/setup-java@v1
+ # with:
+ # java-version: 1.9
+
+ # - name: Show java 1.9 home
+ # /opt/hostedtoolcache/jdk/9.0.7/x64
+ # run: which java
+
+ - name: Setup JDK 17
+ uses: actions/setup-java@v3
+ with:
+ distribution: 'zulu'
+ java-version: '17'
+ cache: 'maven'
+
+ - name: Show java 17 home
+ # /opt/hostedtoolcache/jdk/13.0.2/x64/bin/java
+ run: which java
+
+ # - name: Show java version
+ # run: java -version
+
+ # - name: Show mvn version
+ # run: mvn -version
+
+ # - name: Build with Maven on Java 13
+ # run: mvn -B package --file pom.xml
+
+
+ # done automatically now
+ # - name: Cache Maven packages
+ # uses: actions/cache@v2.1.7
+ # with:
+ # path: ~/.m2/repository
+ # key: ${{ runner.os }}-m2
+ # restore-keys: ${{ runner.os }}-m2
+
+ - name: Test with Maven
+ run: mvn -Pci -B package ${{ matrix.jdk }} -Dkafka.version=${{ matrix.ak }} -Dlicense.skip
+
+# - name: Archive test results
+# if: ${{ always() }}
+# uses: actions/upload-artifact@v2
+# with:
+# name: test-reports
+# path: target/**-reports/*
+# retention-days: 14
+#
+# - name: Archive surefire test results
+# if: ${{ always() }}
+# uses: actions/upload-artifact@v2
+# with:
+# name: test-reports
+# path: target/surefire-reports/*
+# retention-days: 14
diff --git a/.gitignore b/.gitignore
new file mode 100644
index 000000000..48a79e79a
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,75 @@
+.DS_Store
+
+# Compiled class file
+*.class
+
+# Log file
+*.log
+
+# BlueJ files
+*.ctxt
+
+# Mobile Tools for Java (J2ME)
+.mtj.tmp/
+
+# Package Files #
+*.jar
+*.war
+*.nar
+*.ear
+*.zip
+*.tar.gz
+*.rar
+
+# virtual machine crash logs, see http://www.java.com/en/download/help/error_hotspot.xml
+hs_err_pid*
+
+*.versionsBackup
+
+# JENV
+.java-version
+
+delombok/
+**/*.releaseBackup
+
+# User-specific stuff
+.idea/**/workspace.xml
+.idea/**/tasks.xml
+.idea/**/usage.statistics.xml
+.idea/**/dictionaries
+.idea/**/shelf
+.idea/sonarlint/
+.idea/libraries/
+
+
+# Generated files
+.idea/**/contentModel.xml
+
+# Gradle and Maven with auto-import
+# When using Gradle or Maven with auto-import, you should exclude module files,
+# since they will be recreated, and may cause churn. Uncomment if using
+# auto-import.
+.idea/artifacts
+.idea/compiler.xml
+.idea/jarRepositories.xml
+.idea/modules.xml
+.idea/*.iml
+.idea/modules
+*.iml
+*.ipr
+
+# Mongo Explorer plugin
+.idea/**/mongoSettings.xml
+
+# File-based project format
+*.iws
+
+# Maven
+target
+release.properties
+/.idea/encodings.xml
+/.idea/misc.xml
+/.idea/codeStyles/Project.xml
+/.idea/inspectionProfiles/Project_Default.xml
+/.idea/uiDesigner.xml
+/.idea/vcs.xml
diff --git a/.idea/codeStyles/codeStyleConfig.xml b/.idea/codeStyles/codeStyleConfig.xml
new file mode 100644
index 000000000..a55e7a179
--- /dev/null
+++ b/.idea/codeStyles/codeStyleConfig.xml
@@ -0,0 +1,5 @@
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/All.xml b/.idea/runConfigurations/All.xml
new file mode 100644
index 000000000..1080d2485
--- /dev/null
+++ b/.idea/runConfigurations/All.xml
@@ -0,0 +1,26 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/All_Core.xml b/.idea/runConfigurations/All_Core.xml
new file mode 100644
index 000000000..012d635b1
--- /dev/null
+++ b/.idea/runConfigurations/All_Core.xml
@@ -0,0 +1,12 @@
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/All_Core_Unit_Tests.xml b/.idea/runConfigurations/All_Core_Unit_Tests.xml
new file mode 100644
index 000000000..6e0c4a4e6
--- /dev/null
+++ b/.idea/runConfigurations/All_Core_Unit_Tests.xml
@@ -0,0 +1,12 @@
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/All_Modules.xml b/.idea/runConfigurations/All_Modules.xml
new file mode 100644
index 000000000..ab45cfb23
--- /dev/null
+++ b/.idea/runConfigurations/All_Modules.xml
@@ -0,0 +1,9 @@
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/All_Modules___Unit_Tests.xml b/.idea/runConfigurations/All_Modules___Unit_Tests.xml
new file mode 100644
index 000000000..eee0435ec
--- /dev/null
+++ b/.idea/runConfigurations/All_Modules___Unit_Tests.xml
@@ -0,0 +1,8 @@
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/All_Reactor_Unit_Tests.xml b/.idea/runConfigurations/All_Reactor_Unit_Tests.xml
new file mode 100644
index 000000000..b90481929
--- /dev/null
+++ b/.idea/runConfigurations/All_Reactor_Unit_Tests.xml
@@ -0,0 +1,12 @@
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/All_Vertx.xml b/.idea/runConfigurations/All_Vertx.xml
new file mode 100644
index 000000000..a89f6b4b2
--- /dev/null
+++ b/.idea/runConfigurations/All_Vertx.xml
@@ -0,0 +1,12 @@
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/All_Vertx_Unit_Tests.xml b/.idea/runConfigurations/All_Vertx_Unit_Tests.xml
new file mode 100644
index 000000000..0b46a963a
--- /dev/null
+++ b/.idea/runConfigurations/All_Vertx_Unit_Tests.xml
@@ -0,0 +1,12 @@
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/All_example_core.xml b/.idea/runConfigurations/All_example_core.xml
new file mode 100644
index 000000000..9d53c6d3c
--- /dev/null
+++ b/.idea/runConfigurations/All_example_core.xml
@@ -0,0 +1,12 @@
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/All_example_vertx.xml b/.idea/runConfigurations/All_example_vertx.xml
new file mode 100644
index 000000000..b0e464ccf
--- /dev/null
+++ b/.idea/runConfigurations/All_example_vertx.xml
@@ -0,0 +1,12 @@
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/All_examples.xml b/.idea/runConfigurations/All_examples.xml
new file mode 100644
index 000000000..98c78936f
--- /dev/null
+++ b/.idea/runConfigurations/All_examples.xml
@@ -0,0 +1,22 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/README.xml b/.idea/runConfigurations/README.xml
new file mode 100644
index 000000000..cb6986814
--- /dev/null
+++ b/.idea/runConfigurations/README.xml
@@ -0,0 +1,27 @@
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/_Tag__transactions__.xml b/.idea/runConfigurations/_Tag__transactions__.xml
new file mode 100644
index 000000000..26e7f9dc9
--- /dev/null
+++ b/.idea/runConfigurations/_Tag__transactions__.xml
@@ -0,0 +1,13 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/_release_prepare_.xml b/.idea/runConfigurations/_release_prepare_.xml
new file mode 100644
index 000000000..adaacd3ac
--- /dev/null
+++ b/.idea/runConfigurations/_release_prepare_.xml
@@ -0,0 +1,32 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/asciidoc_template_build.xml b/.idea/runConfigurations/asciidoc_template_build.xml
new file mode 100644
index 000000000..b5ef11263
--- /dev/null
+++ b/.idea/runConfigurations/asciidoc_template_build.xml
@@ -0,0 +1,28 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/generate_test_sources__e.xml b/.idea/runConfigurations/generate_test_sources__e.xml
new file mode 100644
index 000000000..2456e1d82
--- /dev/null
+++ b/.idea/runConfigurations/generate_test_sources__e.xml
@@ -0,0 +1,30 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/license_format.xml b/.idea/runConfigurations/license_format.xml
new file mode 100644
index 000000000..09f2bc9ab
--- /dev/null
+++ b/.idea/runConfigurations/license_format.xml
@@ -0,0 +1,27 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.idea/runConfigurations/truth_generate__pc_.xml b/.idea/runConfigurations/truth_generate__pc_.xml
new file mode 100644
index 000000000..8778f1801
--- /dev/null
+++ b/.idea/runConfigurations/truth_generate__pc_.xml
@@ -0,0 +1,39 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/.mvn/wrapper/maven-wrapper.properties b/.mvn/wrapper/maven-wrapper.properties
new file mode 100644
index 000000000..08ea486aa
--- /dev/null
+++ b/.mvn/wrapper/maven-wrapper.properties
@@ -0,0 +1,18 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+distributionUrl=https://repo.maven.apache.org/maven2/org/apache/maven/apache-maven/3.9.0/apache-maven-3.9.0-bin.zip
+wrapperUrl=https://repo.maven.apache.org/maven2/org/apache/maven/wrapper/maven-wrapper/3.2.0/maven-wrapper-3.2.0.jar
diff --git a/.travis-archived.yml b/.travis-archived.yml
new file mode 100644
index 000000000..eb04f839f
--- /dev/null
+++ b/.travis-archived.yml
@@ -0,0 +1,60 @@
+#
+# Copyright (C) 2020-2022 Confluent, Inc.
+#
+
+# Archived in favour of github actions
+
+language: java
+jdk:
+ - openjdk13
+
+sudo: required
+
+# docker and docker in docker setup. disabled for faster builds until needed
+#services:
+# - docker
+#
+#before_cache:
+# - rm -f $HOME/.gradle/caches/modules-2/modules-2.lock
+# - rm -fr $HOME/.gradle/caches/*/plugin-resolution/
+#cache:
+# directories:
+# - "$HOME/.gradle/caches/"
+# - "$HOME/.gradle/wrapper/"
+#
+#before_install:
+# - sudo rm /usr/local/bin/docker-compose
+# - curl -L https://github.com/docker/compose/releases/download/1.24.1/docker-compose-Linux-x86_64 > docker-compose
+# - chmod +x docker-compose
+# - sudo mv docker-compose /usr/local/bin
+
+cache:
+ directories:
+ - "$HOME/.m2"
+
+#before_install:
+# - $TRAVIS_BUILD_DIR/install-jdk.sh --install openjdk9 --target ~/openjdk9
+# - ls -la ~/
+
+install: skip
+
+# Removed for https://about.codecov.io/security-update/
+# APRIL 15TH, 2021
+# Bash Uploader Security Update
+# after_success:
+# - bash <(curl -s https://codecov.io/bash)
+
+addons:
+ sonarcloud:
+ organization: "astubbs"
+ token:
+ secure: "zUbcZgSuBEi1j8nboM6y5Eoj7Go6OdcW4h9IYk7iYbHVlSwTCzq1Tez0FG2moSvyxgwaXD+ySd4XvbH1hT04R59b2fumFt2eWO3FbSHFrE3dXdOxliz47FLXkqpg8MvEWNkF4hPHwsi9LTXl4u7UuFRTqOCLilA5RUBZyzQ03AExMQJdZgdlestarlys40thISEGHNmNd4nr+EEekkaekN+1iE3v4HZpXXv8COLdp10Hehl6RPg9ooCZ3g8B++IOI5MdRxMf3HeERyKapMN1xGT6ZpeCkaFd/GbbAjzjlhKHIJ37Mmo2l9nJs/9dpBml62SFb1WdpG+7610e49vQbHuy1yb9h1XOJPdw45AZw+g61/6LTmGuNNlkUTstELQEN0iDoo0GqEMtIlVplKUcnzVAXtldvKU4Ph7Satdk4wdA3K+4E+zhaMaJhzUBNluChF5JldOOQDV5odt9K0rZCH/4zGbmsR0nev+g6JW1DX96laqLkuA4Am1aDistZSjt3T3HqhAXcpf/8VW4p1HKtYhsmMybnOuqoOH7sBpwxXoR0Myvj6FMrh4On/t+/vYQSJm+vyiyLShP/Bouk+azygIcjG3ZUmaFpumRpKesK6C9EYCA2d59vnsYU0/Ob+IwvrDVY40HQl41A+ooC+WVQf8scvvFAIJpYH6V/0TCWXg="
+
+script:
+ # the following command line builds the project, runs the tests with coverage and then execute the SonarCloud analysis
+ # - mvn clean org.jacoco:jacoco-maven-plugin:prepare-agent install sonar:sonar versions:display-dependency-updates
+ # -Djvm8.location=/usr/lib/jvm/java-8-openjdk-amd64/jre
+ # -Djvm9.location=/home/travis/openjdk9
+ - ~/bin/install-jdk.sh --target /home/travis/openjdk9 --feature 9
+ - mvn -version
+ - mvn -Pci clean verify versions:display-plugin-updates versions:display-property-updates versions:display-dependency-updates --fail-at-end -P jvm9-release -Djvm9.location=/home/travis/openjdk9
\ No newline at end of file
diff --git a/CHANGELOG.adoc b/CHANGELOG.adoc
new file mode 100644
index 000000000..7e36bf009
--- /dev/null
+++ b/CHANGELOG.adoc
@@ -0,0 +1,393 @@
+:toc: macro
+:toclevels: 1
+
+= Change Log
+
+A high level summary of noteworthy changes in each version.
+
+NOTE:: Dependency version bumps are not listed here.
+
+// git log --pretty="* %s" 0.3.0.2..HEAD
+
+// only show TOC if this is the root document (not in the README)
+ifndef::github_name[]
+toc::[]
+endif::[]
+== 0.5.2.8
+
+=== Fixes
+
+* fix: Fix equality and hash code for ShardKey with array key (#638), resolves (#579)
+
+== 0.5.2.7
+
+=== Fixes
+
+* fix: Return cached pausedPartitionSet (#620), resolves (#618)
+* fix: Parallel consumer stops processing data sometimes (#623), fixes (#606)
+* fix: Add synchronization to ensure proper initialization and closing of PCMetrics singleton (#627), fixes (#617)
+* fix: Readme - metrics example correction (#614)
+* fix: Remove micrometer-atlas dependency (#628), fixes (#625)
+
+=== Improvements
+
+* Refactored metrics implementation to not use singleton - improves meter separation, allows correct metrics subsystem operation when multiple parallel consumer instances are running in same java process (#630), fixes (#617) improves on (#627)
+
+== 0.5.2.6
+=== Improvements
+
+* feature: Micrometer metrics (#594)
+* feature: Adds an option to pass an invalid offset metadata error policy (#537), improves (#326)
+* feature: Lazy initialization of workerThreadPool (#531)
+
+=== Fixes
+
+* fix: Don't drain mode shutdown kills inflight threads (#559)
+* fix: Drain mode shutdown doesn't pause consumption correctly (#552)
+* fix: RunLength offset decoding returns 0 base offset after no-progress commit - related to (#546)
+* fix: Transactional PConsumer stuck while rebalancing - related to (#541)
+
+=== Dependencies
+
+* PL-211: Update dependencies from dependabot, Add mvnw, use mvnw in jenkins (#583)
+* PL-211: Update dependencies from dependabot (#589)
+
+== 0.5.2.5
+
+=== Fixes
+
+* fixes: #195 NoSuchFieldException when using consumer inherited from KafkaConsumer (#469)
+* fix: After new performance fix PR#530 merges - corner case could cause out of order processing (#534)
+* fix: Cleanup WorkManager's count of in-progress work, when work is stale after partition revocation (#547)
+
+=== Improvements
+
+* perf: Adds a caching layer to work management to alleviate O(n) counting (#530)
+
+== 0.5.2.4
+
+=== Improvements
+
+* feature: Simple PCRetriableException to remove error spam from logs (#444)
+* minor: fixes #486: Missing generics in JStreamParallelStreamProcessor #491
+* minor: partially address #459: Moves isClosedOrFailed into top level ParallelConsumer interface (#491)
+* tests: Demonstrates how to use MockConsumer with PC for issue #176
+* other minor improvements
+
+=== Fixes
+
+* fixes #409: Adds support for compacted topics and commit offset resetting (#425)
+** Truncate the offset state when bootstrap polled offset higher or lower than committed
+** Prune missing records from the tracked incomplete offset state, when they're missing from polled batches
+* fix: Improvements to encoding ranges (int vs long) #439
+** Replace integer offset references with long - use Long everywhere we deal with offsets, and where we truncate down, do it exactly, detect and handle truncation issues.
+
+== 0.5.2.3
+
+=== Improvements
+
+* Transactional commit mode system improvements and docs (#355)
+** Clarifies transaction system with much better documentation.
+** Fixes a potential race condition which could cause offset leaks between transactions boundaries.
+** Introduces lock acquisition timeouts.
+** Fixes a potential issue with removing records from the retry queue incorrectly, by having an inconsistency between compareTo and equals in the retry TreeMap.
+* Adds a very simple Dependency Injection system modeled on Dagger (#398)
+* Various refactorings e.g. new ProducerWrap
+
+* Dependencies
+** build(deps): prod: zstd, reactor, dev: podam, progressbar, postgresql maven-plugins: versions, help (#420)
+** build(deps-dev): bump postgresql from 42.4.1 to 42.5.0
+** bump podam, progressbar, zstd, reactor
+** build(deps): bump versions-maven-plugin from 2.11.0 to 2.12.0
+** build(deps): bump maven-help-plugin from 3.2.0 to 3.3.0
+** build(deps-dev): bump Confluent Platform Kafka Broker to 7.2.2 (#421)
+** build(deps): Upgrade to AK 3.3.0 (#309)
+
+
+=== Fixes
+
+* fixes #419: NoSuchElementException during race condition in PartitionState (#422)
+* Fixes #412: ClassCastException with retryDelayProvider (#417)
+* fixes ShardManager retryQueue ordering and set issues due to poor Comparator implementation (#423)
+
+
+== v0.5.2.2
+
+=== Fixes
+
+- Fixes dependency scope for Mockito from compile to test (#376)
+
+== v0.5.2.1
+
+=== Fixes
+
+- Fixes regression issue with order of state truncation vs commit (#362)
+
+== v0.5.2.0
+
+=== Fixes and Improvements
+
+- fixes #184: Fix multi topic subscription with KEY order by adding topic to shard key (#315)
+- fixes #329: Committing around transaction markers causes encoder to crash (#328)
+- build: Upgrade Truth-Generator to 0.1.1 for user Subject discovery (#332)
+
+=== Build
+
+- build: Allow snapshots locally, fail in CI (#331)
+- build: OSS Index scan change to warn only and exclude Guava CVE-2020-8908 as it's WONT_FIX (#330)
+
+=== Dependencies
+
+- build(deps): bump reactor-core from 3.4.19 to 3.4.21 (#344)
+- build(deps): dependabot bump Mockito, Surefire, Reactor, AssertJ, Release (#342) (#342)
+- build(deps): dependabot bump TestContainers, Vert.x, Enforcer, Versions, JUnit, Postgress (#336)
+
+=== Linked issues
+
+- Message with null key lead to continuous failure when using KEY ordering #318
+- Subscribing to two or more topics with KEY ordering, results in messages of the same Key never being processed #184
+- Cannot have negative length BitSet error - committing transaction adjacent offsets #329
+
+== v0.5.1.0
+
+=== Features
+
+* #193: Pause / Resume PC (circuit breaker) without unsubscribing from topics
+
+=== Fixes and Improvements
+
+* #225: Build and runtime support for Java 16+ (#289)
+* #306: Change Truth-Generator dependency from compile to test
+* #298: Improve PollAndProduce performance by first producing all records, and then waiting for the produce results. Previously, this was done for each ProduceRecord individually.
+
+== v0.5.0.0
+
+=== Features
+
+* feature: Poll Context object for API (#223)
+** PollContext API - provides central access to result set with various convenience methods as well as metadata about records, such as failure count
+* major: Batching feature and Event system improvements
+** Batching - all API methods now support batching.
+See the Options class set batch size for more information.
+
+=== Fixes and Improvements
+
+* Event system - better CPU usage in control thread
+* Concurrency stability improvements
+* Update dependencies
+* #247: Adopt Truth-Generator (#249)
+** Adopt https://github.com/astubbs/truth-generator[Truth Generator] for automatic generation of https://truth.dev/[Google Truth] Subjects
+* Large rewrite of internal architecture for improved maintenance and simplicity which fixed some corner case issues
+** refactor: Rename PartitionMonitor to PartitionStateManager (#269)
+** refactor: Queue unification (#219)
+** refactor: Partition state tracking instead of search (#218)
+** refactor: Processing Shard object
+* fix: Concurrency and State improvements (#190)
+
+=== Build
+
+* build: Lock TruthGenerator to 0.1 (#272)
+* build: Deploy SNAPSHOTS to maven central snapshots repo (#265)
+* build: Update Kafka to 3.1.0 (#229)
+* build: Crank up Enforcer rules and turn on ossindex audit
+* build: Fix logback dependency back to stable
+* build: Upgrade TestContainer and CP
+
+== v0.4.0.1
+
+=== Improvements
+
+- Add option to specify timeout for how long to wait offset commits in periodic-consumer-sync commit-mode
+- Add option to specify timeout for how long to wait for blocking Producer#send
+
+=== Docs
+
+- docs: Confluent Cloud configuration links
+- docs: Add Confluent's product page for PC to README
+- docs: Add head of line blocking to README
+
+== v0.4.0.0
+// https://github.com/confluentinc/parallel-consumer/releases/tag/0.4.0.0
+
+=== Features
+
+* https://projectreactor.io/[Project Reactor] non-blocking threading adapter module
+* Generic Vert.x Future support - i.e. FileSystem, db etc...
+
+=== Fixes and Improvements
+
+* Vert.x concurrency control via WebClient host limits fixed - see #maxCurrency
+* Vert.x API cleanup of invalid usage
+* Out of bounds for empty collections
+* Use ConcurrentSkipListMap instead of TreeMap to prevent concurrency issues under high pressure
+* log: Show record topic in slow-work warning message
+
+== v0.3.2.0
+
+=== Fixes and Improvements
+
+* Major: Upgrade to Apache Kafka 2.8 (still compatible with 2.6 and 2.7 though)
+* Adds support for managed executor service (Java EE Compatibility feature)
+* #65 support for custom retry delay providers
+
+== v0.3.1.0
+
+=== Fixes and Improvements
+
+* Major refactor to code base - primarily the two large God classes
+** Partition state now tracked separately
+** Code moved into packages
+* Busy spin in some cases fixed (lower CPU usage)
+* Reduce use of static data for test assertions - remaining identified for later removal
+* Various fixes for parallel testing stability
+
+== v0.3.0.3
+
+=== Fixes and Improvements
+
+==== Overview
+
+* Tests now run in parallel
+* License fixing / updating and code formatting
+* License format runs properly now when local, check on CI
+* Fix running on Windows and Linux
+* Fix JAVA_HOME issues
+
+==== Details:
+
+* tests: Enable the fail fast feature now that it's merged upstream
+* tests: Turn on parallel test runs
+* format: Format license, fix placement
+* format: Apply Idea formatting (fix license layout)
+* format: Update mycila license-plugin
+* test: Disable redundant vert.x test - too complicated to fix for little gain
+* test: Fix thread counting test by closing PC @After
+* test: Test bug due to static state overrides when run as a suite
+* format: Apply license format and run every All Idea build
+* format: Organise imports
+* fix: Apply license format when in dev laptops - CI only checks
+* fix: javadoc command for various OS and envs when JAVA_HOME missing
+* fix: By default, correctly run time JVM as jvm.location
+
+== v0.3.0.2
+
+=== Fixes and Improvements
+
+* ci: Add CODEOWNER
+* fix: #101 Validate GroupId is configured on managed consumer
+* Use 8B1DA6120C2BF624 GPG Key For Signing
+* ci: Bump jdk8 version path
+* fix: #97 Vert.x thread and connection pools setup incorrect
+* Disable Travis and Codecov
+* ci: Apache Kafka and JDK build matrix
+* fix: Set Serdes for MockProducer for AK 2.7 partition fix KAFKA-10503 to fix new NPE
+* Only log slow message warnings periodically, once per sweep
+* Upgrade Kafka container version to 6.0.2
+* Clean up stalled message warning logs
+* Reduce log-level if no results are returned from user-function (warn -> debug)
+* Enable java 8 Github
+* Fixes #87 - Upgrade UniJ version for UnsupportedClassVersion error
+* Bump TestContainers to stable release to specifically fix #3574
+* Clarify offset management capabilities
+
+== v0.3.0.1
+
+* fixes #62: Off by one error when restoring offsets when no offsets are encoded in metadata
+* fix: Actually skip work that is found as stale
+
+== v0.3.0.0
+
+=== Features
+
+* Queueing and pressure system now self tuning, performance over default old tuning values (`softMaxNumberMessagesBeyondBaseCommitOffset` and `maxMessagesToQueue`) has doubled.
+** These options have been removed from the system.
+* Offset payload encoding back pressure system
+** If the payload begins to take more than a certain threshold amount of the maximum available, no more messages will be brought in for processing, until the space needed begins to reduce back below the threshold.
+This is to try to prevent the situation where the payload is too large to fit at all, and must be dropped entirely.
+** See Proper offset encoding back pressure system so that offset payloads can't ever be too large https://github.com/confluentinc/parallel-consumer/issues/47[#47]
+** Messages that have failed to process, will always be allowed to retry, in order to reduce this pressure.
+
+=== Improvements
+
+* Default ordering mode is now `KEY` ordering (was `UNORDERED`).
+** This is a better default as it's the safest yet still high-performing mode.
+It maintains the partition ordering characteristic that all keys are processed in log order, yet for most use cases will be close to as fast as `UNORDERED` when the key space is large enough.
+* https://github.com/confluentinc/parallel-consumer/issues/37[Support BitSet encoding lengths longer than Short.MAX_VALUE #37] - adds new serialisation formats that supports wider range of offsets - (32,767 vs 2,147,483,647) for both BitSet and run-length encoding.
+* Commit modes have been renamed to make it clearer that they are periodic, not per message.
+* Minor performance improvement, switching away from concurrent collections.
+
+=== Fixes
+
+* Maximum offset payload space increased to correctly not be inversely proportional to assigned partition quantity.
+* Run-length encoding now supports compacted topics, plus other bug fixes as well as fixes to Bitset encoding.
+
+== v0.2.0.3
+
+=== Fixes
+
+** https://github.com/confluentinc/parallel-consumer/issues/35[Bitset overflow check (#35)] - gracefully drop BitSet or Runlength encoding as an option if offset difference too large (short overflow)
+*** A new serialisation format will be added in next version - see https://github.com/confluentinc/parallel-consumer/issues/37[Support BitSet encoding lengths longer than Short.MAX_VALUE #37]
+** Gracefully drops encoding attempts if they can't be run
+** Fixes a bug in the offset drop if it can't fit in the offset metadata payload
+
+== v0.2.0.2
+
+=== Fixes
+
+** Turns back on the https://github.com/confluentinc/parallel-consumer/issues/35[Bitset overflow check (#35)]
+
+== v0.2.0.1 DO NOT USE - has critical bug
+
+=== Fixes
+
+** Incorrectly turns off an over-flow check in https://github.com/confluentinc/parallel-consumer/issues/35[offset serialisation system (#35)]
+
+== v0.2.0.0
+
+=== Features
+
+** Choice of commit modes: Consumer Asynchronous, Synchronous and Producer Transactions
+** Producer instance is now optional
+** Using a _transactional_ Producer is now optional
+** Use the Kafka Consumer to commit `offsets` Synchronously or Asynchronously
+
+=== Improvements
+
+** Memory performance - garbage collect empty shards when in KEY ordering mode
+** Select tests adapted to non transactional (multiple commit modes) as well
+** Adds supervision to broker poller
+** Fixes a performance issue with the async committer not being woken up
+** Make committer thread revoke partitions and commit
+** Have onPartitionsRevoked be responsible for committing on close, instead of an explicit call to commit by controller
+** Make sure Broker Poller now drains properly, committing any waiting work
+
+=== Fixes
+
+** Fixes bug in commit linger, remove genesis offset (0) from testing (avoid races), add ability to request commit
+** Fixes #25 https://github.com/confluentinc/parallel-consumer/issues/25:
+*** Sometimes a transaction error occurs - Cannot call send in state COMMITTING_TRANSACTION #25
+** ReentrantReadWrite lock protects non-thread safe transactional producer from incorrect multithreaded use
+** Wider lock to prevent transaction's containing produced messages that they shouldn't
+** Must start tx in MockProducer as well
+** Fixes example app tests - incorrectly testing wrong thing and MockProducer not configured to auto complete
+** Add missing revoke flow to MockConsumer wrapper
+** Add missing latch timeout check
+
+== v0.1
+
+=== Features:
+
+** Have massively parallel consumption processing without running hundreds or thousands of
+*** Kafka consumer clients
+*** topic partitions
++
+without operational burden or harming the cluster's performance
+** Efficient individual message acknowledgement system (without local or third system state) to massively reduce message replay upon failure
+** Per `key` concurrent processing, per `partition` and unordered message processing
+** `Offsets` committed correctly, in order, of only processed messages, regardless of concurrency level or retries
+** Vert.x non-blocking library integration (HTTP currently)
+** Fair partition traversal
+** Zero~ dependencies (`Slf4j` and `Lombok`) for the core module
+** Java 8 compatibility
+** Throttle control and broker liveliness management
+** Clean draining shutdown cycle
diff --git a/Default.xml b/Default.xml
new file mode 100644
index 000000000..cd997255e
--- /dev/null
+++ b/Default.xml
@@ -0,0 +1,28 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
diff --git a/Jenkinsfile b/Jenkinsfile
new file mode 100644
index 000000000..16a61caa7
--- /dev/null
+++ b/Jenkinsfile
@@ -0,0 +1,66 @@
+#!/usr/bin/env groovy
+
+//common {
+// slackChannel = 'csid-build'
+// nodeLabel = 'docker-openjdk13'
+// runMergeCheck = false
+// mvnSkipDeploy = true
+}
+
+def RelaseTag = string(name: 'RELEASE_TAG', defaultValue: '',
+ description: 'Provide the tag of project that will be release to maven central,' +
+ 'only use the value when you want to release to maven central')
+
+def config = jobConfig {
+ owner = 'csid'
+// testResultSpecs = ['junit': 'test/results.xml']
+ properties = [parameters([RelaseTag])]
+ slackChannel = 'csid-build'
+ nodeLabel = 'docker-debian-jdk17'
+ runMergeCheck = true
+}
+
+def job = {
+ def maven_command = sh(script: """if test -f "${env.WORKSPACE}/mvnw"; then echo "${env.WORKSPACE}/mvnw"; else echo "mvn"; fi""", returnStdout: true).trim()
+ // If we have a RELEASE_TAG specified as a build parameter, test that the version in pom.xml matches the tag.
+ if (!params.RELEASE_TAG.trim().equals('')) {
+ sh "git checkout ${params.RELEASE_TAG}"
+ def project_version = sh(
+ script: """${maven_command} help:evaluate -Dexpression=project.version -q -DforceStdout | tail -1""",
+ returnStdout: true
+ ).trim()
+
+ if (!params.RELEASE_TAG.trim().equals(project_version)) {
+ echo 'ERROR: tag doesn\'t match project version, please correct and try again'
+ echo "Tag: ${params.RELEASE_TAG}"
+ echo "Project version: ${project_version}"
+ currentBuild.result = 'FAILURE'
+ return
+ }
+ }
+
+ stage('Build') {
+ archiveArtifacts artifacts: 'pom.xml'
+ withVaultEnv([["gpg/confluent-packaging-private-8B1DA6120C2BF624", "passphrase", "GPG_PASSPHRASE"]]) {
+ def mavenSettingsFile = "${env.WORKSPACE_TMP}/maven-global-settings.xml"
+ withMavenSettings("maven/jenkins_maven_global_settings", "settings", "MAVEN_GLOBAL_SETTINGS", mavenSettingsFile) {
+ withMaven(globalMavenSettingsFilePath: mavenSettingsFile) {
+ withDockerServer([uri: dockerHost()]) {
+ def isPrBuild = env.CHANGE_TARGET ? true : false
+ def buildPhase = isPrBuild ? "install" : "deploy"
+ if (params.RELEASE_TAG.trim().equals('')) {
+ sh "${maven_command} --batch-mode -Pjenkins -Pci -U dependency:analyze clean $buildPhase"
+ } else {
+ // it's a parameterized job, and we should deploy to maven central.
+ withGPGkey("gpg/confluent-packaging-private-8B1DA6120C2BF624") {
+ sh "${maven_command} --batch-mode clean deploy -P maven-central -Pjenkins -Pci -Dgpg.passphrase=$GPG_PASSPHRASE"
+ }
+ }
+ currentBuild.result = 'Success'
+ }
+ }
+ }
+ }
+ }
+}
+runJob config, job
diff --git a/LICENSE b/LICENSE
new file mode 100644
index 000000000..7a4a3ea24
--- /dev/null
+++ b/LICENSE
@@ -0,0 +1,202 @@
+
+ Apache License
+ Version 2.0, January 2004
+ http://www.apache.org/licenses/
+
+ TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+ 1. Definitions.
+
+ "License" shall mean the terms and conditions for use, reproduction,
+ and distribution as defined by Sections 1 through 9 of this document.
+
+ "Licensor" shall mean the copyright owner or entity authorized by
+ the copyright owner that is granting the License.
+
+ "Legal Entity" shall mean the union of the acting entity and all
+ other entities that control, are controlled by, or are under common
+ control with that entity. For the purposes of this definition,
+ "control" means (i) the power, direct or indirect, to cause the
+ direction or management of such entity, whether by contract or
+ otherwise, or (ii) ownership of fifty percent (50%) or more of the
+ outstanding shares, or (iii) beneficial ownership of such entity.
+
+ "You" (or "Your") shall mean an individual or Legal Entity
+ exercising permissions granted by this License.
+
+ "Source" form shall mean the preferred form for making modifications,
+ including but not limited to software source code, documentation
+ source, and configuration files.
+
+ "Object" form shall mean any form resulting from mechanical
+ transformation or translation of a Source form, including but
+ not limited to compiled object code, generated documentation,
+ and conversions to other media types.
+
+ "Work" shall mean the work of authorship, whether in Source or
+ Object form, made available under the License, as indicated by a
+ copyright notice that is included in or attached to the work
+ (an example is provided in the Appendix below).
+
+ "Derivative Works" shall mean any work, whether in Source or Object
+ form, that is based on (or derived from) the Work and for which the
+ editorial revisions, annotations, elaborations, or other modifications
+ represent, as a whole, an original work of authorship. For the purposes
+ of this License, Derivative Works shall not include works that remain
+ separable from, or merely link (or bind by name) to the interfaces of,
+ the Work and Derivative Works thereof.
+
+ "Contribution" shall mean any work of authorship, including
+ the original version of the Work and any modifications or additions
+ to that Work or Derivative Works thereof, that is intentionally
+ submitted to Licensor for inclusion in the Work by the copyright owner
+ or by an individual or Legal Entity authorized to submit on behalf of
+ the copyright owner. For the purposes of this definition, "submitted"
+ means any form of electronic, verbal, or written communication sent
+ to the Licensor or its representatives, including but not limited to
+ communication on electronic mailing lists, source code control systems,
+ and issue tracking systems that are managed by, or on behalf of, the
+ Licensor for the purpose of discussing and improving the Work, but
+ excluding communication that is conspicuously marked or otherwise
+ designated in writing by the copyright owner as "Not a Contribution."
+
+ "Contributor" shall mean Licensor and any individual or Legal Entity
+ on behalf of whom a Contribution has been received by Licensor and
+ subsequently incorporated within the Work.
+
+ 2. Grant of Copyright License. Subject to the terms and conditions of
+ this License, each Contributor hereby grants to You a perpetual,
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+ copyright license to reproduce, prepare Derivative Works of,
+ publicly display, publicly perform, sublicense, and distribute the
+ Work and such Derivative Works in Source or Object form.
+
+ 3. Grant of Patent License. Subject to the terms and conditions of
+ this License, each Contributor hereby grants to You a perpetual,
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+ (except as stated in this section) patent license to make, have made,
+ use, offer to sell, sell, import, and otherwise transfer the Work,
+ where such license applies only to those patent claims licensable
+ by such Contributor that are necessarily infringed by their
+ Contribution(s) alone or by combination of their Contribution(s)
+ with the Work to which such Contribution(s) was submitted. If You
+ institute patent litigation against any entity (including a
+ cross-claim or counterclaim in a lawsuit) alleging that the Work
+ or a Contribution incorporated within the Work constitutes direct
+ or contributory patent infringement, then any patent licenses
+ granted to You under this License for that Work shall terminate
+ as of the date such litigation is filed.
+
+ 4. Redistribution. You may reproduce and distribute copies of the
+ Work or Derivative Works thereof in any medium, with or without
+ modifications, and in Source or Object form, provided that You
+ meet the following conditions:
+
+ (a) You must give any other recipients of the Work or
+ Derivative Works a copy of this License; and
+
+ (b) You must cause any modified files to carry prominent notices
+ stating that You changed the files; and
+
+ (c) You must retain, in the Source form of any Derivative Works
+ that You distribute, all copyright, patent, trademark, and
+ attribution notices from the Source form of the Work,
+ excluding those notices that do not pertain to any part of
+ the Derivative Works; and
+
+ (d) If the Work includes a "NOTICE" text file as part of its
+ distribution, then any Derivative Works that You distribute must
+ include a readable copy of the attribution notices contained
+ within such NOTICE file, excluding those notices that do not
+ pertain to any part of the Derivative Works, in at least one
+ of the following places: within a NOTICE text file distributed
+ as part of the Derivative Works; within the Source form or
+ documentation, if provided along with the Derivative Works; or,
+ within a display generated by the Derivative Works, if and
+ wherever such third-party notices normally appear. The contents
+ of the NOTICE file are for informational purposes only and
+ do not modify the License. You may add Your own attribution
+ notices within Derivative Works that You distribute, alongside
+ or as an addendum to the NOTICE text from the Work, provided
+ that such additional attribution notices cannot be construed
+ as modifying the License.
+
+ You may add Your own copyright statement to Your modifications and
+ may provide additional or different license terms and conditions
+ for use, reproduction, or distribution of Your modifications, or
+ for any such Derivative Works as a whole, provided Your use,
+ reproduction, and distribution of the Work otherwise complies with
+ the conditions stated in this License.
+
+ 5. Submission of Contributions. Unless You explicitly state otherwise,
+ any Contribution intentionally submitted for inclusion in the Work
+ by You to the Licensor shall be under the terms and conditions of
+ this License, without any additional terms or conditions.
+ Notwithstanding the above, nothing herein shall supersede or modify
+ the terms of any separate license agreement you may have executed
+ with Licensor regarding such Contributions.
+
+ 6. Trademarks. This License does not grant permission to use the trade
+ names, trademarks, service marks, or product names of the Licensor,
+ except as required for reasonable and customary use in describing the
+ origin of the Work and reproducing the content of the NOTICE file.
+
+ 7. Disclaimer of Warranty. Unless required by applicable law or
+ agreed to in writing, Licensor provides the Work (and each
+ Contributor provides its Contributions) on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+ implied, including, without limitation, any warranties or conditions
+ of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+ PARTICULAR PURPOSE. You are solely responsible for determining the
+ appropriateness of using or redistributing the Work and assume any
+ risks associated with Your exercise of permissions under this License.
+
+ 8. Limitation of Liability. In no event and under no legal theory,
+ whether in tort (including negligence), contract, or otherwise,
+ unless required by applicable law (such as deliberate and grossly
+ negligent acts) or agreed to in writing, shall any Contributor be
+ liable to You for damages, including any direct, indirect, special,
+ incidental, or consequential damages of any character arising as a
+ result of this License or out of the use or inability to use the
+ Work (including but not limited to damages for loss of goodwill,
+ work stoppage, computer failure or malfunction, or any and all
+ other commercial damages or losses), even if such Contributor
+ has been advised of the possibility of such damages.
+
+ 9. Accepting Warranty or Additional Liability. While redistributing
+ the Work or Derivative Works thereof, You may choose to offer,
+ and charge a fee for, acceptance of support, warranty, indemnity,
+ or other liability obligations and/or rights consistent with this
+ License. However, in accepting such obligations, You may act only
+ on Your own behalf and on Your sole responsibility, not on behalf
+ of any other Contributor, and only if You agree to indemnify,
+ defend, and hold each Contributor harmless for any liability
+ incurred by, or claims asserted against, such Contributor by reason
+ of your accepting any such warranty or additional liability.
+
+ END OF TERMS AND CONDITIONS
+
+ APPENDIX: How to apply the Apache License to your work.
+
+ To apply the Apache License to your work, attach the following
+ boilerplate notice, with the fields enclosed by brackets "[]"
+ replaced with your own identifying information. (Don't include
+ the brackets!) The text should be enclosed in the appropriate
+ comment syntax for the file format. We also recommend that a
+ file or class name and description of purpose be included on the
+ same "printed page" as the copyright notice for easier
+ identification within third-party archives.
+
+ Copyright [yyyy] [name of copyright owner]
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
\ No newline at end of file
diff --git a/README.adoc b/README.adoc
new file mode 100644
index 000000000..81af418e0
--- /dev/null
+++ b/README.adoc
@@ -0,0 +1,1896 @@
+//
+// STOP!!! Make sure you're editing the TEMPLATE version of the README, in /src/docs/README_TEMPLATE.adoc
+//
+// Do NOT edit /README_TEMPLATE.adoc as your changes will be overwritten when the template is rendered again during
+// `process-sources`.
+//
+// Changes made to this template, must then be rendered to the base readme, by running `mvn process-sources`
+//
+// To render the README directly, run `mvn asciidoc-template::build`
+//
+
+
+// dynamic include base for editing in IDEA
+:project_root: ./
+// for editing the template to see the includes, this will correctly render includes
+ifeval::["{docname}" == "README_TEMPLATE"]
+
+TIP:: Editing template file
+
+:project_root: ../../
+
+endif::[]
+
+
+= Confluent Parallel Consumer
+:icons:
+:toc: macro
+:toclevels: 3
+:numbered: 1
+:sectlinks: true
+:sectanchors: true
+
+:github_name: parallel-consumer
+:base_url: https://github.com/confluentinc/{github_name}
+:issues_link: {base_url}/issues
+
+
+ifdef::env-github[]
+:tip-caption: :bulb:
+:note-caption: :information_source:
+:important-caption: :heavy_exclamation_mark:
+:caution-caption: :fire:
+:warning-caption: :warning:
+endif::[]
+
+image:https://maven-badges.herokuapp.com/maven-central/io.confluent.parallelconsumer/parallel-consumer-parent/badge.svg?style=flat[link=https://mvnrepository.com/artifact/io.confluent.parallelconsumer/parallel-consumer-parent,Latest Parallel Consumer on Maven Central]
+
+// Github actions disabled since codecov
+//image:https://github.com/confluentinc/parallel-consumer/actions/workflows/maven.yml/badge.svg[Java 8 Unit Test GitHub] +
+//^(^^full^ ^test^ ^suite^ ^currently^ ^running^ ^only^ ^on^ ^Confluent^ ^internal^ ^CI^ ^server^^)^
+
+// travis badges temporarily disabled as travis isn't running CI currently
+//image:https://travis-ci.com/astubbs/parallel-consumer.svg?branch=master["Build Status", link="https://travis-ci.com/astubbs/parallel-consumer"] image:https://codecov.io/gh/astubbs/parallel-consumer/branch/master/graph/badge.svg["Coverage",https://codecov.io/gh/astubbs/parallel-consumer]
+
+Parallel Apache Kafka client wrapper with client side queueing, a simpler consumer/producer API with *key concurrency* and *extendable non-blocking IO* processing.
+
+Confluent's https://www.confluent.io/confluent-accelerators/#parallel-consumer[product page for the project is here].
+
+TIP: If you like this project, please ⭐ Star it in GitHub to show your appreciation, help us gauge popularity of the project and allocate resources.
+
+NOTE: This is not a part of the Confluent commercial support offering, except through consulting engagements.
+See the <> section for more information.
+
+IMPORTANT: This project has been stable and reached its initial target feature set in Q1 2021.
+It is actively maintained by the CSID team at Confluent.
+
+[[intro]]
+This library lets you process messages in parallel via a single Kafka Consumer meaning you can increase consumer parallelism without increasing the number of partitions in the topic you intend to process.
+For many use cases this improves both throughput and latency by reducing load on your brokers.
+It also opens up new use cases like extreme parallelism, external data enrichment, and queuing.
+
+.Consume many messages _concurrently_ with a *single* consumer instance:
+[source,java,indent=0]
+----
+ parallelConsumer.poll(record ->
+ log.info("Concurrently processing a record: {}", record)
+ );
+----
+
+An overview article to the library can also be found on Confluent's https://www.confluent.io/blog/[blog]: https://www.confluent.io/blog/introducing-confluent-parallel-message-processing-client/[Introducing the Confluent Parallel Consumer].
+
+[#demo]
+== Demo
+
+.Relative speed demonstration
+--
+.Click on the animated SVG image to open the https://asciinema.org/a/404299[Asciinema.org player].
+image::https://gist.githubusercontent.com/astubbs/26cccaf8b624a53ae26a52dbc00148b1/raw/cbf558b38b0aa624bd7637406579d2a8f00f51db/demo.svg[link="https://asciinema.org/a/404299"]
+--
+
+:talk_link: https://www.confluent.io/en-gb/events/kafka-summit-europe-2021/introducing-confluent-labs-parallel-consumer-client/
+:talk_preview_image: https://play.vidyard.com/5MLb1Xh7joEQ7phxPxiyPK.jpg
+
+[#talk]
+== Video Overview
+
+.Kafka Summit Europe 2021 Presentation
+--
+.A video presentation overview can be found {talk_link}[from the Kafka Summit Europe 2021] page for the presentation, along with slides.
+[link = {talk_link}]
+image::{talk_preview_image}[Talk]
+--
+
+'''
+
+toc::[]
+
+== Motivation
+
+=== Why would I need this?
+
+The unit of parallelism in Kafka’s consumers is the partition but sometimes you want to break away from this approach and manage parallelism yourself using threads rather than new instances of a Consumer.
+Notable use cases include:
+
+* Where partition counts are difficult to change and you need more parallelism than the current configuration allows.
+
+* You wish to avoid over provisioning partitions in topics due to unknown future requirements.
+
+* You wish to reduce the broker-side resource utilization associated with highly-parallel consumer groups.
+
+* You need queue-like semantics that use message level acknowledgment, for example to process a work queue with short- and long-running tasks.
+
+When reading the below, keep in mind that the unit of concurrency and thus performance, is restricted by the number of partitions (degree of sharding / concurrency).
+Currently, you can't adjust the number of partitions in your Kafka topics without jumping through a lot of hoops, or breaking your key ordering.
+
+==== Before
+
+.The slow consumer situation with the raw Apache Kafka Consumer client
+image::https://lucid.app/publicSegments/view/98ad200f-97b2-479b-930c-2805491b2ce7/image.png[align="center"]
+
+==== After
+
+.Example usage of the Parallel Consumer
+image::https://lucid.app/publicSegments/view/2cb3b7e2-bfdf-4e78-8247-22ec394de965/image.png[align="center"]
+
+=== Background
+
+The core Kafka consumer client gives you a batch of messages to process one at a time.
+Processing these in parallel on thread pools is difficult, particularly when considering offset management and strong ordering guarantees.
+You also need to manage your consume loop, and commit transactions properly if using Exactly Once semantics.
+
+This wrapper library for the Apache Kafka Java client handles all this for you, you just supply your processing function.
+
+Another common situation where concurrent processing of messages is advantageous, is what is referred to as "competing consumers".
+A pattern that is often addressed in traditional messaging systems using a shared queue.
+Kafka doesn't provide native queue support and this can result in a slow processing message blocking the messages behind it in the same partition.
+If <> isn't a concern this can be an unwelcome bottleneck for users.
+The Parallel Consumer provides a solution to this problem.
+
+In addition, the <> to this library supplies non-blocking interfaces, allowing higher still levels of concurrency with a further simplified interface.
+Also included now is a <> https://projectreactor.io[Project Reactor.io].
+
+=== FAQ
+
+[qanda]
+Why not just run more consumers?::
+The typical way to address performance issues in a Kafka system, is to increase the number of consumers reading from a topic.
+This is effective in many situations, but falls short in a lot too.
+
+* Primarily: You cannot use more consumers than you have partitions available to read from.
+For example, if you have a topic with five partitions, you cannot use a group with more than five consumers to read from it.
+* Running extra consumers has resource implications - each consumer takes up resources on both the client and broker side.
+Each consumer adds a lot of overhead in terms of memory, CPU, and network bandwidth.
+* Large consumer groups (especially many large groups) can cause a lot of strain on the consumer group coordination system, such as rebalance storms.
+* Even with several partitions, you cannot achieve the performance levels obtainable by *per-key* ordered or unordered concurrent processing.
+* A single slow or failing message will also still block all messages behind the problematic message, ie. the entire partition.
+The process may recover, but the latency of all the messages behind the problematic one will be negatively impacted severely.
+
+Why not run more consumers __within__ your application instance?::
+* This is in some respects a slightly easier way of running more consumer instances, and in others a more complicated way.
+However, you are still restricted by all the per consumer restrictions as described above.
+
+Why not use the Vert.x library yourself in your processing loop?::
+* Vert.x is used in this library to provide a non-blocking IO system in the message processing step.
+Using Vert.x without using this library with *ordered* processing requires dealing with the quite complicated, and not straight forward, aspect of handling offset commits with Vert.x asynchronous processing system.
++
+*Unordered* processing with Vert.x is somewhat easier, however offset management is still quite complicated, and the Parallel Consumer also provides optimizations for message-level acknowledgment in this case.
+This library handles offset commits for both ordered and unordered processing cases.
+
+=== Scenarios
+
+Below are some real world use cases which illustrate concrete situations where the described advantages massively improve performance.
+
+* Slow consumer systems in transactional systems (online vs offline or reporting systems)
+** Notification system:
++
+*** Notification processing system which sends push notifications to a user to acknowledge a two-factor authentication request on their mobile and authorising a login to a website, requires optimal end-to-end latency for a good user experience.
+*** A specific message in this queue uncharacteristically takes a long time to process because the third party system is sometimes unpredictably slow to respond and so holds up the processing for *ALL* other notifications for other users that are in the same partition behind this message.
+*** Using key order concurrent processing will allow notifications to proceed while this message either slowly succeeds or times out and retries.
+** Slow GPS tracking system (slow HTTP service interfaces that can scale horizontally)
+*** GPS tracking messages from 100,000 different field devices pour through at a high rate into an input topic.
+*** For each message, the GPS location coordinates are checked to be within allowed ranges using a legacy HTTP service, dictated by business rules behind the service.
+*** The service takes 50ms to process each message, however can be scaled out horizontally without restriction.
+*** The input topic only has 10 partitions and for various reasons (see above) cannot be changed.
+*** With the vanilla consumer, messages on each partition must be consumed one after the other in serial order.
+*** The maximum rate of message processing is then:
++
+`1 second / 50 ms * 10 partitions = 200 messages per second.`
+*** By using this library, the 10 partitions can all be processed in key order.
++
+`1 second / 50ms × 100,000 keys = 2,000,000 messages per second`
++
+While the HTTP system probably cannot handle 2,000,000 messages per second, more importantly, your system is no longer the bottleneck.
+
+** Slow CPU bound model processing for fraud prediction
+*** Consider a system where message data is passed through a fraud prediction model which takes CPU cycles, instead of an external system being slow.
+*** We can easily scale the number of CPUs on our virtual machine where the processing is being run, but we choose not to scale the partitions or consumers (see above).
+*** By deploying onto machines with far more CPUs available, we can run our prediction model massively parallel, increasing our throughput and reducing our end-to-end response times.
+* Spikey load with latency sensitive non-functional requirements
+** An upstream system regularly floods our input topic daily at close of business with settlement totals data from retail outlets.
+*** Situations like this are common where systems are designed to comfortably handle average day time load, but are not provisioned to handle sudden increases in traffic as they don't happen often enough to justify the increased spending on processing capacity that would otherwise remain idle.
+*** Without adjusting the available partitions or running consumers, we can reduce our maximum end-to-end latency and increase throughput to get our global day's outlet reports to division managers so action can be taken, before close of business.
+** Natural consumer behaviour
+*** Consider scenarios where bursts of data flooding input topics are generated by sudden user behaviour such as sales or television events ("Oprah" moments).
+*** For example, an evening, prime-time game show on TV where users send in quiz answers on their devices.
+The end-to-end latency of the responses to these answers needs to be as low as technically possible, even if the processing step is quick.
+*** Instead of a vanilla client where each user response waits in a virtual queue with others to be processed, this library allows every single response to be processed in parallel.
+* Legacy partition structure
+** Any existing setups where we need higher performance either in throughput or latency where there are not enough partitions for needed concurrency level, the tool can be applied.
+* Partition overloaded brokers
+** Clusters with under-provisioned hardware and with too many partitions already - where we cannot expand partitions even if we were able to.
+** Similar to the above, but from the operations perspective, our system is already over partitioned, perhaps in order to support existing parallel workloads which aren't using the tool (and so need large numbers of partitions).
+** We encourage our development teams to migrate to the tool, and then begin a process of actually __lowering__ the number of partitions in our topics in order to reduce operational complexity, improve reliability and perhaps save on infrastructure costs.
+* Server side resources are controlled by a different team we can't influence
+** The cluster our team is working with is not in our control, we cannot change the partition setup, or perhaps even the consumer layout.
+** We can use the tool ourselves to improve our system performance without touching the cluster / topic setup.
+* Kafka Streams app that had a slow stage
+** We use Kafka Streams for our message processing, but one of its steps has characteristics of the above and we need better performance.
+We can break out as described below into the tool for processing that step, then return to the Kafka Streams context.
+* Provisioning extra machines (either virtual machines or real machines) to run multiple clients has a cost, using this library instead avoids the need for extra instances to be deployed in any respect.
+
+== Features List
+
+* Have massively parallel consumption processing without running hundreds or thousands of:
+** Kafka consumer clients,
+** topic partitions,
++
+without operational burden or harming the cluster's performance
+* Client side queueing system on top of Apache Kafka consumer
+** Efficient individual message acknowledgement system (without local or third party external system state storage) to massively reduce (and usually completely eliminate) message replay upon failure - see <> section for more details
+* Solution for the https://en.wikipedia.org/wiki/Head-of-line_blocking["head of line"] blocking problem where continued failure of a single message, prevents progress for messages behind it in the queue
+* Per `key` concurrent processing, per partition and unordered message processing
+* Offsets committed correctly, in order, of only processed messages, regardless of concurrency level or retries
+* Batch support in all versions of the API to process batches of messages in parallel instead of single messages.
+** Particularly useful for when your processing function can work with more than a single record at a time - e.g. sending records to an API which has a batch version like Elasticsearch
+* Vert.x and Reactor.io non-blocking library integration
+** Non-blocking I/O work management
+** Vert.x's WebClient and general Vert.x Future support
+** Reactor.io Publisher (Mono/Flux) and Java's CompletableFuture (through `Mono#fromFuture`)
+* Exactly Once bulk transaction system
+** When using the transactional mode, record processing that happens in parallel and produce records back to kafka get all grouped into a large batch transaction, and the offsets and records are submitted through the transactional producer, giving you Exactly once Semantics for parallel processing.
+** For further information, see the <> section.
+* Fair partition traversal
+* Zero~ dependencies (`Slf4j` and `Lombok`) for the core module
+* Java 8 compatibility
+* Throttle control and broker liveliness management
+* Clean draining shutdown cycle
+* Manual global pause / resume of all partitions, without unsubscribing from topics (useful for implementing a simplistic https://en.wikipedia.org/wiki/Circuit_breaker_design_pattern[circuit breaker])
+** Circuit breaker patterns for individual partitions or keys can be done through throwing failure exceptions in the processing function (see https://github.com/confluentinc/parallel-consumer/pull/291[PR #291 Explicit terminal and retriable exceptions] for further refinement)
+** Note: Pausing of a partition is also automatic, whenever back pressure has built up on a given partition
+
+//image:https://codecov.io/gh/astubbs/parallel-consumer/branch/master/graph/badge.svg["Coverage",https://codecov.io/gh/astubbs/parallel-consumer]
+//image:https://travis-ci.com/astubbs/parallel-consumer.svg?branch=master["Build Status", link="https://travis-ci.com/astubbs/parallel-consumer"]
+
+And more <>!
+
+== Performance
+
+In the best case, you don't care about ordering at all. In which case, the degree of concurrency achievable is simply set by max thread and concurrency settings, or with the Vert.x extension, the Vert.x Verticle being used - e.g. non-blocking HTTP calls.
+
+For example, instead of having to run 1,000 consumers to process 1,000 messages at the same time, we can process all 1,000 concurrently on a single consumer instance.
+
+More typically though you probably still want the per key ordering guarantees that Kafka provides.
+For this there is the per key ordering setting.
+This will limit the library from processing any message at the same time or out of order, if they have the same key.
+
+Massively reduce message processing latency regardless of partition count for spikey workloads where there is good key distribution.
+Eg 100,000 “users” all trigger an action at once.
+As long as the processing layer can handle the load horizontally (e.g auto scaling web service), per message latency will be massively decreased, potentially down to the time for processing a single message, if the integration point can handle the concurrency.
+
+For example, if you have a key set of 10,000 unique keys, and you need to call an http endpoint to process each one, you can use the per key order setting, and in the best case the system will process 10,000 at the same time using the non-blocking Vert.x HTTP client library.
+The user just has to provide a function to extract from the message the HTTP call parameters and construct the HTTP request object.
+
+=== Illustrative Performance Example
+
+.(see link:./parallel-consumer-core/src/test-integration/java/io/confluent/parallelconsumer/integrationTests/VolumeTests.java[VolumeTests.java])
+These performance comparison results below, even though are based on real performance measurement results, are for illustrative purposes.
+To see how the performance of the tool is related to instance counts, partition counts, key distribution and how it would relate to the vanilla client.
+Actual results will vary wildly depending upon the setup being deployed into.
+
+For example, if you have hundreds of thousands of keys in your topic, randomly distributed, even with hundreds of partitions, with only a handful of this wrapper deployed, you will probably see many orders of magnitude performance improvements - massively out performing dozens of vanilla Kafka consumer clients.
+
+.Time taken to process a large number of messages with a Single Parallel Consumer vs a single Kafka Consumer, for different key space sizes. As the number of unique keys in the data set increases, the key ordered Parallel Consumer performance starts to approach that of the unordered Parallel Consumer. The raw Kafka consumer performance remains unaffected by the key distribution.
+image::https://docs.google.com/spreadsheets/d/e/2PACX-1vQffkAFG-_BzH-LKfGCVnytdzAHiCNIrixM6X2vF8cqw2YVz6KyW3LBXTB-lVazMAJxW0UDuFILKvtK/pubchart?oid=1691474082&format=image[align="center"]
+
+.Consumer group size effect on total processing time vs a single Parallel Consumer. As instances are added to the consumer group, its performance starts to approach that of the single instance Parallel Consumer. Key ordering is faster than partition ordering, with unordered being the fastest.
+image::https://docs.google.com/spreadsheets/d/e/2PACX-1vQffkAFG-_BzH-LKfGCVnytdzAHiCNIrixM6X2vF8cqw2YVz6KyW3LBXTB-lVazMAJxW0UDuFILKvtK/pubchart?oid=938493158&format=image[align="center"]
+
+.Consumer group size effect on message latency vs a single Parallel Consumer. As instances are added to the consumer group, its performance starts to approach that of the single instance Parallel Consumer.
+image::https://docs.google.com/spreadsheets/d/e/2PACX-1vQffkAFG-_BzH-LKfGCVnytdzAHiCNIrixM6X2vF8cqw2YVz6KyW3LBXTB-lVazMAJxW0UDuFILKvtK/pubchart?oid=1161363385&format=image[align="center"]
+
+As an illustrative example of relative performance, given:
+
+* A random processing time between 0 and 5ms
+* 10,000 messages to process
+* A single partition (simplifies comparison - a topic with 5 partitions is the same as 1 partition with a keyspace of 5)
+* Default `ParallelConsumerOptions`
+** maxConcurrency = 100
+** numberOfThreads = 16
+
+.Comparative performance of order modes and key spaces
+[cols="1,1,1,3",options="header"]
+|===
+|Ordering
+|Number of keys
+|Duration
+|Note
+
+|Partition
+|20 (not relevant)
+|22.221s
+|This is the same as a single partition with a single normal serial consumer, as we can see: 2.5ms avg processing time * 10,000 msg / 1000ms = ~25s.
+
+|Key
+|1
+|26.743s
+|Same as above
+
+|Key
+|2
+|13.576s
+|
+
+|Key
+|5
+|5.916s
+|
+
+|Key
+|10
+|3.310s
+|
+
+|Key
+|20
+|2.242s
+|
+
+|Key
+|50
+|2.204s
+|
+
+|Key
+|100
+|2.178s
+|
+
+|Key
+|1,000
+|2.056s
+|
+
+|Key
+|10,000
+|2.128s
+|As key space is the same as the number of messages, this is similar (but restricted by max concurrency settings) as having a *single consumer* instance and *partition* _per key_. 10,000 msgs * avg processing time 2.5ms = ~2.5s.
+
+|Unordered
+|20 (not relevant)
+|2.829s
+|As there is no order restriction, this is similar (but restricted by max concurrency settings) as having a *single consumer* instance and *partition* _per key_. 10,000 msgs * avg processing time 2.5ms = ~2.5s.
+|===
+
+== Support and Issues
+
+If you encounter any issues, or have any suggestions or future requests, please create issues in the {issues_link}[github issue tracker].
+Issues will be dealt with on a good faith, best efforts basis, by the small team maintaining this library.
+
+We also encourage participation, so if you have any feature ideas etc, please get in touch, and we will help you work on submitting a PR!
+
+NOTE: We are very interested to hear about your experiences!
+And please vote on your favourite issues!
+
+If you have questions, head over to the https://launchpass.com/confluentcommunity[Confluent Slack community], or raise an https://github.com/confluentinc/parallel-consumer/issues[issue] on GitHub.
+
+== License
+
+This library is copyright Confluent Inc, and licensed under the Apache License Version 2.0.
+
+== Usage
+
+=== Maven
+
+This project is available in maven central, https://repo1.maven.org/maven2/io/confluent/parallelconsumer/[repo1], along with SNAPSHOT builds (starting with 0.5-SNAPSHOT) in https://oss.sonatype.org/content/repositories/snapshots/io/confluent/parallelconsumer/[repo1's SNAPSHOTS repo].
+
+Latest version can be seen https://search.maven.org/artifact/io.confluent.parallelconsumer/parallel-consumer-core[here].
+
+Where `${project.version}` is the version to be used:
+
+* group ID: `io.confluent.parallelconsumer`
+* artifact ID: `parallel-consumer-core`
+* version: image:https://maven-badges.herokuapp.com/maven-central/io.confluent.parallelconsumer/parallel-consumer-parent/badge.svg?style=flat[link=https://mvnrepository.com/artifact/io.confluent.parallelconsumer/parallel-consumer-parent,Latest Parallel Consumer on Maven Central]
+
+.Core Module Dependency
+[source,xml,indent=0]
+
+ io.confluent.parallelconsumer
+ parallel-consumer-core
+ ${project.version}
+
+
+.Reactor Module Dependency
+[source,xml,indent=0]
+
+ io.confluent.parallelconsumer
+ parallel-consumer-reactor
+ ${project.version}
+
+
+.Vert.x Module Dependency
+[source,xml,indent=0]
+
+ io.confluent.parallelconsumer
+ parallel-consumer-vertx
+ ${project.version}
+
+
+[[common_preparation]]
+=== Common Preparation
+
+.Setup the client
+[source,java,indent=0]
+----
+ Consumer kafkaConsumer = getKafkaConsumer(); // <1>
+ Producer kafkaProducer = getKafkaProducer();
+
+ var options = ParallelConsumerOptions.builder()
+ .ordering(KEY) // <2>
+ .maxConcurrency(1000) // <3>
+ .consumer(kafkaConsumer)
+ .producer(kafkaProducer)
+ .build();
+
+ ParallelStreamProcessor eosStreamProcessor =
+ ParallelStreamProcessor.createEosStreamProcessor(options);
+
+ eosStreamProcessor.subscribe(of(inputTopic)); // <4>
+
+ return eosStreamProcessor;
+----
+
+<1> Setup your clients as per normal.
+A Producer is only required if using the `produce` flows.
+<2> Choose your ordering type, `KEY` in this case.
+This ensures maximum concurrency, while ensuring messages are processed and committed in `KEY` order, making sure no offset is committed unless all offsets before it in its partition, are completed also.
+<3> The maximum number of concurrent processing operations to be performing at any given time.
+Also, because the library coordinates offsets, `enable.auto.commit` must be disabled in your consumer.
+<4> Subscribe to your topics
+
+NOTE: Because the library coordinates offsets, `enable.auto.commit` must be disabled.
+
+After this setup, one then has the choice of interfaces:
+
+* `ParallelStreamProcessor`
+* `VertxParallelStreamProcessor`
+* `JStreamParallelStreamProcessor`
+* `JStreamVertxParallelStreamProcessor`
+
+There is another interface: `ParallelConsumer` which is integrated, however there is currently no immediate implementation.
+See {issues_link}/12[issue #12], and the `ParallelConsumer` JavaDoc:
+
+[source,java]
+----
+/**
+ * Asynchronous / concurrent message consumer for Kafka.
+ *
+ * Currently, there is no direct implementation, only the {@link ParallelStreamProcessor} version (see
+ * {@link AbstractParallelEoSStreamProcessor}), but there may be in the future.
+ *
+ * @param key consume / produce key type
+ * @param value consume / produce value type
+ * @see AbstractParallelEoSStreamProcessor
+ */
+----
+
+=== Core
+
+==== Simple Message Process
+
+This is the only thing you need to do, in order to get massively concurrent processing in your code.
+
+.Usage - print message content out to the console in parallel
+[source,java,indent=0]
+ parallelConsumer.poll(record ->
+ log.info("Concurrently processing a record: {}", record)
+ );
+
+See the link:{project_root}/parallel-consumer-examples/parallel-consumer-example-core/src/main/java/io/confluent/parallelconsumer/examples/core/CoreApp.java[core example] project, and its test.
+
+==== Process and Produce a Response Message
+
+This interface allows you to process your message, then publish back to the broker zero, one or more result messages.
+You can also optionally provide a callback function to be run after the message(s) is(are) successfully published to the broker.
+
+.Usage - print message content out to the console in parallel
+[source,java,indent=0]
+ parallelConsumer.pollAndProduce(context -> {
+ var consumerRecord = context.getSingleRecord().getConsumerRecord();
+ var result = processBrokerRecord(consumerRecord);
+ return new ProducerRecord<>(outputTopic, consumerRecord.key(), result.payload);
+ }, consumeProduceResult -> {
+ log.debug("Message {} saved to broker at offset {}",
+ consumeProduceResult.getOut(),
+ consumeProduceResult.getMeta().offset());
+ }
+ );
+
+==== Callbacks vs Streams
+
+You have the option to either use callbacks to be notified of events, or use the `Streaming` versions of the API, which use the `java.util.stream.Stream` system:
+
+* `JStreamParallelStreamProcessor`
+* `JStreamVertxParallelStreamProcessor`
+
+In future versions, we plan to look at supporting other streaming systems like https://github.com/ReactiveX/RxJava[RxJava] via modules.
+
+[[batching]]
+=== Batching
+
+The library also supports sending a batch of records as input to the users processing function in parallel.
+Using this, you can process several records in your function at once.
+
+To use it, set a `batch size` in the options class.
+
+There are then various access methods for the batch of records - see the `PollContext` object for more information.
+
+IMPORTANT: If an exception is thrown while processing the batch, all messages in the batch will be returned to the queue, to be retried with the standard retry system.
+There is no guarantee that the messages will be retried again in the same batch.
+
+==== Usage
+
+[source,java,indent=0]
+----
+ ParallelStreamProcessor.createEosStreamProcessor(ParallelConsumerOptions.builder()
+ .consumer(getKafkaConsumer())
+ .producer(getKafkaProducer())
+ .maxConcurrency(100)
+ .batchSize(5) // <1>
+ .build());
+ parallelConsumer.poll(context -> {
+ // convert the batch into the payload for our processing
+ List payload = context.stream()
+ .map(this::preparePayload)
+ .collect(Collectors.toList());
+ // process the entire batch payload at once
+ processBatchPayload(payload);
+ });
+----
+
+<1> Choose your batch size.
+
+==== Restrictions
+
+- If using a batch version of the API, you must choose a batch size in the options class.
+- If a batch size is chosen, the "normal" APIs cannot be used, and an error will be thrown.
+
+[[http-with-vertx]]
+=== HTTP with the Vert.x Module
+
+.Call an HTTP endpoint for each message usage
+[source,java,indent=0]
+----
+ var resultStream = parallelConsumer.vertxHttpReqInfoStream(context -> {
+ var consumerRecord = context.getSingleConsumerRecord();
+ log.info("Concurrently constructing and returning RequestInfo from record: {}", consumerRecord);
+ Map params = UniMaps.of("recordKey", consumerRecord.key(), "payload", consumerRecord.value());
+ return new RequestInfo("localhost", port, "/api", params); // <1>
+ });
+----
+
+<1> Simply return an object representing the request, the Vert.x HTTP engine will handle the rest, using its non-blocking engine
+
+See the link:{project_root}/parallel-consumer-examples/parallel-consumer-example-vertx/src/main/java/io/confluent/parallelconsumer/examples/vertx/VertxApp.java[Vert.x example] project, and its test.
+
+[[project-reactor]]
+=== Project Reactor
+
+As per the Vert.x support, there is also a Reactor module.
+This means you can use Reactor's non-blocking threading model to process your messages, allowing for orders of magnitudes higher concurrent processing than the core module's thread-per-worker model.
+
+See the link:{project_root}/parallel-consumer-examples/parallel-consumer-example-reactor/src/main/java/io/confluent/parallelconsumer/examples/reactor/ReactorApp.java[Reactor example] project, and its test.
+
+.Call any Reactor API for each message usage. This example uses a simple `Mono.just` to return a value, but you can use any Reactor API here.
+[source,java,indent=0]
+----
+ parallelConsumer.react(context -> {
+ var consumerRecord = context.getSingleRecord().getConsumerRecord();
+ log.info("Concurrently constructing and returning RequestInfo from record: {}", consumerRecord);
+ Map<String, String> params = UniMaps.of("recordKey", consumerRecord.key(), "payload", consumerRecord.value());
+ return Mono.just("something todo"); // <1>
+ });
+----
+
+[[spring]]
+[[streams-usage-code]]
+=== Kafka Streams Concurrent Processing
+
+Use your Streams app to process your data first, then send anything needed to be processed concurrently to an output topic, to be consumed by the parallel consumer.
+
+.Example usage with Kafka Streams
+image::https://lucid.app/publicSegments/view/43f2740c-2a7f-4b7f-909e-434a5bbe3fbf/image.png[Kafka Streams Usage,align="center"]
+
+.Preprocess in Kafka Streams, then process concurrently
+[source,java,indent=0]
+----
+ void run() {
+ preprocess(); // <1>
+ concurrentProcess(); // <2>
+ }
+
+ void preprocess() {
+ StreamsBuilder builder = new StreamsBuilder();
+ builder.stream(inputTopic)
+ .mapValues((key, value) -> {
+ log.info("Streams preprocessing key: {} value: {}", key, value);
+ return String.valueOf(value.length());
+ })
+ .to(outputTopicName);
+
+ startStreams(builder.build());
+ }
+
+ void startStreams(Topology topology) {
+ streams = new KafkaStreams(topology, getStreamsProperties());
+ streams.start();
+ }
+
+ void concurrentProcess() {
+ setupParallelConsumer();
+
+ parallelConsumer.poll(record -> {
+ log.info("Concurrently processing a record: {}", record);
+ messageCount.getAndIncrement();
+ });
+ }
+----
+
+<1> Setup your Kafka Streams stage as per normal, performing any type of preprocessing in Kafka Streams
+<2> For the slow consumer part of your Topology, drop down into the parallel consumer, and use massive concurrency
+
+See the link:{project_root}/parallel-consumer-examples/parallel-consumer-example-streams/src/main/java/io/confluent/parallelconsumer/examples/streams/StreamsApp.java[Kafka Streams example] project, and its test.
+
+[[confluent-cloud]]
+=== Confluent Cloud
+
+. Provision your fully managed Kafka cluster in Confluent Cloud
+.. Sign up for https://www.confluent.io/confluent-cloud/tryfree/[Confluent Cloud], a fully-managed Apache Kafka service.
+.. After you log in to Confluent Cloud, click on `Add cloud environment` and name the environment `learn-kafka`.
+Using a new environment keeps your learning resources separate from your other Confluent Cloud resources.
+.. Click on https://confluent.cloud/learn[LEARN] and follow the instructions to launch a Kafka cluster and to enable Schema Registry.
+. Access the client configuration settings
+.. From the Confluent Cloud Console, navigate to your Kafka cluster.
+From the `Clients` view, get the connection information customized to your cluster (select `Java`).
+.. Create new credentials for your Kafka cluster, and then Confluent Cloud will show a configuration block with your new credentials automatically populated (make sure `show API keys` is checked).
+.. Use these settings presented to https://docs.confluent.io/clients-kafka-java/current/overview.html[configure your clients].
+. Use these clients for steps outlined in the <> section.
+
+[[upgrading]]
+== Upgrading
+
+=== From 0.4 to 0.5
+
+This version has a breaking change in the API - instead of passing in `ConsumerRecord` instances, it passes in a `PollContext` object which has extra information and utility methods.
+See the `PollContext` class for more information.
+
+[[ordering-guarantees]]
+== Ordering Guarantees
+
+The user has the option to either choose ordered, or unordered message processing.
+
+Either in `ordered` or `unordered` processing, the system will only commit offsets for messages which have been successfully processed.
+
+CAUTION: `Unordered` processing could cause problems for third party integration where ordering by key is required.
+
+CAUTION: Beware of third party systems which are not idempotent, or are key order sensitive.
+
+IMPORTANT: The below diagrams represent a single iteration of the system and a very small number of input partitions and messages.
+
+=== Vanilla Kafka Consumer Operation
+
+Given this input topic with three partitions and a series of messages:
+
+.Input topic
+image::https://lucid.app/publicSegments/view/37d13382-3067-4c93-b521-7e43f2295fff/image.png[align="center"]
+
+The normal Kafka client operates in the following manner.
+Note that typically offset commits are not performed after processing a single message, but is illustrated in this manner for comparison to the single pass concurrent methods below.
+Usually many messages are committed in a single go, which is much more efficient, but for our illustrative purposes is not really relevant, as we are demonstrating sequential vs concurrent _processing_ of messages.
+
+.Normal execution of the raw Kafka client
+image::https://lucid.app/publicSegments/view/0365890d-e8ff-4a06-b24a-8741175dacc3/image.png[align="center"]
+
+=== Unordered
+
+Unordered processing is where there is no restriction on the order of multiple messages processed per partition, allowing for highest level of concurrency.
+
+This is the fastest option.
+
+.Unordered concurrent processing of message
+image::https://lucid.app/publicSegments/view/aab5d743-de05-46d0-8c1e-0646d7d2946f/image.png[align="center"]
+
+=== Ordered by Partition
+
+At most only one message from any given input partition will be in flight at any given time.
+This means that concurrent processing is restricted to the number of input partitions.
+
+The advantage of ordered processing mode, is that for an assignment of 1000 partitions to a single consumer, you do not need to run 1000 consumer instances or threads, to process the partitions in parallel.
+
+Note that for a given partition, a slow processing message _will_ prevent messages behind it from being processed.
+However, messages in other partitions assigned to the consumer _will_ continue processing.
+
+This option is most like normal operation, except if the consumer is assigned more than one partition, it is free to process all partitions in parallel.
+
+.Partition ordered concurrent processing of messages
+image::https://lucid.app/publicSegments/view/30ad8632-e8fe-4e05-8afd-a2b6b3bab309/image.png[align="center"]
+
+=== Ordered by Key
+
+Most similar to ordered by partition, this mode ensures process ordering by *key* (per partition).
+
+The advantage of this mode, is that a given input topic may not have many partitions, but it may have a large number of unique keys.
+Each of these key -> message sets can actually be processed concurrently, bringing concurrent processing to a per key level, without having to increase the number of input partitions, whilst keeping strong ordering by key.
+
+As usual, the offset tracking will be correct, regardless of the ordering of unique keys on the partition or adjacency to the committed offset, such that after failure or rebalance, the system will not replay messages already marked as successful.
+
+This option provides the performance of maximum concurrency, while maintaining message processing order per key, which is sufficient for many applications.
+
+.Key ordering concurrent processing of messages
+image::https://lucid.app/publicSegments/view/f7a05e99-24e6-4ea3-b3d0-978e306aa568/image.png[align="center"]
+
+=== Retries and Ordering
+
+Even during retries, offsets will always be committed only after successful processing, and in order.
+
+== Retries
+
+If processing of a record fails, the record will be placed back into its queue and retried with a configurable delay (see the `ParallelConsumerOptions` class).
+Ordering guarantees will always be adhered to, regardless of failure.
+
+A failure is denoted by *any* exception being thrown from the user's processing function.
+The system catches these exceptions, logs them and replaces the record in the queue for processing later.
+All types of Exceptions thrown are considered retriable.
+To not retry a record, do not throw an exception from your processing function.
+
+TIP: To avoid the system logging an error, throw an exception which extends PCRetriableException.
+
+TIP: If there was an error processing a record, and you'd like to skip it - do not throw an exception, and the system will mark the record as succeeded.
+
+If for some reason you want to proactively fail a record, without relying on some other system throwing an exception which you don't catch - simply throw an exception of your own design, which the system will treat the same way.
+
+To configure the retry delay, see `ParallelConsumerOptions#defaultRetryDelay`.
+
+At the moment there is no terminal error support, so messages will continue to be retried forever as long as an exception continues to be thrown from the user function (see <<skipping-records>>).
+But still this will not hold up the queues in `KEY` or `UNORDERED` modes, however in `PARTITION` mode it *will* block progress.
+Offsets will also continue to be committed (see <> and <>).
+
+=== Retry Delay Function
+
+As part of the https://github.com/confluentinc/parallel-consumer/issues/65[enhanced retry epic], the ability to https://github.com/confluentinc/parallel-consumer/issues/82[dynamically determine the retry delay] was added.
+This can be used to customise retry delay for a record, such as exponential back off or have different delays for different types of records, or have the delay determined by the status of a system etc.
+
+You can access the retry count of a record through its wrapped `WorkContainer` class, which is the input variable to the retry delay function.
+
+.Example retry delay function implementing exponential backoff
+[source,java,indent=0]
+----
+ final double multiplier = 2; // must be greater than 1, so the delay grows (backs off) with each failed attempt
+ final int baseDelaySecond = 1;
+
+ ParallelConsumerOptions.builder()
+ .retryDelayProvider(recordContext -> {
+ int numberOfFailedAttempts = recordContext.getNumberOfFailedAttempts();
+ long delayMillis = (long) (baseDelaySecond * Math.pow(multiplier, numberOfFailedAttempts) * 1000);
+ return Duration.ofMillis(delayMillis);
+ });
+----
+
+[[skipping-records]]
+=== Skipping Records
+
+If for whatever reason you want to skip a record, simply do not throw an exception, or catch any exception being thrown, log and swallow it and return from the user function normally.
+The system will treat this as a record processing success, mark the record as completed and move on as though it was a normal operation.
+
+A user may choose to skip a record for example, if it has been retried too many times or if the record is invalid or doesn't need processing.
+
+Implementing a https://github.com/confluentinc/parallel-consumer/issues/196[max retries feature] as a part of the system is planned.
+
+.Example of skipping a record after a maximum number of retries is reached
+[source,java,indent=0]
+----
+ final int maxRetries = 10;
+ final Map<ConsumerRecord<String, String>, Long> retriesCount = new ConcurrentHashMap<>();
+
+ pc.poll(context -> {
+ var consumerRecord = context.getSingleRecord().getConsumerRecord();
+ Long retryCount = retriesCount.computeIfAbsent(consumerRecord, ignore -> 0L);
+ if (retryCount < maxRetries) {
+ try {
+ processRecord(consumerRecord);
+ // no exception, so completed - remove from map
+ retriesCount.remove(consumerRecord);
+ } catch (Exception e) {
+ // failed - count the attempt, then rethrow so the system retries the record
+ retriesCount.put(consumerRecord, retryCount + 1);
+ throw e;
+ }
+ } else {
+ log.warn("Retry count {} exceeded max of {} for record {}", retryCount, maxRetries, consumerRecord);
+ // giving up, remove from map
+ retriesCount.remove(consumerRecord);
+ }
+ });
+----
+
+=== Circuit Breaker Pattern
+
+Although the system doesn't have an https://github.com/confluentinc/parallel-consumer/issues/110[explicit circuit breaker pattern feature], one can be created by combining the custom retry delay function and proactive failure.
+For example, the retry delay can be calculated based upon the status of an external system - i.e. if the external system is currently out of action, use a higher retry.
+Then in the processing function, again check the status of the external system first, and if it's still offline, throw an exception proactively without attempting to process the message.
+This will put the message back in the queue.
+
+.Example of circuit break implementation
+[source,java,indent=0]
+----
+ final Map<String, Boolean> upMap = new ConcurrentHashMap<>();
+
+ pc.poll(context -> {
+ var consumerRecord = context.getSingleRecord().getConsumerRecord();
+ String serverId = extractServerId(consumerRecord);
+ boolean up = upMap.computeIfAbsent(serverId, ignore -> true);
+
+ if (!up) {
+ up = updateStatusOfServer(serverId);
+ }
+
+ if (up) {
+ try {
+ processRecord(consumerRecord);
+ // no exception, so set server status UP
+ upMap.put(serverId, true);
+ } catch (CircuitBreakingException e) {
+ log.warn("Server {} is circuitBroken, will retry message when server is up. Record: {}", serverId, consumerRecord);
+ upMap.put(serverId, false);
+ throw e; // rethrow so the record is put back in the queue for retry
+ }
+ } else {
+ throw new RuntimeException(msg("Server {} currently down, will retry record later {}", serverId, consumerRecord));
+ }
+ });
+----
+
+=== Head of Line Blocking
+
+In order to have a failing record not block progress of a partition, one of the ordering modes other than `PARTITION` must be used, so that the system is allowed to process other messages that are perhaps in `KEY` order or in the case of `UNORDERED` processing - any message.
+This is because in `PARTITION` ordering mode, records are always processed in order of partition, and so the Head of Line blocking feature is effectively disabled.
+
+=== Future Work
+
+Improvements to this system are planned, see the following issues:
+
+* https://github.com/confluentinc/parallel-consumer/issues/65[Enhanced retry epic #65]
+* https://github.com/confluentinc/parallel-consumer/issues/48[Support scheduled message processing (scheduled retry)]
+* https://github.com/confluentinc/parallel-consumer/issues/196[Provide option for max retires, and a call back when reached (potential DLQ) #196]
+* https://github.com/confluentinc/parallel-consumer/issues/34[Monitor for progress and optionally shutdown (leave consumer group), skip message or send to DLQ #34]
+
+== Result Models
+
+* Void
+
+Processing is complete simply when your provided function finishes, and the offsets are committed.
+
+* Streaming User Results
+
+When your function is actually run, a result object will be streamed back to your client code, with information about the operation completion.
+
+* Streaming Message Publishing Results
+
+After your operation completes, you can also choose to publish a result message back to Kafka.
+The message publishing metadata can be streamed back to your client code.
+
+[[commit-mode]]
+== Commit Mode
+
+The system gives you three choices for how to do offset commits.
+The simplest of the three are the two Consumer commits modes.
+They are of course, `synchronous` and `asynchronous` mode.
+The `transactional` mode is explained in the next section.
+
+`Asynchronous` mode is faster, as it doesn't block the control loop.
+
+`Synchronous` will block the processing loop until a successful commit response is received, however, `Asynchronous` will still be capped by the max processing settings in the `ParallelConsumerOptions` class.
+
+If you're used to using the auto commit mode in the normal Kafka consumer, you can think of the `Asynchronous` mode being similar to this.
+We suggest starting with this mode, and it is the default.
+
+[[transaction-system]]
+=== Apache Kafka EoS Transaction Model in BULK
+
+There is also the option to use Kafka's Exactly Once Semantics (EoS) system.
+This causes all messages produced, by all workers in parallel, as a result of processing their messages, to be committed within a SINGLE, BULK transaction, along with their source offset.
+
+Note importantly - this is a BULK transaction, not a per input record transaction.
+
+This means that even under failure, the results will exist exactly once in the Kafka output topic.
+If as a part of your processing, you create side effects in other systems, this pertains to the usual idempotency requirements when breaking of EoS Kafka boundaries.
+
+CAUTION: This is a BULK transaction, not a per input record transaction.
+There is not a single transaction per input record and per worker "thread", but one *LARGE* transaction that gets used by all parallel processing, until the commit interval.
+
+NOTE: As with the `synchronous` processing mode, this will also block the processing loop until a successful transaction completes
+
+CAUTION: This cannot be true for any externally integrated third party system, unless that system is __idempotent__.
+
+For implementation details, see the <> section.
+
+.From the Options Javadoc
+[source,java,indent=0]
+----
+ /**
+ * Periodically commits through the Producer using transactions.
+ *
+ * Messages sent in parallel by different workers get added to the same transaction block - you end up with
+ * transactions 100ms (by default) "large", containing all records sent during that time period, from the
+ * offsets being committed.
+ *
+ * Of no use, if not also producing messages (i.e. using a {@link ParallelStreamProcessor#pollAndProduce}
+ * variation).
+ *
+ * Note: Records being sent by different threads will all be in a single transaction, as PC shares a single
+ * Producer instance. This could be seen as a performance overhead advantage, efficient resource use, in
+ * exchange for a loss in transaction granularity.
+ *
+ * The benefits of using this mode are:
+ *
+ * a) All records produced from a given source offset will either all be visible, or none will be
+ * ({@link org.apache.kafka.common.IsolationLevel#READ_COMMITTED}).
+ *
+ * b) If any records making up a transaction have a terminal issue being produced, or the system crashes before
+ * finishing sending all the records and committing, none will ever be visible and the system will eventually
+ * retry them in new transactions - potentially with different combinations of records from the original.
+ *
+ * c) A source offset, and it's produced records will be committed as an atomic set. Normally: either the record
+ * producing could fail, or the committing of the source offset could fail, as they are separate individual
+ * operations. When using Transactions, they are committed together - so if either operations fails, the
+ * transaction will never get committed, and upon recovery, the system will retry the set again (and no
+ * duplicates will be visible in the topic).
+ *
+ * This {@code CommitMode} is the slowest of the options, but there will be no duplicates in Kafka caused by
+ * producing a record multiple times if previous offset commits have failed or crashes have occurred (however
+ * message replay may cause duplicates in external systems which is unavoidable - external systems must be
+ * idempotent).
+ *
+ * The default commit interval {@link AbstractParallelEoSStreamProcessor#KAFKA_DEFAULT_AUTO_COMMIT_FREQUENCY}
+ * gets automatically reduced from the default of 5 seconds to 100ms (the same as Kafka Streams commit.interval.ms).
+ * Reducing this configuration places higher load on the broker, but will reduce (but cannot eliminate) replay
+ * upon failure. Note also that when using transactions in Kafka, consumption in {@code READ_COMMITTED} mode is
+ * blocked up to the offset of the first STILL open transaction. Using a smaller commit frequency reduces this
+ * minimum consumption latency - the faster transactions are closed, the faster the transaction content can be
+ * read by {@code READ_COMMITTED} consumers. More information about this can be found on the Confluent blog
+ * post:
+ * Enabling Exactly-Once in Kafka
+ * Streams.
+ *
+ * When producing multiple records (see {@link ParallelStreamProcessor#pollAndProduceMany}), all records must
+ * have been produced successfully to the broker before the transaction will commit, after which all will be
+ * visible together, or none.
+ *
+ * Records produced while running in this mode, won't be seen by consumer running in
+ * {@link ConsumerConfig#ISOLATION_LEVEL_CONFIG} {@link org.apache.kafka.common.IsolationLevel#READ_COMMITTED}
+ * mode until the transaction is complete and all records are produced successfully. Records produced into a
+ * transaction that gets aborted or timed out, will never be visible.
+ *
+ * The system must prevent records from being produced to the brokers whose source consumer record offsets has
+ * not been included in this transaction. Otherwise, the transactions would include produced records from
+ * consumer offsets which would only be committed in the NEXT transaction, which would break the EoS guarantees.
+ * To achieve this, first work processing and record producing is suspended (by acquiring the commit lock -
+ * see {@link #commitLockAcquisitionTimeout}, as record processing requires the produce lock), then succeeded
+ * consumer offsets are gathered, transaction commit is made, then when the transaction has finished, processing
+ * resumes by releasing the commit lock. This periodically slows down record production during this phase, by
+ * the time needed to commit the transaction.
+ *
+ * This is all separate from using an IDEMPOTENT Producer, which can be used, along with the
+ * {@link ParallelConsumerOptions#commitMode} {@link CommitMode#PERIODIC_CONSUMER_SYNC} or
+ * {@link CommitMode#PERIODIC_CONSUMER_ASYNCHRONOUS}.
+ *
+ * Failure:
+ *
+ * Commit lock: If the system cannot acquire the commit lock in time, the system will shut down
+ * (fail fast) - during the shutdown a final commit attempt will be made. The default
+ * timeout for acquisition is very high though - see {@link #commitLockAcquisitionTimeout}. This can be caused
+ * by the user processing function taking too long to complete.
+ *
+ * Produce lock: If the system cannot acquire the produce lock in time, it will fail the record processing and
+ * retry the record later. This can be caused by the controller taking too long to commit for some reason. See
+ * {@link #produceLockAcquisitionTimeout}. If using {@link #allowEagerProcessingDuringTransactionCommit}, this
+ * may cause side effect replay when the record is retried, otherwise there is no replay. See
+ * {@link #allowEagerProcessingDuringTransactionCommit} for more details.
+ *
+ * @see ParallelConsumerOptions.ParallelConsumerOptionsBuilder#commitInterval
+ */
+----
+
+[[streams-usage]]
+== Using with Kafka Streams
+
+Kafka Streams (KS) doesn't yet (https://cwiki.apache.org/confluence/display/KAFKA/KIP-311%3A+Async+processing+with+dynamic+scheduling+in+Kafka+Streams[KIP-311],
+https://cwiki.apache.org/confluence/display/KAFKA/KIP-408%3A+Add+Asynchronous+Processing+To+Kafka+Streams[KIP-408]) have parallel processing of messages.
+However, any given preprocessing can be done in KS, preparing the messages.
+One can then use this library to consume from an input topic, produced by KS to process the messages in parallel.
+
+For a code example, see the <> section.
+
+.Example usage with Kafka Streams
+image::https://lucid.app/publicSegments/view/43f2740c-2a7f-4b7f-909e-434a5bbe3fbf/image.png[Kafka Streams Usage,align="center"]
+[[mertics]]
+== Metrics
+
+Metrics collection subsystem is implemented using Micrometer. This allows for flexible configuration of target metrics backend to be used. See below on example of how to configure MeterRegistry for Parallel Consumer to use for metrics collection.
+
+=== Meters
+The following meters are defined by Parallel Consumer - grouped by subsystem.
+
+
+==== Partition Manager
+
+**Number Of Partitions**
+
+Gauge `pc.partitions.number{subsystem=partitions}`
+
+Number of partitions
+
+**Partition Incomplete Offsets**
+
+Gauge `pc.partition.incomplete.offsets{subsystem=partitions, topic="topicName", partition="partitionNumber"}`
+
+Number of incomplete offsets in the partition
+
+**Partition Highest Completed Offset**
+
+Gauge `pc.partition.highest.completed.offset{subsystem=partitions, topic="topicName", partition="partitionNumber"}`
+
+Highest completed offset in the partition
+
+**Partition Highest Sequential Succeeded Offset**
+
+Gauge `pc.partition.highest.sequential.succeeded.offset{subsystem=partitions, topic="topicName", partition="partitionNumber"}`
+
+Highest sequential succeeded offset in the partition
+
+**Partition Highest Seen Offset**
+
+Gauge `pc.partition.highest.seen.offset{subsystem=partitions, topic="topicName", partition="partitionNumber"}`
+
+Highest seen / consumed offset in the partition
+
+**Partition Last Committed Offset**
+
+Gauge `pc.partition.latest.committed.offset{subsystem=partitions, topic="topicName", partition="partitionNumber"}`
+
+Latest committed offset in the partition
+
+**Partition Assignment Epoch**
+
+Gauge `pc.partition.assignment.epoch{subsystem=partitions, topic="topicName", partition="partitionNumber"}`
+
+Epoch of partition assignment
+
+==== Processor
+
+**User Function Processing Time**
+
+Timer `pc.user.function.processing.time{subsystem=processor}`
+
+User function processing time
+
+**Dynamic Extra Load Factor**
+
+Gauge `pc.dynamic.load.factor{subsystem=processor}`
+
+Dynamic load factor - load of processing buffers
+
+**Pc Status**
+
+Gauge `pc.status{subsystem=processor}`
+
+PC Status, reported as number with following mapping - 0:UNUSED, 1:RUNNING, 2:PAUSED, 3:DRAINING, 4:CLOSING, 5:CLOSED
+
+==== Shard Manager
+
+**Number Of Shards**
+
+Gauge `pc.shards{subsystem=shardmanager}`
+
+Number of shards
+
+**Incomplete Offsets Total**
+
+Gauge `pc.incomplete.offsets.total{subsystem=shardmanager}`
+
+Total number of incomplete offsets
+
+**Shards Size**
+
+Gauge `pc.shards.size{subsystem=shardmanager}`
+
+Number of records queued for processing across all shards
+
+==== Work Manager
+
+**Inflight Records**
+
+Gauge `pc.inflight.records{subsystem=workmanager}`
+
+Total number of records currently being processed or waiting for retry
+
+**Waiting Records**
+
+Gauge `pc.waiting.records{subsystem=workmanager}`
+
+Total number of records waiting to be selected for processing
+
+**Processed Records**
+
+Counter `pc.processed.records{subsystem=workmanager, topic="topicName", partition="partitionNumber"}`
+
+Total number of records successfully processed
+
+**Failed Records**
+
+Counter `pc.failed.records{subsystem=workmanager, topic="topicName", partition="partitionNumber"}`
+
+Total number of records failed to be processed
+
+**Slow Records**
+
+Counter `pc.slow.records{subsystem=workmanager, topic="topicName", partition="partitionNumber"}`
+
+Total number of records that spent more than the configured time threshold in the waiting queue. This setting defaults to 10 seconds
+
+==== Broker Poller
+
+**Pc Poller Status**
+
+Gauge `pc.poller.status{subsystem=poller}`
+
+PC Broker Poller Status, reported as number with following mapping - 0:UNUSED, 1:RUNNING, 2:PAUSED, 3:DRAINING, 4:CLOSING, 5:CLOSED
+
+**Num Paused Partitions**
+
+Gauge `pc.partitions.paused{subsystem=poller}`
+
+Number of paused partitions
+
+==== Offset Encoder
+
+**Offsets Encoding Time**
+
+Timer `pc.offsets.encoding.time{subsystem=offsetencoder}`
+
+Time spent encoding offsets
+
+**Offsets Encoding Usage**
+
+Counter `pc.offsets.encoding.usage{subsystem=offsetencoder, codec="BitSet|BitSetCompressed|BitSetV2Compressed|RunLength"}`
+
+Offset encoding usage per encoding type
+
+**Metadata Space Used**
+
+Distribution Summary `pc.metadata.space.used{subsystem=offsetencoder}`
+
+Ratio between offset metadata payload size and available space
+
+**Payload Ratio Used**
+
+Distribution Summary `pc.payload.ratio.used{subsystem=offsetencoder}`
+
+Ratio between offset metadata payload size and offsets encoded
+
+=== Example Metrics setup steps
+The meter registry that metrics should be bound to has to be set using the Parallel Consumer options, along with any common tags that identify the PC instance.
+In addition, if desired - the Kafka Consumer and Producer can be bound to the registry, as well as general JVM metrics, the logging system and other common binders.
+
+The following example illustrates the setup of Parallel Consumer with a meter registry, and binds the Kafka Consumer to that same registry as well.
+
+[source,java,indent=0]
+----
+ ParallelStreamProcessor<String, String> setupParallelConsumer() {
+ Consumer<String, String> kafkaConsumer = getKafkaConsumer();
+ String instanceId = UUID.randomUUID().toString();
+ var options = ParallelConsumerOptions.builder()
+ .ordering(ParallelConsumerOptions.ProcessingOrder.KEY)
+ .maxConcurrency(1000)
+ .consumer(kafkaConsumer)
+ .meterRegistry(meterRegistry) //<1>
+ .metricsTags(Tags.of(Tag.of("common-tag", "tag1"))) //<2>
+ .pcInstanceTag(instanceId) //<3>
+ .build();
+
+ ParallelStreamProcessor<String, String> eosStreamProcessor =
+ ParallelStreamProcessor.createEosStreamProcessor(options);
+
+ eosStreamProcessor.subscribe(of(inputTopic));
+
+ kafkaClientMetrics = new KafkaClientMetrics(kafkaConsumer); //<4>
+ kafkaClientMetrics.bindTo(meterRegistry); //<5>
+ return eosStreamProcessor;
+ }
+----
+<1> - Meter Registry is set through ParallelConsumerOptions.builder(), if not specified - will default to CompositeMeterRegistry - which is No-op.
+<2> - Optional - common tags can be specified through same builder - they will be added to all Parallel Consumer meters
+<3> - Optional - instance tag value can be specified - it has to be unique to ensure meter uniqueness in cases when multiple parallel consumer instances are recording metrics to the same meter registry. If instance tag is not specified - unique UUID value will be generated and used. Tag is created with tag key 'pcinstance'.
+<4> - Optional - Kafka Consumer Micrometer metrics object created for Kafka Consumer that is later used for Parallel Consumer.
+<5> - Optional - Kafka Consumer Micrometer metrics are bound to Meter Registry.
+
+NOTE: any additional binders / metrics need to be cleaned up appropriately - for example, the Kafka Consumer metrics registered above need to be closed using `kafkaClientMetrics.close()` after shutting down the Parallel Consumer, as Parallel Consumer will close the Kafka Consumer on shutdown.
+
+
+[[roadmap]]
+== Roadmap
+
+For released changes, see the link:CHANGELOG.adoc[CHANGELOG].
+
+For features in development and a more accurate view on the roadmap, have a look at the
+https://github.com/confluentinc/parallel-consumer/issues[GitHub issues], and clone https://github.com/astubbs/parallel-consumer[Antony's fork].
+
+== Usage Requirements
+
+* Client side
+** JDK 8
+** SLF4J
+** Apache Kafka (AK) Client libraries 2.5
+** Supports all features of the AK client (e.g. security setups, schema registry etc)
+** For use with Streams, see the <<streams-usage>> section
+** For use with Connect:
+*** Source: simply consume from the topic that your Connect plugin is publishing to
+*** Sink: use the poll and producer style API and publish the records to the topic that the connector is sinking from
+* Server side
+** Should work with any cluster that the linked AK client library works with
+*** If using EoS/Transactions, needs a cluster setup that supports EoS/transactions
+
+== Development Information
+
+=== Requirements
+
+* Uses https://projectlombok.org/setup/intellij[Lombok], if you're using IntelliJ Idea, get the https://plugins.jetbrains.com/plugin/6317-lombok[plugin].
+* Integration tests require a https://docs.docker.com/docker-for-mac/[running locally accessible Docker host].
+* Has a Maven `profile` setup for IntelliJ Idea, but not Eclipse for example.
+
+=== Notes
+
+The unit test code is set to run at a very high frequency, which can make it difficult to read debug logs (or impossible).
+If you want to debug the code or view the main logs, consider changing the below:
+
+// replace with code inclusion from readme branch
+.ParallelEoSStreamProcessorTestBase
+[source]
+----
+ParallelEoSStreamProcessorTestBase#DEFAULT_BROKER_POLL_FREQUENCY_MS
+ParallelEoSStreamProcessorTestBase#DEFAULT_COMMIT_INTERVAL_MAX_MS
+----
+
+=== Recommended IDEA Plugins
+
+* AsciiDoc
+* CheckStyle
+* CodeGlance
+* EditorConfig
+* Rainbow Brackets
+* SonarLint
+* Lombok
+
+=== Readme
+
+The `README` uses a special https://github.com/whelk-io/asciidoc-template-maven-plugin/pull/25[custom maven processor plugin] to import live code blocks into the root readme, so that GitHub can show the real code as includes in the `README`.
+This is because GitHub https://github.com/github/markup/issues/1095[doesn't properly support the _include_ directive].
+
+The source of truth readme is in link:{project_root}/src/docs/README_TEMPLATE.adoc[].
+
+=== Maven targets
+
+[qanda]
+Compile and run all tests::
+`mvn verify`
+
+Run tests excluding the integration tests::
+`mvn test`
+
+Run all tests::
+`mvn verify`
+
+Run any goal skipping tests (replace `<goal>` with e.g. `install`)::
+`mvn <goal> -DskipTests`
+
+See what profiles are active::
+`mvn help:active-profiles`
+
+See what plugins or dependencies are available to be updated::
+`mvn versions:display-plugin-updates versions:display-property-updates versions:display-dependency-updates`
+
+Run a single unit test::
+`mvn -Dtest=TestCircle test`
+
+Run a specific integration test method in a submodule project, skipping unit tests::
+`mvn -Dit.test=TransactionAndCommitModeTest#testLowMaxPoll -DskipUTs=true verify -DfailIfNoTests=false --projects parallel-consumer-core`
+
+Run `git bisect` to find a bad commit, edit the Maven command in `bisect.sh` and run::
+
+[source,bash]
+----
+git bisect start good bad
+git bisect run ./bisect.sh
+----
+
+Note::
+`mvn compile` - Due to a bug in Maven's handling of test-jar dependencies - running `mvn compile` fails, use `mvn test-compile` instead.
+See https://github.com/confluentinc/parallel-consumer/issues/162[issue #162]
+and this https://stackoverflow.com/questions/4786881/why-is-test-jar-dependency-required-for-mvn-compile[Stack Overflow question].
+
+=== Testing
+
+The project has good automated test coverage, of all features.
+Including integration tests running against real Kafka broker and database.
+If you want to run the tests yourself, clone the repository and run the command: `mvn test`.
+The tests require an active docker server on `localhost`.
+
+==== Integration Testing with TestContainers
+//https://github.com/confluentinc/schroedinger#integration-testing-with-testcontainers
+
+We use the excellent https://testcontainers.org[Testcontainers] library for integration testing with JUnit.
+
+To speed up test execution, you can enable container reuse across test runs by setting the following in your https://www.testcontainers.org/features/configuration/[`~/.testcontainers.properties` file]:
+
+[source]
+----
+testcontainers.reuse.enable=true
+----
+
+This will leave the container running after the JUnit test is complete for reuse by subsequent runs.
+
+NOTE: The container will only be left running if it is not explicitly stopped by the JUnit rule.
+For this reason, we use a variant of the https://www.testcontainers.org/test_framework_integration/manual_lifecycle_control/#singleton-containers[singleton container pattern]
+instead of the JUnit rule.
+
+Testcontainers detects if a container is reusable by hashing the container creation parameters from the JUnit test.
+If an existing container is _not_ reusable, a new container will be created, **but the old container will not be removed**.
+
+The following targets are available:
+`testcontainers-list`:: List all containers labeled as testcontainers
+`testcontainers-clean`:: Remove all containers labeled as testcontainers
+
+.Stop and remove all containers labeled with `org.testcontainers=true`
+[source,bash]
+----
+docker container ls --filter 'label=org.testcontainers=true' --format '{{.ID}}' \
+| $(XARGS) docker container rm --force
+----
+
+.List all containers labeled with `org.testcontainers=true`
+[source,bash]
+----
+docker container ls --filter 'label=org.testcontainers=true'
+----
+
+NOTE: `testcontainers-clean` removes **all** docker containers on your system with the `org.testcontainers=true` label (including the most recent container which may be reusable).
+
+See https://github.com/testcontainers/testcontainers-java/pull/1781[this testcontainers PR] for details on the reusable containers feature.
+
+== Implementation Details
+
+=== Core Architecture
+
+Concurrency is controlled by the size of the thread pool (`worker pool` in the diagram).
+Work is performed in a blocking manner, by the users submitted lambda functions.
+
+These are the main sub systems:
+
+- controller thread
+- broker poller thread
+- work pool thread
+- work management
+- offset map manipulation
+
+Each thread collaborates with the others through thread safe Java collections.
+
+.Core Architecture. Threads are represented by letters and colours, with their steps in sequential numbers.
+image::https://lucid.app/publicSegments/view/320d924a-6517-4c54-a72e-b1c4b22e59ed/image.png[Core Architecture,align="center"]
+
+=== Vert.x Architecture
+
+The Vert.x module is an optional extension to the core module.
+As depicted in the diagram, the architecture extends the core architecture.
+
+Instead of the work thread pool count being the degree of concurrency, it is controlled by a max parallel requests setting, and work is performed asynchronously on the Vert.x engine by a _core_ count aligned Vert.x managed thread pool using Vert.x asynchronous IO plugins (https://vertx.io/docs/vertx-core/java/#_verticles[verticles]).
+
+.Vert.x Architecture
+image::https://lucid.app/publicSegments/view/509df410-5997-46be-98e7-ac7f241780b4/image.png[Vert.x Architecture,align="center"]
+
+=== Transactional System Architecture
+
+image::https://lucid.app/publicSegments/view/7480d948-ed7d-4370-a308-8ec12e6b453b/image.png[]
+
+[[offset_map]]
+=== Offset Map
+
+Unlike a traditional queue, messages are not deleted on an acknowledgement.
+However, offsets *are* tracked *per message*, per consumer group - there is no message replay for successful messages, even over clean restarts.
+
+Across a system failure, only completed messages not stored as such in the last offset payload commit will be replayed.
+This is not an _exactly once guarantee_, as message replay cannot be prevented across failure.
+
+CAUTION: Note that Kafka's Exactly Once Semantics (EoS) (transactional processing) also does not prevent _duplicate message replay_ - it *provides* an _effectively once_ result for messages in Kafka topics.
+Messages may _still_ be replayed when using `EoS`.
+This is an important consideration when using it, especially when integrating with third party systems, which is a very common pattern for utilising this project.
+
+As mentioned previously, offsets are always committed in the correct order and only once all previous messages have been successfully processed; regardless of <> selected.
+We call this the "highest committable offset".
+
+However, because messages can be processed out of order, messages beyond the highest committable offset must also be tracked for success and not replayed upon restart or failure.
+To achieve this the system goes a step further than normal Kafka offset commits.
+
+When messages beyond the highest committable offset are successfully processed;
+
+. they are stored as such in an internal memory map.
+. when the system then next commits offsets
+. if there are any messages beyond the highest offset which have been marked as succeeded
+.. the offset map is serialised and encoded into a base 64 string, and added to the commit message metadata.
+. upon restore, if needed, the system then deserializes this offset map and loads it back into memory
+. when each message is polled into the system
+.. it checks if it's already been previously completed
+.. at which point it is then skipped.
+
+This ensures that no message is reprocessed if it's been previously completed.
+
+IMPORTANT: Successful messages beyond the _highest committable offset_ are still recorded as such in a specially constructed metadata payload stored alongside the Kafka committed offset.
+These messages are not replayed upon restore/restart.
+
+The offset map is compressed in parallel using two different compression techniques - run length encoding and bitmap encoding.
+The sizes of the compressed maps are then compared, and the smallest chosen for serialization.
+If both serialised formats are significantly large, they are then both compressed using `zstd` compression, and if that results in a smaller serialization then the compressed form is used instead.
+
+
+==== Storage Notes
+
+* Runtime data model creates list of incomplete offsets
+* Continuously builds a full complete / not complete bit map from the base offset to be committed
+* Dynamically switching storage
+** encodes into a `BitSet`, and a `RunLength`, then compresses both using zstd, then uses the smallest and tags as such in the encoded String
+** Which is smallest can depend on the size and information density of the offset map
+*** Smaller maps fit better into uncompressed `BitSets` ~(30 entry map bitset: compressed: 13 Bytes, uncompressed: 4 Bytes)
+*** Larger maps with continuous sections usually better in compressed `RunLength`
+*** Completely random offset maps, compressed and uncompressed `BitSet` is roughly the same (2000 entries, uncompressed bitset: 250, compressed: 259, compressed bytes array: 477)
+*** Very large maps (20,000 entries), a compressed `BitSet` seems to be significantly smaller again if random.
+* Gets stored along with base offset for each partition, in the offset `commitsync` `metadata` string
+* The offset commit metadata has a hardcoded limit of 4096 bytes (4 kb) per partition (@see `kafka.coordinator.group.OffsetConfig#DefaultMaxMetadataSize = 4096`)
+** Because of this, if our map doesn't fit into this, we have to drop it and not use it, losing the shorter replay benefits.
+However, with runlength encoding and typical offset patterns this should be quite rare.
+*** Work is being done on continuous and predictive space requirements, which will optionally prevent the system from continuing past a point by introducing local backpressure which it can't proceed without dropping the encoded map information - see https://github.com/confluentinc/parallel-consumer/issues/53[Exact continuous offset encoding for precise offset payload size back pressure].
+** Not being able to fit the map into the metadata, depends on message acknowledgement patterns in the use case and the numbers of messages involved.
+Also, the information density in the map (i.e. a single not yet completed message in 4000 completed ones will be a tiny map and will fit very large amounts of messages)
+
+===== FAQ
+
+[qanda]
+If for example, offset 5 cannot be processed for whatever reason, does it cause the committed offset to stick to 5?::
+Yes - the committed offset would "stick" to 5, with the metadata payload containing all the per msg ack's beyond 5.
++
+(Reference: https://github.com/confluentinc/parallel-consumer/issues/415#issuecomment-1256022394[#415])
+
+In the above scenario, would the system eventually exceed the OffsetMap size limit?::
+No, as if the payload size hits 75% or more of the limit (4kB), the back pressure system kicks in, and no more records will be taken for processing, until it drops below 75% again.
+Instead, it will keep retrying existing records.
++
+However, note that if the only record to continually fail is 5, and all others succeed, let's say offset 6-50,000, then the metadata payload is only ~2 shorts (1 and (50,000-6=) 49,994), as it will use run length encoding.
+So it's very efficient.
++
+(Reference: https://github.com/confluentinc/parallel-consumer/issues/415#issuecomment-1256022394[#415])
+
+== Attribution
+
+http://www.apache.org/[Apache®], http://kafka.apache.org/[Apache Kafka], and http://kafka.apache.org/[Kafka®] are either registered trademarks or trademarks of the http://www.apache.org/[Apache Software Foundation] in the United States and/or other countries.
+
+== Tools
+
+image:https://www.yourkit.com/images/yklogo.png[link=https://www.yourkit.com/java/profiler/index.jsp,YourKit]
+
+Quite simply the best profiler for Java, and the only one I use.
+I have been using it for decades.
+Quick, easy to use but so powerful.
+
+YourKit supports open source projects with innovative and intelligent tools for monitoring and profiling Java and .NET applications.
+
+YourKit is the creator of https://www.google.com/url?q=https://www.yourkit.com/java/profiler/&source=gmail-imap&ust=1670918364000000&usg=AOvVaw3kaQak_H7lmT_plCEzxvde[YourKit Java Profiler],
+https://www.google.com/url?q=https://www.yourkit.com/.net/profiler/&source=gmail-imap&ust=1670918364000000&usg=AOvVaw1ZgQhyH2rIOHTuqtTjFAsA[YourKit .NET Profiler], and https://www.google.com/url?q=https://www.yourkit.com/youmonitor/&source=gmail-imap&ust=1670918364000000&usg=AOvVaw13UzOhGkJLEn-Md3-GNjYB[YourKit YouMonitor].
+
+:leveloffset: +1
+:toc: macro
+:toclevels: 1
+
+= Change Log
+
+A high level summary of noteworthy changes in each version.
+
+NOTE:: Dependency version bumps are not listed here.
+
+// git log --pretty="* %s" 0.3.0.2..HEAD
+
+// only show TOC if this is the root document (not in the README)
+ifndef::github_name[]
+toc::[]
+endif::[]
+== 0.5.2.8
+
+=== Fixes
+
+* fix: Fix equality and hash code for ShardKey with array key (#638), resolves (#579)
+
+== 0.5.2.7
+
+=== Fixes
+
+* fix: Return cached pausedPartitionSet (#620), resolves (#618)
+* fix: Parallel consumer stops processing data sometimes (#623), fixes (#606)
+* fix: Add synchronization to ensure proper initialization and closing of PCMetrics singleton (#627), fixes (#617)
+* fix: Readme - metrics example correction (#614)
+* fix: Remove micrometer-atlas dependency (#628), fixes (#625)
+
+=== Improvements
+
+* Refactored metrics implementation to not use singleton - improves meter separation, allows correct metrics subsystem operation when multiple parallel consumer instances are running in same java process (#630), fixes (#617) improves on (#627)
+
+== 0.5.2.6
+=== Improvements
+
+* feature: Micrometer metrics (#594)
+* feature: Adds an option to pass an invalid offset metadata error policy (#537), improves (#326)
+* feature: Lazy initialization of workerThreadPool (#531)
+
+=== Fixes
+
+* fix: Don't drain mode shutdown kills inflight threads (#559)
+* fix: Drain mode shutdown doesn't pause consumption correctly (#552)
+* fix: RunLength offset decoding returns 0 base offset after no-progress commit - related to (#546)
+* fix: Transactional PConsumer stuck while rebalancing - related to (#541)
+
+=== Dependencies
+
+* PL-211: Update dependencies from dependabot, Add mvnw, use mvnw in jenkins (#583)
+* PL-211: Update dependencies from dependabot (#589)
+
+== 0.5.2.5
+
+=== Fixes
+
+* fixes: #195 NoSuchFieldException when using consumer inherited from KafkaConsumer (#469)
+* fix: After new performance fix PR#530 merges - corner case could cause out of order processing (#534)
+* fix: Cleanup WorkManager's count of in-progress work, when work is stale after partition revocation (#547)
+
+=== Improvements
+
+* perf: Adds a caching layer to work management to alleviate O(n) counting (#530)
+
+== 0.5.2.4
+
+=== Improvements
+
+* feature: Simple PCRetriableException to remove error spam from logs (#444)
+* minor: fixes #486: Missing generics in JStreamParallelStreamProcessor #491
+* minor: partially address #459: Moves isClosedOrFailed into top level ParallelConsumer interface (#491)
+* tests: Demonstrates how to use MockConsumer with PC for issue #176
+* other minor improvements
+
+=== Fixes
+
+* fixes #409: Adds support for compacted topics and commit offset resetting (#425)
+** Truncate the offset state when bootstrap polled offset higher or lower than committed
+** Prune missing records from the tracked incomplete offset state, when they're missing from polled batches
+* fix: Improvements to encoding ranges (int vs long) #439
+** Replace integer offset references with long - use Long everywhere we deal with offsets, and where we truncate down, do it exactly, detect and handle truncation issues.
+
+== 0.5.2.3
+
+=== Improvements
+
+* Transactional commit mode system improvements and docs (#355)
+** Clarifies transaction system with much better documentation.
+** Fixes a potential race condition which could cause offset leaks between transactions boundaries.
+** Introduces lock acquisition timeouts.
+** Fixes a potential issue with removing records from the retry queue incorrectly, by having an inconsistency between compareTo and equals in the retry TreeMap.
+* Adds a very simple Dependency Injection system modeled on Dagger (#398)
+* Various refactorings e.g. new ProducerWrap
+
+* Dependencies
+** build(deps): prod: zstd, reactor, dev: podam, progressbar, postgresql maven-plugins: versions, help (#420)
+** build(deps-dev): bump postgresql from 42.4.1 to 42.5.0
+** bump podam, progressbar, zstd, reactor
+** build(deps): bump versions-maven-plugin from 2.11.0 to 2.12.0
+** build(deps): bump maven-help-plugin from 3.2.0 to 3.3.0
+** build(deps-dev): bump Confluent Platform Kafka Broker to 7.2.2 (#421)
+** build(deps): Upgrade to AK 3.3.0 (#309)
+
+
+=== Fixes
+
+* fixes #419: NoSuchElementException during race condition in PartitionState (#422)
+* Fixes #412: ClassCastException with retryDelayProvider (#417)
+* fixes ShardManager retryQueue ordering and set issues due to poor Comparator implementation (#423)
+
+
+== v0.5.2.2
+
+=== Fixes
+
+- Fixes dependency scope for Mockito from compile to test (#376)
+
+== v0.5.2.1
+
+=== Fixes
+
+- Fixes regression issue with order of state truncation vs commit (#362)
+
+== v0.5.2.0
+
+=== Fixes and Improvements
+
+- fixes #184: Fix multi topic subscription with KEY order by adding topic to shard key (#315)
+- fixes #329: Committing around transaction markers causes encoder to crash (#328)
+- build: Upgrade Truth-Generator to 0.1.1 for user Subject discovery (#332)
+
+=== Build
+
+- build: Allow snapshots locally, fail in CI (#331)
+- build: OSS Index scan change to warn only and exclude Guava CVE-2020-8908 as it's WONT_FIX (#330)
+
+=== Dependencies
+
+- build(deps): bump reactor-core from 3.4.19 to 3.4.21 (#344)
+- build(deps): dependabot bump Mockito, Surefire, Reactor, AssertJ, Release (#342) (#342)
+- build(deps): dependabot bump TestContainers, Vert.x, Enforcer, Versions, JUnit, Postgress (#336)
+
+=== Linked issues
+
+- Message with null key lead to continuous failure when using KEY ordering #318
+- Subscribing to two or more topics with KEY ordering, results in messages of the same Key never being processed #184
+- Cannot have negative length BitSet error - committing transaction adjacent offsets #329
+
+== v0.5.1.0
+
+=== Features
+
+* #193: Pause / Resume PC (circuit breaker) without unsubscribing from topics
+
+=== Fixes and Improvements
+
+* #225: Build and runtime support for Java 16+ (#289)
+* #306: Change Truth-Generator dependency from compile to test
+* #298: Improve PollAndProduce performance by first producing all records, and then waiting for the produce results. Previously, this was done for each ProduceRecord individually.
+
+== v0.5.0.0
+
+=== Features
+
+* feature: Poll Context object for API (#223)
+** PollContext API - provides central access to result set with various convenience methods as well as metadata about records, such as failure count
+* major: Batching feature and Event system improvements
+** Batching - all API methods now support batching.
+See the Options class set batch size for more information.
+
+=== Fixes and Improvements
+
+* Event system - better CPU usage in control thread
+* Concurrency stability improvements
+* Update dependencies
+* #247: Adopt Truth-Generator (#249)
+** Adopt https://github.com/astubbs/truth-generator[Truth Generator] for automatic generation of https://truth.dev/[Google Truth] Subjects
+* Large rewrite of internal architecture for improved maintenance and simplicity which fixed some corner case issues
+** refactor: Rename PartitionMonitor to PartitionStateManager (#269)
+** refactor: Queue unification (#219)
+** refactor: Partition state tracking instead of search (#218)
+** refactor: Processing Shard object
+* fix: Concurrency and State improvements (#190)
+
+=== Build
+
+* build: Lock TruthGenerator to 0.1 (#272)
+* build: Deploy SNAPSHOTS to maven central snapshots repo (#265)
+* build: Update Kafka to 3.1.0 (#229)
+* build: Crank up Enforcer rules and turn on ossindex audit
+* build: Fix logback dependency back to stable
+* build: Upgrade TestContainer and CP
+
+== v0.4.0.1
+
+=== Improvements
+
+- Add option to specify timeout for how long to wait offset commits in periodic-consumer-sync commit-mode
+- Add option to specify timeout for how long to wait for blocking Producer#send
+
+=== Docs
+
+- docs: Confluent Cloud configuration links
+- docs: Add Confluent's product page for PC to README
+- docs: Add head of line blocking to README
+
+== v0.4.0.0
+// https://github.com/confluentinc/parallel-consumer/releases/tag/0.4.0.0
+
+=== Features
+
+* https://projectreactor.io/[Project Reactor] non-blocking threading adapter module
+* Generic Vert.x Future support - i.e. FileSystem, db etc...
+
+=== Fixes and Improvements
+
+* Vert.x concurrency control via WebClient host limits fixed - see #maxCurrency
+* Vert.x API cleanup of invalid usage
+* Out of bounds for empty collections
+* Use ConcurrentSkipListMap instead of TreeMap to prevent concurrency issues under high pressure
+* log: Show record topic in slow-work warning message
+
+== v0.3.2.0
+
+=== Fixes and Improvements
+
+* Major: Upgrade to Apache Kafka 2.8 (still compatible with 2.6 and 2.7 though)
+* Adds support for managed executor service (Java EE Compatibility feature)
+* #65 support for custom retry delay providers
+
+== v0.3.1.0
+
+=== Fixes and Improvements
+
+* Major refactor to code base - primarily the two large God classes
+** Partition state now tracked separately
+** Code moved into packages
+* Busy spin in some cases fixed (lower CPU usage)
+* Reduce use of static data for test assertions - remaining identified for later removal
+* Various fixes for parallel testing stability
+
+== v0.3.0.3
+
+=== Fixes and Improvements
+
+==== Overview
+
+* Tests now run in parallel
+* License fixing / updating and code formatting
+* License format runs properly now when local, check on CI
+* Fix running on Windows and Linux
+* Fix JAVA_HOME issues
+
+==== Details:
+
+* tests: Enable the fail fast feature now that it's merged upstream
+* tests: Turn on parallel test runs
+* format: Format license, fix placement
+* format: Apply Idea formatting (fix license layout)
+* format: Update mycila license-plugin
+* test: Disable redundant vert.x test - too complicated to fix for little gain
+* test: Fix thread counting test by closing PC @After
+* test: Test bug due to static state overrides when run as a suite
+* format: Apply license format and run every All Idea build
+* format: Organise imports
+* fix: Apply license format when in dev laptops - CI only checks
+* fix: javadoc command for various OS and envs when JAVA_HOME missing
+* fix: By default, correctly run time JVM as jvm.location
+
+== v0.3.0.2
+
+=== Fixes and Improvements
+
+* ci: Add CODEOWNER
+* fix: #101 Validate GroupId is configured on managed consumer
+* Use 8B1DA6120C2BF624 GPG Key For Signing
+* ci: Bump jdk8 version path
+* fix: #97 Vert.x thread and connection pools setup incorrect
+* Disable Travis and Codecov
+* ci: Apache Kafka and JDK build matrix
+* fix: Set Serdes for MockProducer for AK 2.7 partition fix KAFKA-10503 to fix new NPE
+* Only log slow message warnings periodically, once per sweep
+* Upgrade Kafka container version to 6.0.2
+* Clean up stalled message warning logs
+* Reduce log-level if no results are returned from user-function (warn -> debug)
+* Enable java 8 Github
+* Fixes #87 - Upgrade UniJ version for UnsupportedClassVersion error
+* Bump TestContainers to stable release to specifically fix #3574
+* Clarify offset management capabilities
+
+== v0.3.0.1
+
+* fixes #62: Off by one error when restoring offsets when no offsets are encoded in metadata
+* fix: Actually skip work that is found as stale
+
+== v0.3.0.0
+
+=== Features
+
+* Queueing and pressure system now self tuning, performance over default old tuning values (`softMaxNumberMessagesBeyondBaseCommitOffset` and `maxMessagesToQueue`) has doubled.
+** These options have been removed from the system.
+* Offset payload encoding back pressure system
+** If the payload begins to take more than a certain threshold amount of the maximum available, no more messages will be brought in for processing, until the space needed begins to reduce back below the threshold.
+This is to try to prevent the situation where the payload is too large to fit at all, and must be dropped entirely.
+** See Proper offset encoding back pressure system so that offset payloads can't ever be too large https://github.com/confluentinc/parallel-consumer/issues/47[#47]
+** Messages that have failed to process, will always be allowed to retry, in order to reduce this pressure.
+
+=== Improvements
+
+* Default ordering mode is now `KEY` ordering (was `UNORDERED`).
+** This is a better default as it's the safest yet still high performing mode.
+It maintains the partition ordering characteristic that all keys are processed in log order, yet for most use cases will be close to as fast as `UNORDERED` when the key space is large enough.
+* https://github.com/confluentinc/parallel-consumer/issues/37[Support BitSet encoding lengths longer than Short.MAX_VALUE #37] - adds new serialisation formats that supports wider range of offsets - (32,767 vs 2,147,483,647) for both BitSet and run-length encoding.
+* Commit modes have been renamed to make it clearer that they are periodic, not per message.
+* Minor performance improvement, switching away from concurrent collections.
+
+=== Fixes
+
+* Maximum offset payload space increased to correctly not be inversely proportional to assigned partition quantity.
+* Run-length encoding now supports compacted topics, plus other bug fixes as well as fixes to Bitset encoding.
+
+== v0.2.0.3
+
+=== Fixes
+
+** https://github.com/confluentinc/parallel-consumer/issues/35[Bitset overflow check (#35)] - gracefully drop BitSet or Runlength encoding as an option if offset difference too large (short overflow)
+*** A new serialisation format will be added in next version - see https://github.com/confluentinc/parallel-consumer/issues/37[Support BitSet encoding lengths longer than Short.MAX_VALUE #37]
+** Gracefully drops encoding attempts if they can't be run
+** Fixes a bug in the offset drop if it can't fit in the offset metadata payload
+
+== v0.2.0.2
+
+=== Fixes
+
+** Turns back on the https://github.com/confluentinc/parallel-consumer/issues/35[Bitset overflow check (#35)]
+
+== v0.2.0.1 DO NOT USE - has critical bug
+
+=== Fixes
+
+** Incorrectly turns off an over-flow check in https://github.com/confluentinc/parallel-consumer/issues/35[offset serialisation system (#35)]
+
+== v0.2.0.0
+
+=== Features
+
+** Choice of commit modes: Consumer Asynchronous, Synchronous and Producer Transactions
+** Producer instance is now optional
+** Using a _transactional_ Producer is now optional
+** Use the Kafka Consumer to commit `offsets` Synchronously or Asynchronously
+
+=== Improvements
+
+** Memory performance - garbage collect empty shards when in KEY ordering mode
+** Select tests adapted to non transactional (multiple commit modes) as well
+** Adds supervision to broker poller
+** Fixes a performance issue with the async committer not being woken up
+** Make committer thread revoke partitions and commit
+** Have onPartitionsRevoked be responsible for committing on close, instead of an explicit call to commit by controller
+** Make sure Broker Poller now drains properly, committing any waiting work
+
+=== Fixes
+
+** Fixes bug in commit linger, remove genesis offset (0) from testing (avoid races), add ability to request commit
+** Fixes #25 https://github.com/confluentinc/parallel-consumer/issues/25:
+*** Sometimes a transaction error occurs - Cannot call send in state COMMITTING_TRANSACTION #25
+** ReentrantReadWrite lock protects non-thread safe transactional producer from incorrect multithreaded use
+** Wider lock to prevent transaction's containing produced messages that they shouldn't
+** Must start tx in MockProducer as well
+** Fixes example app tests - incorrectly testing wrong thing and MockProducer not configured to auto complete
+** Add missing revoke flow to MockConsumer wrapper
+** Add missing latch timeout check
+
+== v0.1
+
+=== Features:
+
+** Have massively parallel consumption processing without running hundreds or thousands of
+*** Kafka consumer clients
+*** topic partitions
++
+without operational burden or harming the cluster's performance
+** Efficient individual message acknowledgement system (without local or third system state) to massively reduce message replay upon failure
+** Per `key` concurrent processing, per `partition` and unordered message processing
+** `Offsets` committed correctly, in order, of only processed messages, regardless of concurrency level or retries
+** Vert.x non-blocking library integration (HTTP currently)
+** Fair partition traversal
+** Zero~ dependencies (`Slf4j` and `Lombok`) for the core module
+** Java 8 compatibility
+** Throttle control and broker liveliness management
+** Clean draining shutdown cycle
+//:leveloffset: -1 - Duplicate key leveloffset (attempted merging values +1 and -1): https://github.com/whelk-io/asciidoc-template-maven-plugin/issues/118
+
diff --git a/RELEASE.adoc b/RELEASE.adoc
new file mode 100644
index 000000000..65994e35d
--- /dev/null
+++ b/RELEASE.adoc
@@ -0,0 +1,15 @@
+= Releasing
+
+- Update the changelog and commit
+- Run the maven release:prepare goal:
+
+`release:prepare -DautoVersionSubmodules=true -DpushChanges=false -Darguments=-DskipTests -Pci`
+
+- Push the master branch with release and tag
+- Trigger master builder to build the tag (this is needed to trigger the deployment flow)
+- Wait for Jenkins to finish running the build (~15 minutes)
+- Wait for Sonatype to publish from its staging area (~15 minutes) https://repo1.maven.org/maven2/io/confluent/parallelconsumer/parallel-consumer-parent/[repo1 link]
+- Verify the release is available on Maven Central https://repo1.maven.org/maven2/io/confluent/parallelconsumer/parallel-consumer-parent/[repo1 link]
+- Create the release on GH from the tag
+- Paste in the details from the changelog, save, share as discussion
+- Announce on slack (community #clients and internal channels), mailing list, twitter
\ No newline at end of file
diff --git a/bin/build-parallel-consumer-core-without-tests.sh b/bin/build-parallel-consumer-core-without-tests.sh
new file mode 100755
index 000000000..bff424860
--- /dev/null
+++ b/bin/build-parallel-consumer-core-without-tests.sh
@@ -0,0 +1,7 @@
+#!/usr/bin/env bash
+#
+# Copyright (C) 2020-2022 Confluent, Inc.
+#
+
+export JAVA_HOME=$(/usr/libexec/java_home -v13)
+mvn clean install -pl parallel-consumer-core -Dmaven.test.skip=true
diff --git a/bin/build-without-tests.sh b/bin/build-without-tests.sh
new file mode 100755
index 000000000..5fbf92da4
--- /dev/null
+++ b/bin/build-without-tests.sh
@@ -0,0 +1,7 @@
+#!/usr/bin/env bash
+#
+# Copyright (C) 2020-2022 Confluent, Inc.
+#
+
+export JAVA_HOME=$(/usr/libexec/java_home -v13)
+mvn clean install -Dmaven.test.skip=true
diff --git a/bin/checkcompile-license.sh b/bin/checkcompile-license.sh
new file mode 100644
index 000000000..90984f906
--- /dev/null
+++ b/bin/checkcompile-license.sh
@@ -0,0 +1,26 @@
+#!/bin/bash
+#
+# Copyright (C) 2020-2022 Confluent, Inc.
+#
+
+
+COMMITS=$(git log --oneline HEAD...parralel-test-fix^ | cut -d " " -f 1)
+
+# Checks the license headers of the given commit via the maven license plugin.
+testCommit() {
+  # Use the function argument instead of relying on the caller's global COMMIT
+  local COMMIT="$1"
+  echo "Checking out commit $COMMIT"
+  git checkout "$COMMIT" >/dev/null 2>/dev/null
+
+  # mvn compile test-compile > /dev/null 2> /dev/null
+  if mvn license:check; then
+    echo "$COMMIT passed"
+  else
+    echo "$COMMIT failed"
+  fi
+}
+
+for COMMIT in $COMMITS; do
+ testCommit "$COMMIT"
+done
diff --git a/bin/deploy.sh b/bin/deploy.sh
new file mode 100755
index 000000000..52590b3a9
--- /dev/null
+++ b/bin/deploy.sh
@@ -0,0 +1,7 @@
+#!/usr/bin/env bash
+#
+# Copyright (C) 2020-2022 Confluent, Inc.
+#
+
+export JAVA_HOME=$(/usr/libexec/java_home -v13)
+mvn deploy
diff --git a/bisect.sh b/bisect.sh
new file mode 100755
index 000000000..2afb2d7be
--- /dev/null
+++ b/bisect.sh
@@ -0,0 +1,32 @@
+#!/bin/bash
+#
+# Copyright (C) 2020-2022 Confluent, Inc.
+#
+
+set -x
+
+# It may be useful to make a copy of this file to run the bisect against a script outside the repository
+
+# tweak the working tree by merging the hot-fix branch
+# and then attempt a build
+# alternatively, use cherry-pick
+if git merge --no-commit --no-ff hot-fix &&
+        make; then
+    # run project specific test and report its status
+    ~/check_test_case.sh
+    status=$?
+else
+    # tell the caller this is untestable
+    status=125
+fi
+
+# undo the tweak to allow clean flipping to the next commit
+git reset --hard
+
+# return control
+exit $status
+
+# NOTE: everything below is unreachable (the script exits above); kept for reference only.
+# mvn test-compile || exit 125 # this skips broken builds
+
+# run a maven test
+# mvn -Dit.test=TransactionAndCommitModeTest#testLowMaxPoll -DskipUTs=true -DfailIfNoTests=false --projects parallel-consumer-core integration-test
diff --git a/checkcompile.sh b/checkcompile.sh
new file mode 100755
index 000000000..b94525242
--- /dev/null
+++ b/checkcompile.sh
@@ -0,0 +1,30 @@
+#!/bin/bash
+#
+# Copyright (C) 2020-2022 Confluent, Inc.
+#
+
+
+COMMITS=$(git log --oneline HEAD...182d13c43dec581a84c7edad962dfbd456744a64^ | cut -d " " -f 1)
+
+
+testCommit() {
+ # COMMIT = $1
+ echo Checking out commit $COMMIT
+ git checkout $COMMIT > /dev/null 2> /dev/null
+
+ mvn compile test-compile > /dev/null 2> /dev/null
+
+ if [ $? -eq 0 ]
+ then
+ echo $COMMIT passed
+ else
+ echo $COMMIT failed
+ fi
+}
+
+for COMMIT in $COMMITS
+do
+ testCommit "$COMMIT"
+done
+
+
diff --git a/mvnw b/mvnw
new file mode 100755
index 000000000..8d937f4c1
--- /dev/null
+++ b/mvnw
@@ -0,0 +1,308 @@
+#!/bin/sh
+# ----------------------------------------------------------------------------
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+# ----------------------------------------------------------------------------
+
+# ----------------------------------------------------------------------------
+# Apache Maven Wrapper startup batch script, version 3.2.0
+#
+# Required ENV vars:
+# ------------------
+# JAVA_HOME - location of a JDK home dir
+#
+# Optional ENV vars
+# -----------------
+# MAVEN_OPTS - parameters passed to the Java VM when running Maven
+# e.g. to debug Maven itself, use
+# set MAVEN_OPTS=-Xdebug -Xrunjdwp:transport=dt_socket,server=y,suspend=y,address=8000
+# MAVEN_SKIP_RC - flag to disable loading of mavenrc files
+# ----------------------------------------------------------------------------
+
+if [ -z "$MAVEN_SKIP_RC" ] ; then
+
+ if [ -f /usr/local/etc/mavenrc ] ; then
+ . /usr/local/etc/mavenrc
+ fi
+
+ if [ -f /etc/mavenrc ] ; then
+ . /etc/mavenrc
+ fi
+
+ if [ -f "$HOME/.mavenrc" ] ; then
+ . "$HOME/.mavenrc"
+ fi
+
+fi
+
+# OS specific support. $var _must_ be set to either true or false.
+cygwin=false;
+darwin=false;
+mingw=false
+case "$(uname)" in
+ CYGWIN*) cygwin=true ;;
+ MINGW*) mingw=true;;
+ Darwin*) darwin=true
+ # Use /usr/libexec/java_home if available, otherwise fall back to /Library/Java/Home
+ # See https://developer.apple.com/library/mac/qa/qa1170/_index.html
+ if [ -z "$JAVA_HOME" ]; then
+ if [ -x "/usr/libexec/java_home" ]; then
+ JAVA_HOME="$(/usr/libexec/java_home)"; export JAVA_HOME
+ else
+ JAVA_HOME="/Library/Java/Home"; export JAVA_HOME
+ fi
+ fi
+ ;;
+esac
+
+if [ -z "$JAVA_HOME" ] ; then
+ if [ -r /etc/gentoo-release ] ; then
+ JAVA_HOME=$(java-config --jre-home)
+ fi
+fi
+
+# For Cygwin, ensure paths are in UNIX format before anything is touched
+if $cygwin ; then
+ [ -n "$JAVA_HOME" ] &&
+ JAVA_HOME=$(cygpath --unix "$JAVA_HOME")
+ [ -n "$CLASSPATH" ] &&
+ CLASSPATH=$(cygpath --path --unix "$CLASSPATH")
+fi
+
+# For Mingw, ensure paths are in UNIX format before anything is touched
+if $mingw ; then
+ [ -n "$JAVA_HOME" ] && [ -d "$JAVA_HOME" ] &&
+ JAVA_HOME="$(cd "$JAVA_HOME" || (echo "cannot cd into $JAVA_HOME."; exit 1); pwd)"
+fi
+
+if [ -z "$JAVA_HOME" ]; then
+ javaExecutable="$(which javac)"
+ if [ -n "$javaExecutable" ] && ! [ "$(expr "\"$javaExecutable\"" : '\([^ ]*\)')" = "no" ]; then
+ # readlink(1) is not available as standard on Solaris 10.
+ readLink=$(which readlink)
+ if [ ! "$(expr "$readLink" : '\([^ ]*\)')" = "no" ]; then
+ if $darwin ; then
+ javaHome="$(dirname "\"$javaExecutable\"")"
+ javaExecutable="$(cd "\"$javaHome\"" && pwd -P)/javac"
+ else
+ javaExecutable="$(readlink -f "\"$javaExecutable\"")"
+ fi
+ javaHome="$(dirname "\"$javaExecutable\"")"
+ javaHome=$(expr "$javaHome" : '\(.*\)/bin')
+ JAVA_HOME="$javaHome"
+ export JAVA_HOME
+ fi
+ fi
+fi
+
+if [ -z "$JAVACMD" ] ; then
+ if [ -n "$JAVA_HOME" ] ; then
+ if [ -x "$JAVA_HOME/jre/sh/java" ] ; then
+ # IBM's JDK on AIX uses strange locations for the executables
+ JAVACMD="$JAVA_HOME/jre/sh/java"
+ else
+ JAVACMD="$JAVA_HOME/bin/java"
+ fi
+ else
+ JAVACMD="$(\unset -f command 2>/dev/null; \command -v java)"
+ fi
+fi
+
+if [ ! -x "$JAVACMD" ] ; then
+ echo "Error: JAVA_HOME is not defined correctly." >&2
+ echo " We cannot execute $JAVACMD" >&2
+ exit 1
+fi
+
+if [ -z "$JAVA_HOME" ] ; then
+ echo "Warning: JAVA_HOME environment variable is not set."
+fi
+
+# traverses directory structure from process work directory to filesystem root
+# first directory with .mvn subdirectory is considered project base directory
+find_maven_basedir() {
+ if [ -z "$1" ]
+ then
+ echo "Path not specified to find_maven_basedir"
+ return 1
+ fi
+
+ basedir="$1"
+ wdir="$1"
+ while [ "$wdir" != '/' ] ; do
+ if [ -d "$wdir"/.mvn ] ; then
+ basedir=$wdir
+ break
+ fi
+ # workaround for JBEAP-8937 (on Solaris 10/Sparc)
+ if [ -d "${wdir}" ]; then
+ wdir=$(cd "$wdir/.." || exit 1; pwd)
+ fi
+ # end of workaround
+ done
+ printf '%s' "$(cd "$basedir" || exit 1; pwd)"
+}
+
+# concatenates all lines of a file
+concat_lines() {
+ if [ -f "$1" ]; then
+ # Remove \r in case we run on Windows within Git Bash
+ # and check out the repository with auto CRLF management
+ # enabled. Otherwise, we may read lines that are delimited with
+ # \r\n and produce $'-Xarg\r' rather than -Xarg due to word
+ # splitting rules.
+ tr -s '\r\n' ' ' < "$1"
+ fi
+}
+
+log() {
+ if [ "$MVNW_VERBOSE" = true ]; then
+ printf '%s\n' "$1"
+ fi
+}
+
+BASE_DIR=$(find_maven_basedir "$(dirname "$0")")
+if [ -z "$BASE_DIR" ]; then
+ exit 1;
+fi
+
+MAVEN_PROJECTBASEDIR=${MAVEN_BASEDIR:-"$BASE_DIR"}; export MAVEN_PROJECTBASEDIR
+log "$MAVEN_PROJECTBASEDIR"
+
+##########################################################################################
+# Extension to allow automatically downloading the maven-wrapper.jar from Maven-central
+# This allows using the maven wrapper in projects that prohibit checking in binary data.
+##########################################################################################
+wrapperJarPath="$MAVEN_PROJECTBASEDIR/.mvn/wrapper/maven-wrapper.jar"
+if [ -r "$wrapperJarPath" ]; then
+ log "Found $wrapperJarPath"
+else
+ log "Couldn't find $wrapperJarPath, downloading it ..."
+
+ if [ -n "$MVNW_REPOURL" ]; then
+ wrapperUrl="$MVNW_REPOURL/org/apache/maven/wrapper/maven-wrapper/3.2.0/maven-wrapper-3.2.0.jar"
+ else
+ wrapperUrl="https://repo.maven.apache.org/maven2/org/apache/maven/wrapper/maven-wrapper/3.2.0/maven-wrapper-3.2.0.jar"
+ fi
+ while IFS="=" read -r key value; do
+ # Remove '\r' from value to allow usage on windows as IFS does not consider '\r' as a separator ( considers space, tab, new line ('\n'), and custom '=' )
+ safeValue=$(echo "$value" | tr -d '\r')
+ case "$key" in (wrapperUrl) wrapperUrl="$safeValue"; break ;;
+ esac
+ done < "$MAVEN_PROJECTBASEDIR/.mvn/wrapper/maven-wrapper.properties"
+ log "Downloading from: $wrapperUrl"
+
+ if $cygwin; then
+ wrapperJarPath=$(cygpath --path --windows "$wrapperJarPath")
+ fi
+
+ if command -v wget > /dev/null; then
+ log "Found wget ... using wget"
+ [ "$MVNW_VERBOSE" = true ] && QUIET="" || QUIET="--quiet"
+ if [ -z "$MVNW_USERNAME" ] || [ -z "$MVNW_PASSWORD" ]; then
+ wget $QUIET "$wrapperUrl" -O "$wrapperJarPath" || rm -f "$wrapperJarPath"
+ else
+ wget $QUIET --http-user="$MVNW_USERNAME" --http-password="$MVNW_PASSWORD" "$wrapperUrl" -O "$wrapperJarPath" || rm -f "$wrapperJarPath"
+ fi
+ elif command -v curl > /dev/null; then
+ log "Found curl ... using curl"
+ [ "$MVNW_VERBOSE" = true ] && QUIET="" || QUIET="--silent"
+ if [ -z "$MVNW_USERNAME" ] || [ -z "$MVNW_PASSWORD" ]; then
+ curl $QUIET -o "$wrapperJarPath" "$wrapperUrl" -f -L || rm -f "$wrapperJarPath"
+ else
+ curl $QUIET --user "$MVNW_USERNAME:$MVNW_PASSWORD" -o "$wrapperJarPath" "$wrapperUrl" -f -L || rm -f "$wrapperJarPath"
+ fi
+ else
+ log "Falling back to using Java to download"
+ javaSource="$MAVEN_PROJECTBASEDIR/.mvn/wrapper/MavenWrapperDownloader.java"
+ javaClass="$MAVEN_PROJECTBASEDIR/.mvn/wrapper/MavenWrapperDownloader.class"
+ # For Cygwin, switch paths to Windows format before running javac
+ if $cygwin; then
+ javaSource=$(cygpath --path --windows "$javaSource")
+ javaClass=$(cygpath --path --windows "$javaClass")
+ fi
+ if [ -e "$javaSource" ]; then
+ if [ ! -e "$javaClass" ]; then
+ log " - Compiling MavenWrapperDownloader.java ..."
+ ("$JAVA_HOME/bin/javac" "$javaSource")
+ fi
+ if [ -e "$javaClass" ]; then
+ log " - Running MavenWrapperDownloader.java ..."
+ ("$JAVA_HOME/bin/java" -cp .mvn/wrapper MavenWrapperDownloader "$wrapperUrl" "$wrapperJarPath") || rm -f "$wrapperJarPath"
+ fi
+ fi
+ fi
+fi
+##########################################################################################
+# End of extension
+##########################################################################################
+
+# If specified, validate the SHA-256 sum of the Maven wrapper jar file
+wrapperSha256Sum=""
+while IFS="=" read -r key value; do
+ case "$key" in (wrapperSha256Sum) wrapperSha256Sum=$value; break ;;
+ esac
+done < "$MAVEN_PROJECTBASEDIR/.mvn/wrapper/maven-wrapper.properties"
+if [ -n "$wrapperSha256Sum" ]; then
+ wrapperSha256Result=false
+ if command -v sha256sum > /dev/null; then
+ if echo "$wrapperSha256Sum $wrapperJarPath" | sha256sum -c > /dev/null 2>&1; then
+ wrapperSha256Result=true
+ fi
+ elif command -v shasum > /dev/null; then
+ if echo "$wrapperSha256Sum $wrapperJarPath" | shasum -a 256 -c > /dev/null 2>&1; then
+ wrapperSha256Result=true
+ fi
+ else
+ echo "Checksum validation was requested but neither 'sha256sum' or 'shasum' are available."
+ echo "Please install either command, or disable validation by removing 'wrapperSha256Sum' from your maven-wrapper.properties."
+ exit 1
+ fi
+ if [ $wrapperSha256Result = false ]; then
+ echo "Error: Failed to validate Maven wrapper SHA-256, your Maven wrapper might be compromised." >&2
+ echo "Investigate or delete $wrapperJarPath to attempt a clean download." >&2
+ echo "If you updated your Maven version, you need to update the specified wrapperSha256Sum property." >&2
+ exit 1
+ fi
+fi
+
+MAVEN_OPTS="$(concat_lines "$MAVEN_PROJECTBASEDIR/.mvn/jvm.config") $MAVEN_OPTS"
+
+# For Cygwin, switch paths to Windows format before running java
+if $cygwin; then
+ [ -n "$JAVA_HOME" ] &&
+ JAVA_HOME=$(cygpath --path --windows "$JAVA_HOME")
+ [ -n "$CLASSPATH" ] &&
+ CLASSPATH=$(cygpath --path --windows "$CLASSPATH")
+ [ -n "$MAVEN_PROJECTBASEDIR" ] &&
+ MAVEN_PROJECTBASEDIR=$(cygpath --path --windows "$MAVEN_PROJECTBASEDIR")
+fi
+
+# Provide a "standardized" way to retrieve the CLI args that will
+# work with both Windows and non-Windows executions.
+MAVEN_CMD_LINE_ARGS="$MAVEN_CONFIG $*"
+export MAVEN_CMD_LINE_ARGS
+
+WRAPPER_LAUNCHER=org.apache.maven.wrapper.MavenWrapperMain
+
+# shellcheck disable=SC2086 # safe args
+exec "$JAVACMD" \
+ $MAVEN_OPTS \
+ $MAVEN_DEBUG_OPTS \
+ -classpath "$MAVEN_PROJECTBASEDIR/.mvn/wrapper/maven-wrapper.jar" \
+ "-Dmaven.multiModuleProjectDirectory=${MAVEN_PROJECTBASEDIR}" \
+ ${WRAPPER_LAUNCHER} $MAVEN_CONFIG "$@"
diff --git a/mvnw.cmd b/mvnw.cmd
new file mode 100644
index 000000000..f80fbad3e
--- /dev/null
+++ b/mvnw.cmd
@@ -0,0 +1,205 @@
+@REM ----------------------------------------------------------------------------
+@REM Licensed to the Apache Software Foundation (ASF) under one
+@REM or more contributor license agreements. See the NOTICE file
+@REM distributed with this work for additional information
+@REM regarding copyright ownership. The ASF licenses this file
+@REM to you under the Apache License, Version 2.0 (the
+@REM "License"); you may not use this file except in compliance
+@REM with the License. You may obtain a copy of the License at
+@REM
+@REM http://www.apache.org/licenses/LICENSE-2.0
+@REM
+@REM Unless required by applicable law or agreed to in writing,
+@REM software distributed under the License is distributed on an
+@REM "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+@REM KIND, either express or implied. See the License for the
+@REM specific language governing permissions and limitations
+@REM under the License.
+@REM ----------------------------------------------------------------------------
+
+@REM ----------------------------------------------------------------------------
+@REM Apache Maven Wrapper startup batch script, version 3.2.0
+@REM
+@REM Required ENV vars:
+@REM JAVA_HOME - location of a JDK home dir
+@REM
+@REM Optional ENV vars
+@REM MAVEN_BATCH_ECHO - set to 'on' to enable the echoing of the batch commands
+@REM MAVEN_BATCH_PAUSE - set to 'on' to wait for a keystroke before ending
+@REM MAVEN_OPTS - parameters passed to the Java VM when running Maven
+@REM e.g. to debug Maven itself, use
+@REM set MAVEN_OPTS=-Xdebug -Xrunjdwp:transport=dt_socket,server=y,suspend=y,address=8000
+@REM MAVEN_SKIP_RC - flag to disable loading of mavenrc files
+@REM ----------------------------------------------------------------------------
+
+@REM Begin all REM lines with '@' in case MAVEN_BATCH_ECHO is 'on'
+@echo off
+@REM set title of command window
+title %0
+@REM enable echoing by setting MAVEN_BATCH_ECHO to 'on'
+@if "%MAVEN_BATCH_ECHO%" == "on" echo %MAVEN_BATCH_ECHO%
+
+@REM set %HOME% to equivalent of $HOME
+if "%HOME%" == "" (set "HOME=%HOMEDRIVE%%HOMEPATH%")
+
+@REM Execute a user defined script before this one
+if not "%MAVEN_SKIP_RC%" == "" goto skipRcPre
+@REM check for pre script, once with legacy .bat ending and once with .cmd ending
+if exist "%USERPROFILE%\mavenrc_pre.bat" call "%USERPROFILE%\mavenrc_pre.bat" %*
+if exist "%USERPROFILE%\mavenrc_pre.cmd" call "%USERPROFILE%\mavenrc_pre.cmd" %*
+:skipRcPre
+
+@setlocal
+
+set ERROR_CODE=0
+
+@REM To isolate internal variables from possible post scripts, we use another setlocal
+@setlocal
+
+@REM ==== START VALIDATION ====
+if not "%JAVA_HOME%" == "" goto OkJHome
+
+echo.
+echo Error: JAVA_HOME not found in your environment. >&2
+echo Please set the JAVA_HOME variable in your environment to match the >&2
+echo location of your Java installation. >&2
+echo.
+goto error
+
+:OkJHome
+if exist "%JAVA_HOME%\bin\java.exe" goto init
+
+echo.
+echo Error: JAVA_HOME is set to an invalid directory. >&2
+echo JAVA_HOME = "%JAVA_HOME%" >&2
+echo Please set the JAVA_HOME variable in your environment to match the >&2
+echo location of your Java installation. >&2
+echo.
+goto error
+
+@REM ==== END VALIDATION ====
+
+:init
+
+@REM Find the project base dir, i.e. the directory that contains the folder ".mvn".
+@REM Fallback to current working directory if not found.
+
+set MAVEN_PROJECTBASEDIR=%MAVEN_BASEDIR%
+IF NOT "%MAVEN_PROJECTBASEDIR%"=="" goto endDetectBaseDir
+
+set EXEC_DIR=%CD%
+set WDIR=%EXEC_DIR%
+:findBaseDir
+IF EXIST "%WDIR%"\.mvn goto baseDirFound
+cd ..
+IF "%WDIR%"=="%CD%" goto baseDirNotFound
+set WDIR=%CD%
+goto findBaseDir
+
+:baseDirFound
+set MAVEN_PROJECTBASEDIR=%WDIR%
+cd "%EXEC_DIR%"
+goto endDetectBaseDir
+
+:baseDirNotFound
+set MAVEN_PROJECTBASEDIR=%EXEC_DIR%
+cd "%EXEC_DIR%"
+
+:endDetectBaseDir
+
+IF NOT EXIST "%MAVEN_PROJECTBASEDIR%\.mvn\jvm.config" goto endReadAdditionalConfig
+
+@setlocal EnableExtensions EnableDelayedExpansion
+for /F "usebackq delims=" %%a in ("%MAVEN_PROJECTBASEDIR%\.mvn\jvm.config") do set JVM_CONFIG_MAVEN_PROPS=!JVM_CONFIG_MAVEN_PROPS! %%a
+@endlocal & set JVM_CONFIG_MAVEN_PROPS=%JVM_CONFIG_MAVEN_PROPS%
+
+:endReadAdditionalConfig
+
+SET MAVEN_JAVA_EXE="%JAVA_HOME%\bin\java.exe"
+set WRAPPER_JAR="%MAVEN_PROJECTBASEDIR%\.mvn\wrapper\maven-wrapper.jar"
+set WRAPPER_LAUNCHER=org.apache.maven.wrapper.MavenWrapperMain
+
+set WRAPPER_URL="https://repo.maven.apache.org/maven2/org/apache/maven/wrapper/maven-wrapper/3.2.0/maven-wrapper-3.2.0.jar"
+
+FOR /F "usebackq tokens=1,2 delims==" %%A IN ("%MAVEN_PROJECTBASEDIR%\.mvn\wrapper\maven-wrapper.properties") DO (
+ IF "%%A"=="wrapperUrl" SET WRAPPER_URL=%%B
+)
+
+@REM Extension to allow automatically downloading the maven-wrapper.jar from Maven-central
+@REM This allows using the maven wrapper in projects that prohibit checking in binary data.
+if exist %WRAPPER_JAR% (
+ if "%MVNW_VERBOSE%" == "true" (
+ echo Found %WRAPPER_JAR%
+ )
+) else (
+ if not "%MVNW_REPOURL%" == "" (
+ SET WRAPPER_URL="%MVNW_REPOURL%/org/apache/maven/wrapper/maven-wrapper/3.2.0/maven-wrapper-3.2.0.jar"
+ )
+ if "%MVNW_VERBOSE%" == "true" (
+ echo Couldn't find %WRAPPER_JAR%, downloading it ...
+ echo Downloading from: %WRAPPER_URL%
+ )
+
+ powershell -Command "&{"^
+ "$webclient = new-object System.Net.WebClient;"^
+ "if (-not ([string]::IsNullOrEmpty('%MVNW_USERNAME%') -and [string]::IsNullOrEmpty('%MVNW_PASSWORD%'))) {"^
+ "$webclient.Credentials = new-object System.Net.NetworkCredential('%MVNW_USERNAME%', '%MVNW_PASSWORD%');"^
+ "}"^
+ "[Net.ServicePointManager]::SecurityProtocol = [Net.SecurityProtocolType]::Tls12; $webclient.DownloadFile('%WRAPPER_URL%', '%WRAPPER_JAR%')"^
+ "}"
+ if "%MVNW_VERBOSE%" == "true" (
+ echo Finished downloading %WRAPPER_JAR%
+ )
+)
+@REM End of extension
+
+@REM If specified, validate the SHA-256 sum of the Maven wrapper jar file
+SET WRAPPER_SHA_256_SUM=""
+FOR /F "usebackq tokens=1,2 delims==" %%A IN ("%MAVEN_PROJECTBASEDIR%\.mvn\wrapper\maven-wrapper.properties") DO (
+ IF "%%A"=="wrapperSha256Sum" SET WRAPPER_SHA_256_SUM=%%B
+)
+IF NOT %WRAPPER_SHA_256_SUM%=="" (
+ powershell -Command "&{"^
+ "$hash = (Get-FileHash \"%WRAPPER_JAR%\" -Algorithm SHA256).Hash.ToLower();"^
+ "If('%WRAPPER_SHA_256_SUM%' -ne $hash){"^
+ " Write-Output 'Error: Failed to validate Maven wrapper SHA-256, your Maven wrapper might be compromised.';"^
+ " Write-Output 'Investigate or delete %WRAPPER_JAR% to attempt a clean download.';"^
+ " Write-Output 'If you updated your Maven version, you need to update the specified wrapperSha256Sum property.';"^
+ " exit 1;"^
+ "}"^
+ "}"
+ if ERRORLEVEL 1 goto error
+)
+
+@REM Provide a "standardized" way to retrieve the CLI args that will
+@REM work with both Windows and non-Windows executions.
+set MAVEN_CMD_LINE_ARGS=%*
+
+%MAVEN_JAVA_EXE% ^
+ %JVM_CONFIG_MAVEN_PROPS% ^
+ %MAVEN_OPTS% ^
+ %MAVEN_DEBUG_OPTS% ^
+ -classpath %WRAPPER_JAR% ^
+ "-Dmaven.multiModuleProjectDirectory=%MAVEN_PROJECTBASEDIR%" ^
+ %WRAPPER_LAUNCHER% %MAVEN_CONFIG% %*
+if ERRORLEVEL 1 goto error
+goto end
+
+:error
+set ERROR_CODE=1
+
+:end
+@endlocal & set ERROR_CODE=%ERROR_CODE%
+
+if not "%MAVEN_SKIP_RC%"=="" goto skipRcPost
+@REM check for post script, once with legacy .bat ending and once with .cmd ending
+if exist "%USERPROFILE%\mavenrc_post.bat" call "%USERPROFILE%\mavenrc_post.bat"
+if exist "%USERPROFILE%\mavenrc_post.cmd" call "%USERPROFILE%\mavenrc_post.cmd"
+:skipRcPost
+
+@REM pause the script if MAVEN_BATCH_PAUSE is set to 'on'
+if "%MAVEN_BATCH_PAUSE%"=="on" pause
+
+if "%MAVEN_TERMINATE_CMD%"=="on" exit %ERROR_CODE%
+
+cmd /C exit /B %ERROR_CODE%
diff --git a/parallel-consumer-core/pom.xml b/parallel-consumer-core/pom.xml
new file mode 100644
index 000000000..f3c39f4ea
--- /dev/null
+++ b/parallel-consumer-core/pom.xml
@@ -0,0 +1,168 @@
+
+
+
+
+ io.confluent.parallelconsumer
+ parallel-consumer-parent
+ 0.5.2.8-SNAPSHOT
+
+
+ 4.0.0
+
+ parallel-consumer-core
+ Confluent Parallel Consumer Core
+
+
+
+
+ org.apache.kafka
+ kafka-clients
+ ${kafka.version}
+
+
+ com.github.luben
+ zstd-jni
+ 1.5.5-4
+ compile
+
+
+ org.xerial.snappy
+ snappy-java
+ 1.1.10.3
+ compile
+
+
+ io.micrometer
+ micrometer-core
+ compile
+
+
+
+
+ org.awaitility
+ awaitility
+ test
+
+
+ org.junit.jupiter
+ junit-jupiter-params
+ test
+
+
+ org.junit-pioneer
+ junit-pioneer
+ test
+
+
+ org.testcontainers
+ testcontainers
+ test
+
+
+ org.testcontainers
+ kafka
+ test
+
+
+ org.testcontainers
+ junit-jupiter
+ test
+
+
+ org.apache.commons
+ commons-lang3
+ test
+
+
+ me.tongfei
+ progressbar
+ test
+
+
+ org.testcontainers
+ postgresql
+ test
+
+
+ org.postgresql
+ postgresql
+ 42.6.0
+ test
+
+
+ com.github.tomakehurst
+ wiremock-jre8
+ test
+
+
+ org.threeten
+ threeten-extra
+ 1.7.2
+ test
+
+
+ io.stubbs.truth
+ truth-generator-api
+ ${truth-generator-maven-plugin.version}
+ test
+
+
+ uk.co.jemos.podam
+ podam
+ 7.2.11.RELEASE
+ test
+
+
+
+
+
+
+ io.stubbs.truth
+ truth-generator-maven-plugin
+ ${truth-generator-maven-plugin.version}
+
+ true
+ false
+ true
+ 8
+
+ io.confluent.parallelconsumer.PollContext
+ io.confluent.parallelconsumer.ParallelEoSStreamProcessor
+ io.confluent.parallelconsumer.internal.ProducerManager
+ io.confluent.parallelconsumer.state.WorkContainer
+ io.confluent.parallelconsumer.state.WorkManager
+ io.confluent.parallelconsumer.state.PartitionState
+ io.confluent.parallelconsumer.state.ProcessingShard
+ io.confluent.parallelconsumer.state.ShardKey
+ io.confluent.parallelconsumer.offsets.OffsetEncoding
+
+
+
+ org.apache.kafka.clients.consumer.OffsetAndMetadata
+ org.apache.kafka.clients.consumer.ConsumerRecord
+ org.apache.kafka.clients.consumer.ConsumerRecords
+ org.apache.kafka.clients.consumer.Consumer
+ org.apache.kafka.clients.producer.RecordMetadata
+ org.apache.kafka.clients.producer.ProducerRecord
+ org.apache.kafka.clients.producer.Producer
+
+ io.confluent.parallelconsumer
+
+
+
+ generate-test-sources
+
+ generate
+
+
+
+
+
+
+
+
+
diff --git a/parallel-consumer-core/src/main/java/io/confluent/csid/utils/BackportUtils.java b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/BackportUtils.java
new file mode 100644
index 000000000..16c2c5e14
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/BackportUtils.java
@@ -0,0 +1,80 @@
+package io.confluent.csid.utils;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import lombok.experimental.UtilityClass;
+
+import java.io.EOFException;
+import java.io.IOException;
+import java.io.InputStream;
+import java.time.Duration;
+import java.util.Arrays;
+import java.util.Optional;
+
+@UtilityClass
+public class BackportUtils {
+
+ /**
+ * @see Duration#toSeconds() intro'd in Java 9 (isn't in 8)
+ */
+ public static long toSeconds(Duration duration) {
+ return duration.toMillis() / 1000;
+ }
+
+ /**
+ * @see Optional#isEmpty() intro'd java 11
+ */
+ public static boolean isEmpty(Optional> optional) {
+ return !optional.isPresent();
+ }
+
+
+ /**
+ * @see Optional#isEmpty() intro'd java 11
+ */
+ public static boolean hasNo(Optional> optional) {
+ return !optional.isPresent();
+ }
+
+ public static byte[] readFully(InputStream is) throws IOException {
+ return BackportUtils.readFully(is, -1, true);
+ }
+
+ /**
+ * Used in Java 8 environments (Java 9 has read all bytes)
+ *
+ * https://stackoverflow.com/a/25892791/105741
+ */
+ public static byte[] readFully(InputStream is, int length, boolean readAll) throws IOException {
+ byte[] output = {};
+ if (length == -1) length = Integer.MAX_VALUE;
+ int pos = 0;
+ while (pos < length) {
+ int bytesToRead;
+ if (pos >= output.length) { // Only expand when there's no room
+ bytesToRead = Math.min(length - pos, output.length + 1024);
+ if (output.length < pos + bytesToRead) {
+ output = Arrays.copyOf(output, pos + bytesToRead);
+ }
+ } else {
+ bytesToRead = output.length - pos;
+ }
+ int cc = is.read(output, pos, bytesToRead);
+ if (cc < 0) {
+ if (readAll && length != Integer.MAX_VALUE) {
+ throw new EOFException("Detect premature EOF");
+ } else {
+ if (output.length != pos) {
+ output = Arrays.copyOf(output, pos);
+ }
+ break;
+ }
+ }
+ pos += cc;
+ }
+ return output;
+ }
+
+}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/csid/utils/Java8StreamUtils.java b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/Java8StreamUtils.java
new file mode 100644
index 000000000..bf3f78d34
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/Java8StreamUtils.java
@@ -0,0 +1,45 @@
+package io.confluent.csid.utils;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import lombok.experimental.UtilityClass;
+
+import java.util.Deque;
+import java.util.Iterator;
+import java.util.Spliterator;
+import java.util.Spliterators;
+import java.util.stream.Stream;
+import java.util.stream.StreamSupport;
+
+@UtilityClass
+public class Java8StreamUtils {
+
+ public static Stream setupStreamFromDeque(Deque extends T> userProcessResultsStream) {
+ Spliterator spliterator = Spliterators.spliterator(new DequeIterator(userProcessResultsStream), userProcessResultsStream.size(), Spliterator.NONNULL);
+
+ return StreamSupport.stream(spliterator, false);
+ }
+
+ private static class DequeIterator implements Iterator {
+
+ private final Deque extends T> userProcessResultsStream;
+
+ public DequeIterator(Deque extends T> userProcessResultsStream) {
+ this.userProcessResultsStream = userProcessResultsStream;
+ }
+
+ @Override
+ public boolean hasNext() {
+ boolean notEmpty = !userProcessResultsStream.isEmpty();
+ return notEmpty;
+ }
+
+ @Override
+ public T next() {
+ T poll = userProcessResultsStream.poll();
+ return poll;
+ }
+ }
+}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/csid/utils/JavaUtils.java b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/JavaUtils.java
new file mode 100644
index 000000000..7d1739e60
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/JavaUtils.java
@@ -0,0 +1,82 @@
+package io.confluent.csid.utils;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import io.confluent.parallelconsumer.internal.InternalRuntimeException;
+import lombok.experimental.UtilityClass;
+
+import java.time.Duration;
+import java.util.*;
+import java.util.function.Function;
+import java.util.stream.Collector;
+import java.util.stream.Collectors;
+import java.util.stream.Stream;
+
+import static java.time.Duration.ofMillis;
+
+@UtilityClass
+public class JavaUtils {
+
+ public static Optional getLast(final List someList) {
+ if (someList.isEmpty()) return Optional.empty();
+ return Optional.of(someList.get(someList.size() - 1));
+ }
+
+ public static Optional getFirst(final List someList) {
+ return someList.isEmpty() ? Optional.empty() : Optional.of(someList.get(0));
+ }
+
+ public static Optional getOnlyOne(final Map stringMapMap) {
+ if (stringMapMap.isEmpty()) return Optional.empty();
+ Collection values = stringMapMap.values();
+ if (values.size() > 1) throw new InternalRuntimeException("More than one element");
+ return Optional.of(values.iterator().next());
+ }
+
+ public static Duration max(Duration left, Duration right) {
+ long expectedDurationOfClose = Math.max(left.toMillis(), right.toMillis());
+ return ofMillis(expectedDurationOfClose);
+ }
+
+ public static boolean isGreaterThan(Duration compare, Duration to) {
+ return compare.compareTo(to) > 0;
+ }
+
+ /**
+ * A shortcut for changing only the values of a Map.
+ *
+ * https://stackoverflow.com/a/50740570/105741
+ */
+ public static Map remap(Map map,
+ Function super V1, ? extends V2> function) {
+ return map.entrySet()
+ .stream() // or parallel
+ .collect(Collectors.toMap(
+ Map.Entry::getKey,
+ e -> function.apply(e.getValue())
+ ));
+ }
+
+ public static List getRandom(List list, int quantity) {
+ if (list.size() < quantity) {
+ throw new IllegalArgumentException("List size is less than quantity");
+ }
+
+ return createRandomIntStream(list.size())
+ .limit(quantity)
+ .map(list::get)
+ .collect(Collectors.toList());
+ }
+
+ private static Stream createRandomIntStream(int range) {
+ final Random random = new Random();
+ return Stream.generate(() -> random.nextInt(range));
+ }
+
+ public static Collector> toTreeSet() {
+ return Collectors.toCollection(TreeSet::new);
+ }
+
+}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/csid/utils/KafkaUtils.java b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/KafkaUtils.java
new file mode 100644
index 000000000..2aa58614f
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/KafkaUtils.java
@@ -0,0 +1,21 @@
+package io.confluent.csid.utils;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import lombok.experimental.UtilityClass;
+import org.apache.kafka.clients.consumer.ConsumerRecord;
+import org.apache.kafka.common.TopicPartition;
+
+/**
+ * Simple identifier tuple for Topic Partitions
+ */
+@UtilityClass
+public final class KafkaUtils {
+
+ public static TopicPartition toTopicPartition(ConsumerRecord, ?> rec) {
+ return new TopicPartition(rec.topic(), rec.partition());
+ }
+
+}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/csid/utils/LoopingResumingIterator.java b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/LoopingResumingIterator.java
new file mode 100644
index 000000000..5258d70cd
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/LoopingResumingIterator.java
@@ -0,0 +1,173 @@
+package io.confluent.csid.utils;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import lombok.Getter;
+import lombok.extern.slf4j.Slf4j;
+
+import java.util.Iterator;
+import java.util.Map;
+import java.util.Optional;
+
+/**
+ * Loop implementations that will resume from a given key. Can be constructed and used as an iterable, or a function
+ * passed into the static version {@link #iterateStartingFromKeyLooping}.
+ *
+ * Uses a looser contract than {@link Iterator} - that being it has no #hasNext() method - instead, it's {@link #next()}
+ * returns {@link Optional#empty()} when it's done.
+ *
+ * The non-functional version is useful when you want to use looping constructs such as {@code break} and
+ * {@code continue}.
+ *
+ *
+ * @author Antony Stubbs
+ */
+@Slf4j
+public class LoopingResumingIterator {
+
+ private Optional> head = Optional.empty();
+
+ /**
+ * See {@link java.util.concurrent.ConcurrentHashMap} docs on iteration
+ *
+ * @see java.util.concurrent.ConcurrentHashMap.Traverser
+ */
+ private Iterator> wrappedIterator;
+
+ /**
+ * As {@link java.util.concurrent.ConcurrentHashMap}'s iterators are thread safe, they see a snapshot of the map in
+ * time - this may cause the starting point key to be removed. In which case, we limit our iteration to taking the
+ * expected number of elements.
+ *
+ */
+ private final long iterationTargetCount;
+
+ /**
+ * The number of iterations we've done so far.
+ *
+ * @see #iterationTargetCount
+ */
+ private long iterationCount = 0;
+
+ /**
+ * The key to start from
+ */
+ @Getter
+ private final Optional iterationStartingPointKey;
+
+ private final Map map;
+
+ /**
+ * Where the iteration of the collection has now started again from index zero.
+ *
+ * Binary, as can only loop once after reach the end (to reach the initial starting point again).
+ */
+ private boolean isOnSecondPass = false;
+
+ /**
+ * Iteration has fully completed, and the collection is now exhausted.
+ */
+ private boolean terminalState = false;
+
+ /**
+ * A start key was provided, and it was found in the collection.
+ */
+ private boolean startingPointKeyValid = false;
+
+ public static LoopingResumingIterator build(KKEY startingKey, Map map) {
+ return new LoopingResumingIterator<>(Optional.ofNullable(startingKey), map);
+ }
+
+ /**
+ * Will resume from the startingKey, if it's present
+ */
+ @SuppressWarnings("OptionalUsedAsFieldOrParameterType")
+ public LoopingResumingIterator(Optional startingKey, Map map) {
+ this.iterationStartingPointKey = startingKey;
+ this.map = map;
+ this.wrappedIterator = map.entrySet().iterator();
+ this.iterationTargetCount = map.size();
+
+ // find the starting point
+ if (startingKey.isPresent()) {
+ this.head = advanceToStartingPointAndGet(startingKey.get());
+ if (head.isPresent()) {
+ this.startingPointKeyValid = true;
+ } else {
+ resetIteratorToZero();
+ }
+ }
+ }
+
+ public LoopingResumingIterator(Map map) {
+ this(Optional.empty(), map);
+ }
+
+
+ /**
+ * @return null if no more elements
+ */
+ public Optional> next() {
+ iterationCount++;
+
+ // special cases
+ if (terminalState) {
+ return Optional.empty();
+ } else if (this.head.isPresent()) {
+ Optional> headSave = takeHeadValue();
+ return headSave;
+ }
+
+ if (wrappedIterator.hasNext()) {
+ Map.Entry next = wrappedIterator.next();
+ // could find the starting point earlier
+ boolean onSecondPassAndReachedStartingPoint = iterationStartingPointKey.equals(Optional.of(next.getKey()));
+ // or it could be missing entirely
+ boolean numberElementsReturnedExceeded = iterationCount > iterationTargetCount + 1; // off by one due to eager increment
+ if (onSecondPassAndReachedStartingPoint || numberElementsReturnedExceeded) {
+ // end second iteration reached
+ terminalState = true;
+ return Optional.empty();
+ } else {
+ return Optional.ofNullable(next);
+ }
+ } else if (iterationStartingPointKey.isPresent() && startingPointKeyValid && !isOnSecondPass) {
+ // we've reached the end, but we have a starting point set, so loop back to the start and do second pass
+ resetIteratorToZero();
+ isOnSecondPass = true;
+ return next();
+ } else {
+ // end of 2nd pass
+ return Optional.empty();
+ }
+ }
+
+ private Optional> takeHeadValue() {
+ var headSave = head;
+ head = Optional.empty();
+ return headSave;
+ }
+
+ /**
+ * Finds the starting point entry, and sets its index if found.
+ *
+ * @return the starting point entry, if found. Otherwise, null.
+ * @see #startingPointIndex
+ */
+ private Optional> advanceToStartingPointAndGet(Object startingPointObject) {
+ while (wrappedIterator.hasNext()) {
+ Map.Entry next = wrappedIterator.next();
+ if (next.getKey() == startingPointObject) {
+ return Optional.of(next);
+ }
+ }
+ return Optional.empty();
+ }
+
+ private void resetIteratorToZero() {
+ wrappedIterator = map.entrySet().iterator();
+ }
+
+}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/csid/utils/MathUtils.java b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/MathUtils.java
new file mode 100644
index 000000000..ecb7420ae
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/MathUtils.java
@@ -0,0 +1,29 @@
+package io.confluent.csid.utils;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import lombok.experimental.UtilityClass;
+
+/**
+ * @author Antony Stubbs
+ */
+@UtilityClass
+public class MathUtils {
+
+ /**
+ * Ensures exact conversion from a Long to a Short.
+ *
+ * {@link Math} doesn't have an exact conversion from Long to Short.
+ *
+ * @see Math#toIntExact
+ */
+ public static short toShortExact(long value) {
+ final short shortCast = (short) value;
+ if (shortCast != value) {
+ throw new ArithmeticException("short overflow");
+ }
+ return shortCast;
+ }
+}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/csid/utils/Range.java b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/Range.java
new file mode 100644
index 000000000..4edc0bab6
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/Range.java
@@ -0,0 +1,109 @@
+package io.confluent.csid.utils;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import java.util.Iterator;
+import java.util.List;
+import java.util.NoSuchElementException;
+import java.util.stream.IntStream;
+import java.util.stream.LongStream;
+
+import static java.util.stream.Collectors.toList;
+
/**
 * Class for simple ranges.
 *
 * For loop - like the Python range function.
 *
 * @see #range(long)
 */
public class Range implements Iterable<Long> {

    /** First value produced (inclusive). */
    private final long start;

    /** Upper bound (exclusive). */
    private final long limit;

    /**
     * @see #range(int, long)
     */
    public Range(int start, long max) {
        this.start = start;
        this.limit = max;
    }

    public Range(long limit) {
        this.start = 0L;
        this.limit = limit;
    }

    /**
     * Provides an {@link Iterable} for the range of numbers from 0 to the given limit.
     *
     * Exclusive of max.
     *
     * Consider using {@link IntStream#range(int, int)} with {@code forEachOrdered} instead. However, if you don't want
     * to use a closure, this is a good alternative.
     */
    public static Range range(long max) {
        return new Range(max);
    }

    /**
     * @see #range(long)
     */
    public static Range range(int start, long max) {
        return new Range(start, max);
    }

    /**
     * Potentially slow, but useful for tests
     */
    public static List<Integer> listOfIntegers(int max) {
        return Range.range(max).listAsIntegers();
    }

    @Override
    public Iterator<Long> iterator() {
        final long max = limit;
        return new Iterator<>() {

            private long current = start;

            @Override
            public boolean hasNext() {
                return current < max;
            }

            @Override
            public Long next() {
                if (hasNext()) {
                    return current++;
                } else {
                    throw new NoSuchElementException("Range reached the end");
                }
            }

            @Override
            public void remove() {
                throw new UnsupportedOperationException("Can't remove values from a Range");
            }
        };
    }

    /**
     * Boxed int view of the range.
     *
     * @throws ArithmeticException if either bound overflows int (via {@link Math#toIntExact})
     */
    public List<Integer> listAsIntegers() {
        return IntStream.range(Math.toIntExact(start), Math.toIntExact(limit))
                .boxed()
                .collect(toList());
    }

    /** Primitive stream over {@code [start, limit)}. */
    public LongStream toStream() {
        return LongStream.range(start, limit);
    }

}
\ No newline at end of file
diff --git a/parallel-consumer-core/src/main/java/io/confluent/csid/utils/StringUtils.java b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/StringUtils.java
new file mode 100644
index 000000000..012e388e5
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/StringUtils.java
@@ -0,0 +1,26 @@
+package io.confluent.csid.utils;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import lombok.experimental.UtilityClass;
+import org.slf4j.helpers.FormattingTuple;
+import org.slf4j.helpers.MessageFormatter;
+
+@UtilityClass
+public class StringUtils {
+
+ /**
+ * @see MessageFormatter#arrayFormat(String, Object[])
+ * @see FormattingTuple#getMessage()
+ */
+ public static String msg(String s, Object... args) {
+ return MessageFormatter.arrayFormat(s, args).getMessage();
+ }
+
+ public static boolean isBlank(final String property) {
+ if (property == null) return true;
+ else return property.trim().isEmpty(); // isBlank @since 11
+ }
+}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/csid/utils/SupplierUtils.java b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/SupplierUtils.java
new file mode 100644
index 000000000..d08616959
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/SupplierUtils.java
@@ -0,0 +1,33 @@
+package io.confluent.csid.utils;
+
+/*-
+ * Copyright (C) 2020-2023 Confluent, Inc.
+ */
+
+import lombok.experimental.UtilityClass;
+
+import java.util.Objects;
+import java.util.concurrent.atomic.AtomicReference;
+import java.util.function.Supplier;
+
+@UtilityClass
+public class SupplierUtils {
+
+ public static Supplier memoize(Supplier delegate) {
+ Objects.requireNonNull(delegate);
+ AtomicReference value = new AtomicReference<>();
+ return () -> {
+ T val = value.get();
+ if (val == null) {
+ synchronized (value) {
+ val = value.get();
+ if (val == null) {
+ val = Objects.requireNonNull(delegate.get());
+ value.set(val);
+ }
+ }
+ }
+ return val;
+ };
+ }
+}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/csid/utils/TimeUtils.java b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/TimeUtils.java
new file mode 100644
index 000000000..e9b3bd161
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/csid/utils/TimeUtils.java
@@ -0,0 +1,54 @@
+package io.confluent.csid.utils;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import lombok.Builder;
+import lombok.SneakyThrows;
+import lombok.Value;
+import lombok.experimental.UtilityClass;
+import lombok.extern.slf4j.Slf4j;
+
+import java.time.Clock;
+import java.time.Duration;
+import java.util.concurrent.Callable;
+
+@Slf4j
+@UtilityClass
+public class TimeUtils {
+
+ public Clock getClock() {
+ return Clock.systemUTC();
+ }
+
+ @SneakyThrows
+ public static RESULT time(final Callable func) {
+ return timeWithMeta(func).getResult();
+ }
+
+ @SneakyThrows
+ public static TimeResult timeWithMeta(final Callable extends RESULT> func) {
+ long start = System.currentTimeMillis();
+ TimeResult.TimeResultBuilder timer = TimeResult.builder().startMs(start);
+ RESULT call = func.call();
+ timer.result(call);
+ long end = System.currentTimeMillis();
+ long elapsed = end - start;
+ timer.endMs(end);
+ log.trace("Function took {}", Duration.ofMillis(elapsed));
+ return timer.build();
+ }
+
+ @Builder
+ @Value
+ public static class TimeResult {
+ long startMs;
+ long endMs;
+ RESULT result;
+
+ public Duration getElapsed() {
+ return Duration.ofMillis(endMs - startMs);
+ }
+ }
+}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/ExceptionInUserFunctionException.java b/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/ExceptionInUserFunctionException.java
new file mode 100644
index 000000000..82192f9ca
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/ExceptionInUserFunctionException.java
@@ -0,0 +1,14 @@
+package io.confluent.parallelconsumer;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import lombok.experimental.StandardException;
+
/**
 * This exception is only used when there is an exception thrown from code provided by the user.
 */
@StandardException // lombok: generates the standard constructor set (no-arg / message / cause / message+cause)
public class ExceptionInUserFunctionException extends ParallelConsumerException {
}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/JStreamParallelEoSStreamProcessor.java b/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/JStreamParallelEoSStreamProcessor.java
new file mode 100644
index 000000000..fa8d90847
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/JStreamParallelEoSStreamProcessor.java
@@ -0,0 +1,41 @@
+package io.confluent.parallelconsumer;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import io.confluent.csid.utils.Java8StreamUtils;
+import lombok.extern.slf4j.Slf4j;
+import org.apache.kafka.clients.producer.ProducerRecord;
+
+import java.util.List;
+import java.util.concurrent.ConcurrentLinkedDeque;
+import java.util.function.Function;
+import java.util.stream.Stream;
+
@Slf4j
// NOTE(review): generic type parameters appear to have been stripped from this file (the class, its superclass,
// and the Stream/Deque element types would normally carry them, e.g. "Stream>") - restore from version control
// before compiling; the exact parameterisation cannot be reconstructed from this view alone.
public class JStreamParallelEoSStreamProcessor extends ParallelEoSStreamProcessor implements JStreamParallelStreamProcessor {

    // lazily-consumed stream view backed by userProcessResultsStream (see constructor)
    private final Stream> stream;

    // results are appended here by the wrapper callback, then surface through the stream above
    private final ConcurrentLinkedDeque> userProcessResultsStream;

    public JStreamParallelEoSStreamProcessor(ParallelConsumerOptions parallelConsumerOptions) {
        super(parallelConsumerOptions);

        this.userProcessResultsStream = new ConcurrentLinkedDeque<>();

        // adapt the deque into a Java 8 Stream (see Java8StreamUtils#setupStreamFromDeque for the semantics)
        this.stream = Java8StreamUtils.setupStreamFromDeque(this.userProcessResultsStream);
    }

    @Override
    public Stream> pollProduceAndStream(Function, List>> userFunction) {
        // delegate to the callback-based flow, capturing each result into the deque backing our stream
        super.pollAndProduceMany(userFunction, result -> {
            log.trace("Wrapper callback applied, sending result to stream. Input: {}", result);
            this.userProcessResultsStream.add(result);
        });

        return this.stream;
    }

}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/JStreamParallelStreamProcessor.java b/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/JStreamParallelStreamProcessor.java
new file mode 100644
index 000000000..be55c7d80
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/JStreamParallelStreamProcessor.java
@@ -0,0 +1,30 @@
+package io.confluent.parallelconsumer;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import io.confluent.parallelconsumer.internal.AbstractParallelEoSStreamProcessor;
+import io.confluent.parallelconsumer.internal.DrainingCloseable;
+import org.apache.kafka.clients.producer.ProducerRecord;
+
+import java.util.List;
+import java.util.function.Function;
+import java.util.stream.Stream;
+
// NOTE(review): generic type parameters appear stripped here too (interface declaration and both method
// signatures, e.g. "Stream>") - restore from version control; not reconstructable with confidence from this view.
public interface JStreamParallelStreamProcessor extends DrainingCloseable {

    // factory for the JStream-flavoured EoS stream processor implementation
    static JStreamParallelStreamProcessor createJStreamEosStreamProcessor(ParallelConsumerOptions options) {
        return new JStreamParallelEoSStreamProcessor<>(options);
    }

    /**
     * Like {@link AbstractParallelEoSStreamProcessor#pollAndProduceMany} but instead of callbacks, streams the results
     * instead, after the produce result is ack'd by Kafka.
     *
     * @return a stream of results of applying the function to the polled records
     */
    Stream> pollProduceAndStream(
            Function,
                    List>> userFunction);
}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/PCRetriableException.java b/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/PCRetriableException.java
new file mode 100644
index 000000000..7fe1a3ad7
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/PCRetriableException.java
@@ -0,0 +1,23 @@
+package io.confluent.parallelconsumer;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import lombok.experimental.StandardException;
+
/**
 * A user's processing function can throw this exception, which signals to PC that processing of the message has failed,
 * and that it should be retried at a later time.
 *
 * The advantage of throwing this exception explicitly, is that PC will not log an ERROR. If any other type of exception
 * is thrown by the user's function, that will be logged as an error (but will still be retried later).
 *
 * So in short, if this exception is thrown, nothing will be logged (except at DEBUG level), any other exception will be
 * logged as an error.
 *
 * @author Antony Stubbs
 */
@StandardException // lombok: generates the standard constructor set (no-arg / message / cause / message+cause)
public class PCRetriableException extends RuntimeException {
}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/ParallelConsumer.java b/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/ParallelConsumer.java
new file mode 100644
index 000000000..de95f1f98
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/ParallelConsumer.java
@@ -0,0 +1,101 @@
+package io.confluent.parallelconsumer;
+
+/*-
+ * Copyright (C) 2020-2022 Confluent, Inc.
+ */
+
+import io.confluent.parallelconsumer.internal.AbstractParallelEoSStreamProcessor;
+import io.confluent.parallelconsumer.internal.DrainingCloseable;
+import lombok.Data;
+import org.apache.kafka.clients.consumer.ConsumerRebalanceListener;
+import org.apache.kafka.clients.consumer.KafkaConsumer;
+
+import java.util.Collection;
+import java.util.regex.Pattern;
+
+// tag::javadoc[]
+/**
+ * Asynchronous / concurrent message consumer for Kafka.
+ *
+ * Currently, there is no direct implementation, only the {@link ParallelStreamProcessor} version (see
+ * {@link AbstractParallelEoSStreamProcessor}), but there may be in the future.
+ *
+ * @param key consume / produce key type
+ * @param value consume / produce value type
+ * @see AbstractParallelEoSStreamProcessor
+ */
+// end::javadoc[]
+public interface ParallelConsumer extends DrainingCloseable {
+
+ /**
+ * @return true if the system has either closed, or has crashed
+ */
+ boolean isClosedOrFailed();
+
+ /**
+ * @see KafkaConsumer#subscribe(Collection)
+ */
+ void subscribe(Collection topics);
+
+ /**
+ * @see KafkaConsumer#subscribe(Pattern)
+ */
+ void subscribe(Pattern pattern);
+
+ /**
+ * @see KafkaConsumer#subscribe(Collection, ConsumerRebalanceListener)
+ */
+ void subscribe(Collection topics, ConsumerRebalanceListener callback);
+
+ /**
+ * @see KafkaConsumer#subscribe(Pattern, ConsumerRebalanceListener)
+ */
+ void subscribe(Pattern pattern, ConsumerRebalanceListener callback);
+
+ /**
+ * Pause this consumer (i.e. stop processing of messages).
+ *
+ * This operation only has an effect if the consumer is currently running. In all other cases calling this method
+ * will be a silent no-op.
+ *
+ * Once the consumer is paused, the system will stop submitting work to the processing pool. Already submitted in
+ * flight work however will be finished. This includes work that is currently being processed inside a user function
+ * as well as work that has already been submitted to the processing pool but has not been picked up by a free
+ * worker yet.
+ *
+ * General remarks:
+ *
+ *
A paused consumer may still keep polling for new work until internal buffers are filled.
+ *
This operation does not actively pause the subscription on the underlying Kafka Broker (compared to
+ * {@link KafkaConsumer#pause KafkaConsumer#pause}).
+ *
Pending offset commits will still be performed when the consumer is paused.
+ *
+ */
+ void pauseIfRunning();
+
+ /**
+ * Resume this consumer (i.e. continue processing of messages).
+ *
+ * This operation only has an effect if the consumer is currently paused. In all other cases calling this method
+ * will be a silent no-op.
+ *
+ * If you want to go deeper, look at {@link #defaultMessageRetryDelay}, {@link #retryDelayProvider} and
+ * {@link #commitMode}.
+ *
+ * Note: The only required option is the {@link #consumer} ({@link #producer} is only needed if you use the Produce
+ * flows). All other options have sensible defaults.
+ *
+ * @author Antony Stubbs
+ * @see #builder()
+ * @see ParallelConsumerOptions.ParallelConsumerOptionsBuilder
+ */
+@Getter
+@Builder(toBuilder = true)
+@ToString
+@FieldNameConstants
+@InterfaceStability.Evolving
+public class ParallelConsumerOptions {
+
+ /**
+ * Required parameter for all use.
+ */
+ private final Consumer consumer;
+
+ /**
+ * Supplying a producer is only needed if using the produce flows.
+ *
+ * @see ParallelStreamProcessor
+ */
+ private final Producer producer;
+
+ /**
+ * Path to Managed executor service for Java EE
+ */
+ @Builder.Default
+ private final String managedExecutorService = "java:comp/DefaultManagedExecutorService";
+
+ /**
+ * Path to Managed thread factory for Java EE
+ */
+ @Builder.Default
+ private final String managedThreadFactory = "java:comp/DefaultManagedThreadFactory";
+
+ /**
+ * Micrometer MeterRegistry
+ *
+ * Optional - if not specified CompositeMeterRegistry will be used which is NoOp
+ */
+ private final MeterRegistry meterRegistry;
+
+ /**
+ * PC Instance metrics tag value - if specified - should be unique to allow instance specific meters to be created
+ * and cleared. Used with Tag key {@link PCMetricsDef#PC_INSTANCE_TAG}
+ *
+ * If not set - unique UUID will be generated for it
+ */
+ private final String pcInstanceTag;
+
+ /**
+ * Additional common metrics tags - will be added to all created meters
+ */
+ @Builder.Default
+ private final Iterable metricsTags = Tags.empty();
+
+ /**
+ * The ordering guarantee to use.
+ */
+ public enum ProcessingOrder {
+
+ /**
+ * No ordering is guaranteed, not even partition order. Fastest. Concurrency is at most the max number of
+ * concurrency or max number of uncommitted messages, limited by the max concurrency or uncommitted settings.
+ */
+ UNORDERED,
+
+ /**
+ * Process messages within a partition in order, but process multiple partitions in parallel. Similar to running
+ * more consumers for a topic. Concurrency is at most the number of partitions.
+ */
+ PARTITION,
+
+ /**
+ * Process messages in key order. Concurrency is at most the number of unique keys in a topic, limited by the
+ * max concurrency or uncommitted settings.
+ */
+ KEY
+ }
+
+ /**
+ * The type of commit to be made, with either a transactions configured Producer where messages produced are
+ * committed back to the Broker along with the offsets they originated from, or with the faster simpler Consumer
+ * offset system either synchronously or asynchronously
+ */
+ public enum CommitMode {
+
+ // tag::transactionalJavadoc[]
+ /**
+ * Periodically commits through the Producer using transactions.
+ *
+ * Messages sent in parallel by different workers get added to the same transaction block - you end up with
+ * transactions 100ms (by default) "large", containing all records sent during that time period, from the
+ * offsets being committed.
+ *
+ * Of no use, if not also producing messages (i.e. using a {@link ParallelStreamProcessor#pollAndProduce}
+ * variation).
+ *
+ * Note: Records being sent by different threads will all be in a single transaction, as PC shares a single
+ * Producer instance. This could be seen as a performance overhead advantage, efficient resource use, in
+ * exchange for a loss in transaction granularity.
+ *
+ * The benefits of using this mode are:
+ *
+ * a) All records produced from a given source offset will either all be visible, or none will be
+ * ({@link org.apache.kafka.common.IsolationLevel#READ_COMMITTED}).
+ *
+ * b) If any records making up a transaction have a terminal issue being produced, or the system crashes before
+ * finishing sending all the records and committing, none will ever be visible and the system will eventually
+ * retry them in new transactions - potentially with different combinations of records from the original.
+ *
+ * c) A source offset, and its produced records will be committed as an atomic set. Normally: either the record
+ * producing could fail, or the committing of the source offset could fail, as they are separate individual
+ * operations. When using Transactions, they are committed together - so if either operations fails, the
+ * transaction will never get committed, and upon recovery, the system will retry the set again (and no
+ * duplicates will be visible in the topic).
+ *
+ * This {@code CommitMode} is the slowest of the options, but there will be no duplicates in Kafka caused by
+ * producing a record multiple times if previous offset commits have failed or crashes have occurred (however
+ * message replay may cause duplicates in external systems which is unavoidable - external systems must be
+ * idempotent).
+ *
+ * The default commit interval {@link AbstractParallelEoSStreamProcessor#KAFKA_DEFAULT_AUTO_COMMIT_FREQUENCY}
+ * gets automatically reduced from the default of 5 seconds to 100ms (the same as Kafka Streams commit.interval.ms).
+ * Reducing this configuration places higher load on the broker, but will reduce (but cannot eliminate) replay
+ * upon failure. Note also that when using transactions in Kafka, consumption in {@code READ_COMMITTED} mode is
+ * blocked up to the offset of the first STILL open transaction. Using a smaller commit frequency reduces this
+ * minimum consumption latency - the faster transactions are closed, the faster the transaction content can be
+ * read by {@code READ_COMMITTED} consumers. More information about this can be found on the Confluent blog
+ * post:
+ * Enabling Exactly-Once in Kafka
+ * Streams.
+ *
+ * When producing multiple records (see {@link ParallelStreamProcessor#pollAndProduceMany}), all records must
+ * have been produced successfully to the broker before the transaction will commit, after which all will be
+ * visible together, or none.
+ *
+ * Records produced while running in this mode, won't be seen by consumer running in
+ * {@link ConsumerConfig#ISOLATION_LEVEL_CONFIG} {@link org.apache.kafka.common.IsolationLevel#READ_COMMITTED}
+ * mode until the transaction is complete and all records are produced successfully. Records produced into a
+ * transaction that gets aborted or timed out, will never be visible.
+ *
+ * The system must prevent records from being produced to the brokers whose source consumer record offsets has
+ * not been included in this transaction. Otherwise, the transactions would include produced records from
+ * consumer offsets which would only be committed in the NEXT transaction, which would break the EoS guarantees.
+ * To achieve this, first work processing and record producing is suspended (by acquiring the commit lock -
+ * see{@link #commitLockAcquisitionTimeout}, as record processing requires the produce lock), then succeeded
+ * consumer offsets are gathered, transaction commit is made, then when the transaction has finished, processing
+ * resumes by releasing the commit lock. This periodically slows down record production during this phase, by
+ * the time needed to commit the transaction.
+ *
+ * This is all separate from using an IDEMPOTENT Producer, which can be used, along with the
+ * {@link ParallelConsumerOptions#commitMode} {@link CommitMode#PERIODIC_CONSUMER_SYNC} or
+ * {@link CommitMode#PERIODIC_CONSUMER_ASYNCHRONOUS}.
+ *
+ * Failure:
+ *
+ * Commit lock: If the system cannot acquire the commit lock in time, it will shut down for whatever reason, the
+ * system will shut down (fail fast) - during the shutdown a final commit attempt will be made. The default
+ * timeout for acquisition is very high though - see {@link #commitLockAcquisitionTimeout}. This can be caused
+ * by the user processing function taking too long to complete.
+ *
+ * Produce lock: If the system cannot acquire the produce lock in time, it will fail the record processing and
+ * retry the record later. This can be caused by the controller taking too long to commit for some reason. See
+ * {@link #produceLockAcquisitionTimeout}. If using {@link #allowEagerProcessingDuringTransactionCommit}, this
+ * may cause side effect replay when the record is retried, otherwise there is no replay. See
+ * {@link #allowEagerProcessingDuringTransactionCommit} for more details.
+ *
+ * @see ParallelConsumerOptions.ParallelConsumerOptionsBuilder#commitInterval
+ */
+ // end::transactionalJavadoc[]
+ PERIODIC_TRANSACTIONAL_PRODUCER,
+
+ /**
+ * Periodically synchronous commits with the Consumer. Much faster than
+ * {@link #PERIODIC_TRANSACTIONAL_PRODUCER}. Slower but potentially fewer duplicates than
+ * {@link #PERIODIC_CONSUMER_ASYNCHRONOUS} upon replay.
+ */
+ PERIODIC_CONSUMER_SYNC,
+
+ /**
+ * Periodically commits offsets asynchronously. The fastest option, under normal conditions will have few or no
+ * duplicates. Under failure recovery may have more duplicates than {@link #PERIODIC_CONSUMER_SYNC}.
+ */
+ PERIODIC_CONSUMER_ASYNCHRONOUS
+
+ }
+
+ /**
+ * Kafka's default auto commit interval - which is 5000ms.
+ *
+ * @see org.apache.kafka.clients.consumer.ConsumerConfig#AUTO_COMMIT_INTERVAL_MS_CONFIG
+ * @see org.apache.kafka.clients.consumer.ConsumerConfig#CONFIG
+ */
+ public static final int KAFKA_DEFAULT_AUTO_COMMIT_INTERVAL_MS = 5000;
+
+ public static final Duration DEFAULT_COMMIT_INTERVAL = ofMillis(KAFKA_DEFAULT_AUTO_COMMIT_INTERVAL_MS);
+
+ /*
+ * The same as Kafka Streams
+ */
+ public static final Duration DEFAULT_COMMIT_INTERVAL_FOR_TRANSACTIONS = ofMillis(100);
+
+ /**
+ * When using {@link CommitMode#PERIODIC_TRANSACTIONAL_PRODUCER}, allows new records to be processed UP UNTIL the
+ * result record SENDING ({@link Producer#send}) step, potentially while a transaction is being committed. Disabled
+ * by default as to prevent replay side effects when records need to be retried in some scenarios.
+ *
+ * Doesn't interfere with the transaction itself, just reduces side effects.
+ *
+ * Recommended to leave this off to avoid side effect duplicates upon rebalances after a crash. Enabling could
+ * improve performance as the produce lock will only be taken right before it's needed (optimistic locking) to
+ * produce the result record, instead of pessimistically locking.
+ */
+ @Builder.Default
+ private boolean allowEagerProcessingDuringTransactionCommit = false;
+
+ /**
+ * Time to allow for acquiring the commit lock. If record processing or producing takes a long time, you may need to
+ * increase this. If this fails, the system will shut down (fail fast) and attempt to commit once more.
+ */
+ @Builder.Default
+ private Duration commitLockAcquisitionTimeout = Duration.ofMinutes(5);
+
+ /**
+ * Time to allow for acquiring the produce lock. If transaction committing a long time, you may need to increase
+ * this. If this fails, the record will be returned to the processing queue for later retry.
+ */
+ @Builder.Default
+ private Duration produceLockAcquisitionTimeout = Duration.ofMinutes(1);
+
+ /**
+ * Time between commits. Using a higher frequency (a lower value) will put more load on the brokers.
+ */
+ @Builder.Default
+ private Duration commitInterval = DEFAULT_COMMIT_INTERVAL;
+
+ /**
+ * @deprecated only settable during {@code deprecation phase} - use
+ * {@link ParallelConsumerOptions.ParallelConsumerOptionsBuilder#commitInterval}} instead.
+ */
+ // todo delete in next major version
+ @Deprecated
+ public void setCommitInterval(Duration commitInterval) {
+ this.commitInterval = commitInterval;
+ }
+
+ /**
+ * The {@link ProcessingOrder} type to use
+ */
+ @Builder.Default
+ private final ProcessingOrder ordering = ProcessingOrder.KEY;
+
+ /**
+ * The {@link CommitMode} to be used
+ */
+ @Builder.Default
+ private final CommitMode commitMode = CommitMode.PERIODIC_CONSUMER_ASYNCHRONOUS;
+
+ /**
+ * Controls the maximum degree of concurrency to occur. Used to limit concurrent calls to external systems to a
+ * maximum to prevent overloading them or to a degree, using up quotas.
+ *
+ * When using {@link #getBatchSize()}, this is over and above the batch size setting. So for example, a
+ * {@link #getMaxConcurrency()} of {@code 2} and a batch size of {@code 3} would result in at most {@code 15}
+ * records being processed at once.
+ * (NOTE(review): {@link #getTargetAmountOfRecordsInFlight()} computes concurrency * batch size, which here is
+ * 2 * 3 = 6 - confirm where the figure {@code 15} comes from, it looks inconsistent.)
+ *
+ * A note on quotas - if your quota is expressed as maximum concurrent calls, this works well. If it's limited in
+ * total requests / sec, this may still overload the system. See towards the distributed rate limiting feature for
+ * this to be properly addressed: https://github.com/confluentinc/parallel-consumer/issues/24 Add distributed rate
+ * limiting support #24.
+ *
+ * In the core module, this sets the number of threads to use in the core's thread pool.
+ *
+ * It's recommended to set this quite high, much higher than core count, as it's expected that these threads will
+ * spend most of their time blocked waiting for IO. For automatic setting of this variable, look out for issue
+ * https://github.com/confluentinc/parallel-consumer/issues/21 Dynamic concurrency control with flow control or tcp
+ * congestion control theory #21.
+ */
+ @Builder.Default
+ private final int maxConcurrency = DEFAULT_MAX_CONCURRENCY;
+
+ public static final int DEFAULT_MAX_CONCURRENCY = 16;
+
+ public static final Duration DEFAULT_STATIC_RETRY_DELAY = Duration.ofSeconds(1);
+
+ /**
+ * Strategy for reacting to invalid offset metadata. This situation can arise by accident, or deliberately when a
+ * user attempts to reuse an existing consumer group id.
+ */
+ public enum InvalidOffsetMetadataHandlingPolicy {
+ /**
+ * Fail fast and shut the application down. This is the default behaviour.
+ */
+ FAIL,
+ /**
+ * Log a warning message, ignore the error, and carry on processing from the last committed offset.
+ */
+ IGNORE
+ }
+
+ /**
+ * Controls the error handling behaviour to use when invalid offsets metadata from a pre-existing consumer group is
+ * encountered. A potential scenario where this could occur is when a consumer group id from a Kafka Streams
+ * application is accidentally reused.
+ *
+ * Default is {@link InvalidOffsetMetadataHandlingPolicy#FAIL}
+ *
+ * @see InvalidOffsetMetadataHandlingPolicy
+ */
+ @Builder.Default
+ private final InvalidOffsetMetadataHandlingPolicy invalidOffsetMetadataPolicy = InvalidOffsetMetadataHandlingPolicy.FAIL;
+ /**
+ * When a message fails, how long the system should wait before trying that message again. Note that this will not
+ * be exact, and is just a target.
+ *
+ * Ignored when a {@link #getRetryDelayProvider()} is supplied, which takes precedence.
+ *
+ * @deprecated will be renamed to static retry delay
+ */
+ @Deprecated
+ @Builder.Default
+ private final Duration defaultMessageRetryDelay = DEFAULT_STATIC_RETRY_DELAY;
+
+ /**
+ * When present, use this to generate a dynamic retry delay, instead of a static one with
+ * {@link #getDefaultMessageRetryDelay()}.
+ *
+ * Overrides {@link #defaultMessageRetryDelay}, even if it's set.
+ */
+ private final Function, Duration> retryDelayProvider;
+
+ /**
+ * Controls how long to block while waiting for the {@link Producer#send} to complete for any ProducerRecords
+ * returned from the user-function. Only relevant if using one of the produce-flows and providing a
+ * {@link ParallelConsumerOptions#producer}. If the timeout occurs, the record will be re-processed in the
+ * user-function.
+ *
+ * Consider aligning the value with the {@link ParallelConsumerOptions#producer}-options to avoid unnecessary
+ * re-processing and duplicates on slow {@link Producer#send} calls.
+ *
+ * @see org.apache.kafka.clients.producer.ProducerConfig#DELIVERY_TIMEOUT_MS_CONFIG
+ */
+ @Builder.Default
+ private final Duration sendTimeout = Duration.ofSeconds(10);
+
+ /**
+ * Controls how long to block while waiting for offsets to be committed. Only relevant if using
+ * {@link CommitMode#PERIODIC_CONSUMER_SYNC} commit-mode.
+ */
+ @Builder.Default
+ private final Duration offsetCommitTimeout = Duration.ofSeconds(10);
+
+ /**
+ * The maximum number of messages to attempt to pass into the user functions.
+ *
+ * Batch sizes may sometimes be less than this size, but will never be more.
+ *
+ * The system will treat the messages as a set, so if an error is thrown by the user code, then all messages will be
+ * marked as failed and be retried (Note that when they are retried, there is no guarantee they will all be in the
+ * same batch again). So if you're going to process messages individually, then don't set a batch size.
+ *
+ * Otherwise, if you're going to process messages in sub sets from this batch, it's better to adjust the
+ * {@link ParallelConsumerOptions#getBatchSize()} to the actual desired size, and process them as a whole.
+ *
+ * Note that there is no relationship between the {@link ConsumerConfig} setting of
+ * {@link ConsumerConfig#MAX_POLL_RECORDS_CONFIG} and this configured batch size, as this library introduces a large
+ * layer of indirection between the managed consumer, and the managed queues we use.
+ *
+ * This indirection effectively disconnects the processing of messages from "polling" them from the managed client,
+ * as we do not wait to process them before calling poll again. We simply call poll as much as we need to, in order
+ * to keep our queues full of enough work to satisfy demand.
+ *
+ * If we have enough, then we actively manage pausing our subscription so that we can continue calling {@code poll}
+ * without pulling in even more messages.
+ *
+ *
+ * @see ParallelConsumerOptions#getBatchSize()
+ */
+ @Builder.Default
+ private final Integer batchSize = 1;
+
+ /**
+ * Configure the amount of delay a record experiences (time spent waiting in the work queue), before a warning is
+ * logged.
+ */
+ @Builder.Default
+ private final Duration thresholdForTimeSpendInQueueWarning = Duration.ofSeconds(10);
+
+ /**
+ * Whether batching is enabled, i.e. a {@link #getBatchSize()} greater than one has been configured.
+ */
+ public boolean isUsingBatching() {
+ final int configuredBatchSize = getBatchSize();
+ return configuredBatchSize > 1;
+ }
+
+ /**
+ * Maximum number of failure entries to retain for a record's retry history.
+ * NOTE(review): semantics inferred from the field name - confirm against usage elsewhere in the project.
+ */
+ @Builder.Default
+ private final int maxFailureHistory = 10;
+
+ /**
+ * Derives the desired number of records in flight from the configured concurrency and batch size.
+ *
+ * @return the combined target of the desired concurrency by the configured batch size
+ */
+ public int getTargetAmountOfRecordsInFlight() {
+ final int concurrency = getMaxConcurrency();
+ return getBatchSize() * concurrency;
+ }
+
+ /**
+ * Validates this options instance: a consumer must always be supplied, and transaction-related settings must be
+ * coherent with each other.
+ *
+ * @throws NullPointerException if no consumer was supplied
+ * @throws IllegalArgumentException if transaction-related settings are inconsistent
+ */
+ public void validate() {
+ Objects.requireNonNull(consumer, "A consumer must be supplied");
+
+ transactionsValidation();
+ }
+
+ /**
+ * Checks transaction-mode constraints and, as a side effect, switches {@link #commitInterval} to the transactional
+ * default when running in transactional commit mode and the user has not overridden the interval.
+ *
+ * @throws IllegalArgumentException if transactional commit mode is configured without a Producer, or if eager
+ * processing is enabled outside transactional commit mode
+ */
+ private void transactionsValidation() {
+ // Identity (==) comparison is deliberate here: it detects that the field still holds the exact default
+ // constant, i.e. the user never set a value. equals() would also match a user-supplied equal Duration.
+ boolean commitInternalHasNotBeenSet = getCommitInterval() == DEFAULT_COMMIT_INTERVAL;
+
+ if (isUsingTransactionCommitMode()) {
+ // transactions are performed through the Producer, so one must be supplied
+ if (producer == null) {
+ throw new IllegalArgumentException(msg("Cannot set {} to Transaction Producer mode ({}) without supplying a Producer instance",
+ Fields.commitMode,
+ commitMode));
+ }
+
+ // update commit frequency
+ if (commitInternalHasNotBeenSet) {
+ this.commitInterval = DEFAULT_COMMIT_INTERVAL_FOR_TRANSACTIONS;
+ }
+ }
+
+ // inverse
+ if (!isUsingTransactionCommitMode()) {
+ // eager processing during transaction commit only makes sense when transactions are in use
+ if (isAllowEagerProcessingDuringTransactionCommit()) {
+ throw new IllegalArgumentException(msg("Cannot set {} (eager record processing) when not using transactional commit mode ({}={}).",
+ Fields.allowEagerProcessingDuringTransactionCommit,
+ Fields.commitMode,
+ commitMode));
+ }
+ }
+ }
+
+ /**
+ * Whether the transactional producer commit mode is in use.
+ *
+ * @deprecated use {@link #isUsingTransactionCommitMode()}
+ */
+ @Deprecated
+ public boolean isUsingTransactionalProducer() {
+ return isUsingTransactionCommitMode();
+ }
+
+ /**
+ * Whether the {@link CommitMode#PERIODIC_TRANSACTIONAL_PRODUCER} commit mode is configured.
+ *
+ * @return true if offsets are committed through a transactional producer
+ * @see CommitMode#PERIODIC_TRANSACTIONAL_PRODUCER
+ */
+ public boolean isUsingTransactionCommitMode() {
+ // enum comparison with == is idiomatic, type-safe and null-safe (commitMode has a builder default, never null)
+ return commitMode == PERIODIC_TRANSACTIONAL_PRODUCER;
+ }
+
+ /**
+ * Whether a {@link Producer} instance has been configured in these options.
+ */
+ public boolean isProducerSupplied() {
+ return producer != null;
+ }
+
+ /**
+ * Timeout for shutting down execution pool during shutdown in DONT_DRAIN mode. Should be high enough to allow for
+ * inflight messages to finish processing, but low enough to kill any blocked thread to allow to rebalance in a
+ * timely manner, especially if shutting down on error.
+ *
+ * NOTE(review): declared {@code public}, unlike the other (private) option fields - confirm this is intentional.
+ */
+ @Builder.Default
+ public final Duration shutdownTimeout = Duration.ofSeconds(10);
+
+ /**
+ * Timeout for draining queue during shutdown in DRAIN mode. Should be high enough to allow for all queued messages
+ * to process.
+ *
+ * NOTE(review): declared {@code public}, unlike the other (private) option fields - confirm this is intentional.
+ */
+ @Builder.Default
+ public final Duration drainTimeout = Duration.ofSeconds(30);
+}
diff --git a/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/ParallelEoSStreamProcessor.java b/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/ParallelEoSStreamProcessor.java
new file mode 100644
index 000000000..8df85f171
--- /dev/null
+++ b/parallel-consumer-core/src/main/java/io/confluent/parallelconsumer/ParallelEoSStreamProcessor.java
@@ -0,0 +1,165 @@
+package io.confluent.parallelconsumer;
+
+/*-
+ * Copyright (C) 2020-2023 Confluent, Inc.
+ */
+
+import io.confluent.csid.utils.TimeUtils;
+import io.confluent.parallelconsumer.internal.AbstractParallelEoSStreamProcessor;
+import io.confluent.parallelconsumer.internal.InternalRuntimeException;
+import io.confluent.parallelconsumer.internal.PCModule;
+import io.confluent.parallelconsumer.internal.ProducerManager;
+import lombok.SneakyThrows;
+import lombok.extern.slf4j.Slf4j;
+import org.apache.kafka.clients.producer.ProducerRecord;
+import org.apache.kafka.clients.producer.RecordMetadata;
+import pl.tlinkowski.unij.api.UniLists;
+
+import java.util.ArrayList;
+import java.util.List;
+import java.util.concurrent.Future;
+import java.util.concurrent.TimeUnit;
+import java.util.concurrent.TimeoutException;
+import java.util.function.Consumer;
+import java.util.function.Function;
+
+import static io.confluent.csid.utils.StringUtils.msg;
+import static io.confluent.parallelconsumer.ParallelConsumerOptions.CommitMode.PERIODIC_TRANSACTIONAL_PRODUCER;
+import static io.confluent.parallelconsumer.internal.UserFunctions.carefullyRun;
+import static java.util.Optional.of;
+
+@Slf4j
+public class ParallelEoSStreamProcessor extends AbstractParallelEoSStreamProcessor
+ implements ParallelStreamProcessor {
+
+ /**
+ * Construct the AsyncConsumer by wrapping this passed in consumer and producer, which can be configured any which
+ * way as per normal.
+ *
+ * @param newOptions the consumer/producer configuration options
+ * @param module internal wiring module - NOTE(review): presumably used for dependency injection in tests, confirm
+ * @see ParallelConsumerOptions
+ */
+ public ParallelEoSStreamProcessor(ParallelConsumerOptions newOptions, PCModule module) {
+ super(newOptions, module);
+ }
+
+ /**
+ * Construct the processor with the given options.
+ *
+ * @param newOptions the consumer/producer configuration options
+ * @see ParallelConsumerOptions
+ */
+ public ParallelEoSStreamProcessor(ParallelConsumerOptions newOptions) {
+ super(newOptions);
+ }
+
+ @Override
+ public void poll(Consumer> usersVoidConsumptionFunction) {
+ Function, List