
Commit e741888

Support benchmark for polling ingestion (#784)
Signed-off-by: xuxiong1 <[email protected]>
1 parent 3dc35c5 commit e741888

File tree

13 files changed: +879 -124 lines changed


create-notice.sh

+1
@@ -54,6 +54,7 @@ function main {
     add_license "ijson" "https://raw.githubusercontent.com/ICRAR/ijson/master/LICENSE.txt"
     add_license "google-resumable-media" "https://raw.githubusercontent.com/googleapis/google-resumable-media-python/master/LICENSE"
     add_license "google-auth" "https://raw.githubusercontent.com/googleapis/google-auth-library-python/master/LICENSE"
+    add_license "aiokafka" "https://raw.githubusercontent.com/aio-libs/aiokafka/master/LICENSE"
 
     # transitive dependencies
     # Jinja2 dependencies

osbenchmark/client.py

+18 -115
@@ -22,132 +22,19 @@
 # specific language governing permissions and limitations
 # under the License.
 
-import contextvars
 import logging
 import time
 
 import certifi
 import urllib3
 from urllib3.util.ssl_ import is_ipaddress
+from osbenchmark.kafka_client import KafkaMessageProducer
 
 from osbenchmark import exceptions, doc_link
+from osbenchmark.context import RequestContextHolder
 from osbenchmark.utils import console, convert
 
 
-class RequestContextManager:
-    """
-    Ensures that request context span the defined scope and allow nesting of request contexts with proper propagation.
-    This means that we can span a top-level request context, open sub-request contexts that can be used to measure
-    individual timings and still measure the proper total time on the top-level request context.
-    """
-    def __init__(self, request_context_holder):
-        self.ctx_holder = request_context_holder
-        self.ctx = None
-        self.token = None
-
-    async def __aenter__(self):
-        self.ctx, self.token = self.ctx_holder.init_request_context()
-        return self
-
-    @property
-    def request_start(self):
-        return self.ctx["request_start"]
-
-    @property
-    def request_end(self):
-        return max((value for value in self.ctx["request_end_list"] if value < self.client_request_end))
-
-    @property
-    def client_request_start(self):
-        return self.ctx["client_request_start"]
-
-    @property
-    def client_request_end(self):
-        return self.ctx["client_request_end"]
-
-    async def __aexit__(self, exc_type, exc_val, exc_tb):
-        # propagate earliest request start and most recent request end to parent
-        client_request_start = self.client_request_start
-        client_request_end = self.client_request_end
-        request_start = self.request_start
-        request_end = self.request_end
-        self.ctx_holder.restore_context(self.token)
-        # don't attempt to restore these values on the top-level context as they don't exist
-        if self.token.old_value != contextvars.Token.MISSING:
-            self.ctx_holder.update_request_start(request_start)
-            self.ctx_holder.update_request_end(request_end)
-            self.ctx_holder.update_client_request_start(client_request_start)
-            self.ctx_holder.update_client_request_end(client_request_end)
-        self.token = None
-        return False
-
-
-class RequestContextHolder:
-    """
-    Holds request context variables. This class is only meant to be used together with RequestContextManager.
-    """
-    request_context = contextvars.ContextVar("benchmark_request_context")
-
-    def new_request_context(self):
-        return RequestContextManager(self)
-
-    @classmethod
-    def init_request_context(cls):
-        ctx = {}
-        token = cls.request_context.set(ctx)
-        return ctx, token
-
-    @classmethod
-    def restore_context(cls, token):
-        cls.request_context.reset(token)
-
-    @classmethod
-    def update_request_start(cls, new_request_start):
-        meta = cls.request_context.get()
-        # this can happen if multiple requests are sent on the wire for one logical request (e.g. scrolls)
-        if "request_start" not in meta and "client_request_start" in meta:
-            meta["request_start"] = new_request_start
-
-    @classmethod
-    def update_request_end(cls, new_request_end):
-        meta = cls.request_context.get()
-        if "request_end_list" not in meta:
-            meta["request_end_list"] = []
-        meta["request_end_list"].append(new_request_end)
-
-    @classmethod
-    def update_client_request_start(cls, new_client_request_start):
-        meta = cls.request_context.get()
-        if "client_request_start" not in meta:
-            meta["client_request_start"] = new_client_request_start
-
-    @classmethod
-    def update_client_request_end(cls, new_client_request_end):
-        meta = cls.request_context.get()
-        meta["client_request_end"] = new_client_request_end
-
-    @classmethod
-    def on_client_request_start(cls):
-        cls.update_client_request_start(time.perf_counter())
-
-    @classmethod
-    def on_client_request_end(cls):
-        cls.update_client_request_end(time.perf_counter())
-
-    @classmethod
-    def on_request_start(cls):
-        cls.update_request_start(time.perf_counter())
-
-    @classmethod
-    def on_request_end(cls):
-        cls.update_request_end(time.perf_counter())
-
-    @classmethod
-    def return_raw_response(cls):
-        ctx = cls.request_context.get()
-        ctx["raw_response"] = True
-
 class OsClientFactory:
     """
     Abstracts how the OpenSearch client is created. Intended for testing.
@@ -430,3 +317,19 @@ def wait_for_rest_layer(opensearch, max_attempts=40):
                 logger.warning("Got unexpected status code [%s] on attempt [%s].", e.status_code, attempt)
                 raise e
     return False
+
+
+class MessageProducerFactory:
+    @staticmethod
+    async def create(params):
+        """
+        Creates and returns a message producer based on the ingestion source.
+        Currently supports Kafka. Ingestion source should be a dict like:
+        {'type': 'kafka', 'param': {'topic': 'test', 'bootstrap-servers': 'localhost:34803'}}
+        """
+        ingestion_source = params.get("ingestion-source", {})
+        producer_type = ingestion_source.get("type", "kafka").lower()
+        if producer_type == "kafka":
+            return await KafkaMessageProducer.create(params)
+        else:
+            raise ValueError(f"Unsupported ingestion source type: {producer_type}")
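
A minimal usage sketch (not part of this diff) of the new factory. It assumes a Kafka broker reachable at localhost:9092 and an existing topic named "test"; the broker address, topic name, key, and payload are placeholders.

import asyncio

from osbenchmark.client import MessageProducerFactory


async def main():
    # shape of the workload params expected by MessageProducerFactory.create()
    params = {
        "ingestion-source": {
            "type": "kafka",
            "param": {"topic": "test", "bootstrap-servers": "localhost:9092"}
        }
    }
    producer = await MessageProducerFactory.create(params)  # starts an AIOKafkaProducer
    try:
        # key and value must be strings: the producer is configured with str.encode serializers
        await producer.send_message('{"field": "value"}', key="doc-1")
    finally:
        await producer.stop()


asyncio.run(main())

Any other "type" value raises ValueError, so unsupported ingestion sources fail fast before a connection is attempted.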

osbenchmark/context.py

+140
@@ -0,0 +1,140 @@
+# SPDX-License-Identifier: Apache-2.0
+#
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+# Licensed to Elasticsearch B.V. under one or more contributor
+# license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright
+# ownership. Elasticsearch B.V. licenses this file to you under
+# the Apache License, Version 2.0 (the "License"); you may
+# not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+import contextvars
+import time
+
+
+class RequestContextManager:
+    """
+    Ensures that request context span the defined scope and allow nesting of request contexts with proper propagation.
+    This means that we can span a top-level request context, open sub-request contexts that can be used to measure
+    individual timings and still measure the proper total time on the top-level request context.
+    """
+    def __init__(self, request_context_holder):
+        self.ctx_holder = request_context_holder
+        self.ctx = None
+        self.token = None
+
+    async def __aenter__(self):
+        self.ctx, self.token = self.ctx_holder.init_request_context()
+        return self
+
+    @property
+    def request_start(self):
+        return self.ctx["request_start"]
+
+    @property
+    def request_end(self):
+        return max((value for value in self.ctx["request_end_list"] if value < self.client_request_end))
+
+    @property
+    def client_request_start(self):
+        return self.ctx["client_request_start"]
+
+    @property
+    def client_request_end(self):
+        return self.ctx["client_request_end"]
+
+    async def __aexit__(self, exc_type, exc_val, exc_tb):
+        # propagate earliest request start and most recent request end to parent
+        client_request_start = self.client_request_start
+        client_request_end = self.client_request_end
+        request_start = self.request_start
+        request_end = self.request_end
+        self.ctx_holder.restore_context(self.token)
+        # don't attempt to restore these values on the top-level context as they don't exist
+        if self.token.old_value != contextvars.Token.MISSING:
+            self.ctx_holder.update_request_start(request_start)
+            self.ctx_holder.update_request_end(request_end)
+            self.ctx_holder.update_client_request_start(client_request_start)
+            self.ctx_holder.update_client_request_end(client_request_end)
+        self.token = None
+        return False
+
+
+class RequestContextHolder:
+    """
+    Holds request context variables. This class is only meant to be used together with RequestContextManager.
+    """
+    request_context = contextvars.ContextVar("benchmark_request_context")
+
+    def new_request_context(self):
+        return RequestContextManager(self)
+
+    @classmethod
+    def init_request_context(cls):
+        ctx = {}
+        token = cls.request_context.set(ctx)
+        return ctx, token
+
+    @classmethod
+    def restore_context(cls, token):
+        cls.request_context.reset(token)
+
+    @classmethod
+    def update_request_start(cls, new_request_start):
+        meta = cls.request_context.get()
+        # this can happen if multiple requests are sent on the wire for one logical request (e.g. scrolls)
+        if "request_start" not in meta and "client_request_start" in meta:
+            meta["request_start"] = new_request_start
+
+    @classmethod
+    def update_request_end(cls, new_request_end):
+        meta = cls.request_context.get()
+        if "request_end_list" not in meta:
+            meta["request_end_list"] = []
+        meta["request_end_list"].append(new_request_end)
+
+    @classmethod
+    def update_client_request_start(cls, new_client_request_start):
+        meta = cls.request_context.get()
+        if "client_request_start" not in meta:
+            meta["client_request_start"] = new_client_request_start
+
+    @classmethod
+    def update_client_request_end(cls, new_client_request_end):
+        meta = cls.request_context.get()
+        meta["client_request_end"] = new_client_request_end
+
+    @classmethod
+    def on_client_request_start(cls):
+        cls.update_client_request_start(time.perf_counter())
+
+    @classmethod
+    def on_client_request_end(cls):
+        cls.update_client_request_end(time.perf_counter())
+
+    @classmethod
+    def on_request_start(cls):
+        cls.update_request_start(time.perf_counter())
+
+    @classmethod
+    def on_request_end(cls):
+        cls.update_request_end(time.perf_counter())
+
+    @classmethod
+    def return_raw_response(cls):
+        ctx = cls.request_context.get()
+        ctx["raw_response"] = True

osbenchmark/kafka_client.py

+70
@@ -0,0 +1,70 @@
+# SPDX-License-Identifier: Apache-2.0
+#
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+# Licensed to Elasticsearch B.V. under one or more contributor
+# license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright
+# ownership. Elasticsearch B.V. licenses this file to you under
+# the Apache License, Version 2.0 (the "License"); you may
+# not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+from aiokafka import AIOKafkaProducer
+from osbenchmark.context import RequestContextHolder
+
+class KafkaMessageProducer:
+    def __init__(self, producer, topic):
+        self._producer = producer
+        self._topic = topic
+        self._ctx_holder = RequestContextHolder()
+
+    @classmethod
+    async def create(cls, params):
+        """
+        Creates a Kafka producer based on parameters in the ingestion source.
+        """
+
+        ingestion_source = params.get("ingestion-source", {})
+        kafka_params = ingestion_source.get("param", {})
+        topic = kafka_params.get("topic")
+        if not topic:
+            raise ValueError("No 'topic' specified in ingestion source parameters.")
+        bootstrap_servers = kafka_params.get("bootstrap-servers", "")
+
+        producer = AIOKafkaProducer(
+            bootstrap_servers=bootstrap_servers,
+            key_serializer=str.encode,
+            value_serializer=str.encode
+        )
+        await producer.start()
+        return cls(producer, topic)
+
+    async def send_message(self, message, key=""):
+        """
+        Sends a message to the producer's topic.
+        """
+        await self._producer.send_and_wait(self._topic, message, key=key)
+
+    async def stop(self):
+        """
+        Stops the underlying producer.
+        """
+        await self._producer.stop()
+
+    @property
+    def new_request_context(self):
+        # Delegate to the internal holder
+        return self._ctx_holder.new_request_context
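
A hedged usage sketch (not part of the commit) that drives KafkaMessageProducer directly and times a single send through the delegated request context. It assumes a reachable broker at localhost:9092 and an existing topic "test"; broker address, topic, key, and payload are placeholders.

import asyncio

from osbenchmark.context import RequestContextHolder
from osbenchmark.kafka_client import KafkaMessageProducer


async def main():
    params = {
        "ingestion-source": {
            "type": "kafka",
            "param": {"topic": "test", "bootstrap-servers": "localhost:9092"}
        }
    }
    producer = await KafkaMessageProducer.create(params)
    try:
        # producer.new_request_context delegates to the internal RequestContextHolder,
        # whose update methods are classmethods, so they can be called on the class itself
        async with producer.new_request_context() as ctx:
            RequestContextHolder.on_client_request_start()
            RequestContextHolder.on_request_start()
            await producer.send_message('{"field": "value"}', key="doc-1")
            RequestContextHolder.on_request_end()
            RequestContextHolder.on_client_request_end()
            print("client-side latency:", ctx.client_request_end - ctx.client_request_start)
    finally:
        await producer.stop()


asyncio.run(main())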
