upstash
diff --git a/qstash/asyncio/message.py b/qstash/asyncio/message.py
Lines changed: 10 additions & 0 deletions
diff --git a/qstash/asyncio/schedule.py b/qstash/asyncio/schedule.py
Lines changed: 9 additions & 0 deletions
diff --git a/qstash/dlq.py b/qstash/dlq.py
Lines changed: 3 additions & 0 deletions
diff --git a/qstash/message.py b/qstash/message.py
Lines changed: 64 additions & 0 deletions
@@ -5,6 +5,7 @@
 from qstash.http import HttpMethod
 from qstash.message import (
     ApiT,
+    FlowControl,
     BatchJsonRequest,
     BatchRequest,
     BatchResponse,
@@ -47,6 +48,7 @@ async def publish(
         deduplication_id: Optional[str] = None,
         content_based_deduplication: Optional[bool] = None,
         timeout: Optional[Union[str, int]] = None,
+        flow_control: Optional[FlowControl] = None,
     ) -> Union[PublishResponse, List[PublishUrlGroupResponse]]:
         """
         Publishes a message to QStash.
@@ -84,6 +86,8 @@ async def publish(
             When a timeout is specified, it will be used instead of the maximum timeout
             value permitted by the QStash plan. It is useful in scenarios, where a message
             should be delivered with a shorter timeout.
+        :param flow_control: Settings for controlling the number of active requests and
+            number of requests per second with the same key.
         """
         headers = headers or {}
         destination = get_destination(
@@ -105,6 +109,7 @@ async def publish(
             deduplication_id=deduplication_id,
             content_based_deduplication=content_based_deduplication,
             timeout=timeout,
+            flow_control=flow_control,
         )
 
         response = await self._http.request(
@@ -133,6 +138,7 @@ async def publish_json(
         deduplication_id: Optional[str] = None,
         content_based_deduplication: Optional[bool] = None,
         timeout: Optional[Union[str, int]] = None,
+        flow_control: Optional[FlowControl] = None,
     ) -> Union[PublishResponse, List[PublishUrlGroupResponse]]:
         """
         Publish a message to QStash, automatically serializing the
@@ -171,6 +177,8 @@ async def publish_json(
             When a timeout is specified, it will be used instead of the maximum timeout
             value permitted by the QStash plan. It is useful in scenarios, where a message
             should be delivered with a shorter timeout.
+        :param flow_control: Settings for controlling the number of active requests and
+            number of requests per second with the same key.
         """
         return await self.publish(
             url=url,
@@ -188,6 +196,7 @@ async def publish_json(
             deduplication_id=deduplication_id,
             content_based_deduplication=content_based_deduplication,
             timeout=timeout,
+            flow_control=flow_control,
         )
 
     async def enqueue(
@@ -260,6 +269,7 @@ async def enqueue(
             deduplication_id=deduplication_id,
             content_based_deduplication=content_based_deduplication,
             timeout=timeout,
+            flow_control=None,
         )
 
         response = await self._http.request(
 
@@ -8,6 +8,7 @@
     parse_schedule_response,
     prepare_schedule_headers,
 )
+from qstash.message import FlowControl
 
 
 class AsyncScheduleApi:
@@ -29,6 +30,7 @@ async def create(
         delay: Optional[Union[str, int]] = None,
         timeout: Optional[Union[str, int]] = None,
         schedule_id: Optional[str] = None,
+        flow_control: Optional[FlowControl] = None,
     ) -> str:
         """
         Creates a schedule to send messages periodically.
@@ -56,6 +58,8 @@ async def create(
             value permitted by the QStash plan. It is useful in scenarios, where a message
             should be delivered with a shorter timeout.
         :param schedule_id: Schedule id to use. Can be used to update the settings of an existing schedule.
+        :param flow_control: Settings for controlling the number of active requests and
+            number of requests per second with the same key.
         """
         req_headers = prepare_schedule_headers(
             cron=cron,
@@ -68,6 +72,7 @@ async def create(
             delay=delay,
             timeout=timeout,
             schedule_id=schedule_id,
+            flow_control=flow_control,
         )
 
         response = await self._http.request(
@@ -93,6 +98,7 @@ async def create_json(
         delay: Optional[Union[str, int]] = None,
         timeout: Optional[Union[str, int]] = None,
         schedule_id: Optional[str] = None,
+        flow_control: Optional[FlowControl] = None,
     ) -> str:
         """
         Creates a schedule to send messages periodically, automatically serializing the
@@ -121,6 +127,8 @@ async def create_json(
             value permitted by the QStash plan. It is useful in scenarios, where a message
             should be delivered with a shorter timeout.
         :param schedule_id: Schedule id to use. Can be used to update the settings of an existing schedule.
+        :param flow_control: Settings for controlling the number of active requests and
+            number of requests per second with the same key.
         """
         return await self.create(
             destination=destination,
@@ -135,6 +143,7 @@ async def create_json(
             delay=delay,
             timeout=timeout,
             schedule_id=schedule_id,
+            flow_control=flow_control,
         )
 
     async def get(self, schedule_id: str) -> Schedule:
 
@@ -101,6 +101,9 @@ def parse_dlq_message_response(
         response_headers=response.get("responseHeader"),
         response_body=response.get("responseBody"),
         response_body_base64=response.get("responseBodyBase64"),
+        flow_control_key=response.get("flowControlKey"),
+        parallelism=response.get("parallelism"),
+        rate_per_second=response.get("ratePerSecond"),
     )
 
 
 
@@ -28,6 +28,17 @@ class LlmApi(TypedDict):
 ApiT = LlmApi  # In the future, this can be union of different API types
 
 
+class FlowControl(TypedDict, total=False):  # total=False: every key may be omitted as far as the type checker is concerned
+    key: str  # prepare_headers emits no flow-control headers unless this key is present
+    """flow control key"""
+
+    parallelism: Optional[int]  # NOTE(review): prepare_headers tests key presence only, so an explicit None is sent as "parallelism=None"
+    """number of requests which can be active with the same key"""
+
+    rate_per_second: Optional[int]  # sent as "rate=<value>" in Upstash-Flow-Control-Value; same presence-only check as parallelism
+    """number of requests to activate per second with the same key"""
+
+
 @dataclasses.dataclass
 class PublishResponse:
     message_id: str
@@ -168,6 +179,12 @@ class BatchRequest(TypedDict, total=False):
     an integer, which will be interpreted as timeout in seconds.
     """
 
+    flow_control: Optional[FlowControl]
+    """
+    Settings for controlling the number of active requests and number of requests
+    per second with the same key.
+    """
+
 
 class BatchJsonRequest(TypedDict, total=False):
     queue: str
@@ -254,6 +271,12 @@ class BatchJsonRequest(TypedDict, total=False):
     set according to the LLM provider.
     """
 
+    flow_control: Optional[FlowControl]
+    """
+    Settings for controlling the number of active requests and number of requests
+    per second with the same key.
+    """
+
 
 @dataclasses.dataclass
 class Message:
@@ -317,6 +340,15 @@ class Message:
     caller_ip: Optional[str]
     """IP address of the publisher of this message."""
 
+    flow_control_key: Optional[str]
+    """flow control key"""
+
+    parallelism: Optional[int]
+    """number of requests which can be active with the same flow control key"""
+
+    rate_per_second: Optional[int]
+    """number of requests to activate per second with the same flow control key"""
+
 
 def get_destination(
     *,
@@ -367,6 +399,7 @@ def prepare_headers(
     deduplication_id: Optional[str],
     content_based_deduplication: Optional[bool],
     timeout: Optional[Union[str, int]],
+    flow_control: Optional[FlowControl],
 ) -> Dict[str, str]:
     h = {}
 
@@ -413,6 +446,21 @@ def prepare_headers(
         else:
             h["Upstash-Timeout"] = timeout
 
+    if flow_control and "key" in flow_control:
+        control_values = []
+        if "parallelism" in flow_control:
+            control_values.append(f"parallelism={flow_control['parallelism']}")
+        if "rate_per_second" in flow_control:
+            control_values.append(f"rate={flow_control['rate_per_second']}")
+
+        if not control_values:
+            raise QStashError(
+                "Provide at least one of parallelism or rate_per_second for flow_control"
+            )
+
+        h["Upstash-Flow-Control-Key"] = flow_control["key"]
+        h["Upstash-Flow-Control-Value"] = ", ".join(control_values)
+
     return h
 
 
@@ -484,6 +532,7 @@ def prepare_batch_message_body(messages: List[BatchRequest]) -> str:
             deduplication_id=msg.get("deduplication_id"),
             content_based_deduplication=msg.get("content_based_deduplication"),
             timeout=msg.get("timeout"),
+            flow_control=msg.get("flow_control"),
         )
 
         batch_messages.append(
@@ -581,6 +630,9 @@ def convert_to_batch_messages(
         if "timeout" in msg:
             batch_msg["timeout"] = msg["timeout"]
 
+        if "flow_control" in msg:
+            batch_msg["flow_control"] = msg["flow_control"]
+
         batch_messages.append(batch_msg)
 
     return batch_messages
@@ -605,6 +657,9 @@ def parse_message_response(response: Dict[str, Any]) -> Message:
         failure_callback=response.get("failureCallback"),
         schedule_id=response.get("scheduleId"),
         caller_ip=response.get("callerIP"),
+        flow_control_key=response.get("flowControlKey"),
+        parallelism=response.get("parallelism"),
+        rate_per_second=response.get("rate"),
     )
 
 
@@ -630,6 +685,7 @@ def publish(
         deduplication_id: Optional[str] = None,
         content_based_deduplication: Optional[bool] = None,
         timeout: Optional[Union[str, int]] = None,
+        flow_control: Optional[FlowControl] = None,
     ) -> Union[PublishResponse, List[PublishUrlGroupResponse]]:
         """
         Publishes a message to QStash.
@@ -667,6 +723,8 @@ def publish(
             When a timeout is specified, it will be used instead of the maximum timeout
             value permitted by the QStash plan. It is useful in scenarios, where a message
             should be delivered with a shorter timeout.
+        :param flow_control: Settings for controlling the number of active requests and
+            number of requests per second with the same key.
         """
         headers = headers or {}
         destination = get_destination(
@@ -688,6 +746,7 @@ def publish(
             deduplication_id=deduplication_id,
             content_based_deduplication=content_based_deduplication,
             timeout=timeout,
+            flow_control=flow_control,
         )
 
         response = self._http.request(
@@ -716,6 +775,7 @@ def publish_json(
         deduplication_id: Optional[str] = None,
         content_based_deduplication: Optional[bool] = None,
         timeout: Optional[Union[str, int]] = None,
+        flow_control: Optional[FlowControl] = None,
     ) -> Union[PublishResponse, List[PublishUrlGroupResponse]]:
         """
         Publish a message to QStash, automatically serializing the
@@ -754,6 +814,8 @@ def publish_json(
             When a timeout is specified, it will be used instead of the maximum timeout
             value permitted by the QStash plan. It is useful in scenarios, where a message
             should be delivered with a shorter timeout.
+        :param flow_control: Settings for controlling the number of active requests and
+            number of requests per second with the same key.
         """
         return self.publish(
             url=url,
@@ -771,6 +833,7 @@ def publish_json(
             deduplication_id=deduplication_id,
             content_based_deduplication=content_based_deduplication,
             timeout=timeout,
+            flow_control=flow_control,
         )
 
     def enqueue(
@@ -843,6 +906,7 @@ def enqueue(
             deduplication_id=deduplication_id,
             content_based_deduplication=content_based_deduplication,
             timeout=timeout,
+            flow_control=None,
         )
 
         response = self._http.request(
Original file line number	Diff line number	Diff line change
`@@ -101,6 +101,9 @@ def parse_dlq_message_response(`
`101`	`101`	`response_headers=response.get("responseHeader"),`
`102`	`102`	`response_body=response.get("responseBody"),`
`103`	`103`	`response_body_base64=response.get("responseBodyBase64"),`
	`104`	`+ flow_control_key=response.get("flowControlKey"),`
	`105`	`+ parallelism=response.get("parallelism"),`
	`106`	`+ rate_per_second=response.get("ratePerSecond"),`
`104`	`107`	`)`
`105`	`108`
`106`	`109`