227
227
from airbyte_cdk .sources .declarative .models .declarative_component_schema import (
228
228
FlattenFields as FlattenFieldsModel ,
229
229
)
230
+ from airbyte_cdk .sources .declarative .models .declarative_component_schema import (
231
+ GroupingPartitionRouter as GroupingPartitionRouterModel ,
232
+ )
230
233
from airbyte_cdk .sources .declarative .models .declarative_component_schema import (
231
234
GzipDecoder as GzipDecoderModel ,
232
235
)
385
388
)
386
389
from airbyte_cdk .sources .declarative .partition_routers import (
387
390
CartesianProductStreamSlicer ,
391
+ GroupingPartitionRouter ,
388
392
ListPartitionRouter ,
389
393
PartitionRouter ,
390
394
SinglePartitionRouter ,
@@ -638,6 +642,7 @@ def _init_mappings(self) -> None:
638
642
UnlimitedCallRatePolicyModel : self .create_unlimited_call_rate_policy ,
639
643
RateModel : self .create_rate ,
640
644
HttpRequestRegexMatcherModel : self .create_http_request_matcher ,
645
+ GroupingPartitionRouterModel : self .create_grouping_partition_router ,
641
646
}
642
647
643
648
# Needed for the case where we need to perform a second parse on the fields of a custom component
@@ -1355,6 +1360,9 @@ def create_concurrent_cursor_from_perpartition_cursor(
1355
1360
)
1356
1361
stream_state = self .apply_stream_state_migrations (stream_state_migrations , stream_state )
1357
1362
1363
+ # Per-partition state doesn't make sense for GroupingPartitionRouter, so force the global state
1364
+ use_global_cursor = isinstance (partition_router , GroupingPartitionRouter )
1365
+
1358
1366
# Return the concurrent cursor and state converter
1359
1367
return ConcurrentPerPartitionCursor (
1360
1368
cursor_factory = cursor_factory ,
@@ -1366,6 +1374,7 @@ def create_concurrent_cursor_from_perpartition_cursor(
1366
1374
connector_state_manager = state_manager ,
1367
1375
connector_state_converter = connector_state_converter ,
1368
1376
cursor_field = cursor_field ,
1377
+ use_global_cursor = use_global_cursor ,
1369
1378
)
1370
1379
1371
1380
@staticmethod
@@ -3370,3 +3379,34 @@ def set_api_budget(self, component_definition: ComponentDefinition, config: Conf
3370
3379
self ._api_budget = self .create_component (
3371
3380
model_type = HTTPAPIBudgetModel , component_definition = component_definition , config = config
3372
3381
)
3382
+
3383
+ def create_grouping_partition_router (
3384
+ self , model : GroupingPartitionRouterModel , config : Config , ** kwargs : Any
3385
+ ) -> GroupingPartitionRouter :
3386
+ underlying_router = self ._create_component_from_model (
3387
+ model = model .underlying_partition_router , config = config
3388
+ )
3389
+ if model .group_size < 1 :
3390
+ raise ValueError (f"Group size must be greater than 0, got { model .group_size } " )
3391
+
3392
+ # Request options in underlying partition routers are not supported for GroupingPartitionRouter
3393
+ # because they are specific to individual partitions and cannot be aggregated or handled
3394
+ # when grouping, potentially leading to incorrect API calls. Any request customization
3395
+ # should be managed at the stream level through the requester's configuration.
3396
+ if isinstance (underlying_router , SubstreamPartitionRouter ):
3397
+ if any (
3398
+ parent_config .request_option
3399
+ for parent_config in underlying_router .parent_stream_configs
3400
+ ):
3401
+ raise ValueError ("Request options are not supported for GroupingPartitionRouter." )
3402
+
3403
+ if isinstance (underlying_router , ListPartitionRouter ):
3404
+ if underlying_router .request_option :
3405
+ raise ValueError ("Request options are not supported for GroupingPartitionRouter." )
3406
+
3407
+ return GroupingPartitionRouter (
3408
+ group_size = model .group_size ,
3409
+ underlying_partition_router = underlying_router ,
3410
+ deduplicate = model .deduplicate if model .deduplicate is not None else True ,
3411
+ config = config ,
3412
+ )
0 commit comments