Commit 8ec79c6 (1 parent: beda345)
Author: Alex Wang

    examples: add large scale map example

4 files changed: +111 −7 lines

examples/examples-catalog.json

Lines changed: 11 additions & 0 deletions

@@ -122,6 +122,17 @@
       },
       "path": "./src/map/map_operations.py"
     },
+    {
+      "name": "Map Large Scale",
+      "description": "Processing collections using map-like durable operations at large scale",
+      "handler": "map_with_large_scale.handler",
+      "integration": true,
+      "durableConfig": {
+        "RetentionPeriodInDays": 7,
+        "ExecutionTimeout": 300
+      },
+      "path": "./src/map/map_with_large_scale.py"
+    },
     {
       "name": "Block Example",
       "description": "Nested child contexts demonstrating block operations",

examples/src/map/map_with_large_scale.py

Lines changed: 63 additions & 0 deletions

@@ -0,0 +1,63 @@
+"""Test map with 50 iterations, each returning 100KB data."""
+
+from typing import Any
+
+from aws_durable_execution_sdk_python.config import MapConfig
+from aws_durable_execution_sdk_python.context import DurableContext
+from aws_durable_execution_sdk_python.execution import durable_execution
+from aws_durable_execution_sdk_python.config import Duration
+
+
+def generate_large_string(size_in_kb: int) -> str:
+    """Generate a string of approximately the specified size in KB."""
+    return "A" * 1024 * size_in_kb
+
+@durable_execution
+def handler(_event: Any, context: DurableContext) -> dict[str, Any]:
+    """Handler demonstrating large scale map with substantial data."""
+    # Create array of 50 items (more manageable for testing)
+    items = list(range(1, 51))  # 1 to 50
+
+    config = MapConfig(max_concurrency=10)  # Process 10 items concurrently
+    data = generate_large_string(100)
+    results = context.map(
+        inputs=items,
+        func=lambda ctx, item, index, _: ctx.step(
+            lambda _: {
+                "itemId": item,
+                "index": index,
+                "dataSize": len(data),
+                "data": data,
+                "processed": True,
+            }
+        ),
+        name="large-scale-map",
+        config=config,
+    )
+
+    context.wait(Duration.from_seconds(1), name="wait1")
+
+    # Process results immediately after map operation
+    # Note: After wait operations, the BatchResult may be summarized
+    final_results = results.get_results()
+    total_data_size = sum(result["dataSize"] for result in final_results)
+    all_items_processed = all(result["processed"] for result in final_results)
+
+    total_size_in_mb = round(total_data_size / (1024 * 1024))
+
+    summary = {
+        "itemsProcessed": results.success_count,
+        "totalDataSizeMB": total_size_in_mb,
+        "totalDataSizeBytes": total_data_size,
+        "maxConcurrency": 10,
+        "averageItemSize": round(total_data_size / results.success_count),
+        "allItemsProcessed": all_items_processed,
+    }
+
+    context.wait(Duration.from_seconds(1), name="wait2")
+
+    return {
+        "success": True,
+        "message": "Successfully processed 50 items with substantial data using map",
+        "summary": summary,
+    }
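
Because every one of the 50 items carries the same 100 KB payload, the summary fields are fully predictable. A back-of-the-envelope check in plain Python (no SDK involved), assuming all 50 steps succeed:

    item_bytes = 1024 * 100        # one "A" * 1024 * 100 payload: 102,400 bytes
    total_bytes = 50 * item_bytes  # 5,120,000 bytes across the whole map
    total_mb = round(total_bytes / (1024 * 1024))

    assert total_bytes == 5_120_000      # expected "totalDataSizeBytes"
    assert total_mb == 5                 # ~4.88 MiB rounds to 5, the "totalDataSizeMB" value
    assert total_bytes // 50 == 102_400  # expected "averageItemSize"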

examples/src/run_in_child_context/run_in_child_context_large_data.py

Lines changed: 1 addition & 7 deletions
@@ -12,13 +12,7 @@
 
 def generate_large_string(size_in_kb: int) -> str:
     """Generate a string of approximately the specified size in KB."""
-    target_size = size_in_kb * 1024  # Convert KB to bytes
-    base_string = "A" * 1000  # 1KB string
-    repetitions = target_size // 1000
-    remainder = target_size % 1000
-
-    return base_string * repetitions + "A" * remainder
-
+    return "A" * 1024 * size_in_kb
 
 @durable_with_child_context
 def large_data_processor(child_context: DurableContext) -> dict[str, Any]:
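
The refactor is behavior-preserving: since the filler is a single repeated character, the chunked construction and the one-liner produce byte-identical strings. A quick equivalence check in plain Python, with both implementations inlined from the diff:

    def old_impl(size_in_kb: int) -> str:
        # The removed implementation, reproduced for comparison.
        target_size = size_in_kb * 1024
        return "A" * 1000 * (target_size // 1000) + "A" * (target_size % 1000)

    def new_impl(size_in_kb: int) -> str:
        return "A" * 1024 * size_in_kb

    # Byte-identical for any non-negative size, including the 100 KB case used by the examples.
    assert all(old_impl(n) == new_impl(n) for n in (0, 1, 100, 1024))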

Lines changed: 36 additions & 0 deletions

@@ -0,0 +1,36 @@
+"""Tests for map_large_scale."""
+
+import pytest
+from aws_durable_execution_sdk_python.execution import InvocationStatus
+
+from src.map import map_with_large_scale
+from test.conftest import deserialize_operation_payload
+
+
+@pytest.mark.example
+@pytest.mark.durable_execution(
+    handler=map_with_large_scale.handler,
+    lambda_function_name="map large scale",
+)
+def test_handle_50_items_with_100kb_each_using_map(durable_runner):
+    """Test handling 50 items with 100KB each using map."""
+    with durable_runner:
+        result = durable_runner.run(input=None, timeout=60)
+
+    result_data = deserialize_operation_payload(result.result)
+
+    # Verify the execution succeeded
+    assert result.status is InvocationStatus.SUCCEEDED
+    assert result_data["success"] is True
+
+    # Verify the expected number of items were processed (50 items)
+    assert result_data["summary"]["itemsProcessed"] == 50
+    assert result_data["summary"]["allItemsProcessed"] is True
+
+    # Verify data size expectations (~5MB total from 50 items × 100KB each)
+    assert result_data["summary"]["totalDataSizeMB"] > 4  # Should be ~5MB
+    assert result_data["summary"]["totalDataSizeMB"] < 6
+    assert result_data["summary"]["totalDataSizeBytes"] > 5000000  # ~5MB
+    assert result_data["summary"]["averageItemSize"] > 100000  # ~100KB per item
+    assert result_data["summary"]["maxConcurrency"] == 10
