netboxlabs
diff --git a/‎README.md‎
Lines changed: 164 additions & 0 deletions b/‎README.md‎
Lines changed: 164 additions & 0 deletions
diff --git a/‎diode/chunking.go‎
Lines changed: 123 additions & 0 deletions b/‎diode/chunking.go‎
Lines changed: 123 additions & 0 deletions
@@ -286,6 +286,170 @@ Request-level metadata is included in the `IngestRequest` and can be useful for:
 - Debugging and auditing data imports
 - Adding contextual information for downstream processing
 
+### Message chunking
+
+When ingesting large datasets, you may encounter gRPC message size limits (typically 4 MB). The SDK provides automatic message chunking to split large entity lists into size-appropriate chunks that stay within these limits.
+
+#### Automatic chunking
+
+Enable chunking by using `WithChunking()` when calling `Ingest`:
+
+```go
+package main
+
+import (
+	"context"
+	"fmt"
+	"log"
+
+	"github.com/netboxlabs/diode-sdk-go/diode"
+)
+
+func main() {
+	client, err := diode.NewClient(
+		"grpc://localhost:8080/diode",
+		"example-app",
+		"0.1.0",
+		diode.WithClientID("YOUR_CLIENT_ID"),
+		diode.WithClientSecret("YOUR_CLIENT_SECRET"),
+	)
+	if err != nil {
+		log.Fatal(err)
+	}
+
+	// Create a large number of entities
+	entities := make([]diode.Entity, 0)
+	for i := 0; i < 10000; i++ {
+		entities = append(entities, &diode.Device{
+			Name: diode.String(fmt.Sprintf("Device %d", i)),
+			Site: &diode.Site{
+				Name: diode.String("Site ABC"),
+			},
+			DeviceType: &diode.DeviceType{
+				Model: diode.String("Device Type A"),
+			},
+			Role: &diode.DeviceRole{
+				Name: diode.String("Role ABC"),
+			},
+		})
+	}
+
+	// Use chunking with default 3.0 MB chunk size
+	resp, err := client.Ingest(
+		context.Background(),
+		entities,
+		diode.WithChunking(0), // 0 = use default
+	)
+	if err != nil {
+		log.Fatal(err)
+	}
+	log.Printf("Success\n")
+}
+```
+
+#### Custom chunk size
+
+You can specify a custom chunk size in megabytes:
+
+```go
+// Use 3.5 MB chunks instead of the default 3.0 MB
+resp, err := client.Ingest(
+	context.Background(),
+	entities,
+	diode.WithChunking(3.5),
+)
+```
+
+#### Manual chunking
+
+For more control, you can manually chunk entities using the `CreateMessageChunks` function:
+
+```go
+package main
+
+import (
+	"context"
+	"log"
+
+	"github.com/netboxlabs/diode-sdk-go/diode"
+	pb "github.com/netboxlabs/diode-sdk-go/diode/v1/diodepb"
+)
+
+func main() {
+	client, err := diode.NewClient(
+		"grpc://localhost:8080/diode",
+		"example-app",
+		"0.1.0",
+		diode.WithClientID("YOUR_CLIENT_ID"),
+		diode.WithClientSecret("YOUR_CLIENT_SECRET"),
+	)
+	if err != nil {
+		log.Fatal(err)
+	}
+
+	// Create entities
+	entities := []diode.Entity{
+		// ... many entities
+	}
+
+	// Convert to proto entities. The result has exactly one element per
+	// input entity, so allocate the full capacity up front.
+	protoEntities := make([]*pb.Entity, 0, len(entities))
+	for _, entity := range entities {
+		protoEntities = append(protoEntities, entity.ConvertToProtoEntity())
+	}
+
+	// Manually chunk with custom size (3.5 MB)
+	chunks := diode.CreateMessageChunks(protoEntities, 3.5)
+
+	log.Printf("Split %d entities into %d chunks\n", len(protoEntities), len(chunks))
+
+	// Ingest each chunk in order; stop at the first transport-level failure.
+	for i, chunk := range chunks {
+		log.Printf("Ingesting chunk %d of %d (%d entities)\n", i+1, len(chunks), len(chunk))
+		resp, err := client.IngestProto(context.Background(), chunk)
+		if err != nil {
+			log.Fatalf("Failed to ingest chunk %d: %v\n", i+1, err)
+		}
+		// Errors reported in the response are logged but do not abort the run.
+		if resp != nil && resp.Errors != nil {
+			log.Printf("Chunk %d errors: %v\n", i+1, resp.Errors)
+		}
+	}
+	log.Printf("Successfully ingested all chunks\n")
+}
+```
+
+#### Estimating message size
+
+You can estimate the size of your entities before chunking:
+
+```go
+import pb "github.com/netboxlabs/diode-sdk-go/diode/v1/diodepb"
+
+// One proto entity per input entity, so allocate the full capacity up front.
+protoEntities := make([]*pb.Entity, 0, len(entities))
+for _, entity := range entities {
+	protoEntities = append(protoEntities, entity.ConvertToProtoEntity())
+}
+
+sizeBytes := diode.EstimateMessageSize(protoEntities)
+sizeMB := float64(sizeBytes) / (1024 * 1024)
+log.Printf("Estimated message size: %.2f MB\n", sizeMB)
+
+// Compare against the SDK's default chunk size rather than a hard-coded value.
+if sizeMB > diode.DefaultMaxChunkSizeMB {
+	log.Printf("Message exceeds %.1f MB, chunking recommended\n", diode.DefaultMaxChunkSizeMB)
+}
+```
+
+#### How chunking works
+
+The chunking algorithm uses greedy bin-packing to efficiently group entities:
+
+1. It accumulates entities until adding the next one would exceed the size limit
+2. When the limit would be exceeded, it starts a new chunk (an entity that is larger than the limit on its own is placed in a chunk by itself)
+3. Each chunk's size accounting includes the base overhead of an `IngestRequest` protobuf message
+4. Entity order is preserved across chunks
+
+The default chunk size of 3.0 MB provides a safe margin below the gRPC 4 MB message size limit, accounting for protobuf serialization overhead and network protocol overhead.
+
 ### TLS verification and certificates
 
 TLS verification is controlled by the target URL scheme:
 
@@ -0,0 +1,123 @@
+package diode
+
+import (
+	"google.golang.org/protobuf/proto"
+
+	pb "github.com/netboxlabs/diode-sdk-go/diode/v1/diodepb"
+)
+
+const (
+	// DefaultMaxChunkSizeMB is the default maximum chunk size in megabytes.
+	// This provides a safe margin below the gRPC 4 MB message size limit,
+	// accounting for protobuf serialization overhead.
+	DefaultMaxChunkSizeMB = 3.0
+)
+
+// CreateMessageChunks creates size-aware chunks from entities using greedy bin-packing.
+//
+// This function chunks entities to ensure each chunk stays under the specified
+// size limit. It uses a greedy bin-packing algorithm that accumulates entities
+// until adding the next entity would exceed the limit, then starts a new chunk.
+//
+// The default chunk size of 3.0 MB provides a safe margin below the gRPC 4 MB
+// message size limit, accounting for protobuf serialization overhead.
+//
+// Parameters:
+//   - entities: Slice of Entity protobuf messages to chunk
+//   - maxChunkSizeMB: Maximum chunk size in MB (use 0 for default of 3.0 MB)
+//
+// Returns:
+//   - Slice of entity chunks, each under maxChunkSizeMB. Returns at least
+//     one chunk even if the input is empty.
+//
+// Examples:
+//
+//	entities := []*diodepb.Entity{entity1, entity2, entity3, ...}
+//	chunks := CreateMessageChunks(entities, 0) // Use default 3.0 MB
+//	for _, chunk := range chunks {
+//	    client.IngestProto(ctx, chunk)
+//	}
+//
+//	// Use a custom chunk size
+//	chunks = CreateMessageChunks(entities, 3.5)
+func CreateMessageChunks(entities []*pb.Entity, maxChunkSizeMB float64) [][]*pb.Entity {
+	// Use default if not specified
+	if maxChunkSizeMB <= 0 {
+		maxChunkSizeMB = DefaultMaxChunkSizeMB
+	}
+
+	// Handle empty input
+	if len(entities) == 0 {
+		return [][]*pb.Entity{entities}
+	}
+
+	// Convert MB to bytes
+	maxChunkSizeBytes := int(maxChunkSizeMB * 1024 * 1024)
+
+	// Quick check: if all entities fit in one chunk, return early
+	totalSize := EstimateMessageSize(entities)
+	if totalSize <= maxChunkSizeBytes {
+		return [][]*pb.Entity{entities}
+	}
+
+	// Greedy bin-packing: accumulate entities until limit reached
+	baseOverhead := proto.Size(&pb.IngestRequest{})
+	chunks := make([][]*pb.Entity, 0)
+	currentChunk := make([]*pb.Entity, 0)
+	currentChunkSize := baseOverhead // Start with overhead for the chunk
+
+	for _, entity := range entities {
+		entitySize := proto.Size(entity)
+		projectedSize := currentChunkSize + entitySize
+
+		// Check if adding this entity would exceed limit
+		if len(currentChunk) > 0 && projectedSize > maxChunkSizeBytes {
+			// Finalize current chunk and start new one
+			chunks = append(chunks, currentChunk)
+			currentChunk = []*pb.Entity{entity}
+			currentChunkSize = baseOverhead + entitySize
+		} else {
+			// Add entity to current chunk
+			currentChunk = append(currentChunk, entity)
+			currentChunkSize = projectedSize
+		}
+	}
+
+	// Add final chunk if not empty
+	if len(currentChunk) > 0 {
+		chunks = append(chunks, currentChunk)
+	}
+
+	// Return chunks or original entities if no chunks were created
+	if len(chunks) == 0 {
+		return [][]*pb.Entity{entities}
+	}
+
+	return chunks
+}
+
+// EstimateMessageSize returns an estimate, in bytes, of the serialized size of
+// an ingest message carrying the given entities.
+//
+// The estimate is the serialized size of an empty IngestRequest plus the sum
+// of proto.Size over every entity.
+//
+// NOTE(review): nothing is added here for any per-entity framing bytes the
+// enclosing message may use on the wire — confirm the chunk-size safety
+// margin covers that.
+//
+// Parameters:
+//   - entities: Slice of Entity protobuf messages
+//
+// Returns:
+//   - Estimated size in bytes including IngestRequest overhead
+//
+// Examples:
+//
+//	entities := []*diodepb.Entity{entity1, entity2, entity3}
+//	sizeBytes := EstimateMessageSize(entities)
+//	sizeMB := float64(sizeBytes) / (1024 * 1024)
+//	fmt.Printf("Estimated size: %.2f MB\n", sizeMB)
+func EstimateMessageSize(entities []*pb.Entity) int {
+	// Start from the size of an empty request, then add each entity's size.
+	total := proto.Size(&pb.IngestRequest{})
+	for i := range entities {
+		total += proto.Size(entities[i])
+	}
+	return total
+}