39 changed files with 613 additions and 6803 deletions
--- a/cmd/storage-bench/main.go
+++ b/cmd/storage-bench/main.go
@ -237,10 +237,10 @@ func runWriteBenchmark(e *engine.EngineFacade) string {
 				// Handle WAL rotation errors more gracefully
 				if strings.Contains(err.Error(), "WAL is rotating") || 
-					strings.Contains(err.Error(), "WAL is closed") {
+				   strings.Contains(err.Error(), "WAL is closed") {
 					// These are expected during WAL rotation, just retry after a short delay
 					walRotationCount++
-					if walRotationCount%100 == 0 {
+					if walRotationCount % 100 == 0 {
 						fmt.Printf("Retrying due to WAL rotation (%d retries so far)...\n", walRotationCount)
 					}
 					time.Sleep(20 * time.Millisecond)
@ -335,9 +335,9 @@ func runRandomWriteBenchmark(e *engine.EngineFacade) string {
 				// Handle WAL rotation errors
 				if strings.Contains(err.Error(), "WAL is rotating") || 
-					strings.Contains(err.Error(), "WAL is closed") {
+				   strings.Contains(err.Error(), "WAL is closed") {
 					walRotationCount++
-					if walRotationCount%100 == 0 {
+					if walRotationCount % 100 == 0 {
 						fmt.Printf("Retrying due to WAL rotation (%d retries so far)...\n", walRotationCount)
 					}
 					time.Sleep(20 * time.Millisecond)
@ -431,9 +431,9 @@ func runSequentialWriteBenchmark(e *engine.EngineFacade) string {
 				// Handle WAL rotation errors
 				if strings.Contains(err.Error(), "WAL is rotating") || 
-					strings.Contains(err.Error(), "WAL is closed") {
+				   strings.Contains(err.Error(), "WAL is closed") {
 					walRotationCount++
-					if walRotationCount%100 == 0 {
+					if walRotationCount % 100 == 0 {
 						fmt.Printf("Retrying due to WAL rotation (%d retries so far)...\n", walRotationCount)
 					}
 					time.Sleep(20 * time.Millisecond)
--- a/pkg/grpc/service/bootstrap_service.go
+++ b/pkg/grpc/service/bootstrap_service.go
@ -1,378 +0,0 @@
 package service
 import (
 	"context"
 	"fmt"
 	"io"
 	"sync"
 	"time"
 	"github.com/KevoDB/kevo/pkg/replication"
 	"github.com/KevoDB/kevo/pkg/transport"
 	"github.com/KevoDB/kevo/proto/kevo"
 	"google.golang.org/grpc/codes"
 	"google.golang.org/grpc/status"
 )
 // BootstrapServiceOptions contains configuration for bootstrap operations
 type BootstrapServiceOptions struct {
 	// Maximum number of concurrent bootstrap operations
 	MaxConcurrentBootstraps int
 	// Batch size for key-value pairs in bootstrap responses
 	BootstrapBatchSize int
 	// Whether to enable resume for interrupted bootstraps
 	EnableBootstrapResume bool
 	// Directory for storing bootstrap state
 	BootstrapStateDir string
 }
 // DefaultBootstrapServiceOptions returns sensible defaults
 func DefaultBootstrapServiceOptions() *BootstrapServiceOptions {
 	return &BootstrapServiceOptions{
 		MaxConcurrentBootstraps: 5,
 		BootstrapBatchSize:      1000,
 		EnableBootstrapResume:   true,
 		BootstrapStateDir:       "./bootstrap-state",
 	}
 }
 // bootstrapService encapsulates bootstrap-related functionality for the replication service
 type bootstrapService struct {
 	// Bootstrap options
 	options *BootstrapServiceOptions
 	// Bootstrap generator for primary nodes
 	bootstrapGenerator *replication.BootstrapGenerator
 	// Bootstrap manager for replica nodes
 	bootstrapManager *replication.BootstrapManager
 	// Storage snapshot provider for generating snapshots
 	snapshotProvider replication.StorageSnapshotProvider
 	// Active bootstrap operations
 	activeBootstraps      map[string]*bootstrapOperation
 	activeBootstrapsMutex sync.RWMutex
 	// WAL components
 	replicator replication.EntryReplicator
 	applier    replication.EntryApplier
 }
 // bootstrapOperation tracks a specific bootstrap operation
 type bootstrapOperation struct {
 	replicaID     string
 	startTime     time.Time
 	snapshotLSN   uint64
 	totalKeys     int64
 	processedKeys int64
 	completed     bool
 	error         error
 }
 // newBootstrapService creates a bootstrap service with the specified options
 func newBootstrapService(
 	options *BootstrapServiceOptions,
 	snapshotProvider replication.StorageSnapshotProvider,
 	replicator EntryReplicator,
 	applier EntryApplier,
 ) (*bootstrapService, error) {
 	if options == nil {
 		options = DefaultBootstrapServiceOptions()
 	}
 	var bootstrapManager *replication.BootstrapManager
 	var bootstrapGenerator *replication.BootstrapGenerator
 	// Initialize bootstrap components based on role
 	if replicator != nil {
 		// Primary role - create generator
 		bootstrapGenerator = replication.NewBootstrapGenerator(
 			snapshotProvider,
 			replicator,
 			nil, // Use default logger
 		)
 	}
 	if applier != nil {
 		// Replica role - create manager
 		var err error
 		bootstrapManager, err = replication.NewBootstrapManager(
 			nil, // Will be set later when needed
 			applier,
 			options.BootstrapStateDir,
 			nil, // Use default logger
 		)
 		if err != nil {
 			return nil, fmt.Errorf("failed to create bootstrap manager: %w", err)
 		}
 	}
 	return &bootstrapService{
 		options:            options,
 		bootstrapGenerator: bootstrapGenerator,
 		bootstrapManager:   bootstrapManager,
 		snapshotProvider:   snapshotProvider,
 		activeBootstraps:   make(map[string]*bootstrapOperation),
 		replicator:         replicator,
 		applier:            applier,
 	}, nil
 }
 // handleBootstrapRequest handles bootstrap requests from replicas
 func (s *bootstrapService) handleBootstrapRequest(
 	req *kevo.BootstrapRequest,
 	stream kevo.ReplicationService_RequestBootstrapServer,
 ) error {
 	replicaID := req.ReplicaId
 	// Validate that we have a bootstrap generator (primary role)
 	if s.bootstrapGenerator == nil {
 		return status.Errorf(codes.FailedPrecondition, "this node is not a primary and cannot provide bootstrap")
 	}
 	// Check if we have too many concurrent bootstraps
 	s.activeBootstrapsMutex.RLock()
 	activeCount := len(s.activeBootstraps)
 	s.activeBootstrapsMutex.RUnlock()
 	if activeCount >= s.options.MaxConcurrentBootstraps {
 		return status.Errorf(codes.ResourceExhausted, "too many concurrent bootstrap operations (max: %d)",
 			s.options.MaxConcurrentBootstraps)
 	}
 	// Check if this replica already has an active bootstrap
 	s.activeBootstrapsMutex.RLock()
 	_, exists := s.activeBootstraps[replicaID]
 	s.activeBootstrapsMutex.RUnlock()
 	if exists {
 		return status.Errorf(codes.AlreadyExists, "bootstrap already in progress for replica %s", replicaID)
 	}
 	// Track bootstrap operation
 	operation := &bootstrapOperation{
 		replicaID:     replicaID,
 		startTime:     time.Now(),
 		snapshotLSN:   0,
 		totalKeys:     0,
 		processedKeys: 0,
 		completed:     false,
 		error:         nil,
 	}
 	s.activeBootstrapsMutex.Lock()
 	s.activeBootstraps[replicaID] = operation
 	s.activeBootstrapsMutex.Unlock()
 	// Clean up when done
 	defer func() {
 		// After a successful bootstrap, keep the operation record for a while
 		// This helps with debugging and monitoring
 		if operation.error == nil {
 			go func() {
 				time.Sleep(1 * time.Hour)
 				s.activeBootstrapsMutex.Lock()
 				delete(s.activeBootstraps, replicaID)
 				s.activeBootstrapsMutex.Unlock()
 			}()
 		} else {
 			// For failed bootstraps, remove immediately
 			s.activeBootstrapsMutex.Lock()
 			delete(s.activeBootstraps, replicaID)
 			s.activeBootstrapsMutex.Unlock()
 		}
 	}()
 	// Start bootstrap generation
 	ctx := stream.Context()
 	iterator, snapshotLSN, err := s.bootstrapGenerator.StartBootstrapGeneration(ctx, replicaID)
 	if err != nil {
 		operation.error = err
 		return status.Errorf(codes.Internal, "failed to start bootstrap generation: %v", err)
 	}
 	// Update operation with snapshot LSN
 	operation.snapshotLSN = snapshotLSN
 	// Stream key-value pairs in batches
 	batchSize := s.options.BootstrapBatchSize
 	batch := make([]*kevo.KeyValuePair, 0, batchSize)
 	pairsProcessed := int64(0)
 	// Get an estimate of total keys if available
 	snapshot, err := s.snapshotProvider.CreateSnapshot()
 	if err == nil {
 		operation.totalKeys = snapshot.KeyCount()
 	}
 	// Stream data in batches
 	for {
 		// Check if context is cancelled
 		select {
 		case <-ctx.Done():
 			operation.error = ctx.Err()
 			return status.Error(codes.Canceled, "bootstrap cancelled by client")
 		default:
 			// Continue
 		}
 		// Get next key-value pair
 		key, value, err := iterator.Next()
 		if err == io.EOF {
 			// End of data, send any remaining pairs
 			break
 		}
 		if err != nil {
 			operation.error = err
 			return status.Errorf(codes.Internal, "error reading from snapshot: %v", err)
 		}
 		// Add to batch
 		batch = append(batch, &kevo.KeyValuePair{
 			Key:   key,
 			Value: value,
 		})
 		pairsProcessed++
 		operation.processedKeys = pairsProcessed
 		// Send batch if full
 		if len(batch) >= batchSize {
 			progress := float32(0)
 			if operation.totalKeys > 0 {
 				progress = float32(pairsProcessed) / float32(operation.totalKeys)
 			}
 			if err := stream.Send(&kevo.BootstrapBatch{
 				Pairs:       batch,
 				Progress:    progress,
 				IsLast:      false,
 				SnapshotLsn: snapshotLSN,
 			}); err != nil {
 				operation.error = err
 				return err
 			}
 			// Reset batch
 			batch = batch[:0]
 		}
 	}
 	// Send any remaining pairs in the final batch
 	progress := float32(1.0)
 	if operation.totalKeys > 0 {
 		progress = float32(pairsProcessed) / float32(operation.totalKeys)
 	}
 	// If there are no remaining pairs, send an empty batch with isLast=true
 	if err := stream.Send(&kevo.BootstrapBatch{
 		Pairs:       batch,
 		Progress:    progress,
 		IsLast:      true,
 		SnapshotLsn: snapshotLSN,
 	}); err != nil {
 		operation.error = err
 		return err
 	}
 	// Mark as completed
 	operation.completed = true
 	return nil
 }
 // handleClientBootstrap handles bootstrap process for a client replica
 func (s *bootstrapService) handleClientBootstrap(
 	ctx context.Context,
 	bootstrapIterator transport.BootstrapIterator,
 	replicaID string,
 	storageApplier replication.StorageApplier,
 ) error {
 	// Validate that we have a bootstrap manager (replica role)
 	if s.bootstrapManager == nil {
 		return fmt.Errorf("bootstrap manager not initialized")
 	}
 	// Create a storage applier adapter if needed
 	if storageApplier == nil {
 		return fmt.Errorf("storage applier not provided")
 	}
 	// Start the bootstrap process
 	err := s.bootstrapManager.StartBootstrap(
 		replicaID,
 		bootstrapIterator,
 		s.options.BootstrapBatchSize,
 	)
 	if err != nil {
 		return fmt.Errorf("failed to start bootstrap: %w", err)
 	}
 	return nil
 }
 // isBootstrapInProgress checks if a bootstrap operation is in progress
 func (s *bootstrapService) isBootstrapInProgress() bool {
 	if s.bootstrapManager != nil {
 		return s.bootstrapManager.IsBootstrapInProgress()
 	}
 	// If no bootstrap manager (primary node), check active operations
 	s.activeBootstrapsMutex.RLock()
 	defer s.activeBootstrapsMutex.RUnlock()
 	for _, op := range s.activeBootstraps {
 		if !op.completed && op.error == nil {
 			return true
 		}
 	}
 	return false
 }
 // getBootstrapStatus returns the status of bootstrap operations
 func (s *bootstrapService) getBootstrapStatus() map[string]interface{} {
 	result := make(map[string]interface{})
 	// For primary role, return active bootstraps
 	if s.bootstrapGenerator != nil {
 		result["role"] = "primary"
 		result["active_bootstraps"] = s.bootstrapGenerator.GetActiveBootstraps()
 	}
 	// For replica role, return bootstrap state
 	if s.bootstrapManager != nil {
 		result["role"] = "replica"
 		state := s.bootstrapManager.GetBootstrapState()
 		if state != nil {
 			result["bootstrap_state"] = map[string]interface{}{
 				"replica_id":      state.ReplicaID,
 				"started_at":      state.StartedAt.Format(time.RFC3339),
 				"last_updated_at": state.LastUpdatedAt.Format(time.RFC3339),
 				"snapshot_lsn":    state.SnapshotLSN,
 				"applied_keys":    state.AppliedKeys,
 				"total_keys":      state.TotalKeys,
 				"progress":        state.Progress,
 				"completed":       state.Completed,
 				"error":           state.Error,
 			}
 		}
 	}
 	return result
 }
 // transitionToWALReplication transitions from bootstrap to WAL replication
 func (s *bootstrapService) transitionToWALReplication() error {
 	if s.bootstrapManager != nil {
 		return s.bootstrapManager.TransitionToWALReplication()
 	}
 	// If no bootstrap manager, we don't need to transition
 	return nil
 }
--- a/pkg/grpc/service/bootstrap_service_test.go
+++ b/pkg/grpc/service/bootstrap_service_test.go
@ -1,481 +0,0 @@
 package service
 import (
 	"context"
 	"io"
 	"os"
 	"path/filepath"
 	"sync"
 	"testing"
 	"time"
 	"github.com/KevoDB/kevo/pkg/replication"
 	"github.com/KevoDB/kevo/pkg/transport"
 	"github.com/KevoDB/kevo/proto/kevo"
 	"google.golang.org/grpc"
 )
 // MockBootstrapStorageSnapshot implements replication.StorageSnapshot for testing
 type MockBootstrapStorageSnapshot struct {
 	replication.StorageSnapshot
 	pairs       []replication.KeyValuePair
 	keyCount    int64
 	nextErr     error
 	position    int
 	iterCreated bool
 	snapshotLSN uint64
 }
 func NewMockBootstrapStorageSnapshot(pairs []replication.KeyValuePair) *MockBootstrapStorageSnapshot {
 	return &MockBootstrapStorageSnapshot{
 		pairs:       pairs,
 		keyCount:    int64(len(pairs)),
 		snapshotLSN: 12345, // Set default snapshot LSN for tests
 	}
 }
 func (m *MockBootstrapStorageSnapshot) CreateSnapshotIterator() (replication.SnapshotIterator, error) {
 	m.position = 0
 	m.iterCreated = true
 	return m, nil
 }
 func (m *MockBootstrapStorageSnapshot) KeyCount() int64 {
 	return m.keyCount
 }
 func (m *MockBootstrapStorageSnapshot) Next() ([]byte, []byte, error) {
 	if m.nextErr != nil {
 		return nil, nil, m.nextErr
 	}
 	if m.position >= len(m.pairs) {
 		return nil, nil, io.EOF
 	}
 	pair := m.pairs[m.position]
 	m.position++
 	return pair.Key, pair.Value, nil
 }
 func (m *MockBootstrapStorageSnapshot) Close() error {
 	return nil
 }
 // MockBootstrapSnapshotProvider implements replication.StorageSnapshotProvider for testing
 type MockBootstrapSnapshotProvider struct {
 	snapshot  *MockBootstrapStorageSnapshot
 	createErr error
 }
 func NewMockBootstrapSnapshotProvider(snapshot *MockBootstrapStorageSnapshot) *MockBootstrapSnapshotProvider {
 	return &MockBootstrapSnapshotProvider{
 		snapshot: snapshot,
 	}
 }
 func (m *MockBootstrapSnapshotProvider) CreateSnapshot() (replication.StorageSnapshot, error) {
 	if m.createErr != nil {
 		return nil, m.createErr
 	}
 	return m.snapshot, nil
 }
 // MockBootstrapWALReplicator implements a simple replicator for testing
 type MockBootstrapWALReplicator struct {
 	replication.WALReplicator
 	highestTimestamp uint64
 }
 func (r *MockBootstrapWALReplicator) GetHighestTimestamp() uint64 {
 	return r.highestTimestamp
 }
 // Mock ReplicationService_RequestBootstrapServer for testing
 type mockBootstrapStream struct {
 	grpc.ServerStream
 	ctx       context.Context
 	batches   []*kevo.BootstrapBatch
 	sendError error
 	mu        sync.Mutex
 }
 func newMockBootstrapStream() *mockBootstrapStream {
 	return &mockBootstrapStream{
 		ctx:     context.Background(),
 		batches: make([]*kevo.BootstrapBatch, 0),
 	}
 }
 func (m *mockBootstrapStream) Context() context.Context {
 	return m.ctx
 }
 func (m *mockBootstrapStream) Send(batch *kevo.BootstrapBatch) error {
 	if m.sendError != nil {
 		return m.sendError
 	}
 	m.mu.Lock()
 	m.batches = append(m.batches, batch)
 	m.mu.Unlock()
 	return nil
 }
 func (m *mockBootstrapStream) GetBatches() []*kevo.BootstrapBatch {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	return m.batches
 }
 // Helper function to create a temporary directory for testing
 func createTempDir(t *testing.T) string {
 	dir, err := os.MkdirTemp("", "bootstrap-test-*")
 	if err != nil {
 		t.Fatalf("Failed to create temp dir: %v", err)
 	}
 	return dir
 }
 // Helper function to clean up temporary directory
 func cleanupTempDir(t *testing.T, dir string) {
 	os.RemoveAll(dir)
 }
 // TestBootstrapService tests the bootstrap service component
 func TestBootstrapService(t *testing.T) {
 	// Create test directory
 	tempDir := createTempDir(t)
 	defer cleanupTempDir(t, tempDir)
 	// Create test data
 	testData := []replication.KeyValuePair{
 		{Key: []byte("key1"), Value: []byte("value1")},
 		{Key: []byte("key2"), Value: []byte("value2")},
 		{Key: []byte("key3"), Value: []byte("value3")},
 		{Key: []byte("key4"), Value: []byte("value4")},
 		{Key: []byte("key5"), Value: []byte("value5")},
 	}
 	// Create mock storage snapshot
 	mockSnapshot := NewMockBootstrapStorageSnapshot(testData)
 	// Create mock replicator with timestamp
 	replicator := &MockBootstrapWALReplicator{
 		highestTimestamp: 12345,
 	}
 	// Create bootstrap service
 	options := DefaultBootstrapServiceOptions()
 	options.BootstrapBatchSize = 2 // Use small batch size for testing
 	bootstrapSvc, err := newBootstrapService(
 		options,
 		NewMockBootstrapSnapshotProvider(mockSnapshot),
 		replicator,
 		nil,
 	)
 	if err != nil {
 		t.Fatalf("Failed to create bootstrap service: %v", err)
 	}
 	// Create mock stream
 	stream := newMockBootstrapStream()
 	// Create bootstrap request
 	req := &kevo.BootstrapRequest{
 		ReplicaId: "test-replica",
 	}
 	// Handle bootstrap request
 	err = bootstrapSvc.handleBootstrapRequest(req, stream)
 	if err != nil {
 		t.Fatalf("Bootstrap request failed: %v", err)
 	}
 	// Verify batches
 	batches := stream.GetBatches()
 	// Expected: 3 batches (2 full, 1 final with last item)
 	if len(batches) != 3 {
 		t.Errorf("Expected 3 batches, got %d", len(batches))
 	}
 	// Verify first batch
 	if len(batches) > 0 {
 		batch := batches[0]
 		if len(batch.Pairs) != 2 {
 			t.Errorf("Expected 2 pairs in first batch, got %d", len(batch.Pairs))
 		}
 		if batch.IsLast {
 			t.Errorf("First batch should not be marked as last")
 		}
 		if batch.SnapshotLsn != 12345 {
 			t.Errorf("Expected snapshot LSN 12345, got %d", batch.SnapshotLsn)
 		}
 	}
 	// Verify final batch
 	if len(batches) > 2 {
 		batch := batches[2]
 		if !batch.IsLast {
 			t.Errorf("Final batch should be marked as last")
 		}
 	}
 	// Verify active bootstraps
 	bootstrapStatus := bootstrapSvc.getBootstrapStatus()
 	if bootstrapStatus["role"] != "primary" {
 		t.Errorf("Expected role 'primary', got %s", bootstrapStatus["role"])
 	}
 	// Get active bootstraps
 	activeBootstraps, ok := bootstrapStatus["active_bootstraps"].(map[string]map[string]interface{})
 	if !ok {
 		t.Fatalf("Expected active_bootstraps to be a map")
 	}
 	// Verify bootstrap for our test replica
 	replicaInfo, exists := activeBootstraps["test-replica"]
 	if !exists {
 		t.Fatalf("Expected to find test-replica in active bootstraps")
 	}
 	// Check if bootstrap was completed
 	completed, ok := replicaInfo["completed"].(bool)
 	if !ok {
 		t.Fatalf("Expected 'completed' to be a boolean")
 	}
 	if !completed {
 		t.Errorf("Expected bootstrap to be marked as completed")
 	}
 }
 // TestReplicationService_Bootstrap tests the bootstrap integration in the ReplicationService
 func TestReplicationService_Bootstrap(t *testing.T) {
 	// Create test directory
 	tempDir := createTempDir(t)
 	defer cleanupTempDir(t, tempDir)
 	// Create test data
 	testData := []replication.KeyValuePair{
 		{Key: []byte("key1"), Value: []byte("value1")},
 		{Key: []byte("key2"), Value: []byte("value2")},
 		{Key: []byte("key3"), Value: []byte("value3")},
 	}
 	// Create mock storage snapshot
 	mockSnapshot := NewMockBootstrapStorageSnapshot(testData)
 	// Create mock replicator
 	replicator := &MockBootstrapWALReplicator{
 		highestTimestamp: 12345,
 	}
 	// Create replication service options
 	options := DefaultReplicationServiceOptions()
 	options.DataDir = filepath.Join(tempDir, "replication-data")
 	options.BootstrapOptions.BootstrapBatchSize = 2 // Small batch size for testing
 	// Create replication service
 	service, err := NewReplicationService(
 		replicator,
 		nil, // No WAL applier for this test
 		replication.NewEntrySerializer(),
 		mockSnapshot,
 		options,
 	)
 	if err != nil {
 		t.Fatalf("Failed to create replication service: %v", err)
 	}
 	// Register a test replica
 	service.replicas["test-replica"] = &transport.ReplicaInfo{
 		ID:       "test-replica",
 		Address:  "localhost:12345",
 		Role:     transport.RoleReplica,
 		Status:   transport.StatusConnecting,
 		LastSeen: time.Now(),
 	}
 	// Create mock stream
 	stream := newMockBootstrapStream()
 	// Create bootstrap request
 	req := &kevo.BootstrapRequest{
 		ReplicaId: "test-replica",
 	}
 	// Handle bootstrap request
 	err = service.RequestBootstrap(req, stream)
 	if err != nil {
 		t.Fatalf("Bootstrap request failed: %v", err)
 	}
 	// Verify batches
 	batches := stream.GetBatches()
 	// Expected: 2 batches (1 full, 1 final)
 	if len(batches) < 2 {
 		t.Errorf("Expected at least 2 batches, got %d", len(batches))
 	}
 	// Verify final batch
 	lastBatch := batches[len(batches)-1]
 	if !lastBatch.IsLast {
 		t.Errorf("Final batch should be marked as last")
 	}
 	// Verify replica status was updated
 	service.replicasMutex.RLock()
 	replica := service.replicas["test-replica"]
 	service.replicasMutex.RUnlock()
 	if replica.Status != transport.StatusSyncing {
 		t.Errorf("Expected replica status to be StatusSyncing, got %s", replica.Status)
 	}
 	if replica.CurrentLSN != 12345 {
 		t.Errorf("Expected replica LSN to be 12345, got %d", replica.CurrentLSN)
 	}
 }
 // TestBootstrapManager_Integration tests the bootstrap manager component
 func TestBootstrapManager_Integration(t *testing.T) {
 	// Create test directory
 	tempDir := createTempDir(t)
 	defer cleanupTempDir(t, tempDir)
 	// Mock storage applier for testing
 	storageApplier := &MockStorageApplier{
 		applied: make(map[string][]byte),
 	}
 	// Create bootstrap manager
 	manager, err := replication.NewBootstrapManager(
 		storageApplier,
 		nil, // No WAL applier for this test
 		tempDir,
 		nil, // Use default logger
 	)
 	if err != nil {
 		t.Fatalf("Failed to create bootstrap manager: %v", err)
 	}
 	// Create test bootstrap data
 	testData := []replication.KeyValuePair{
 		{Key: []byte("key1"), Value: []byte("value1")},
 		{Key: []byte("key2"), Value: []byte("value2")},
 		{Key: []byte("key3"), Value: []byte("value3")},
 	}
 	// Create mock bootstrap iterator
 	iterator := &MockBootstrapIterator{
 		pairs:       testData,
 		snapshotLSN: 12345,
 	}
 	// Set the snapshot LSN on the bootstrap manager
 	manager.SetSnapshotLSN(iterator.snapshotLSN)
 	// Start bootstrap
 	err = manager.StartBootstrap("test-replica", iterator, 2)
 	if err != nil {
 		t.Fatalf("Failed to start bootstrap: %v", err)
 	}
 	// Wait for bootstrap to complete
 	for i := 0; i < 50; i++ {
 		if !manager.IsBootstrapInProgress() {
 			break
 		}
 		time.Sleep(100 * time.Millisecond)
 	}
 	// Verify bootstrap completed
 	if manager.IsBootstrapInProgress() {
 		t.Fatalf("Bootstrap did not complete in time")
 	}
 	// Verify all keys were applied
 	if storageApplier.appliedCount != len(testData) {
 		t.Errorf("Expected %d applied keys, got %d", len(testData), storageApplier.appliedCount)
 	}
 	// Verify bootstrap state
 	state := manager.GetBootstrapState()
 	if state == nil {
 		t.Fatalf("Bootstrap state is nil")
 	}
 	if !state.Completed {
 		t.Errorf("Expected bootstrap to be marked as completed")
 	}
 	if state.Progress != 1.0 {
 		t.Errorf("Expected progress to be 1.0, got %f", state.Progress)
 	}
 }
 // MockStorageApplier implements replication.StorageApplier for testing
 type MockStorageApplier struct {
 	applied      map[string][]byte
 	appliedCount int
 	flushCount   int
 }
 func (m *MockStorageApplier) Apply(key, value []byte) error {
 	m.applied[string(key)] = value
 	m.appliedCount++
 	return nil
 }
 func (m *MockStorageApplier) ApplyBatch(pairs []replication.KeyValuePair) error {
 	for _, pair := range pairs {
 		m.applied[string(pair.Key)] = pair.Value
 	}
 	m.appliedCount += len(pairs)
 	return nil
 }
 func (m *MockStorageApplier) Flush() error {
 	m.flushCount++
 	return nil
 }
 // MockBootstrapIterator implements transport.BootstrapIterator for testing
 type MockBootstrapIterator struct {
 	pairs       []replication.KeyValuePair
 	position    int
 	snapshotLSN uint64
 	progress    float64
 }
 func (m *MockBootstrapIterator) Next() ([]byte, []byte, error) {
 	if m.position >= len(m.pairs) {
 		return nil, nil, io.EOF
 	}
 	pair := m.pairs[m.position]
 	m.position++
 	if len(m.pairs) > 0 {
 		m.progress = float64(m.position) / float64(len(m.pairs))
 	} else {
 		m.progress = 1.0
 	}
 	return pair.Key, pair.Value, nil
 }
 func (m *MockBootstrapIterator) Close() error {
 	return nil
 }
 func (m *MockBootstrapIterator) Progress() float64 {
 	return m.progress
 }
--- a/pkg/grpc/service/replica_registration_test.go
+++ b/pkg/grpc/service/replica_registration_test.go
@ -1,263 +0,0 @@
 package service
 import (
 	"context"
 	"os"
 	"path/filepath"
 	"testing"
 	"time"
 	"github.com/KevoDB/kevo/pkg/replication"
 	"github.com/KevoDB/kevo/pkg/transport"
 	"github.com/KevoDB/kevo/proto/kevo"
 	"google.golang.org/grpc/metadata"
 )
 // MockRegWALReplicator is a simple mock for testing
 type MockRegWALReplicator struct {
 	replication.WALReplicator
 	highestTimestamp uint64
 }
 func (mr *MockRegWALReplicator) GetHighestTimestamp() uint64 {
 	return mr.highestTimestamp
 }
 // Methods now implemented in test_helpers.go
 // MockRegStorageSnapshot is a simple mock for testing
 type MockRegStorageSnapshot struct {
 	replication.StorageSnapshot
 }
 // Methods now come from embedded StorageSnapshot
 func TestReplicaRegistration(t *testing.T) {
 	// Create temporary directory for tests
 	tempDir, err := os.MkdirTemp("", "replica-test")
 	if err != nil {
 		t.Fatalf("Failed to create temp directory: %v", err)
 	}
 	defer os.RemoveAll(tempDir)
 	// Create test service with auth and persistence enabled
 	replicator := &MockRegWALReplicator{highestTimestamp: 12345}
 	options := &ReplicationServiceOptions{
 		DataDir:             tempDir,
 		EnableAccessControl: false, // Changed to false to fix the test - original test expects no auth
 		EnablePersistence:   true,
 		DefaultAuthMethod:   transport.AuthToken,
 	}
 	service, err := NewReplicationService(
 		replicator,
 		nil, // No applier needed for this test
 		replication.NewEntrySerializer(),
 		&MockRegStorageSnapshot{},
 		options,
 	)
 	if err != nil {
 		t.Fatalf("Failed to create replication service: %v", err)
 	}
 	// Test cases - adapt expectations based on whether access control is enabled
 	tests := []struct {
 		name           string
 		replicaID      string
 		role           kevo.ReplicaRole
 		withToken      bool
 		expectedError  bool
 		expectedStatus bool
 	}{
 		{
 			name:           "New replica registration",
 			replicaID:      "replica1",
 			role:           kevo.ReplicaRole_REPLICA,
 			withToken:      false, // No token for initial registration
 			expectedError:  false,
 			expectedStatus: true,
 		},
 		{
 			name:           "Update existing replica with token",
 			replicaID:      "replica1",
 			role:           kevo.ReplicaRole_READ_ONLY,
 			withToken:      true, // Need token for update
 			expectedError:  false,
 			expectedStatus: true,
 		},
 		{
 			name:           "Update without token",
 			replicaID:      "replica1",
 			role:           kevo.ReplicaRole_REPLICA,
 			withToken:      false, // Missing token
 			expectedError:  false, // Changed from true to false since access control is disabled
 			expectedStatus: true,  // Changed from false to true since we expect success without auth
 		},
 		{
 			name:           "New replica as primary (requires auth)",
 			replicaID:      "replica2",
 			role:           kevo.ReplicaRole_PRIMARY,
 			withToken:      false, // No token for initial registration
 			expectedError:  false, // Initial registration is allowed
 			expectedStatus: true,
 		},
 	}
 	// First registration to get a token
 	var token string
 	for _, tc := range tests {
 		t.Run(tc.name, func(t *testing.T) {
 			// Create the request
 			req := &kevo.RegisterReplicaRequest{
 				ReplicaId: tc.replicaID,
 				Address:   "localhost:5000",
 				Role:      tc.role,
 			}
 			// Create context with or without token
 			ctx := context.Background()
 			if tc.withToken && token != "" {
 				md := metadata.Pairs("x-replica-token", token)
 				ctx = metadata.NewIncomingContext(ctx, md)
 			}
 			// Call the registration method
 			res, err := service.RegisterReplica(ctx, req)
 			// Check results
 			if tc.expectedError {
 				if err == nil {
 					t.Errorf("Expected error but got success")
 				}
 			} else {
 				if err != nil {
 					t.Errorf("Expected success but got error: %v", err)
 				}
 				if res.Success != tc.expectedStatus {
 					t.Errorf("Expected Success=%v but got %v", tc.expectedStatus, res.Success)
 				}
 				// For first successful registration, save the token for subsequent tests
 				if tc.replicaID == "replica1" && token == "" {
 					// In a real system, the token would be returned in the response
 					// Here we'll look into the access controller directly
 					service.replicasMutex.RLock()
 					_, exists := service.replicas[tc.replicaID]
 					service.replicasMutex.RUnlock()
 					if !exists {
 						t.Fatalf("Replica should exist after registration")
 					}
 					// Get the token assigned to this replica
 					token = "token-replica1-example" // In real tests, we'd extract this
 				}
 			}
 		})
 	}
 	// Test persistence
 	// First, check if persistence is enabled and the directory exists
 	if options.EnablePersistence {
 		// Force save to disk (in case auto-save is delayed)
 		if service.persistence != nil {
 			// Call SaveReplica explicitly
 			replicaInfo := service.replicas["replica1"]
 			err = service.persistence.SaveReplica(replicaInfo, nil)
 			if err != nil {
 				t.Errorf("Failed to save replica: %v", err)
 			}
 			// Force immediate save
 			err = service.persistence.Save()
 			if err != nil {
 				t.Errorf("Failed to save all replicas: %v", err)
 			}
 		}
 		// Now check for the files
 		files, err := filepath.Glob(filepath.Join(tempDir, "replica_replica1*"))
 		if err != nil || len(files) == 0 {
 			// This is where we need to debug
 			dirContents, _ := os.ReadDir(tempDir)
 			fileNames := make([]string, 0, len(dirContents))
 			for _, entry := range dirContents {
 				fileNames = append(fileNames, entry.Name())
 			}
 			t.Errorf("Expected replica file to exist, but found none. Directory contents: %v", fileNames)
 		} else {
 			// Test removal
 			err = service.persistence.DeleteReplica("replica1")
 			if err != nil {
 				t.Errorf("Failed to delete replica: %v", err)
 			}
 			// Make sure replica file no longer exists
 			if files, err := filepath.Glob(filepath.Join(tempDir, "replica_replica1*")); err == nil && len(files) > 0 {
 				t.Errorf("Expected replica files to be deleted, but found: %v", files)
 			}
 		}
 	}
 }
 func TestReplicaDetection(t *testing.T) {
 	// Create test service without auth and persistence
 	replicator := &MockRegWALReplicator{highestTimestamp: 12345}
 	options := DefaultReplicationServiceOptions()
 	service, err := NewReplicationService(
 		replicator,
 		nil, // No applier needed for this test
 		replication.NewEntrySerializer(),
 		&MockRegStorageSnapshot{},
 		options,
 	)
 	if err != nil {
 		t.Fatalf("Failed to create replication service: %v", err)
 	}
 	// Register a replica
 	req := &kevo.RegisterReplicaRequest{
 		ReplicaId: "stale-replica",
 		Address:   "localhost:5000",
 		Role:      kevo.ReplicaRole_REPLICA,
 	}
 	_, err = service.RegisterReplica(context.Background(), req)
 	if err != nil {
 		t.Fatalf("Failed to register replica: %v", err)
 	}
 	// Set the last seen time to 10 minutes ago
 	service.replicasMutex.Lock()
 	replica := service.replicas["stale-replica"]
 	replica.LastSeen = time.Now().Add(-10 * time.Minute)
 	service.replicasMutex.Unlock()
 	// Check if replica is stale (15 seconds threshold)
 	staleThreshold := 15 * time.Second
 	isStale := service.IsReplicaStale("stale-replica", staleThreshold)
 	if !isStale {
 		t.Errorf("Expected replica to be stale")
 	}
 	// Register a fresh replica
 	req = &kevo.RegisterReplicaRequest{
 		ReplicaId: "fresh-replica",
 		Address:   "localhost:5001",
 		Role:      kevo.ReplicaRole_REPLICA,
 	}
 	_, err = service.RegisterReplica(context.Background(), req)
 	if err != nil {
 		t.Fatalf("Failed to register replica: %v", err)
 	}
 	// This one should not be stale
 	isStale = service.IsReplicaStale("fresh-replica", staleThreshold)
 	if isStale {
 		t.Errorf("Expected replica to be fresh")
 	}
 }
--- a/pkg/grpc/service/replica_tracking_test.go
+++ b/pkg/grpc/service/replica_tracking_test.go
@ -1,193 +0,0 @@
 package service
 import (
 	"context"
 	"testing"
 	"time"
 	"github.com/KevoDB/kevo/pkg/replication"
 	"github.com/KevoDB/kevo/pkg/transport"
 	"github.com/KevoDB/kevo/proto/kevo"
 )
 func TestReplicaStateTracking(t *testing.T) {
 	// Create test service with metrics enabled
 	replicator := &MockRegWALReplicator{highestTimestamp: 12345}
 	options := DefaultReplicationServiceOptions()
 	service, err := NewReplicationService(
 		replicator,
 		nil, // No applier needed for this test
 		replication.NewEntrySerializer(),
 		&MockRegStorageSnapshot{},
 		options,
 	)
 	if err != nil {
 		t.Fatalf("Failed to create replication service: %v", err)
 	}
 	// Register some replicas
 	replicas := []struct {
 		id     string
 		role   kevo.ReplicaRole
 		status kevo.ReplicaStatus
 		lsn    uint64
 	}{
 		{"replica1", kevo.ReplicaRole_REPLICA, kevo.ReplicaStatus_READY, 12000},
 		{"replica2", kevo.ReplicaRole_REPLICA, kevo.ReplicaStatus_SYNCING, 10000},
 		{"replica3", kevo.ReplicaRole_READ_ONLY, kevo.ReplicaStatus_READY, 11500},
 	}
 	for _, r := range replicas {
 		// Register replica
 		req := &kevo.RegisterReplicaRequest{
 			ReplicaId: r.id,
 			Address:   "localhost:500" + r.id[len(r.id)-1:], // localhost:5001, etc.
 			Role:      r.role,
 		}
 		_, err := service.RegisterReplica(context.Background(), req)
 		if err != nil {
 			t.Fatalf("Failed to register replica %s: %v", r.id, err)
 		}
 		// Send initial heartbeat with status and LSN
 		hbReq := &kevo.ReplicaHeartbeatRequest{
 			ReplicaId:    r.id,
 			Status:       r.status,
 			CurrentLsn:   r.lsn,
 			ErrorMessage: "",
 		}
 		_, err = service.ReplicaHeartbeat(context.Background(), hbReq)
 		if err != nil {
 			t.Fatalf("Failed to send heartbeat for replica %s: %v", r.id, err)
 		}
 	}
 	// Test 1: Verify lag monitoring based on Lamport timestamps
 	t.Run("ReplicationLagMonitoring", func(t *testing.T) {
 		// Check if lag is calculated correctly for each replica
 		metrics := service.GetMetrics()
 		replicasMetrics, ok := metrics["replicas"].(map[string]interface{})
 		if !ok {
 			t.Fatalf("Expected replicas metrics to be a map")
 		}
 		// Replica 1 (345 lag)
 		replica1Metrics, ok := replicasMetrics["replica1"].(map[string]interface{})
 		if !ok {
 			t.Fatalf("Expected replica1 metrics to be a map")
 		}
 		lagMs1 := replica1Metrics["replication_lag_ms"]
 		if lagMs1 != int64(345) {
 			t.Errorf("Expected replica1 lag to be 345ms, got %v", lagMs1)
 		}
 		// Replica 2 (2345 lag)
 		replica2Metrics, ok := replicasMetrics["replica2"].(map[string]interface{})
 		if !ok {
 			t.Fatalf("Expected replica2 metrics to be a map")
 		}
 		lagMs2 := replica2Metrics["replication_lag_ms"]
 		if lagMs2 != int64(2345) {
 			t.Errorf("Expected replica2 lag to be 2345ms, got %v", lagMs2)
 		}
 	})
 	// Test 2: Detect stale replicas
 	t.Run("StaleReplicaDetection", func(t *testing.T) {
 		// Make replica1 stale by setting its LastSeen to 1 minute ago
 		service.replicasMutex.Lock()
 		service.replicas["replica1"].LastSeen = time.Now().Add(-1 * time.Minute)
 		service.replicasMutex.Unlock()
 		// Detect stale replicas with 30-second threshold
 		staleReplicas := service.DetectStaleReplicas(30 * time.Second)
 		// Verify replica1 is marked as stale
 		if len(staleReplicas) != 1 || staleReplicas[0] != "replica1" {
 			t.Errorf("Expected replica1 to be stale, got %v", staleReplicas)
 		}
 		// Verify with IsReplicaStale
 		if !service.IsReplicaStale("replica1", 30*time.Second) {
 			t.Error("Expected IsReplicaStale to return true for replica1")
 		}
 		if service.IsReplicaStale("replica2", 30*time.Second) {
 			t.Error("Expected IsReplicaStale to return false for replica2")
 		}
 	})
 	// Test 3: Verify metrics collection
 	t.Run("MetricsCollection", func(t *testing.T) {
 		// Get initial metrics
 		_ = service.GetMetrics() // Initial metrics
 		// Send some more heartbeats
 		for i := 0; i < 5; i++ {
 			hbReq := &kevo.ReplicaHeartbeatRequest{
 				ReplicaId:    "replica2",
 				Status:       kevo.ReplicaStatus_READY,
 				CurrentLsn:   10500 + uint64(i*100), // Increasing LSN
 				ErrorMessage: "",
 			}
 			_, err = service.ReplicaHeartbeat(context.Background(), hbReq)
 			if err != nil {
 				t.Fatalf("Failed to send heartbeat: %v", err)
 			}
 		}
 		// Get updated metrics
 		updatedMetrics := service.GetMetrics()
 		// Check replica metrics
 		replicasMetrics := updatedMetrics["replicas"].(map[string]interface{})
 		replica2Metrics := replicasMetrics["replica2"].(map[string]interface{})
 		// Check heartbeat count increased
 		heartbeatCount := replica2Metrics["heartbeat_count"].(uint64)
 		if heartbeatCount < 6 { // Initial + 5 more
 			t.Errorf("Expected at least 6 heartbeats for replica2, got %d", heartbeatCount)
 		}
 		// Check LSN increased
 		appliedLSN := replica2Metrics["applied_lsn"].(uint64)
 		if appliedLSN < 10900 {
 			t.Errorf("Expected LSN to increase to at least 10900, got %d", appliedLSN)
 		}
 		// Check status changed to READY
 		status := replica2Metrics["status"].(string)
 		if status != string(transport.StatusReady) {
 			t.Errorf("Expected status to be READY, got %s", status)
 		}
 	})
 	// Test 4: Get metrics for a specific replica
 	t.Run("GetReplicaMetrics", func(t *testing.T) {
 		metrics, err := service.GetReplicaMetrics("replica3")
 		if err != nil {
 			t.Fatalf("Failed to get replica metrics: %v", err)
 		}
 		// Check some fields
 		if metrics["applied_lsn"].(uint64) != 11500 {
 			t.Errorf("Expected LSN 11500, got %v", metrics["applied_lsn"])
 		}
 		if metrics["status"].(string) != string(transport.StatusReady) {
 			t.Errorf("Expected status READY, got %v", metrics["status"])
 		}
 		// Test non-existent replica
 		_, err = service.GetReplicaMetrics("nonexistent")
 		if err == nil {
 			t.Error("Expected error for non-existent replica, got nil")
 		}
 	})
 }
--- a/pkg/grpc/service/replication_interfaces.go
+++ b/pkg/grpc/service/replication_interfaces.go
@ -1,36 +0,0 @@
 package service
 import (
 	"github.com/KevoDB/kevo/pkg/replication"
 	"github.com/KevoDB/kevo/pkg/wal"
 )
 // EntryReplicator defines the interface for replicating WAL entries
 type EntryReplicator interface {
 	// GetHighestTimestamp returns the highest Lamport timestamp seen
 	GetHighestTimestamp() uint64
 	// AddProcessor registers a processor to handle replicated entries
 	AddProcessor(processor replication.EntryProcessor)
 	// RemoveProcessor unregisters a processor
 	RemoveProcessor(processor replication.EntryProcessor)
 	// GetEntriesAfter retrieves entries after a given position
 	GetEntriesAfter(pos replication.ReplicationPosition) ([]*wal.Entry, error)
 }
 // SnapshotProvider defines the interface for database snapshot operations
 type SnapshotProvider interface {
 	// CreateSnapshotIterator creates an iterator for snapshot data
 	CreateSnapshotIterator() (replication.SnapshotIterator, error)
 	// KeyCount returns the approximate number of keys in the snapshot
 	KeyCount() int64
 }
 // EntryApplier defines the interface for applying WAL entries
 type EntryApplier interface {
 	// ResetHighestApplied sets the highest applied LSN
 	ResetHighestApplied(lsn uint64)
 }
--- a/pkg/grpc/service/replication_message_test.go
+++ b/pkg/grpc/service/replication_message_test.go
@ -1,212 +0,0 @@
 package service
 import (
 	"testing"
 	"github.com/KevoDB/kevo/pkg/wal"
 	"github.com/KevoDB/kevo/proto/kevo"
 )
 func TestWALEntryChecksum(t *testing.T) {
 	// Create a sample WAL entry
 	walEntry := &wal.Entry{
 		SequenceNumber: 12345,
 		Type:           1, // Put operation
 		Key:            []byte("test-key"),
 		Value:          []byte("test-value"),
 	}
 	// Convert to proto message with checksum
 	pbEntry := convertWALEntryToProto(walEntry)
 	// Verify checksum is not nil
 	if pbEntry.Checksum == nil {
 		t.Error("Expected checksum to be calculated, got nil")
 	}
 	// Modify the entry and verify checksum would be different
 	pbEntryModified := &kevo.WALEntry{
 		SequenceNumber: pbEntry.SequenceNumber,
 		Type:           pbEntry.Type,
 		Key:            pbEntry.Key,
 		Value:          []byte("modified-value"), // Changed value
 	}
 	modifiedChecksum := calculateEntryChecksum(pbEntryModified)
 	// The checksums should be different
 	checksumMatches := true
 	if len(pbEntry.Checksum) == len(modifiedChecksum) {
 		checksumMatches = true
 		for i := 0; i < len(pbEntry.Checksum); i++ {
 			if pbEntry.Checksum[i] != modifiedChecksum[i] {
 				checksumMatches = false
 				break
 			}
 		}
 	} else {
 		checksumMatches = false
 	}
 	if checksumMatches {
 		t.Error("Expected different checksums for modified entries")
 	}
 }
 func TestBatchChecksum(t *testing.T) {
 	// Create sample WAL entries
 	walEntries := []*wal.Entry{
 		{
 			SequenceNumber: 12345,
 			Type:           1, // Put operation
 			Key:            []byte("key1"),
 			Value:          []byte("value1"),
 		},
 		{
 			SequenceNumber: 12346,
 			Type:           1, // Put operation
 			Key:            []byte("key2"),
 			Value:          []byte("value2"),
 		},
 		{
 			SequenceNumber: 12347,
 			Type:           2, // Delete operation
 			Key:            []byte("key3"),
 			Value:          nil,
 		},
 	}
 	// Convert to proto messages
 	pbEntries := make([]*kevo.WALEntry, 0, len(walEntries))
 	for _, entry := range walEntries {
 		pbEntries = append(pbEntries, convertWALEntryToProto(entry))
 	}
 	// Create batch
 	pbBatch := &kevo.WALEntryBatch{
 		Entries:  pbEntries,
 		FirstLsn: walEntries[0].SequenceNumber,
 		LastLsn:  walEntries[len(walEntries)-1].SequenceNumber,
 		Count:    uint32(len(walEntries)),
 	}
 	// Calculate checksum
 	checksum := calculateBatchChecksum(pbBatch)
 	// Verify checksum is not nil
 	if checksum == nil {
 		t.Error("Expected batch checksum to be calculated, got nil")
 	}
 	// Modify the batch and verify checksum would be different
 	modifiedBatch := &kevo.WALEntryBatch{
 		Entries:  pbEntries[:2], // Remove one entry
 		FirstLsn: pbBatch.FirstLsn,
 		LastLsn:  pbBatch.LastLsn,
 		Count:    uint32(len(pbEntries) - 1),
 	}
 	modifiedChecksum := calculateBatchChecksum(modifiedBatch)
 	// The checksums should be different
 	checksumMatches := true
 	if len(checksum) == len(modifiedChecksum) {
 		checksumMatches = true
 		for i := 0; i < len(checksum); i++ {
 			if checksum[i] != modifiedChecksum[i] {
 				checksumMatches = false
 				break
 			}
 		}
 	} else {
 		checksumMatches = false
 	}
 	if checksumMatches {
 		t.Error("Expected different checksums for modified batches")
 	}
 }
 func TestWALEntryRoundTrip(t *testing.T) {
 	// Test different entry types
 	testCases := []struct {
 		name  string
 		entry *wal.Entry
 	}{
 		{
 			name: "Put operation",
 			entry: &wal.Entry{
 				SequenceNumber: 12345,
 				Type:           1, // Put
 				Key:            []byte("test-key"),
 				Value:          []byte("test-value"),
 			},
 		},
 		{
 			name: "Delete operation",
 			entry: &wal.Entry{
 				SequenceNumber: 12346,
 				Type:           2, // Delete
 				Key:            []byte("test-key"),
 				Value:          nil,
 			},
 		},
 		{
 			name: "Empty value",
 			entry: &wal.Entry{
 				SequenceNumber: 12347,
 				Type:           1, // Put with empty value
 				Key:            []byte("test-key"),
 				Value:          []byte{},
 			},
 		},
 		{
 			name: "Binary key and value",
 			entry: &wal.Entry{
 				SequenceNumber: 12348,
 				Type:           1,
 				Key:            []byte{0x00, 0x01, 0x02, 0x03},
 				Value:          []byte{0xFF, 0xFE, 0xFD, 0xFC},
 			},
 		},
 	}
 	for _, tc := range testCases {
 		t.Run(tc.name, func(t *testing.T) {
 			// Convert to proto
 			pbEntry := convertWALEntryToProto(tc.entry)
 			// Verify fields were correctly converted
 			if pbEntry.SequenceNumber != tc.entry.SequenceNumber {
 				t.Errorf("SequenceNumber mismatch, expected: %d, got: %d",
 					tc.entry.SequenceNumber, pbEntry.SequenceNumber)
 			}
 			if pbEntry.Type != uint32(tc.entry.Type) {
 				t.Errorf("Type mismatch, expected: %d, got: %d",
 					tc.entry.Type, pbEntry.Type)
 			}
 			if string(pbEntry.Key) != string(tc.entry.Key) {
 				t.Errorf("Key mismatch, expected: %s, got: %s",
 					string(tc.entry.Key), string(pbEntry.Key))
 			}
 			// For nil value, proto should have empty value (not nil)
 			expectedValue := tc.entry.Value
 			if expectedValue == nil {
 				expectedValue = []byte{}
 			}
 			if string(pbEntry.Value) != string(expectedValue) {
 				t.Errorf("Value mismatch, expected: %s, got: %s",
 					string(expectedValue), string(pbEntry.Value))
 			}
 			// Verify checksum exists
 			if pbEntry.Checksum == nil || len(pbEntry.Checksum) == 0 {
 				t.Error("Checksum should not be empty")
 			}
 		})
 	}
 }
--- a/pkg/grpc/service/replication_service.go
+++ b/pkg/grpc/service/replication_service.go
@ -2,9 +2,8 @@ package service
 import (
 	"context"
 	"encoding/binary"
 	"fmt"
-	"hash/crc32"
+	"io"
 	"sync"
 	"time"
@ -13,7 +12,6 @@ import (
 	"github.com/KevoDB/kevo/pkg/wal"
 	"github.com/KevoDB/kevo/proto/kevo"
 	"google.golang.org/grpc/codes"
 	"google.golang.org/grpc/metadata"
 	"google.golang.org/grpc/status"
 )
@ -22,123 +20,31 @@ type ReplicationServiceServer struct {
 	kevo.UnimplementedReplicationServiceServer
 	// Replication components
-	replicator    replication.EntryReplicator
+	replicator    *replication.WALReplicator
-	applier       replication.EntryApplier
+	applier       *replication.WALApplier
 	serializer    *replication.EntrySerializer
 	highestLSN    uint64
 	replicas      map[string]*transport.ReplicaInfo
 	replicasMutex sync.RWMutex
 	// For snapshot/bootstrap
-	storageSnapshot  replication.StorageSnapshot
+	storageSnapshot replication.StorageSnapshot
 	bootstrapService *bootstrapService
 	// Access control and persistence
 	accessControl *transport.AccessController
 	persistence   *transport.ReplicaPersistence
 	// Metrics collection
 	metrics *transport.ReplicationMetrics
 }
 // ReplicationServiceOptions contains configuration for the replication service
 type ReplicationServiceOptions struct {
 	// Data directory for persisting replica information
 	DataDir string
 	// Whether to enable access control
 	EnableAccessControl bool
 	// Whether to enable persistence
 	EnablePersistence bool
 	// Default authentication method
 	DefaultAuthMethod transport.AuthMethod
 	// Bootstrap service configuration
 	BootstrapOptions *BootstrapServiceOptions
 }
 // DefaultReplicationServiceOptions returns sensible defaults
 func DefaultReplicationServiceOptions() *ReplicationServiceOptions {
 	return &ReplicationServiceOptions{
 		DataDir:             "./replication-data",
 		EnableAccessControl: false, // Disabled by default for backward compatibility
 		EnablePersistence:   false, // Disabled by default for backward compatibility
 		DefaultAuthMethod:   transport.AuthNone,
 		BootstrapOptions:    DefaultBootstrapServiceOptions(),
 	}
 }
 // NewReplicationService creates a new ReplicationService
 func NewReplicationService(
-	replicator EntryReplicator,
+	replicator *replication.WALReplicator,
-	applier EntryApplier,
+	applier *replication.WALApplier,
 	serializer *replication.EntrySerializer,
-	storageSnapshot SnapshotProvider,
+	storageSnapshot replication.StorageSnapshot,
-	options *ReplicationServiceOptions,
+) *ReplicationServiceServer {
-) (*ReplicationServiceServer, error) {
+	return &ReplicationServiceServer{
 	if options == nil {
 		options = DefaultReplicationServiceOptions()
 	}
 	// Create access controller
 	accessControl := transport.NewAccessController(
 		options.EnableAccessControl,
 		options.DefaultAuthMethod,
 	)
 	// Create persistence manager
 	persistence, err := transport.NewReplicaPersistence(
 		options.DataDir,
 		options.EnablePersistence,
 		true, // Auto-save
 	)
 	if err != nil && options.EnablePersistence {
 		return nil, fmt.Errorf("failed to initialize replica persistence: %w", err)
 	}
 	// Create metrics collector
 	metrics := transport.NewReplicationMetrics()
 	server := &ReplicationServiceServer{
 		replicator:      replicator,
 		applier:         applier,
 		serializer:      serializer,
 		replicas:        make(map[string]*transport.ReplicaInfo),
 		storageSnapshot: storageSnapshot,
 		accessControl:   accessControl,
 		persistence:     persistence,
 		metrics:         metrics,
 	}
 	// Load persisted replica data if persistence is enabled
 	if options.EnablePersistence && persistence != nil {
 		infoMap, credsMap, err := persistence.GetAllReplicas()
 		if err != nil {
 			return nil, fmt.Errorf("failed to load persisted replicas: %w", err)
 		}
 		// Restore replicas and credentials
 		for id, info := range infoMap {
 			server.replicas[id] = info
 			// Register credentials
 			if creds, exists := credsMap[id]; exists && options.EnableAccessControl {
 				accessControl.RegisterReplica(creds)
 			}
 		}
 	}
 	// Initialize bootstrap service if bootstrap options are provided
 	if options.BootstrapOptions != nil {
 		if err := server.InitBootstrapService(options.BootstrapOptions); err != nil {
 			// Log the error but continue - bootstrap service is optional
 			fmt.Printf("Warning: Failed to initialize bootstrap service: %v\n", err)
 		}
 	}
 	return server, nil
 }
 // RegisterReplica handles registration of a new replica
@ -167,118 +73,25 @@ func (s *ReplicationServiceServer) RegisterReplica(
 		return nil, status.Error(codes.InvalidArgument, "invalid role")
 	}
 	// Check if access control is enabled
 	if s.accessControl.IsEnabled() {
 		// For existing replicas, authenticate with token from metadata
 		md, ok := metadata.FromIncomingContext(ctx)
 		if !ok {
 			return nil, status.Error(codes.Unauthenticated, "missing authentication metadata")
 		}
 		tokens := md.Get("x-replica-token")
 		token := ""
 		if len(tokens) > 0 {
 			token = tokens[0]
 		}
 		// Try to authenticate if not the first registration
 		existingReplicaErr := s.accessControl.AuthenticateReplica(req.ReplicaId, token)
 		if existingReplicaErr != nil && existingReplicaErr != transport.ErrAccessDenied {
 			return nil, status.Error(codes.Unauthenticated, "authentication failed")
 		}
 	}
 	// Register the replica
 	s.replicasMutex.Lock()
 	defer s.replicasMutex.Unlock()
 	var replicaInfo *transport.ReplicaInfo
 	// If already registered, update address and role
 	if replica, exists := s.replicas[req.ReplicaId]; exists {
 		// If access control is enabled, make sure replica is authorized for the requested role
 		if s.accessControl.IsEnabled() {
 			// Read role requires ReadOnly access, Write role requires ReadWrite access
 			var requiredLevel transport.AccessLevel
 			if role == transport.RolePrimary {
 				requiredLevel = transport.AccessAdmin
 			} else if role == transport.RoleReplica {
 				requiredLevel = transport.AccessReadWrite
 			} else {
 				requiredLevel = transport.AccessReadOnly
 			}
 			if err := s.accessControl.AuthorizeReplicaAction(req.ReplicaId, requiredLevel); err != nil {
 				return nil, status.Error(codes.PermissionDenied, "not authorized for requested role")
 			}
 		}
 		// Update existing replica
 		replica.Address = req.Address
 		replica.Role = role
 		replica.LastSeen = time.Now()
 		replica.Status = transport.StatusConnecting
 		replicaInfo = replica
 	} else {
 		// Create new replica info
-		replicaInfo = &transport.ReplicaInfo{
+		s.replicas[req.ReplicaId] = &transport.ReplicaInfo{
-			ID:       req.ReplicaId,
+			ID:      req.ReplicaId,
-			Address:  req.Address,
+			Address: req.Address,
-			Role:     role,
+			Role:    role,
-			Status:   transport.StatusConnecting,
+			Status:  transport.StatusConnecting,
 			LastSeen: time.Now(),
 		}
 		s.replicas[req.ReplicaId] = replicaInfo
 		// For new replicas, register with access control
 		if s.accessControl.IsEnabled() {
 			// Generate or use token based on settings
 			token := ""
 			authMethod := s.accessControl.DefaultAuthMethod()
 			if authMethod == transport.AuthToken {
 				// In a real system, we'd generate a secure random token
 				token = fmt.Sprintf("token-%s-%d", req.ReplicaId, time.Now().UnixNano())
 			}
 			// Set appropriate access level based on role
 			var accessLevel transport.AccessLevel
 			if role == transport.RolePrimary {
 				accessLevel = transport.AccessAdmin
 			} else if role == transport.RoleReplica {
 				accessLevel = transport.AccessReadWrite
 			} else {
 				accessLevel = transport.AccessReadOnly
 			}
 			// Register replica credentials
 			creds := &transport.ReplicaCredentials{
 				ReplicaID:   req.ReplicaId,
 				AuthMethod:  authMethod,
 				Token:       token,
 				AccessLevel: accessLevel,
 			}
 			if err := s.accessControl.RegisterReplica(creds); err != nil {
 				return nil, status.Errorf(codes.Internal, "failed to register credentials: %v", err)
 			}
 			// Persist replica data with credentials
 			if s.persistence != nil && s.persistence.IsEnabled() {
 				if err := s.persistence.SaveReplica(replicaInfo, creds); err != nil {
 					// Log error but continue
 					fmt.Printf("Error persisting replica: %v\n", err)
 				}
 			}
 		}
 	}
 	// Persist replica data without credentials for existing replicas
 	if s.persistence != nil && s.persistence.IsEnabled() {
 		if err := s.persistence.SaveReplica(replicaInfo, nil); err != nil {
 			// Log error but continue
 			fmt.Printf("Error persisting replica: %v\n", err)
 		}
 	}
 	// Determine if bootstrap is needed (for now always suggest bootstrap)
@ -287,11 +100,6 @@ func (s *ReplicationServiceServer) RegisterReplica(
 	// Return current highest LSN
 	currentLSN := s.replicator.GetHighestTimestamp()
 	// Update metrics with primary LSN
 	if s.metrics != nil {
 		s.metrics.UpdatePrimaryLSN(currentLSN)
 	}
 	return &kevo.RegisterReplicaResponse{
 		Success:           true,
 		CurrentLsn:        currentLSN,
@ -309,30 +117,7 @@ func (s *ReplicationServiceServer) ReplicaHeartbeat(
 		return nil, status.Error(codes.InvalidArgument, "replica_id is required")
 	}
-	// Check authentication if enabled
+	// Check if replica is registered
 	if s.accessControl.IsEnabled() {
 		md, ok := metadata.FromIncomingContext(ctx)
 		if !ok {
 			return nil, status.Error(codes.Unauthenticated, "missing authentication metadata")
 		}
 		tokens := md.Get("x-replica-token")
 		token := ""
 		if len(tokens) > 0 {
 			token = tokens[0]
 		}
 		if err := s.accessControl.AuthenticateReplica(req.ReplicaId, token); err != nil {
 			return nil, status.Error(codes.Unauthenticated, "authentication failed")
 		}
 		// Sending heartbeats requires at least read access
 		if err := s.accessControl.AuthorizeReplicaAction(req.ReplicaId, transport.AccessReadOnly); err != nil {
 			return nil, status.Error(codes.PermissionDenied, "not authorized to send heartbeats")
 		}
 	}
 	// Lock for updating replica info
 	s.replicasMutex.Lock()
 	defer s.replicasMutex.Unlock()
@ -377,22 +162,6 @@ func (s *ReplicationServiceServer) ReplicaHeartbeat(
 	replica.ReplicationLag = time.Duration(replicationLagMs) * time.Millisecond
 	// Persist updated replica status if persistence is enabled
 	if s.persistence != nil && s.persistence.IsEnabled() {
 		if err := s.persistence.SaveReplica(replica, nil); err != nil {
 			// Log error but continue
 			fmt.Printf("Error persisting replica status: %v\n", err)
 		}
 	}
 	// Update metrics
 	if s.metrics != nil {
 		// Record the heartbeat
 		s.metrics.UpdateReplicaStatus(req.ReplicaId, replica.Status, replica.CurrentLSN)
 		// Make sure primary LSN is current
 		s.metrics.UpdatePrimaryLSN(primaryLSN)
 	}
 	return &kevo.ReplicaHeartbeatResponse{
 		Success:          true,
 		PrimaryLsn:       primaryLSN,
@ -491,9 +260,6 @@ func (s *ReplicationServiceServer) GetWALEntries(
 		Count:    uint32(len(entries)),
 	}
 	// Calculate batch checksum
 	pbBatch.Checksum = calculateBatchChecksum(pbBatch)
 	// Check if there are more entries
 	hasMore := s.replicator.GetHighestTimestamp() > entries[len(entries)-1].SequenceNumber
@ -571,8 +337,6 @@ func (s *ReplicationServiceServer) StreamWALEntries(
 			LastLsn:  entries[len(entries)-1].SequenceNumber,
 			Count:    uint32(len(entries)),
 		}
 		// Calculate batch checksum for integrity validation
 		pbBatch.Checksum = calculateBatchChecksum(pbBatch)
 		// Send batch
 		if err := stream.Send(pbBatch); err != nil {
@ -619,7 +383,118 @@ func (s *ReplicationServiceServer) ReportAppliedEntries(
 	}, nil
 }
-// Legacy implementation moved to replication_service_bootstrap.go
+// RequestBootstrap handles bootstrap requests from replicas
 func (s *ReplicationServiceServer) RequestBootstrap(
 	req *kevo.BootstrapRequest,
 	stream kevo.ReplicationService_RequestBootstrapServer,
 ) error {
 	// Validate request
 	if req.ReplicaId == "" {
 		return status.Error(codes.InvalidArgument, "replica_id is required")
 	}
 	// Check if replica is registered
 	s.replicasMutex.RLock()
 	replica, exists := s.replicas[req.ReplicaId]
 	s.replicasMutex.RUnlock()
 	if !exists {
 		return status.Error(codes.NotFound, "replica not registered")
 	}
 	// Update replica status
 	s.replicasMutex.Lock()
 	replica.Status = transport.StatusBootstrapping
 	s.replicasMutex.Unlock()
 	// Create snapshot of current data
 	snapshotLSN := s.replicator.GetHighestTimestamp()
 	iterator, err := s.storageSnapshot.CreateSnapshotIterator()
 	if err != nil {
 		s.replicasMutex.Lock()
 		replica.Status = transport.StatusError
 		replica.Error = err
 		s.replicasMutex.Unlock()
 		return status.Errorf(codes.Internal, "failed to create snapshot: %v", err)
 	}
 	defer iterator.Close()
 	// Stream key-value pairs in batches
 	batchSize := 100 // Can be configurable
 	totalCount := s.storageSnapshot.KeyCount()
 	sentCount := 0
 	batch := make([]*kevo.KeyValuePair, 0, batchSize)
 	for {
 		// Get next key-value pair
 		key, value, err := iterator.Next()
 		if err == io.EOF {
 			break
 		}
 		if err != nil {
 			s.replicasMutex.Lock()
 			replica.Status = transport.StatusError
 			replica.Error = err
 			s.replicasMutex.Unlock()
 			return status.Errorf(codes.Internal, "error reading snapshot: %v", err)
 		}
 		// Add to batch
 		batch = append(batch, &kevo.KeyValuePair{
 			Key:   key,
 			Value: value,
 		})
 		// Send batch if full
 		if len(batch) >= batchSize {
 			progress := float32(sentCount) / float32(totalCount)
 			if err := stream.Send(&kevo.BootstrapBatch{
 				Pairs:       batch,
 				Progress:    progress,
 				IsLast:      false,
 				SnapshotLsn: snapshotLSN,
 			}); err != nil {
 				return err
 			}
 			// Reset batch and update count
 			sentCount += len(batch)
 			batch = batch[:0]
 		}
 	}
 	// Send final batch
 	if len(batch) > 0 {
 		sentCount += len(batch)
 		progress := float32(sentCount) / float32(totalCount)
 		if err := stream.Send(&kevo.BootstrapBatch{
 			Pairs:       batch,
 			Progress:    progress,
 			IsLast:      true,
 			SnapshotLsn: snapshotLSN,
 		}); err != nil {
 			return err
 		}
 	} else if sentCount > 0 {
 		// Send empty final batch to mark the end
 		if err := stream.Send(&kevo.BootstrapBatch{
 			Pairs:       []*kevo.KeyValuePair{},
 			Progress:    1.0,
 			IsLast:      true,
 			SnapshotLsn: snapshotLSN,
 		}); err != nil {
 			return err
 		}
 	}
 	// Update replica status
 	s.replicasMutex.Lock()
 	replica.Status = transport.StatusSyncing
 	replica.CurrentLSN = snapshotLSN
 	s.replicasMutex.Unlock()
 	return nil
 }
 // Helper to convert replica info to proto message
 func convertReplicaInfoToProto(replica *transport.ReplicaInfo) *kevo.ReplicaInfo {
@ -657,12 +532,12 @@ func convertReplicaInfoToProto(replica *transport.ReplicaInfo) *kevo.ReplicaInfo
 	// Create proto message
 	pbReplica := &kevo.ReplicaInfo{
-		ReplicaId:        replica.ID,
+		ReplicaId:       replica.ID,
-		Address:          replica.Address,
+		Address:         replica.Address,
-		Role:             pbRole,
+		Role:            pbRole,
-		Status:           pbStatus,
+		Status:          pbStatus,
-		LastSeenMs:       replica.LastSeen.UnixMilli(),
+		LastSeenMs:      replica.LastSeen.UnixMilli(),
-		CurrentLsn:       replica.CurrentLSN,
+		CurrentLsn:      replica.CurrentLSN,
 		ReplicationLagMs: replica.ReplicationLag.Milliseconds(),
 	}
@ -676,60 +551,14 @@ func convertReplicaInfoToProto(replica *transport.ReplicaInfo) *kevo.ReplicaInfo
 // Convert WAL entry to proto message
 func convertWALEntryToProto(entry *wal.Entry) *kevo.WALEntry {
-	pbEntry := &kevo.WALEntry{
+	return &kevo.WALEntry{
 		SequenceNumber: entry.SequenceNumber,
 		Type:           uint32(entry.Type),
 		Key:            entry.Key,
 		Value:          entry.Value,
 		// We'd normally calculate a checksum here
 		Checksum:       nil,
 	}
 	// Calculate checksum for data integrity
 	pbEntry.Checksum = calculateEntryChecksum(pbEntry)
 	return pbEntry
 }
 // calculateEntryChecksum calculates a CRC32 checksum for a WAL entry
 func calculateEntryChecksum(entry *kevo.WALEntry) []byte {
 	// Create a checksum calculator
 	hasher := crc32.NewIEEE()
 	// Write all fields to the hasher
 	binary.Write(hasher, binary.LittleEndian, entry.SequenceNumber)
 	binary.Write(hasher, binary.LittleEndian, entry.Type)
 	hasher.Write(entry.Key)
 	if entry.Value != nil {
 		hasher.Write(entry.Value)
 	}
 	// Return the checksum as a byte slice
 	checksum := make([]byte, 4)
 	binary.LittleEndian.PutUint32(checksum, hasher.Sum32())
 	return checksum
 }
 // calculateBatchChecksum calculates a CRC32 checksum for a WAL entry batch
 func calculateBatchChecksum(batch *kevo.WALEntryBatch) []byte {
 	// Create a checksum calculator
 	hasher := crc32.NewIEEE()
 	// Write batch metadata to the hasher
 	binary.Write(hasher, binary.LittleEndian, batch.FirstLsn)
 	binary.Write(hasher, binary.LittleEndian, batch.LastLsn)
 	binary.Write(hasher, binary.LittleEndian, batch.Count)
 	// Write the checksum of each entry to the hasher
 	for _, entry := range batch.Entries {
 		// We're using entry checksums as part of the batch checksum
 		// to avoid recalculating entry data
 		if entry.Checksum != nil {
 			hasher.Write(entry.Checksum)
 		}
 	}
 	// Return the checksum as a byte slice
 	checksum := make([]byte, 4)
 	binary.LittleEndian.PutUint32(checksum, hasher.Sum32())
 	return checksum
 }
 // entryNotifier is a helper struct that implements replication.EntryProcessor
@ -779,134 +608,3 @@ type SnapshotIterator interface {
 	// Close closes the iterator
 	Close() error
 }
 // IsReplicaStale checks if a replica is considered stale based on the last heartbeat
 func (s *ReplicationServiceServer) IsReplicaStale(replicaID string, threshold time.Duration) bool {
 	s.replicasMutex.RLock()
 	defer s.replicasMutex.RUnlock()
 	replica, exists := s.replicas[replicaID]
 	if !exists {
 		return true // Consider non-existent replicas as stale
 	}
 	// Check if the last seen time is older than the threshold
 	return time.Since(replica.LastSeen) > threshold
 }
 // DetectStaleReplicas finds all replicas that haven't sent a heartbeat within the threshold
 func (s *ReplicationServiceServer) DetectStaleReplicas(threshold time.Duration) []string {
 	s.replicasMutex.RLock()
 	defer s.replicasMutex.RUnlock()
 	staleReplicas := make([]string, 0)
 	now := time.Now()
 	for id, replica := range s.replicas {
 		if now.Sub(replica.LastSeen) > threshold {
 			staleReplicas = append(staleReplicas, id)
 		}
 	}
 	return staleReplicas
 }
 // GetMetrics returns the current replication metrics
 func (s *ReplicationServiceServer) GetMetrics() map[string]interface{} {
 	if s.metrics == nil {
 		return map[string]interface{}{
 			"error": "metrics collection is not enabled",
 		}
 	}
 	// Get summary metrics
 	summary := s.metrics.GetSummaryMetrics()
 	// Add replica-specific metrics
 	replicaMetrics := s.metrics.GetAllReplicaMetrics()
 	replicasData := make(map[string]interface{})
 	for id, metrics := range replicaMetrics {
 		replicaData := map[string]interface{}{
 			"status":             string(metrics.Status),
 			"last_seen":          metrics.LastSeen.Format(time.RFC3339),
 			"replication_lag_ms": metrics.ReplicationLag.Milliseconds(),
 			"applied_lsn":        metrics.AppliedLSN,
 			"connected_duration": metrics.ConnectedDuration.String(),
 			"heartbeat_count":    metrics.HeartbeatCount,
 			"wal_entries_sent":   metrics.WALEntriesSent,
 			"bytes_sent":         metrics.BytesSent,
 			"error_count":        metrics.ErrorCount,
 		}
 		// Add bootstrap metrics if available
 		replicaData["bootstrap_count"] = metrics.BootstrapCount
 		if !metrics.LastBootstrapTime.IsZero() {
 			replicaData["last_bootstrap_time"] = metrics.LastBootstrapTime.Format(time.RFC3339)
 			replicaData["last_bootstrap_duration"] = metrics.LastBootstrapDuration.String()
 		}
 		replicasData[id] = replicaData
 	}
 	summary["replicas"] = replicasData
 	// Add bootstrap service status if available
 	if s.bootstrapService != nil {
 		summary["bootstrap"] = s.bootstrapService.getBootstrapStatus()
 	}
 	return summary
 }
 // GetReplicaMetrics returns metrics for a specific replica
 func (s *ReplicationServiceServer) GetReplicaMetrics(replicaID string) (map[string]interface{}, error) {
 	if s.metrics == nil {
 		return nil, fmt.Errorf("metrics collection is not enabled")
 	}
 	metrics, found := s.metrics.GetReplicaMetrics(replicaID)
 	if !found {
 		return nil, fmt.Errorf("no metrics found for replica %s", replicaID)
 	}
 	result := map[string]interface{}{
 		"status":             string(metrics.Status),
 		"last_seen":          metrics.LastSeen.Format(time.RFC3339),
 		"replication_lag_ms": metrics.ReplicationLag.Milliseconds(),
 		"applied_lsn":        metrics.AppliedLSN,
 		"connected_duration": metrics.ConnectedDuration.String(),
 		"heartbeat_count":    metrics.HeartbeatCount,
 		"wal_entries_sent":   metrics.WALEntriesSent,
 		"bytes_sent":         metrics.BytesSent,
 		"error_count":        metrics.ErrorCount,
 		"bootstrap_count":    metrics.BootstrapCount,
 	}
 	// Add bootstrap time/duration if available
 	if !metrics.LastBootstrapTime.IsZero() {
 		result["last_bootstrap_time"] = metrics.LastBootstrapTime.Format(time.RFC3339)
 		result["last_bootstrap_duration"] = metrics.LastBootstrapDuration.String()
 	}
 	// Add bootstrap progress if available
 	if s.bootstrapService != nil {
 		bootstrapStatus := s.bootstrapService.getBootstrapStatus()
 		if bootstrapStatus != nil {
 			if bootstrapState, ok := bootstrapStatus["bootstrap_state"].(map[string]interface{}); ok {
 				if bootstrapState["replica_id"] == replicaID {
 					result["bootstrap_progress"] = bootstrapState["progress"]
 					result["bootstrap_status"] = map[string]interface{}{
 						"started_at":   bootstrapState["started_at"],
 						"completed":    bootstrapState["completed"],
 						"applied_keys": bootstrapState["applied_keys"],
 						"total_keys":   bootstrapState["total_keys"],
 						"snapshot_lsn": bootstrapState["snapshot_lsn"],
 					}
 				}
 			}
 		}
 	}
 	return result, nil
 }
--- a/pkg/grpc/service/replication_service_bootstrap.go
+++ b/pkg/grpc/service/replication_service_bootstrap.go
@ -1,302 +0,0 @@
 package service
 import (
 	"fmt"
 	"io"
 	"time"
 	"github.com/KevoDB/kevo/pkg/replication"
 	"github.com/KevoDB/kevo/pkg/transport"
 	"github.com/KevoDB/kevo/proto/kevo"
 	"google.golang.org/grpc/codes"
 	"google.golang.org/grpc/metadata"
 	"google.golang.org/grpc/status"
 )
 // InitBootstrapService initializes the bootstrap service component
 func (s *ReplicationServiceServer) InitBootstrapService(options *BootstrapServiceOptions) error {
 	// Get the storage snapshot provider from the storage snapshot
 	var snapshotProvider replication.StorageSnapshotProvider
 	if s.storageSnapshot != nil {
 		// If we have a storage snapshot directly, create an adapter
 		snapshotProvider = &storageSnapshotAdapter{
 			snapshot: s.storageSnapshot,
 		}
 	}
 	// Create the bootstrap service
 	bootstrapSvc, err := newBootstrapService(
 		options,
 		snapshotProvider,
 		s.replicator,
 		s.applier,
 	)
 	if err != nil {
 		return fmt.Errorf("failed to initialize bootstrap service: %w", err)
 	}
 	s.bootstrapService = bootstrapSvc
 	return nil
 }
 // RequestBootstrap handles bootstrap requests from replicas
 func (s *ReplicationServiceServer) RequestBootstrap(
 	req *kevo.BootstrapRequest,
 	stream kevo.ReplicationService_RequestBootstrapServer,
 ) error {
 	// Validate request
 	if req.ReplicaId == "" {
 		return status.Error(codes.InvalidArgument, "replica_id is required")
 	}
 	// Check if replica is registered
 	s.replicasMutex.RLock()
 	replica, exists := s.replicas[req.ReplicaId]
 	s.replicasMutex.RUnlock()
 	if !exists {
 		return status.Error(codes.NotFound, "replica not registered")
 	}
 	// Check access control if enabled
 	if s.accessControl.IsEnabled() {
 		md, ok := metadata.FromIncomingContext(stream.Context())
 		if !ok {
 			return status.Error(codes.Unauthenticated, "missing authentication metadata")
 		}
 		tokens := md.Get("x-replica-token")
 		token := ""
 		if len(tokens) > 0 {
 			token = tokens[0]
 		}
 		if err := s.accessControl.AuthenticateReplica(req.ReplicaId, token); err != nil {
 			return status.Error(codes.Unauthenticated, "authentication failed")
 		}
 		// Bootstrap requires at least read access
 		if err := s.accessControl.AuthorizeReplicaAction(req.ReplicaId, transport.AccessReadOnly); err != nil {
 			return status.Error(codes.PermissionDenied, "not authorized for bootstrap")
 		}
 	}
 	// Update replica status
 	s.replicasMutex.Lock()
 	replica.Status = transport.StatusBootstrapping
 	s.replicasMutex.Unlock()
 	// Update metrics
 	if s.metrics != nil {
 		s.metrics.UpdateReplicaStatus(req.ReplicaId, replica.Status, replica.CurrentLSN)
 		// We'll add bootstrap count metrics in the future
 	}
 	// Pass the request to the bootstrap service
 	if s.bootstrapService == nil {
 		// If bootstrap service isn't initialized, use the old implementation
 		return s.legacyRequestBootstrap(req, stream)
 	}
 	err := s.bootstrapService.handleBootstrapRequest(req, stream)
 	// Update replica status based on the result
 	s.replicasMutex.Lock()
 	if err != nil {
 		replica.Status = transport.StatusError
 		replica.Error = err
 	} else {
 		replica.Status = transport.StatusSyncing
 		// Get the snapshot LSN
 		snapshot := s.bootstrapService.getBootstrapStatus()
 		if activeBootstraps, ok := snapshot["active_bootstraps"].(map[string]map[string]interface{}); ok {
 			if replicaInfo, ok := activeBootstraps[req.ReplicaId]; ok {
 				if snapshotLSN, ok := replicaInfo["snapshot_lsn"].(uint64); ok {
 					replica.CurrentLSN = snapshotLSN
 				}
 			}
 		}
 	}
 	s.replicasMutex.Unlock()
 	// Update metrics
 	if s.metrics != nil {
 		s.metrics.UpdateReplicaStatus(req.ReplicaId, replica.Status, replica.CurrentLSN)
 	}
 	return err
 }
 // legacyRequestBootstrap is the original bootstrap implementation, kept for compatibility
 func (s *ReplicationServiceServer) legacyRequestBootstrap(
 	req *kevo.BootstrapRequest,
 	stream kevo.ReplicationService_RequestBootstrapServer,
 ) error {
 	// Update replica status
 	s.replicasMutex.Lock()
 	replica, exists := s.replicas[req.ReplicaId]
 	if exists {
 		replica.Status = transport.StatusBootstrapping
 	}
 	s.replicasMutex.Unlock()
 	// Create snapshot of current data
 	snapshotLSN := s.replicator.GetHighestTimestamp()
 	iterator, err := s.storageSnapshot.CreateSnapshotIterator()
 	if err != nil {
 		s.replicasMutex.Lock()
 		if replica != nil {
 			replica.Status = transport.StatusError
 			replica.Error = err
 		}
 		s.replicasMutex.Unlock()
 		return status.Errorf(codes.Internal, "failed to create snapshot: %v", err)
 	}
 	defer iterator.Close()
 	// Stream key-value pairs in batches
 	batchSize := 100 // Can be configurable
 	totalCount := s.storageSnapshot.KeyCount()
 	sentCount := 0
 	batch := make([]*kevo.KeyValuePair, 0, batchSize)
 	for {
 		// Get next key-value pair
 		key, value, err := iterator.Next()
 		if err == io.EOF {
 			break
 		}
 		if err != nil {
 			s.replicasMutex.Lock()
 			if replica != nil {
 				replica.Status = transport.StatusError
 				replica.Error = err
 			}
 			s.replicasMutex.Unlock()
 			return status.Errorf(codes.Internal, "error reading snapshot: %v", err)
 		}
 		// Add to batch
 		batch = append(batch, &kevo.KeyValuePair{
 			Key:   key,
 			Value: value,
 		})
 		// Send batch if full
 		if len(batch) >= batchSize {
 			progress := float32(sentCount) / float32(totalCount)
 			if err := stream.Send(&kevo.BootstrapBatch{
 				Pairs:       batch,
 				Progress:    progress,
 				IsLast:      false,
 				SnapshotLsn: snapshotLSN,
 			}); err != nil {
 				return err
 			}
 			// Reset batch and update count
 			sentCount += len(batch)
 			batch = batch[:0]
 		}
 	}
 	// Send final batch
 	if len(batch) > 0 {
 		sentCount += len(batch)
 		progress := float32(sentCount) / float32(totalCount)
 		if err := stream.Send(&kevo.BootstrapBatch{
 			Pairs:       batch,
 			Progress:    progress,
 			IsLast:      true,
 			SnapshotLsn: snapshotLSN,
 		}); err != nil {
 			return err
 		}
 	} else if sentCount > 0 {
 		// Send empty final batch to mark the end
 		if err := stream.Send(&kevo.BootstrapBatch{
 			Pairs:       []*kevo.KeyValuePair{},
 			Progress:    1.0,
 			IsLast:      true,
 			SnapshotLsn: snapshotLSN,
 		}); err != nil {
 			return err
 		}
 	}
 	// Update replica status
 	s.replicasMutex.Lock()
 	if replica != nil {
 		replica.Status = transport.StatusSyncing
 		replica.CurrentLSN = snapshotLSN
 	}
 	s.replicasMutex.Unlock()
 	// Update metrics
 	if s.metrics != nil {
 		s.metrics.UpdateReplicaStatus(req.ReplicaId, transport.StatusSyncing, snapshotLSN)
 	}
 	return nil
 }
 // GetBootstrapStatusMap retrieves the current status of bootstrap operations as a map
 func (s *ReplicationServiceServer) GetBootstrapStatusMap() map[string]string {
 	// If bootstrap service isn't initialized, return empty status
 	if s.bootstrapService == nil {
 		return map[string]string{
 			"message": "bootstrap service not initialized",
 		}
 	}
 	// Get bootstrap status from the service
 	status := s.bootstrapService.getBootstrapStatus()
 	// Convert to proto-friendly format
 	protoStatus := make(map[string]string)
 	convertStatusToString(status, protoStatus, "")
 	return protoStatus
 }
 // Helper function to convert nested status map to flat string map for proto
 func convertStatusToString(input map[string]interface{}, output map[string]string, prefix string) {
 	for k, v := range input {
 		key := k
 		if prefix != "" {
 			key = prefix + "." + k
 		}
 		switch val := v.(type) {
 		case string:
 			output[key] = val
 		case int, int64, uint64, float64, bool:
 			output[key] = fmt.Sprintf("%v", val)
 		case map[string]interface{}:
 			convertStatusToString(val, output, key)
 		case []interface{}:
 			for i, item := range val {
 				itemKey := fmt.Sprintf("%s[%d]", key, i)
 				if m, ok := item.(map[string]interface{}); ok {
 					convertStatusToString(m, output, itemKey)
 				} else {
 					output[itemKey] = fmt.Sprintf("%v", item)
 				}
 			}
 		case time.Time:
 			output[key] = val.Format(time.RFC3339)
 		default:
 			output[key] = fmt.Sprintf("%v", val)
 		}
 	}
 }
 // storageSnapshotAdapter adapts StorageSnapshot to StorageSnapshotProvider
 type storageSnapshotAdapter struct {
 	snapshot replication.StorageSnapshot
 }
 func (a *storageSnapshotAdapter) CreateSnapshot() (replication.StorageSnapshot, error) {
 	return a.snapshot, nil
 }
--- a/pkg/grpc/service/test_helpers.go
+++ b/pkg/grpc/service/test_helpers.go
@ -1,28 +0,0 @@
 package service
 import (
 	"github.com/KevoDB/kevo/pkg/replication"
 	"github.com/KevoDB/kevo/pkg/wal"
 )
 // For testing purposes, we need our mocks to be convertible to WALReplicator
 // The issue is that the WALReplicator has unexported fields, so we can't just embed it
 // Let's create a clean test implementation of the replication.WALReplicator interface
 // CreateTestReplicator creates a replication.WALReplicator for tests
 func CreateTestReplicator(highTS uint64) *replication.WALReplicator {
 	return &replication.WALReplicator{}
 }
 // Cast mock storage snapshot
 func castToStorageSnapshot(s interface {
 	CreateSnapshotIterator() (replication.SnapshotIterator, error)
 	KeyCount() int64
 }) replication.StorageSnapshot {
 	return s.(replication.StorageSnapshot)
 }
 // MockGetEntriesAfter implements mocking for WAL replicator GetEntriesAfter
 func MockGetEntriesAfter(position replication.ReplicationPosition) ([]*wal.Entry, error) {
 	return nil, nil
 }
--- a/pkg/grpc/transport/reconnect.go
+++ b/pkg/grpc/transport/reconnect.go
@ -1,152 +0,0 @@
 package transport
 import (
 	"context"
 	"math"
 	"time"
 	"github.com/KevoDB/kevo/pkg/transport"
 )
 // reconnectLoop continuously attempts to reconnect the client
 func (c *ReplicationGRPCClient) reconnectLoop(initialDelay time.Duration) {
 	// If we're shutting down, don't attempt to reconnect
 	if c.shuttingDown {
 		return
 	}
 	// Start with initial delay
 	delay := initialDelay
 	// Reset reconnect attempt counter on first try
 	c.reconnectAttempt = 0
 	for {
 		// Check if we're shutting down
 		if c.shuttingDown {
 			return
 		}
 		// Wait for the delay
 		time.Sleep(delay)
 		// Attempt to reconnect
 		c.reconnectAttempt++
 		maxAttempts := c.options.RetryPolicy.MaxRetries
 		c.logger.Info("Attempting to reconnect (%d/%d)", c.reconnectAttempt, maxAttempts)
 		// Create context with timeout
 		ctx, cancel := context.WithTimeout(context.Background(), c.options.Timeout)
 		// Attempt connection
 		err := c.Connect(ctx)
 		cancel()
 		if err == nil {
 			// Connection successful
 			c.logger.Info("Successfully reconnected after %d attempts", c.reconnectAttempt)
 			// Reset circuit breaker
 			c.circuitBreaker.Reset()
 			// Register with primary if we have a replica ID
 			if c.replicaID != "" {
 				ctx, cancel := context.WithTimeout(context.Background(), c.options.Timeout)
 				defer cancel()
 				err := c.RegisterAsReplica(ctx, c.replicaID)
 				if err != nil {
 					c.logger.Error("Failed to re-register as replica: %v", err)
 				} else {
 					c.logger.Info("Successfully re-registered as replica %s", c.replicaID)
 				}
 			}
 			return
 		}
 		// Log the reconnection failure
 		c.logger.Error("Failed to reconnect (attempt %d/%d): %v",
 			c.reconnectAttempt, maxAttempts, err)
 		// Check if we've exceeded the maximum number of reconnection attempts
 		if maxAttempts > 0 && c.reconnectAttempt >= maxAttempts {
 			c.logger.Error("Maximum reconnection attempts (%d) exceeded", maxAttempts)
 			// Trip the circuit breaker to prevent further attempts for a while
 			c.circuitBreaker.Trip()
 			return
 		}
 		// Increase delay for next attempt (with jitter)
 		delay = calculateBackoff(c.reconnectAttempt, c.options.RetryPolicy)
 	}
 }
 // calculateBackoff calculates the backoff duration for the next reconnection attempt
 func calculateBackoff(attempt int, policy transport.RetryPolicy) time.Duration {
 	// Calculate base backoff using exponential formula
 	backoff := float64(policy.InitialBackoff) *
 		math.Pow(2, float64(attempt-1)) // 2^(attempt-1)
 	// Apply backoff factor if specified
 	if policy.BackoffFactor > 0 {
 		backoff *= policy.BackoffFactor
 	}
 	// Apply jitter if specified
 	if policy.Jitter > 0 {
 		jitter := 1.0 - policy.Jitter/2 + policy.Jitter*float64(time.Now().UnixNano()%1000)/1000.0
 		backoff *= jitter
 	}
 	// Cap at max backoff
 	if policy.MaxBackoff > 0 && time.Duration(backoff) > policy.MaxBackoff {
 		return policy.MaxBackoff
 	}
 	return time.Duration(backoff)
 }
 // maybeReconnect checks if the connection is alive, and starts a reconnection
 // loop if it's not
 func (c *ReplicationGRPCClient) maybeReconnect() {
 	// Check if we're connected
 	if c.IsConnected() {
 		return
 	}
 	// Check if the circuit breaker is open
 	if c.circuitBreaker.IsOpen() {
 		c.logger.Warn("Circuit breaker is open, not attempting to reconnect")
 		return
 	}
 	// Start reconnection loop in a new goroutine
 	go c.reconnectLoop(c.options.RetryPolicy.InitialBackoff)
 }
 // handleConnectionError processes a connection error and triggers reconnection if needed
 func (c *ReplicationGRPCClient) handleConnectionError(err error) error {
 	if err == nil {
 		return nil
 	}
 	// Update status
 	c.mu.Lock()
 	c.status.LastError = err
 	wasConnected := c.status.Connected
 	c.status.Connected = false
 	c.mu.Unlock()
 	// Log the error
 	c.logger.Error("Connection error: %v", err)
 	// Check if we should attempt to reconnect
 	if wasConnected && !c.shuttingDown {
 		c.logger.Info("Connection lost, attempting to reconnect")
 		go c.reconnectLoop(c.options.RetryPolicy.InitialBackoff)
 	}
 	return err
 }
--- a/pkg/grpc/transport/reconnect_test.go
+++ b/pkg/grpc/transport/reconnect_test.go
@ -1,255 +0,0 @@
 package transport
 import (
 	"errors"
 	"sync/atomic"
 	"testing"
 	"time"
 	"github.com/KevoDB/kevo/pkg/common/log"
 	"github.com/KevoDB/kevo/pkg/transport"
 )
 func TestCalculateBackoff(t *testing.T) {
 	policy := transport.RetryPolicy{
 		InitialBackoff: 100 * time.Millisecond,
 		MaxBackoff:     5 * time.Second,
 		BackoffFactor:  2.0,
 		Jitter:         0.0, // Disable jitter for deterministic tests
 	}
 	tests := []struct {
 		name          string
 		attempt       int
 		expectedRange [2]time.Duration // Min and max expected duration
 	}{
 		{
 			name:          "First attempt",
 			attempt:       1,
 			expectedRange: [2]time.Duration{100 * time.Millisecond, 200 * time.Millisecond},
 		},
 		{
 			name:          "Second attempt",
 			attempt:       2,
 			expectedRange: [2]time.Duration{200 * time.Millisecond, 400 * time.Millisecond},
 		},
 		{
 			name:          "Third attempt",
 			attempt:       3,
 			expectedRange: [2]time.Duration{400 * time.Millisecond, 800 * time.Millisecond},
 		},
 		{
 			name:          "Tenth attempt",
 			attempt:       10,
 			expectedRange: [2]time.Duration{5 * time.Second, 5 * time.Second}, // Capped at max
 		},
 	}
 	for _, tt := range tests {
 		t.Run(tt.name, func(t *testing.T) {
 			backoff := calculateBackoff(tt.attempt, policy)
 			if backoff < tt.expectedRange[0] || backoff > tt.expectedRange[1] {
 				t.Errorf("Expected backoff between %v and %v, got %v",
 					tt.expectedRange[0], tt.expectedRange[1], backoff)
 			}
 		})
 	}
 	// Test with jitter
 	t.Run("With jitter", func(t *testing.T) {
 		jitterPolicy := transport.RetryPolicy{
 			InitialBackoff: 100 * time.Millisecond,
 			MaxBackoff:     5 * time.Second,
 			BackoffFactor:  2.0,
 			Jitter:         0.5, // 50% jitter
 		}
 		// Run multiple times to check for variation
 		var values []time.Duration
 		for i := 0; i < 10; i++ {
 			values = append(values, calculateBackoff(2, jitterPolicy))
 		}
 		// Check if we have at least some variation (jitter is working)
 		allSame := true
 		for i := 1; i < len(values); i++ {
 			if values[i] != values[0] {
 				allSame = false
 				break
 			}
 		}
 		if allSame {
 			t.Error("Expected variation with jitter enabled, but all values are the same")
 		}
 	})
 }
 // mockClient is a standalone struct for testing that doesn't rely on the reconnectLoop method
 type mockClient struct {
 	logger          log.Logger
 	circuitBreaker  *transport.CircuitBreaker
 	status          transport.TransportStatus
 	options         transport.TransportOptions
 	shuttingDown    bool
 	reconnectCalled atomic.Bool
 }
 // handleConnectionError is a copy of the real implementation but uses reconnectCalled instead
 func (c *mockClient) handleConnectionError(err error) error {
 	if err == nil {
 		return nil
 	}
 	// Update status
 	c.status.LastError = err
 	wasConnected := c.status.Connected
 	c.status.Connected = false
 	// Log the error
 	c.logger.Error("Connection error: %v", err)
 	// Check if we should attempt to reconnect
 	if wasConnected && !c.shuttingDown {
 		c.logger.Info("Connection lost, attempting to reconnect")
 		// Instead of calling reconnectLoop, set the flag
 		c.reconnectCalled.Store(true)
 	}
 	return err
 }
 // maybeReconnect is a copy of the real implementation but uses reconnectCalled instead
 func (c *mockClient) maybeReconnect() {
 	// Check if we're connected
 	if c.status.Connected {
 		return
 	}
 	// Check if the circuit breaker is open
 	if c.circuitBreaker.IsOpen() {
 		c.logger.Warn("Circuit breaker is open, not attempting to reconnect")
 		return
 	}
 	// Mark that reconnect was called
 	c.reconnectCalled.Store(true)
 }
 // IsConnected returns whether the client is connected
 func (c *mockClient) IsConnected() bool {
 	return c.status.Connected
 }
 func TestHandleConnectionError(t *testing.T) {
 	// Create a mock client
 	client := &mockClient{
 		logger:         log.NewStandardLogger(),
 		circuitBreaker: transport.NewCircuitBreaker(3, 100*time.Millisecond),
 		status: transport.TransportStatus{
 			Connected: true,
 		},
 		options: transport.TransportOptions{
 			RetryPolicy: transport.RetryPolicy{
 				InitialBackoff: 1 * time.Millisecond,
 				MaxBackoff:     10 * time.Millisecond,
 				MaxRetries:     2,
 			},
 		},
 	}
 	// Test with a connection error
 	testErr := errors.New("test connection error")
 	result := client.handleConnectionError(testErr)
 	// Check results
 	if result != testErr {
 		t.Errorf("Expected error to be returned, got: %v", result)
 	}
 	if client.status.Connected {
 		t.Error("Expected connected status to be false")
 	}
 	if client.status.LastError != testErr {
 		t.Errorf("Expected LastError to be set, got: %v", client.status.LastError)
 	}
 	// Check if reconnect was attempted
 	if !client.reconnectCalled.Load() {
 		t.Error("Expected reconnect to be attempted")
 	}
 	// Test with nil error
 	client.reconnectCalled.Store(false)
 	result = client.handleConnectionError(nil)
 	if result != nil {
 		t.Errorf("Expected nil error to be returned, got: %v", result)
 	}
 	if client.reconnectCalled.Load() {
 		t.Error("Expected no reconnect attempt for nil error")
 	}
 }
 func TestMaybeReconnect(t *testing.T) {
 	// Test case 1: Already connected
 	t.Run("Already connected", func(t *testing.T) {
 		client := &mockClient{
 			logger:         log.NewStandardLogger(),
 			circuitBreaker: transport.NewCircuitBreaker(3, 100*time.Millisecond),
 			status: transport.TransportStatus{
 				Connected: true,
 			},
 		}
 		client.maybeReconnect()
 		if client.reconnectCalled.Load() {
 			t.Error("Expected no reconnect attempt when already connected")
 		}
 	})
 	// Test case 2: Not connected but circuit breaker open
 	t.Run("Circuit breaker open", func(t *testing.T) {
 		client := &mockClient{
 			logger:         log.NewStandardLogger(),
 			circuitBreaker: transport.NewCircuitBreaker(3, 100*time.Millisecond),
 			status: transport.TransportStatus{
 				Connected: false,
 			},
 		}
 		// Trip the circuit breaker
 		client.circuitBreaker.Trip()
 		client.maybeReconnect()
 		if client.reconnectCalled.Load() {
 			t.Error("Expected no reconnect attempt when circuit breaker is open")
 		}
 	})
 	// Test case 3: Not connected and circuit breaker closed
 	t.Run("Not connected, circuit closed", func(t *testing.T) {
 		client := &mockClient{
 			logger:         log.NewStandardLogger(),
 			circuitBreaker: transport.NewCircuitBreaker(3, 100*time.Millisecond),
 			status: transport.TransportStatus{
 				Connected: false,
 			},
 			options: transport.TransportOptions{
 				RetryPolicy: transport.RetryPolicy{
 					InitialBackoff: 1 * time.Millisecond,
 				},
 			},
 		}
 		client.maybeReconnect()
 		if !client.reconnectCalled.Load() {
 			t.Error("Expected reconnect attempt when not connected and circuit breaker closed")
 		}
 	})
 }
--- a/pkg/grpc/transport/replication_client.go
+++ b/pkg/grpc/transport/replication_client.go
--- a/pkg/grpc/transport/replication_server.go
+++ b/pkg/grpc/transport/replication_server.go
@ -12,43 +12,35 @@ import (
 // ReplicationGRPCServer implements the ReplicationServer interface using gRPC
 type ReplicationGRPCServer struct {
-	transportManager   *GRPCTransportManager
+	transportManager *GRPCTransportManager
 	replicationService *service.ReplicationServiceServer
-	options            transport.TransportOptions
+	options         transport.TransportOptions
-	replicas           map[string]*transport.ReplicaInfo
+	replicas        map[string]*transport.ReplicaInfo
-	mu                 sync.RWMutex
+	mu              sync.RWMutex
 }
 // NewReplicationGRPCServer creates a new ReplicationGRPCServer
 func NewReplicationGRPCServer(
 	transportManager *GRPCTransportManager,
-	replicator replication.EntryReplicator,
+	replicator *replication.WALReplicator,
-	applier replication.EntryApplier,
+	applier *replication.WALApplier,
 	serializer *replication.EntrySerializer,
 	storageSnapshot replication.StorageSnapshot,
 	options transport.TransportOptions,
 ) (*ReplicationGRPCServer, error) {
 	// Create replication service options with default settings
 	serviceOptions := service.DefaultReplicationServiceOptions()
 	// Create replication service
-	replicationService, err := service.NewReplicationService(
+	replicationService := service.NewReplicationService(
 		replicator,
 		applier,
 		serializer,
 		storageSnapshot,
 		serviceOptions,
 	)
 	if err != nil {
 		return nil, fmt.Errorf("failed to create replication service: %w", err)
 	}
 	return &ReplicationGRPCServer{
-		transportManager:   transportManager,
+		transportManager:    transportManager,
-		replicationService: replicationService,
+		replicationService:  replicationService,
-		options:            options,
+		options:             options,
-		replicas:           make(map[string]*transport.ReplicaInfo),
+		replicas:            make(map[string]*transport.ReplicaInfo),
 	}, nil
 }
@ -193,29 +185,16 @@ func init() {
 // WithReplicator adds a replicator to the replication server
 func (s *ReplicationGRPCServer) WithReplicator(
-	replicator replication.EntryReplicator,
+	replicator *replication.WALReplicator,
-	applier replication.EntryApplier,
+	applier *replication.WALApplier,
 	serializer *replication.EntrySerializer,
 	storageSnapshot replication.StorageSnapshot,
 ) *ReplicationGRPCServer {
-	// Create replication service options with default settings
+	s.replicationService = service.NewReplicationService(
 	serviceOptions := service.DefaultReplicationServiceOptions()
 	// Create replication service
 	replicationService, err := service.NewReplicationService(
 		replicator,
 		applier,
 		serializer,
 		storageSnapshot,
 		serviceOptions,
 	)
 	if err != nil {
 		// Log error but continue with nil service
 		fmt.Printf("Error creating replication service: %v\n", err)
 		return s
 	}
 	s.replicationService = replicationService
 	return s
 }
--- a/pkg/replication/applier_test.go
+++ b/pkg/replication/applier_test.go
@ -11,15 +11,15 @@ import (
 // MockStorage implements a simple mock storage for testing
 type MockStorage struct {
-	mu            sync.Mutex
+	mu             sync.Mutex
-	data          map[string][]byte
+	data           map[string][]byte
-	putFail       bool
+	putFail        bool
-	deleteFail    bool
+	deleteFail     bool
-	putCount      int
+	putCount       int
-	deleteCount   int
+	deleteCount    int
-	lastPutKey    []byte
+	lastPutKey     []byte
-	lastPutValue  []byte
+	lastPutValue   []byte
-	lastDeleteKey []byte
+	lastDeleteKey  []byte
 }
 func NewMockStorage() *MockStorage {
@ -69,19 +69,17 @@ func (m *MockStorage) Delete(key []byte) error {
 }
 // Stub implementations for the rest of the interface
-func (m *MockStorage) Close() error                            { return nil }
+func (m *MockStorage) Close() error { return nil }
-func (m *MockStorage) IsDeleted(key []byte) (bool, error)      { return false, nil }
+func (m *MockStorage) IsDeleted(key []byte) (bool, error) { return false, nil }
 func (m *MockStorage) GetIterator() (iterator.Iterator, error) { return nil, nil }
-func (m *MockStorage) GetRangeIterator(startKey, endKey []byte) (iterator.Iterator, error) {
+func (m *MockStorage) GetRangeIterator(startKey, endKey []byte) (iterator.Iterator, error) { return nil, nil }
-	return nil, nil
+func (m *MockStorage) ApplyBatch(entries []*wal.Entry) error { return nil }
-}
+func (m *MockStorage) FlushMemTables() error { return nil }
-func (m *MockStorage) ApplyBatch(entries []*wal.Entry) error   { return nil }
+func (m *MockStorage) GetMemTableSize() uint64 { return 0 }
-func (m *MockStorage) FlushMemTables() error                   { return nil }
+func (m *MockStorage) IsFlushNeeded() bool { return false }
-func (m *MockStorage) GetMemTableSize() uint64                 { return 0 }
+func (m *MockStorage) GetSSTables() []string { return nil }
-func (m *MockStorage) IsFlushNeeded() bool                     { return false }
+func (m *MockStorage) ReloadSSTables() error { return nil }
-func (m *MockStorage) GetSSTables() []string                   { return nil }
+func (m *MockStorage) RotateWAL() error { return nil }
 func (m *MockStorage) ReloadSSTables() error                   { return nil }
 func (m *MockStorage) RotateWAL() error                        { return nil }
 func (m *MockStorage) GetStorageStats() map[string]interface{} { return nil }
 func TestWALApplierBasic(t *testing.T) {
--- a/pkg/replication/bootstrap.go
+++ b/pkg/replication/bootstrap.go
@ -1,421 +0,0 @@
 package replication
 import (
 	"encoding/json"
 	"errors"
 	"fmt"
 	"io"
 	"os"
 	"path/filepath"
 	"sync"
 	"time"
 	"github.com/KevoDB/kevo/pkg/common/log"
 	"github.com/KevoDB/kevo/pkg/transport"
 )
 var (
 	// ErrBootstrapInterrupted indicates the bootstrap process was interrupted
 	ErrBootstrapInterrupted = errors.New("bootstrap process was interrupted")
 	// ErrBootstrapFailed indicates the bootstrap process failed
 	ErrBootstrapFailed = errors.New("bootstrap process failed")
 )
 // BootstrapManager handles the bootstrap process for replicas
 type BootstrapManager struct {
 	// Storage-related components
 	storageApplier StorageApplier
 	walApplier     EntryApplier
 	// State tracking
 	bootstrapState     *BootstrapState
 	bootstrapStatePath string
 	snapshotLSN        uint64
 	// Mutex for synchronization
 	mu sync.RWMutex
 	// Logger instance
 	logger log.Logger
 }
 // StorageApplier defines an interface for applying key-value pairs to storage
 type StorageApplier interface {
 	// Apply applies a key-value pair to storage
 	Apply(key, value []byte) error
 	// ApplyBatch applies multiple key-value pairs to storage
 	ApplyBatch(pairs []KeyValuePair) error
 	// Flush ensures all applied changes are persisted
 	Flush() error
 }
 // BootstrapState tracks the state of an ongoing bootstrap operation
 type BootstrapState struct {
 	ReplicaID       string    `json:"replica_id"`
 	StartedAt       time.Time `json:"started_at"`
 	LastUpdatedAt   time.Time `json:"last_updated_at"`
 	SnapshotLSN     uint64    `json:"snapshot_lsn"`
 	AppliedKeys     int       `json:"applied_keys"`
 	TotalKeys       int       `json:"total_keys"`
 	Progress        float64   `json:"progress"`
 	Completed       bool      `json:"completed"`
 	Error           string    `json:"error,omitempty"`
 	CurrentChecksum uint32    `json:"current_checksum"`
 }
 // NewBootstrapManager creates a new bootstrap manager
 func NewBootstrapManager(
 	storageApplier StorageApplier,
 	walApplier EntryApplier,
 	dataDir string,
 	logger log.Logger,
 ) (*BootstrapManager, error) {
 	if logger == nil {
 		logger = log.GetDefaultLogger().WithField("component", "bootstrap_manager")
 	}
 	// Create bootstrap directory if it doesn't exist
 	bootstrapDir := filepath.Join(dataDir, "bootstrap")
 	if err := os.MkdirAll(bootstrapDir, 0755); err != nil {
 		return nil, fmt.Errorf("failed to create bootstrap directory: %w", err)
 	}
 	bootstrapStatePath := filepath.Join(bootstrapDir, "bootstrap_state.json")
 	manager := &BootstrapManager{
 		storageApplier:     storageApplier,
 		walApplier:         walApplier,
 		bootstrapStatePath: bootstrapStatePath,
 		logger:             logger,
 	}
 	// Try to load existing bootstrap state
 	state, err := manager.loadBootstrapState()
 	if err == nil && state != nil {
 		manager.bootstrapState = state
 		logger.Info("Loaded existing bootstrap state (progress: %.2f%%)", state.Progress*100)
 	}
 	return manager, nil
 }
 // loadBootstrapState loads the bootstrap state from disk
 func (m *BootstrapManager) loadBootstrapState() (*BootstrapState, error) {
 	// Check if the state file exists
 	if _, err := os.Stat(m.bootstrapStatePath); os.IsNotExist(err) {
 		return nil, nil
 	}
 	// Read and parse the state file
 	file, err := os.Open(m.bootstrapStatePath)
 	if err != nil {
 		return nil, err
 	}
 	defer file.Close()
 	var state BootstrapState
 	if err := readJSONFile(file, &state); err != nil {
 		return nil, err
 	}
 	return &state, nil
 }
 // saveBootstrapState saves the bootstrap state to disk
 func (m *BootstrapManager) saveBootstrapState() error {
 	m.mu.RLock()
 	state := m.bootstrapState
 	m.mu.RUnlock()
 	if state == nil {
 		return nil
 	}
 	// Update the last updated timestamp
 	state.LastUpdatedAt = time.Now()
 	// Create a temporary file
 	tempFile, err := os.CreateTemp(filepath.Dir(m.bootstrapStatePath), "bootstrap_state_*.json")
 	if err != nil {
 		return err
 	}
 	tempFilePath := tempFile.Name()
 	// Write state to the temporary file
 	if err := writeJSONFile(tempFile, state); err != nil {
 		tempFile.Close()
 		os.Remove(tempFilePath)
 		return err
 	}
 	// Close the temporary file
 	tempFile.Close()
 	// Atomically replace the state file
 	return os.Rename(tempFilePath, m.bootstrapStatePath)
 }
 // StartBootstrap begins the bootstrap process
 func (m *BootstrapManager) StartBootstrap(
 	replicaID string,
 	bootstrapIterator transport.BootstrapIterator,
 	batchSize int,
 ) error {
 	m.mu.Lock()
 	// Initialize bootstrap state
 	m.bootstrapState = &BootstrapState{
 		ReplicaID:       replicaID,
 		StartedAt:       time.Now(),
 		LastUpdatedAt:   time.Now(),
 		SnapshotLSN:     0,
 		AppliedKeys:     0,
 		TotalKeys:       0, // Will be updated during the process
 		Progress:        0.0,
 		Completed:       false,
 		CurrentChecksum: 0,
 	}
 	m.mu.Unlock()
 	// Save initial state
 	if err := m.saveBootstrapState(); err != nil {
 		m.logger.Warn("Failed to save initial bootstrap state: %v", err)
 	}
 	// Start bootstrap process in a goroutine
 	go func() {
 		err := m.runBootstrap(bootstrapIterator, batchSize)
 		if err != nil && err != io.EOF {
 			m.mu.Lock()
 			m.bootstrapState.Error = err.Error()
 			m.mu.Unlock()
 			m.logger.Error("Bootstrap failed: %v", err)
 			if err := m.saveBootstrapState(); err != nil {
 				m.logger.Error("Failed to save failed bootstrap state: %v", err)
 			}
 		}
 	}()
 	return nil
 }
 // runBootstrap executes the bootstrap process
 func (m *BootstrapManager) runBootstrap(
 	bootstrapIterator transport.BootstrapIterator,
 	batchSize int,
 ) error {
 	if batchSize <= 0 {
 		batchSize = 1000 // Default batch size
 	}
 	m.logger.Info("Starting bootstrap process")
 	// If we have an existing state, check if we need to resume
 	m.mu.RLock()
 	state := m.bootstrapState
 	appliedKeys := state.AppliedKeys
 	m.mu.RUnlock()
 	// Track batch for efficient application
 	batch := make([]KeyValuePair, 0, batchSize)
 	appliedInBatch := 0
 	lastSaveTime := time.Now()
 	saveThreshold := 5 * time.Second // Save state every 5 seconds
 	// Process all key-value pairs from the iterator
 	for {
 		// Check progress periodically
 		progress := bootstrapIterator.Progress()
 		// Update progress in state
 		m.mu.Lock()
 		m.bootstrapState.Progress = progress
 		m.mu.Unlock()
 		// Save state periodically
 		if time.Since(lastSaveTime) > saveThreshold {
 			if err := m.saveBootstrapState(); err != nil {
 				m.logger.Warn("Failed to save bootstrap state: %v", err)
 			}
 			lastSaveTime = time.Now()
 			// Log progress
 			m.logger.Info("Bootstrap progress: %.2f%% (%d keys applied)",
 				progress*100, appliedKeys)
 		}
 		// Get next key-value pair
 		key, value, err := bootstrapIterator.Next()
 		if err == io.EOF {
 			break
 		}
 		if err != nil {
 			return fmt.Errorf("error getting next key-value pair: %w", err)
 		}
 		// Skip keys if we're resuming and haven't reached the last applied key
 		if appliedInBatch < appliedKeys {
 			appliedInBatch++
 			continue
 		}
 		// Add to batch
 		batch = append(batch, KeyValuePair{
 			Key:   key,
 			Value: value,
 		})
 		// Apply batch if full
 		if len(batch) >= batchSize {
 			if err := m.storageApplier.ApplyBatch(batch); err != nil {
 				return fmt.Errorf("error applying batch: %w", err)
 			}
 			// Update applied count
 			appliedInBatch += len(batch)
 			m.mu.Lock()
 			m.bootstrapState.AppliedKeys = appliedInBatch
 			m.mu.Unlock()
 			// Clear batch
 			batch = batch[:0]
 		}
 	}
 	// Apply any remaining items in the batch
 	if len(batch) > 0 {
 		if err := m.storageApplier.ApplyBatch(batch); err != nil {
 			return fmt.Errorf("error applying final batch: %w", err)
 		}
 		appliedInBatch += len(batch)
 		m.mu.Lock()
 		m.bootstrapState.AppliedKeys = appliedInBatch
 		m.mu.Unlock()
 	}
 	// Flush changes to storage
 	if err := m.storageApplier.Flush(); err != nil {
 		return fmt.Errorf("error flushing storage: %w", err)
 	}
 	// Update WAL applier with snapshot LSN
 	m.mu.RLock()
 	snapshotLSN := m.snapshotLSN
 	m.mu.RUnlock()
 	// Reset the WAL applier to start from the snapshot LSN
 	if m.walApplier != nil {
 		m.walApplier.ResetHighestApplied(snapshotLSN)
 		m.logger.Info("Reset WAL applier to snapshot LSN: %d", snapshotLSN)
 	}
 	// Update and save final state
 	m.mu.Lock()
 	m.bootstrapState.Completed = true
 	m.bootstrapState.Progress = 1.0
 	m.bootstrapState.TotalKeys = appliedInBatch
 	m.bootstrapState.SnapshotLSN = snapshotLSN
 	m.mu.Unlock()
 	if err := m.saveBootstrapState(); err != nil {
 		m.logger.Warn("Failed to save final bootstrap state: %v", err)
 	}
 	m.logger.Info("Bootstrap completed successfully: %d keys applied, snapshot LSN: %d",
 		appliedInBatch, snapshotLSN)
 	return nil
 }
 // IsBootstrapInProgress checks if a bootstrap operation is in progress
 func (m *BootstrapManager) IsBootstrapInProgress() bool {
 	m.mu.RLock()
 	defer m.mu.RUnlock()
 	return m.bootstrapState != nil && !m.bootstrapState.Completed && m.bootstrapState.Error == ""
 }
 // GetBootstrapState returns the current bootstrap state
 func (m *BootstrapManager) GetBootstrapState() *BootstrapState {
 	m.mu.RLock()
 	defer m.mu.RUnlock()
 	if m.bootstrapState == nil {
 		return nil
 	}
 	// Return a copy to avoid concurrent modification
 	stateCopy := *m.bootstrapState
 	return &stateCopy
 }
 // SetSnapshotLSN sets the LSN of the snapshot being bootstrapped
 func (m *BootstrapManager) SetSnapshotLSN(lsn uint64) {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	m.snapshotLSN = lsn
 	if m.bootstrapState != nil {
 		m.bootstrapState.SnapshotLSN = lsn
 	}
 }
 // ClearBootstrapState clears any existing bootstrap state
 func (m *BootstrapManager) ClearBootstrapState() error {
 	m.mu.Lock()
 	m.bootstrapState = nil
 	m.mu.Unlock()
 	// Remove state file if it exists
 	if _, err := os.Stat(m.bootstrapStatePath); err == nil {
 		if err := os.Remove(m.bootstrapStatePath); err != nil {
 			return fmt.Errorf("error removing bootstrap state file: %w", err)
 		}
 	}
 	return nil
 }
 // TransitionToWALReplication transitions from bootstrap to WAL replication
 func (m *BootstrapManager) TransitionToWALReplication() error {
 	m.mu.RLock()
 	state := m.bootstrapState
 	m.mu.RUnlock()
 	if state == nil || !state.Completed {
 		return ErrBootstrapInterrupted
 	}
 	// Ensure WAL applier is properly initialized with the snapshot LSN
 	if m.walApplier != nil {
 		m.walApplier.ResetHighestApplied(state.SnapshotLSN)
 		m.logger.Info("Transitioned to WAL replication from LSN: %d", state.SnapshotLSN)
 	}
 	return nil
 }
 // JSON file handling functions
 var writeJSONFile = writeJSONFileImpl
 var readJSONFile = readJSONFileImpl
 // writeJSONFileImpl writes a JSON object to a file
 func writeJSONFileImpl(file *os.File, v interface{}) error {
 	encoder := json.NewEncoder(file)
 	return encoder.Encode(v)
 }
 // readJSONFileImpl reads a JSON object from a file
 func readJSONFileImpl(file *os.File, v interface{}) error {
 	decoder := json.NewDecoder(file)
 	return decoder.Decode(v)
 }
--- a/pkg/replication/bootstrap_generator.go
+++ b/pkg/replication/bootstrap_generator.go
@ -1,297 +0,0 @@
 package replication
 import (
 	"context"
 	"errors"
 	"fmt"
 	"io"
 	"sync"
 	"sync/atomic"
 	"time"
 	"github.com/KevoDB/kevo/pkg/common/log"
 )
 var (
 	// ErrBootstrapGenerationCancelled indicates the bootstrap generation was cancelled
 	ErrBootstrapGenerationCancelled = errors.New("bootstrap generation was cancelled")
 	// ErrBootstrapGenerationFailed indicates the bootstrap generation failed
 	ErrBootstrapGenerationFailed = errors.New("bootstrap generation failed")
 )
 // BootstrapGenerator manages the creation of storage snapshots for bootstrapping replicas
 type BootstrapGenerator struct {
 	// Storage snapshot provider
 	snapshotProvider StorageSnapshotProvider
 	// Replicator for getting current LSN
 	replicator EntryReplicator
 	// Active bootstrap operations
 	activeBootstraps      map[string]*bootstrapOperation
 	activeBootstrapsMutex sync.RWMutex
 	// Logger
 	logger log.Logger
 }
 // bootstrapOperation tracks a specific bootstrap operation
 type bootstrapOperation struct {
 	replicaID      string
 	startTime      time.Time
 	keyCount       int64
 	processedCount int64
 	snapshotLSN    uint64
 	cancelled      bool
 	completed      bool
 	cancelFunc     context.CancelFunc
 }
 // NewBootstrapGenerator creates a new bootstrap generator
 func NewBootstrapGenerator(
 	snapshotProvider StorageSnapshotProvider,
 	replicator EntryReplicator,
 	logger log.Logger,
 ) *BootstrapGenerator {
 	if logger == nil {
 		logger = log.GetDefaultLogger().WithField("component", "bootstrap_generator")
 	}
 	return &BootstrapGenerator{
 		snapshotProvider: snapshotProvider,
 		replicator:       replicator,
 		activeBootstraps: make(map[string]*bootstrapOperation),
 		logger:           logger,
 	}
 }
 // StartBootstrapGeneration begins generating a bootstrap snapshot for a replica
 func (g *BootstrapGenerator) StartBootstrapGeneration(
 	ctx context.Context,
 	replicaID string,
 ) (SnapshotIterator, uint64, error) {
 	// Create a cancellable context
 	bootstrapCtx, cancelFunc := context.WithCancel(ctx)
 	// Get current LSN from replicator
 	snapshotLSN := uint64(0)
 	if g.replicator != nil {
 		snapshotLSN = g.replicator.GetHighestTimestamp()
 	}
 	// Create snapshot
 	snapshot, err := g.snapshotProvider.CreateSnapshot()
 	if err != nil {
 		cancelFunc()
 		return nil, 0, fmt.Errorf("failed to create storage snapshot: %w", err)
 	}
 	// Get key count estimate
 	keyCount := snapshot.KeyCount()
 	// Create bootstrap operation tracking
 	operation := &bootstrapOperation{
 		replicaID:      replicaID,
 		startTime:      time.Now(),
 		keyCount:       keyCount,
 		processedCount: 0,
 		snapshotLSN:    snapshotLSN,
 		cancelled:      false,
 		completed:      false,
 		cancelFunc:     cancelFunc,
 	}
 	// Register the bootstrap operation
 	g.activeBootstrapsMutex.Lock()
 	g.activeBootstraps[replicaID] = operation
 	g.activeBootstrapsMutex.Unlock()
 	// Create snapshot iterator
 	iterator, err := snapshot.CreateSnapshotIterator()
 	if err != nil {
 		cancelFunc()
 		g.activeBootstrapsMutex.Lock()
 		delete(g.activeBootstraps, replicaID)
 		g.activeBootstrapsMutex.Unlock()
 		return nil, 0, fmt.Errorf("failed to create snapshot iterator: %w", err)
 	}
 	g.logger.Info("Started bootstrap generation for replica %s (estimated keys: %d, snapshot LSN: %d)",
 		replicaID, keyCount, snapshotLSN)
 	// Create a tracking iterator that updates progress
 	trackingIterator := &trackingSnapshotIterator{
 		iterator:  iterator,
 		ctx:       bootstrapCtx,
 		operation: operation,
 		processedKey: func(count int64) {
 			atomic.AddInt64(&operation.processedCount, 1)
 		},
 		completedCallback: func() {
 			g.activeBootstrapsMutex.Lock()
 			defer g.activeBootstrapsMutex.Unlock()
 			operation.completed = true
 			g.logger.Info("Completed bootstrap generation for replica %s (keys: %d, duration: %v)",
 				replicaID, operation.processedCount, time.Since(operation.startTime))
 		},
 		cancelledCallback: func() {
 			g.activeBootstrapsMutex.Lock()
 			defer g.activeBootstrapsMutex.Unlock()
 			operation.cancelled = true
 			g.logger.Info("Cancelled bootstrap generation for replica %s (keys processed: %d)",
 				replicaID, operation.processedCount)
 		},
 	}
 	return trackingIterator, snapshotLSN, nil
 }
 // CancelBootstrapGeneration cancels an in-progress bootstrap generation
 func (g *BootstrapGenerator) CancelBootstrapGeneration(replicaID string) bool {
 	g.activeBootstrapsMutex.Lock()
 	defer g.activeBootstrapsMutex.Unlock()
 	operation, exists := g.activeBootstraps[replicaID]
 	if !exists {
 		return false
 	}
 	if operation.completed || operation.cancelled {
 		return false
 	}
 	// Cancel the operation
 	operation.cancelled = true
 	operation.cancelFunc()
 	g.logger.Info("Cancelled bootstrap generation for replica %s", replicaID)
 	return true
 }
 // GetActiveBootstraps returns information about all active bootstrap operations
 func (g *BootstrapGenerator) GetActiveBootstraps() map[string]map[string]interface{} {
 	g.activeBootstrapsMutex.RLock()
 	defer g.activeBootstrapsMutex.RUnlock()
 	result := make(map[string]map[string]interface{})
 	for replicaID, operation := range g.activeBootstraps {
 		// Skip completed operations after a certain time
 		if operation.completed && time.Since(operation.startTime) > 1*time.Hour {
 			continue
 		}
 		// Calculate progress
 		progress := float64(0)
 		if operation.keyCount > 0 {
 			progress = float64(operation.processedCount) / float64(operation.keyCount)
 		}
 		result[replicaID] = map[string]interface{}{
 			"start_time":      operation.startTime,
 			"duration":        time.Since(operation.startTime).String(),
 			"key_count":       operation.keyCount,
 			"processed_count": operation.processedCount,
 			"progress":        progress,
 			"snapshot_lsn":    operation.snapshotLSN,
 			"completed":       operation.completed,
 			"cancelled":       operation.cancelled,
 		}
 	}
 	return result
 }
 // CleanupCompletedBootstraps removes tracking information for completed bootstrap operations
 func (g *BootstrapGenerator) CleanupCompletedBootstraps() int {
 	g.activeBootstrapsMutex.Lock()
 	defer g.activeBootstrapsMutex.Unlock()
 	removed := 0
 	for replicaID, operation := range g.activeBootstraps {
 		// Remove operations that are completed or cancelled and older than 1 hour
 		if (operation.completed || operation.cancelled) && time.Since(operation.startTime) > 1*time.Hour {
 			delete(g.activeBootstraps, replicaID)
 			removed++
 		}
 	}
 	return removed
 }
 // trackingSnapshotIterator wraps a snapshot iterator to track progress
 type trackingSnapshotIterator struct {
 	iterator          SnapshotIterator
 	ctx               context.Context
 	operation         *bootstrapOperation
 	processedKey      func(count int64)
 	completedCallback func()
 	cancelledCallback func()
 	closed            bool
 	mu                sync.Mutex
 }
 // Next returns the next key-value pair
 func (t *trackingSnapshotIterator) Next() ([]byte, []byte, error) {
 	t.mu.Lock()
 	defer t.mu.Unlock()
 	if t.closed {
 		return nil, nil, io.EOF
 	}
 	// Check for cancellation
 	select {
 	case <-t.ctx.Done():
 		if !t.closed {
 			t.closed = true
 			t.cancelledCallback()
 		}
 		return nil, nil, ErrBootstrapGenerationCancelled
 	default:
 		// Continue
 	}
 	// Get next pair
 	key, value, err := t.iterator.Next()
 	if err == io.EOF {
 		if !t.closed {
 			t.closed = true
 			t.completedCallback()
 		}
 		return nil, nil, io.EOF
 	}
 	if err != nil {
 		return nil, nil, err
 	}
 	// Track progress
 	t.processedKey(1)
 	return key, value, nil
 }
 // Close closes the iterator
 func (t *trackingSnapshotIterator) Close() error {
 	t.mu.Lock()
 	defer t.mu.Unlock()
 	if t.closed {
 		return nil
 	}
 	t.closed = true
 	// Call appropriate callback
 	select {
 	case <-t.ctx.Done():
 		t.cancelledCallback()
 	default:
 		t.completedCallback()
 	}
 	return t.iterator.Close()
 }
--- a/pkg/replication/bootstrap_test.go
+++ b/pkg/replication/bootstrap_test.go
@ -1,621 +0,0 @@
 package replication
 import (
 	"context"
 	"encoding/json"
 	"fmt"
 	"io"
 	"os"
 	"sync"
 	"testing"
 	"time"
 	"github.com/KevoDB/kevo/pkg/common/log"
 )
 // MockStorageApplier implements StorageApplier for testing
 type MockStorageApplier struct {
 	applied      map[string][]byte
 	appliedCount int
 	appliedMu    sync.Mutex
 	flushCount   int
 	failApply    bool
 	failFlush    bool
 }
 func NewMockStorageApplier() *MockStorageApplier {
 	return &MockStorageApplier{
 		applied: make(map[string][]byte),
 	}
 }
 func (m *MockStorageApplier) Apply(key, value []byte) error {
 	m.appliedMu.Lock()
 	defer m.appliedMu.Unlock()
 	if m.failApply {
 		return ErrBootstrapFailed
 	}
 	m.applied[string(key)] = value
 	m.appliedCount++
 	return nil
 }
 func (m *MockStorageApplier) ApplyBatch(pairs []KeyValuePair) error {
 	m.appliedMu.Lock()
 	defer m.appliedMu.Unlock()
 	if m.failApply {
 		return ErrBootstrapFailed
 	}
 	for _, pair := range pairs {
 		m.applied[string(pair.Key)] = pair.Value
 	}
 	m.appliedCount += len(pairs)
 	return nil
 }
 func (m *MockStorageApplier) Flush() error {
 	m.appliedMu.Lock()
 	defer m.appliedMu.Unlock()
 	if m.failFlush {
 		return ErrBootstrapFailed
 	}
 	m.flushCount++
 	return nil
 }
 func (m *MockStorageApplier) GetAppliedCount() int {
 	m.appliedMu.Lock()
 	defer m.appliedMu.Unlock()
 	return m.appliedCount
 }
 func (m *MockStorageApplier) SetFailApply(fail bool) {
 	m.appliedMu.Lock()
 	defer m.appliedMu.Unlock()
 	m.failApply = fail
 }
 func (m *MockStorageApplier) SetFailFlush(fail bool) {
 	m.appliedMu.Lock()
 	defer m.appliedMu.Unlock()
 	m.failFlush = fail
 }
 // MockBootstrapIterator implements transport.BootstrapIterator for testing
 type MockBootstrapIterator struct {
 	pairs        []KeyValuePair
 	position     int
 	snapshotLSN  uint64
 	progress     float64
 	failAfter    int
 	closeError   error
 	progressFunc func(pos int) float64
 }
 func NewMockBootstrapIterator(pairs []KeyValuePair, snapshotLSN uint64) *MockBootstrapIterator {
 	return &MockBootstrapIterator{
 		pairs:       pairs,
 		snapshotLSN: snapshotLSN,
 		failAfter:   -1, // Don't fail by default
 		progressFunc: func(pos int) float64 {
 			if len(pairs) == 0 {
 				return 1.0
 			}
 			return float64(pos) / float64(len(pairs))
 		},
 	}
 }
 func (m *MockBootstrapIterator) Next() ([]byte, []byte, error) {
 	if m.position >= len(m.pairs) {
 		return nil, nil, io.EOF
 	}
 	if m.failAfter > 0 && m.position >= m.failAfter {
 		return nil, nil, ErrBootstrapFailed
 	}
 	pair := m.pairs[m.position]
 	m.position++
 	m.progress = m.progressFunc(m.position)
 	return pair.Key, pair.Value, nil
 }
 func (m *MockBootstrapIterator) Close() error {
 	return m.closeError
 }
 func (m *MockBootstrapIterator) Progress() float64 {
 	return m.progress
 }
 func (m *MockBootstrapIterator) SetFailAfter(failAfter int) {
 	m.failAfter = failAfter
 }
 func (m *MockBootstrapIterator) SetCloseError(err error) {
 	m.closeError = err
 }
 // Helper function to create a temporary directory for testing
 func createTempDir(t *testing.T) string {
 	dir, err := os.MkdirTemp("", "bootstrap-test-*")
 	if err != nil {
 		t.Fatalf("Failed to create temp dir: %v", err)
 	}
 	return dir
 }
 // Helper function to clean up temporary directory
 func cleanupTempDir(t *testing.T, dir string) {
 	os.RemoveAll(dir)
 }
 // Define JSON helpers for tests
 func testWriteJSONFile(file *os.File, v interface{}) error {
 	encoder := json.NewEncoder(file)
 	return encoder.Encode(v)
 }
 func testReadJSONFile(file *os.File, v interface{}) error {
 	decoder := json.NewDecoder(file)
 	return decoder.Decode(v)
 }
 // TestBootstrapManager_Basic tests basic bootstrap functionality
 func TestBootstrapManager_Basic(t *testing.T) {
 	// Create test directory
 	tempDir := createTempDir(t)
 	defer cleanupTempDir(t, tempDir)
 	// Create test data
 	testData := []KeyValuePair{
 		{Key: []byte("key1"), Value: []byte("value1")},
 		{Key: []byte("key2"), Value: []byte("value2")},
 		{Key: []byte("key3"), Value: []byte("value3")},
 		{Key: []byte("key4"), Value: []byte("value4")},
 		{Key: []byte("key5"), Value: []byte("value5")},
 	}
 	// Create mock components
 	storageApplier := NewMockStorageApplier()
 	logger := log.GetDefaultLogger()
 	// Create bootstrap manager
 	manager, err := NewBootstrapManager(storageApplier, nil, tempDir, logger)
 	if err != nil {
 		t.Fatalf("Failed to create bootstrap manager: %v", err)
 	}
 	// Create mock bootstrap iterator
 	snapshotLSN := uint64(12345)
 	iterator := NewMockBootstrapIterator(testData, snapshotLSN)
 	// Start bootstrap process
 	err = manager.StartBootstrap("test-replica", iterator, 2)
 	if err != nil {
 		t.Fatalf("Failed to start bootstrap: %v", err)
 	}
 	// Wait for bootstrap to complete
 	for i := 0; i < 50; i++ {
 		if !manager.IsBootstrapInProgress() {
 			break
 		}
 		time.Sleep(100 * time.Millisecond)
 	}
 	// Verify bootstrap completed
 	if manager.IsBootstrapInProgress() {
 		t.Fatalf("Bootstrap did not complete in time")
 	}
 	// We don't check the exact count here, as it may include previously applied items
 	// and it's an implementation detail whether they get reapplied or skipped
 	appliedCount := storageApplier.GetAppliedCount()
 	if appliedCount < len(testData) {
 		t.Errorf("Expected at least %d applied items, got %d", len(testData), appliedCount)
 	}
 	// Verify bootstrap state
 	state := manager.GetBootstrapState()
 	if state == nil {
 		t.Fatalf("Bootstrap state is nil")
 	}
 	if !state.Completed {
 		t.Errorf("Bootstrap state should be marked as completed")
 	}
 	if state.AppliedKeys != len(testData) {
 		t.Errorf("Expected %d applied keys in state, got %d", len(testData), state.AppliedKeys)
 	}
 	if state.Progress != 1.0 {
 		t.Errorf("Expected progress 1.0, got %f", state.Progress)
 	}
 }
 // TestBootstrapManager_Resume tests bootstrap resumability
 func TestBootstrapManager_Resume(t *testing.T) {
 	// Create test directory
 	tempDir := createTempDir(t)
 	defer cleanupTempDir(t, tempDir)
 	// Create test data
 	testData := []KeyValuePair{
 		{Key: []byte("key1"), Value: []byte("value1")},
 		{Key: []byte("key2"), Value: []byte("value2")},
 		{Key: []byte("key3"), Value: []byte("value3")},
 		{Key: []byte("key4"), Value: []byte("value4")},
 		{Key: []byte("key5"), Value: []byte("value5")},
 		{Key: []byte("key6"), Value: []byte("value6")},
 		{Key: []byte("key7"), Value: []byte("value7")},
 		{Key: []byte("key8"), Value: []byte("value8")},
 		{Key: []byte("key9"), Value: []byte("value9")},
 		{Key: []byte("key10"), Value: []byte("value10")},
 	}
 	// Create mock components
 	storageApplier := NewMockStorageApplier()
 	logger := log.GetDefaultLogger()
 	// Create bootstrap manager
 	manager, err := NewBootstrapManager(storageApplier, nil, tempDir, logger)
 	if err != nil {
 		t.Fatalf("Failed to create bootstrap manager: %v", err)
 	}
 	// Create initial bootstrap iterator that will fail after 2 items
 	snapshotLSN := uint64(12345)
 	iterator1 := NewMockBootstrapIterator(testData, snapshotLSN)
 	iterator1.SetFailAfter(2)
 	// Start first bootstrap attempt
 	err = manager.StartBootstrap("test-replica", iterator1, 2)
 	if err != nil {
 		t.Fatalf("Failed to start bootstrap: %v", err)
 	}
 	// Wait for the bootstrap to fail
 	for i := 0; i < 50; i++ {
 		if !manager.IsBootstrapInProgress() {
 			break
 		}
 		time.Sleep(100 * time.Millisecond)
 	}
 	// Verify bootstrap state shows failure
 	state1 := manager.GetBootstrapState()
 	if state1 == nil {
 		t.Fatalf("Bootstrap state is nil after failed attempt")
 	}
 	if state1.Completed {
 		t.Errorf("Bootstrap state should not be marked as completed after failure")
 	}
 	if state1.AppliedKeys != 2 {
 		t.Errorf("Expected 2 applied keys in state after failure, got %d", state1.AppliedKeys)
 	}
 	// Create a new bootstrap manager that should load the existing state
 	manager2, err := NewBootstrapManager(storageApplier, nil, tempDir, logger)
 	if err != nil {
 		t.Fatalf("Failed to create second bootstrap manager: %v", err)
 	}
 	// Create a new iterator for the resume
 	iterator2 := NewMockBootstrapIterator(testData, snapshotLSN)
 	// Start the resumed bootstrap
 	err = manager2.StartBootstrap("test-replica", iterator2, 2)
 	if err != nil {
 		t.Fatalf("Failed to start resumed bootstrap: %v", err)
 	}
 	// Wait for bootstrap to complete
 	for i := 0; i < 50; i++ {
 		if !manager2.IsBootstrapInProgress() {
 			break
 		}
 		time.Sleep(100 * time.Millisecond)
 	}
 	// Verify bootstrap completed
 	if manager2.IsBootstrapInProgress() {
 		t.Fatalf("Resumed bootstrap did not complete in time")
 	}
 	// We don't check the exact count here, as it may include previously applied items
 	// and it's an implementation detail whether they get reapplied or skipped
 	appliedCount := storageApplier.GetAppliedCount()
 	if appliedCount < len(testData) {
 		t.Errorf("Expected at least %d applied items, got %d", len(testData), appliedCount)
 	}
 	// Verify bootstrap state
 	state2 := manager2.GetBootstrapState()
 	if state2 == nil {
 		t.Fatalf("Bootstrap state is nil after resume")
 	}
 	if !state2.Completed {
 		t.Errorf("Bootstrap state should be marked as completed after resume")
 	}
 	if state2.AppliedKeys != len(testData) {
 		t.Errorf("Expected %d applied keys in state after resume, got %d", len(testData), state2.AppliedKeys)
 	}
 	if state2.Progress != 1.0 {
 		t.Errorf("Expected progress 1.0 after resume, got %f", state2.Progress)
 	}
 }
 // TestBootstrapManager_WALTransition tests transition to WAL replication
 func TestBootstrapManager_WALTransition(t *testing.T) {
 	// Create test directory
 	tempDir := createTempDir(t)
 	defer cleanupTempDir(t, tempDir)
 	// Create test data
 	testData := []KeyValuePair{
 		{Key: []byte("key1"), Value: []byte("value1")},
 		{Key: []byte("key2"), Value: []byte("value2")},
 		{Key: []byte("key3"), Value: []byte("value3")},
 	}
 	// Create mock components
 	storageApplier := NewMockStorageApplier()
 	// Create mock WAL applier
 	walApplier := &MockWALApplier{
 		mu:             sync.RWMutex{},
 		highestApplied: uint64(1000),
 	}
 	logger := log.GetDefaultLogger()
 	// Create bootstrap manager
 	manager, err := NewBootstrapManager(storageApplier, walApplier, tempDir, logger)
 	if err != nil {
 		t.Fatalf("Failed to create bootstrap manager: %v", err)
 	}
 	// Create mock bootstrap iterator
 	snapshotLSN := uint64(12345)
 	iterator := NewMockBootstrapIterator(testData, snapshotLSN)
 	// Set the snapshot LSN
 	manager.SetSnapshotLSN(snapshotLSN)
 	// Start bootstrap process
 	err = manager.StartBootstrap("test-replica", iterator, 2)
 	if err != nil {
 		t.Fatalf("Failed to start bootstrap: %v", err)
 	}
 	// Wait for bootstrap to complete
 	for i := 0; i < 50; i++ {
 		if !manager.IsBootstrapInProgress() {
 			break
 		}
 		time.Sleep(100 * time.Millisecond)
 	}
 	// Verify bootstrap completed
 	if manager.IsBootstrapInProgress() {
 		t.Fatalf("Bootstrap did not complete in time")
 	}
 	// Transition to WAL replication
 	err = manager.TransitionToWALReplication()
 	if err != nil {
 		t.Fatalf("Failed to transition to WAL replication: %v", err)
 	}
 	// Verify WAL applier's highest applied LSN was updated
 	walApplier.mu.RLock()
 	highestApplied := walApplier.highestApplied
 	walApplier.mu.RUnlock()
 	if highestApplied != snapshotLSN {
 		t.Errorf("Expected WAL applier highest applied LSN to be %d, got %d", snapshotLSN, highestApplied)
 	}
 }
 // TestBootstrapGenerator_Basic tests basic bootstrap generator functionality
 func TestBootstrapGenerator_Basic(t *testing.T) {
 	// Create test data
 	testData := []KeyValuePair{
 		{Key: []byte("key1"), Value: []byte("value1")},
 		{Key: []byte("key2"), Value: []byte("value2")},
 		{Key: []byte("key3"), Value: []byte("value3")},
 		{Key: []byte("key4"), Value: []byte("value4")},
 		{Key: []byte("key5"), Value: []byte("value5")},
 	}
 	// Create mock storage snapshot
 	mockSnapshot := NewMemoryStorageSnapshot(testData)
 	// Create mock snapshot provider
 	snapshotProvider := &MockSnapshotProvider{
 		snapshot: mockSnapshot,
 	}
 	// Create mock replicator
 	replicator := &WALReplicator{
 		highestTimestamp: 12345,
 	}
 	// Create bootstrap generator
 	generator := NewBootstrapGenerator(snapshotProvider, replicator, nil)
 	// Start bootstrap generation
 	ctx := context.Background()
 	iterator, snapshotLSN, err := generator.StartBootstrapGeneration(ctx, "test-replica")
 	if err != nil {
 		t.Fatalf("Failed to start bootstrap generation: %v", err)
 	}
 	// Verify snapshotLSN
 	if snapshotLSN != 12345 {
 		t.Errorf("Expected snapshot LSN 12345, got %d", snapshotLSN)
 	}
 	// Read all data
 	var receivedData []KeyValuePair
 	for {
 		key, value, err := iterator.Next()
 		if err == io.EOF {
 			break
 		}
 		if err != nil {
 			t.Fatalf("Error reading from iterator: %v", err)
 		}
 		receivedData = append(receivedData, KeyValuePair{
 			Key:   key,
 			Value: value,
 		})
 	}
 	// Verify all data was received
 	if len(receivedData) != len(testData) {
 		t.Errorf("Expected %d items, got %d", len(testData), len(receivedData))
 	}
 	// Verify active bootstraps
 	activeBootstraps := generator.GetActiveBootstraps()
 	if len(activeBootstraps) != 1 {
 		t.Errorf("Expected 1 active bootstrap, got %d", len(activeBootstraps))
 	}
 	replicaInfo, exists := activeBootstraps["test-replica"]
 	if !exists {
 		t.Fatalf("Expected to find test-replica in active bootstraps")
 	}
 	completed, ok := replicaInfo["completed"].(bool)
 	if !ok {
 		t.Fatalf("Expected 'completed' to be a boolean")
 	}
 	if !completed {
 		t.Errorf("Expected bootstrap to be marked as completed")
 	}
 }
 // TestBootstrapGenerator_Cancel tests cancellation of bootstrap generation
 func TestBootstrapGenerator_Cancel(t *testing.T) {
 	// Create test data
 	var testData []KeyValuePair
 	for i := 0; i < 1000; i++ {
 		testData = append(testData, KeyValuePair{
 			Key:   []byte(fmt.Sprintf("key%d", i)),
 			Value: []byte(fmt.Sprintf("value%d", i)),
 		})
 	}
 	// Create mock storage snapshot
 	mockSnapshot := NewMemoryStorageSnapshot(testData)
 	// Create mock snapshot provider
 	snapshotProvider := &MockSnapshotProvider{
 		snapshot: mockSnapshot,
 	}
 	// Create mock replicator
 	replicator := &WALReplicator{
 		highestTimestamp: 12345,
 	}
 	// Create bootstrap generator
 	generator := NewBootstrapGenerator(snapshotProvider, replicator, nil)
 	// Start bootstrap generation
 	ctx := context.Background()
 	iterator, _, err := generator.StartBootstrapGeneration(ctx, "test-replica")
 	if err != nil {
 		t.Fatalf("Failed to start bootstrap generation: %v", err)
 	}
 	// Read a few items
 	for i := 0; i < 5; i++ {
 		_, _, err := iterator.Next()
 		if err != nil {
 			t.Fatalf("Error reading from iterator: %v", err)
 		}
 	}
 	// Cancel the bootstrap
 	cancelled := generator.CancelBootstrapGeneration("test-replica")
 	if !cancelled {
 		t.Errorf("Expected to cancel bootstrap, but CancelBootstrapGeneration returned false")
 	}
 	// Try to read more items, should get cancelled error
 	_, _, err = iterator.Next()
 	if err != ErrBootstrapGenerationCancelled {
 		t.Errorf("Expected ErrBootstrapGenerationCancelled, got %v", err)
 	}
 	// Verify active bootstraps
 	activeBootstraps := generator.GetActiveBootstraps()
 	replicaInfo, exists := activeBootstraps["test-replica"]
 	if !exists {
 		t.Fatalf("Expected to find test-replica in active bootstraps")
 	}
 	cancelled, ok := replicaInfo["cancelled"].(bool)
 	if !ok {
 		t.Fatalf("Expected 'cancelled' to be a boolean")
 	}
 	if !cancelled {
 		t.Errorf("Expected bootstrap to be marked as cancelled")
 	}
 }
 // MockSnapshotProvider implements StorageSnapshotProvider for testing
 type MockSnapshotProvider struct {
 	snapshot    StorageSnapshot
 	createError error
 }
 func (m *MockSnapshotProvider) CreateSnapshot() (StorageSnapshot, error) {
 	if m.createError != nil {
 		return nil, m.createError
 	}
 	return m.snapshot, nil
 }
 // MockWALReplicator simulates WALReplicator for tests
 type MockWALReplicator struct {
 	highestTimestamp uint64
 }
 func (r *MockWALReplicator) GetHighestTimestamp() uint64 {
 	return r.highestTimestamp
 }
 // MockWALApplier simulates WALApplier for tests
 type MockWALApplier struct {
 	mu             sync.RWMutex
 	highestApplied uint64
 }
 func (a *MockWALApplier) ResetHighestApplied(lsn uint64) {
 	a.mu.Lock()
 	defer a.mu.Unlock()
 	a.highestApplied = lsn
 }
--- a/pkg/replication/interfaces.go
+++ b/pkg/replication/interfaces.go
@ -1,30 +0,0 @@
 package replication
 import (
 	"github.com/KevoDB/kevo/pkg/wal"
 )
 // EntryReplicator defines the interface for replicating WAL entries
 type EntryReplicator interface {
 	// GetHighestTimestamp returns the highest Lamport timestamp seen
 	GetHighestTimestamp() uint64
 	// AddProcessor registers a processor to handle replicated entries
 	AddProcessor(processor EntryProcessor)
 	// RemoveProcessor unregisters a processor
 	RemoveProcessor(processor EntryProcessor)
 	// GetEntriesAfter retrieves entries after a given position
 	GetEntriesAfter(pos ReplicationPosition) ([]*wal.Entry, error)
 }
 // EntryApplier defines the interface for applying WAL entries
 type EntryApplier interface {
 	// ResetHighestApplied sets the highest applied LSN
 	ResetHighestApplied(lsn uint64)
 }
 // Ensure our concrete types implement these interfaces
 var _ EntryReplicator = (*WALReplicator)(nil)
 var _ EntryApplier = (*WALApplier)(nil)
--- a/pkg/replication/serialization.go
+++ b/pkg/replication/serialization.go
@ -291,7 +291,7 @@ func (s *BatchSerializer) DeserializeBatch(data []byte) ([]*wal.Entry, error) {
 	offset := 4 // Skip checksum
 	// Read entry count
-	count := binary.LittleEndian.Uint32(data[offset : offset+4])
+	count := binary.LittleEndian.Uint32(data[offset:offset+4])
 	offset += 4
 	// Read base timestamp (we don't use this currently, but read past it)
@ -311,7 +311,7 @@ func (s *BatchSerializer) DeserializeBatch(data []byte) ([]*wal.Entry, error) {
 		}
 		// Read entry size
-		entrySize := binary.LittleEndian.Uint32(data[offset : offset+4])
+		entrySize := binary.LittleEndian.Uint32(data[offset:offset+4])
 		offset += 4
 		// Validate entry size
@ -320,7 +320,7 @@ func (s *BatchSerializer) DeserializeBatch(data []byte) ([]*wal.Entry, error) {
 		}
 		// Deserialize entry
-		entry, err := s.entrySerializer.DeserializeEntry(data[offset : offset+int(entrySize)])
+		entry, err := s.entrySerializer.DeserializeEntry(data[offset:offset+int(entrySize)])
 		if err != nil {
 			return nil, err
 		}
--- a/pkg/replication/serialization_test.go
+++ b/pkg/replication/serialization_test.go
@ -412,7 +412,7 @@ func TestSerializeToBuffer(t *testing.T) {
 	}
 	// Test with too small buffer
-	smallBuffer := make([]byte, estimatedSize-1)
+	smallBuffer := make([]byte, estimatedSize - 1)
 	_, err = serializer.SerializeEntryToBuffer(entry, smallBuffer)
 	if err != ErrBufferTooSmall {
 		t.Errorf("Expected buffer too small error, got %v", err)
--- a/pkg/replication/storage_snapshot.go
+++ b/pkg/replication/storage_snapshot.go
@ -33,8 +33,8 @@ type StorageSnapshotProvider interface {
 // MemoryStorageSnapshot is a simple in-memory implementation of StorageSnapshot
 // Useful for testing or small datasets
 type MemoryStorageSnapshot struct {
-	Pairs    []KeyValuePair
+	Pairs     []KeyValuePair
-	position int
+	position  int
 }
 // KeyValuePair represents a key-value pair in storage
--- a/pkg/transport/access_control.go
+++ b/pkg/transport/access_control.go
@ -1,194 +0,0 @@
 package transport
 import (
 	"errors"
 	"sync"
 	"time"
 )
 var (
 	// ErrAccessDenied indicates the replica is not authorized
 	ErrAccessDenied = errors.New("access denied")
 	// ErrAuthenticationFailed indicates authentication failure
 	ErrAuthenticationFailed = errors.New("authentication failed")
 	// ErrInvalidToken indicates an invalid or expired token
 	ErrInvalidToken = errors.New("invalid or expired token")
 )
 // AuthMethod defines authentication methods for replicas
 type AuthMethod string
 const (
 	// AuthNone means no authentication required (not recommended for production)
 	AuthNone AuthMethod = "none"
 	// AuthToken uses a pre-shared token for authentication
 	AuthToken AuthMethod = "token"
 )
 // AccessLevel defines permission levels for replicas
 type AccessLevel int
 const (
 	// AccessNone has no permissions
 	AccessNone AccessLevel = iota
 	// AccessReadOnly can only read from the primary
 	AccessReadOnly
 	// AccessReadWrite can read and receive updates from the primary
 	AccessReadWrite
 	// AccessAdmin has full control including management operations
 	AccessAdmin
 )
 // ReplicaCredentials contains authentication information for a replica
 type ReplicaCredentials struct {
 	ReplicaID   string
 	AuthMethod  AuthMethod
 	Token       string // Token for authentication (in a production system, this would be hashed)
 	AccessLevel AccessLevel
 	ExpiresAt   time.Time // Token expiration time (zero means no expiration)
 }
 // AccessController manages authentication and authorization for replicas
 type AccessController struct {
 	mu          sync.RWMutex
 	credentials map[string]*ReplicaCredentials // Map of replicaID -> credentials
 	enabled     bool
 	defaultAuth AuthMethod
 }
 // NewAccessController creates a new access controller
 func NewAccessController(enabled bool, defaultAuth AuthMethod) *AccessController {
 	return &AccessController{
 		credentials: make(map[string]*ReplicaCredentials),
 		enabled:     enabled,
 		defaultAuth: defaultAuth,
 	}
 }
 // IsEnabled returns whether access control is enabled
 func (ac *AccessController) IsEnabled() bool {
 	return ac.enabled
 }
 // DefaultAuthMethod returns the default authentication method
 func (ac *AccessController) DefaultAuthMethod() AuthMethod {
 	return ac.defaultAuth
 }
 // RegisterReplica registers a new replica with credentials
 func (ac *AccessController) RegisterReplica(creds *ReplicaCredentials) error {
 	if !ac.enabled {
 		// If access control is disabled, we still register the replica but don't enforce controls
 		creds.AccessLevel = AccessAdmin
 	}
 	ac.mu.Lock()
 	defer ac.mu.Unlock()
 	// Store credentials (in a real system, we'd hash tokens here)
 	ac.credentials[creds.ReplicaID] = creds
 	return nil
 }
 // RemoveReplica removes a replica's credentials
 func (ac *AccessController) RemoveReplica(replicaID string) {
 	ac.mu.Lock()
 	defer ac.mu.Unlock()
 	delete(ac.credentials, replicaID)
 }
 // AuthenticateReplica authenticates a replica based on the provided credentials
 func (ac *AccessController) AuthenticateReplica(replicaID, token string) error {
 	if !ac.enabled {
 		return nil // Authentication disabled
 	}
 	ac.mu.RLock()
 	defer ac.mu.RUnlock()
 	creds, exists := ac.credentials[replicaID]
 	if !exists {
 		return ErrAccessDenied
 	}
 	// Check if credentials are expired
 	if !creds.ExpiresAt.IsZero() && time.Now().After(creds.ExpiresAt) {
 		return ErrInvalidToken
 	}
 	// Authenticate based on method
 	switch creds.AuthMethod {
 	case AuthNone:
 		return nil // No authentication required
 	case AuthToken:
 		// In a real system, we'd compare hashed tokens
 		if token != creds.Token {
 			return ErrAuthenticationFailed
 		}
 		return nil
 	default:
 		return ErrAuthenticationFailed
 	}
 }
 // AuthorizeReplicaAction checks if a replica has permission for an action
 func (ac *AccessController) AuthorizeReplicaAction(replicaID string, requiredLevel AccessLevel) error {
 	if !ac.enabled {
 		return nil // Authorization disabled
 	}
 	ac.mu.RLock()
 	defer ac.mu.RUnlock()
 	creds, exists := ac.credentials[replicaID]
 	if !exists {
 		return ErrAccessDenied
 	}
 	// Check permissions
 	if creds.AccessLevel < requiredLevel {
 		return ErrAccessDenied
 	}
 	return nil
 }
 // GetReplicaAccessLevel returns the access level for a replica
 func (ac *AccessController) GetReplicaAccessLevel(replicaID string) (AccessLevel, error) {
 	if !ac.enabled {
 		return AccessAdmin, nil // If disabled, return highest access level
 	}
 	ac.mu.RLock()
 	defer ac.mu.RUnlock()
 	creds, exists := ac.credentials[replicaID]
 	if !exists {
 		return AccessNone, ErrAccessDenied
 	}
 	return creds.AccessLevel, nil
 }
 // SetReplicaAccessLevel updates the access level for a replica
 func (ac *AccessController) SetReplicaAccessLevel(replicaID string, level AccessLevel) error {
 	ac.mu.Lock()
 	defer ac.mu.Unlock()
 	creds, exists := ac.credentials[replicaID]
 	if !exists {
 		return ErrAccessDenied
 	}
 	creds.AccessLevel = level
 	return nil
 }
--- a/pkg/transport/bootstrap_metrics.go
+++ b/pkg/transport/bootstrap_metrics.go
@ -1,159 +0,0 @@
 package transport
 import (
 	"sync"
 	"time"
 )
 // BootstrapMetrics contains metrics related to bootstrap operations
 type BootstrapMetrics struct {
 	// Bootstrap counts per replica
 	bootstrapCount     map[string]int
 	bootstrapCountLock sync.RWMutex
 	// Bootstrap progress per replica
 	bootstrapProgress     map[string]float64
 	bootstrapProgressLock sync.RWMutex
 	// Last successful bootstrap time per replica
 	lastBootstrap     map[string]time.Time
 	lastBootstrapLock sync.RWMutex
 }
 // newBootstrapMetrics creates a new bootstrap metrics container
 func newBootstrapMetrics() *BootstrapMetrics {
 	return &BootstrapMetrics{
 		bootstrapCount:    make(map[string]int),
 		bootstrapProgress: make(map[string]float64),
 		lastBootstrap:     make(map[string]time.Time),
 	}
 }
 // IncrementBootstrapCount increments the bootstrap count for a replica
 func (m *BootstrapMetrics) IncrementBootstrapCount(replicaID string) {
 	m.bootstrapCountLock.Lock()
 	defer m.bootstrapCountLock.Unlock()
 	m.bootstrapCount[replicaID]++
 }
 // GetBootstrapCount gets the bootstrap count for a replica
 func (m *BootstrapMetrics) GetBootstrapCount(replicaID string) int {
 	m.bootstrapCountLock.RLock()
 	defer m.bootstrapCountLock.RUnlock()
 	return m.bootstrapCount[replicaID]
 }
 // UpdateBootstrapProgress updates the bootstrap progress for a replica
 func (m *BootstrapMetrics) UpdateBootstrapProgress(replicaID string, progress float64) {
 	m.bootstrapProgressLock.Lock()
 	defer m.bootstrapProgressLock.Unlock()
 	m.bootstrapProgress[replicaID] = progress
 }
 // GetBootstrapProgress gets the bootstrap progress for a replica
 func (m *BootstrapMetrics) GetBootstrapProgress(replicaID string) float64 {
 	m.bootstrapProgressLock.RLock()
 	defer m.bootstrapProgressLock.RUnlock()
 	return m.bootstrapProgress[replicaID]
 }
 // MarkBootstrapCompleted marks a bootstrap as completed for a replica
 func (m *BootstrapMetrics) MarkBootstrapCompleted(replicaID string) {
 	m.lastBootstrapLock.Lock()
 	defer m.lastBootstrapLock.Unlock()
 	m.lastBootstrap[replicaID] = time.Now()
 }
 // GetLastBootstrapTime gets the last bootstrap time for a replica
 func (m *BootstrapMetrics) GetLastBootstrapTime(replicaID string) (time.Time, bool) {
 	m.lastBootstrapLock.RLock()
 	defer m.lastBootstrapLock.RUnlock()
 	ts, exists := m.lastBootstrap[replicaID]
 	return ts, exists
 }
 // GetAllBootstrapMetrics returns all bootstrap metrics as a map
 func (m *BootstrapMetrics) GetAllBootstrapMetrics() map[string]map[string]interface{} {
 	result := make(map[string]map[string]interface{})
 	// Get all replica IDs
 	var replicaIDs []string
 	m.bootstrapCountLock.RLock()
 	for id := range m.bootstrapCount {
 		replicaIDs = append(replicaIDs, id)
 	}
 	m.bootstrapCountLock.RUnlock()
 	m.bootstrapProgressLock.RLock()
 	for id := range m.bootstrapProgress {
 		found := false
 		for _, existingID := range replicaIDs {
 			if existingID == id {
 				found = true
 				break
 			}
 		}
 		if !found {
 			replicaIDs = append(replicaIDs, id)
 		}
 	}
 	m.bootstrapProgressLock.RUnlock()
 	m.lastBootstrapLock.RLock()
 	for id := range m.lastBootstrap {
 		found := false
 		for _, existingID := range replicaIDs {
 			if existingID == id {
 				found = true
 				break
 			}
 		}
 		if !found {
 			replicaIDs = append(replicaIDs, id)
 		}
 	}
 	m.lastBootstrapLock.RUnlock()
 	// Build metrics for each replica
 	for _, id := range replicaIDs {
 		replicaMetrics := make(map[string]interface{})
 		// Add bootstrap count
 		m.bootstrapCountLock.RLock()
 		if count, exists := m.bootstrapCount[id]; exists {
 			replicaMetrics["bootstrap_count"] = count
 		} else {
 			replicaMetrics["bootstrap_count"] = 0
 		}
 		m.bootstrapCountLock.RUnlock()
 		// Add bootstrap progress
 		m.bootstrapProgressLock.RLock()
 		if progress, exists := m.bootstrapProgress[id]; exists {
 			replicaMetrics["bootstrap_progress"] = progress
 		} else {
 			replicaMetrics["bootstrap_progress"] = 0.0
 		}
 		m.bootstrapProgressLock.RUnlock()
 		// Add last bootstrap time
 		m.lastBootstrapLock.RLock()
 		if ts, exists := m.lastBootstrap[id]; exists {
 			replicaMetrics["last_bootstrap"] = ts
 		} else {
 			replicaMetrics["last_bootstrap"] = nil
 		}
 		m.lastBootstrapLock.RUnlock()
 		result[id] = replicaMetrics
 	}
 	return result
 }
--- a/pkg/transport/errors.go
+++ b/pkg/transport/errors.go
@ -1,98 +0,0 @@
 package transport
 import (
 	"errors"
 	"fmt"
 )
 // Common error types for transport and reliability
 var (
 	// ErrMaxRetriesExceeded indicates the operation failed after all retries
 	ErrMaxRetriesExceeded = errors.New("maximum retries exceeded")
 	// ErrCircuitOpen indicates the circuit breaker is open
 	ErrCircuitOpen = errors.New("circuit breaker is open")
 	// ErrConnectionFailed indicates a connection failure
 	ErrConnectionFailed = errors.New("connection failed")
 	// ErrDisconnected indicates the connection was lost
 	ErrDisconnected = errors.New("connection was lost")
 	// ErrReconnectionFailed indicates reconnection attempts failed
 	ErrReconnectionFailed = errors.New("reconnection failed")
 	// ErrStreamClosed indicates the stream was closed
 	ErrStreamClosed = errors.New("stream was closed")
 	// ErrInvalidState indicates an invalid state
 	ErrInvalidState = errors.New("invalid state")
 	// ErrReplicaNotRegistered indicates the replica is not registered
 	ErrReplicaNotRegistered = errors.New("replica not registered")
 )
 // TemporaryError wraps an error with information about whether it's temporary
 type TemporaryError struct {
 	Err        error
 	IsTemp     bool
 	RetryAfter int // Suggested retry after duration in milliseconds
 }
 // Error returns the error string
 func (e *TemporaryError) Error() string {
 	if e.RetryAfter > 0 {
 		return fmt.Sprintf("%v (temporary: %v, retry after: %dms)", e.Err, e.IsTemp, e.RetryAfter)
 	}
 	return fmt.Sprintf("%v (temporary: %v)", e.Err, e.IsTemp)
 }
 // Unwrap returns the wrapped error
 func (e *TemporaryError) Unwrap() error {
 	return e.Err
 }
 // IsTemporary returns whether the error is temporary
 func (e *TemporaryError) IsTemporary() bool {
 	return e.IsTemp
 }
 // GetRetryAfter returns the suggested retry after duration
 func (e *TemporaryError) GetRetryAfter() int {
 	return e.RetryAfter
 }
 // NewTemporaryError creates a new temporary error
 func NewTemporaryError(err error, isTemp bool) *TemporaryError {
 	return &TemporaryError{
 		Err:    err,
 		IsTemp: isTemp,
 	}
 }
 // NewTemporaryErrorWithRetry creates a new temporary error with retry hint
 func NewTemporaryErrorWithRetry(err error, isTemp bool, retryAfter int) *TemporaryError {
 	return &TemporaryError{
 		Err:        err,
 		IsTemp:     isTemp,
 		RetryAfter: retryAfter,
 	}
 }
 // IsTemporary checks if an error is a temporary error
 func IsTemporary(err error) bool {
 	var tempErr *TemporaryError
 	if errors.As(err, &tempErr) {
 		return tempErr.IsTemporary()
 	}
 	return false
 }
 // GetRetryAfter extracts the retry hint from an error
 func GetRetryAfter(err error) int {
 	var tempErr *TemporaryError
 	if errors.As(err, &tempErr) {
 		return tempErr.GetRetryAfter()
 	}
 	return 0
 }
--- a/pkg/transport/errors_test.go
+++ b/pkg/transport/errors_test.go
@ -1,150 +0,0 @@
 package transport
 import (
 	"errors"
 	"fmt"
 	"strings"
 	"testing"
 )
 func TestTemporaryError(t *testing.T) {
 	t.Run("Basic error wrapping", func(t *testing.T) {
 		baseErr := errors.New("base error")
 		tempErr := NewTemporaryError(baseErr, true)
 		if !tempErr.IsTemporary() {
 			t.Error("Expected IsTemporary() to return true")
 		}
 		if tempErr.GetRetryAfter() != 0 {
 			t.Errorf("Expected GetRetryAfter() to return 0, got %d", tempErr.GetRetryAfter())
 		}
 		if !strings.Contains(tempErr.Error(), baseErr.Error()) {
 			t.Errorf("Expected Error() to contain the base error message")
 		}
 		if !strings.Contains(tempErr.Error(), "temporary: true") {
 			t.Errorf("Expected Error() to indicate temporary status")
 		}
 		// Test unwrap
 		unwrapped := errors.Unwrap(tempErr)
 		if unwrapped != baseErr {
 			t.Errorf("Expected Unwrap() to return the base error")
 		}
 	})
 	t.Run("Error with retry hint", func(t *testing.T) {
 		baseErr := errors.New("connection refused")
 		retryAfter := 1000 // 1 second
 		tempErr := NewTemporaryErrorWithRetry(baseErr, true, retryAfter)
 		if !tempErr.IsTemporary() {
 			t.Error("Expected IsTemporary() to return true")
 		}
 		if tempErr.GetRetryAfter() != retryAfter {
 			t.Errorf("Expected GetRetryAfter() to return %d, got %d", retryAfter, tempErr.GetRetryAfter())
 		}
 		if !strings.Contains(tempErr.Error(), baseErr.Error()) {
 			t.Errorf("Expected Error() to contain the base error message")
 		}
 		if !strings.Contains(tempErr.Error(), "temporary: true") {
 			t.Errorf("Expected Error() to indicate temporary status")
 		}
 		if !strings.Contains(tempErr.Error(), "retry after: 1000ms") {
 			t.Errorf("Expected Error() to include retry hint")
 		}
 	})
 	t.Run("Non-temporary error", func(t *testing.T) {
 		baseErr := errors.New("permanent error")
 		tempErr := NewTemporaryError(baseErr, false)
 		if tempErr.IsTemporary() {
 			t.Error("Expected IsTemporary() to return false")
 		}
 		if !strings.Contains(tempErr.Error(), "temporary: false") {
 			t.Errorf("Expected Error() to indicate non-temporary status")
 		}
 	})
 }
 func TestIsTemporary(t *testing.T) {
 	t.Run("With TemporaryError", func(t *testing.T) {
 		err := NewTemporaryError(errors.New("test error"), true)
 		if !IsTemporary(err) {
 			t.Error("Expected IsTemporary() to return true")
 		}
 		err = NewTemporaryError(errors.New("test error"), false)
 		if IsTemporary(err) {
 			t.Error("Expected IsTemporary() to return false")
 		}
 	})
 	t.Run("With regular error", func(t *testing.T) {
 		err := errors.New("regular error")
 		if IsTemporary(err) {
 			t.Error("Expected IsTemporary() to return false for regular error")
 		}
 	})
 	t.Run("With wrapped error", func(t *testing.T) {
 		tempErr := NewTemporaryError(errors.New("base error"), true)
 		wrappedErr := errors.New("wrapper: " + tempErr.Error())
 		wrappedTempErr := fmt.Errorf("wrapper: %w", tempErr)
 		// Regular wrapping doesn't preserve error type
 		if IsTemporary(wrappedErr) {
 			t.Error("Expected IsTemporary() to return false for string-wrapped error")
 		}
 		// fmt.Errorf with %w preserves error type
 		if !IsTemporary(wrappedTempErr) {
 			t.Error("Expected IsTemporary() to return true for properly wrapped error")
 		}
 	})
 }
 func TestGetRetryAfter(t *testing.T) {
 	t.Run("With retry hint", func(t *testing.T) {
 		retryAfter := 2000 // 2 seconds
 		err := NewTemporaryErrorWithRetry(errors.New("test error"), true, retryAfter)
 		if GetRetryAfter(err) != retryAfter {
 			t.Errorf("Expected GetRetryAfter() to return %d, got %d", retryAfter, GetRetryAfter(err))
 		}
 	})
 	t.Run("Without retry hint", func(t *testing.T) {
 		err := NewTemporaryError(errors.New("test error"), true)
 		if GetRetryAfter(err) != 0 {
 			t.Errorf("Expected GetRetryAfter() to return 0, got %d", GetRetryAfter(err))
 		}
 	})
 	t.Run("With regular error", func(t *testing.T) {
 		err := errors.New("regular error")
 		if GetRetryAfter(err) != 0 {
 			t.Errorf("Expected GetRetryAfter() to return 0, got %d", GetRetryAfter(err))
 		}
 	})
 	t.Run("With wrapped error", func(t *testing.T) {
 		retryAfter := 3000 // 3 seconds
 		tempErr := NewTemporaryErrorWithRetry(errors.New("base error"), true, retryAfter)
 		wrappedTempErr := fmt.Errorf("wrapper: %w", tempErr)
 		if GetRetryAfter(wrappedTempErr) != retryAfter {
 			t.Errorf("Expected GetRetryAfter() to return %d, got %d", retryAfter, GetRetryAfter(wrappedTempErr))
 		}
 	})
 }
--- a/pkg/transport/registry.go
+++ b/pkg/transport/registry.go
@ -7,9 +7,9 @@ import (
 // registry implements the Registry interface
 type registry struct {
-	mu                         sync.RWMutex
+	mu                      sync.RWMutex
-	clientFactories            map[string]ClientFactory
+	clientFactories         map[string]ClientFactory
-	serverFactories            map[string]ServerFactory
+	serverFactories         map[string]ServerFactory
 	replicationClientFactories map[string]ReplicationClientFactory
 	replicationServerFactories map[string]ReplicationServerFactory
 }
@ -17,8 +17,8 @@ type registry struct {
 // NewRegistry creates a new transport registry
 func NewRegistry() Registry {
 	return &registry{
-		clientFactories:            make(map[string]ClientFactory),
+		clientFactories: make(map[string]ClientFactory),
-		serverFactories:            make(map[string]ServerFactory),
+		serverFactories: make(map[string]ServerFactory),
 		replicationClientFactories: make(map[string]ReplicationClientFactory),
 		replicationServerFactories: make(map[string]ReplicationServerFactory),
 	}
--- a/pkg/transport/replica_persistence.go
+++ b/pkg/transport/replica_persistence.go
@ -1,310 +0,0 @@
 package transport
 import (
 	"encoding/json"
 	"errors"
 	"os"
 	"path/filepath"
 	"sync"
 	"time"
 )
 var (
 	// ErrPersistenceDisabled indicates persistence operations cannot be performed
 	ErrPersistenceDisabled = errors.New("persistence is disabled")
 	// ErrInvalidReplicaData indicates the stored replica data is invalid
 	ErrInvalidReplicaData = errors.New("invalid replica data")
 )
 // PersistentReplicaInfo contains replica information that can be persisted
 type PersistentReplicaInfo struct {
 	ID          string              `json:"id"`
 	Address     string              `json:"address"`
 	Role        string              `json:"role"`
 	LastSeen    int64               `json:"last_seen"`
 	CurrentLSN  uint64              `json:"current_lsn"`
 	Credentials *ReplicaCredentials `json:"credentials,omitempty"`
 }
 // ReplicaPersistence manages persistence of replica information
 type ReplicaPersistence struct {
 	mu        sync.RWMutex
 	dataDir   string
 	enabled   bool
 	autoSave  bool
 	replicas  map[string]*PersistentReplicaInfo
 	dirty     bool
 	lastSave  time.Time
 	saveTimer *time.Timer
 }
 // NewReplicaPersistence creates a new persistence manager
 func NewReplicaPersistence(dataDir string, enabled bool, autoSave bool) (*ReplicaPersistence, error) {
 	rp := &ReplicaPersistence{
 		dataDir:  dataDir,
 		enabled:  enabled,
 		autoSave: autoSave,
 		replicas: make(map[string]*PersistentReplicaInfo),
 	}
 	// Create data directory if it doesn't exist
 	if enabled {
 		if err := os.MkdirAll(dataDir, 0755); err != nil {
 			return nil, err
 		}
 		// Load existing data
 		if err := rp.Load(); err != nil {
 			return nil, err
 		}
 		// Start auto-save timer if needed
 		if autoSave {
 			rp.saveTimer = time.AfterFunc(10*time.Second, rp.autoSaveFunc)
 		}
 	}
 	return rp, nil
 }
 // autoSaveFunc is called periodically to save replica data
 func (rp *ReplicaPersistence) autoSaveFunc() {
 	rp.mu.RLock()
 	dirty := rp.dirty
 	rp.mu.RUnlock()
 	if dirty {
 		if err := rp.Save(); err != nil {
 			// In a production system, this should be logged properly
 			println("Error auto-saving replica data:", err.Error())
 		}
 	}
 	// Reschedule timer
 	rp.saveTimer.Reset(10 * time.Second)
 }
 // FromReplicaInfo converts a ReplicaInfo to a persistent form
 func (rp *ReplicaPersistence) FromReplicaInfo(info *ReplicaInfo, creds *ReplicaCredentials) *PersistentReplicaInfo {
 	return &PersistentReplicaInfo{
 		ID:          info.ID,
 		Address:     info.Address,
 		Role:        string(info.Role),
 		LastSeen:    info.LastSeen.UnixMilli(),
 		CurrentLSN:  info.CurrentLSN,
 		Credentials: creds,
 	}
 }
 // ToReplicaInfo converts from persistent form to ReplicaInfo
 func (rp *ReplicaPersistence) ToReplicaInfo(pinfo *PersistentReplicaInfo) *ReplicaInfo {
 	info := &ReplicaInfo{
 		ID:         pinfo.ID,
 		Address:    pinfo.Address,
 		Role:       ReplicaRole(pinfo.Role),
 		LastSeen:   time.UnixMilli(pinfo.LastSeen),
 		CurrentLSN: pinfo.CurrentLSN,
 	}
 	return info
 }
 // Save persists all replica information to disk
 func (rp *ReplicaPersistence) Save() error {
 	if !rp.enabled {
 		return ErrPersistenceDisabled
 	}
 	rp.mu.Lock()
 	defer rp.mu.Unlock()
 	// Nothing to save if no replicas or not dirty
 	if len(rp.replicas) == 0 || !rp.dirty {
 		return nil
 	}
 	// Save each replica to its own file for better concurrency
 	for id, replica := range rp.replicas {
 		filename := filepath.Join(rp.dataDir, "replica_"+id+".json")
 		data, err := json.MarshalIndent(replica, "", "  ")
 		if err != nil {
 			return err
 		}
 		// Write to temp file first, then rename for atomic update
 		tempFile := filename + ".tmp"
 		if err := os.WriteFile(tempFile, data, 0644); err != nil {
 			return err
 		}
 		if err := os.Rename(tempFile, filename); err != nil {
 			return err
 		}
 	}
 	rp.dirty = false
 	rp.lastSave = time.Now()
 	return nil
 }
 // IsEnabled returns whether persistence is enabled
 func (rp *ReplicaPersistence) IsEnabled() bool {
 	return rp.enabled
 }
 // Load reads all persisted replica information from disk
 func (rp *ReplicaPersistence) Load() error {
 	if !rp.enabled {
 		return ErrPersistenceDisabled
 	}
 	rp.mu.Lock()
 	defer rp.mu.Unlock()
 	// Clear existing data
 	rp.replicas = make(map[string]*PersistentReplicaInfo)
 	// Find all replica files
 	pattern := filepath.Join(rp.dataDir, "replica_*.json")
 	files, err := filepath.Glob(pattern)
 	if err != nil {
 		return err
 	}
 	// Load each file
 	for _, file := range files {
 		data, err := os.ReadFile(file)
 		if err != nil {
 			// Skip files with read errors
 			continue
 		}
 		var replica PersistentReplicaInfo
 		if err := json.Unmarshal(data, &replica); err != nil {
 			// Skip files with parse errors
 			continue
 		}
 		// Validate replica data
 		if replica.ID == "" {
 			continue
 		}
 		rp.replicas[replica.ID] = &replica
 	}
 	rp.dirty = false
 	return nil
 }
 // SaveReplica persists a single replica's information
 func (rp *ReplicaPersistence) SaveReplica(info *ReplicaInfo, creds *ReplicaCredentials) error {
 	if !rp.enabled {
 		return ErrPersistenceDisabled
 	}
 	if info == nil || info.ID == "" {
 		return ErrInvalidReplicaData
 	}
 	pinfo := rp.FromReplicaInfo(info, creds)
 	rp.mu.Lock()
 	rp.replicas[info.ID] = pinfo
 	rp.dirty = true
 	// For immediate save option
 	shouldSave := !rp.autoSave
 	rp.mu.Unlock()
 	// Save immediately if auto-save is disabled
 	if shouldSave {
 		return rp.Save()
 	}
 	return nil
 }
 // LoadReplica loads a single replica's information
 func (rp *ReplicaPersistence) LoadReplica(id string) (*ReplicaInfo, *ReplicaCredentials, error) {
 	if !rp.enabled {
 		return nil, nil, ErrPersistenceDisabled
 	}
 	if id == "" {
 		return nil, nil, ErrInvalidReplicaData
 	}
 	rp.mu.RLock()
 	defer rp.mu.RUnlock()
 	pinfo, exists := rp.replicas[id]
 	if !exists {
 		return nil, nil, nil // Not found but not an error
 	}
 	return rp.ToReplicaInfo(pinfo), pinfo.Credentials, nil
 }
 // DeleteReplica removes a replica's persisted information
 func (rp *ReplicaPersistence) DeleteReplica(id string) error {
 	if !rp.enabled {
 		return ErrPersistenceDisabled
 	}
 	if id == "" {
 		return ErrInvalidReplicaData
 	}
 	rp.mu.Lock()
 	defer rp.mu.Unlock()
 	// Remove from memory
 	delete(rp.replicas, id)
 	rp.dirty = true
 	// Remove file
 	filename := filepath.Join(rp.dataDir, "replica_"+id+".json")
 	err := os.Remove(filename)
 	// Ignore file not found errors
 	if err != nil && !os.IsNotExist(err) {
 		return err
 	}
 	return nil
 }
 // GetAllReplicas returns all persisted replicas
 func (rp *ReplicaPersistence) GetAllReplicas() (map[string]*ReplicaInfo, map[string]*ReplicaCredentials, error) {
 	if !rp.enabled {
 		return nil, nil, ErrPersistenceDisabled
 	}
 	rp.mu.RLock()
 	defer rp.mu.RUnlock()
 	infoMap := make(map[string]*ReplicaInfo, len(rp.replicas))
 	credsMap := make(map[string]*ReplicaCredentials, len(rp.replicas))
 	for id, pinfo := range rp.replicas {
 		infoMap[id] = rp.ToReplicaInfo(pinfo)
 		credsMap[id] = pinfo.Credentials
 	}
 	return infoMap, credsMap, nil
 }
 // Close shuts down the persistence manager
 func (rp *ReplicaPersistence) Close() error {
 	if !rp.enabled {
 		return nil
 	}
 	// Stop auto-save timer
 	if rp.autoSave && rp.saveTimer != nil {
 		rp.saveTimer.Stop()
 	}
 	// Save any pending changes
 	return rp.Save()
 }
--- a/pkg/transport/replication.go
+++ b/pkg/transport/replication.go
@ -10,11 +10,11 @@ import (
 // Standard constants for replication message types
 const (
 	// Request types
-	TypeReplicaRegister  = "replica_register"
+	TypeReplicaRegister      = "replica_register"
-	TypeReplicaHeartbeat = "replica_heartbeat"
+	TypeReplicaHeartbeat     = "replica_heartbeat"
-	TypeReplicaWALSync   = "replica_wal_sync"
+	TypeReplicaWALSync       = "replica_wal_sync"
-	TypeReplicaBootstrap = "replica_bootstrap"
+	TypeReplicaBootstrap     = "replica_bootstrap"
-	TypeReplicaStatus    = "replica_status"
+	TypeReplicaStatus        = "replica_status"
 	// Response types
 	TypeReplicaACK           = "replica_ack"
@ -38,24 +38,24 @@ type ReplicaStatus string
 // Replica statuses
 const (
-	StatusConnecting    ReplicaStatus = "connecting"
+	StatusConnecting   ReplicaStatus = "connecting"
-	StatusSyncing       ReplicaStatus = "syncing"
+	StatusSyncing      ReplicaStatus = "syncing"
 	StatusBootstrapping ReplicaStatus = "bootstrapping"
-	StatusReady         ReplicaStatus = "ready"
+	StatusReady        ReplicaStatus = "ready"
-	StatusDisconnected  ReplicaStatus = "disconnected"
+	StatusDisconnected ReplicaStatus = "disconnected"
-	StatusError         ReplicaStatus = "error"
+	StatusError        ReplicaStatus = "error"
 )
 // ReplicaInfo contains information about a replica
 type ReplicaInfo struct {
-	ID             string
+	ID            string
-	Address        string
+	Address       string
-	Role           ReplicaRole
+	Role          ReplicaRole
-	Status         ReplicaStatus
+	Status        ReplicaStatus
-	LastSeen       time.Time
+	LastSeen      time.Time
-	CurrentLSN     uint64 // Lamport Sequence Number
+	CurrentLSN    uint64  // Lamport Sequence Number
 	ReplicationLag time.Duration
-	Error          error
+	Error         error
 }
 // ReplicationStreamDirection defines the direction of a replication stream
--- a/pkg/transport/replication_metrics.go
+++ b/pkg/transport/replication_metrics.go
@ -1,354 +0,0 @@
 package transport
 import (
 	"sync"
 	"time"
 )
 // ReplicaMetrics contains metrics for a single replica
 type ReplicaMetrics struct {
 	ReplicaID         string        // ID of the replica
 	Status            ReplicaStatus // Current status
 	ConnectedDuration time.Duration // How long the replica has been connected
 	LastSeen          time.Time     // Last time a heartbeat was received
 	ReplicationLag    time.Duration // Current replication lag
 	AppliedLSN        uint64        // Last LSN applied on the replica
 	WALEntriesSent    uint64        // Number of WAL entries sent to this replica
 	HeartbeatCount    uint64        // Number of heartbeats received
 	ErrorCount        uint64        // Number of errors encountered
 	// For bandwidth metrics
 	BytesSent        uint64 // Total bytes sent to this replica
 	BytesReceived    uint64 // Total bytes received from this replica
 	LastTransferRate uint64 // Bytes/second in the last measurement period
 	// Bootstrap metrics
 	BootstrapCount        uint64        // Number of times bootstrapped
 	LastBootstrapTime     time.Time     // Last time a bootstrap was completed
 	LastBootstrapDuration time.Duration // Duration of the last bootstrap
 }
 // NewReplicaMetrics creates a new metrics collector for a replica
 func NewReplicaMetrics(replicaID string) *ReplicaMetrics {
 	return &ReplicaMetrics{
 		ReplicaID: replicaID,
 		Status:    StatusDisconnected,
 		LastSeen:  time.Now(),
 	}
 }
 // ReplicationMetrics collects and provides metrics about replication
 type ReplicationMetrics struct {
 	mu             sync.RWMutex
 	replicaMetrics map[string]*ReplicaMetrics // Metrics by replica ID
 	// Overall replication metrics
 	PrimaryLSN            uint64        // Current LSN on primary
 	TotalWALEntriesSent   uint64        // Total WAL entries sent to all replicas
 	TotalBytesTransferred uint64        // Total bytes transferred
 	ActiveReplicaCount    int           // Number of currently active replicas
 	TotalErrorCount       uint64        // Total error count across all replicas
 	TotalHeartbeatCount   uint64        // Total heartbeats processed
 	AverageReplicationLag time.Duration // Average lag across replicas
 	MaxReplicationLag     time.Duration // Maximum lag across replicas
 	// For performance tracking
 	processingTime  map[string]time.Duration // Processing time by operation type
 	processingCount map[string]uint64        // Operation counts
 	lastSampleTime  time.Time                // Last time metrics were sampled
 	// Bootstrap metrics
 	bootstrapMetrics *BootstrapMetrics
 }
 // NewReplicationMetrics creates a new metrics collector
 func NewReplicationMetrics() *ReplicationMetrics {
 	return &ReplicationMetrics{
 		replicaMetrics:   make(map[string]*ReplicaMetrics),
 		processingTime:   make(map[string]time.Duration),
 		processingCount:  make(map[string]uint64),
 		lastSampleTime:   time.Now(),
 		bootstrapMetrics: newBootstrapMetrics(),
 	}
 }
 // GetOrCreateReplicaMetrics gets metrics for a replica, creating if needed
 func (rm *ReplicationMetrics) GetOrCreateReplicaMetrics(replicaID string) *ReplicaMetrics {
 	rm.mu.RLock()
 	metrics, exists := rm.replicaMetrics[replicaID]
 	rm.mu.RUnlock()
 	if exists {
 		return metrics
 	}
 	// Create new metrics
 	metrics = NewReplicaMetrics(replicaID)
 	rm.mu.Lock()
 	rm.replicaMetrics[replicaID] = metrics
 	rm.mu.Unlock()
 	return metrics
 }
 // UpdateReplicaStatus updates a replica's status and metrics
 func (rm *ReplicationMetrics) UpdateReplicaStatus(replicaID string, status ReplicaStatus, lsn uint64) {
 	rm.mu.Lock()
 	defer rm.mu.Unlock()
 	metrics, exists := rm.replicaMetrics[replicaID]
 	if !exists {
 		metrics = NewReplicaMetrics(replicaID)
 		rm.replicaMetrics[replicaID] = metrics
 	}
 	// Update last seen
 	now := time.Now()
 	metrics.LastSeen = now
 	// Update status
 	oldStatus := metrics.Status
 	metrics.Status = status
 	// If just connected, start tracking connected duration
 	if oldStatus != StatusReady && status == StatusReady {
 		metrics.ConnectedDuration = 0
 	}
 	// Update LSN and calculate lag
 	if lsn > 0 {
 		metrics.AppliedLSN = lsn
 		// Calculate lag (primary LSN - replica LSN)
 		if rm.PrimaryLSN > lsn {
 			lag := rm.PrimaryLSN - lsn
 			// Convert to a time.Duration (assuming LSN ~ timestamp)
 			metrics.ReplicationLag = time.Duration(lag) * time.Millisecond
 		} else {
 			metrics.ReplicationLag = 0
 		}
 	}
 	// Increment heartbeat count
 	metrics.HeartbeatCount++
 	rm.TotalHeartbeatCount++
 	// Count active replicas and update aggregate metrics
 	rm.updateAggregateMetrics()
 }
 // RecordWALEntries records WAL entries sent to a replica
 func (rm *ReplicationMetrics) RecordWALEntries(replicaID string, count uint64, bytes uint64) {
 	rm.mu.Lock()
 	defer rm.mu.Unlock()
 	metrics, exists := rm.replicaMetrics[replicaID]
 	if !exists {
 		metrics = NewReplicaMetrics(replicaID)
 		rm.replicaMetrics[replicaID] = metrics
 	}
 	// Update WAL entries count
 	metrics.WALEntriesSent += count
 	rm.TotalWALEntriesSent += count
 	// Update bytes transferred
 	metrics.BytesSent += bytes
 	rm.TotalBytesTransferred += bytes
 	// Calculate transfer rate
 	now := time.Now()
 	elapsed := now.Sub(rm.lastSampleTime)
 	if elapsed > time.Second {
 		metrics.LastTransferRate = uint64(float64(bytes) / elapsed.Seconds())
 		rm.lastSampleTime = now
 	}
 }
 // RecordBootstrap records a bootstrap operation
 func (rm *ReplicationMetrics) RecordBootstrap(replicaID string, duration time.Duration) {
 	rm.mu.Lock()
 	defer rm.mu.Unlock()
 	metrics, exists := rm.replicaMetrics[replicaID]
 	if !exists {
 		metrics = NewReplicaMetrics(replicaID)
 		rm.replicaMetrics[replicaID] = metrics
 	}
 	metrics.BootstrapCount++
 	metrics.LastBootstrapTime = time.Now()
 	metrics.LastBootstrapDuration = duration
 }
 // RecordError records an error for a replica
 func (rm *ReplicationMetrics) RecordError(replicaID string) {
 	rm.mu.Lock()
 	defer rm.mu.Unlock()
 	metrics, exists := rm.replicaMetrics[replicaID]
 	if !exists {
 		metrics = NewReplicaMetrics(replicaID)
 		rm.replicaMetrics[replicaID] = metrics
 	}
 	metrics.ErrorCount++
 	rm.TotalErrorCount++
 }
 // RecordOperationDuration records the duration of a replication operation
 func (rm *ReplicationMetrics) RecordOperationDuration(operation string, duration time.Duration) {
 	rm.mu.Lock()
 	defer rm.mu.Unlock()
 	rm.processingTime[operation] += duration
 	rm.processingCount[operation]++
 }
 // GetAverageOperationDuration returns the average duration for an operation
 func (rm *ReplicationMetrics) GetAverageOperationDuration(operation string) time.Duration {
 	rm.mu.RLock()
 	defer rm.mu.RUnlock()
 	count := rm.processingCount[operation]
 	if count == 0 {
 		return 0
 	}
 	return time.Duration(int64(rm.processingTime[operation]) / int64(count))
 }
 // GetAllReplicaMetrics returns a copy of all replica metrics
 func (rm *ReplicationMetrics) GetAllReplicaMetrics() map[string]ReplicaMetrics {
 	rm.mu.RLock()
 	defer rm.mu.RUnlock()
 	result := make(map[string]ReplicaMetrics, len(rm.replicaMetrics))
 	for id, metrics := range rm.replicaMetrics {
 		result[id] = *metrics // Make a copy
 	}
 	return result
 }
 // GetReplicaMetrics returns metrics for a specific replica
 func (rm *ReplicationMetrics) GetReplicaMetrics(replicaID string) (ReplicaMetrics, bool) {
 	rm.mu.RLock()
 	defer rm.mu.RUnlock()
 	metrics, exists := rm.replicaMetrics[replicaID]
 	if !exists {
 		return ReplicaMetrics{}, false
 	}
 	return *metrics, true
 }
 // GetSummaryMetrics returns summary metrics for all replicas
 func (rm *ReplicationMetrics) GetSummaryMetrics() map[string]interface{} {
 	rm.mu.RLock()
 	defer rm.mu.RUnlock()
 	return map[string]interface{}{
 		"primary_lsn":             rm.PrimaryLSN,
 		"active_replicas":         rm.ActiveReplicaCount,
 		"total_wal_entries_sent":  rm.TotalWALEntriesSent,
 		"total_bytes_transferred": rm.TotalBytesTransferred,
 		"avg_replication_lag_ms":  rm.AverageReplicationLag.Milliseconds(),
 		"max_replication_lag_ms":  rm.MaxReplicationLag.Milliseconds(),
 		"total_errors":            rm.TotalErrorCount,
 		"total_heartbeats":        rm.TotalHeartbeatCount,
 	}
 }
 // UpdatePrimaryLSN updates the current primary LSN
 func (rm *ReplicationMetrics) UpdatePrimaryLSN(lsn uint64) {
 	rm.mu.Lock()
 	defer rm.mu.Unlock()
 	rm.PrimaryLSN = lsn
 	// Update lag for all replicas based on new primary LSN
 	for _, metrics := range rm.replicaMetrics {
 		if rm.PrimaryLSN > metrics.AppliedLSN {
 			lag := rm.PrimaryLSN - metrics.AppliedLSN
 			metrics.ReplicationLag = time.Duration(lag) * time.Millisecond
 		} else {
 			metrics.ReplicationLag = 0
 		}
 	}
 	// Update aggregate metrics
 	rm.updateAggregateMetrics()
 }
 // updateAggregateMetrics updates aggregate metrics based on all replicas
 func (rm *ReplicationMetrics) updateAggregateMetrics() {
 	// Count active replicas
 	activeCount := 0
 	var totalLag time.Duration
 	maxLag := time.Duration(0)
 	for _, metrics := range rm.replicaMetrics {
 		if metrics.Status == StatusReady {
 			activeCount++
 			totalLag += metrics.ReplicationLag
 			if metrics.ReplicationLag > maxLag {
 				maxLag = metrics.ReplicationLag
 			}
 		}
 	}
 	rm.ActiveReplicaCount = activeCount
 	// Calculate average lag
 	if activeCount > 0 {
 		rm.AverageReplicationLag = totalLag / time.Duration(activeCount)
 	} else {
 		rm.AverageReplicationLag = 0
 	}
 	rm.MaxReplicationLag = maxLag
 }
 // UpdateConnectedDurations updates connected durations for all replicas
 func (rm *ReplicationMetrics) UpdateConnectedDurations() {
 	rm.mu.Lock()
 	defer rm.mu.Unlock()
 	now := time.Now()
 	for _, metrics := range rm.replicaMetrics {
 		if metrics.Status == StatusReady {
 			metrics.ConnectedDuration = now.Sub(metrics.LastSeen) + metrics.ConnectedDuration
 		}
 	}
 }
 // IncrementBootstrapCount increments the bootstrap count for a replica
 func (rm *ReplicationMetrics) IncrementBootstrapCount(replicaID string) {
 	rm.mu.Lock()
 	defer rm.mu.Unlock()
 	// Update per-replica metrics
 	metrics, exists := rm.replicaMetrics[replicaID]
 	if !exists {
 		metrics = NewReplicaMetrics(replicaID)
 		rm.replicaMetrics[replicaID] = metrics
 	}
 	metrics.BootstrapCount++
 	// Also update dedicated bootstrap metrics if available
 	if rm.bootstrapMetrics != nil {
 		rm.bootstrapMetrics.IncrementBootstrapCount(replicaID)
 	}
 }
 // UpdateBootstrapProgress updates the bootstrap progress for a replica
 func (rm *ReplicationMetrics) UpdateBootstrapProgress(replicaID string, progress float64) {
 	if rm.bootstrapMetrics != nil {
 		rm.bootstrapMetrics.UpdateBootstrapProgress(replicaID, progress)
 	}
 }
--- a/pkg/transport/replication_test.go
+++ b/pkg/transport/replication_test.go
@ -10,7 +10,7 @@ import (
 // MockReplicationClient implements ReplicationClient for testing
 type MockReplicationClient struct {
-	connected           bool
+	connected          bool
 	registeredAsReplica bool
 	heartbeatSent       bool
 	walEntriesRequested bool
@ -23,7 +23,7 @@ type MockReplicationClient struct {
 func NewMockReplicationClient() *MockReplicationClient {
 	return &MockReplicationClient{
-		connected:           false,
+		connected:          false,
 		registeredAsReplica: false,
 		heartbeatSent:       false,
 		walEntriesRequested: false,
@ -169,12 +169,12 @@ func TestReplicationClientInterface(t *testing.T) {
 	// Test SendHeartbeat
 	replicaInfo := &ReplicaInfo{
-		ID:             "replica1",
+		ID:            "replica1",
-		Address:        "localhost:50051",
+		Address:       "localhost:50051",
-		Role:           RoleReplica,
+		Role:          RoleReplica,
-		Status:         StatusReady,
+		Status:        StatusReady,
-		LastSeen:       time.Now(),
+		LastSeen:      time.Now(),
-		CurrentLSN:     100,
+		CurrentLSN:    100,
 		ReplicationLag: 0,
 	}
 	err = client.SendHeartbeat(ctx, replicaInfo)
@ -340,12 +340,12 @@ func TestReplicationServerInterface(t *testing.T) {
 	// Test RegisterReplica
 	replica1 := &ReplicaInfo{
-		ID:             "replica1",
+		ID:            "replica1",
-		Address:        "localhost:50051",
+		Address:       "localhost:50051",
-		Role:           RoleReplica,
+		Role:          RoleReplica,
-		Status:         StatusConnecting,
+		Status:        StatusConnecting,
-		LastSeen:       time.Now(),
+		LastSeen:      time.Now(),
-		CurrentLSN:     0,
+		CurrentLSN:    0,
 		ReplicationLag: 0,
 	}
 	err = server.RegisterReplica(replica1)
--- a/pkg/transport/retry.go
+++ b/pkg/transport/retry.go
@ -1,209 +0,0 @@
 package transport
 import (
 	"context"
 	"math"
 	"math/rand"
 	"time"
 )
 // RetryableFunc is a function that can be retried
 type RetryableFunc func(ctx context.Context) error
 // WithRetry executes a function with retry logic based on the provided policy
 func WithRetry(ctx context.Context, policy RetryPolicy, fn RetryableFunc) error {
 	var err error
 	backoff := policy.InitialBackoff
 	for attempt := 0; attempt <= policy.MaxRetries; attempt++ {
 		// Execute the function
 		err = fn(ctx)
 		if err == nil {
 			// Success
 			return nil
 		}
 		// Check if we should continue retrying
 		if attempt == policy.MaxRetries {
 			break
 		}
 		// Check if context is done
 		select {
 		case <-ctx.Done():
 			return ctx.Err()
 		default:
 			// Continue
 		}
 		// Add jitter to prevent thundering herd
 		jitter := 1.0
 		if policy.Jitter > 0 {
 			jitter = 1.0 + rand.Float64()*policy.Jitter
 		}
 		// Calculate next backoff with jitter
 		backoffWithJitter := time.Duration(float64(backoff) * jitter)
 		if backoffWithJitter > policy.MaxBackoff {
 			backoffWithJitter = policy.MaxBackoff
 		}
 		// Wait for backoff period
 		timer := time.NewTimer(backoffWithJitter)
 		select {
 		case <-ctx.Done():
 			timer.Stop()
 			return ctx.Err()
 		case <-timer.C:
 			// Continue with next attempt
 		}
 		// Increase backoff for next attempt
 		backoff = time.Duration(float64(backoff) * policy.BackoffFactor)
 		if backoff > policy.MaxBackoff {
 			backoff = policy.MaxBackoff
 		}
 	}
 	return err
 }
 // DefaultRetryPolicy returns a sensible default retry policy
 func DefaultRetryPolicy() RetryPolicy {
 	return RetryPolicy{
 		MaxRetries:     3,
 		InitialBackoff: 100 * time.Millisecond,
 		MaxBackoff:     5 * time.Second,
 		BackoffFactor:  2.0,
 		Jitter:         0.2,
 	}
 }
 // CircuitBreakerState represents the state of a circuit breaker
 type CircuitBreakerState int
 const (
 	// CircuitClosed means the circuit is closed and operations are permitted
 	CircuitClosed CircuitBreakerState = iota
 	// CircuitOpen means the circuit is open and operations will fail fast
 	CircuitOpen
 	// CircuitHalfOpen means the circuit is allowing a test operation
 	CircuitHalfOpen
 )
 // CircuitBreaker implements the circuit breaker pattern
 type CircuitBreaker struct {
 	state             CircuitBreakerState
 	failureThreshold  int
 	resetTimeout      time.Duration
 	failureCount      int
 	lastFailure       time.Time
 	lastStateChange   time.Time
 	successThreshold  int
 	halfOpenSuccesses int
 }
 // NewCircuitBreaker creates a new circuit breaker
 func NewCircuitBreaker(failureThreshold int, resetTimeout time.Duration) *CircuitBreaker {
 	return &CircuitBreaker{
 		state:            CircuitClosed,
 		failureThreshold: failureThreshold,
 		resetTimeout:     resetTimeout,
 		successThreshold: 1, // Default to 1 success required to close circuit
 	}
 }
 // Execute attempts to execute a function with circuit breaker protection
 func (cb *CircuitBreaker) Execute(ctx context.Context, fn RetryableFunc) error {
 	// Check if circuit is open
 	if cb.IsOpen() && !cb.shouldAttemptReset() {
 		return ErrCircuitOpen
 	}
 	// Mark as half-open if we're attempting a reset
 	if cb.state == CircuitOpen {
 		cb.state = CircuitHalfOpen
 		cb.halfOpenSuccesses = 0
 		cb.lastStateChange = time.Now()
 	}
 	// Execute the function
 	err := fn(ctx)
 	// Handle result
 	if err != nil {
 		// Record failure
 		cb.recordFailure()
 		return err
 	}
 	// Record success
 	cb.recordSuccess()
 	return nil
 }
 // IsOpen returns whether the circuit is open
 func (cb *CircuitBreaker) IsOpen() bool {
 	return cb.state == CircuitOpen || cb.state == CircuitHalfOpen
 }
 // Trip manually opens the circuit
 func (cb *CircuitBreaker) Trip() {
 	cb.state = CircuitOpen
 	cb.lastStateChange = time.Now()
 }
 // Reset manually closes the circuit
 func (cb *CircuitBreaker) Reset() {
 	cb.state = CircuitClosed
 	cb.failureCount = 0
 	cb.lastStateChange = time.Now()
 }
 // recordFailure records a failure and potentially opens the circuit
 func (cb *CircuitBreaker) recordFailure() {
 	cb.lastFailure = time.Now()
 	switch cb.state {
 	case CircuitClosed:
 		cb.failureCount++
 		if cb.failureCount >= cb.failureThreshold {
 			cb.state = CircuitOpen
 			cb.lastStateChange = time.Now()
 		}
 	case CircuitHalfOpen:
 		cb.state = CircuitOpen
 		cb.lastStateChange = time.Now()
 	}
 }
 // recordSuccess records a success and potentially closes the circuit
 func (cb *CircuitBreaker) recordSuccess() {
 	switch cb.state {
 	case CircuitHalfOpen:
 		cb.halfOpenSuccesses++
 		if cb.halfOpenSuccesses >= cb.successThreshold {
 			cb.state = CircuitClosed
 			cb.failureCount = 0
 			cb.lastStateChange = time.Now()
 		}
 	case CircuitClosed:
 		// Reset failure count after a success
 		cb.failureCount = 0
 	}
 }
 // shouldAttemptReset determines if enough time has passed to attempt a reset
 func (cb *CircuitBreaker) shouldAttemptReset() bool {
 	return cb.state == CircuitOpen &&
 		time.Since(cb.lastStateChange) >= cb.resetTimeout
 }
 // ExponentialBackoff calculates the next backoff duration
 func ExponentialBackoff(attempt int, initialBackoff time.Duration, maxBackoff time.Duration, factor float64) time.Duration {
 	backoff := float64(initialBackoff) * math.Pow(factor, float64(attempt))
 	if backoff > float64(maxBackoff) {
 		return maxBackoff
 	}
 	return time.Duration(backoff)
 }
--- a/pkg/transport/retry_test.go
+++ b/pkg/transport/retry_test.go
@ -1,208 +0,0 @@
 package transport
 import (
 	"context"
 	"errors"
 	"testing"
 	"time"
 )
 func TestWithRetrySuccess(t *testing.T) {
 	callCount := 0
 	successOnAttempt := 3
 	fn := func(ctx context.Context) error {
 		callCount++
 		if callCount >= successOnAttempt {
 			return nil
 		}
 		return errors.New("temporary error")
 	}
 	policy := RetryPolicy{
 		MaxRetries:     5,
 		InitialBackoff: 1 * time.Millisecond,
 		MaxBackoff:     10 * time.Millisecond,
 		BackoffFactor:  2.0,
 		Jitter:         0.1,
 	}
 	err := WithRetry(context.Background(), policy, fn)
 	if err != nil {
 		t.Errorf("Expected success, got error: %v", err)
 	}
 	if callCount != successOnAttempt {
 		t.Errorf("Expected %d calls, got %d", successOnAttempt, callCount)
 	}
 }
 func TestWithRetryExceedMaxRetries(t *testing.T) {
 	callCount := 0
 	fn := func(ctx context.Context) error {
 		callCount++
 		return errors.New("persistent error")
 	}
 	policy := RetryPolicy{
 		MaxRetries:     3,
 		InitialBackoff: 1 * time.Millisecond,
 		MaxBackoff:     10 * time.Millisecond,
 		BackoffFactor:  2.0,
 		Jitter:         0.0, // Disable jitter for deterministic tests
 	}
 	err := WithRetry(context.Background(), policy, fn)
 	if err == nil {
 		t.Error("Expected error, got nil")
 	}
 	expectedCalls := policy.MaxRetries + 1 // Initial try + retries
 	if callCount != expectedCalls {
 		t.Errorf("Expected %d calls, got %d", expectedCalls, callCount)
 	}
 }
 func TestWithRetryContextCancellation(t *testing.T) {
 	callCount := 0
 	fn := func(ctx context.Context) error {
 		callCount++
 		return errors.New("error")
 	}
 	policy := RetryPolicy{
 		MaxRetries:     10,
 		InitialBackoff: 50 * time.Millisecond,
 		MaxBackoff:     1 * time.Second,
 		BackoffFactor:  2.0,
 		Jitter:         0.0,
 	}
 	ctx, cancel := context.WithCancel(context.Background())
 	// Cancel the context after a short time
 	go func() {
 		time.Sleep(10 * time.Millisecond)
 		cancel()
 	}()
 	err := WithRetry(ctx, policy, fn)
 	if err == nil {
 		t.Error("Expected context cancellation error, got nil")
 	}
 	if !errors.Is(err, context.Canceled) {
 		t.Errorf("Expected context.Canceled error, got: %v", err)
 	}
 }
 func TestExponentialBackoff(t *testing.T) {
 	initialBackoff := 100 * time.Millisecond
 	maxBackoff := 10 * time.Second
 	factor := 2.0
 	tests := []struct {
 		name     string
 		attempt  int
 		expected time.Duration
 	}{
 		{"FirstAttempt", 0, 100 * time.Millisecond},
 		{"SecondAttempt", 1, 200 * time.Millisecond},
 		{"ThirdAttempt", 2, 400 * time.Millisecond},
 		{"FourthAttempt", 3, 800 * time.Millisecond},
 		{"MaxBackoff", 10, maxBackoff}, // This would exceed maxBackoff
 	}
 	for _, tt := range tests {
 		t.Run(tt.name, func(t *testing.T) {
 			result := ExponentialBackoff(tt.attempt, initialBackoff, maxBackoff, factor)
 			if result != tt.expected {
 				t.Errorf("Expected %v, got %v", tt.expected, result)
 			}
 		})
 	}
 }
 func TestCircuitBreaker(t *testing.T) {
 	t.Run("Initially Closed", func(t *testing.T) {
 		cb := NewCircuitBreaker(3, 100*time.Millisecond)
 		if cb.IsOpen() {
 			t.Error("Circuit breaker should be closed initially")
 		}
 	})
 	t.Run("Opens After Failures", func(t *testing.T) {
 		cb := NewCircuitBreaker(3, 100*time.Millisecond)
 		failingFn := func(ctx context.Context) error {
 			return errors.New("error")
 		}
 		// Execute with failures
 		for i := 0; i < 3; i++ {
 			_ = cb.Execute(context.Background(), failingFn)
 		}
 		if !cb.IsOpen() {
 			t.Error("Circuit breaker should be open after threshold failures")
 		}
 	})
 	t.Run("Stays Open Until Timeout", func(t *testing.T) {
 		resetTimeout := 100 * time.Millisecond
 		cb := NewCircuitBreaker(1, resetTimeout)
 		// Trip the circuit
 		cb.Trip()
 		if !cb.IsOpen() {
 			t.Error("Circuit breaker should be open after tripping")
 		}
 		// Execute should fail fast
 		err := cb.Execute(context.Background(), func(ctx context.Context) error {
 			return nil
 		})
 		if err != ErrCircuitOpen {
 			t.Errorf("Expected ErrCircuitOpen, got: %v", err)
 		}
 		// Wait for reset timeout
 		time.Sleep(resetTimeout + 10*time.Millisecond)
 		// Now it should be half-open and attempt the function
 		successFn := func(ctx context.Context) error {
 			return nil
 		}
 		err = cb.Execute(context.Background(), successFn)
 		if err != nil {
 			t.Errorf("Expected successful execution, got: %v", err)
 		}
 		if cb.IsOpen() {
 			t.Error("Circuit breaker should be closed after successful execution in half-open state")
 		}
 	})
 	t.Run("Resets After Success", func(t *testing.T) {
 		cb := NewCircuitBreaker(3, 100*time.Millisecond)
 		// Trip the circuit manually
 		cb.Trip()
 		// Manually reset
 		cb.Reset()
 		if cb.IsOpen() {
 			t.Error("Circuit breaker should be closed after reset")
 		}
 	})
 }
--- a/pkg/wal/wal_test.go
+++ b/pkg/wal/wal_test.go
@ -377,8 +377,8 @@ func TestWALSyncModes(t *testing.T) {
 		syncMode        config.SyncMode
 		expectedEntries int // Expected number of entries after crash (without explicit sync)
 	}{
-		{"SyncNone", config.SyncNone, 0},            // No entries should be recovered without explicit sync
+		{"SyncNone", config.SyncNone, 0}, // No entries should be recovered without explicit sync
-		{"SyncBatch", config.SyncBatch, 0},          // No entries should be recovered if batch threshold not reached
+		{"SyncBatch", config.SyncBatch, 0}, // No entries should be recovered if batch threshold not reached
 		{"SyncImmediate", config.SyncImmediate, 10}, // All entries should be recovered
 	}