diff --git a/adapter/sqs.go b/adapter/sqs.go index 1a3a06fdf..dfd1916cc 100644 --- a/adapter/sqs.go +++ b/adapter/sqs.go @@ -52,7 +52,6 @@ const ( // "Common Errors" page of the SQS API reference. const ( sqsErrInvalidAction = "InvalidAction" - sqsErrNotImplemented = "NotImplemented" sqsErrInternalFailure = "InternalFailure" sqsErrServiceUnavailable = "ServiceUnavailable" sqsErrMalformedRequest = "MalformedQueryString" @@ -69,6 +68,14 @@ type SQSServer struct { leaderSQS map[string]string region string staticCreds map[string]string + // reaperCtx / reaperCancel drive the retention sweeper goroutine. + // Both are initialized in NewSQSServer (never reassigned) so a + // concurrent Stop() that lands before Run() completes still reads + // a stable cancel func — unlike a Run-time assignment, which the + // race detector flagged because Run and Stop run on different + // goroutines without ordering between them. + reaperCtx context.Context + reaperCancel context.CancelFunc } // WithSQSLeaderMap configures the Raft-address-to-SQS-address mapping used to @@ -84,10 +91,13 @@ func WithSQSLeaderMap(m map[string]string) SQSServerOption { } func NewSQSServer(listen net.Listener, st store.MVCCStore, coordinate kv.Coordinator, opts ...SQSServerOption) *SQSServer { + reaperCtx, reaperCancel := context.WithCancel(context.Background()) s := &SQSServer{ - listen: listen, - store: st, - coordinator: coordinate, + listen: listen, + store: st, + coordinator: coordinate, + reaperCtx: reaperCtx, + reaperCancel: reaperCancel, } s.targetHandlers = map[string]func(http.ResponseWriter, *http.Request){ sqsCreateQueueTarget: s.createQueue, @@ -96,17 +106,17 @@ func NewSQSServer(listen net.Listener, st store.MVCCStore, coordinate kv.Coordin sqsGetQueueUrlTarget: s.getQueueUrl, sqsGetQueueAttributesTarget: s.getQueueAttributes, sqsSetQueueAttributesTarget: s.setQueueAttributes, - sqsPurgeQueueTarget: s.notImplemented("PurgeQueue"), + sqsPurgeQueueTarget: s.purgeQueue, sqsSendMessageTarget: 
s.sendMessage, - sqsSendMessageBatchTarget: s.notImplemented("SendMessageBatch"), + sqsSendMessageBatchTarget: s.sendMessageBatch, sqsReceiveMessageTarget: s.receiveMessage, sqsDeleteMessageTarget: s.deleteMessage, - sqsDeleteMessageBatchTarget: s.notImplemented("DeleteMessageBatch"), + sqsDeleteMessageBatchTarget: s.deleteMessageBatch, sqsChangeMessageVisibilityTarget: s.changeMessageVisibility, - sqsChangeMessageVisibilityBatchTgt: s.notImplemented("ChangeMessageVisibilityBatch"), - sqsTagQueueTarget: s.notImplemented("TagQueue"), - sqsUntagQueueTarget: s.notImplemented("UntagQueue"), - sqsListQueueTagsTarget: s.notImplemented("ListQueueTags"), + sqsChangeMessageVisibilityBatchTgt: s.changeMessageVisibilityBatch, + sqsTagQueueTarget: s.tagQueue, + sqsUntagQueueTarget: s.untagQueue, + sqsListQueueTagsTarget: s.listQueueTags, } mux := http.NewServeMux() mux.HandleFunc("/", s.handle) @@ -120,6 +130,7 @@ func NewSQSServer(listen net.Listener, st store.MVCCStore, coordinate kv.Coordin } func (s *SQSServer) Run() error { + s.startReaper(s.reaperCtx) if err := s.httpServer.Serve(s.listen); err != nil && !errors.Is(err, http.ErrServerClosed) { return errors.WithStack(err) } @@ -127,6 +138,9 @@ func (s *SQSServer) Run() error { } func (s *SQSServer) Stop() { + if s.reaperCancel != nil { + s.reaperCancel() + } if s.httpServer != nil { _ = s.httpServer.Shutdown(context.Background()) } @@ -237,15 +251,6 @@ func sqsLeaderProxyErrorWriter(w http.ResponseWriter, status int, message string writeSQSError(w, status, sqsErrServiceUnavailable, message) } -// notImplemented returns a handler that responds with a JSON-protocol -// NotImplemented error so clients get a clean signal while the real handlers -// are still being built out. 
-func (s *SQSServer) notImplemented(op string) func(http.ResponseWriter, *http.Request) { - return func(w http.ResponseWriter, _ *http.Request) { - writeSQSError(w, http.StatusNotImplemented, sqsErrNotImplemented, op+" is not implemented yet") - } -} - // writeSQSError emits an SQS JSON-protocol error envelope. AWS returns: // // { "__type": "", "message": "" } diff --git a/adapter/sqs_catalog.go b/adapter/sqs_catalog.go index 13c9d02f9..4dc801e68 100644 --- a/adapter/sqs_catalog.go +++ b/adapter/sqs_catalog.go @@ -40,6 +40,15 @@ const ( sqsListQueuesDefaultMaxResults = 1000 sqsListQueuesHardMaxResults = 1000 sqsQueueScanPageLimit = 1024 + // sqsPurgeRateLimitMillis is AWS's "one PurgeQueue per 60 seconds per + // queue" limit. PurgeInProgress is returned to callers that try + // again before the cooldown ends. + sqsPurgeRateLimitMillis = 60_000 +) + +// AWS error codes specific to PurgeQueue. +const ( + sqsErrPurgeInProgress = "AWS.SimpleQueueService.PurgeQueueInProgress" ) // AWS error codes specific to the queue catalog. @@ -70,6 +79,19 @@ type sqsQueueMeta struct { MaximumMessageSize int64 `json:"maximum_message_size"` RedrivePolicy string `json:"redrive_policy,omitempty"` Tags map[string]string `json:"tags,omitempty"` + // LastPurgedAtMillis is the wall-clock time of the last successful + // PurgeQueue. AWS rate-limits PurgeQueue to once per 60 seconds per + // queue; tracking it on the meta record means the limit survives + // leader failover (in-memory cooldowns would let the new leader + // accept a second purge a few seconds later). + LastPurgedAtMillis int64 `json:"last_purged_at_millis,omitempty"` + // CreatedAtMillis / LastModifiedAtMillis are wall-clock timestamps + // surfaced by GetQueueAttributes (AWS reports them in second + // granularity). HLC is unsuitable for this — it is a logical + // counter, not a wall clock — so we record the local Now() at + // commit time and trust HLC monotonicity to keep ordering sane. 
+ CreatedAtMillis int64 `json:"created_at_millis,omitempty"` + LastModifiedAtMillis int64 `json:"last_modified_at_millis,omitempty"` } var storedSQSMetaPrefix = []byte{0x00, 'S', 'Q', 0x01} @@ -362,18 +384,26 @@ var sqsAttributeAppliers = map[string]attributeApplier{ m.ContentBasedDedup = b return nil }, - "RedrivePolicy": func(_ *sqsQueueMeta, _ string) error { - // Milestone 1 does not enforce DLQ redrive at receive time, - // so silently accepting RedrivePolicy would advertise a - // feature clients rely on (poison messages moving to the - // DLQ after maxReceiveCount) that this adapter does not - // actually provide — receivers would see infinite - // redelivery instead. Reject the attribute until the - // Milestone-2 receive path that actually performs the DLQ - // move lands, so operators get a clear signal instead of - // a silently-broken queue. - return newSQSAPIError(http.StatusNotImplemented, sqsErrNotImplemented, - "RedrivePolicy is not yet supported; DLQ redrive is tracked for Milestone 2") + "RedrivePolicy": func(m *sqsQueueMeta, v string) error { + // Validate the policy at attribute-apply time so a malformed + // RedrivePolicy never makes it onto the queue meta record. The + // receive path re-parses on every check rather than caching + // the struct on meta, because DLQ existence has to be + // re-validated at the readTS anyway. + policy, err := parseRedrivePolicy(v) + if err != nil { + return err + } + // AWS rejects self-referential DLQ targets. Without this gate + // a redrive transaction would delete the source record and + // rewrite it to the same queue with a fresh receipt token, + // looping the poison message forever. 
+ if policy.DLQName == m.Name { + return newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "RedrivePolicy.deadLetterTargetArn must not point at the source queue") + } + m.RedrivePolicy = v + return nil }, } @@ -487,6 +517,14 @@ func (s *SQSServer) createQueue(w http.ResponseWriter, r *http.Request) { writeSQSErrorFromErr(w, err) return } + if len(in.Tags) > sqsMaxTagsPerQueue { + // AWS caps tags per queue at 50. CreateQueue must reject + // over-cap tag bundles up front; a silent slice-and-store + // would let queues land with more tags than TagQueue would + // ever accept on the same queue. + writeSQSError(w, http.StatusBadRequest, sqsErrInvalidAttributeValue, "queue tag count exceeds 50") + return + } requested.Tags = in.Tags if err := s.createQueueWithRetry(r.Context(), requested); err != nil { @@ -539,6 +577,9 @@ func (s *SQSServer) tryCreateQueueOnce(ctx context.Context, requested *sqsQueueM if clock := s.coordinator.Clock(); clock != nil { requested.CreatedAtHLC = clock.Current() } + now := time.Now().UnixMilli() + requested.CreatedAtMillis = now + requested.LastModifiedAtMillis = now metaBytes, err := encodeSQSQueueMeta(requested) if err != nil { return false, errors.WithStack(err) @@ -600,14 +641,18 @@ func (s *SQSServer) deleteQueueWithRetry(ctx context.Context, queueName string) } // Bump the generation counter so any stragglers under the old - // generation are unreachable by routing. Actual message cleanup - // lands in a follow-up PR along with the message keyspace. + // generation are unreachable by routing. The tombstone gives the + // reaper a way to find leftover data / vis / byage / dedup / + // group records once meta is gone — without it, scanQueueNames + // would never see the deleted queue again and its message + // keyspace would leak forever. 
lastGen, err := s.loadQueueGenerationAt(ctx, queueName, readTS) if err != nil { return errors.WithStack(err) } metaKey := sqsQueueMetaKey(queueName) genKey := sqsQueueGenKey(queueName) + tombstoneKey := sqsQueueTombstoneKey(queueName, lastGen) // StartTS + ReadKeys fence against a concurrent CreateQueue / // SetQueueAttributes landing between our load and dispatch. req := &kv.OperationGroup[kv.OP]{ @@ -617,6 +662,7 @@ func (s *SQSServer) deleteQueueWithRetry(ctx context.Context, queueName string) Elems: []*kv.Elem[kv.OP]{ {Op: kv.Del, Key: metaKey}, {Op: kv.Put, Key: genKey, Value: []byte(strconv.FormatUint(lastGen+1, 10))}, + {Op: kv.Put, Key: tombstoneKey, Value: []byte{1}}, }, } if _, err := s.coordinator.Dispatch(ctx, req); err == nil { @@ -777,7 +823,8 @@ func (s *SQSServer) getQueueAttributes(w http.ResponseWriter, r *http.Request) { writeSQSErrorFromErr(w, err) return } - meta, exists, err := s.loadQueueMetaAt(r.Context(), name, s.nextTxnReadTS(r.Context())) + readTS := s.nextTxnReadTS(r.Context()) + meta, exists, err := s.loadQueueMetaAt(r.Context(), name, readTS) if err != nil { writeSQSErrorFromErr(w, err) return @@ -787,10 +834,32 @@ func (s *SQSServer) getQueueAttributes(w http.ResponseWriter, r *http.Request) { return } selection := selectedAttributeNames(in.AttributeNames) - attrs := queueMetaToAttributes(meta, selection) + // Counter computation is the only path that touches per-message + // state, so skip the scan when the caller did not ask for any of + // the Approximate* attributes. AWS itself documents these as + // approximate; a snapshot read is correct enough. 
+ var counters *sqsApproxCounters + if selectionWantsApproxCounters(selection) { + c, scanErr := s.scanApproxCounters(r.Context(), name, meta.Generation, readTS) + if scanErr != nil { + writeSQSErrorFromErr(w, scanErr) + return + } + counters = &c + } + attrs := queueMetaToAttributes(meta, selection, counters, s.queueArn(name)) writeSQSJSON(w, map[string]any{"Attributes": attrs}) } +// queueArn synthesises the AWS-shaped ARN clients expect to find on +// GetQueueAttributes. Account id is fixed at "000000000000" — IAM is +// out of scope, so emitting a sentinel placeholder gives SDKs a +// well-formed string without inventing identity. +func (s *SQSServer) queueArn(queueName string) string { + region := s.effectiveRegion() + return "arn:aws:sqs:" + region + ":000000000000:" + queueName +} + // sqsAttributeSelection is a tri-state result from selectedAttributeNames: // expandAll = AWS "All" (or any entry equals "All"); a non-nil map lists // the specific attribute names the caller asked for; and an empty @@ -823,7 +892,37 @@ func selectedAttributeNames(req []string) sqsAttributeSelection { return sqsAttributeSelection{names: selection} } -func queueMetaToAttributes(meta *sqsQueueMeta, selection sqsAttributeSelection) map[string]string { +// sqsApproxCounters bundles the three AWS-published "Approximate" +// counters; nil means the caller did not request them and so the +// per-message scan was skipped. +type sqsApproxCounters struct { + Visible int64 + NotVisible int64 + Delayed int64 +} + +// approxCounterAttributeNames is every attribute that requires a +// per-message scan. queueMetaToAttributes only invokes the scan when +// the selection overlaps this set. 
+var approxCounterAttributeNames = map[string]bool{ + "ApproximateNumberOfMessages": true, + "ApproximateNumberOfMessagesNotVisible": true, + "ApproximateNumberOfMessagesDelayed": true, +} + +func selectionWantsApproxCounters(selection sqsAttributeSelection) bool { + if selection.expandAll { + return true + } + for k := range selection.names { + if approxCounterAttributeNames[k] { + return true + } + } + return false +} + +func queueMetaToAttributes(meta *sqsQueueMeta, selection sqsAttributeSelection, counters *sqsApproxCounters, queueArn string) map[string]string { // No AttributeNames supplied and no "All" → AWS returns nothing. // The handler still emits "Attributes" as an empty map so the // response shape is stable. @@ -838,6 +937,19 @@ func queueMetaToAttributes(meta *sqsQueueMeta, selection sqsAttributeSelection) "MaximumMessageSize": strconv.FormatInt(meta.MaximumMessageSize, 10), "FifoQueue": strconv.FormatBool(meta.IsFIFO), "ContentBasedDeduplication": strconv.FormatBool(meta.ContentBasedDedup), + "QueueArn": queueArn, + } + if created := meta.CreatedAtMillis; created > 0 { + // AWS reports timestamps in unix seconds (string-encoded). 
+ all["CreatedTimestamp"] = strconv.FormatInt(created/sqsMillisPerSecond, 10) + } + if mod := meta.LastModifiedAtMillis; mod > 0 { + all["LastModifiedTimestamp"] = strconv.FormatInt(mod/sqsMillisPerSecond, 10) + } + if counters != nil { + all["ApproximateNumberOfMessages"] = strconv.FormatInt(counters.Visible, 10) + all["ApproximateNumberOfMessagesNotVisible"] = strconv.FormatInt(counters.NotVisible, 10) + all["ApproximateNumberOfMessagesDelayed"] = strconv.FormatInt(counters.Delayed, 10) } if meta.RedrivePolicy != "" { all["RedrivePolicy"] = meta.RedrivePolicy @@ -921,6 +1033,7 @@ func (s *SQSServer) trySetQueueAttributesOnce(ctx context.Context, queueName str if meta.ContentBasedDedup && !meta.IsFIFO { return false, newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, "ContentBasedDeduplication is only valid on FIFO queues") } + meta.LastModifiedAtMillis = time.Now().UnixMilli() metaBytes, err := encodeSQSQueueMeta(meta) if err != nil { return false, errors.WithStack(err) @@ -942,3 +1055,80 @@ func (s *SQSServer) trySetQueueAttributesOnce(ctx context.Context, queueName str } return true, nil } + +// sqsApproxCounterScanLimit caps a single GetQueueAttributes scan. AWS +// reports the counters as "approximate"; once the queue is past this +// many records the per-bucket totals are best-effort. Picking 50_000 +// keeps the scan latency under ~100 ms on a warm Pebble cache. +const sqsApproxCounterScanLimit = 50_000 + +// scanApproxCounters walks every data record under (queue, generation) +// and buckets it into visible / not-visible / delayed by the same +// definitions GetQueueAttributes documents. The scan runs at the same +// snapshot timestamp the meta read used so the returned numbers are a +// coherent snapshot; concurrent sends or receives that commit after +// readTS just show up on the next call. 
+func (s *SQSServer) scanApproxCounters(ctx context.Context, queueName string, gen uint64, readTS uint64) (sqsApproxCounters, error) { + prefix := []byte(SqsMsgDataPrefix) + prefix = append(prefix, []byte(encodeSQSSegment(queueName))...) + prefix = appendU64(prefix, gen) + end := prefixScanEnd(prefix) + + now := time.Now().UnixMilli() + var counters sqsApproxCounters + start := bytes.Clone(prefix) + for { + page, err := s.store.ScanAt(ctx, start, end, sqsQueueScanPageLimit, readTS) + if err != nil { + return counters, errors.WithStack(err) + } + if len(page) == 0 { + return counters, nil + } + bucketApproxCounterPage(page, now, &counters) + if exhausted(counters, page, end, &start) { + return counters, nil + } + } +} + +// bucketApproxCounterPage walks one ScanAt page and bumps the right +// counter for each record. Pulled out of scanApproxCounters so the +// outer loop stays under the cyclomatic budget. +func bucketApproxCounterPage(page []*store.KVPair, now int64, counters *sqsApproxCounters) { + for _, kvp := range page { + rec, err := decodeSQSMessageRecord(kvp.Value) + if err != nil { + // Malformed record means a programmer bug, not a + // counter bug — drop it from the totals rather than + // failing the whole call. + continue + } + if rec.VisibleAtMillis <= now { + counters.Visible++ + continue + } + if rec.ReceiveCount == 0 { + counters.Delayed++ + } else { + counters.NotVisible++ + } + } +} + +// exhausted reports whether the scan has reached its budget or the +// end of the prefix range. Mutates `start` so the caller can resume. 
+func exhausted(counters sqsApproxCounters, page []*store.KVPair, end []byte, start *[]byte) bool { + total := counters.Visible + counters.NotVisible + counters.Delayed + if total >= sqsApproxCounterScanLimit { + return true + } + if len(page) < sqsQueueScanPageLimit { + return true + } + *start = nextScanCursorAfter(page[len(page)-1].Key) + if end != nil && bytes.Compare(*start, end) >= 0 { + return true + } + return false +} diff --git a/adapter/sqs_catalog_test.go b/adapter/sqs_catalog_test.go index d57cd8648..291732ded 100644 --- a/adapter/sqs_catalog_test.go +++ b/adapter/sqs_catalog_test.go @@ -358,41 +358,44 @@ func TestSQSServer_SetQueueAttributesRequiresAttributes(t *testing.T) { } } -func TestSQSServer_CreateQueueRejectsRedrivePolicy(t *testing.T) { +func TestSQSServer_CreateQueueValidatesRedrivePolicy(t *testing.T) { t.Parallel() - // Milestone 1 does not enforce DLQ redrive on the receive path, so - // accepting RedrivePolicy would silently advertise a feature the - // adapter can't deliver — poison messages would redeliver - // indefinitely instead of moving to the DLQ. Until the Milestone-2 - // receive-side DLQ move lands, reject the attribute loudly. + // Now that the receive path implements DLQ redrive, RedrivePolicy + // must round-trip; only malformed policies are rejected. nodes, _, _ := createNode(t, 1) defer shutdown(nodes) node := sqsLeaderNode(t, nodes) + // Missing maxReceiveCount → InvalidAttributeValue. 
status, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ - "QueueName": "with-redrive", + "QueueName": "bad-redrive", "Attributes": map[string]string{ - "RedrivePolicy": `{"deadLetterTargetArn":"arn:aws:sqs:us-east-1:000000000000:dlq","maxReceiveCount":"5"}`, + "RedrivePolicy": `{"deadLetterTargetArn":"arn:aws:sqs:us-east-1:000000000000:dlq"}`, }, }) - if status != http.StatusNotImplemented { - t.Fatalf("CreateQueue with RedrivePolicy: got %d want 501 (%v)", status, out) - } - if got, _ := out["__type"].(string); got != sqsErrNotImplemented { - t.Fatalf("error type: %q want %q", got, sqsErrNotImplemented) + if status != http.StatusBadRequest { + t.Fatalf("CreateQueue with malformed RedrivePolicy: got %d want 400 (%v)", status, out) } - // SetQueueAttributes rejects the same attribute on an existing - // queue. - url := createSQSQueueForTest(t, node, "no-redrive") - status, out = callSQS(t, node, sqsSetQueueAttributesTarget, map[string]any{ - "QueueUrl": url, + // Well-formed RedrivePolicy succeeds and round-trips. 
+ policy := `{"deadLetterTargetArn":"arn:aws:sqs:us-east-1:000000000000:dlq","maxReceiveCount":5}` + status, out = callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "with-redrive", "Attributes": map[string]string{ - "RedrivePolicy": `{"maxReceiveCount":"3"}`, + "RedrivePolicy": policy, }, }) - if status != http.StatusNotImplemented { - t.Fatalf("SetQueueAttributes with RedrivePolicy: got %d want 501 (%v)", status, out) + if status != http.StatusOK { + t.Fatalf("CreateQueue with valid RedrivePolicy: got %d (%v)", status, out) + } + url, _ := out["QueueUrl"].(string) + _, out = callSQS(t, node, sqsGetQueueAttributesTarget, map[string]any{ + "QueueUrl": url, + "AttributeNames": []string{"RedrivePolicy"}, + }) + attrs, _ := out["Attributes"].(map[string]any) + if attrs["RedrivePolicy"] != policy { + t.Fatalf("RedrivePolicy not echoed back: %v", attrs) } } diff --git a/adapter/sqs_extra_test.go b/adapter/sqs_extra_test.go new file mode 100644 index 000000000..614081f38 --- /dev/null +++ b/adapter/sqs_extra_test.go @@ -0,0 +1,1909 @@ +package adapter + +import ( + "bytes" + "context" + "encoding/binary" + "encoding/hex" + "net/http" + "strconv" + "strings" + "testing" + "time" + + "github.com/bootjp/elastickv/kv" +) + +func TestSQSServer_PurgeQueueRemovesMessagesAndRateLimits(t *testing.T) { + t.Parallel() + // PurgeQueue must (a) bump the queue generation so previously sent + // messages are unreachable on the new generation and (b) reject a + // follow-up purge issued within AWS's 60-second cooldown. 
+ nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "purge-target") + + for i := range 3 { + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MessageBody": "msg-" + strconv.Itoa(i), + }) + } + + status, out := callSQS(t, node, sqsPurgeQueueTarget, map[string]any{ + "QueueUrl": queueURL, + }) + if status != http.StatusOK { + t.Fatalf("purge: %d %v", status, out) + } + + // After purge, the queue is empty for the new generation. + status, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MaxNumberOfMessages": 10, + }) + if status != http.StatusOK { + t.Fatalf("receive after purge: %d %v", status, out) + } + if msgs, _ := out["Messages"].([]any); len(msgs) != 0 { + t.Fatalf("expected 0 messages after purge, got %d (%v)", len(msgs), msgs) + } + + // Second purge inside the 60-second cooldown must fail. + status, out = callSQS(t, node, sqsPurgeQueueTarget, map[string]any{ + "QueueUrl": queueURL, + }) + if status != http.StatusBadRequest { + t.Fatalf("rapid purge: got %d want 400 (%v)", status, out) + } + if got, _ := out["__type"].(string); got != sqsErrPurgeInProgress { + t.Fatalf("error type: %q want %q", got, sqsErrPurgeInProgress) + } + + // New sends still work after a purge — the queue still exists. 
+ status, out = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MessageBody": "after-purge", + }) + if status != http.StatusOK { + t.Fatalf("post-purge send: %d %v", status, out) + } +} + +func TestSQSServer_PurgeQueueOnMissingQueue(t *testing.T) { + t.Parallel() + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + status, out := callSQS(t, node, sqsPurgeQueueTarget, map[string]any{ + "QueueUrl": "http://" + node.sqsAddress + "/no-such-queue", + }) + if status != http.StatusBadRequest { + t.Fatalf("purge missing: %d %v", status, out) + } + if got, _ := out["__type"].(string); got != sqsErrQueueDoesNotExist { + t.Fatalf("error type: %q want %q", got, sqsErrQueueDoesNotExist) + } +} + +func TestSQSServer_SendMessageBatchHappyPath(t *testing.T) { + t.Parallel() + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "batch-send") + + entries := make([]map[string]any, 0, 3) + for i := range 3 { + entries = append(entries, map[string]any{ + "Id": "e" + strconv.Itoa(i), + "MessageBody": "body-" + strconv.Itoa(i), + }) + } + status, out := callSQS(t, node, sqsSendMessageBatchTarget, map[string]any{ + "QueueUrl": queueURL, + "Entries": entries, + }) + if status != http.StatusOK { + t.Fatalf("send batch: %d %v", status, out) + } + successful, _ := out["Successful"].([]any) + if len(successful) != 3 { + t.Fatalf("expected 3 successful, got %d (%v)", len(successful), out) + } + failed, _ := out["Failed"].([]any) + if len(failed) != 0 { + t.Fatalf("expected 0 failed, got %v", failed) + } + + // Confirm the messages are deliverable. 
+ status, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MaxNumberOfMessages": 10, + "VisibilityTimeout": 60, + }) + if status != http.StatusOK { + t.Fatalf("receive: %d %v", status, out) + } + msgs, _ := out["Messages"].([]any) + if len(msgs) != 3 { + t.Fatalf("expected 3 received, got %d", len(msgs)) + } +} + +func TestSQSServer_SendMessageBatchPartialFailure(t *testing.T) { + t.Parallel() + // One entry has an empty body (rejected as InvalidParameterValue), + // two are valid. AWS reports per-entry success/failure rather than + // failing the whole batch — verify that contract holds. + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "batch-mixed") + + entries := []map[string]any{ + {"Id": "ok-1", "MessageBody": "yes"}, + {"Id": "bad-1", "MessageBody": ""}, // empty body is per-entry failure + {"Id": "ok-2", "MessageBody": "yes-2"}, + } + status, out := callSQS(t, node, sqsSendMessageBatchTarget, map[string]any{ + "QueueUrl": queueURL, + "Entries": entries, + }) + if status != http.StatusOK { + t.Fatalf("send batch: %d %v", status, out) + } + successful, _ := out["Successful"].([]any) + if len(successful) != 2 { + t.Fatalf("expected 2 successful, got %d (%v)", len(successful), successful) + } + failed, _ := out["Failed"].([]any) + if len(failed) != 1 { + t.Fatalf("expected 1 failed, got %d (%v)", len(failed), failed) + } + bad, _ := failed[0].(map[string]any) + if bad["Id"] != "bad-1" { + t.Fatalf("failed entry Id = %v, want bad-1", bad["Id"]) + } + if bad["SenderFault"] != true { + t.Fatalf("SenderFault = %v, want true", bad["SenderFault"]) + } +} + +func TestSQSServer_SendMessageBatchRejectsEmptyAndOversize(t *testing.T) { + t.Parallel() + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "batch-shape") + + // Empty entries list → EmptyBatchRequest. 
+ status, out := callSQS(t, node, sqsSendMessageBatchTarget, map[string]any{ + "QueueUrl": queueURL, + "Entries": []map[string]any{}, + }) + if status != http.StatusBadRequest || out["__type"] != sqsErrEmptyBatchRequest { + t.Fatalf("empty batch: status=%d body=%v", status, out) + } + + // More than 10 entries → TooManyEntriesInBatchRequest. + bigEntries := make([]map[string]any, 0, 11) + for i := range 11 { + bigEntries = append(bigEntries, map[string]any{ + "Id": "e" + strconv.Itoa(i), "MessageBody": "x", + }) + } + status, out = callSQS(t, node, sqsSendMessageBatchTarget, map[string]any{ + "QueueUrl": queueURL, + "Entries": bigEntries, + }) + if status != http.StatusBadRequest || out["__type"] != sqsErrTooManyEntriesInBatchRequest { + t.Fatalf("too many entries: status=%d body=%v", status, out) + } + + // Duplicate Ids → BatchEntryIdsNotDistinct. + status, out = callSQS(t, node, sqsSendMessageBatchTarget, map[string]any{ + "QueueUrl": queueURL, + "Entries": []map[string]any{ + {"Id": "dup", "MessageBody": "a"}, + {"Id": "dup", "MessageBody": "b"}, + }, + }) + if status != http.StatusBadRequest || out["__type"] != sqsErrBatchEntryIdsNotDistinct { + t.Fatalf("dup ids: status=%d body=%v", status, out) + } +} + +func TestSQSServer_DeleteMessageBatch(t *testing.T) { + t.Parallel() + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "batch-delete") + + for i := range 3 { + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MessageBody": "d-" + strconv.Itoa(i), + }) + } + _, out := callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MaxNumberOfMessages": 10, + "VisibilityTimeout": 60, + }) + msgs, _ := out["Messages"].([]any) + if len(msgs) != 3 { + t.Fatalf("expected 3 received, got %d", len(msgs)) + } + entries := make([]map[string]any, 0, len(msgs)) + for i, m := range msgs { + mm, _ := m.(map[string]any) + 
entries = append(entries, map[string]any{ + "Id": "d" + strconv.Itoa(i), + "ReceiptHandle": mm["ReceiptHandle"], + }) + } + // Add a malformed handle entry — must fail per-entry, not the whole batch. + entries = append(entries, map[string]any{ + "Id": "bad-handle", + "ReceiptHandle": "not-base64-!!!", + }) + status, out := callSQS(t, node, sqsDeleteMessageBatchTarget, map[string]any{ + "QueueUrl": queueURL, + "Entries": entries, + }) + if status != http.StatusOK { + t.Fatalf("delete batch: %d %v", status, out) + } + successful, _ := out["Successful"].([]any) + if len(successful) != 3 { + t.Fatalf("expected 3 successful, got %d (%v)", len(successful), successful) + } + failed, _ := out["Failed"].([]any) + if len(failed) != 1 { + t.Fatalf("expected 1 failed, got %v", failed) + } + bad, _ := failed[0].(map[string]any) + if bad["Id"] != "bad-handle" { + t.Fatalf("failed Id = %v, want bad-handle", bad["Id"]) + } +} + +func TestSQSServer_ChangeMessageVisibilityBatch(t *testing.T) { + t.Parallel() + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "batch-chgvis") + + for i := range 2 { + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MessageBody": "c-" + strconv.Itoa(i), + }) + } + _, out := callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MaxNumberOfMessages": 10, + "VisibilityTimeout": 1, + }) + msgs, _ := out["Messages"].([]any) + if len(msgs) != 2 { + t.Fatalf("expected 2 received, got %d", len(msgs)) + } + entries := make([]map[string]any, 0, len(msgs)) + for i, m := range msgs { + mm, _ := m.(map[string]any) + entries = append(entries, map[string]any{ + "Id": "v" + strconv.Itoa(i), + "ReceiptHandle": mm["ReceiptHandle"], + "VisibilityTimeout": 60, + }) + } + // Add an entry with a bad VisibilityTimeout — must fail per-entry. 
+ entries = append(entries, map[string]any{ + "Id": "bad", + "ReceiptHandle": "ignored", + "VisibilityTimeout": -1, + }) + status, out := callSQS(t, node, sqsChangeMessageVisibilityBatchTgt, map[string]any{ + "QueueUrl": queueURL, + "Entries": entries, + }) + if status != http.StatusOK { + t.Fatalf("change vis batch: %d %v", status, out) + } + successful, _ := out["Successful"].([]any) + if len(successful) != 2 { + t.Fatalf("expected 2 successful, got %d (%v)", len(successful), successful) + } + failed, _ := out["Failed"].([]any) + if len(failed) != 1 { + t.Fatalf("expected 1 failed, got %d", len(failed)) + } + + // After the original 1s expires, the messages must still be hidden + // thanks to the new 60s visibility set by the batch call. + time.Sleep(1200 * time.Millisecond) + _, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MaxNumberOfMessages": 10, + }) + if msgs, _ := out["Messages"].([]any); len(msgs) != 0 { + t.Fatalf("expected 0 messages after visibility extension, got %d", len(msgs)) + } +} + +func TestSQSServer_TagQueueRoundTrip(t *testing.T) { + t.Parallel() + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "tagged") + + // Initial ListQueueTags returns an empty map. + status, out := callSQS(t, node, sqsListQueueTagsTarget, map[string]any{ + "QueueUrl": queueURL, + }) + if status != http.StatusOK { + t.Fatalf("list tags initial: %d %v", status, out) + } + tags, _ := out["Tags"].(map[string]any) + if len(tags) != 0 { + t.Fatalf("expected no tags, got %v", tags) + } + + // TagQueue stores two tags. 
+ status, out = callSQS(t, node, sqsTagQueueTarget, map[string]any{ + "QueueUrl": queueURL, + "Tags": map[string]string{"team": "platform", "env": "test"}, + }) + if status != http.StatusOK { + t.Fatalf("tag: %d %v", status, out) + } + _, out = callSQS(t, node, sqsListQueueTagsTarget, map[string]any{ + "QueueUrl": queueURL, + }) + tags, _ = out["Tags"].(map[string]any) + if tags["team"] != "platform" || tags["env"] != "test" { + t.Fatalf("after tag: %v", tags) + } + + // UntagQueue drops one tag, leaves the other. + status, out = callSQS(t, node, sqsUntagQueueTarget, map[string]any{ + "QueueUrl": queueURL, + "TagKeys": []string{"env"}, + }) + if status != http.StatusOK { + t.Fatalf("untag: %d %v", status, out) + } + _, out = callSQS(t, node, sqsListQueueTagsTarget, map[string]any{ + "QueueUrl": queueURL, + }) + tags, _ = out["Tags"].(map[string]any) + if _, present := tags["env"]; present { + t.Fatalf("env should be removed, got %v", tags) + } + if tags["team"] != "platform" { + t.Fatalf("team should remain, got %v", tags) + } +} + +func TestSQSServer_GetQueueAttributesApproximateCounters(t *testing.T) { + t.Parallel() + // Three buckets must be reflected by a single GetQueueAttributes call: + // - visible : sent and currently deliverable + // - delayed : sent with DelaySeconds > 0 and not yet available + // - not visible: delivered to a consumer and within the visibility + // window + // QueueArn / CreatedTimestamp / LastModifiedTimestamp must also come + // back so dashboards have something to render. Counts are approximate + // per AWS, but the snapshot we read should be coherent. + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "approx") + + // One visible message. + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, "MessageBody": "v", + }) + // One delayed message. 
+ _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, "MessageBody": "d", "DelaySeconds": 60, + }) + // One in-flight message: send, then receive with a long visibility + // timeout so it stays not-visible for the duration of this test. + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, "MessageBody": "i", + }) + _, out := callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MaxNumberOfMessages": 1, + "VisibilityTimeout": 600, + }) + if msgs, _ := out["Messages"].([]any); len(msgs) != 1 { + t.Fatalf("expected 1 received, got %d", len(msgs)) + } + + status, body := callSQS(t, node, sqsGetQueueAttributesTarget, map[string]any{ + "QueueUrl": queueURL, + "AttributeNames": []string{"All"}, + }) + if status != http.StatusOK { + t.Fatalf("getAttrs: %d %v", status, body) + } + attrs, _ := body["Attributes"].(map[string]any) + assertApproxCounterAttrs(t, attrs) + + // When the caller does not request any Approximate* attribute, the + // scan must be skipped — verify by asking for a single non-counter + // attribute and confirming the counters are absent from the response. + _, body = callSQS(t, node, sqsGetQueueAttributesTarget, map[string]any{ + "QueueUrl": queueURL, + "AttributeNames": []string{"VisibilityTimeout"}, + }) + attrs, _ = body["Attributes"].(map[string]any) + if _, present := attrs["ApproximateNumberOfMessages"]; present { + t.Fatalf("counter included for non-counter selection: %v", attrs) + } +} + +func TestSQSServer_MessageAttributesCanonicalMD5(t *testing.T) { + t.Parallel() + // Cross-check md5OfAttributesHex against the AWS-published wire + // format using a hand-rolled reference encoder. AWS SDKs verify + // MD5OfMessageAttributes; if our hash drifts every SDK send fails + // with MessageAttributeMD5Mismatch. 
+ attrs := map[string]sqsMessageAttributeValue{ + "City": {DataType: "String", StringValue: "Anytown"}, + "Order": {DataType: "Number", StringValue: "12345"}, + "Blob": {DataType: "Binary", BinaryValue: []byte{0xde, 0xad, 0xbe, 0xef}}, + } + want := referenceCanonicalMD5(attrs) + got := md5OfAttributesHex(attrs) + if got != want { + t.Fatalf("canonical md5 mismatch:\n got: %s\n want: %s", got, want) + } + if md5OfAttributesHex(nil) != "" { + t.Fatalf("empty attrs must hash to empty string, got %q", md5OfAttributesHex(nil)) + } + if md5OfAttributesHex(map[string]sqsMessageAttributeValue{}) != "" { + t.Fatalf("empty map must hash to empty string") + } +} + +// referenceCanonicalMD5 reimplements the AWS canonical algorithm in a +// way that does not share code with md5OfAttributesHex. If the two +// disagree the SDK hash is wrong. +func referenceCanonicalMD5(attrs map[string]sqsMessageAttributeValue) string { + if len(attrs) == 0 { + return "" + } + names := make([]string, 0, len(attrs)) + for k := range attrs { + names = append(names, k) + } + for i := 1; i < len(names); i++ { + for j := i; j > 0 && names[j-1] > names[j]; j-- { + names[j-1], names[j] = names[j], names[j-1] + } + } + var buf bytes.Buffer + writeLen := func(s string) { + var l [4]byte + binary.BigEndian.PutUint32(l[:], safeUint32Len(len(s))) + buf.Write(l[:]) + } + writeLenBytes := func(p []byte) { + var l [4]byte + binary.BigEndian.PutUint32(l[:], safeUint32Len(len(p))) + buf.Write(l[:]) + } + for _, name := range names { + v := attrs[name] + writeLen(name) + buf.WriteString(name) + writeLen(v.DataType) + buf.WriteString(v.DataType) + switch v.DataType { + case "Binary": + buf.WriteByte(0x02) + writeLenBytes(v.BinaryValue) + buf.Write(v.BinaryValue) + default: + buf.WriteByte(0x01) + writeLen(v.StringValue) + buf.WriteString(v.StringValue) + } + } + return hexMD5(buf.Bytes()) +} + +func hexMD5(p []byte) string { + h := sqsMD5Hex(p) + if _, err := hex.DecodeString(h); err != nil { + return "" + } + 
return h +} + +func TestSQSServer_SendMessageWithMessageAttributes(t *testing.T) { + t.Parallel() + // SendMessage must accept MessageAttributes, return the AWS-canonical + // MD5 in MD5OfMessageAttributes, and a subsequent ReceiveMessage with + // MessageAttributeNames=["All"] must echo the attributes back along + // with the same MD5. + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "msg-attrs") + + attrs := map[string]any{ + "City": map[string]any{"DataType": "String", "StringValue": "Tokyo"}, + "Order": map[string]any{"DataType": "Number", "StringValue": "42"}, + } + status, out := callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MessageBody": "hi", + "MessageAttributes": attrs, + }) + if status != http.StatusOK { + t.Fatalf("send: %d %v", status, out) + } + expectedMD5 := md5OfAttributesHex(map[string]sqsMessageAttributeValue{ + "City": {DataType: "String", StringValue: "Tokyo"}, + "Order": {DataType: "Number", StringValue: "42"}, + }) + if got, _ := out["MD5OfMessageAttributes"].(string); got != expectedMD5 { + t.Fatalf("MD5OfMessageAttributes = %q, want %q", got, expectedMD5) + } + + // Receive with "All" must echo attributes + matching MD5. 
+ status, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MaxNumberOfMessages": 1, + "VisibilityTimeout": 60, + "MessageAttributeNames": []string{"All"}, + }) + if status != http.StatusOK { + t.Fatalf("receive: %d %v", status, out) + } + msgs, _ := out["Messages"].([]any) + if len(msgs) != 1 { + t.Fatalf("expected 1 message, got %d", len(msgs)) + } + m, _ := msgs[0].(map[string]any) + if got, _ := m["MD5OfMessageAttributes"].(string); got != expectedMD5 { + t.Fatalf("Receive MD5 = %q, want %q", got, expectedMD5) + } + echoed, _ := m["MessageAttributes"].(map[string]any) + if len(echoed) != 2 { + t.Fatalf("expected 2 echoed attributes, got %v", echoed) + } + city, _ := echoed["City"].(map[string]any) + if city["StringValue"] != "Tokyo" || city["DataType"] != "String" { + t.Fatalf("City attribute = %v", city) + } +} + +func TestSQSServer_SendMessageRejectsMalformedAttributes(t *testing.T) { + t.Parallel() + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "bad-attrs") + + // Missing DataType. + status, out := callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MessageBody": "x", + "MessageAttributes": map[string]any{ + "X": map[string]any{"StringValue": "value"}, + }, + }) + if status != http.StatusBadRequest || out["__type"] != sqsErrInvalidAttributeValue { + t.Fatalf("missing DataType: status=%d body=%v", status, out) + } + + // Unknown DataType. + status, out = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MessageBody": "x", + "MessageAttributes": map[string]any{ + "X": map[string]any{"DataType": "Bogus", "StringValue": "v"}, + }, + }) + if status != http.StatusBadRequest || out["__type"] != sqsErrInvalidAttributeValue { + t.Fatalf("bad DataType: status=%d body=%v", status, out) + } + + // String type with empty StringValue. 
+ status, out = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MessageBody": "x", + "MessageAttributes": map[string]any{ + "X": map[string]any{"DataType": "String", "StringValue": ""}, + }, + }) + if status != http.StatusBadRequest || out["__type"] != sqsErrInvalidAttributeValue { + t.Fatalf("empty StringValue: status=%d body=%v", status, out) + } +} + +func TestSQSServer_DLQRedriveOnMaxReceiveCount(t *testing.T) { + t.Parallel() + // A message received maxReceiveCount times must be moved to the + // DLQ on the next receive instead of being delivered. The DLQ + // receives the message body and a DeadLetterQueueSourceArn + // attribute, and the source queue stops surfacing it. + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + dlqURL := createSQSQueueForTest(t, node, "dlq-target") + policy := `{"deadLetterTargetArn":"arn:aws:sqs:us-east-1:000000000000:dlq-target","maxReceiveCount":2}` + status, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "redrive-src", + "Attributes": map[string]string{ + "RedrivePolicy": policy, + }, + }) + if status != http.StatusOK { + t.Fatalf("create source: %d %v", status, out) + } + srcURL, _ := out["QueueUrl"].(string) + + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": srcURL, + "MessageBody": "poison", + }) + + // First two receives deliver the message normally (count 1, 2). + for i := range 2 { + _, out := callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": srcURL, + "MaxNumberOfMessages": 1, + "VisibilityTimeout": 1, + }) + msgs, _ := out["Messages"].([]any) + if len(msgs) != 1 { + t.Fatalf("receive #%d expected 1 msg, got %d (%v)", i, len(msgs), out) + } + // Wait past the visibility window so the next receive can pick + // it up again. + time.Sleep(1100 * time.Millisecond) + } + + // Third receive triggers the redrive — source returns 0 messages. 
+ _, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": srcURL, + "MaxNumberOfMessages": 1, + "VisibilityTimeout": 1, + }) + if msgs, _ := out["Messages"].([]any); len(msgs) != 0 { + t.Fatalf("source still returning poison message after redrive: %v", msgs) + } + + // DLQ now has the moved message. + _, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": dlqURL, + "MaxNumberOfMessages": 1, + "VisibilityTimeout": 60, + }) + msgs, _ := out["Messages"].([]any) + if len(msgs) != 1 { + t.Fatalf("DLQ expected 1 moved message, got %d (%v)", len(msgs), out) + } + moved, _ := msgs[0].(map[string]any) + if moved["Body"] != "poison" { + t.Fatalf("DLQ message body = %v, want poison", moved["Body"]) + } + // ApproximateReceiveCount on the DLQ side starts at 1 (this single + // receive); the source's count is not carried over. + movedAttrs, _ := moved["Attributes"].(map[string]any) + if movedAttrs["ApproximateReceiveCount"] != "1" { + t.Fatalf("DLQ message ApproximateReceiveCount = %v, want 1", movedAttrs["ApproximateReceiveCount"]) + } +} + +func TestSQSServer_FifoSequenceNumberMonotonic(t *testing.T) { + t.Parallel() + // Two FIFO sends must come back with strictly increasing + // SequenceNumber, and ReceiveMessage must echo the same number on + // the corresponding message. 
+ nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + _, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "fifo-seq.fifo", + "Attributes": map[string]string{"FifoQueue": "true"}, + }) + url, _ := out["QueueUrl"].(string) + + first := sendFifoMessage(t, node, url, "g1", "d1", "a") + second := sendFifoMessage(t, node, url, "g1", "d2", "b") + if first >= second { + t.Fatalf("FIFO SequenceNumbers not increasing: first=%d second=%d", first, second) + } + + _, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": url, + "MaxNumberOfMessages": 1, + "VisibilityTimeout": 60, + }) + msgs, _ := out["Messages"].([]any) + if len(msgs) != 1 { + t.Fatalf("expected 1 received, got %d", len(msgs)) + } + m, _ := msgs[0].(map[string]any) + attrs, _ := m["Attributes"].(map[string]any) + seqStr, _ := attrs["SequenceNumber"].(string) + got, _ := strconv.ParseUint(seqStr, 10, 64) + if got != first { + t.Fatalf("Receive SequenceNumber=%d, want first send's %d", got, first) + } +} + +// assertApproxCounterAttrs verifies the Approximate counters and the +// catalog metadata fields produced by GetQueueAttributes for the +// hand-built (visible=1, not-visible=1, delayed=1) fixture. 
+func assertApproxCounterAttrs(t *testing.T, attrs map[string]any) { + t.Helper() + if attrs["ApproximateNumberOfMessages"] != "1" { + t.Fatalf("Visible counter = %v, want 1 (%v)", attrs["ApproximateNumberOfMessages"], attrs) + } + if attrs["ApproximateNumberOfMessagesNotVisible"] != "1" { + t.Fatalf("NotVisible counter = %v, want 1", attrs["ApproximateNumberOfMessagesNotVisible"]) + } + if attrs["ApproximateNumberOfMessagesDelayed"] != "1" { + t.Fatalf("Delayed counter = %v, want 1", attrs["ApproximateNumberOfMessagesDelayed"]) + } + if got, _ := attrs["QueueArn"].(string); got == "" || got[:11] != "arn:aws:sqs" { + t.Fatalf("QueueArn malformed: %v", attrs["QueueArn"]) + } + if attrs["CreatedTimestamp"] == nil || attrs["LastModifiedTimestamp"] == nil { + t.Fatalf("expected created/modified timestamps, got %v", attrs) + } +} + +func sendFifoMessage(t *testing.T, node Node, url, groupID, dedupID, body string) uint64 { + t.Helper() + status, out := callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": url, + "MessageBody": body, + "MessageGroupId": groupID, + "MessageDeduplicationId": dedupID, + }) + if status != http.StatusOK { + t.Fatalf("FIFO send: %d %v", status, out) + } + seqStr, _ := out["SequenceNumber"].(string) + seq, err := strconv.ParseUint(seqStr, 10, 64) + if err != nil { + t.Fatalf("SequenceNumber not parseable: %v", out["SequenceNumber"]) + } + return seq +} + +func TestSQSServer_SendMessageBatchFifoDedupAndSequence(t *testing.T) { + t.Parallel() + // SendMessageBatch on a FIFO queue must (a) honor per-entry dedup — + // two entries with the same MessageDeduplicationId only land once + // and report the same MessageId, and (b) assign strictly increasing + // SequenceNumbers across distinct entries. The standard-queue + // single-OCC fast path would lose both invariants by skipping the + // dedup record and writing identical sequence numbers, which is + // the regression flagged by Codex P1. 
+ nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + _, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "fifo-batch.fifo", + "Attributes": map[string]string{"FifoQueue": "true"}, + }) + url, _ := out["QueueUrl"].(string) + + entries := []map[string]any{ + {"Id": "a", "MessageBody": "alpha", "MessageGroupId": "g", "MessageDeduplicationId": "d-a"}, + {"Id": "b", "MessageBody": "beta", "MessageGroupId": "g", "MessageDeduplicationId": "d-b"}, + // Duplicate dedup id of "a" — must collapse to the same MessageId. + {"Id": "c", "MessageBody": "alpha-again", "MessageGroupId": "g", "MessageDeduplicationId": "d-a"}, + } + status, body := callSQS(t, node, sqsSendMessageBatchTarget, map[string]any{ + "QueueUrl": url, + "Entries": entries, + }) + if status != http.StatusOK { + t.Fatalf("send batch fifo: %d %v", status, body) + } + successful, _ := body["Successful"].([]any) + if len(successful) != 3 { + t.Fatalf("expected 3 successful, got %d (%v)", len(successful), successful) + } + + byID := map[string]map[string]any{} + for _, s := range successful { + m, _ := s.(map[string]any) + id, _ := m["Id"].(string) + byID[id] = m + } + if byID["a"]["MessageId"] != byID["c"]["MessageId"] { + t.Fatalf("dedup hit must reuse original MessageId; a=%v c=%v", + byID["a"]["MessageId"], byID["c"]["MessageId"]) + } + seqAStr, _ := byID["a"]["SequenceNumber"].(string) + seqBStr, _ := byID["b"]["SequenceNumber"].(string) + seqCStr, _ := byID["c"]["SequenceNumber"].(string) + seqA, _ := strconv.ParseUint(seqAStr, 10, 64) + seqB, _ := strconv.ParseUint(seqBStr, 10, 64) + seqC, _ := strconv.ParseUint(seqCStr, 10, 64) + if seqA == 0 || seqB == 0 { + t.Fatalf("FIFO batch sends must assign sequence numbers: a=%d b=%d", seqA, seqB) + } + if seqA >= seqB { + t.Fatalf("SequenceNumber must be strictly increasing: a=%d b=%d", seqA, seqB) + } + if seqC != seqA { + t.Fatalf("dedup hit must reuse original sequence; a=%d c=%d", seqA, seqC) 
+ } + + // Only two messages should be deliverable (a, b) — the dedup + // hit on c collapsed back to a's record. + _, body = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": url, + "MaxNumberOfMessages": 10, + "VisibilityTimeout": 60, + }) + msgs, _ := body["Messages"].([]any) + // FIFO group lock means we only receive the head until it is deleted. + if len(msgs) != 1 { + t.Fatalf("FIFO batch + group lock expected exactly 1 head message, got %d", len(msgs)) + } +} + +func TestSQSServer_FifoDedupBlocksDuplicateSend(t *testing.T) { + t.Parallel() + // A second FIFO send with the same MessageDeduplicationId inside + // the dedup window must come back with the original MessageId and + // not write a new copy on the queue. + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + _, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "fifo-dedup.fifo", + "Attributes": map[string]string{"FifoQueue": "true"}, + }) + url, _ := out["QueueUrl"].(string) + + status, first := callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": url, + "MessageBody": "x", + "MessageGroupId": "g", + "MessageDeduplicationId": "same", + }) + if status != http.StatusOK { + t.Fatalf("first send: %d %v", status, first) + } + status, second := callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": url, + "MessageBody": "different-body-but-same-dedup", + "MessageGroupId": "g", + "MessageDeduplicationId": "same", + }) + if status != http.StatusOK { + t.Fatalf("dedup send: %d %v", status, second) + } + if first["MessageId"] != second["MessageId"] { + t.Fatalf("dedup hit must reuse original MessageId: %v vs %v", first, second) + } + + // Only one message should be deliverable. 
+ _, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": url, + "MaxNumberOfMessages": 10, + "VisibilityTimeout": 60, + }) + msgs, _ := out["Messages"].([]any) + if len(msgs) != 1 { + t.Fatalf("dedup window must collapse send to 1 message; got %d", len(msgs)) + } + m, _ := msgs[0].(map[string]any) + if m["Body"] != "x" { + t.Fatalf("dedup must keep the original body, got %v", m["Body"]) + } +} + +func TestSQSServer_FifoContentBasedDedup(t *testing.T) { + t.Parallel() + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + _, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "fifo-cbd.fifo", + "Attributes": map[string]string{ + "FifoQueue": "true", + "ContentBasedDeduplication": "true", + }, + }) + url, _ := out["QueueUrl"].(string) + + status, first := callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": url, + "MessageBody": "same-body", + "MessageGroupId": "g", + }) + if status != http.StatusOK { + t.Fatalf("first cbd send: %d %v", status, first) + } + status, second := callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": url, + "MessageBody": "same-body", + "MessageGroupId": "g", + }) + if status != http.StatusOK { + t.Fatalf("dup cbd send: %d %v", status, second) + } + if first["MessageId"] != second["MessageId"] { + t.Fatalf("ContentBasedDeduplication must hash body to the same dedup id: %v vs %v", first, second) + } +} + +func TestSQSServer_FifoGroupLockHoldsAcrossVisibilityExpiry(t *testing.T) { + t.Parallel() + // Two FIFO messages in the same group: the first receive must pull + // message A (the head). Even after A's visibility window expires + // (without a delete), the next receive must re-deliver A — never + // jump ahead to B — because the group lock pins itself to the head + // across visibility-timeout transitions. 
+ nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + _, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "fifo-grouplock.fifo", + "Attributes": map[string]string{"FifoQueue": "true"}, + }) + url, _ := out["QueueUrl"].(string) + + _ = sendFifoMessage(t, node, url, "g", "a", "first") + _ = sendFifoMessage(t, node, url, "g", "b", "second") + + // First receive: must be the head. + _, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": url, + "MaxNumberOfMessages": 10, + "VisibilityTimeout": 1, + }) + msgs, _ := out["Messages"].([]any) + if len(msgs) != 1 { + t.Fatalf("expected exactly 1 head message, got %d (group lock should hide successor)", len(msgs)) + } + first, _ := msgs[0].(map[string]any) + if first["Body"] != "first" { + t.Fatalf("FIFO head must be 'first', got %v", first["Body"]) + } + + // Wait past the visibility window; group lock must keep the head + // pinned so the next receive re-delivers A, not B. + time.Sleep(1200 * time.Millisecond) + _, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": url, + "MaxNumberOfMessages": 10, + "VisibilityTimeout": 60, + }) + msgs, _ = out["Messages"].([]any) + if len(msgs) != 1 { + t.Fatalf("expected re-delivery of head, got %d messages", len(msgs)) + } + again, _ := msgs[0].(map[string]any) + if again["Body"] != "first" { + t.Fatalf("FIFO redelivery must stay on head; got %v", again["Body"]) + } + if again["MessageId"] != first["MessageId"] { + t.Fatalf("FIFO redelivery must reuse the same MessageId") + } + + // Delete the head; the next receive can finally pick up the second. 
+ receiptHandle, _ := again["ReceiptHandle"].(string) + deleteMessageOK(t, node, url, receiptHandle) + _, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": url, + "MaxNumberOfMessages": 10, + "VisibilityTimeout": 60, + }) + msgs, _ = out["Messages"].([]any) + if len(msgs) != 1 { + t.Fatalf("expected successor after head delete, got %d", len(msgs)) + } + tail, _ := msgs[0].(map[string]any) + if tail["Body"] != "second" { + t.Fatalf("expected successor body 'second', got %v", tail["Body"]) + } +} + +func TestSQSServer_RetentionReaperRemovesOldMessage(t *testing.T) { + t.Parallel() + // Send a message, backdate it past retention, then drive one reaper + // pass and confirm the data, vis, and byage entries are gone. The + // reaper must succeed without going through ReceiveMessage — that + // is the whole reason byage exists, since a message stuck in + // flight could otherwise live forever past retention. + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + _, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "reap-target", + "Attributes": map[string]string{ + "MessageRetentionPeriod": "60", + }, + }) + url, _ := out["QueueUrl"].(string) + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": url, + "MessageBody": "to-be-reaped", + }) + + // Backdate so retention has elapsed. + backdateSQSMessageForTest(t, nodes[0], "reap-target", 120*time.Second) + + // Drive one reaper pass directly so the test does not have to + // wait the natural 30 s tick. + srv := node.sqsServer + if err := srv.reapAllQueues(t.Context()); err != nil { + t.Fatalf("reapAllQueues: %v", err) + } + + // Receive must come back empty — the data record is gone, the + // scan path will not find it via the visibility index either. 
+ status, body := callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": url, + "MaxNumberOfMessages": 1, + }) + if status != http.StatusOK { + t.Fatalf("receive after reap: %d %v", status, body) + } + if msgs, _ := body["Messages"].([]any); len(msgs) != 0 { + t.Fatalf("reaper left a message behind: %v", msgs) + } + + // ApproximateNumberOfMessages must reflect the empty queue too. + _, body = callSQS(t, node, sqsGetQueueAttributesTarget, map[string]any{ + "QueueUrl": url, + "AttributeNames": []string{"ApproximateNumberOfMessages"}, + }) + attrs, _ := body["Attributes"].(map[string]any) + if attrs["ApproximateNumberOfMessages"] != "0" { + t.Fatalf("approx counter after reap = %v, want 0", attrs) + } +} + +func TestSQSServer_PurgeThenDeleteOrphansCleaned(t *testing.T) { + t.Parallel() + // Regression: PurgeQueue followed by DeleteQueue, both committing + // before any reaper tick, used to permanently leak the pre-purge + // generation. PurgeQueue advanced the generation counter without + // writing a tombstone for the old gen, then DeleteQueue removed + // the meta row and only tombstoned the post-purge gen. After that, + // * reapAllQueues -> scanQueueNames sees no meta -> skip, + // * reapTombstonedQueues only finds the post-purge gen's + // tombstone -> reapDeadByAge filters by that gen -> the older + // gen's byage / data / vis records are never visited. + // Fix: PurgeQueue tombstones the pre-bump gen in the same OCC + // transaction that bumps the counter, so the tombstone-driven + // reaper sweeps both generations. 
+ nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "purge-del-orphans") + stampSQSMessages(t, node, queueURL, "g1-", 3) + expectSQSOK(t, node, sqsPurgeQueueTarget, map[string]any{"QueueUrl": queueURL}, "purge") + expectSQSOK(t, node, sqsDeleteQueueTarget, map[string]any{"QueueUrl": queueURL}, "delete") + + srv := node.sqsServer + ctx := t.Context() + byagePrefix := sqsMsgByAgePrefixAllGenerations("purge-del-orphans") + byageEnd := prefixScanEnd(byagePrefix) + + // Sanity: gen-1 byage rows exist before any reaper pass; otherwise + // the test would pass trivially even if the bug were still present. + if got := scanCount(t, srv, ctx, byagePrefix, byageEnd); got == 0 { + t.Fatalf("expected gen-1 byage rows after purge+delete, got none") + } + + if err := srv.reapAllQueues(ctx); err != nil { + t.Fatalf("reapAllQueues: %v", err) + } + + if got := scanCount(t, srv, ctx, byagePrefix, byageEnd); got != 0 { + t.Fatalf("byage rows leaked after purge+delete+reap: %d entries", got) + } + // Both tombstones (pre-purge gen + post-delete gen) must be + // drained too, otherwise every subsequent reaper tick re-scans an + // empty cohort forever. + tombPrefix := []byte(SqsQueueTombstonePrefix) + if got := scanCount(t, srv, ctx, tombPrefix, prefixScanEnd(tombPrefix)); got != 0 { + t.Fatalf("tombstones leaked after purge+delete+reap: %d entries", got) + } +} + +// stampSQSMessages sends `count` bodies tagged with `prefix` + index. +// Send errors are intentionally ignored: callers use this to set up +// state, and per-message failures show up downstream as missing rows. 
+func stampSQSMessages(t *testing.T, node Node, queueURL, prefix string, count int) { + t.Helper() + for i := range count { + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MessageBody": prefix + strconv.Itoa(i), + }) + } +} + +// expectSQSOK calls the named SQS target and fails the test if the +// HTTP status is not 200. The label is used in the error message so +// chained calls in a single test produce distinguishable failures. +func expectSQSOK(t *testing.T, node Node, target string, in map[string]any, label string) { + t.Helper() + status, body := callSQS(t, node, target, in) + if status != http.StatusOK { + t.Fatalf("%s: %d %v", label, status, body) + } +} + +// scanCount returns the number of entries under [prefix, end) at a +// fresh read timestamp. Errors are fatal so callers do not have to +// thread an extra branch through their assertions. +func scanCount(t *testing.T, srv *SQSServer, ctx context.Context, prefix, end []byte) int { + t.Helper() + pairs, err := srv.store.ScanAt(ctx, prefix, end, 100, srv.nextTxnReadTS(ctx)) + if err != nil { + t.Fatalf("scan [%x, %x): %v", prefix, end, err) + } + return len(pairs) +} + +func TestSQSServer_RetentionReaperReclaimsPurgedGenerations(t *testing.T) { + t.Parallel() + // PurgeQueue advances the queue generation rather than walking the + // keyspace, so prior-generation data/vis/byage records become + // orphans that no normal request path can ever observe again. The + // reaper must walk every generation under the queue and delete + // those orphans, otherwise each purge leaks storage permanently. + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "purge-orphans") + + // Stamp three messages on the original generation, then purge. 
+ for i := range 3 { + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MessageBody": "g0-" + strconv.Itoa(i), + }) + } + if status, body := callSQS(t, node, sqsPurgeQueueTarget, map[string]any{ + "QueueUrl": queueURL, + }); status != http.StatusOK { + t.Fatalf("purge: %d %v", status, body) + } + + // Confirm the byage prefix still has the orphan rows before + // reaping. + srv := node.sqsServer + ctx := t.Context() + prefix := sqsMsgByAgePrefixAllGenerations("purge-orphans") + end := prefixScanEnd(prefix) + before, err := srv.store.ScanAt(ctx, prefix, end, 100, srv.nextTxnReadTS(ctx)) + if err != nil { + t.Fatalf("pre-reap scan: %v", err) + } + if len(before) == 0 { + t.Fatalf("expected pre-reap orphan rows, got none") + } + + // Drive one reaper pass; the orphan generation must be cleaned. + if err := srv.reapAllQueues(ctx); err != nil { + t.Fatalf("reapAllQueues: %v", err) + } + assertNoPurgeOrphansLeft(t, srv, "purge-orphans", prefix, end) +} + +// assertNoPurgeOrphansLeft scans the byage prefix after a reaper pass +// and fails the test if any entry still references a generation older +// than the queue's current generation. 
+func assertNoPurgeOrphansLeft(t *testing.T, srv *SQSServer, queueName string, prefix, end []byte) { + t.Helper() + ctx := t.Context() + readTS := srv.nextTxnReadTS(ctx) + meta, _, metaErr := srv.loadQueueMetaAt(ctx, queueName, readTS) + if metaErr != nil { + t.Fatalf("meta load: %v", metaErr) + } + after, err := srv.store.ScanAt(ctx, prefix, end, 100, srv.nextTxnReadTS(ctx)) + if err != nil { + t.Fatalf("post-reap scan: %v", err) + } + for _, kvp := range after { + parsed, ok := parseSqsMsgByAgeKey(kvp.Key, queueName) + if !ok { + continue + } + if parsed.Generation < meta.Generation { + t.Fatalf("orphan row from gen=%d still present after reap (current=%d)", + parsed.Generation, meta.Generation) + } + } +} + +func TestSQSServer_RetentionReaperDropsExpiredFifoDedup(t *testing.T) { + t.Parallel() + // Expired dedup records must be reaped, otherwise queues with + // mostly-unique MessageDeduplicationIds accumulate permanent + // dedup rows. The send path already treats expired entries as + // misses; the reaper is the only path that frees the storage. 
+ nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + _, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "fifo-dedup-reap.fifo", + "Attributes": map[string]string{"FifoQueue": "true"}, + }) + url, _ := out["QueueUrl"].(string) + _ = sendFifoMessage(t, node, url, "g", "d-1", "x") + + srv := node.sqsServer + ctx := t.Context() + dedupKey := sqsMsgDedupKey("fifo-dedup-reap.fifo", 1, "d-1") + readTS := srv.nextTxnReadTS(ctx) + raw, err := srv.store.GetAt(ctx, dedupKey, readTS) + if err != nil { + t.Fatalf("read dedup: %v", err) + } + rec, err := decodeFifoDedupRecord(raw) + if err != nil { + t.Fatalf("decode dedup: %v", err) + } + rec.ExpiresAtMillis = time.Now().UnixMilli() - 1000 + body, err := encodeFifoDedupRecord(rec) + if err != nil { + t.Fatalf("encode dedup: %v", err) + } + commitReq := &kv.OperationGroup[kv.OP]{ + IsTxn: true, + StartTS: readTS, + Elems: []*kv.Elem[kv.OP]{ + {Op: kv.Put, Key: dedupKey, Value: body}, + }, + } + if _, err := srv.coordinator.Dispatch(ctx, commitReq); err != nil { + t.Fatalf("backdate dispatch: %v", err) + } + + if err := srv.reapAllQueues(ctx); err != nil { + t.Fatalf("reapAllQueues: %v", err) + } + + if _, err := srv.store.GetAt(ctx, dedupKey, srv.nextTxnReadTS(ctx)); err == nil { + t.Fatalf("expired dedup record still present after reap") + } +} + +func TestSQSServer_ReaperCleansDeletedQueueOrphans(t *testing.T) { + t.Parallel() + // DeleteQueue removes the meta row but leaves data / vis / byage / + // dedup / group keys keyed by the old generation. Without a + // tombstone-driven reaper pass, scanQueueNames would never visit + // the deleted queue again and those keys would leak forever. Here + // we send a few messages, delete the queue, and confirm the + // orphan rows are gone after a reaper pass and the tombstone is + // cleaned up. 
+ nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "del-orphans") + + for i := range 3 { + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MessageBody": "x-" + strconv.Itoa(i), + }) + } + if status, body := callSQS(t, node, sqsDeleteQueueTarget, map[string]any{ + "QueueUrl": queueURL, + }); status != http.StatusOK { + t.Fatalf("delete: %d %v", status, body) + } + + srv := node.sqsServer + ctx := t.Context() + // Tombstone is present pre-reap. + tombPrefix := []byte(SqsQueueTombstonePrefix) + tombEnd := prefixScanEnd(tombPrefix) + preTomb, err := srv.store.ScanAt(ctx, tombPrefix, tombEnd, 100, srv.nextTxnReadTS(ctx)) + if err != nil { + t.Fatalf("pre-reap tombstone scan: %v", err) + } + if len(preTomb) == 0 { + t.Fatalf("DeleteQueue did not write a tombstone") + } + + // One reaper pass should clear byage + dedup + group + tombstone. + if err := srv.reapAllQueues(ctx); err != nil { + t.Fatalf("reapAllQueues: %v", err) + } + + byagePrefix := sqsMsgByAgePrefixAllGenerations("del-orphans") + byageEnd := prefixScanEnd(byagePrefix) + leftover, err := srv.store.ScanAt(ctx, byagePrefix, byageEnd, 100, srv.nextTxnReadTS(ctx)) + if err != nil { + t.Fatalf("post-reap byage scan: %v", err) + } + if len(leftover) != 0 { + t.Fatalf("byage rows leaked after delete + reap: %v", leftover) + } + postTomb, err := srv.store.ScanAt(ctx, tombPrefix, tombEnd, 100, srv.nextTxnReadTS(ctx)) + if err != nil { + t.Fatalf("post-reap tombstone scan: %v", err) + } + if len(postTomb) != 0 { + t.Fatalf("tombstone leaked after orphan reap: %d entries", len(postTomb)) + } +} + +func TestSQSServer_SendMessageBatchRejectsInvalidEntryId(t *testing.T) { + t.Parallel() + // AWS limits batch entry Ids to 1-80 chars of [a-zA-Z0-9_-]. + // Anything outside that grammar must return InvalidBatchEntryId, + // not be silently passed through. 
+ nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + url := createSQSQueueForTest(t, node, "bad-id") + + bad := []string{ + "has space", + "emoji-😀", + "slash/unsafe", + strings.Repeat("a", 81), + } + for _, id := range bad { + status, out := callSQS(t, node, sqsSendMessageBatchTarget, map[string]any{ + "QueueUrl": url, + "Entries": []map[string]any{ + {"Id": id, "MessageBody": "x"}, + }, + }) + if status != http.StatusBadRequest { + t.Fatalf("bad id %q: got %d want 400 (%v)", id, status, out) + } + if got, _ := out["__type"].(string); got != sqsErrInvalidBatchEntryId { + t.Fatalf("bad id %q: error type %q want %q", id, got, sqsErrInvalidBatchEntryId) + } + } + + // Valid ids still work. + status, _ := callSQS(t, node, sqsSendMessageBatchTarget, map[string]any{ + "QueueUrl": url, + "Entries": []map[string]any{ + {"Id": "valid-id_1", "MessageBody": "x"}, + }, + }) + if status != http.StatusOK { + t.Fatalf("valid id: status %d", status) + } +} + +func TestSQSServer_SendMessageBatchAttributesContributeToSizeCap(t *testing.T) { + t.Parallel() + // Body size alone is not the AWS request cap — MessageAttribute + // names + DataTypes + StringValues + BinaryValues all count. + // Without that, a client can ship tiny bodies and a few-MiB + // BinaryValue per entry and bypass the 256 KiB request cap. 
+ nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + url := createSQSQueueForTest(t, node, "attr-size-cap") + + huge := bytes.Repeat([]byte{0xff}, 200_000) // 200 KiB + entries := []map[string]any{ + { + "Id": "a", + "MessageBody": "tiny", + "MessageAttributes": map[string]any{ + "big": map[string]any{"DataType": "Binary", "BinaryValue": huge}, + }, + }, + { + "Id": "b", + "MessageBody": "tiny", + "MessageAttributes": map[string]any{ + "big": map[string]any{"DataType": "Binary", "BinaryValue": huge}, + }, + }, + } + status, body := callSQS(t, node, sqsSendMessageBatchTarget, map[string]any{ + "QueueUrl": url, + "Entries": entries, + }) + if status != http.StatusBadRequest { + t.Fatalf("oversize batch with attr bytes: got %d want 400 (%v)", status, body) + } + if got, _ := body["__type"].(string); got != sqsErrBatchRequestTooLong { + t.Fatalf("error type = %q, want %q", got, sqsErrBatchRequestTooLong) + } +} + +func TestSQSServer_RedrivePolicyRejectsSelfReference(t *testing.T) { + t.Parallel() + // A self-referential RedrivePolicy would let DLQ redrive loop + // poison messages forever inside the same queue with reset + // counters. The validator must reject it at attribute-apply time. + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + // CreateQueue with self-pointing RedrivePolicy is rejected. + policy := `{"deadLetterTargetArn":"arn:aws:sqs:us-east-1:000000000000:loopy","maxReceiveCount":3}` + status, body := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "loopy", + "Attributes": map[string]string{"RedrivePolicy": policy}, + }) + if status != http.StatusBadRequest { + t.Fatalf("self-ref RedrivePolicy on Create: got %d want 400 (%v)", status, body) + } + + // SetQueueAttributes likewise rejects. 
+ url := createSQSQueueForTest(t, node, "loopy") + status, body = callSQS(t, node, sqsSetQueueAttributesTarget, map[string]any{ + "QueueUrl": url, + "Attributes": map[string]string{"RedrivePolicy": policy}, + }) + if status != http.StatusBadRequest { + t.Fatalf("self-ref RedrivePolicy on SetAttrs: got %d want 400 (%v)", status, body) + } +} + +func TestSQSServer_ReceivePagesPastFifoGroupLockSkips(t *testing.T) { + t.Parallel() + // FIFO group lock keeps successive messages in the same group + // hidden behind the head. With many messages in one group ahead + // of a deliverable head in a different group, the receive must + // keep paging the visibility index instead of stopping after + // the first page of group-locked candidates. + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + _, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "fifo-skipheavy.fifo", + "Attributes": map[string]string{"FifoQueue": "true"}, + }) + url, _ := out["QueueUrl"].(string) + + // Group "g1" gets one head, then 30 messages in g2 (which will + // all be pinned behind a single delivered head). Take "g1"'s head + // (which holds the g1 lock) — only g2's head should ever be + // deliverable on the next receive even though 30 candidates show + // up in the visibility index ahead of it. + _ = sendFifoMessage(t, node, url, "g1", "g1-d1", "g1-head") + for i := range 30 { + _ = sendFifoMessage(t, node, url, "g2", "g2-d"+strconv.Itoa(i), "g2-"+strconv.Itoa(i)) + } + + // First receive picks up the heads of each group; with two groups + // we expect both g1-head and the first g2 message. The remaining + // g2 messages are blocked behind g2's lock. 
+ _, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": url, + "MaxNumberOfMessages": 10, + "VisibilityTimeout": 60, + }) + msgs, _ := out["Messages"].([]any) + if len(msgs) < 2 { + t.Fatalf("expected at least 2 head messages (one per group), got %d", len(msgs)) + } + + // Second receive must return 0 — both groups are locked, but the + // scan must page through every group-locked candidate without + // errantly exhausting its budget on the first page. + _, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": url, + "MaxNumberOfMessages": 10, + }) + if msgs, _ := out["Messages"].([]any); len(msgs) != 0 { + t.Fatalf("expected 0 (all groups locked), got %d", len(msgs)) + } +} + +func TestSQSServer_CreateQueueRejectsTooManyTags(t *testing.T) { + t.Parallel() + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + tags := make(map[string]string, 60) + for i := range 60 { + tags["tag-"+strconv.Itoa(i)] = "v" + } + status, body := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "too-many-tags", + "tags": tags, + }) + if status != http.StatusBadRequest { + t.Fatalf("60-tag create: got %d want 400 (%v)", status, body) + } + if got, _ := body["__type"].(string); got != sqsErrInvalidAttributeValue { + t.Fatalf("error type: %q want %q", got, sqsErrInvalidAttributeValue) + } +} + +func TestSQSServer_BatchOnMissingQueueIsRequestLevelError(t *testing.T) { + t.Parallel() + // AWS returns request-level QueueDoesNotExist (HTTP 400) on + // DeleteMessageBatch / ChangeMessageVisibilityBatch when the + // queue does not exist — not an HTTP-200 envelope with per-entry + // failures, which retry logic could misclassify as partial + // success. 
+ nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + missingURL := "http://" + node.sqsAddress + "/no-such-queue" + + dummyHandle, err := encodeReceiptHandle(1, "00000000000000000000000000000000", + bytes.Repeat([]byte{0x01}, sqsReceiptTokenBytes)) + if err != nil { + t.Fatalf("encode handle: %v", err) + } + + status, body := callSQS(t, node, sqsDeleteMessageBatchTarget, map[string]any{ + "QueueUrl": missingURL, + "Entries": []map[string]any{ + {"Id": "a", "ReceiptHandle": dummyHandle}, + }, + }) + if status != http.StatusBadRequest { + t.Fatalf("delete batch missing queue: got %d want 400 (%v)", status, body) + } + if got, _ := body["__type"].(string); got != sqsErrQueueDoesNotExist { + t.Fatalf("delete batch error type: %q want %q", got, sqsErrQueueDoesNotExist) + } + + status, body = callSQS(t, node, sqsChangeMessageVisibilityBatchTgt, map[string]any{ + "QueueUrl": missingURL, + "Entries": []map[string]any{ + {"Id": "a", "ReceiptHandle": dummyHandle, "VisibilityTimeout": 30}, + }, + }) + if status != http.StatusBadRequest { + t.Fatalf("change vis batch missing queue: got %d want 400 (%v)", status, body) + } + if got, _ := body["__type"].(string); got != sqsErrQueueDoesNotExist { + t.Fatalf("change vis batch error type: %q want %q", got, sqsErrQueueDoesNotExist) + } +} + +func TestSQSServer_RedrivePolicyFifoDlqRejectsStandardSource(t *testing.T) { + t.Parallel() + // A Standard source pointing at a FIFO DLQ would copy empty + // MessageGroupId into the DLQ record; the DLQ-side receive only + // enforces FIFO group-lock when MessageGroupId is non-empty, so + // those messages bypass FIFO semantics inside a queue clients + // believe is strictly ordered. The redrive path must reject the + // move when this would happen. + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + // Create FIFO DLQ. 
+ _, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "dlq.fifo", + "Attributes": map[string]string{"FifoQueue": "true"}, + }) + if dlqURL, _ := out["QueueUrl"].(string); dlqURL == "" { + t.Fatalf("FIFO DLQ create failed: %v", out) + } + + // Standard source with RedrivePolicy targeting the FIFO DLQ. + policy := `{"deadLetterTargetArn":"arn:aws:sqs:us-east-1:000000000000:dlq.fifo","maxReceiveCount":1}` + status, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "src-standard", + "Attributes": map[string]string{"RedrivePolicy": policy}, + }) + if status != http.StatusOK { + t.Fatalf("create standard source with FIFO-DLQ policy: %d %v", status, out) + } + srcURL, _ := out["QueueUrl"].(string) + + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": srcURL, + "MessageBody": "poison", + }) + // First receive bumps ReceiveCount to 1 == maxReceiveCount; second + // receive should attempt redrive and the FIFO compatibility gate + // must trip. The receive path returns 5xx (sqsErrInternalFailure + // surfaced via sqsAPIError) rather than silently moving an + // invalid record. + _, _ = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": srcURL, + "MaxNumberOfMessages": 1, + "VisibilityTimeout": 1, + }) + time.Sleep(1100 * time.Millisecond) + status, body := callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": srcURL, + "MaxNumberOfMessages": 1, + }) + if status == http.StatusOK { + // AWS-level invariant: the message must NOT have been + // redriven into the FIFO DLQ. Even if the receive returns + // OK, the failure is that the FIFO DLQ should not now hold + // a record with an empty MessageGroupId. 
+ if msgs, _ := body["Messages"].([]any); len(msgs) > 0 { + t.Fatalf("FIFO DLQ should not receive redriven Standard source records, got msgs=%v", msgs) + } + } +} + +func TestSQSServer_RedrivePolicyStandardDlqRejectsFifoSource(t *testing.T) { + t.Parallel() + // Symmetric to RedrivePolicyFifoDlqRejectsStandardSource: the + // existing guard rejected only the Standard→FIFO direction, but + // FIFO→Standard was equally broken. A FIFO source carries + // MessageGroupId on every record; copying that into a Standard + // DLQ and then issuing ReceiveMessage on the DLQ trips + // tryDeliverCandidate's FIFO group-lock branch (gated solely on + // MessageGroupId != ""), which serializes delivery in a queue + // clients believe behaves as Standard. AWS rejects mixed-type + // redrive policies; this test pins that behavior. + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + // Standard DLQ (no FifoQueue attribute). + _, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "dlq-standard", + }) + dlqURL, _ := out["QueueUrl"].(string) + if dlqURL == "" { + t.Fatalf("Standard DLQ create failed: %v", out) + } + + // FIFO source with RedrivePolicy targeting the Standard DLQ. 
+ policy := `{"deadLetterTargetArn":"arn:aws:sqs:us-east-1:000000000000:dlq-standard","maxReceiveCount":1}` + status, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "src-fifo.fifo", + "Attributes": map[string]string{ + "FifoQueue": "true", + "RedrivePolicy": policy, + }, + }) + if status != http.StatusOK { + t.Fatalf("create FIFO source with Standard-DLQ policy: %d %v", status, out) + } + srcURL, _ := out["QueueUrl"].(string) + + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": srcURL, + "MessageBody": "poison", + "MessageGroupId": "g1", + "MessageDeduplicationId": "d1", + }) + // First receive bumps ReceiveCount to 1 == maxReceiveCount; + // second receive (after visibility expiry) should attempt redrive. + // The runtime type-compatibility gate must trip, leaving the DLQ + // empty and the source message intact. + _, _ = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": srcURL, + "MaxNumberOfMessages": 1, + "VisibilityTimeout": 1, + }) + time.Sleep(1100 * time.Millisecond) + _, _ = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": srcURL, + "MaxNumberOfMessages": 1, + }) + + // Direct DLQ receive: a successful redrive would have written a + // record with non-empty MessageGroupId here; the fix must keep + // the DLQ empty. + _, body := callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": dlqURL, + "MaxNumberOfMessages": 10, + }) + if msgs, _ := body["Messages"].([]any); len(msgs) > 0 { + t.Fatalf("Standard DLQ received a redriven FIFO record (would carry MessageGroupId): %v", msgs) + } +} + +func TestSQSServer_TagQueueRequiresTags(t *testing.T) { + t.Parallel() + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "tag-required") + + // Missing Tags is a MissingParameter, not a silent no-op. 
+ status, out := callSQS(t, node, sqsTagQueueTarget, map[string]any{ + "QueueUrl": queueURL, + }) + if status != http.StatusBadRequest || out["__type"] != sqsErrMissingParameter { + t.Fatalf("tag without Tags: %d %v", status, out) + } + status, out = callSQS(t, node, sqsUntagQueueTarget, map[string]any{ + "QueueUrl": queueURL, + }) + if status != http.StatusBadRequest || out["__type"] != sqsErrMissingParameter { + t.Fatalf("untag without TagKeys: %d %v", status, out) + } +} + +// TestSQSServer_FifoFifoRedriveAssignsSequenceNumber pins the round-N +// Codex P1 fix on `cdb3c87` redrive: a FIFO source whose RedrivePolicy +// targets a FIFO DLQ used to commit the DLQ record with +// SequenceNumber = 0 (zero-value, not even AWS's "starts at 1" +// invariant), and the DLQ's per-queue sequence counter +// (sqsQueueSeqKey) was never advanced. Consumers reading the DLQ saw +// 0 verbatim, and a normal FIFO send to the DLQ later produced a +// number lower than the redriven message — non-monotonic per AWS's +// FIFO contract. The fix loads the DLQ seq at readTS, increments it, +// stamps it onto the DLQ record, and includes the seq Put in the OCC +// transaction. This test asserts both halves: (a) the redriven DLQ +// record carries SequenceNumber = 1, (b) a subsequent FIFO send to +// the DLQ carries SequenceNumber = 2. +func TestSQSServer_FifoFifoRedriveAssignsSequenceNumber(t *testing.T) { + t.Parallel() + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + + // FIFO DLQ. + _, out := callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "dlq-fifo.fifo", + "Attributes": map[string]string{"FifoQueue": "true"}, + }) + dlqURL, _ := out["QueueUrl"].(string) + if dlqURL == "" { + t.Fatalf("FIFO DLQ create failed: %v", out) + } + + // FIFO source pointing at the FIFO DLQ. 
Both queues are FIFO so + // the type-equality guard added in cdb3c87 lets the redrive + // proceed; this test exercises the SequenceNumber assignment that + // became reachable only with that change. + policy := `{"deadLetterTargetArn":"arn:aws:sqs:us-east-1:000000000000:dlq-fifo.fifo","maxReceiveCount":1}` + _, out = callSQS(t, node, sqsCreateQueueTarget, map[string]any{ + "QueueName": "src-fifo.fifo", + "Attributes": map[string]string{ + "FifoQueue": "true", + "RedrivePolicy": policy, + }, + }) + srcURL, _ := out["QueueUrl"].(string) + + // Send a poison message to the FIFO source. + _, _ = callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": srcURL, + "MessageBody": "poison", + "MessageGroupId": "g1", + "MessageDeduplicationId": "d-poison", + }) + + // First receive bumps ReceiveCount to 1 == maxReceiveCount; + // second receive (after visibility expiry) triggers the redrive. + _, _ = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": srcURL, + "MaxNumberOfMessages": 1, + "VisibilityTimeout": 1, + }) + time.Sleep(1100 * time.Millisecond) + _, _ = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": srcURL, + "MaxNumberOfMessages": 1, + }) + + // DLQ now has the moved message. SequenceNumber must be > 0; + // pre-fix it was 0 (zero-value, never set). 
+ _, out = callSQS(t, node, sqsReceiveMessageTarget, map[string]any{ + "QueueUrl": dlqURL, + "MaxNumberOfMessages": 1, + "VisibilityTimeout": 60, + }) + msgs, _ := out["Messages"].([]any) + if len(msgs) != 1 { + t.Fatalf("DLQ expected 1 redriven message, got %d (%v)", len(msgs), out) + } + moved, _ := msgs[0].(map[string]any) + movedAttrs, _ := moved["Attributes"].(map[string]any) + movedSeqStr, _ := movedAttrs["SequenceNumber"].(string) + movedSeq, _ := strconv.ParseUint(movedSeqStr, 10, 64) + if movedSeq == 0 { + t.Fatalf("redriven DLQ message has SequenceNumber=0 (regression: counter not advanced); attrs=%v", movedAttrs) + } + + // Second half: a normal FIFO send to the DLQ must observe the + // advanced counter and assign movedSeq + 1, not start over from + // 1 (which would put two messages with the same sequence on the + // queue, the exact bug the fix is preventing). + follow := sendFifoMessage(t, node, dlqURL, "g-dlq", "d-follow", "follow") + if follow != movedSeq+1 { + t.Fatalf("DLQ FIFO send after redrive: SequenceNumber=%d, want %d (= %d + 1)", follow, movedSeq+1, movedSeq) + } +} + +// TestSQSServer_SendMessageRejectsBinaryWithStringValue pins the +// round-N Codex P2 fix: AWS requires a MessageAttributeValue to +// populate exactly one of {StringValue, BinaryValue}. The previous +// validator only checked that BinaryValue was non-empty for Binary +// types; an attribute carrying both fields would be persisted into +// the record (and round-tripped on ReceiveMessage), which is not +// AWS behavior and would surface mismatched MD5 hashes downstream. +// The symmetric String/Number + non-empty BinaryValue case is also +// asserted. 
+func TestSQSServer_SendMessageRejectsBinaryWithStringValue(t *testing.T) { + t.Parallel() + nodes, _, _ := createNode(t, 1) + defer shutdown(nodes) + node := sqsLeaderNode(t, nodes) + queueURL := createSQSQueueForTest(t, node, "binary-string-mix") + + cases := []struct { + name string + attrs map[string]any + }{ + { + name: "Binary with non-empty StringValue", + attrs: map[string]any{ + "X": map[string]any{ + "DataType": "Binary", + "BinaryValue": []byte{0x01, 0x02, 0x03}, + "StringValue": "stowaway", + }, + }, + }, + { + name: "String with non-empty BinaryValue", + attrs: map[string]any{ + "X": map[string]any{ + "DataType": "String", + "StringValue": "ok", + "BinaryValue": []byte{0x01}, + }, + }, + }, + { + name: "Number with non-empty BinaryValue", + attrs: map[string]any{ + "X": map[string]any{ + "DataType": "Number", + "StringValue": "1", + "BinaryValue": []byte{0x01}, + }, + }, + }, + } + for _, tc := range cases { + t.Run(tc.name, func(t *testing.T) { + status, out := callSQS(t, node, sqsSendMessageTarget, map[string]any{ + "QueueUrl": queueURL, + "MessageBody": "body", + "MessageAttributes": tc.attrs, + }) + if status != http.StatusBadRequest { + t.Fatalf("expected 400, got %d (%v)", status, out) + } + if got, _ := out["__type"].(string); got != sqsErrInvalidAttributeValue { + t.Fatalf("error type: %q want %q (%v)", got, sqsErrInvalidAttributeValue, out) + } + }) + } +} diff --git a/adapter/sqs_fifo.go b/adapter/sqs_fifo.go new file mode 100644 index 000000000..c603a8f6d --- /dev/null +++ b/adapter/sqs_fifo.go @@ -0,0 +1,305 @@ +package adapter + +import ( + "context" + "crypto/sha256" + "encoding/hex" + "strconv" + "time" + + "github.com/bootjp/elastickv/kv" + "github.com/bootjp/elastickv/store" + "github.com/cockroachdb/errors" + json "github.com/goccy/go-json" +) + +// FIFO dedup window — AWS guarantees exactly-once within 5 minutes of +// the first SendMessage that carried a given (dedup-id, queue-gen). 
+const sqsFifoDedupWindowMillis = 5 * 60 * 1000 + +// sqsFifoDedupRecord is the value persisted at !sqs|msg|dedup|... so a +// retry within the dedup window can short-circuit to the original +// message-id without writing a second copy of the body. Holding the +// original send timestamp lets the receive path drop expired records +// lazily once we add a reaper. +type sqsFifoDedupRecord struct { + MessageID string `json:"message_id"` + SendTimestampMs int64 `json:"send_timestamp_ms"` + ExpiresAtMillis int64 `json:"expires_at_millis"` + OriginalSequence uint64 `json:"original_sequence,omitempty"` +} + +func encodeFifoDedupRecord(r *sqsFifoDedupRecord) ([]byte, error) { + b, err := json.Marshal(r) + if err != nil { + return nil, errors.WithStack(err) + } + return b, nil +} + +func decodeFifoDedupRecord(b []byte) (*sqsFifoDedupRecord, error) { + var r sqsFifoDedupRecord + if err := json.Unmarshal(b, &r); err != nil { + return nil, errors.WithStack(err) + } + return &r, nil +} + +// sqsFifoGroupLock is the value persisted at !sqs|msg|group|... while a +// group has an in-flight head message. Holding the message id (rather +// than just a boolean) lets the receive path tell "I already own this +// lock" (a redelivery) apart from "another message owns it" (skip the +// whole group). +type sqsFifoGroupLock struct { + MessageID string `json:"message_id"` + AcquiredAtMs int64 `json:"acquired_at_ms"` + VisibleAtMs int64 `json:"visible_at_ms"` +} + +func encodeFifoGroupLock(l *sqsFifoGroupLock) ([]byte, error) { + b, err := json.Marshal(l) + if err != nil { + return nil, errors.WithStack(err) + } + return b, nil +} + +func decodeFifoGroupLock(b []byte) (*sqsFifoGroupLock, error) { + var l sqsFifoGroupLock + if err := json.Unmarshal(b, &l); err != nil { + return nil, errors.WithStack(err) + } + return &l, nil +} + +// resolveFifoDedupID returns the dedup-id AWS would compute for this +// send. 
ContentBasedDeduplication=true uses SHA-256 over the body +// (matching AWS exactly); otherwise the caller-supplied +// MessageDeduplicationId is used. +func resolveFifoDedupID(meta *sqsQueueMeta, in sqsSendMessageInput) string { + if in.MessageDeduplicationId != "" { + return in.MessageDeduplicationId + } + if meta.ContentBasedDedup { + sum := sha256.Sum256([]byte(in.MessageBody)) + return hex.EncodeToString(sum[:]) + } + return "" +} + +// loadFifoDedupRecord returns the dedup record at the given snapshot, +// or (nil, nil) when there is no live record for this dedup-id. +// Expired records are surfaced as nil so a stale entry does not block +// a fresh send within the same FIFO queue. +func (s *SQSServer) loadFifoDedupRecord(ctx context.Context, queueName string, gen uint64, dedupID string, readTS uint64) (*sqsFifoDedupRecord, []byte, error) { + key := sqsMsgDedupKey(queueName, gen, dedupID) + raw, err := s.store.GetAt(ctx, key, readTS) + if err != nil { + if errors.Is(err, store.ErrKeyNotFound) { + return nil, key, nil + } + return nil, key, errors.WithStack(err) + } + rec, err := decodeFifoDedupRecord(raw) + if err != nil { + return nil, key, errors.WithStack(err) + } + if rec.ExpiresAtMillis > 0 && time.Now().UnixMilli() > rec.ExpiresAtMillis { + return nil, key, nil + } + return rec, key, nil +} + +// loadFifoSequence fetches the current per-queue sequence counter at +// the given snapshot. Missing keys (fresh queue) read as zero so the +// first FIFO send observes 1. +func (s *SQSServer) loadFifoSequence(ctx context.Context, queueName string, readTS uint64) (uint64, error) { + raw, err := s.store.GetAt(ctx, sqsQueueSeqKey(queueName), readTS) + if err != nil { + if errors.Is(err, store.ErrKeyNotFound) { + return 0, nil + } + return 0, errors.WithStack(err) + } + v, err := strconv.ParseUint(string(raw), 10, 64) + if err != nil { + return 0, errors.WithStack(err) + } + return v, nil +} + +// loadFifoGroupLock fetches the in-flight lock for a group, if any. 
+// Returns nil when no lock is held. Callers that also need the key +// can recompute it via sqsMsgGroupKey — the helper used to return it +// alongside the lock, but every caller already had the key in scope +// from a different code path. +func (s *SQSServer) loadFifoGroupLock(ctx context.Context, queueName string, gen uint64, groupID string, readTS uint64) (*sqsFifoGroupLock, error) { + key := sqsMsgGroupKey(queueName, gen, groupID) + raw, err := s.store.GetAt(ctx, key, readTS) + if err != nil { + if errors.Is(err, store.ErrKeyNotFound) { + return nil, nil + } + return nil, errors.WithStack(err) + } + lock, err := decodeFifoGroupLock(raw) + if err != nil { + return nil, errors.WithStack(err) + } + return lock, nil +} + +// sendFifoMessage is the FIFO-aware analog of the OCC dispatch in +// sendMessage. It runs inside the existing retry loop and: +// +// 1. Looks up the dedup record for this (queue, gen, dedup-id). On +// hit it returns the original message-id without writing. +// 2. Loads the per-queue sequence counter and bumps it. +// 3. Writes the data + vis-index entries plus the dedup record and +// the new sequence counter, all under one OCC transaction so a +// concurrent FIFO send cannot reuse our sequence number. +// +// Returns the response payload (MessageId, MD5OfMessageBody, etc.) +// the caller should hand to the JSON encoder, and a retry hint: when +// the OCC dispatch fails with a retryable error the bool is true and +// the caller re-runs the whole pass against a fresh snapshot. +func (s *SQSServer) sendFifoMessage( + ctx context.Context, + queueName string, + meta *sqsQueueMeta, + in sqsSendMessageInput, + dedupID string, + delay int64, + readTS uint64, +) (map[string]string, bool, error) { + dedup, dedupKey, err := s.loadFifoDedupRecord(ctx, queueName, meta.Generation, dedupID, readTS) + if err != nil { + return nil, false, err + } + if dedup != nil { + // AWS semantics: dedup hit returns success with the original + // message-id, no error. 
Idempotent-by-design retries from a + // crashed-and-restarted producer keep working. + return map[string]string{ + "MessageId": dedup.MessageID, + "MD5OfMessageBody": sqsMD5Hex([]byte(in.MessageBody)), + "MD5OfMessageAttributes": md5OfAttributesHex(in.MessageAttributes), + "SequenceNumber": strconv.FormatUint(dedup.OriginalSequence, 10), + }, false, nil + } + + prevSeq, err := s.loadFifoSequence(ctx, queueName, readTS) + if err != nil { + return nil, false, err + } + nextSeq := prevSeq + 1 + + rec, _, err := buildSendRecord(meta, in, delay) + if err != nil { + return nil, false, err + } + rec.SequenceNumber = nextSeq + recordBytes, err := encodeSQSMessageRecord(rec) + if err != nil { + return nil, false, errors.WithStack(err) + } + + now := time.Now().UnixMilli() + dedupRec := &sqsFifoDedupRecord{ + MessageID: rec.MessageID, + SendTimestampMs: now, + ExpiresAtMillis: now + sqsFifoDedupWindowMillis, + OriginalSequence: nextSeq, + } + dedupBytes, err := encodeFifoDedupRecord(dedupRec) + if err != nil { + return nil, false, errors.WithStack(err) + } + + dataKey := sqsMsgDataKey(queueName, meta.Generation, rec.MessageID) + visKey := sqsMsgVisKey(queueName, meta.Generation, rec.AvailableAtMillis, rec.MessageID) + byAgeKey := sqsMsgByAgeKey(queueName, meta.Generation, rec.SendTimestampMillis, rec.MessageID) + seqKey := sqsQueueSeqKey(queueName) + metaKey := sqsQueueMetaKey(queueName) + genKey := sqsQueueGenKey(queueName) + // ReadKeys: meta + gen guard against DeleteQueue / PurgeQueue, + // dedupKey guards a concurrent send under the same dedup-id, seqKey + // guards a concurrent FIFO send taking the same sequence number. 
+ req := &kv.OperationGroup[kv.OP]{ + IsTxn: true, + StartTS: readTS, + ReadKeys: [][]byte{metaKey, genKey, dedupKey, seqKey}, + Elems: []*kv.Elem[kv.OP]{ + {Op: kv.Put, Key: dataKey, Value: recordBytes}, + {Op: kv.Put, Key: visKey, Value: []byte(rec.MessageID)}, + {Op: kv.Put, Key: byAgeKey, Value: []byte(rec.MessageID)}, + {Op: kv.Put, Key: dedupKey, Value: dedupBytes}, + {Op: kv.Put, Key: seqKey, Value: []byte(strconv.FormatUint(nextSeq, 10))}, + }, + } + if _, err := s.coordinator.Dispatch(ctx, req); err != nil { + if isRetryableTransactWriteError(err) { + return nil, true, nil + } + return nil, false, errors.WithStack(err) + } + return map[string]string{ + "MessageId": rec.MessageID, + "MD5OfMessageBody": rec.MD5OfBody, + "MD5OfMessageAttributes": md5OfAttributesHex(in.MessageAttributes), + "SequenceNumber": strconv.FormatUint(nextSeq, 10), + }, false, nil +} + +// fifoCandidateLockState classifies what a candidate's group lock +// allows the receive path to do. Centralising the three-way decision +// keeps tryDeliverCandidate readable. +type fifoCandidateLockState int + +const ( + // fifoLockSkip means the group is held by a different message; the + // candidate must be skipped without consuming the receive budget. + fifoLockSkip fifoCandidateLockState = iota + // fifoLockOwn means the group is already held by this very + // message — a redelivery after visibility expiry. Continue. + fifoLockOwn + // fifoLockAcquire means no lock exists and the receive path must + // install one as part of the OCC transaction. + fifoLockAcquire +) + +// classifyFifoGroupLock decides whether a FIFO candidate is eligible +// for delivery. Standard queues bypass the function entirely. 
+func (s *SQSServer) classifyFifoGroupLock(ctx context.Context, queueName string, gen uint64, rec *sqsMessageRecord, readTS uint64) (fifoCandidateLockState, []byte, error) { + lockKey := sqsMsgGroupKey(queueName, gen, rec.MessageGroupId) + lock, err := s.loadFifoGroupLock(ctx, queueName, gen, rec.MessageGroupId, readTS) + if err != nil { + return fifoLockSkip, lockKey, err + } + if lock == nil { + return fifoLockAcquire, lockKey, nil + } + if lock.MessageID == rec.MessageID { + return fifoLockOwn, lockKey, nil + } + return fifoLockSkip, lockKey, nil +} + +// fifoLockMutationsForReceive returns the OCC ops the receive path +// must add when it commits a FIFO delivery. The lock's VisibleAtMs is +// always rewritten so a concurrent re-acquire sees the freshest +// in-flight deadline. +func fifoLockMutationsForReceive(lockKey []byte, msgID string, newVisibleAt int64) ([]*kv.Elem[kv.OP], error) { + lock := &sqsFifoGroupLock{ + MessageID: msgID, + AcquiredAtMs: time.Now().UnixMilli(), + VisibleAtMs: newVisibleAt, + } + body, err := encodeFifoGroupLock(lock) + if err != nil { + return nil, err + } + return []*kv.Elem[kv.OP]{ + {Op: kv.Put, Key: lockKey, Value: body}, + }, nil +} diff --git a/adapter/sqs_keys.go b/adapter/sqs_keys.go index f0f402665..a80ae471a 100644 --- a/adapter/sqs_keys.go +++ b/adapter/sqs_keys.go @@ -1,7 +1,9 @@ package adapter import ( + "bytes" "encoding/base64" + "encoding/binary" "strings" "github.com/cockroachdb/errors" @@ -16,6 +18,35 @@ const ( // Bumped on DeleteQueue / PurgeQueue so keys from an older incarnation of // the same queue name cannot leak into a newly created queue. SqsQueueGenPrefix = "!sqs|queue|gen|" + // SqsQueueSeqPrefix prefixes the per-queue FIFO sequence counter. Bumped + // on every FIFO send and embedded in the message record so consumers can + // reconstruct the producer's strict total order. + SqsQueueSeqPrefix = "!sqs|queue|seq|" + // SqsMsgDedupPrefix prefixes FIFO deduplication records. 
Each entry + // stores the original message id and the dedup-window expiry; the + // receive path is unaware of these — they only gate sends. + SqsMsgDedupPrefix = "!sqs|msg|dedup|" + // SqsMsgGroupPrefix prefixes the FIFO group-lock records. The lock is + // held by at most one message per group, persists across visibility + // expiries, and is only released on DeleteMessage / DLQ redrive / + // retention expiry. + SqsMsgGroupPrefix = "!sqs|msg|group|" + // SqsMsgByAgePrefix prefixes the send-age index. Each entry is + // keyed by (queue, gen, send_timestamp, message_id) so the reaper + // can find every record whose retention deadline has elapsed with + // one bounded scan, without having to load every message body. + SqsMsgByAgePrefix = "!sqs|msg|byage|" + // SqsQueueTombstonePrefix prefixes a generation-orphan marker. + // DeleteQueue and PurgeQueue each write one (queue, gen) tombstone + // in the same OCC transaction that supersedes that generation — + // DeleteQueue tombstones the gen it removes the meta row at, and + // PurgeQueue tombstones the pre-bump gen so the reaper can find + // pre-purge orphans even if the queue is deleted before the next + // reaper tick. The reaper enumerates these markers to clean up + // orphan data / vis / byage / dedup / group keys for superseded + // generations. The tombstone is itself deleted once the reaper + // confirms no message-keyspace state remains for that (queue, gen). + SqsQueueTombstonePrefix = "!sqs|queue|tombstone|" ) func sqsQueueMetaKey(queueName string) []byte { @@ -26,6 +57,128 @@ func sqsQueueGenKey(queueName string) []byte { return []byte(SqsQueueGenPrefix + encodeSQSSegment(queueName)) } +func sqsQueueSeqKey(queueName string) []byte { + return []byte(SqsQueueSeqPrefix + encodeSQSSegment(queueName)) +} + +func sqsMsgDedupKey(queueName string, gen uint64, dedupID string) []byte { + buf := make([]byte, 0, len(SqsMsgDedupPrefix)+sqsKeyCapLarge) + buf = append(buf, SqsMsgDedupPrefix...) 
+ buf = append(buf, encodeSQSSegment(queueName)...) + buf = appendU64(buf, gen) + buf = append(buf, encodeSQSSegment(dedupID)...) + return buf +} + +func sqsMsgGroupKey(queueName string, gen uint64, groupID string) []byte { + buf := make([]byte, 0, len(SqsMsgGroupPrefix)+sqsKeyCapLarge) + buf = append(buf, SqsMsgGroupPrefix...) + buf = append(buf, encodeSQSSegment(queueName)...) + buf = appendU64(buf, gen) + buf = append(buf, encodeSQSSegment(groupID)...) + return buf +} + +func sqsQueueTombstoneKey(queueName string, gen uint64) []byte { + buf := make([]byte, 0, len(SqsQueueTombstonePrefix)+sqsKeyCapSmall) + buf = append(buf, SqsQueueTombstonePrefix...) + buf = append(buf, encodeSQSSegment(queueName)...) + buf = appendU64(buf, gen) + return buf +} + +// sqsGenerationSuffixLen is the byte length of the trailing big-endian +// uint64 generation segment in tombstone and byage keys. +const sqsGenerationSuffixLen = 8 + +// parseSqsQueueTombstoneKey reverses sqsQueueTombstoneKey. The +// generation is fixed at the last 8 bytes of the key, so the queue +// name segment is everything between the prefix and that suffix — +// no delimiter needed. +func parseSqsQueueTombstoneKey(key []byte) (queueName string, gen uint64, ok bool) { + if !bytes.HasPrefix(key, []byte(SqsQueueTombstonePrefix)) { + return "", 0, false + } + rest := key[len(SqsQueueTombstonePrefix):] + if len(rest) < sqsGenerationSuffixLen { + return "", 0, false + } + encQueue := rest[:len(rest)-sqsGenerationSuffixLen] + gen = binary.BigEndian.Uint64(rest[len(rest)-sqsGenerationSuffixLen:]) + name, err := decodeSQSSegment(string(encQueue)) + if err != nil { + return "", 0, false + } + return name, gen, true +} + +func sqsMsgByAgeKey(queueName string, gen uint64, sendTimestampMs int64, messageID string) []byte { + buf := make([]byte, 0, len(SqsMsgByAgePrefix)+sqsKeyCapLarge) + buf = append(buf, SqsMsgByAgePrefix...) + buf = append(buf, encodeSQSSegment(queueName)...) 
+ buf = appendU64(buf, gen) + buf = appendU64(buf, uint64MaxZero(sendTimestampMs)) + buf = append(buf, encodeSQSSegment(messageID)...) + return buf +} + +// sqsMsgByAgePrefixAllGenerations returns the prefix for every byage +// entry under (queue, *) — i.e. across every queue generation, alive +// and superseded. The reaper uses this to surface orphan records left +// over by PurgeQueue / DeleteQueue, which bump the generation counter +// instead of cleaning up old keys. +func sqsMsgByAgePrefixAllGenerations(queueName string) []byte { + buf := make([]byte, 0, len(SqsMsgByAgePrefix)+sqsKeyCapSmall) + buf = append(buf, SqsMsgByAgePrefix...) + buf = append(buf, encodeSQSSegment(queueName)...) + return buf +} + +// sqsMsgByAgeRecord is the parsed shape of a byage key. Generation, +// send timestamp, and message id all live in the key (the value is +// just the message id again so a missing-data scan does not have to +// open the data record). Returns ok=false when the key does not match +// the expected shape, so the reaper can skip junk without looping. +type sqsMsgByAgeRecord struct { + Generation uint64 + SendTimestampMs int64 + MessageID string +} + +// sqsByAgeKeyHeaderLen is the byte length of the (gen, ts) prefix that +// follows the queue segment in a byage key — two big-endian uint64s. 
+const sqsByAgeKeyHeaderLen = 16 + +func parseSqsMsgByAgeKey(key []byte, queueName string) (sqsMsgByAgeRecord, bool) { + expected := sqsMsgByAgePrefixAllGenerations(queueName) + if !bytes.HasPrefix(key, expected) { + return sqsMsgByAgeRecord{}, false + } + rest := key[len(expected):] + if len(rest) < sqsByAgeKeyHeaderLen { + return sqsMsgByAgeRecord{}, false + } + gen := binary.BigEndian.Uint64(rest[:8]) + tsRaw := binary.BigEndian.Uint64(rest[8:sqsByAgeKeyHeaderLen]) + msgIDEnc := string(rest[sqsByAgeKeyHeaderLen:]) + msgID, err := decodeSQSSegment(msgIDEnc) + if err != nil { + return sqsMsgByAgeRecord{}, false + } + // Wall-clock millis fits in 63 bits; the only way tsRaw exceeds + // math.MaxInt64 is if the caller wrote a key with a uint64 that + // the rest of the adapter would never produce. Treat that as + // malformed. + if tsRaw > 1<<63-1 { + return sqsMsgByAgeRecord{}, false + } + return sqsMsgByAgeRecord{ + Generation: gen, + SendTimestampMs: int64(tsRaw), + MessageID: msgID, + }, true +} + // encodeSQSSegment emits a printable, byte-ordered-unique representation of a // queue name. Base64 raw URL encoding matches the encoding the DynamoDB // adapter uses for table segments (see encodeDynamoSegment) so that operators
+type sqsMessageAttributeValue struct { + DataType string `json:"DataType"` + StringValue string `json:"StringValue,omitempty"` + BinaryValue []byte `json:"BinaryValue,omitempty"` +} + // sqsMessageRecord mirrors !sqs|msg|data|... on disk. Visibility state // (VisibleAtMillis, CurrentReceiptToken, ReceiveCount) lives here rather // than in a side-record so a single OCC transaction can rotate it. type sqsMessageRecord struct { - MessageID string `json:"message_id"` - Body []byte `json:"body"` - MD5OfBody string `json:"md5_of_body"` - MessageAttributes map[string]string `json:"message_attributes,omitempty"` - SenderID string `json:"sender_id,omitempty"` - SendTimestampMillis int64 `json:"send_timestamp_millis"` - AvailableAtMillis int64 `json:"available_at_millis"` - VisibleAtMillis int64 `json:"visible_at_millis"` - ReceiveCount int64 `json:"receive_count"` - FirstReceiveMillis int64 `json:"first_receive_millis,omitempty"` - CurrentReceiptToken []byte `json:"current_receipt_token"` - QueueGeneration uint64 `json:"queue_generation"` - MessageGroupId string `json:"message_group_id,omitempty"` - MessageDeduplicationId string `json:"message_deduplication_id,omitempty"` + MessageID string `json:"message_id"` + Body []byte `json:"body"` + MD5OfBody string `json:"md5_of_body"` + MD5OfMessageAttributes string `json:"md5_of_message_attributes,omitempty"` + MessageAttributes map[string]sqsMessageAttributeValue `json:"message_attributes,omitempty"` + SenderID string `json:"sender_id,omitempty"` + SendTimestampMillis int64 `json:"send_timestamp_millis"` + AvailableAtMillis int64 `json:"available_at_millis"` + VisibleAtMillis int64 `json:"visible_at_millis"` + ReceiveCount int64 `json:"receive_count"` + FirstReceiveMillis int64 `json:"first_receive_millis,omitempty"` + CurrentReceiptToken []byte `json:"current_receipt_token"` + QueueGeneration uint64 `json:"queue_generation"` + MessageGroupId string `json:"message_group_id,omitempty"` + MessageDeduplicationId string 
`json:"message_deduplication_id,omitempty"` + // SequenceNumber is the per-queue strict-order counter assigned at + // FIFO send time. AWS surfaces it on the SendMessage response and on + // every ReceiveMessage; ordering across messages with different + // MessageGroupId is undefined, but within a group the consumer sees + // monotonically increasing sequence numbers. + SequenceNumber uint64 `json:"sequence_number,omitempty"` + // DeadLetterSourceArn is set on records that arrived in this queue + // via DLQ redrive. AWS surfaces it on the DLQ-side ReceiveMessage so + // consumers can correlate moved messages back to their origin. + DeadLetterSourceArn string `json:"dead_letter_source_arn,omitempty"` } var storedSQSMsgPrefix = []byte{0x00, 'S', 'M', 0x01} @@ -243,19 +265,20 @@ func decodeReceiptHandle(raw string) (*decodedReceiptHandle, error) { // ------------------------ input decoding ------------------------ type sqsSendMessageInput struct { - QueueUrl string `json:"QueueUrl"` - MessageBody string `json:"MessageBody"` - DelaySeconds *int64 `json:"DelaySeconds,omitempty"` - MessageAttributes map[string]string `json:"MessageAttributes,omitempty"` - MessageGroupId string `json:"MessageGroupId,omitempty"` - MessageDeduplicationId string `json:"MessageDeduplicationId,omitempty"` + QueueUrl string `json:"QueueUrl"` + MessageBody string `json:"MessageBody"` + DelaySeconds *int64 `json:"DelaySeconds,omitempty"` + MessageAttributes map[string]sqsMessageAttributeValue `json:"MessageAttributes,omitempty"` + MessageGroupId string `json:"MessageGroupId,omitempty"` + MessageDeduplicationId string `json:"MessageDeduplicationId,omitempty"` } type sqsReceiveMessageInput struct { - QueueUrl string `json:"QueueUrl"` - MaxNumberOfMessages *int `json:"MaxNumberOfMessages,omitempty"` - VisibilityTimeout *int64 `json:"VisibilityTimeout,omitempty"` - WaitTimeSeconds *int64 `json:"WaitTimeSeconds,omitempty"` + QueueUrl string `json:"QueueUrl"` + MaxNumberOfMessages *int 
`json:"MaxNumberOfMessages,omitempty"` + VisibilityTimeout *int64 `json:"VisibilityTimeout,omitempty"` + WaitTimeSeconds *int64 `json:"WaitTimeSeconds,omitempty"` + MessageAttributeNames []string `json:"MessageAttributeNames,omitempty"` } type sqsDeleteMessageInput struct { @@ -287,17 +310,8 @@ func (s *SQSServer) sendMessage(w http.ResponseWriter, r *http.Request) { writeSQSErrorFromErr(w, apiErr) return } - // AWS SDKs verify MD5OfMessageAttributes against the canonical - // binary encoding (sorted, length-prefixed, with transport type - // byte). The Milestone-1 adapter does not yet implement that - // canonical hash, and a non-matching value would make every SDK - // SendMessage call fail with MessageAttributeMD5Mismatch. Until - // Milestone 2 ships the canonical encoder, reject sends that - // actually carry MessageAttributes so clients fail clearly at - // the caller instead of mysteriously in the SDK. - if len(in.MessageAttributes) > 0 { - writeSQSError(w, http.StatusBadRequest, sqsErrInvalidAttributeValue, - "MessageAttributes are not yet supported; omit the field until canonical MD5 lands") + if apiErr := validateMessageAttributes(in.MessageAttributes); apiErr != nil { + writeSQSErrorFromErr(w, apiErr) return } if apiErr := validateSendFIFOParams(meta, in); apiErr != nil { @@ -309,6 +323,11 @@ func (s *SQSServer) sendMessage(w http.ResponseWriter, r *http.Request) { writeSQSErrorFromErr(w, apiErr) return } + if meta.IsFIFO { + s.sendMessageFifoLoop(w, r, queueName, meta, in, delay, readTS) + return + } + rec, recordBytes, apiErr := buildSendRecord(meta, in, delay) if apiErr != nil { writeSQSErrorFromErr(w, apiErr) @@ -317,6 +336,7 @@ func (s *SQSServer) sendMessage(w http.ResponseWriter, r *http.Request) { dataKey := sqsMsgDataKey(queueName, meta.Generation, rec.MessageID) visKey := sqsMsgVisKey(queueName, meta.Generation, rec.AvailableAtMillis, rec.MessageID) + byAgeKey := sqsMsgByAgeKey(queueName, meta.Generation, rec.SendTimestampMillis, rec.MessageID) 
metaKey := sqsQueueMetaKey(queueName) genKey := sqsQueueGenKey(queueName) // StartTS + ReadKeys fence against a concurrent DeleteQueue / @@ -334,6 +354,7 @@ func (s *SQSServer) sendMessage(w http.ResponseWriter, r *http.Request) { Elems: []*kv.Elem[kv.OP]{ {Op: kv.Put, Key: dataKey, Value: recordBytes}, {Op: kv.Put, Key: visKey, Value: []byte(rec.MessageID)}, + {Op: kv.Put, Key: byAgeKey, Value: []byte(rec.MessageID)}, }, } if _, err := s.coordinator.Dispatch(r.Context(), req); err != nil { @@ -348,6 +369,21 @@ func (s *SQSServer) sendMessage(w http.ResponseWriter, r *http.Request) { }) } +// sendMessageFifoLoop runs the dedup-aware OCC send for FIFO queues +// under the standard retry budget. Stamping the dedup record + new +// sequence number happens inside one transaction so a concurrent send +// either observes the dedup hit or loses the OCC race. The actual +// retry loop and per-attempt meta / dedup / delay re-derivation live +// in runFifoSendWithRetry. +func (s *SQSServer) sendMessageFifoLoop(w http.ResponseWriter, r *http.Request, queueName string, _ *sqsQueueMeta, in sqsSendMessageInput, _ int64, _ uint64) { + resp, err := s.runFifoSendWithRetry(r.Context(), queueName, in) + if err != nil { + writeSQSErrorFromErr(w, err) + return + } + writeSQSJSON(w, resp) +} + // loadQueueMetaForSend reads the queue metadata and body-size-gates the // send. 
Returns the snapshot read timestamp alongside the metadata so // the caller can pin its OCC dispatch to it; without that fence a @@ -444,6 +480,7 @@ func buildSendRecord(meta *sqsQueueMeta, in sqsSendMessageInput, delay int64) (* MessageID: messageID, Body: body, MD5OfBody: sqsMD5Hex(body), + MD5OfMessageAttributes: md5OfAttributesHex(in.MessageAttributes), MessageAttributes: in.MessageAttributes, SendTimestampMillis: now, AvailableAtMillis: availableAt, @@ -512,7 +549,13 @@ func (s *SQSServer) receiveMessage(w http.ResponseWriter, r *http.Request) { return } - delivered, err := s.longPollReceive(ctx, queueName, max, visibilityTimeout, waitSeconds) + opts := sqsReceiveOptions{ + Max: max, + VisibilityTimeout: visibilityTimeout, + WaitSeconds: waitSeconds, + MessageAttributeNames: in.MessageAttributeNames, + } + delivered, err := s.longPollReceive(ctx, queueName, opts) if err != nil { writeSQSErrorFromErr(w, err) return @@ -520,6 +563,18 @@ func (s *SQSServer) receiveMessage(w http.ResponseWriter, r *http.Request) { writeSQSJSON(w, map[string]any{"Messages": delivered}) } +// sqsReceiveOptions bundles the per-request settings that ride down +// the receive call chain. Threading individual params through +// longPollReceive → scanAndDeliverOnce → rotateMessagesForDelivery → +// tryDeliverCandidate → commitReceiveRotation gets unwieldy fast, +// especially as new optional fields like MessageAttributeNames land. +type sqsReceiveOptions struct { + Max int + VisibilityTimeout int64 + WaitSeconds int64 + MessageAttributeNames []string +} + // resolveReceiveWaitSeconds picks the effective long-poll duration: the // per-request WaitTimeSeconds if provided, else the queue default. 
AWS // permits 0..20 and rejects anything outside with @@ -552,15 +607,15 @@ func resolveReceiveWaitSeconds(requested *int64, queueDefault int64) (int64, err // a DeleteQueue / PurgeQueue that commits during a long wait is // observed on the very next scan — otherwise we'd keep scanning // orphan keys under the old generation. -func (s *SQSServer) longPollReceive(ctx context.Context, queueName string, max int, visibilityTimeout, waitSeconds int64) ([]map[string]any, error) { - delivered, err := s.scanAndDeliverOnce(ctx, queueName, max, visibilityTimeout) +func (s *SQSServer) longPollReceive(ctx context.Context, queueName string, opts sqsReceiveOptions) ([]map[string]any, error) { + delivered, err := s.scanAndDeliverOnce(ctx, queueName, opts) if err != nil { return nil, err } - if len(delivered) > 0 || waitSeconds <= 0 { + if len(delivered) > 0 || opts.WaitSeconds <= 0 { return delivered, nil } - deadline := time.Now().Add(time.Duration(waitSeconds) * time.Second) + deadline := time.Now().Add(time.Duration(opts.WaitSeconds) * time.Second) ticker := time.NewTicker(sqsLongPollInterval) defer ticker.Stop() for { @@ -572,7 +627,7 @@ func (s *SQSServer) longPollReceive(ctx context.Context, queueName string, max i if time.Now().After(deadline) { return delivered, nil } - delivered, err = s.scanAndDeliverOnce(ctx, queueName, max, visibilityTimeout) + delivered, err = s.scanAndDeliverOnce(ctx, queueName, opts) if err != nil { return nil, err } @@ -582,14 +637,22 @@ func (s *SQSServer) longPollReceive(ctx context.Context, queueName string, max i } } -// scanAndDeliverOnce is the single-pass scan+rotate the long-poll loop +// scanAndDeliverOnce is the scan+rotate pass the long-poll loop // re-runs. Each pass takes its own snapshot so the OCC StartTS tracks // the most recent visible_at for the candidates it picked, AND each // pass re-reads queue metadata so a concurrent DeleteQueue / // PurgeQueue that bumps the generation is observed immediately. 
If // the queue has been deleted the method returns QueueDoesNotExist; // scan errors and other non-retryable failures propagate. -func (s *SQSServer) scanAndDeliverOnce(ctx context.Context, queueName string, max int, visibilityTimeout int64) ([]map[string]any, error) { +// +// Scan and rotation are interleaved: a single scan page can be +// consumed entirely by FIFO group-lock skips or DLQ redrive, leaving +// the receive caller below opts.Max with deliverable messages still +// further along in the visibility index. Looping until either +// opts.Max is reached, the index is drained, or the wall-clock budget +// elapses prevents false-empty returns under poison-message backlogs +// or hot-FIFO-group fan-in. +func (s *SQSServer) scanAndDeliverOnce(ctx context.Context, queueName string, opts sqsReceiveOptions) ([]map[string]any, error) { readTS := s.nextTxnReadTS(ctx) meta, exists, err := s.loadQueueMetaAt(ctx, queueName, readTS) if err != nil { @@ -598,11 +661,41 @@ func (s *SQSServer) scanAndDeliverOnce(ctx context.Context, queueName string, ma if !exists { return nil, newSQSAPIError(http.StatusBadRequest, sqsErrQueueDoesNotExist, "queue does not exist") } - candidates, err := s.scanVisibleMessageCandidates(ctx, queueName, meta.Generation, max*sqsReceiveScanOverfetchFactor, readTS) - if err != nil { - return nil, err + now := time.Now().UnixMilli() + start, end := sqsMsgVisScanBounds(queueName, meta.Generation, now) + pageSize := opts.Max * sqsReceiveScanOverfetchFactor + if pageSize > sqsVisScanPageLimit { + pageSize = sqsVisScanPageLimit + } + deadline := time.Now().Add(sqsVisScanWallClockBudget) + delivered := make([]map[string]any, 0, opts.Max) + for len(delivered) < opts.Max { + if time.Now().After(deadline) { + return delivered, nil + } + page, next, done, scanErr := s.scanOneVisibleMessagePage(ctx, start, end, pageSize, readTS) + if scanErr != nil { + return nil, scanErr + } + if len(page) == 0 { + return delivered, nil + } + fresh, err := 
s.rotateMessagesForDelivery(ctx, queueName, meta, page, readTS, sqsReceiveOptions{ + Max: opts.Max - len(delivered), + VisibilityTimeout: opts.VisibilityTimeout, + WaitSeconds: opts.WaitSeconds, + MessageAttributeNames: opts.MessageAttributeNames, + }) + if err != nil { + return delivered, err + } + delivered = append(delivered, fresh...) + if done { + return delivered, nil + } + start = next } - return s.rotateMessagesForDelivery(ctx, queueName, meta.Generation, candidates, visibilityTimeout, meta.MessageRetentionSeconds, max, readTS) + return delivered, nil } // resolveReceiveMaxMessages validates MaxNumberOfMessages against the @@ -631,25 +724,38 @@ type sqsMsgCandidate struct { messageID string } -func (s *SQSServer) scanVisibleMessageCandidates(ctx context.Context, queueName string, gen uint64, limit int, readTS uint64) ([]sqsMsgCandidate, error) { - if limit <= 0 { - return nil, nil - } - now := time.Now().UnixMilli() - start, end := sqsMsgVisScanBounds(queueName, gen, now) - page := limit - if page > sqsVisScanPageLimit { - page = sqsVisScanPageLimit - } - kvs, err := s.store.ScanAt(ctx, start, end, page, readTS) +// sqsVisScanWallClockBudget caps how long the scan + deliver loop may +// spend paging the visibility index. The receive path filters +// candidates after each scan page (FIFO group lock, retention expiry, +// DLQ redrive); without a wall-clock cap a queue with thousands of +// group-locked or poisoned messages ahead of one deliverable could +// pin the leader for many milliseconds. +const sqsVisScanWallClockBudget = 100 * time.Millisecond + +// scanOneVisibleMessagePage reads a single page of the visibility +// index starting at `start`, returning the parsed candidates plus the +// cursor for the next page. `done=true` means the scan range is +// drained and the caller should stop paging. 
+func (s *SQSServer) scanOneVisibleMessagePage(ctx context.Context, start, end []byte, pageSize int, readTS uint64) ([]sqsMsgCandidate, []byte, bool, error) { + kvs, err := s.store.ScanAt(ctx, start, end, pageSize, readTS) if err != nil { - return nil, errors.WithStack(err) + return nil, start, true, errors.WithStack(err) + } + if len(kvs) == 0 { + return nil, start, true, nil } out := make([]sqsMsgCandidate, 0, len(kvs)) for _, kvp := range kvs { out = append(out, sqsMsgCandidate{visKey: bytes.Clone(kvp.Key), messageID: string(kvp.Value)}) } - return out, nil + if len(kvs) < pageSize { + return out, start, true, nil + } + next := nextScanCursorAfter(kvs[len(kvs)-1].Key) + if end != nil && bytes.Compare(next, end) >= 0 { + return out, next, true, nil + } + return out, next, false, nil } // rotateMessagesForDelivery runs an OCC transaction per candidate to @@ -683,22 +789,40 @@ func (s *SQSServer) loadCandidateRecord(ctx context.Context, queueName string, g return rec, dataKey, false, nil } -// expireMessage removes a retention-expired record and its current -// visibility index entry in a single OCC transaction. On -// ErrWriteConflict (another worker raced us to delete or rotate -// this same message) we treat it as success: the message is no -// longer our responsibility either way. Any other error propagates +// expireMessage removes a retention-expired record, its current +// visibility index entry, and the byage index entry in a single OCC +// transaction. On ErrWriteConflict (another worker raced us to delete +// or rotate this same message) we treat it as success: the message is +// no longer our responsibility either way. Any other error propagates // so a coordinator / storage failure does not silently fall through // to "delivered empty", matching the receive-error policy. 
-func (s *SQSServer) expireMessage(ctx context.Context, queueName string, gen uint64, visKey, dataKey []byte, readTS uint64) error { +func (s *SQSServer) expireMessage(ctx context.Context, queueName string, gen uint64, visKey, dataKey []byte, rec *sqsMessageRecord, readTS uint64) error { + byAgeKey := sqsMsgByAgeKey(queueName, gen, rec.SendTimestampMillis, rec.MessageID) + readKeys := [][]byte{visKey, dataKey, sqsQueueMetaKey(queueName), sqsQueueGenKey(queueName)} + elems := []*kv.Elem[kv.OP]{ + {Op: kv.Del, Key: visKey}, + {Op: kv.Del, Key: dataKey}, + {Op: kv.Del, Key: byAgeKey}, + } + // FIFO retention expiry must release the group lock so a successor + // in the same group can become deliverable. This mirrors the delete + // and redrive paths. + if rec.MessageGroupId != "" { + lockKey := sqsMsgGroupKey(queueName, gen, rec.MessageGroupId) + lock, err := s.loadFifoGroupLock(ctx, queueName, gen, rec.MessageGroupId, readTS) + if err != nil { + return err + } + if lock != nil && lock.MessageID == rec.MessageID { + readKeys = append(readKeys, lockKey) + elems = append(elems, &kv.Elem[kv.OP]{Op: kv.Del, Key: lockKey}) + } + } req := &kv.OperationGroup[kv.OP]{ IsTxn: true, StartTS: readTS, - ReadKeys: [][]byte{visKey, dataKey, sqsQueueMetaKey(queueName), sqsQueueGenKey(queueName)}, - Elems: []*kv.Elem[kv.OP]{ - {Op: kv.Del, Key: visKey}, - {Op: kv.Del, Key: dataKey}, - }, + ReadKeys: readKeys, + Elems: elems, } if _, err := s.coordinator.Dispatch(ctx, req); err != nil { if isRetryableTransactWriteError(err) { @@ -706,26 +830,32 @@ func (s *SQSServer) expireMessage(ctx context.Context, queueName string, gen uin } return errors.WithStack(err) } - _ = gen // reserved for future per-queue expiry metrics return nil } func (s *SQSServer) rotateMessagesForDelivery( ctx context.Context, queueName string, - gen uint64, + meta *sqsQueueMeta, candidates []sqsMsgCandidate, - visibilityTimeout int64, - retentionSeconds int64, - max int, readTS uint64, + opts sqsReceiveOptions, ) 
 ([]map[string]any, error) { - delivered := make([]map[string]any, 0, max) + // Parse RedrivePolicy once per receive call rather than per + // candidate. The struct only changes via SetQueueAttributes / + // CreateQueue, so cross-candidate caching is safe. NOTE(review): a malformed RedrivePolicy parses to nil here and silently disables redrive — confirm that fallback is intended. + var redrive *parsedRedrivePolicy + if meta.RedrivePolicy != "" { + if p, err := parseRedrivePolicy(meta.RedrivePolicy); err == nil { + redrive = p + } + } + delivered := make([]map[string]any, 0, opts.Max) for _, cand := range candidates { - if len(delivered) >= max { + if len(delivered) >= opts.Max { break } - msg, skip, err := s.tryDeliverCandidate(ctx, queueName, gen, cand, visibilityTimeout, retentionSeconds, readTS) + msg, skip, err := s.tryDeliverCandidate(ctx, queueName, meta.Generation, cand, meta.MessageRetentionSeconds, readTS, opts, redrive) if err != nil { return delivered, err } @@ -753,9 +883,10 @@ func (s *SQSServer) tryDeliverCandidate( queueName string, gen uint64, cand sqsMsgCandidate, - visibilityTimeout int64, retentionSeconds int64, readTS uint64, + opts sqsReceiveOptions, + redrive *parsedRedrivePolicy, ) (map[string]any, bool, error) { rec, dataKey, skip, err := s.loadCandidateRecord(ctx, queueName, gen, cand, readTS) if skip || err != nil { @@ -764,7 +895,35 @@ func (s *SQSServer) tryDeliverCandidate( if expired, err := s.handleRetentionExpiry(ctx, queueName, gen, cand, dataKey, rec, retentionSeconds, readTS); expired || err != nil { return nil, expired, err } - return s.commitReceiveRotation(ctx, queueName, gen, cand, dataKey, rec, visibilityTimeout, readTS) + if shouldRedrive(rec, redrive) { + // The candidate has hit maxReceiveCount; move it to the DLQ + // inside its own OCC transaction and skip past it. The + // receive response intentionally omits redriven messages — + // AWS does the same and consumers polling the source queue + // must not observe a poison message past the limit. 
+ moved, err := s.redriveCandidateToDLQ(ctx, queueName, gen, cand, dataKey, rec, redrive, s.queueArn(queueName), readTS) + if err != nil { + return nil, false, err + } + return nil, moved, nil + } + // FIFO group lock filter: skip candidates whose group is held by + // another in-flight message. Standard queues short-circuit because + // MessageGroupId is empty. + lockState := fifoLockAcquire + var lockKey []byte + if rec.MessageGroupId != "" { + state, key, err := s.classifyFifoGroupLock(ctx, queueName, gen, rec, readTS) + if err != nil { + return nil, false, err + } + if state == fifoLockSkip { + return nil, true, nil + } + lockState = state + lockKey = key + } + return s.commitReceiveRotation(ctx, queueName, gen, cand, dataKey, rec, readTS, opts, lockKey, lockState) } // handleRetentionExpiry deletes the candidate inline when its @@ -780,21 +939,24 @@ func (s *SQSServer) handleRetentionExpiry(ctx context.Context, queueName string, if now-rec.SendTimestampMillis <= retentionSeconds*sqsMillisPerSecond { return false, nil } - if err := s.expireMessage(ctx, queueName, gen, cand.visKey, dataKey, readTS); err != nil { + if err := s.expireMessage(ctx, queueName, gen, cand.visKey, dataKey, rec, readTS); err != nil { return false, err } return true, nil } // commitReceiveRotation runs the final OCC dispatch that rotates -// receipt token + visibility index for a non-expired candidate. -func (s *SQSServer) commitReceiveRotation(ctx context.Context, queueName string, gen uint64, cand sqsMsgCandidate, dataKey []byte, rec *sqsMessageRecord, visibilityTimeout int64, readTS uint64) (map[string]any, bool, error) { +// receipt token + visibility index for a non-expired candidate. When +// the candidate carries a MessageGroupId the transaction also +// installs (or refreshes) the per-group lock so a later message in +// the same group cannot overtake it on the next receive. 
+func (s *SQSServer) commitReceiveRotation(ctx context.Context, queueName string, gen uint64, cand sqsMsgCandidate, dataKey []byte, rec *sqsMessageRecord, readTS uint64, opts sqsReceiveOptions, lockKey []byte, lockState fifoCandidateLockState) (map[string]any, bool, error) { newToken, err := newReceiptToken() if err != nil { return nil, false, err } now := time.Now().UnixMilli() - newVisibleAt := now + visibilityTimeout*sqsMillisPerSecond + newVisibleAt := now + opts.VisibilityTimeout*sqsMillisPerSecond rec.VisibleAtMillis = newVisibleAt rec.CurrentReceiptToken = newToken rec.ReceiveCount++ @@ -806,20 +968,9 @@ func (s *SQSServer) commitReceiveRotation(ctx context.Context, queueName string, return nil, false, err } newVisKey := sqsMsgVisKey(queueName, gen, newVisibleAt, cand.messageID) - // StartTS pins the OCC read snapshot to the timestamp we actually - // loaded the record at. ReadKeys cover: cand.visKey + dataKey so a - // concurrent rotation → conflict; sqsQueueMetaKey / sqsQueueGenKey - // so a concurrent DeleteQueue / PurgeQueue → conflict (DeleteQueue - // only mutates meta + generation and would otherwise slip through). 
- req := &kv.OperationGroup[kv.OP]{ - IsTxn: true, - StartTS: readTS, - ReadKeys: [][]byte{cand.visKey, dataKey, sqsQueueMetaKey(queueName), sqsQueueGenKey(queueName)}, - Elems: []*kv.Elem[kv.OP]{ - {Op: kv.Del, Key: cand.visKey}, - {Op: kv.Put, Key: newVisKey, Value: []byte(cand.messageID)}, - {Op: kv.Put, Key: dataKey, Value: recordBytes}, - }, + req, err := buildReceiveRotationOps(queueName, cand, dataKey, recordBytes, newVisKey, lockKey, lockState, newVisibleAt, readTS) + if err != nil { + return nil, false, err } if _, err := s.coordinator.Dispatch(ctx, req); err != nil { if isRetryableTransactWriteError(err) { @@ -832,17 +983,116 @@ func (s *SQSServer) commitReceiveRotation(ctx context.Context, queueName string, if err != nil { return nil, false, err } - return map[string]any{ + sysAttrs := buildReceiveSysAttributes(rec) + resp := map[string]any{ "MessageId": cand.messageID, "ReceiptHandle": handle, "Body": string(rec.Body), "MD5OfBody": rec.MD5OfBody, - "Attributes": map[string]string{ - "ApproximateReceiveCount": strconv.FormatInt(rec.ReceiveCount, 10), - "SentTimestamp": strconv.FormatInt(rec.SendTimestampMillis, 10), - "ApproximateFirstReceiveTimestamp": strconv.FormatInt(rec.FirstReceiveMillis, 10), - }, - }, false, nil + "Attributes": sysAttrs, + } + if filtered := selectMessageAttributes(rec.MessageAttributes, opts.MessageAttributeNames); len(filtered) > 0 { + resp["MessageAttributes"] = filtered + resp["MD5OfMessageAttributes"] = md5OfAttributesHex(filtered) + } + return resp, false, nil +} + +// buildReceiveRotationOps assembles the OCC OperationGroup for a +// successful receive rotation. The FIFO group lock branch is split out +// here so commitReceiveRotation stays under the cyclomatic budget. 
func buildReceiveRotationOps(
	queueName string,
	cand sqsMsgCandidate,
	dataKey []byte,
	recordBytes []byte,
	newVisKey []byte,
	lockKey []byte,
	lockState fifoCandidateLockState,
	newVisibleAt int64,
	readTS uint64,
) (*kv.OperationGroup[kv.OP], error) {
	// ReadKeys: the candidate's vis key + data key make a concurrent
	// rotation of the same message an OCC conflict; the queue meta +
	// generation keys make a concurrent DeleteQueue / PurgeQueue (which
	// only mutate those two keys) a conflict as well.
	readKeys := [][]byte{cand.visKey, dataKey, sqsQueueMetaKey(queueName), sqsQueueGenKey(queueName)}
	// The rotation itself: retire the old visibility index entry,
	// insert the new one at newVisibleAt, and persist the updated record.
	elems := []*kv.Elem[kv.OP]{
		{Op: kv.Del, Key: cand.visKey},
		{Op: kv.Put, Key: newVisKey, Value: []byte(cand.messageID)},
		{Op: kv.Put, Key: dataKey, Value: recordBytes},
	}
	if lockKey != nil {
		_ = lockState // both fifoLockOwn and fifoLockAcquire write the same shape; documented for clarity
		readKeys = append(readKeys, lockKey)
		mut, err := fifoLockMutationsForReceive(lockKey, cand.messageID, newVisibleAt)
		if err != nil {
			return nil, errors.WithStack(err)
		}
		elems = append(elems, mut...)
	}
	return &kv.OperationGroup[kv.OP]{
		IsTxn:    true,
		StartTS:  readTS, // pin OCC to the snapshot the caller loaded the record at
		ReadKeys: readKeys,
		Elems:    elems,
	}, nil
}

// buildReceiveSysAttributes flattens the message record's system
// attributes into the AWS-shaped string map. Splitting it out keeps
// commitReceiveRotation under the cyclomatic budget.
+func buildReceiveSysAttributes(rec *sqsMessageRecord) map[string]string { + sysAttrs := map[string]string{ + "ApproximateReceiveCount": strconv.FormatInt(rec.ReceiveCount, 10), + "SentTimestamp": strconv.FormatInt(rec.SendTimestampMillis, 10), + "ApproximateFirstReceiveTimestamp": strconv.FormatInt(rec.FirstReceiveMillis, 10), + } + if rec.MessageGroupId != "" { + sysAttrs["MessageGroupId"] = rec.MessageGroupId + } + if rec.MessageDeduplicationId != "" { + sysAttrs["MessageDeduplicationId"] = rec.MessageDeduplicationId + } + if rec.SequenceNumber > 0 { + sysAttrs["SequenceNumber"] = strconv.FormatUint(rec.SequenceNumber, 10) + } + if rec.DeadLetterSourceArn != "" { + sysAttrs["DeadLetterQueueSourceArn"] = rec.DeadLetterSourceArn + } + return sysAttrs +} + +// selectMessageAttributes filters the stored MessageAttributes by the +// names the caller asked for. AWS supports: +// +// - omission / empty list → return no attributes. +// - "All" or ".*" → return everything. +// - explicit list → return only those exact names. +// +// Returning a non-empty filter means the response also carries an +// MD5OfMessageAttributes computed over the *filtered* set so SDKs that +// re-verify the digest do not see a hash over attributes they did not +// receive. 
+func selectMessageAttributes(attrs map[string]sqsMessageAttributeValue, names []string) map[string]sqsMessageAttributeValue { + if len(attrs) == 0 || len(names) == 0 { + return nil + } + all := false + want := make(map[string]bool, len(names)) + for _, n := range names { + if n == "All" || n == ".*" { + all = true + break + } + want[n] = true + } + if all { + return attrs + } + out := make(map[string]sqsMessageAttributeValue, len(want)) + for name, v := range attrs { + if want[name] { + out[name] = v + } + } + return out } func (s *SQSServer) deleteMessage(w http.ResponseWriter, r *http.Request) { @@ -880,28 +1130,12 @@ func (s *SQSServer) deleteMessageWithRetry(ctx context.Context, queueName string if err != nil { return err } - switch outcome { - case sqsDeleteNoOp: + if outcome == sqsDeleteNoOp { return nil - case sqsDeleteProceed: - // fall through to commit below } - visKey := sqsMsgVisKey(queueName, handle.QueueGeneration, rec.VisibleAtMillis, rec.MessageID) - // StartTS pins OCC to the snapshot we loaded the record at, so a - // concurrent rotation that commits after our load but before a - // coordinator-assigned StartTS cannot slip past ReadKeys. - // ReadKeys also include the queue meta + generation keys so a - // concurrent DeleteQueue (which only touches those two keys) - // forces this delete to abort with ErrWriteConflict rather - // than committing against an orphan record. 
- req := &kv.OperationGroup[kv.OP]{ - IsTxn: true, - StartTS: readTS, - ReadKeys: [][]byte{dataKey, visKey, sqsQueueMetaKey(queueName), sqsQueueGenKey(queueName)}, - Elems: []*kv.Elem[kv.OP]{ - {Op: kv.Del, Key: dataKey}, - {Op: kv.Del, Key: visKey}, - }, + req, err := s.buildDeleteOps(ctx, queueName, handle, rec, dataKey, readTS) + if err != nil { + return err } if _, err := s.coordinator.Dispatch(ctx, req); err == nil { return nil @@ -916,6 +1150,37 @@ func (s *SQSServer) deleteMessageWithRetry(ctx context.Context, queueName string return newSQSAPIError(http.StatusInternalServerError, sqsErrInternalFailure, "delete message retry attempts exhausted") } +// buildDeleteOps assembles the OCC OperationGroup for a DeleteMessage +// commit. The FIFO group-lock release branch lives here so the +// retry-loop wrapper stays readable and within the cyclomatic budget. +func (s *SQSServer) buildDeleteOps(ctx context.Context, queueName string, handle *decodedReceiptHandle, rec *sqsMessageRecord, dataKey []byte, readTS uint64) (*kv.OperationGroup[kv.OP], error) { + visKey := sqsMsgVisKey(queueName, handle.QueueGeneration, rec.VisibleAtMillis, rec.MessageID) + byAgeKey := sqsMsgByAgeKey(queueName, handle.QueueGeneration, rec.SendTimestampMillis, rec.MessageID) + readKeys := [][]byte{dataKey, visKey, sqsQueueMetaKey(queueName), sqsQueueGenKey(queueName)} + elems := []*kv.Elem[kv.OP]{ + {Op: kv.Del, Key: dataKey}, + {Op: kv.Del, Key: visKey}, + {Op: kv.Del, Key: byAgeKey}, + } + if rec.MessageGroupId != "" { + lockKey := sqsMsgGroupKey(queueName, handle.QueueGeneration, rec.MessageGroupId) + lock, err := s.loadFifoGroupLock(ctx, queueName, handle.QueueGeneration, rec.MessageGroupId, readTS) + if err != nil { + return nil, err + } + if lock != nil && lock.MessageID == rec.MessageID { + readKeys = append(readKeys, lockKey) + elems = append(elems, &kv.Elem[kv.OP]{Op: kv.Del, Key: lockKey}) + } + } + return &kv.OperationGroup[kv.OP]{ + IsTxn: true, + StartTS: readTS, + ReadKeys: 
readKeys, + Elems: elems, + }, nil +} + // sqsDeleteOutcome is a ternary tag returned by loadMessageForDelete so // the caller can cleanly distinguish the AWS-idempotent no-op case from // the proceed-to-commit case without conflating them with errors. @@ -1115,26 +1380,174 @@ func sqsMD5Hex(body []byte) string { return hex.EncodeToString(sum[:]) } -// md5OfAttributesHex computes AWS's MD5 of a MessageAttributes map. The -// real AWS format canonicalizes names and types; this adapter only -// returns "" on an empty map and a simple concatenated hash otherwise -// (full canonicalization lives in a follow-up PR along with typed -// attribute values). -func md5OfAttributesHex(attrs map[string]string) string { +// md5OfAttributesHex computes the AWS-canonical MD5 over a +// MessageAttributes map. +// +// Wire format (binary, hashed in this exact order): +// +// for each name in sorted(names): +// uint32be(len(name)) + name +// uint32be(len(dataType)) + dataType +// byte(0x01) for String/Number, byte(0x02) for Binary +// for String/Number: uint32be(len(stringValue)) + stringValue +// for Binary : uint32be(len(binaryValue)) + binaryValue +// +// AWS SDKs (and `aws sqs` since CLI v2) verify this hash on +// SendMessage / SendMessageBatch responses; a non-matching value makes +// every send call fail with MessageAttributeMD5Mismatch, so the +// algorithm is part of the wire contract, not an implementation +// detail. +// AWS canonical-MD5 wire format constants. +const ( + // sqsAttributeBaseTypeBinary is the canonical name AWS expects for + // the Binary base type; suffix-extended forms ("Binary.gzipped") + // share the same type byte. + sqsAttributeBaseTypeBinary = "Binary" + // sqsAttributeTransportByteString applies to String and Number; + // sqsAttributeTransportByteBinary applies to Binary. 
+ sqsAttributeTransportByteString = byte(0x01) + sqsAttributeTransportByteBinary = byte(0x02) +) + +func md5OfAttributesHex(attrs map[string]sqsMessageAttributeValue) string { if len(attrs) == 0 { return "" } - keys := make([]string, 0, len(attrs)) + names := make([]string, 0, len(attrs)) for k := range attrs { - keys = append(keys, k) + names = append(names, k) + } + sort.Strings(names) + var buf bytes.Buffer + for _, name := range names { + v := attrs[name] + writeMD5Length(&buf, name) + buf.WriteString(name) + writeMD5Length(&buf, v.DataType) + buf.WriteString(v.DataType) + if attributeTypeIsBinary(v.DataType) { + buf.WriteByte(sqsAttributeTransportByteBinary) + writeMD5LengthBytes(&buf, v.BinaryValue) + buf.Write(v.BinaryValue) + } else { + buf.WriteByte(sqsAttributeTransportByteString) + writeMD5Length(&buf, v.StringValue) + buf.WriteString(v.StringValue) + } + } + return sqsMD5Hex(buf.Bytes()) +} + +func writeMD5Length(b *bytes.Buffer, s string) { + var lenBuf [4]byte + binary.BigEndian.PutUint32(lenBuf[:], safeUint32Len(len(s))) + b.Write(lenBuf[:]) +} + +func writeMD5LengthBytes(b *bytes.Buffer, p []byte) { + var lenBuf [4]byte + binary.BigEndian.PutUint32(lenBuf[:], safeUint32Len(len(p))) + b.Write(lenBuf[:]) +} + +// safeUint32Len narrows an int length into a uint32 with an explicit +// gate. AWS's canonical MD5 spec uses a 4-byte length prefix, so any +// payload over 4 GiB is malformed by definition; wrapping the cast +// silently would corrupt the hash, so we clamp to the max value. +func safeUint32Len(n int) uint32 { + if n < 0 { + return 0 + } + const max = int(^uint32(0)) + if n > max { + return ^uint32(0) + } + return uint32(n) +} + +// attributeTypeIsBinary returns true when the AWS DataType (which may +// carry a custom suffix after a `.`) declares a Binary payload. 
+func attributeTypeIsBinary(dataType string) bool { + base := dataType + if i := strings.Index(dataType, "."); i >= 0 { + base = dataType[:i] + } + return base == sqsAttributeBaseTypeBinary +} + +// validateMessageAttributes enforces the AWS rules a client expects to +// see: +// +// - DataType must start with String, Number, or Binary; a custom +// suffix `.` is allowed. +// - String / Number attributes carry a non-empty StringValue; Binary +// attributes carry a non-empty BinaryValue. +// - At most 10 message attributes per send call. +// +// Returning the AWS error shape early lets the SDK MD5 verification +// path stay clean: by the time we hash the map we know every entry is +// well-formed. +func validateMessageAttributes(attrs map[string]sqsMessageAttributeValue) error { + const maxAttrs = 10 + if len(attrs) > maxAttrs { + return newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "MessageAttributes is limited to 10 entries per call") + } + for name, v := range attrs { + if err := validateOneMessageAttribute(name, v); err != nil { + return err + } + } + return nil +} + +func validateOneMessageAttribute(name string, v sqsMessageAttributeValue) error { + if name == "" { + return newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "MessageAttribute name must be non-empty") } - sort.Strings(keys) - var b strings.Builder - for _, k := range keys { - b.WriteString(k) - b.WriteString("=") - b.WriteString(attrs[k]) - b.WriteString(";") + if v.DataType == "" { + return newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "MessageAttribute "+name+" missing DataType") } - return sqsMD5Hex([]byte(b.String())) + base := v.DataType + if i := strings.Index(v.DataType, "."); i >= 0 { + base = v.DataType[:i] + } + return validateMessageAttributeValuePair(name, base, v) +} + +// validateMessageAttributeValuePair enforces "exactly one value field +// populated, matching the DataType" on a MessageAttributeValue. 
AWS +// rejects an attribute that carries both StringValue and BinaryValue +// (or that carries the wrong one for its DataType); without these +// guards a malformed client could persist bytes into the record that +// then round-trip on ReceiveMessage, producing mismatched MD5 hashes +// downstream. Pulled out of validateOneMessageAttribute so that +// function stays under the cyclop budget. +func validateMessageAttributeValuePair(name, base string, v sqsMessageAttributeValue) error { + switch base { + case "String", "Number": + if v.StringValue == "" { + return newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "MessageAttribute "+name+" requires StringValue") + } + if len(v.BinaryValue) > 0 { + return newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "MessageAttribute "+name+" must not include BinaryValue for "+base+" type") + } + case sqsAttributeBaseTypeBinary: + if len(v.BinaryValue) == 0 { + return newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "MessageAttribute "+name+" requires BinaryValue") + } + if v.StringValue != "" { + return newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "MessageAttribute "+name+" must not include StringValue for Binary type") + } + default: + return newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "MessageAttribute "+name+" has unsupported DataType "+v.DataType) + } + return nil } diff --git a/adapter/sqs_messages_batch.go b/adapter/sqs_messages_batch.go new file mode 100644 index 000000000..b8adca271 --- /dev/null +++ b/adapter/sqs_messages_batch.go @@ -0,0 +1,679 @@ +package adapter + +import ( + "context" + "net/http" + "regexp" + "time" + + "github.com/bootjp/elastickv/kv" + "github.com/cockroachdb/errors" +) + +// sqsBatchEntryIdPattern is AWS's allowed character set for the +// per-entry Id of any batch operation: 1-80 chars, alphanumeric +// plus `-` and `_`. Anything else returns InvalidBatchEntryId. 
var sqsBatchEntryIDPattern = regexp.MustCompile(`^[a-zA-Z0-9_-]{1,80}$`)

// AWS-documented per-batch limits.
const (
	sqsBatchMaxEntries = 10
	// sqsBatchMaxTotalPayloadBytes mirrors AWS's 256 KiB total cap on
	// SendMessageBatch (the cap is on the sum of message bodies, not
	// the encoded request). Enforcing it adapter-side keeps a noisy
	// producer from blowing past MaximumMessageSize by spreading a big
	// payload across many entries.
	sqsBatchMaxTotalPayloadBytes = 262144
)

// AWS error codes specific to batch operations.
const (
	sqsErrEmptyBatchRequest            = "AWS.SimpleQueueService.EmptyBatchRequest"
	sqsErrBatchEntryIdsNotDistinct     = "AWS.SimpleQueueService.BatchEntryIdsNotDistinct"
	sqsErrTooManyEntriesInBatchRequest = "AWS.SimpleQueueService.TooManyEntriesInBatchRequest"
	sqsErrInvalidBatchEntryId          = "AWS.SimpleQueueService.InvalidBatchEntryId"
	sqsErrBatchRequestTooLong          = "AWS.SimpleQueueService.BatchRequestTooLong"
)

// ------------------------ SendMessageBatch ------------------------

// sqsSendMessageBatchInput is the decoded JSON request body of a
// SendMessageBatch call.
type sqsSendMessageBatchInput struct {
	QueueUrl string                          `json:"QueueUrl"`
	Entries  []sqsSendMessageBatchEntryInput `json:"Entries"`
}

// sqsSendMessageBatchEntryInput is one entry of a SendMessageBatch
// request; it mirrors the parameters of a single SendMessage plus the
// per-entry Id used to correlate results.
type sqsSendMessageBatchEntryInput struct {
	Id                     string                              `json:"Id"`
	MessageBody            string                              `json:"MessageBody"`
	DelaySeconds           *int64                              `json:"DelaySeconds,omitempty"`
	MessageAttributes      map[string]sqsMessageAttributeValue `json:"MessageAttributes,omitempty"`
	MessageGroupId         string                              `json:"MessageGroupId,omitempty"`
	MessageDeduplicationId string                              `json:"MessageDeduplicationId,omitempty"`
}

// sqsBatchResultErrorEntry is the AWS-shaped Failed[] element shared by
// all batch operations.
type sqsBatchResultErrorEntry struct {
	Id          string `json:"Id"`
	Code        string `json:"Code"`
	Message     string `json:"Message"`
	SenderFault bool   `json:"SenderFault"`
}

// sqsSendMessageBatchResultEntry is the AWS-shaped Successful[] element
// of a SendMessageBatch response.
type sqsSendMessageBatchResultEntry struct {
	Id                     string `json:"Id"`
	MessageId              string `json:"MessageId"`
	MD5OfMessageBody       string `json:"MD5OfMessageBody"`
	MD5OfMessageAttributes string `json:"MD5OfMessageAttributes,omitempty"`
	// SequenceNumber is non-empty only on FIFO queues, matching AWS's
	// shape. Standard-queue sends omit the field.
	SequenceNumber string `json:"SequenceNumber,omitempty"`
}

// sendMessageBatch handles the SendMessageBatch target: request-level
// shape and size validation happens here; per-entry validation and the
// OCC commit happen in sendMessageBatchWithRetry.
func (s *SQSServer) sendMessageBatch(w http.ResponseWriter, r *http.Request) {
	var in sqsSendMessageBatchInput
	if err := decodeSQSJSONInput(r, &in); err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	queueName, err := queueNameFromURL(in.QueueUrl)
	if err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	if err := validateBatchEntryShape(len(in.Entries), batchEntryIDs(in.Entries)); err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	// Total-payload-size gate is request-level, not per-entry: silently
	// accepting an oversized batch would let one producer push tens of
	// MiB through a single call and DoS the leader's Raft pipeline.
	// MessageAttributes contribute to the size — without them in the
	// total a client could ship tiny bodies plus a few-MiB BinaryValue
	// per entry and bypass the cap.
	if total := totalBatchPayloadBytes(in.Entries); total > sqsBatchMaxTotalPayloadBytes {
		writeSQSError(w, http.StatusBadRequest, sqsErrBatchRequestTooLong,
			"total batch payload exceeds 262144 bytes")
		return
	}

	successful, failed, err := s.sendMessageBatchWithRetry(r.Context(), queueName, in.Entries)
	if err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	resp := map[string]any{
		"Successful": successful,
		"Failed":     failed,
	}
	writeSQSJSON(w, resp)
}

// sendMessageBatchWithRetry pre-validates every entry, splits them into
// "will-attempt" and "rejected before storage", and runs one OCC
// transaction over the will-attempt set. On ErrWriteConflict the whole
// transaction (and the validation pass that fed it, since the OCC
// snapshot is shared) is retried — that way a concurrent DeleteQueue
// or PurgeQueue is observed before we re-commit.
+func (s *SQSServer) sendMessageBatchWithRetry( + ctx context.Context, + queueName string, + entries []sqsSendMessageBatchEntryInput, +) ([]sqsSendMessageBatchResultEntry, []sqsBatchResultErrorEntry, error) { + backoff := transactRetryInitialBackoff + deadline := time.Now().Add(transactRetryMaxDuration) + for range transactRetryMaxAttempts { + successful, failed, retry, err := s.trySendMessageBatchOnce(ctx, queueName, entries) + if err != nil { + return nil, nil, err + } + if !retry { + return successful, failed, nil + } + if err := waitRetryWithDeadline(ctx, deadline, backoff); err != nil { + return nil, nil, errors.WithStack(err) + } + backoff = nextTransactRetryBackoff(backoff) + } + return nil, nil, newSQSAPIError(http.StatusInternalServerError, sqsErrInternalFailure, "send message batch retry attempts exhausted") +} + +// trySendMessageBatchOnce runs one snapshot read + per-entry validate + +// dispatch pass. retry=true means OCC saw a write conflict and the +// caller should re-run; retry=false means we have a final response. +// +// FIFO queues take a slow per-entry path because the dedup record and +// per-queue sequence counter both have to be inspected and mutated +// inside the same OCC transaction as the data write — bundling all +// entries into a single batch transaction would either skip the +// dedup check (allowing duplicate-id sends to land twice in the +// queue) or assign the same sequence number to every entry, both of +// which violate AWS's FIFO contract. 
func (s *SQSServer) trySendMessageBatchOnce(
	ctx context.Context,
	queueName string,
	entries []sqsSendMessageBatchEntryInput,
) ([]sqsSendMessageBatchResultEntry, []sqsBatchResultErrorEntry, bool, error) {
	readTS := s.nextTxnReadTS(ctx)
	meta, exists, err := s.loadQueueMetaAt(ctx, queueName, readTS)
	if err != nil {
		return nil, nil, false, errors.WithStack(err)
	}
	if !exists {
		// Missing queue is a request-level error, never a per-entry one.
		return nil, nil, false, newSQSAPIError(http.StatusBadRequest, sqsErrQueueDoesNotExist, "queue does not exist")
	}
	if meta.IsFIFO {
		return s.sendBatchFifoEntries(ctx, queueName, meta, entries)
	}
	return s.sendBatchStandardOnce(ctx, queueName, meta, entries, readTS)
}

// sendBatchStandardOnce is the original single-OCC fast path for
// Standard queues: every entry that survives validation is bundled
// into one Dispatch.
func (s *SQSServer) sendBatchStandardOnce(
	ctx context.Context,
	queueName string,
	meta *sqsQueueMeta,
	entries []sqsSendMessageBatchEntryInput,
	readTS uint64,
) ([]sqsSendMessageBatchResultEntry, []sqsBatchResultErrorEntry, bool, error) {
	successful := make([]sqsSendMessageBatchResultEntry, 0, len(entries))
	failed := make([]sqsBatchResultErrorEntry, 0)
	// Each entry produces three OCC ops: data, vis, byage. Pre-sizing
	// the slice avoids a couple of grow operations in the batch hot
	// path; oversizing is fine, undersizing is what we are gating
	// against.
	const opsPerEntry = 3
	elems := make([]*kv.Elem[kv.OP], 0, opsPerEntry*len(entries))
	for _, entry := range entries {
		rec, recordBytes, apiErr := buildBatchSendRecord(meta, entry)
		if apiErr != nil {
			// Rejected before storage: record it in Failed[] and keep
			// processing the remaining entries.
			failed = append(failed, batchErrorEntryFromAPIErr(entry.Id, apiErr))
			continue
		}
		dataKey := sqsMsgDataKey(queueName, meta.Generation, rec.MessageID)
		visKey := sqsMsgVisKey(queueName, meta.Generation, rec.AvailableAtMillis, rec.MessageID)
		byAgeKey := sqsMsgByAgeKey(queueName, meta.Generation, rec.SendTimestampMillis, rec.MessageID)
		elems = append(elems,
			&kv.Elem[kv.OP]{Op: kv.Put, Key: dataKey, Value: recordBytes},
			&kv.Elem[kv.OP]{Op: kv.Put, Key: visKey, Value: []byte(rec.MessageID)},
			&kv.Elem[kv.OP]{Op: kv.Put, Key: byAgeKey, Value: []byte(rec.MessageID)},
		)
		successful = append(successful, sqsSendMessageBatchResultEntry{
			Id:                     entry.Id,
			MessageId:              rec.MessageID,
			MD5OfMessageBody:       rec.MD5OfBody,
			MD5OfMessageAttributes: md5OfAttributesHex(entry.MessageAttributes),
		})
	}
	if len(elems) == 0 {
		// Every entry was rejected before storage; nothing to commit.
		return successful, failed, false, nil
	}
	// ReadKeys on queue meta + generation make a concurrent
	// DeleteQueue / PurgeQueue an OCC conflict rather than a commit
	// against an orphan queue.
	req := &kv.OperationGroup[kv.OP]{
		IsTxn:    true,
		StartTS:  readTS,
		ReadKeys: [][]byte{sqsQueueMetaKey(queueName), sqsQueueGenKey(queueName)},
		Elems:    elems,
	}
	if _, err := s.coordinator.Dispatch(ctx, req); err != nil {
		if isRetryableTransactWriteError(err) {
			return nil, nil, true, nil
		}
		return nil, nil, false, errors.WithStack(err)
	}
	return successful, failed, false, nil
}

// sendBatchFifoEntries dispatches FIFO batch entries one at a time
// through the same per-message OCC path used by single-message FIFO
// sends. Per-entry isolation lets us:
//
//   - read and bump the per-queue sequence counter once per entry,
//     handing each successful send a strictly-increasing
//     SequenceNumber;
//   - check + write the dedup record per entry, so a batch that
//     repeats the same MessageDeduplicationId behaves the same as
//     two single sends with the same id (idempotent);
//   - report per-entry failures (validation, FIFO param errors,
//     OCC conflicts that exceed the inner retry budget) without
//     poisoning successful entries.
//
// We never need the outer batch retry loop here because each entry
// already carries its own retry budget through sendMessageFifoLoop's
// counterpart, sendFifoMessage's reply contract.
func (s *SQSServer) sendBatchFifoEntries(
	ctx context.Context,
	queueName string,
	meta *sqsQueueMeta,
	entries []sqsSendMessageBatchEntryInput,
) ([]sqsSendMessageBatchResultEntry, []sqsBatchResultErrorEntry, bool, error) {
	successful := make([]sqsSendMessageBatchResultEntry, 0, len(entries))
	failed := make([]sqsBatchResultErrorEntry, 0)
	for _, entry := range entries {
		ok, success, errEntry := s.sendOneFifoBatchEntry(ctx, queueName, meta, entry)
		if !ok {
			failed = append(failed, errEntry)
			continue
		}
		successful = append(successful, success)
	}
	// Per-entry retries already happened inside sendOneFifoBatchEntry;
	// we never ask the outer batch loop to retry the whole pass.
	return successful, failed, false, nil
}

// sendOneFifoBatchEntry validates a single FIFO batch entry and runs
// the dedup-aware OCC send under its own retry budget. Returns
// ok=true with the success payload on a successful send (including
// dedup hits, which AWS reports as success); ok=false with a populated
// error entry otherwise.
func (s *SQSServer) sendOneFifoBatchEntry(
	ctx context.Context,
	queueName string,
	_ *sqsQueueMeta,
	entry sqsSendMessageBatchEntryInput,
) (bool, sqsSendMessageBatchResultEntry, sqsBatchResultErrorEntry) {
	// Only meta-independent shape checks live here. Anything that
	// reads queue metadata (MaximumMessageSize, FIFO flag, content-
	// based dedup) is re-evaluated inside runFifoSendWithRetry per
	// attempt, so a SetQueueAttributes commit racing this batch
	// cannot fail an entry that the per-attempt path would accept.
	if apiErr := validateMessageAttributes(entry.MessageAttributes); apiErr != nil {
		return false, sqsSendMessageBatchResultEntry{}, batchErrorEntryFromAPIErr(entry.Id, apiErr)
	}
	if len(entry.MessageBody) == 0 {
		return false, sqsSendMessageBatchResultEntry{}, batchErrorEntryFromAPIErr(entry.Id,
			newSQSAPIError(http.StatusBadRequest, sqsErrValidation, "MessageBody is required"))
	}
	// Re-shape the batch entry as a single SendMessage input so the
	// FIFO send path is shared byte-for-byte with the single-message API.
	asSingle := sqsSendMessageInput{
		MessageBody:            entry.MessageBody,
		DelaySeconds:           entry.DelaySeconds,
		MessageAttributes:      entry.MessageAttributes,
		MessageGroupId:         entry.MessageGroupId,
		MessageDeduplicationId: entry.MessageDeduplicationId,
	}

	resp, err := s.runFifoSendWithRetry(ctx, queueName, asSingle)
	if err != nil {
		return false, sqsSendMessageBatchResultEntry{}, batchErrorEntryFromAPIErr(entry.Id, err)
	}
	return true, sqsSendMessageBatchResultEntry{
		Id:                     entry.Id,
		MessageId:              resp["MessageId"],
		MD5OfMessageBody:       resp["MD5OfMessageBody"],
		MD5OfMessageAttributes: resp["MD5OfMessageAttributes"],
		SequenceNumber:         resp["SequenceNumber"],
	}, sqsBatchResultErrorEntry{}
}

// runFifoSendWithRetry is the entry-loop counterpart of
// sendMessageFifoLoop. It exists separately so the batch path can
// surface per-entry errors as Failed[] entries rather than as a
// whole-call failure.
//
// Each attempt — including the first — re-loads queue metadata at the
// same readTS used for the OCC dispatch *and* re-derives the FIFO
// dedup id and effective delay from that fresh meta. Without that,
// attempt N would pair a fresh readTS with stale FIFO rules — if
// SetQueueAttributes flipped ContentBasedDeduplication or rotated
// DelaySeconds between the original meta read and the chosen retry
// snapshot, the send could commit with the previous generation's
// rules. Re-deriving per attempt guarantees the (meta, readTS,
// dedupID, delay) tuple is coherent.
func (s *SQSServer) runFifoSendWithRetry(
	ctx context.Context,
	queueName string,
	in sqsSendMessageInput,
) (map[string]string, error) {
	backoff := transactRetryInitialBackoff
	deadline := time.Now().Add(transactRetryMaxDuration)
	for range transactRetryMaxAttempts {
		readTS := s.nextTxnReadTS(ctx)
		meta, dedupID, delay, err := s.resolveFreshFifoSnapshot(ctx, queueName, in, readTS)
		if err != nil {
			return nil, err
		}
		resp, retry, err := s.sendFifoMessage(ctx, queueName, meta, in, dedupID, delay, readTS)
		if err != nil {
			return nil, err
		}
		if !retry {
			return resp, nil
		}
		if err := waitRetryWithDeadline(ctx, deadline, backoff); err != nil {
			return nil, errors.WithStack(err)
		}
		backoff = nextTransactRetryBackoff(backoff)
	}
	return nil, newSQSAPIError(http.StatusInternalServerError, sqsErrInternalFailure, "FIFO send retry attempts exhausted")
}

// resolveFreshFifoSnapshot loads queue meta at readTS and re-derives
// every meta-dependent value (size cap, FIFO params, dedup id,
// effective delay). Pulled out of runFifoSendWithRetry so the retry
// loop stays under the cyclomatic budget.
func (s *SQSServer) resolveFreshFifoSnapshot(ctx context.Context, queueName string, in sqsSendMessageInput, readTS uint64) (*sqsQueueMeta, string, int64, error) {
	meta, exists, err := s.loadQueueMetaAt(ctx, queueName, readTS)
	if err != nil {
		return nil, "", 0, err
	}
	if !exists {
		return nil, "", 0, newSQSAPIError(http.StatusBadRequest, sqsErrQueueDoesNotExist, "queue does not exist")
	}
	if int64(len(in.MessageBody)) > meta.MaximumMessageSize {
		return nil, "", 0, newSQSAPIError(http.StatusBadRequest, sqsErrMessageTooLong, "message body exceeds MaximumMessageSize")
	}
	if err := validateSendFIFOParams(meta, in); err != nil {
		return nil, "", 0, err
	}
	dedupID := resolveFifoDedupID(meta, in)
	if dedupID == "" {
		return nil, "", 0, newSQSAPIError(http.StatusBadRequest, sqsErrMissingParameter,
			"FIFO send requires MessageDeduplicationId or ContentBasedDeduplication=true")
	}
	delay, err := resolveSendDelay(meta, in.DelaySeconds)
	if err != nil {
		return nil, "", 0, err
	}
	return meta, dedupID, delay, nil
}

// buildBatchSendRecord runs every per-entry validation a single
// SendMessage would, but returns the *sqsAPIError so the batch path
// can drop the entry into Failed[] instead of failing the whole
// request.
func buildBatchSendRecord(meta *sqsQueueMeta, entry sqsSendMessageBatchEntryInput) (*sqsMessageRecord, []byte, error) {
	if len(entry.MessageBody) == 0 {
		return nil, nil, newSQSAPIError(http.StatusBadRequest, sqsErrValidation, "MessageBody is required")
	}
	if int64(len(entry.MessageBody)) > meta.MaximumMessageSize {
		return nil, nil, newSQSAPIError(http.StatusBadRequest, sqsErrMessageTooLong, "message body exceeds MaximumMessageSize")
	}
	if err := validateMessageAttributes(entry.MessageAttributes); err != nil {
		return nil, nil, err
	}
	// Re-shape the batch entry as a single SendMessage input so the
	// shared validators and record builder see the same struct either way.
	asSingle := sqsSendMessageInput{
		MessageBody:            entry.MessageBody,
		DelaySeconds:           entry.DelaySeconds,
		MessageAttributes:      entry.MessageAttributes,
		MessageGroupId:         entry.MessageGroupId,
		MessageDeduplicationId: entry.MessageDeduplicationId,
	}
	if err := validateSendFIFOParams(meta, asSingle); err != nil {
		return nil, nil, err
	}
	delay, err := resolveSendDelay(meta, entry.DelaySeconds)
	if err != nil {
		return nil, nil, err
	}
	return buildSendRecord(meta, asSingle, delay)
}

// ------------------------ DeleteMessageBatch ------------------------

// sqsDeleteMessageBatchInput is the decoded JSON request body of a
// DeleteMessageBatch call.
type sqsDeleteMessageBatchInput struct {
	QueueUrl string                            `json:"QueueUrl"`
	Entries  []sqsDeleteMessageBatchEntryInput `json:"Entries"`
}

// sqsDeleteMessageBatchEntryInput is one entry of a DeleteMessageBatch
// request.
type sqsDeleteMessageBatchEntryInput struct {
	Id            string `json:"Id"`
	ReceiptHandle string `json:"ReceiptHandle"`
}

// sqsBatchResultEntry is the minimal Successful[] element used by the
// batch operations that report only the entry Id.
type sqsBatchResultEntry struct {
	Id string `json:"Id"`
}

// deleteMessageBatch handles the DeleteMessageBatch target. Request-
// level checks (shape, queue existence) fail the whole call; everything
// per-entry lands in Successful[]/Failed[].
func (s *SQSServer) deleteMessageBatch(w http.ResponseWriter, r *http.Request) {
	var in sqsDeleteMessageBatchInput
	if err := decodeSQSJSONInput(r, &in); err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	queueName, err := queueNameFromURL(in.QueueUrl)
	if err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	ids := make([]string, 0, len(in.Entries))
	for _, e := range in.Entries {
		ids = append(ids, e.Id)
	}
	if err := validateBatchEntryShape(len(in.Entries), ids); err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	if err := s.requireQueueExists(r.Context(), queueName); err != nil {
		// AWS classes a missing queue as a request-level error
		// (HTTP 400 QueueDoesNotExist) on batch APIs, not a per-
		// entry failure inside an HTTP-200 envelope. Returning per-
		// entry would let SDK retry logic mistake a hard queue-level
		// failure for a partial-success batch and keep retrying.
		writeSQSErrorFromErr(w, err)
		return
	}

	successful := make([]sqsBatchResultEntry, 0, len(in.Entries))
	failed := make([]sqsBatchResultErrorEntry, 0)
	for _, entry := range in.Entries {
		// Each entry decodes its own handle and runs through the same
		// retry-bound stale-is-success delete that single DeleteMessage
		// uses. Per-entry isolation matches AWS, where a malformed
		// handle in slot 3 must not poison slot 4.
		handle, decodeErr := decodeReceiptHandle(entry.ReceiptHandle)
		if decodeErr != nil {
			failed = append(failed, sqsBatchResultErrorEntry{
				Id:          entry.Id,
				Code:        sqsErrReceiptHandleInvalid,
				Message:     "receipt handle is not parseable",
				SenderFault: true,
			})
			continue
		}
		if err := s.deleteMessageWithRetry(r.Context(), queueName, handle); err != nil {
			failed = append(failed, batchErrorEntryFromErr(entry.Id, err))
			continue
		}
		successful = append(successful, sqsBatchResultEntry{Id: entry.Id})
	}
	writeSQSJSON(w, map[string]any{
		"Successful": successful,
		"Failed":     failed,
	})
}

// ------------------------ ChangeMessageVisibilityBatch ------------------------

// sqsChangeVisBatchInput is the decoded JSON request body of a
// ChangeMessageVisibilityBatch call.
type sqsChangeVisBatchInput struct {
	QueueUrl string                       `json:"QueueUrl"`
	Entries  []sqsChangeVisBatchEntryInput `json:"Entries"`
}

// sqsChangeVisBatchEntryInput is one entry of a
// ChangeMessageVisibilityBatch request. VisibilityTimeout is a pointer
// so a missing field is distinguishable from an explicit zero.
type sqsChangeVisBatchEntryInput struct {
	Id                string `json:"Id"`
	ReceiptHandle     string `json:"ReceiptHandle"`
	VisibilityTimeout *int64 `json:"VisibilityTimeout"`
}

// changeMessageVisibilityBatch handles the ChangeMessageVisibilityBatch
// target, mirroring deleteMessageBatch's request-level vs per-entry
// error split.
func (s *SQSServer) changeMessageVisibilityBatch(w http.ResponseWriter, r *http.Request) {
	var in sqsChangeVisBatchInput
	if err := decodeSQSJSONInput(r, &in); err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	queueName, err := queueNameFromURL(in.QueueUrl)
	if err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	ids := make([]string, 0, len(in.Entries))
	for _, e := range in.Entries {
		ids = append(ids, e.Id)
	}
	if err := validateBatchEntryShape(len(in.Entries), ids); err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	if err := s.requireQueueExists(r.Context(), queueName); err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}

	successful := make([]sqsBatchResultEntry, 0, len(in.Entries))
	failed := make([]sqsBatchResultErrorEntry, 0)
	for _, entry := range in.Entries {
		ok, errEntry := s.applyChangeVisibilityBatchEntry(r.Context(), queueName, entry)
		if !ok {
			failed = append(failed, errEntry)
			continue
		}
		successful = append(successful, sqsBatchResultEntry{Id: entry.Id})
	}
	writeSQSJSON(w, map[string]any{
		"Successful": successful,
		"Failed":     failed,
	})
}

// applyChangeVisibilityBatchEntry runs the per-entry validate-and-commit
// flow for a single ChangeMessageVisibilityBatch entry. Returns false
// with a populated error entry when validation or the OCC commit fails;
// returns true when the change was applied.
+func (s *SQSServer) applyChangeVisibilityBatchEntry(ctx context.Context, queueName string, entry sqsChangeVisBatchEntryInput) (bool, sqsBatchResultErrorEntry) { + if entry.VisibilityTimeout == nil { + return false, sqsBatchResultErrorEntry{ + Id: entry.Id, + Code: sqsErrMissingParameter, + Message: "VisibilityTimeout is required", + SenderFault: true, + } + } + timeout := *entry.VisibilityTimeout + if timeout < 0 || timeout > sqsChangeVisibilityMaxSeconds { + return false, sqsBatchResultErrorEntry{ + Id: entry.Id, + Code: sqsErrInvalidAttributeValue, + Message: "VisibilityTimeout out of range", + SenderFault: true, + } + } + handle, decodeErr := decodeReceiptHandle(entry.ReceiptHandle) + if decodeErr != nil { + return false, sqsBatchResultErrorEntry{ + Id: entry.Id, + Code: sqsErrReceiptHandleInvalid, + Message: "receipt handle is not parseable", + SenderFault: true, + } + } + if err := s.changeVisibilityWithRetry(ctx, queueName, handle, timeout); err != nil { + return false, batchErrorEntryFromErr(entry.Id, err) + } + return true, sqsBatchResultErrorEntry{} +} + +// ------------------------ batch helpers ------------------------ + +// validateBatchEntryShape enforces the request-level invariants that AWS +// applies before any per-entry processing: at least one entry, no more +// than 10, and unique non-empty Ids. These are different error codes +// from per-entry InvalidParameterValue, so callers can distinguish a +// malformed request from a partial-failure response. 
+func validateBatchEntryShape(count int, ids []string) error { + if count == 0 { + return newSQSAPIError(http.StatusBadRequest, sqsErrEmptyBatchRequest, "Entries is required and non-empty") + } + if count > sqsBatchMaxEntries { + return newSQSAPIError(http.StatusBadRequest, sqsErrTooManyEntriesInBatchRequest, + "a batch request supports up to 10 entries") + } + seen := make(map[string]bool, count) + for _, id := range ids { + if id == "" { + return newSQSAPIError(http.StatusBadRequest, sqsErrInvalidBatchEntryId, + "every batch entry requires a non-empty Id") + } + // AWS limits batch entry Ids to 1-80 alphanumeric + `-` / `_`. + // Without this check, malformed Ids (e.g. arbitrary user + // strings, whitespace, multi-byte unicode) would pass through + // to per-entry processing instead of returning the documented + // InvalidBatchEntryId error. + if !sqsBatchEntryIDPattern.MatchString(id) { + return newSQSAPIError(http.StatusBadRequest, sqsErrInvalidBatchEntryId, + "batch entry Id must be 1-80 chars of alphanumeric, hyphen, or underscore") + } + if seen[id] { + return newSQSAPIError(http.StatusBadRequest, sqsErrBatchEntryIdsNotDistinct, + "batch entry Ids must be distinct") + } + seen[id] = true + } + return nil +} + +func batchEntryIDs(entries []sqsSendMessageBatchEntryInput) []string { + out := make([]string, 0, len(entries)) + for _, e := range entries { + out = append(out, e.Id) + } + return out +} + +// requireQueueExists returns a request-level QueueDoesNotExist error +// when the queue's meta record is gone. Batch DeleteMessage / +// ChangeMessageVisibility use this as an upfront gate so callers see +// the documented top-level error, not per-entry failures inside a +// 200-envelope that retry logic can misclassify. 
+func (s *SQSServer) requireQueueExists(ctx context.Context, queueName string) error { + _, exists, err := s.loadQueueMetaAt(ctx, queueName, s.nextTxnReadTS(ctx)) + if err != nil { + return errors.WithStack(err) + } + if !exists { + return newSQSAPIError(http.StatusBadRequest, sqsErrQueueDoesNotExist, "queue does not exist") + } + return nil +} + +// totalBatchPayloadBytes sums the message-body length and every +// MessageAttribute (name + DataType + value) length across a batch. +// Both fields count toward AWS's 256 KiB request cap; counting only +// MessageBody would let a client stuff several MiB into a single +// BinaryValue while passing the size gate. +func totalBatchPayloadBytes(entries []sqsSendMessageBatchEntryInput) int { + total := 0 + for _, e := range entries { + total += len(e.MessageBody) + for name, v := range e.MessageAttributes { + total += len(name) + len(v.DataType) + len(v.StringValue) + len(v.BinaryValue) + } + } + return total +} + +func batchErrorEntryFromAPIErr(id string, err error) sqsBatchResultErrorEntry { + var apiErr *sqsAPIError + if errors.As(err, &apiErr) { + return sqsBatchResultErrorEntry{ + Id: id, + Code: apiErr.errorType, + Message: apiErr.message, + SenderFault: apiErr.status >= 400 && apiErr.status < 500, + } + } + return sqsBatchResultErrorEntry{ + Id: id, + Code: sqsErrInternalFailure, + Message: "internal error", + SenderFault: false, + } +} + +// batchErrorEntryFromErr is the per-entry counterpart for paths that +// already use an error result type — DeleteMessage / ChangeMessageVisibility +// can return either an *sqsAPIError or a wrapped store error, and we want +// the same body shape either way. 
+func batchErrorEntryFromErr(id string, err error) sqsBatchResultErrorEntry { + return batchErrorEntryFromAPIErr(id, err) +} diff --git a/adapter/sqs_purge.go b/adapter/sqs_purge.go new file mode 100644 index 000000000..f9e0ab486 --- /dev/null +++ b/adapter/sqs_purge.go @@ -0,0 +1,117 @@ +package adapter + +import ( + "context" + "net/http" + "strconv" + "time" + + "github.com/bootjp/elastickv/kv" + "github.com/cockroachdb/errors" +) + +type sqsPurgeQueueInput struct { + QueueUrl string `json:"QueueUrl"` +} + +// purgeQueue bumps the queue generation so every message under the old +// generation becomes unreachable via routing, leaving the meta record in +// place so the queue still "exists" to clients. AWS rate-limits PurgeQueue +// to one call per 60 seconds per queue; the limiter survives leader +// failover because it is stored on the meta record itself. +func (s *SQSServer) purgeQueue(w http.ResponseWriter, r *http.Request) { + var in sqsPurgeQueueInput + if err := decodeSQSJSONInput(r, &in); err != nil { + writeSQSErrorFromErr(w, err) + return + } + name, err := queueNameFromURL(in.QueueUrl) + if err != nil { + writeSQSErrorFromErr(w, err) + return + } + if err := s.purgeQueueWithRetry(r.Context(), name); err != nil { + writeSQSErrorFromErr(w, err) + return + } + writeSQSJSON(w, map[string]any{}) +} + +func (s *SQSServer) purgeQueueWithRetry(ctx context.Context, queueName string) error { + backoff := transactRetryInitialBackoff + deadline := time.Now().Add(transactRetryMaxDuration) + for range transactRetryMaxAttempts { + done, err := s.tryPurgeQueueOnce(ctx, queueName) + if err == nil && done { + return nil + } + if err != nil && !isRetryableTransactWriteError(err) { + return err + } + if err := waitRetryWithDeadline(ctx, deadline, backoff); err != nil { + return errors.WithStack(err) + } + backoff = nextTransactRetryBackoff(backoff) + } + return newSQSAPIError(http.StatusInternalServerError, sqsErrInternalFailure, "purge queue retry attempts exhausted") +} 
+ +// tryPurgeQueueOnce performs one read-validate-commit pass. The first +// return reports whether the caller should stop retrying (true means +// the purge is committed); a non-retryable error short-circuits the +// loop. +func (s *SQSServer) tryPurgeQueueOnce(ctx context.Context, queueName string) (bool, error) { + readTS := s.nextTxnReadTS(ctx) + meta, exists, err := s.loadQueueMetaAt(ctx, queueName, readTS) + if err != nil { + return false, errors.WithStack(err) + } + if !exists { + return false, newSQSAPIError(http.StatusBadRequest, sqsErrQueueDoesNotExist, "queue does not exist") + } + now := time.Now().UnixMilli() + if meta.LastPurgedAtMillis > 0 && now-meta.LastPurgedAtMillis < sqsPurgeRateLimitMillis { + return false, newSQSAPIError(http.StatusBadRequest, sqsErrPurgeInProgress, + "only one PurgeQueue operation on each queue is allowed every 60 seconds") + } + lastGen, err := s.loadQueueGenerationAt(ctx, queueName, readTS) + if err != nil { + return false, errors.WithStack(err) + } + meta.Generation = lastGen + 1 + meta.LastPurgedAtMillis = now + meta.LastModifiedAtMillis = now + metaBytes, err := encodeSQSQueueMeta(meta) + if err != nil { + return false, errors.WithStack(err) + } + metaKey := sqsQueueMetaKey(queueName) + genKey := sqsQueueGenKey(queueName) + // Tombstone the pre-bump generation so the reaper can find its + // orphan keyspace even if DeleteQueue lands before the next reaper + // tick. Without this, a Purge → Delete sequence within the + // reaper interval permanently leaks data/vis/byage/dedup/group + // rows for the pre-purge generation: scanQueueNames sees no meta, + // and reapTombstonedQueues only sees the post-delete tombstone + // (which is keyed on the post-purge gen). reapDeadByAge filters + // by exact generation, so the older cohort is never visited. 
+ tombstoneKey := sqsQueueTombstoneKey(queueName, lastGen) + // StartTS + ReadKeys fence against a concurrent CreateQueue / + // DeleteQueue / SetQueueAttributes / PurgeQueue landing between + // our load and dispatch. ErrWriteConflict surfaces via the + // retry loop so a later pass observes the new state. + req := &kv.OperationGroup[kv.OP]{ + IsTxn: true, + StartTS: readTS, + ReadKeys: [][]byte{metaKey, genKey}, + Elems: []*kv.Elem[kv.OP]{ + {Op: kv.Put, Key: metaKey, Value: metaBytes}, + {Op: kv.Put, Key: genKey, Value: []byte(strconv.FormatUint(meta.Generation, 10))}, + {Op: kv.Put, Key: tombstoneKey, Value: []byte{1}}, + }, + } + if _, err := s.coordinator.Dispatch(ctx, req); err != nil { + return false, errors.WithStack(err) + } + return true, nil +} diff --git a/adapter/sqs_reaper.go b/adapter/sqs_reaper.go new file mode 100644 index 000000000..c2a078a4f --- /dev/null +++ b/adapter/sqs_reaper.go @@ -0,0 +1,540 @@ +package adapter + +import ( + "bytes" + "context" + "log/slog" + "time" + + "github.com/bootjp/elastickv/kv" + "github.com/bootjp/elastickv/store" + "github.com/cockroachdb/errors" +) + +const ( + // sqsReaperInterval is how often the leader's retention sweeper + // wakes up to look for expired records. AWS does not promise a + // specific reaping cadence; the documented retention guarantee is + // that messages older than MessageRetentionPeriod are eventually + // dropped. 30 s is fast enough that a queue with the minimum + // 60 s retention sees expiries within the same minute, and slow + // enough that an idle cluster pays close to zero CPU. + sqsReaperInterval = 30 * time.Second + // sqsReaperPageLimit caps the per-pass scan of byage entries so + // one tick cannot pin the leader on a backlog. The reaper resumes + // from the next tick, so eventual reaping holds even when the + // backlog exceeds the per-tick budget. 
+ sqsReaperPageLimit = 256 + // sqsReaperPerQueueBudget caps the work per queue per tick to + // avoid starvation across queues — a single queue with millions + // of expired entries should not lock out the others. + sqsReaperPerQueueBudget = 1024 +) + +// startReaper kicks off the retention sweeper on the leader. It is +// safe to call multiple times; the first call wins and subsequent +// calls are no-ops. Stop() cancels the context so the goroutine +// returns promptly. +func (s *SQSServer) startReaper(ctx context.Context) { + if s == nil || s.coordinator == nil || s.store == nil { + return + } + go s.runReaper(ctx) +} + +func (s *SQSServer) runReaper(ctx context.Context) { + t := time.NewTicker(sqsReaperInterval) + defer t.Stop() + for { + select { + case <-ctx.Done(): + return + case <-t.C: + } + // Only the leader should reap; followers would emit + // duplicate Dispatches that the leader would still have to + // adjudicate, costing a round-trip per record. The check is + // a cheap local read. + if s.coordinator == nil || !s.coordinator.IsLeader() { + continue + } + if err := s.reapAllQueues(ctx); err != nil { + slog.Warn("sqs reaper pass failed", "err", err) + } + } +} + +func (s *SQSServer) reapAllQueues(ctx context.Context) error { + names, err := s.scanQueueNames(ctx) + if err != nil { + return errors.WithStack(err) + } + for _, name := range names { + if err := ctx.Err(); err != nil { + return errors.WithStack(err) + } + readTS := s.nextTxnReadTS(ctx) + meta, exists, err := s.loadQueueMetaAt(ctx, name, readTS) + if err != nil || !exists { + // Even when meta is gone (DeleteQueue), prior-generation + // orphans need reaping; reapTombstonedQueues (called + // after this loop) handles that case. Here we only skip + // the queue if loading itself failed (transient). 
+ continue + } + if err := s.reapQueue(ctx, name, meta, readTS); err != nil { + slog.Warn("sqs reaper queue pass failed", "queue", name, "err", err) + } + if err := s.reapExpiredDedup(ctx, name, readTS); err != nil { + slog.Warn("sqs dedup reaper pass failed", "queue", name, "err", err) + } + } + // Tombstones fire on DeleteQueue and outlive the meta row, so a + // purely meta-driven enumeration would never reach orphan keys + // for deleted queues. Walk them after the live-queue pass. + if err := s.reapTombstonedQueues(ctx); err != nil { + slog.Warn("sqs reaper tombstone pass failed", "err", err) + } + return nil +} + +// reapTombstonedQueues enumerates every (queue, gen) tombstone left +// by DeleteQueue and reaps the message keyspace for that +// (queue, gen). Once a tombstone has nothing left to clean — no +// byage, dedup, or group rows — the tombstone itself is deleted so +// the next pass does not re-walk an empty queue forever. +func (s *SQSServer) reapTombstonedQueues(ctx context.Context) error { + prefix := []byte(SqsQueueTombstonePrefix) + upper := prefixScanEnd(prefix) + start := bytes.Clone(prefix) + for { + readTS := s.nextTxnReadTS(ctx) + page, err := s.store.ScanAt(ctx, start, upper, sqsReaperPageLimit, readTS) + if err != nil { + return errors.WithStack(err) + } + if len(page) == 0 { + return nil + } + for _, kvp := range page { + if err := ctx.Err(); err != nil { + return errors.WithStack(err) + } + queueName, gen, ok := parseSqsQueueTombstoneKey(kvp.Key) + if !ok { + continue + } + s.reapTombstonedGeneration(ctx, queueName, gen, kvp.Key, readTS) + } + if len(page) < sqsReaperPageLimit { + return nil + } + start = nextScanCursorAfter(page[len(page)-1].Key) + if bytes.Compare(start, upper) >= 0 { + return nil + } + } +} + +// reapTombstonedGeneration cleans a single (queue, gen) cohort under +// its own per-queue budget. 
Once every prefix the cohort can occupy +// is empty, the tombstone itself is deleted; otherwise it stays so +// the next tick can finish what was left. +func (s *SQSServer) reapTombstonedGeneration(ctx context.Context, queueName string, gen uint64, tombstoneKey []byte, readTS uint64) { + dataDone, err := s.reapDeadByAge(ctx, queueName, gen, readTS) + if err != nil { + slog.Warn("sqs tombstone byage reap failed", "queue", queueName, "gen", gen, "err", err) + return + } + dedupDone, err := s.deleteAllPrefix(ctx, sqsMsgDedupKeyPrefix(queueName, gen), readTS) + if err != nil { + slog.Warn("sqs tombstone dedup reap failed", "queue", queueName, "gen", gen, "err", err) + return + } + groupDone, err := s.deleteAllPrefix(ctx, sqsMsgGroupKeyPrefix(queueName, gen), readTS) + if err != nil { + slog.Warn("sqs tombstone group reap failed", "queue", queueName, "gen", gen, "err", err) + return + } + if dataDone && dedupDone && groupDone { + _ = s.dispatchDedupDelete(ctx, tombstoneKey, readTS) + } +} + +// reapDeadByAge walks the byage prefix for one (queue, gen) cohort +// and reaps each record found, regardless of retention age — every +// row under a tombstoned generation is by definition orphaned. +// Returns done=true when the cohort is fully drained. +func (s *SQSServer) reapDeadByAge(ctx context.Context, queueName string, gen uint64, readTS uint64) (bool, error) { + prefix := append(sqsMsgByAgePrefixAllGenerations(queueName), encodedU64(gen)...) 
+ upper := prefixScanEnd(prefix) + start := bytes.Clone(prefix) + processed := 0 + for processed < sqsReaperPerQueueBudget { + page, err := s.store.ScanAt(ctx, start, upper, sqsReaperPageLimit, readTS) + if err != nil { + return false, errors.WithStack(err) + } + if len(page) == 0 { + return true, nil + } + done, newProcessed, err := s.reapDeadByAgePage(ctx, queueName, gen, page, readTS, processed) + if err != nil { + return false, err + } + processed = newProcessed + if done { + return processed < sqsReaperPerQueueBudget, nil + } + start = nextScanCursorAfter(page[len(page)-1].Key) + } + return false, nil +} + +// reapDeadByAgePage processes one ScanAt page during a tombstone reap +// pass. Returns done=true when either the page was the last one or +// the per-queue budget ran out. +func (s *SQSServer) reapDeadByAgePage(ctx context.Context, queueName string, gen uint64, page []*store.KVPair, readTS uint64, processed int) (bool, int, error) { + for _, kvp := range page { + if err := ctx.Err(); err != nil { + return true, processed, errors.WithStack(err) + } + parsed, ok := parseSqsMsgByAgeKey(kvp.Key, queueName) + if !ok || parsed.Generation != gen { + continue + } + if err := s.reapOneRecord(ctx, queueName, gen, kvp.Key, parsed.MessageID, readTS); err != nil { + return true, processed, err + } + processed++ + if processed >= sqsReaperPerQueueBudget { + return true, processed, nil + } + } + if len(page) < sqsReaperPageLimit { + return true, processed, nil + } + return false, processed, nil +} + +// deleteAllPrefix scans the given prefix and Dispatch-deletes every +// key it finds, one at a time. Returns done=true when the prefix is +// empty (or empty enough that this tick exhausted its work). 
+func (s *SQSServer) deleteAllPrefix(ctx context.Context, prefix []byte, readTS uint64) (bool, error) { + upper := prefixScanEnd(prefix) + start := bytes.Clone(prefix) + processed := 0 + for processed < sqsReaperPerQueueBudget { + page, err := s.store.ScanAt(ctx, start, upper, sqsReaperPageLimit, readTS) + if err != nil { + return false, errors.WithStack(err) + } + if len(page) == 0 { + return true, nil + } + for _, kvp := range page { + if err := ctx.Err(); err != nil { + return false, errors.WithStack(err) + } + if err := s.dispatchDedupDelete(ctx, kvp.Key, readTS); err != nil { + return false, err + } + processed++ + if processed >= sqsReaperPerQueueBudget { + return false, nil + } + } + if len(page) < sqsReaperPageLimit { + return true, nil + } + start = nextScanCursorAfter(page[len(page)-1].Key) + } + return false, nil +} + +// sqsMsgDedupKeyPrefix / sqsMsgGroupKeyPrefix return the (queue, gen) +// prefix for the dedup and group keyspaces. Pulled out as helpers +// so the tombstone reaper does not need to know the encoding. +func sqsMsgDedupKeyPrefix(queueName string, gen uint64) []byte { + buf := make([]byte, 0, len(SqsMsgDedupPrefix)+sqsKeyCapSmall) + buf = append(buf, SqsMsgDedupPrefix...) + buf = append(buf, encodeSQSSegment(queueName)...) + buf = appendU64(buf, gen) + return buf +} + +func sqsMsgGroupKeyPrefix(queueName string, gen uint64) []byte { + buf := make([]byte, 0, len(SqsMsgGroupPrefix)+sqsKeyCapSmall) + buf = append(buf, SqsMsgGroupPrefix...) + buf = append(buf, encodeSQSSegment(queueName)...) + buf = appendU64(buf, gen) + return buf +} + +// reapQueue scans the byage index across every queue generation and +// removes records that are either (a) past the current generation's +// retention deadline, or (b) leftovers from a prior generation that +// PurgeQueue / DeleteQueue advanced past. 
Without case (b), each +// purge would permanently leak data/vis/byage/group-lock state for +// every message it left behind — those keys are unreachable via +// normal routing once the generation bumps, so the reaper is the +// only path that can free them. +// +// One OCC dispatch per record keeps each transaction small and +// bounded; a mega-batch transaction would balloon memory and abort +// more often. +func (s *SQSServer) reapQueue(ctx context.Context, queueName string, meta *sqsQueueMeta, readTS uint64) error { + now := time.Now().UnixMilli() + cutoff := now - meta.MessageRetentionSeconds*sqsMillisPerSecond + if meta.MessageRetentionSeconds <= 0 { + // Retention was set to a non-positive value: only orphan + // reaping (case b) makes sense. Keep cutoff at MaxInt64-ish + // for the live generation so we never delete live records. + cutoff = 0 + } + prefix := sqsMsgByAgePrefixAllGenerations(queueName) + upper := prefixScanEnd(prefix) + start := bytes.Clone(prefix) + + processed := 0 + for processed < sqsReaperPerQueueBudget { + page, err := s.store.ScanAt(ctx, start, upper, sqsReaperPageLimit, readTS) + if err != nil { + return errors.WithStack(err) + } + if len(page) == 0 { + return nil + } + done, newProcessed, err := s.reapPage(ctx, queueName, meta.Generation, cutoff, page, readTS, processed) + if err != nil { + return err + } + processed = newProcessed + if done { + return nil + } + start = nextScanCursorAfter(page[len(page)-1].Key) + if bytes.Compare(start, upper) >= 0 { + return nil + } + } + return nil +} + +// reapPage walks one ScanAt page, dispatching a per-record reap +// transaction. currentGen is the queue's *live* generation; entries +// under any earlier generation are unconditionally reaped, while +// entries on the live generation are gated by `cutoff`. Returns +// done=true when the per-queue budget is hit or the page was short +// (last page in the scan). 
+func (s *SQSServer) reapPage(ctx context.Context, queueName string, currentGen uint64, cutoff int64, page []*store.KVPair, readTS uint64, processed int) (bool, int, error) { + for _, kvp := range page { + if err := ctx.Err(); err != nil { + return true, processed, errors.WithStack(err) + } + parsed, ok := parseSqsMsgByAgeKey(kvp.Key, queueName) + if !ok { + continue + } + // Live generation is gated by retention; older generations + // are unconditional orphans. Skipping a live record that is + // still inside the retention window keeps the reaper honest + // — the receive path expects to see it again until retention + // elapses. + if parsed.Generation == currentGen && parsed.SendTimestampMs > cutoff { + continue + } + if parsed.Generation > currentGen { + // Defensive: a key from a generation strictly newer than + // what the meta says would mean the byage index races + // the gen counter. Skip it; the next reaper pass will + // see meta caught up. + continue + } + if err := s.reapOneRecord(ctx, queueName, parsed.Generation, kvp.Key, parsed.MessageID, readTS); err != nil { + return true, processed, err + } + processed++ + if processed >= sqsReaperPerQueueBudget { + return true, processed, nil + } + } + if len(page) < sqsReaperPageLimit { + return true, processed, nil + } + return false, processed, nil +} + +// reapOneRecord deletes one (data, vis, byage, optional group-lock) +// quartet under a single OCC dispatch. ErrWriteConflict is treated as +// success — the message has just been touched (received, deleted, +// redriven) by another path and is no longer ours to reap. +func (s *SQSServer) reapOneRecord(ctx context.Context, queueName string, gen uint64, byAgeKey []byte, messageID string, readTS uint64) error { + dataKey := sqsMsgDataKey(queueName, gen, messageID) + parsed, found, err := s.loadDataForReaper(ctx, dataKey, readTS) + if err != nil { + return err + } + if !found { + // Stale byage index without a backing record. 
Drop the + // index entry alone — without this branch the reaper would + // loop on the same orphan key forever. + s.dispatchOrphanByAgeDrop(ctx, byAgeKey, readTS) + return nil + } + req, err := s.buildReapOps(ctx, queueName, gen, byAgeKey, dataKey, parsed, readTS) + if err != nil { + return err + } + if _, err := s.coordinator.Dispatch(ctx, req); err != nil { + if isRetryableTransactWriteError(err) { + return nil + } + return errors.WithStack(err) + } + return nil +} + +// loadDataForReaper fetches and decodes the data record for a byage +// entry. found=false signals "byage points at a missing record — drop +// the byage entry" to the caller. Read errors other than ErrKeyNotFound +// surface to the caller so a transient storage problem is logged and +// retried on the next tick instead of silently scrubbing the index. +func (s *SQSServer) loadDataForReaper(ctx context.Context, dataKey []byte, readTS uint64) (*sqsMessageRecord, bool, error) { + raw, err := s.store.GetAt(ctx, dataKey, readTS) + if err != nil { + if errors.Is(err, store.ErrKeyNotFound) { + return nil, false, nil + } + return nil, false, errors.WithStack(err) + } + parsed, err := decodeSQSMessageRecord(raw) + if err != nil { + return nil, false, errors.WithStack(err) + } + return parsed, true, nil +} + +func (s *SQSServer) dispatchOrphanByAgeDrop(ctx context.Context, byAgeKey []byte, readTS uint64) { + req := &kv.OperationGroup[kv.OP]{ + IsTxn: true, + StartTS: readTS, + ReadKeys: [][]byte{byAgeKey}, + Elems: []*kv.Elem[kv.OP]{ + {Op: kv.Del, Key: byAgeKey}, + }, + } + _, _ = s.coordinator.Dispatch(ctx, req) +} + +// reapExpiredDedup walks every FIFO dedup record under the given +// queue (across generations) and deletes the ones whose +// ExpiresAtMillis has passed. Without this sweep, queues with mostly +// unique MessageDeduplicationIds would accumulate permanent +// dedup-row leaks because the send path treats expired records as +// misses but never removes them. 
+func (s *SQSServer) reapExpiredDedup(ctx context.Context, queueName string, readTS uint64) error { + prefix := []byte(SqsMsgDedupPrefix) + prefix = append(prefix, []byte(encodeSQSSegment(queueName))...) + upper := prefixScanEnd(prefix) + start := bytes.Clone(prefix) + now := time.Now().UnixMilli() + + processed := 0 + for processed < sqsReaperPerQueueBudget { + page, err := s.store.ScanAt(ctx, start, upper, sqsReaperPageLimit, readTS) + if err != nil { + return errors.WithStack(err) + } + if len(page) == 0 { + return nil + } + done, newProcessed, err := s.reapDedupPage(ctx, page, now, readTS, processed) + if err != nil { + return err + } + processed = newProcessed + if done { + return nil + } + start = nextScanCursorAfter(page[len(page)-1].Key) + if bytes.Compare(start, upper) >= 0 { + return nil + } + } + return nil +} + +// reapDedupPage walks one ScanAt page of dedup records and removes +// any whose ExpiresAtMillis is in the past. Returns done=true when +// the per-queue budget runs out or the page was short. 
+func (s *SQSServer) reapDedupPage(ctx context.Context, page []*store.KVPair, now int64, readTS uint64, processed int) (bool, int, error) { + for _, kvp := range page { + if err := ctx.Err(); err != nil { + return true, processed, errors.WithStack(err) + } + rec, err := decodeFifoDedupRecord(kvp.Value) + if err != nil { + continue + } + if rec.ExpiresAtMillis <= 0 || rec.ExpiresAtMillis > now { + continue + } + if err := s.dispatchDedupDelete(ctx, kvp.Key, readTS); err != nil { + return true, processed, err + } + processed++ + if processed >= sqsReaperPerQueueBudget { + return true, processed, nil + } + } + if len(page) < sqsReaperPageLimit { + return true, processed, nil + } + return false, processed, nil +} + +func (s *SQSServer) dispatchDedupDelete(ctx context.Context, key []byte, readTS uint64) error { + req := &kv.OperationGroup[kv.OP]{ + IsTxn: true, + StartTS: readTS, + ReadKeys: [][]byte{key}, + Elems: []*kv.Elem[kv.OP]{ + {Op: kv.Del, Key: key}, + }, + } + if _, err := s.coordinator.Dispatch(ctx, req); err != nil { + if isRetryableTransactWriteError(err) { + return nil + } + return errors.WithStack(err) + } + return nil +} + +func (s *SQSServer) buildReapOps(ctx context.Context, queueName string, gen uint64, byAgeKey, dataKey []byte, parsed *sqsMessageRecord, readTS uint64) (*kv.OperationGroup[kv.OP], error) { + visKey := sqsMsgVisKey(queueName, gen, parsed.VisibleAtMillis, parsed.MessageID) + readKeys := [][]byte{byAgeKey, dataKey, visKey, sqsQueueMetaKey(queueName), sqsQueueGenKey(queueName)} + elems := []*kv.Elem[kv.OP]{ + {Op: kv.Del, Key: byAgeKey}, + {Op: kv.Del, Key: dataKey}, + {Op: kv.Del, Key: visKey}, + } + if parsed.MessageGroupId != "" { + lockKey := sqsMsgGroupKey(queueName, gen, parsed.MessageGroupId) + lock, err := s.loadFifoGroupLock(ctx, queueName, gen, parsed.MessageGroupId, readTS) + if err != nil { + return nil, err + } + if lock != nil && lock.MessageID == parsed.MessageID { + readKeys = append(readKeys, lockKey) + elems = 
append(elems, &kv.Elem[kv.OP]{Op: kv.Del, Key: lockKey}) + } + } + return &kv.OperationGroup[kv.OP]{ + IsTxn: true, + StartTS: readTS, + ReadKeys: readKeys, + Elems: elems, + }, nil +} diff --git a/adapter/sqs_redrive.go b/adapter/sqs_redrive.go new file mode 100644 index 000000000..4e1084862 --- /dev/null +++ b/adapter/sqs_redrive.go @@ -0,0 +1,336 @@ +package adapter + +import ( + "context" + "net/http" + "strconv" + "strings" + "time" + + "github.com/bootjp/elastickv/kv" + "github.com/cockroachdb/errors" + json "github.com/goccy/go-json" +) + +// parsedRedrivePolicy is the in-memory shape of the RedrivePolicy JSON +// blob clients send. AWS allows maxReceiveCount as either a JSON +// number or a string, so the parser handles both. +type parsedRedrivePolicy struct { + DeadLetterTargetArn string + DLQName string + MaxReceiveCount int64 +} + +// rawRedrivePolicy mirrors the AWS JSON shape. maxReceiveCount uses +// json.Number so we can accept both numeric and string forms without +// disagreeing with the SDKs. +type rawRedrivePolicy struct { + DeadLetterTargetArn string `json:"deadLetterTargetArn"` + MaxReceiveCount json.Number `json:"maxReceiveCount"` +} + +// AWS SQS allows maxReceiveCount in [1, 1000]. +const ( + sqsRedriveMaxReceiveCountMax = 1000 + sqsRedriveMaxReceiveCountMin = 1 +) + +// parseRedrivePolicy validates a RedrivePolicy JSON blob and extracts +// the DLQ queue name from the deadLetterTargetArn. ARNs are expected +// to be of the form arn:aws:sqs:::; we +// tolerate cluster-local synthesized ARNs by treating the segment +// after the last colon as the queue name. 
+func parseRedrivePolicy(s string) (*parsedRedrivePolicy, error) { + s = strings.TrimSpace(s) + if s == "" { + return nil, newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "RedrivePolicy must be non-empty JSON") + } + var raw rawRedrivePolicy + if err := json.Unmarshal([]byte(s), &raw); err != nil { + return nil, newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "RedrivePolicy is not valid JSON") + } + if raw.DeadLetterTargetArn == "" { + return nil, newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "RedrivePolicy.deadLetterTargetArn is required") + } + maxReceive, err := raw.MaxReceiveCount.Int64() + if err != nil { + return nil, newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "RedrivePolicy.maxReceiveCount must be an integer") + } + if maxReceive < sqsRedriveMaxReceiveCountMin || maxReceive > sqsRedriveMaxReceiveCountMax { + return nil, newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "RedrivePolicy.maxReceiveCount must be between 1 and 1000") + } + dlqName := dlqNameFromArn(raw.DeadLetterTargetArn) + if dlqName == "" { + return nil, newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "RedrivePolicy.deadLetterTargetArn is malformed") + } + return &parsedRedrivePolicy{ + DeadLetterTargetArn: raw.DeadLetterTargetArn, + DLQName: dlqName, + MaxReceiveCount: maxReceive, + }, nil +} + +// dlqNameFromArn returns the queue name segment of an SQS ARN. AWS +// ARNs always have name as the final colon-delimited segment, so a +// last-colon split is correct for both production and test ARNs. +func dlqNameFromArn(arn string) string { + idx := strings.LastIndex(arn, ":") + if idx < 0 || idx == len(arn)-1 { + return "" + } + return arn[idx+1:] +} + +// shouldRedrive reports whether a candidate's *next* receive would +// trip the redrive policy. 
// trip the redrive policy. Bumping ReceiveCount by 1 first matches
// AWS's "maxReceiveCount is the number of times a message can be
// received before being moved to the DLQ" definition.
func shouldRedrive(rec *sqsMessageRecord, policy *parsedRedrivePolicy) bool {
	// A nil policy means the source queue has no RedrivePolicy
	// configured: nothing is ever redriven.
	if policy == nil {
		return false
	}
	return rec.ReceiveCount+1 > policy.MaxReceiveCount
}

// redriveCandidateToDLQ atomically moves a candidate from the source
// queue to the DLQ inside one OCC transaction. The source's data and
// vis-index entries are deleted; a fresh DLQ message record (with
// reset ReceiveCount and a new receipt token) is written along with
// its visibility entry.
//
// The DeadLetterQueueSourceArn attribute is added so consumers reading
// the DLQ can correlate moved messages back to the originating queue.
//
// Returns (handled, err): handled=true means the candidate was either
// moved or lost an OCC race (write conflict) to another receiver that
// may have moved or rotated the same record — the caller treats both
// as "stop considering this candidate". Any other dispatch error
// propagates so an operational failure does not silently leave the
// poison message in the source queue.
func (s *SQSServer) redriveCandidateToDLQ(
	ctx context.Context,
	srcQueueName string,
	srcGen uint64,
	cand sqsMsgCandidate,
	srcDataKey []byte,
	srcRec *sqsMessageRecord,
	policy *parsedRedrivePolicy,
	srcArn string,
	readTS uint64,
) (bool, error) {
	// All static preconditions (self-reference, vanished queues, FIFO
	// type parity) are checked before any write is assembled.
	dlqMeta, err := s.validateRedriveTargets(ctx, srcQueueName, srcRec, policy, readTS)
	if err != nil {
		return false, err
	}
	// FIFO DLQs require the redrive write to participate in the
	// per-queue SequenceNumber sequence, otherwise the DLQ record
	// is committed with SequenceNumber=0 (AWS surfaces this
	// verbatim, and 0 violates AWS's invariant that sequences
	// start at 1) and the next normal FIFO send to the DLQ assigns
	// a number lower than the redriven message — non-monotonic to
	// consumers. Load the seq snapshot at readTS, increment, and
	// pass it into both buildDLQRecord (encoded onto the record)
	// and buildRedriveOps (Put + ReadKeys fence).
	var dlqSeq uint64
	if dlqMeta.IsFIFO {
		prevSeq, err := s.loadFifoSequence(ctx, policy.DLQName, readTS)
		if err != nil {
			return false, err
		}
		dlqSeq = prevSeq + 1
	}
	// dlqSeq stays 0 for Standard DLQs; buildDLQRecord encodes it and
	// buildRedriveOps only persists the counter when dlqMeta.IsFIFO.
	dlqRec, dlqRecordBytes, err := buildDLQRecord(srcRec, dlqMeta, srcArn, dlqSeq)
	if err != nil {
		return false, err
	}
	req, err := s.buildRedriveOps(ctx, srcQueueName, srcGen, cand, srcDataKey, srcRec, policy, dlqMeta, dlqRec, dlqRecordBytes, dlqSeq, readTS)
	if err != nil {
		return false, err
	}
	if _, err := s.coordinator.Dispatch(ctx, req); err != nil {
		// OCC write conflict: another receiver won the race. Treated
		// as handled (skip), not as failure.
		if isRetryableTransactWriteError(err) {
			return true, nil
		}
		return false, errors.WithStack(err)
	}
	return true, nil
}

// validateRedriveTargets enforces every static precondition on the
// (source, DLQ, policy) triple before the OCC dispatch is built.
// Returns the loaded DLQ meta on success so the caller does not have
// to re-load it.
//
// Failure modes (all surfaced as 4xx sqsAPIError):
//   - self-referential RedrivePolicy (defense-in-depth against records
//     that predate the attribute-time validator),
//   - DLQ vanished between policy-set and receive,
//   - source queue vanished mid-redrive (DeleteQueue race),
//   - source/DLQ queue-type mismatch (FIFO ↔ Standard) — AWS forbids
//     this and runtime is the only place it can be enforced because
//     the catalog accepts a RedrivePolicy that names a queue created
//     or recreated later as a different type,
//   - FIFO DLQ paired with a source record lacking MessageGroupId
//     (defense in depth against malformed records that slip past the
//     type-equality check).
+func (s *SQSServer) validateRedriveTargets( + ctx context.Context, + srcQueueName string, + srcRec *sqsMessageRecord, + policy *parsedRedrivePolicy, + readTS uint64, +) (*sqsQueueMeta, error) { + if policy.DLQName == srcQueueName { + return nil, newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "RedrivePolicy.deadLetterTargetArn must not point at the source queue") + } + dlqMeta, dlqExists, err := s.loadQueueMetaAt(ctx, policy.DLQName, readTS) + if err != nil { + return nil, errors.WithStack(err) + } + if !dlqExists { + return nil, newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "RedrivePolicy targets non-existent DLQ "+policy.DLQName) + } + srcMeta, srcExists, err := s.loadQueueMetaAt(ctx, srcQueueName, readTS) + if err != nil { + return nil, errors.WithStack(err) + } + if !srcExists { + return nil, newSQSAPIError(http.StatusBadRequest, sqsErrQueueDoesNotExist, + "source queue disappeared during redrive") + } + if srcMeta.IsFIFO != dlqMeta.IsFIFO { + return nil, newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "RedrivePolicy queue-type mismatch: source and DLQ must both be FIFO or both Standard") + } + if dlqMeta.IsFIFO && srcRec.MessageGroupId == "" { + return nil, newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue, + "FIFO DLQ requires source records to carry MessageGroupId") + } + return dlqMeta, nil +} + +// buildDLQRecord assembles the DLQ-side message record. Reset +// ReceiveCount and FirstReceiveMillis so the DLQ consumer sees a +// fresh delivery, not the source's bounce history. +// +// dlqSeq is the SequenceNumber to assign on the DLQ record, computed +// by the caller as `loadFifoSequence(dlq) + 1` for FIFO DLQs and +// passed as 0 for Standard DLQs (the field is unused in that case). 
+// The seq must be the same value the caller will Put into the DLQ's +// sqsQueueSeqKey inside the same OCC transaction (see buildRedriveOps); +// otherwise the redriven message and the on-disk counter disagree +// and a later FIFO send to the DLQ produces a non-monotonic +// SequenceNumber. +func buildDLQRecord(srcRec *sqsMessageRecord, dlqMeta *sqsQueueMeta, srcArn string, dlqSeq uint64) (*sqsMessageRecord, []byte, error) { + dlqMsgID, err := newMessageIDHex() + if err != nil { + return nil, nil, errors.WithStack(err) + } + dlqToken, err := newReceiptToken() + if err != nil { + return nil, nil, errors.WithStack(err) + } + now := time.Now().UnixMilli() + rec := &sqsMessageRecord{ + MessageID: dlqMsgID, + Body: srcRec.Body, + MD5OfBody: srcRec.MD5OfBody, + MD5OfMessageAttributes: srcRec.MD5OfMessageAttributes, + MessageAttributes: srcRec.MessageAttributes, + SenderID: srcRec.SenderID, + SendTimestampMillis: now, + AvailableAtMillis: now, + VisibleAtMillis: now, + ReceiveCount: 0, + FirstReceiveMillis: 0, + CurrentReceiptToken: dlqToken, + QueueGeneration: dlqMeta.Generation, + MessageGroupId: srcRec.MessageGroupId, + MessageDeduplicationId: srcRec.MessageDeduplicationId, + DeadLetterSourceArn: srcArn, + SequenceNumber: dlqSeq, + } + body, err := encodeSQSMessageRecord(rec) + if err != nil { + return nil, nil, errors.WithStack(err) + } + return rec, body, nil +} + +// buildRedriveOps assembles the cross-queue OCC OperationGroup that +// atomically removes the source's keyspace and writes the DLQ +// version. The FIFO group-lock release branch lives here so the +// caller stays under the cyclomatic budget. +// +// dlqSeq is non-zero only when the DLQ is FIFO (per the caller's +// pre-load via loadFifoSequence). When non-zero, the txn additionally +// reads sqsQueueSeqKey(policy.DLQName) — guarding against a +// concurrent FIFO send / redrive racing for the same sequence — and +// writes the new value back. 
// dlqRec.SequenceNumber is already set to dlqSeq inside
// buildDLQRecord; this function is responsible only for the OCC
// plumbing.
func (s *SQSServer) buildRedriveOps(
	ctx context.Context,
	srcQueueName string,
	srcGen uint64,
	cand sqsMsgCandidate,
	srcDataKey []byte,
	srcRec *sqsMessageRecord,
	policy *parsedRedrivePolicy,
	dlqMeta *sqsQueueMeta,
	dlqRec *sqsMessageRecord,
	dlqRecordBytes []byte,
	dlqSeq uint64,
	readTS uint64,
) (*kv.OperationGroup[kv.OP], error) {
	// All DLQ-side keys are derived from the DLQ record's own send
	// time so its vis/by-age indexes agree with the record payload.
	now := dlqRec.SendTimestampMillis
	dlqDataKey := sqsMsgDataKey(policy.DLQName, dlqMeta.Generation, dlqRec.MessageID)
	dlqVisKey := sqsMsgVisKey(policy.DLQName, dlqMeta.Generation, now, dlqRec.MessageID)
	dlqByAgeKey := sqsMsgByAgeKey(policy.DLQName, dlqMeta.Generation, now, dlqRec.MessageID)
	srcByAgeKey := sqsMsgByAgeKey(srcQueueName, srcGen, srcRec.SendTimestampMillis, srcRec.MessageID)
	// Fence on the candidate's vis entry + data record (detects a
	// racing receive/delete) and on both queues' meta/gen keys
	// (detects DeleteQueue / recreate on either side).
	readKeys := [][]byte{
		cand.visKey, srcDataKey,
		sqsQueueMetaKey(srcQueueName), sqsQueueGenKey(srcQueueName),
		sqsQueueMetaKey(policy.DLQName), sqsQueueGenKey(policy.DLQName),
	}
	// Deletes of the source keyspace precede the DLQ writes; within
	// one txn the order is cosmetic but kept grouped for readability.
	elems := []*kv.Elem[kv.OP]{
		{Op: kv.Del, Key: cand.visKey},
		{Op: kv.Del, Key: srcDataKey},
		{Op: kv.Del, Key: srcByAgeKey},
		{Op: kv.Put, Key: dlqDataKey, Value: dlqRecordBytes},
		{Op: kv.Put, Key: dlqVisKey, Value: []byte(dlqRec.MessageID)},
		{Op: kv.Put, Key: dlqByAgeKey, Value: []byte(dlqRec.MessageID)},
	}
	if dlqMeta.IsFIFO {
		// Persist the advanced sequence counter and fence on it so a
		// concurrent FIFO send to the DLQ cannot claim the same seq.
		seqKey := sqsQueueSeqKey(policy.DLQName)
		readKeys = append(readKeys, seqKey)
		elems = append(elems, &kv.Elem[kv.OP]{
			Op:    kv.Put,
			Key:   seqKey,
			Value: []byte(strconv.FormatUint(dlqSeq, 10)),
		})
	}
	if srcRec.MessageGroupId != "" {
		// Release the source FIFO group lock, but only if this record
		// is the current holder — another message may own it by now.
		lockKey := sqsMsgGroupKey(srcQueueName, srcGen, srcRec.MessageGroupId)
		lock, err := s.loadFifoGroupLock(ctx, srcQueueName, srcGen, srcRec.MessageGroupId, readTS)
		if err != nil {
			return nil, err
		}
		if lock != nil && lock.MessageID == srcRec.MessageID {
			readKeys = append(readKeys, lockKey)
			elems = append(elems, &kv.Elem[kv.OP]{Op: kv.Del, Key: lockKey})
		}
	}
	return &kv.OperationGroup[kv.OP]{
		IsTxn:    true,
		StartTS:  readTS,
		ReadKeys: readKeys,
		Elems:    elems,
	}, nil
}
diff --git a/adapter/sqs_tags.go b/adapter/sqs_tags.go
new file mode 100644
index 000000000..95122387b
--- /dev/null
+++ b/adapter/sqs_tags.go
@@ -0,0 +1,189 @@
package adapter

import (
	"context"
	"net/http"
	"time"

	"github.com/bootjp/elastickv/kv"
	"github.com/cockroachdb/errors"
)

// AWS allows up to 50 tags per resource. Enforced adapter-side so a
// runaway client cannot bloat the meta record.
const sqsMaxTagsPerQueue = 50

// sqsTagQueueInput is the JSON-protocol request body for TagQueue.
type sqsTagQueueInput struct {
	QueueUrl string            `json:"QueueUrl"`
	Tags     map[string]string `json:"Tags"`
}

// sqsUntagQueueInput is the JSON-protocol request body for UntagQueue.
type sqsUntagQueueInput struct {
	QueueUrl string   `json:"QueueUrl"`
	TagKeys  []string `json:"TagKeys"`
}

// sqsListQueueTagsInput is the JSON-protocol request body for ListQueueTags.
type sqsListQueueTagsInput struct {
	QueueUrl string `json:"QueueUrl"`
}

// tagQueue handles the SQS TagQueue action: it merges the request's
// Tags into the queue meta record under an OCC retry loop.
func (s *SQSServer) tagQueue(w http.ResponseWriter, r *http.Request) {
	var in sqsTagQueueInput
	if err := decodeSQSJSONInput(r, &in); err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	name, err := queueNameFromURL(in.QueueUrl)
	if err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	if len(in.Tags) == 0 {
		writeSQSError(w, http.StatusBadRequest, sqsErrMissingParameter, "Tags is required")
		return
	}
	if err := s.mutateQueueTagsWithRetry(r.Context(), name, func(meta *sqsQueueMeta) error {
		if meta.Tags == nil {
			meta.Tags = make(map[string]string, len(in.Tags))
		}
		// Last write wins per key, matching AWS TagQueue overwrite
		// semantics for existing tag keys.
		for k, v := range in.Tags {
			meta.Tags[k] = v
		}
		// Cap the per-queue tag count after merging so a follow-up
		// TagQueue cannot push a queue past the AWS limit one tag at
		// a time.
		if len(meta.Tags) > sqsMaxTagsPerQueue {
			return newSQSAPIError(http.StatusBadRequest, sqsErrInvalidAttributeValue,
				"queue tag count exceeds 50")
		}
		return nil
	}); err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	// AWS returns an empty JSON body on TagQueue success.
	writeSQSJSON(w, map[string]any{})
}

// untagQueue handles the SQS UntagQueue action: it deletes the given
// tag keys from the queue meta record under an OCC retry loop.
// Deleting a key that is absent is a no-op, matching AWS semantics.
func (s *SQSServer) untagQueue(w http.ResponseWriter, r *http.Request) {
	var in sqsUntagQueueInput
	if err := decodeSQSJSONInput(r, &in); err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	name, err := queueNameFromURL(in.QueueUrl)
	if err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	if len(in.TagKeys) == 0 {
		writeSQSError(w, http.StatusBadRequest, sqsErrMissingParameter, "TagKeys is required")
		return
	}
	if err := s.mutateQueueTagsWithRetry(r.Context(), name, func(meta *sqsQueueMeta) error {
		// delete on a nil map is a safe no-op in Go, so no nil guard
		// is needed here.
		for _, k := range in.TagKeys {
			delete(meta.Tags, k)
		}
		return nil
	}); err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	writeSQSJSON(w, map[string]any{})
}

// listQueueTags handles the SQS ListQueueTags action: a read-only
// snapshot of the queue meta's Tags map at the current read timestamp.
func (s *SQSServer) listQueueTags(w http.ResponseWriter, r *http.Request) {
	var in sqsListQueueTagsInput
	if err := decodeSQSJSONInput(r, &in); err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	name, err := queueNameFromURL(in.QueueUrl)
	if err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	meta, exists, err := s.loadQueueMetaAt(r.Context(), name, s.nextTxnReadTS(r.Context()))
	if err != nil {
		writeSQSErrorFromErr(w, err)
		return
	}
	if !exists {
		writeSQSError(w, http.StatusBadRequest, sqsErrQueueDoesNotExist, "queue does not exist")
		return
	}
	tags := meta.Tags
	if tags == nil {
		// AWS always returns a Tags field; a nil map would marshal to
		// null and trip strict JSON consumers.
		tags = map[string]string{}
	}
	writeSQSJSON(w, map[string]any{"Tags": tags})
}

// mutateQueueTagsWithRetry runs an OCC-bounded read-modify-write of the
// queue meta record. The mutator may inspect or modify meta.Tags; any
// validation error it returns short-circuits the retry loop.
func (s *SQSServer) mutateQueueTagsWithRetry(
	ctx context.Context,
	queueName string,
	mutate func(*sqsQueueMeta) error,
) error {
	backoff := transactRetryInitialBackoff
	deadline := time.Now().Add(transactRetryMaxDuration)
	for range transactRetryMaxAttempts {
		done, err := s.tryMutateQueueTagsOnce(ctx, queueName, mutate)
		if err == nil && done {
			return nil
		}
		// Non-retryable errors (validation failures, missing queue,
		// hard store errors) propagate immediately; only OCC write
		// conflicts fall through to the backoff-and-retry path.
		if err != nil && !isRetryableTransactWriteError(err) {
			return err
		}
		if err := waitRetryWithDeadline(ctx, deadline, backoff); err != nil {
			return errors.WithStack(err)
		}
		backoff = nextTransactRetryBackoff(backoff)
	}
	return newSQSAPIError(http.StatusInternalServerError, sqsErrInternalFailure, "tag mutation retry attempts exhausted")
}

// tryMutateQueueTagsOnce performs one OCC attempt: snapshot the meta
// at a fresh read timestamp, apply the mutator, and commit the
// re-encoded meta fenced on the meta key. Returns (true, nil) on
// commit; a write conflict surfaces as a (retryable) error from
// Dispatch.
func (s *SQSServer) tryMutateQueueTagsOnce(
	ctx context.Context,
	queueName string,
	mutate func(*sqsQueueMeta) error,
) (bool, error) {
	readTS := s.nextTxnReadTS(ctx)
	meta, exists, err := s.loadQueueMetaAt(ctx, queueName, readTS)
	if err != nil {
		return false, errors.WithStack(err)
	}
	if !exists {
		return false, newSQSAPIError(http.StatusBadRequest, sqsErrQueueDoesNotExist, "queue does not exist")
	}
	if err := mutate(meta); err != nil {
		// Mutator errors are validation failures; nothing has been
		// persisted at this point.
		return false, err
	}
	if len(meta.Tags) == 0 {
		// Drop the empty map so the encoded record stays compact and
		// equality checks (attributesEqual) treat absent vs empty the
		// same.
		meta.Tags = nil
	}
	meta.LastModifiedAtMillis = time.Now().UnixMilli()
	metaBytes, err := encodeSQSQueueMeta(meta)
	if err != nil {
		return false, errors.WithStack(err)
	}
	metaKey := sqsQueueMetaKey(queueName)
	req := &kv.OperationGroup[kv.OP]{
		IsTxn:    true,
		StartTS:  readTS,
		ReadKeys: [][]byte{metaKey},
		Elems: []*kv.Elem[kv.OP]{
			{Op: kv.Put, Key: metaKey, Value: metaBytes},
		},
	}
	if _, err := s.coordinator.Dispatch(ctx, req); err != nil {
		return false, errors.WithStack(err)
	}
	return true, nil
}
diff --git a/adapter/sqs_test.go b/adapter/sqs_test.go
index 721917174..3083119ad 100644
--- a/adapter/sqs_test.go
+++ b/adapter/sqs_test.go
@@ -120,36 +120,25 @@ func TestSQSServer_UnknownTargetReturnsInvalidAction(t *testing.T)
	}
}

// TestSQSServer_AllTargetsHaveHandlers replaces the old
// TestSQSServer_KnownTargetsReturnNotImplemented, which pinned a fixed
// list of NotImplemented targets and went stale each time a real
// handler shipped — that drift hid the PurgeQueue/Tag* implementations
// behind a stale assertion. Every registered target now has a real
// handler (wired in NewSQSServer), so the only route-table contract
// left to pin from outside the HTTP boundary is that an UNREGISTERED
// target surfaces InvalidAction with HTTP 400 — which is exactly (and
// only) what this test checks. It does NOT inspect targetHandlers:
// the black-box HTTP client has no access to the dispatch map.
// NOTE(review): an in-process assertion over targetHandlers would
// match this test's name more literally — consider adding one.
func TestSQSServer_AllTargetsHaveHandlers(t *testing.T) {
	t.Parallel()
	base := startTestSQSServer(t)
	// Post a target no handler registers. The router must answer with
	// HTTP 400, i.e. the InvalidAction client-error path — not the 501
	// that the retired NotImplemented stubs used — so this test is not
	// the one to break if that contract changes elsewhere.
	resp := postSQSRequest(t, base+"/", "AmazonSQS.NotARealOp", "{}")
	defer resp.Body.Close()
	if resp.StatusCode != http.StatusBadRequest {
		t.Fatalf("unknown target: got %d want %d", resp.StatusCode, http.StatusBadRequest)
	}
}