diff --git a/cmd/kafka-consumer/writer.go b/cmd/kafka-consumer/writer.go new file mode 100644 index 0000000000..cccab9372b --- /dev/null +++ b/cmd/kafka-consumer/writer.go @@ -0,0 +1,584 @@ +// Copyright 2024 PingCAP, Inc. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// See the License for the specific language governing permissions and +// limitations under the License. + +package main + +import ( + "context" + "database/sql" + "errors" + "math" + "sync" + "time" + + "github.com/confluentinc/confluent-kafka-go/v2/kafka" + "github.com/pingcap/log" + "github.com/pingcap/tiflow/cdc/model" + "github.com/pingcap/tiflow/cdc/sink/ddlsink" + ddlsinkfactory "github.com/pingcap/tiflow/cdc/sink/ddlsink/factory" + eventsinkfactory "github.com/pingcap/tiflow/cdc/sink/dmlsink/factory" + "github.com/pingcap/tiflow/cdc/sink/dmlsink/mq/dispatcher" + "github.com/pingcap/tiflow/cdc/sink/tablesink" + "github.com/pingcap/tiflow/pkg/config" + cerror "github.com/pingcap/tiflow/pkg/errors" + "github.com/pingcap/tiflow/pkg/sink/codec" + "github.com/pingcap/tiflow/pkg/sink/codec/avro" + "github.com/pingcap/tiflow/pkg/sink/codec/canal" + "github.com/pingcap/tiflow/pkg/sink/codec/debezium" + "github.com/pingcap/tiflow/pkg/sink/codec/open" + "github.com/pingcap/tiflow/pkg/sink/codec/simple" + "github.com/pingcap/tiflow/pkg/spanz" + "go.uber.org/zap" +) + +// NewDecoder will create a new event decoder +func NewDecoder(ctx context.Context, option *option, upstreamTiDB *sql.DB) (codec.RowEventDecoder, error) { + var ( + decoder codec.RowEventDecoder + err error + ) + switch option.protocol { + case config.ProtocolOpen, config.ProtocolDefault: + decoder, err = open.NewBatchDecoder(ctx, option.codecConfig, upstreamTiDB) + case config.ProtocolCanalJSON: + decoder, err = canal.NewBatchDecoder(ctx, option.codecConfig, upstreamTiDB) + case config.ProtocolAvro: + schemaM, err := avro.NewConfluentSchemaManager(ctx, option.schemaRegistryURI, nil) + if err != nil { + return decoder, cerror.Trace(err) + } + decoder = avro.NewDecoder(option.codecConfig, schemaM, option.topic, upstreamTiDB) + case config.ProtocolSimple: + decoder, err = simple.NewDecoder(ctx, option.codecConfig, upstreamTiDB) + case config.ProtocolDebezium: + decoder = debezium.NewDecoder(option.codecConfig, upstreamTiDB) + default: + log.Panic("Protocol not supported", zap.Any("Protocol", option.protocol)) + } + if err != nil { + return nil, cerror.Trace(err) + } + return decoder, err +} + +type partitionProgress struct { + partition int32 + watermark uint64 + watermarkOffset kafka.Offset + + tableSinkMap map[model.TableID]tablesink.TableSink + eventGroups map[model.TableID]*eventsGroup + decoder codec.RowEventDecoder +} + +func newPartitionProgress(partition int32, decoder codec.RowEventDecoder) *partitionProgress { + return &partitionProgress{ + partition: partition, + eventGroups: make(map[model.TableID]*eventsGroup), + tableSinkMap: make(map[model.TableID]tablesink.TableSink), + decoder: decoder, + } +} + +func (p *partitionProgress) updateWatermark(newWatermark uint64, offset kafka.Offset) { + watermark := p.loadWatermark() + if newWatermark >= watermark { + p.watermark = newWatermark + p.watermarkOffset = offset + 
log.Info("watermark received", zap.Int32("partition", p.partition), zap.Any("offset", offset), + zap.Uint64("watermark", newWatermark)) + return + } + fields := []zap.Field{ + zap.Int32("partition", p.partition), + zap.Uint64("newWatermark", newWatermark), + zap.Any("offset", offset), + zap.Uint64("watermark", watermark), + zap.Any("watermarkOffset", p.watermarkOffset), + } + + // TiCDC only guarantees at-least-once delivery. Duplicate MQ delivery can + // replay old resolved/checkpoint markers, making the resolved ts appear to + // fall back. This is unexpected but tolerable, so the consumer keeps the + // larger watermark. + if offset > p.watermarkOffset { + log.Warn("partition resolved ts fall back from newer offset: unexpected but tolerable under at-least-once delivery, ignore it", fields...) + return + } + log.Warn("partition resolved ts fall back, ignore it since consumer read old offset message", fields...) +} + +func (p *partitionProgress) loadWatermark() uint64 { + return p.watermark +} + +type writer struct { + option *option + + ddlList []*model.DDLEvent + ddlWithMaxCommitTs *model.DDLEvent + // ddlKeysWithMaxCommitTs records every logical DDL seen at the current + // maximum CommitTs, so replayed prefixes of split DDL sequences can be + // ignored without collapsing distinct DDLs that share the same CommitTs. + ddlKeysWithMaxCommitTs map[ddlEventKey]struct{} + ddlSink ddlsink.Sink + + // sinkFactory is used to create table sink for each table. + sinkFactory *eventsinkfactory.SinkFactory + progresses []*partitionProgress + + eventRouter *dispatcher.EventRouter +} + +// ddlEventKey identifies a logical DDL even if the Kafka replay decodes it +// into a fresh DDLEvent object. The MQ codecs preserve StartTs/CommitTs/Query/Seq, +// which is enough to distinguish split DDLs while still recognizing replays. 
+type ddlEventKey struct {
+	startTs  uint64
+	commitTs uint64
+	query    string
+	seq      uint64
+}
+
+func newDDLEventKey(ddl *model.DDLEvent) ddlEventKey {
+	return ddlEventKey{
+		startTs:  ddl.StartTs,
+		commitTs: ddl.CommitTs,
+		query:    ddl.Query,
+		seq:      ddl.Seq,
+	}
+}
+
+func newWriter(ctx context.Context, o *option) *writer {
+	w := &writer{
+		option:     o,
+		progresses: make([]*partitionProgress, o.partitionNum),
+	}
+	var (
+		db  *sql.DB
+		err error
+	)
+	if o.upstreamTiDBDSN != "" {
+		db, err = openDB(ctx, o.upstreamTiDBDSN)
+		if err != nil {
+			log.Panic("cannot open the upstream TiDB, handle key only enabled",
+				zap.String("dsn", o.upstreamTiDBDSN), zap.Error(err))
+		}
+	}
+	// the decoder is stateful, so create one decoder per partition.
+	for i := 0; i < int(o.partitionNum); i++ {
+		decoder, err := NewDecoder(ctx, o, db)
+		if err != nil {
+			log.Panic("cannot create the decoder", zap.Error(err))
+		}
+		w.progresses[i] = newPartitionProgress(int32(i), decoder)
+	}
+
+	eventRouter, err := dispatcher.NewEventRouter(o.replicaConfig, o.protocol, o.topic, "kafka")
+	if err != nil {
+		log.Panic("initialize the event router failed",
+			zap.Any("protocol", o.protocol), zap.Any("topic", o.topic),
+			zap.Any("dispatcherRules", o.replicaConfig.Sink.DispatchRules), zap.Error(err))
+	}
+	w.eventRouter = eventRouter
+	log.Info("event router created", zap.Any("protocol", o.protocol),
+		zap.Any("topic", o.topic), zap.Any("dispatcherRules", o.replicaConfig.Sink.DispatchRules))
+
+	config.GetGlobalServerConfig().TZ = o.timezone
+	errChan := make(chan error, 1)
+	changefeed := model.DefaultChangeFeedID("kafka-consumer")
+	f, err := eventsinkfactory.New(ctx, changefeed, o.downstreamURI, o.replicaConfig, errChan, nil)
+	if err != nil {
+		log.Panic("cannot create the event sink factory", zap.Error(err))
+	}
+	w.sinkFactory = f
+
+	go func() {
+		err := <-errChan
+		if !errors.Is(cerror.Cause(err), context.Canceled) {
+			log.Error("error on running consumer", zap.Error(err))
+		} else {
+			log.Info("consumer exited")
+		}
+	}()
+
+	ddlSink, err := ddlsinkfactory.New(ctx, changefeed, o.downstreamURI, o.replicaConfig)
+	if err != nil {
+		log.Panic("cannot create the ddl sink factory", zap.Error(err))
+	}
+	w.ddlSink = ddlSink
+	return w
+}
+
+// appendDDL appends a DDL waiting to be handled; only the ordering constraint
+// among DDLs is considered: for DDLs a / b received in that order,
+// a.CommitTs <= b.CommitTs should hold.
+func (w *writer) appendDDL(ddl *model.DDLEvent, offset kafka.Offset) {
+	// a DDL CommitTs fallback means an old message was replayed; warn and ignore it.
+	if w.ddlWithMaxCommitTs != nil && ddl.CommitTs < w.ddlWithMaxCommitTs.CommitTs {
+		log.Warn("DDL CommitTs < maxCommitTsDDL.CommitTs",
+			zap.Uint64("commitTs", ddl.CommitTs),
+			zap.Uint64("maxCommitTs", w.ddlWithMaxCommitTs.CommitTs),
+			zap.String("DDL", ddl.Query))
+		return
+	}
+
+	ddlKey := newDDLEventKey(ddl)
+	if w.ddlWithMaxCommitTs == nil || ddl.CommitTs > w.ddlWithMaxCommitTs.CommitTs {
+		w.ddlKeysWithMaxCommitTs = make(map[ddlEventKey]struct{})
+	}
+
+	// The DDL with max CommitTs may be one event in a split DDL job, so we must
+	// remember every logical DDL already seen at that CommitTs rather than only
+	// comparing against the last decoded event object.
+	if _, duplicated := w.ddlKeysWithMaxCommitTs[ddlKey]; duplicated {
+		log.Warn("ignore redundant DDL, the DDL has already been seen at max CommitTs",
+			zap.Uint64("commitTs", ddl.CommitTs), zap.String("DDL", ddl.Query))
+		return
+	}
+
+	w.ddlList = append(w.ddlList, ddl)
+	w.ddlWithMaxCommitTs = ddl
+	w.ddlKeysWithMaxCommitTs[ddlKey] = struct{}{}
+	log.Info("DDL message received", zap.Any("offset", offset), zap.Uint64("commitTs", ddl.CommitTs), zap.String("DDL", ddl.Query))
+}
+
+func (w *writer) getFrontDDL() *model.DDLEvent {
+	if len(w.ddlList) > 0 {
+		return w.ddlList[0]
+	}
+	return nil
+}
+
+func (w *writer) popDDL() {
+	if len(w.ddlList) > 0 {
+		w.ddlList = w.ddlList[1:]
+	}
+}
+
+func (w *writer) getMinWatermark() uint64 {
+	result := uint64(math.MaxUint64)
+	for _, p := range w.progresses {
+		watermark := p.loadWatermark()
+		if watermark < result {
+			result = watermark
+		}
+	}
+	return result
+}
+
+// forEachPartition runs fn on every partition progress concurrently.
+func (w *writer) forEachPartition(fn func(p *partitionProgress)) {
+	var wg sync.WaitGroup
+	for _, p := range w.progresses {
+		wg.Add(1)
+		go func(p *partitionProgress) {
+			defer wg.Done()
+			fn(p)
+		}(p)
+	}
+	wg.Wait()
+}
+
+// Write will synchronously write data downstream.
+func (w *writer) Write(ctx context.Context, messageType model.MessageType) bool {
+	watermark := w.getMinWatermark()
+	var todoDDL *model.DDLEvent
+	for {
+		todoDDL = w.getFrontDDL()
+		// watermark is the min watermark across all partitions. A DDL is only sent
+		// to the first partition, and the other partitions may lag behind, so the
+		// watermark can be smaller than the DDL's commitTs; in that case some DML
+		// events may not be consumed yet and the DDL cannot be executed right now.
+		if todoDDL == nil || todoDDL.CommitTs > watermark {
+			break
+		}
+		// flush DMLs
+		w.forEachPartition(func(sink *partitionProgress) {
+			syncFlushRowChangedEvents(ctx, sink, todoDDL.CommitTs)
+		})
+		// DDL can be executed, do it first.
+		if err := w.ddlSink.WriteDDLEvent(ctx, todoDDL); err != nil {
+			log.Panic("write DDL event failed", zap.Error(err),
+				zap.String("DDL", todoDDL.Query), zap.Uint64("commitTs", todoDDL.CommitTs))
+		}
+		w.popDDL()
+	}
+
+	if messageType == model.MessageTypeResolved {
+		w.forEachPartition(func(sink *partitionProgress) {
+			syncFlushRowChangedEvents(ctx, sink, watermark)
+		})
+	}
+
+	// DDL events are only appended from partition 0; a DDL still pending here
+	// cannot be executed yet, so report that the flush is incomplete.
+	if messageType == model.MessageTypeDDL && todoDDL != nil {
+		log.Info("DDL event will be flushed in the future",
+			zap.Uint64("watermark", watermark),
+			zap.Uint64("CommitTs", todoDDL.CommitTs),
+			zap.String("Query", todoDDL.Query))
+		return false
+	}
+	return true
+}
+
+// WriteMessage decodes the kafka message and writes the decoded events downstream.
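+// It returns true only when a flush triggered by a DDL or resolved event has
+// completed; false means nothing needed flushing, or a pending DDL is still
+// waiting for every partition's watermark to reach its commitTs.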
+func (w *writer) WriteMessage(ctx context.Context, message *kafka.Message) bool {
+	var (
+		key       = message.Key
+		value     = message.Value
+		partition = message.TopicPartition.Partition
+		offset    = message.TopicPartition.Offset
+	)
+
+	progress := w.progresses[partition]
+	if err := progress.decoder.AddKeyValue(key, value); err != nil {
+		log.Panic("add key value to the decoder failed",
+			zap.Int32("partition", partition), zap.Any("offset", offset), zap.Error(err))
+	}
+	var (
+		counter     int
+		needFlush   bool
+		messageType model.MessageType
+	)
+	for {
+		ty, hasNext, err := progress.decoder.HasNext()
+		if err != nil {
+			log.Panic("decode message key failed",
+				zap.Int32("partition", partition), zap.Any("offset", offset), zap.Error(err))
+		}
+		if !hasNext {
+			break
+		}
+		counter++
+		// If a message containing only one event exceeds the length limit, CDC allows it and issues a warning.
+		if len(key)+len(value) > w.option.maxMessageBytes && counter > 1 {
+			log.Panic("kafka max-messages-bytes exceeded",
+				zap.Int32("partition", partition), zap.Any("offset", offset),
+				zap.Int("max-message-bytes", w.option.maxMessageBytes),
+				zap.Int("receivedBytes", len(key)+len(value)))
+		}
+		messageType = ty
+		switch messageType {
+		case model.MessageTypeDDL:
+			// for some protocols, a DDL is dispatched to all partitions.
+			// Consider DDLs a, b, c received from partition-0, where the latest is c:
+			// if `a` is then received from partition-1, it would look like a DDL
+			// regression and panic the consumer, even though it is just a duplicate.
+			// So it is enough to handle only the DDLs received from partition-0,
+			// but all DDL event messages must still be consumed.
+			ddl, err := progress.decoder.NextDDLEvent()
+			if err != nil {
+				log.Panic("decode message value failed",
+					zap.Int32("partition", partition), zap.Any("offset", offset),
+					zap.ByteString("value", value), zap.Error(err))
+			}
+
+			if dec, ok := progress.decoder.(*simple.Decoder); ok {
+				cachedEvents := dec.GetCachedEvents()
+				for _, row := range cachedEvents {
+					w.checkPartition(row, partition, offset)
+					log.Info("simple protocol cached event resolved, append to the group",
+						zap.Int64("tableID", row.GetTableID()), zap.Uint64("commitTs", row.CommitTs),
+						zap.Int32("partition", partition), zap.Any("offset", offset))
+					w.appendRow2Group(row, progress, offset)
+				}
+			}
+
+			// the Query may be empty when using the simple protocol: it comes from a `bootstrap` event and needs no handling.
+			if ddl.Query == "" {
+				continue
+			}
+
+			if partition == 0 {
+				w.appendDDL(ddl, offset)
+			}
+			needFlush = true
+		case model.MessageTypeRow:
+			row, err := progress.decoder.NextRowChangedEvent()
+			if err != nil {
+				log.Panic("decode message value failed",
+					zap.Int32("partition", partition), zap.Any("offset", offset),
+					zap.ByteString("value", value),
+					zap.Error(err))
+			}
+			// when using the simple protocol, the row may be nil if its table info
+			// has not been received yet; the event is cached inside the decoder, so just continue here.
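+			// such cached rows are surfaced later through GetCachedEvents once the
+			// table info arrives with a DDL or bootstrap message, see the DDL case above.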
+			if w.option.protocol == config.ProtocolSimple && row == nil {
+				continue
+			}
+			w.checkPartition(row, partition, offset)
+			w.appendRow2Group(row, progress, offset)
+		case model.MessageTypeResolved:
+			newWatermark, err := progress.decoder.NextResolvedEvent()
+			if err != nil {
+				log.Panic("decode message value failed",
+					zap.Int32("partition", partition), zap.Any("offset", offset),
+					zap.ByteString("value", value), zap.Error(err))
+			}
+
+			progress.updateWatermark(newWatermark, offset)
+			w.resolveRowChangedEvents(progress, newWatermark)
+			needFlush = true
+		default:
+			log.Panic("unknown message type", zap.Any("messageType", messageType),
+				zap.Int32("partition", partition), zap.Any("offset", offset))
+		}
+	}
+
+	if counter > w.option.maxBatchSize {
+		log.Panic("Open Protocol max-batch-size exceeded",
+			zap.Int("max-batch-size", w.option.maxBatchSize), zap.Int("actual-batch-size", counter),
+			zap.Int32("partition", partition), zap.Any("offset", offset))
+	}
+
+	if !needFlush {
+		return false
+	}
+	// flush when a DDL event or a resolved ts was received.
+	return w.Write(ctx, messageType)
+}
+
+func (w *writer) resolveRowChangedEvents(progress *partitionProgress, newWatermark uint64) {
+	for tableID, group := range progress.eventGroups {
+		events := group.Resolve(newWatermark)
+		if len(events) == 0 {
+			continue
+		}
+		tableSink, ok := progress.tableSinkMap[tableID]
+		if !ok {
+			tableSink = w.sinkFactory.CreateTableSinkForConsumer(
+				model.DefaultChangeFeedID("kafka-consumer"),
+				spanz.TableIDToComparableSpan(tableID),
+				events[0].CommitTs,
+			)
+			progress.tableSinkMap[tableID] = tableSink
+		}
+		tableSink.AppendRowChangedEvents(events...)
+	}
+}
+
+func (w *writer) checkPartition(row *model.RowChangedEvent, partition int32, offset kafka.Offset) {
+	target, _, err := w.eventRouter.GetPartitionForRowChange(row, w.option.partitionNum)
+	if err != nil {
+		log.Panic("cannot calculate partition for the row changed event",
+			zap.Int32("partition", partition), zap.Any("offset", offset),
+			zap.Int32("partitionNum", w.option.partitionNum), zap.Int64("tableID", row.GetTableID()),
+			zap.Error(err), zap.Any("event", row))
+	}
+	if partition != target {
+		log.Panic("RowChangedEvent dispatched to wrong partition",
+			zap.Int32("partition", partition), zap.Int32("expected", target),
+			zap.Int32("partitionNum", w.option.partitionNum), zap.Any("offset", offset),
+			zap.Int64("tableID", row.GetTableID()), zap.Any("row", row),
+		)
+	}
+}
+
+func (w *writer) appendRow2Group(row *model.RowChangedEvent, progress *partitionProgress, offset kafka.Offset) {
+	// if the kafka cluster is healthy, this should not be hit; if the cluster is
+	// abnormal, the consumer may consume old messages, which makes a row's commitTs
+	// fall behind the partition watermark.
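+	// rows below the partition watermark were already resolved and flushed by an
+	// earlier resolved event, so such rows can only be replayed duplicates.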
+	watermark := progress.loadWatermark()
+	partition := progress.partition
+
+	tableID := row.GetTableID()
+	group := progress.eventGroups[tableID]
+	if group == nil {
+		group = NewEventsGroup(partition, tableID)
+		progress.eventGroups[tableID] = group
+	}
+	if row.CommitTs < watermark {
+		log.Warn("RowChangedEvent fallback row, since less than the partition watermark, ignore it",
+			zap.Int64("tableID", tableID), zap.Int32("partition", partition),
+			zap.Uint64("commitTs", row.CommitTs), zap.Any("offset", offset),
+			zap.Uint64("watermark", watermark), zap.Any("watermarkOffset", progress.watermarkOffset),
+			zap.String("schema", row.TableInfo.GetSchemaName()), zap.String("table", row.TableInfo.GetTableName()),
+			zap.Any("columns", row.Columns), zap.Any("preColumns", row.PreColumns),
+			zap.String("protocol", w.option.protocol.String()), zap.Bool("IsPartition", row.TableInfo.TableName.IsPartition))
+		return
+	}
+	if row.CommitTs >= group.highWatermark {
+		group.Append(row, offset)
+		return
+	}
+	switch w.option.protocol {
+	case config.ProtocolSimple, config.ProtocolOpen, config.ProtocolCanalJSON, config.ProtocolDebezium:
+		// the simple protocol sets the table ID on every row message, so the consumer
+		// knows which table, or which table partition, a row belongs to.
+		// the open protocol sets the partition table ID if the table is partitioned;
+		// for a normal table, the table ID is generated by the fake table ID generator
+		// from the schema and table name.
+		// So there is one event group per normal table or per table partition, and
+		// replayed messages can be safely ignored.
+		log.Warn("RowChangedEvent fallback row, since less than the group high watermark, ignore it",
+			zap.Int64("tableID", tableID), zap.Int32("partition", partition),
+			zap.Uint64("commitTs", row.CommitTs), zap.Any("offset", offset),
+			zap.Uint64("highWatermark", group.highWatermark),
+			zap.Any("partitionWatermark", watermark), zap.Any("watermarkOffset", progress.watermarkOffset),
+			zap.String("schema", row.TableInfo.GetSchemaName()), zap.String("table", row.TableInfo.GetTableName()),
+			zap.Any("columns", row.Columns), zap.Any("preColumns", row.PreColumns),
+			zap.String("protocol", w.option.protocol.String()), zap.Bool("IsPartition", row.TableInfo.TableName.IsPartition))
+		return
+	default:
+	}
+	log.Warn("RowChangedEvent fallback row, since less than the group high watermark, do not ignore it",
+		zap.Int64("tableID", tableID), zap.Int32("partition", partition),
+		zap.Uint64("commitTs", row.CommitTs), zap.Any("offset", offset),
+		zap.Uint64("highWatermark", group.highWatermark),
+		zap.Any("partitionWatermark", watermark), zap.Any("watermarkOffset", progress.watermarkOffset),
+		zap.String("schema", row.TableInfo.GetSchemaName()), zap.String("table", row.TableInfo.GetTableName()),
+		zap.Any("columns", row.Columns), zap.Any("preColumns", row.PreColumns),
+		zap.String("protocol", w.option.protocol.String()))
+	group.Append(row, offset)
+}
+
+func syncFlushRowChangedEvents(ctx context.Context, progress *partitionProgress, watermark uint64) {
+	resolvedTs := model.NewResolvedTs(watermark)
+	for {
+		select {
+		case <-ctx.Done():
+			log.Warn("sync flush row changed event canceled", zap.Error(ctx.Err()))
+			return
+		default:
+		}
+		flushedResolvedTs := true
+		for _, tableSink := range progress.tableSinkMap {
+			if err := tableSink.UpdateResolvedTs(resolvedTs); err != nil {
+				log.Panic("Failed to update resolved ts", zap.Error(err))
+			}
+			if tableSink.GetCheckpointTs().Less(resolvedTs) {
+				flushedResolvedTs = false
+			}
+		}
+		if flushedResolvedTs {
+			return
+ } + } +} + +func openDB(ctx context.Context, dsn string) (*sql.DB, error) { + db, err := sql.Open("mysql", dsn) + if err != nil { + log.Error("open db failed", zap.Error(err)) + return nil, cerror.Trace(err) + } + + db.SetMaxOpenConns(10) + db.SetMaxIdleConns(10) + db.SetConnMaxLifetime(10 * time.Minute) + + ctx, cancel := context.WithTimeout(ctx, 5*time.Second) + defer cancel() + if err = db.PingContext(ctx); err != nil { + log.Error("ping db failed", zap.String("dsn", dsn), zap.Error(err)) + return nil, cerror.Trace(err) + } + log.Info("open db success", zap.String("dsn", dsn)) + return db, nil +} diff --git a/cmd/kafka-consumer/writer_test.go b/cmd/kafka-consumer/writer_test.go new file mode 100644 index 0000000000..cd1ff784f8 --- /dev/null +++ b/cmd/kafka-consumer/writer_test.go @@ -0,0 +1,152 @@ +// Copyright 2026 PingCAP, Inc. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// See the License for the specific language governing permissions and +// limitations under the License. + +package main + +import ( + "testing" + + "github.com/confluentinc/confluent-kafka-go/v2/kafka" + "github.com/pingcap/tiflow/cdc/model" + "github.com/stretchr/testify/require" +) + +func TestUpdateWatermarkIgnoresFallbackFromNewerOffset(t *testing.T) { + // Scenario: at-least-once delivery replays an older resolved event with a newer Kafka offset. + // Steps: advance the partition watermark, then feed a smaller resolved ts from a larger offset. + // Expectation: the consumer keeps the existing watermark instead of panicking. + progress := &partitionProgress{partition: 1} + progress.updateWatermark(120, kafka.Offset(10)) + + require.NotPanics(t, func() { + progress.updateWatermark(100, kafka.Offset(20)) + }) + require.Equal(t, uint64(120), progress.watermark) + require.Equal(t, kafka.Offset(10), progress.watermarkOffset) +} + +func TestAppendDDLIgnoresEquivalentReplay(t *testing.T) { + // Scenario: Kafka replays the same DDL as a freshly decoded event object. + // Steps: append one DDL, then append a separate object with identical logical fields. + // Expectation: the writer keeps only one pending DDL. + w := &writer{} + ddl := &model.DDLEvent{ + StartTs: 100, + CommitTs: 120, + Query: "create table t(id int primary key)", + Seq: 1, + } + dup := &model.DDLEvent{ + StartTs: 100, + CommitTs: 120, + Query: "create table t(id int primary key)", + Seq: 1, + } + + w.appendDDL(ddl, kafka.Offset(1)) + w.appendDDL(dup, kafka.Offset(2)) + + require.Len(t, w.ddlList, 1) + require.Same(t, ddl, w.ddlWithMaxCommitTs) +} + +func TestAppendDDLKeepsSplitDDLSequenceDistinct(t *testing.T) { + // Scenario: one logical DDL job is split into multiple DDL events with the same commitTs. + // Steps: append two DDLs whose startTs, commitTs, and query text match but Seq differs. + // Expectation: both events remain queued because Seq is part of the DDL identity. 
+ w := &writer{} + first := &model.DDLEvent{ + StartTs: 200, + CommitTs: 220, + Query: "rename tables split ddl", + Seq: 1, + } + second := &model.DDLEvent{ + StartTs: 200, + CommitTs: 220, + Query: "rename tables split ddl", + Seq: 2, + } + + w.appendDDL(first, kafka.Offset(3)) + w.appendDDL(second, kafka.Offset(4)) + + require.Len(t, w.ddlList, 2) + require.Same(t, second, w.ddlWithMaxCommitTs) +} + +func TestAppendDDLIgnoresReplayedSplitDDLSequence(t *testing.T) { + // Scenario: Kafka replays an already queued split DDL sequence after later parts were seen. + // Steps: append the original split DDLs, then replay the same logical DDLs as fresh objects. + // Expectation: the queue keeps only the original sequence and does not append duplicates. + w := &writer{} + first := &model.DDLEvent{ + StartTs: 300, + CommitTs: 320, + Query: "rename table test.t1 to test.t2", + Seq: 0, + } + second := &model.DDLEvent{ + StartTs: 300, + CommitTs: 320, + Query: "rename table test.t3 to test.t4", + Seq: 1, + } + replayFirst := &model.DDLEvent{ + StartTs: 300, + CommitTs: 320, + Query: "rename table test.t1 to test.t2", + Seq: 0, + } + replaySecond := &model.DDLEvent{ + StartTs: 300, + CommitTs: 320, + Query: "rename table test.t3 to test.t4", + Seq: 1, + } + + w.appendDDL(first, kafka.Offset(10)) + w.appendDDL(second, kafka.Offset(11)) + w.appendDDL(replayFirst, kafka.Offset(12)) + w.appendDDL(replaySecond, kafka.Offset(13)) + + require.Len(t, w.ddlList, 2) + require.Same(t, first, w.ddlList[0]) + require.Same(t, second, w.ddlList[1]) + require.Same(t, second, w.ddlWithMaxCommitTs) +} + +func TestAppendDDLKeepsDifferentDDLsWithSameCommitTsWithoutSeq(t *testing.T) { + // Scenario: a multi-DDL job can emit different DDLs that share the same commitTs while Seq stays at zero. + // Steps: append two distinct DDLs with the same timestamps but different queries and default Seq. + // Expectation: both DDLs remain queued because Query is still part of the logical DDL identity. + w := &writer{} + first := &model.DDLEvent{ + StartTs: 400, + CommitTs: 420, + Query: "create table test.t1(id int primary key)", + } + second := &model.DDLEvent{ + StartTs: 400, + CommitTs: 420, + Query: "create table test.t2(id int primary key)", + } + + w.appendDDL(first, kafka.Offset(20)) + w.appendDDL(second, kafka.Offset(21)) + + require.Len(t, w.ddlList, 2) + require.Same(t, first, w.ddlList[0]) + require.Same(t, second, w.ddlList[1]) + require.Same(t, second, w.ddlWithMaxCommitTs) +}
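
A minimal sketch, not part of the patch, of how the per-partition watermarks combine; it assumes the same package and imports as writer_test.go above:

func TestGetMinWatermarkTracksSlowestPartition(t *testing.T) {
	// Write flushes DMLs and executes pending DDLs only up to the minimum
	// watermark across all partitions, so the slowest partition gates progress.
	w := &writer{progresses: []*partitionProgress{
		{partition: 0},
		{partition: 1},
	}}
	w.progresses[0].updateWatermark(150, kafka.Offset(5))
	w.progresses[1].updateWatermark(120, kafka.Offset(7))
	require.Equal(t, uint64(120), w.getMinWatermark())

	// once the slow partition catches up, the minimum advances as well.
	w.progresses[1].updateWatermark(180, kafka.Offset(8))
	require.Equal(t, uint64(150), w.getMinWatermark())
}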